{"train/loss": 0.0308, "train/learning_rate": 1.4754098360655737e-06, "train/epoch": 10.0, "train/global_step": 1110, "_runtime": 26546, "_timestamp": 1648513448, "_step": 1113, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 7.0, 34.0, 74.0, 168.0, 333.0, 235.0, 100.0, 43.0, 9.0, 5.0, 2.0, 0.0, 2.0], "bins": [-4.376101493835449, -4.297544956207275, -4.21898889541626, -4.140432357788086, -4.06187629699707, -3.9833199977874756, -3.904763698577881, -3.826207399368286, -3.7476511001586914, -3.6690948009490967, -3.590538501739502, -3.5119822025299072, -3.4334259033203125, -3.3548696041107178, -3.276313304901123, -3.1977570056915283, -3.1192007064819336, -3.040644407272339, -2.962088108062744, -2.8835318088531494, -2.8049755096435547, -2.72641921043396, -2.6478629112243652, -2.5693066120147705, -2.4907500743865967, -2.412193775177002, -2.3336374759674072, -2.2550811767578125, -2.1765248775482178, -2.097968578338623, -2.0194122791290283, -1.9408559799194336, -1.8622997999191284, -1.7837435007095337, -1.705187201499939, -1.6266309022903442, -1.5480746030807495, -1.4695183038711548, -1.3909618854522705, -1.3124055862426758, -1.233849287033081, -1.1552929878234863, -1.0767366886138916, -0.9981803894042969, -0.9196240901947021, -0.8410677909851074, -0.7625114321708679, -0.6839551329612732, -0.6053988933563232, -0.5268425941467285, -0.4482862949371338, -0.3697299659252167, -0.29117366671562195, -0.21261736750602722, -0.1340610384941101, -0.05550473928451538, 0.023051559925079346, 0.10160786658525467, 0.18016417324543, 0.2587204873561859, 0.33727678656578064, 0.41583308577537537, 0.4943894147872925, 0.5729457139968872, 0.6515020132064819]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 6.0, 4.0, 8.0, 10.0, 7.0, 14.0, 13.0, 15.0, 14.0, 25.0, 35.0, 27.0, 29.0, 39.0, 34.0, 39.0, 40.0, 42.0, 46.0, 33.0, 54.0, 46.0, 39.0, 44.0, 57.0, 32.0, 45.0, 33.0, 27.0, 25.0, 27.0, 18.0, 16.0, 19.0, 14.0, 8.0, 12.0, 1.0, 8.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5758266448974609, -0.5571876764297485, -0.5385486483573914, -0.519909679889679, -0.5012706518173218, -0.4826316833496094, -0.4639926850795746, -0.4453536868095398, -0.426714688539505, -0.4080756902694702, -0.3894366919994354, -0.37079769372940063, -0.35215872526168823, -0.33351969718933105, -0.31488072872161865, -0.29624173045158386, -0.2776027321815491, -0.2589637339115143, -0.2403247356414795, -0.2216857522726059, -0.2030467540025711, -0.18440775573253632, -0.16576877236366272, -0.14712977409362793, -0.12849077582359314, -0.10985177755355835, -0.09121278673410416, -0.07257379591464996, -0.05393479764461517, -0.03529579937458038, -0.01665680855512619, 0.001982182264328003, 0.020621120929718018, 0.03926011547446251, 0.057899110019207, 0.0765381008386612, 0.09517709910869598, 0.11381609737873077, 0.13245508074760437, 0.15109407901763916, 0.16973307728767395, 0.18837207555770874, 0.20701107382774353, 0.22565005719661713, 0.24428905546665192, 0.2629280686378479, 0.2815670371055603, 0.3002060353755951, 0.3188450336456299, 0.3374840319156647, 0.35612303018569946, 0.37476202845573425, 0.39340102672576904, 0.41203999519348145, 0.43067899346351624, 0.449317991733551, 0.4679569900035858, 0.4865959882736206, 0.505234956741333, 0.5238739848136902, 0.5425129532814026, 0.5611519813537598, 0.5797909498214722, 0.5984299182891846, 0.6170689463615417]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 7.0, 14.0, 13.0, 25.0, 37.0, 70.0, 78.0, 92.0, 158.0, 186.0, 328.0, 447.0, 763.0, 1228.0, 2196.0, 3983.0, 7429.0, 16140.0, 60534.0, 567329.0, 2653480.0, 762211.0, 79108.0, 18380.0, 8465.0, 4572.0, 2706.0, 1542.0, 919.0, 600.0, 388.0, 236.0, 149.0, 126.0, 99.0, 69.0, 48.0, 33.0, 29.0, 9.0, 15.0, 12.0, 11.0, 4.0, 8.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7685546875, -1.7087554931640625, -1.648956298828125, -1.5891571044921875, -1.52935791015625, -1.4695587158203125, -1.409759521484375, -1.3499603271484375, -1.2901611328125, -1.2303619384765625, -1.170562744140625, -1.1107635498046875, -1.05096435546875, -0.9911651611328125, -0.931365966796875, -0.8715667724609375, -0.811767578125, -0.7519683837890625, -0.692169189453125, -0.6323699951171875, -0.57257080078125, -0.5127716064453125, -0.452972412109375, -0.3931732177734375, -0.3333740234375, -0.2735748291015625, -0.213775634765625, -0.1539764404296875, -0.09417724609375, -0.0343780517578125, 0.025421142578125, 0.0852203369140625, 0.14501953125, 0.2048187255859375, 0.264617919921875, 0.3244171142578125, 0.38421630859375, 0.4440155029296875, 0.503814697265625, 0.5636138916015625, 0.6234130859375, 0.6832122802734375, 0.743011474609375, 0.8028106689453125, 0.86260986328125, 0.9224090576171875, 0.982208251953125, 1.0420074462890625, 1.101806640625, 1.1616058349609375, 1.221405029296875, 1.2812042236328125, 1.34100341796875, 1.4008026123046875, 1.460601806640625, 1.5204010009765625, 1.5802001953125, 1.6399993896484375, 1.699798583984375, 1.7595977783203125, 1.81939697265625, 1.8791961669921875, 1.938995361328125, 1.9987945556640625, 2.05859375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 9.0, 6.0, 12.0, 6.0, 10.0, 8.0, 9.0, 13.0, 14.0, 23.0, 32.0, 29.0, 38.0, 38.0, 29.0, 32.0, 44.0, 41.0, 45.0, 45.0, 37.0, 38.0, 44.0, 36.0, 45.0, 49.0, 35.0, 33.0, 25.0, 29.0, 22.0, 23.0, 22.0, 11.0, 16.0, 16.0, 11.0, 2.0, 7.0, 4.0, 10.0, 1.0, 7.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.998046875, -0.966156005859375, -0.93426513671875, -0.902374267578125, -0.8704833984375, -0.838592529296875, -0.80670166015625, -0.774810791015625, -0.742919921875, -0.711029052734375, -0.67913818359375, -0.647247314453125, -0.6153564453125, -0.583465576171875, -0.55157470703125, -0.519683837890625, -0.48779296875, -0.455902099609375, -0.42401123046875, -0.392120361328125, -0.3602294921875, -0.328338623046875, -0.29644775390625, -0.264556884765625, -0.232666015625, -0.200775146484375, -0.16888427734375, -0.136993408203125, -0.1051025390625, -0.073211669921875, -0.04132080078125, -0.009429931640625, 0.0224609375, 0.054351806640625, 0.08624267578125, 0.118133544921875, 0.1500244140625, 0.181915283203125, 0.21380615234375, 0.245697021484375, 0.277587890625, 0.309478759765625, 0.34136962890625, 0.373260498046875, 0.4051513671875, 0.437042236328125, 0.46893310546875, 0.500823974609375, 0.53271484375, 0.564605712890625, 0.59649658203125, 0.628387451171875, 0.6602783203125, 0.692169189453125, 0.72406005859375, 0.755950927734375, 0.787841796875, 0.819732666015625, 0.85162353515625, 0.883514404296875, 0.9154052734375, 0.947296142578125, 0.97918701171875, 1.011077880859375, 1.04296875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 12.0, 8.0, 14.0, 29.0, 44.0, 69.0, 153.0, 684.0, 8936.0, 4174470.0, 8802.0, 687.0, 168.0, 77.0, 39.0, 30.0, 17.0, 9.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-16.609375, -16.1414794921875, -15.673583984375, -15.2056884765625, -14.73779296875, -14.2698974609375, -13.802001953125, -13.3341064453125, -12.8662109375, -12.3983154296875, -11.930419921875, -11.4625244140625, -10.99462890625, -10.5267333984375, -10.058837890625, -9.5909423828125, -9.123046875, -8.6551513671875, -8.187255859375, -7.7193603515625, -7.25146484375, -6.7835693359375, -6.315673828125, -5.8477783203125, -5.3798828125, -4.9119873046875, -4.444091796875, -3.9761962890625, -3.50830078125, -3.0404052734375, -2.572509765625, -2.1046142578125, -1.63671875, -1.1688232421875, -0.700927734375, -0.2330322265625, 0.23486328125, 0.7027587890625, 1.170654296875, 1.6385498046875, 2.1064453125, 2.5743408203125, 3.042236328125, 3.5101318359375, 3.97802734375, 4.4459228515625, 4.913818359375, 5.3817138671875, 5.849609375, 6.3175048828125, 6.785400390625, 7.2532958984375, 7.72119140625, 8.1890869140625, 8.656982421875, 9.1248779296875, 9.5927734375, 10.0606689453125, 10.528564453125, 10.9964599609375, 11.46435546875, 11.9322509765625, 12.400146484375, 12.8680419921875, 13.3359375]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 8.0, 11.0, 17.0, 18.0, 35.0, 59.0, 105.0, 199.0, 638.0, 1652.0, 804.0, 228.0, 111.0, 63.0, 37.0, 23.0, 20.0, 13.0, 11.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74560546875, -0.7175369262695312, -0.6894683837890625, -0.6613998413085938, -0.633331298828125, -0.6052627563476562, -0.5771942138671875, -0.5491256713867188, -0.52105712890625, -0.49298858642578125, -0.4649200439453125, -0.43685150146484375, -0.408782958984375, -0.38071441650390625, -0.3526458740234375, -0.32457733154296875, -0.2965087890625, -0.26844024658203125, -0.2403717041015625, -0.21230316162109375, -0.184234619140625, -0.15616607666015625, -0.1280975341796875, -0.10002899169921875, -0.07196044921875, -0.04389190673828125, -0.0158233642578125, 0.01224517822265625, 0.040313720703125, 0.06838226318359375, 0.0964508056640625, 0.12451934814453125, 0.152587890625, 0.18065643310546875, 0.2087249755859375, 0.23679351806640625, 0.264862060546875, 0.29293060302734375, 0.3209991455078125, 0.34906768798828125, 0.37713623046875, 0.40520477294921875, 0.4332733154296875, 0.46134185791015625, 0.489410400390625, 0.5174789428710938, 0.5455474853515625, 0.5736160278320312, 0.6016845703125, 0.6297531127929688, 0.6578216552734375, 0.6858901977539062, 0.713958740234375, 0.7420272827148438, 0.7700958251953125, 0.7981643676757812, 0.82623291015625, 0.8543014526367188, 0.8823699951171875, 0.9104385375976562, 0.938507080078125, 0.9665756225585938, 0.9946441650390625, 1.0227127075195312, 1.05078125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 3.0, 6.0, 7.0, 4.0, 7.0, 13.0, 15.0, 16.0, 27.0, 36.0, 37.0, 52.0, 50.0, 70.0, 82.0, 99.0, 87.0, 72.0, 74.0, 60.0, 43.0, 35.0, 26.0, 23.0, 11.0, 11.0, 6.0, 7.0, 6.0, 4.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5493606328964233, -1.5017366409301758, -1.4541127681732178, -1.4064887762069702, -1.3588649034500122, -1.3112409114837646, -1.2636170387268066, -1.215993046760559, -1.1683690547943115, -1.120745062828064, -1.073121190071106, -1.0254971981048584, -0.9778733253479004, -0.9302493333816528, -0.88262540102005, -0.8350014686584473, -0.7873775959014893, -0.7397536635398865, -0.6921297311782837, -0.6445057392120361, -0.5968818664550781, -0.5492578744888306, -0.5016339421272278, -0.454010009765625, -0.4063860774040222, -0.35876214504241943, -0.31113821268081665, -0.2635142505168915, -0.2158903181552887, -0.1682663857936859, -0.12064242362976074, -0.07301849126815796, -0.025394439697265625, 0.022229500114917755, 0.06985343992710114, 0.11747738718986511, 0.1651013195514679, 0.21272525191307068, 0.26034921407699585, 0.30797314643859863, 0.3555970788002014, 0.4032210111618042, 0.450844943523407, 0.49846890568733215, 0.5460928678512573, 0.5937167406082153, 0.6413407325744629, 0.6889646649360657, 0.7365885972976685, 0.7842125296592712, 0.831836462020874, 0.8794604539871216, 0.9270843267440796, 0.9747083187103271, 1.0223321914672852, 1.0699561834335327, 1.1175801753997803, 1.1652041673660278, 1.2128280401229858, 1.2604520320892334, 1.3080759048461914, 1.355699896812439, 1.4033238887786865, 1.4509477615356445, 1.4985716342926025]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 6.0, 4.0, 10.0, 2.0, 8.0, 12.0, 20.0, 10.0, 17.0, 18.0, 26.0, 25.0, 25.0, 28.0, 33.0, 41.0, 38.0, 39.0, 36.0, 41.0, 35.0, 39.0, 46.0, 43.0, 28.0, 46.0, 33.0, 40.0, 38.0, 30.0, 29.0, 17.0, 15.0, 25.0, 8.0, 22.0, 15.0, 15.0, 7.0, 6.0, 7.0, 4.0, 4.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9994038939476013, -0.9701382517814636, -0.9408726692199707, -0.911607027053833, -0.8823413848876953, -0.8530758023262024, -0.8238101601600647, -0.7945445775985718, -0.7652789354324341, -0.7360132932662964, -0.7067477107048035, -0.6774820685386658, -0.6482164263725281, -0.6189508438110352, -0.5896852016448975, -0.5604195594787598, -0.5311539173126221, -0.5018882751464844, -0.47262266278266907, -0.44335705041885376, -0.41409143805503845, -0.38482582569122314, -0.35556018352508545, -0.32629457116127014, -0.29702895879745483, -0.2677633464336395, -0.23849771916866302, -0.20923209190368652, -0.17996647953987122, -0.15070085227489471, -0.12143522500991821, -0.0921696126461029, -0.0629040002822876, -0.03363838046789169, -0.00437275692820549, 0.024892866611480713, 0.05415848642587662, 0.08342410624027252, 0.11268973350524902, 0.14195534586906433, 0.17122097313404083, 0.20048660039901733, 0.22975221276283264, 0.25901782512664795, 0.28828346729278564, 0.31754907965660095, 0.34681469202041626, 0.37608033418655396, 0.40534594655036926, 0.43461155891418457, 0.46387720108032227, 0.4931428134441376, 0.5224084258079529, 0.5516740679740906, 0.5809396505355835, 0.6102052927017212, 0.6394709348678589, 0.6687365770339966, 0.6980021595954895, 0.7272678017616272, 0.7565334439277649, 0.7857990264892578, 0.8150646686553955, 0.8443303108215332, 0.8735958933830261]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 8.0, 6.0, 6.0, 9.0, 20.0, 28.0, 43.0, 69.0, 84.0, 124.0, 205.0, 310.0, 467.0, 788.0, 1255.0, 2086.0, 3416.0, 5622.0, 9460.0, 16580.0, 29324.0, 54762.0, 105941.0, 209747.0, 280857.0, 153086.0, 78141.0, 41614.0, 22626.0, 12912.0, 7396.0, 4483.0, 2701.0, 1649.0, 1037.0, 602.0, 406.0, 247.0, 127.0, 107.0, 67.0, 55.0, 33.0, 9.0, 20.0, 9.0, 8.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.4306640625, -0.4177207946777344, -0.40477752685546875, -0.3918342590332031, -0.3788909912109375, -0.3659477233886719, -0.35300445556640625, -0.3400611877441406, -0.327117919921875, -0.3141746520996094, -0.30123138427734375, -0.2882881164550781, -0.2753448486328125, -0.2624015808105469, -0.24945831298828125, -0.23651504516601562, -0.22357177734375, -0.21062850952148438, -0.19768524169921875, -0.18474197387695312, -0.1717987060546875, -0.15885543823242188, -0.14591217041015625, -0.13296890258789062, -0.120025634765625, -0.10708236694335938, -0.09413909912109375, -0.08119583129882812, -0.0682525634765625, -0.055309295654296875, -0.04236602783203125, -0.029422760009765625, -0.0164794921875, -0.003536224365234375, 0.00940704345703125, 0.022350311279296875, 0.0352935791015625, 0.048236846923828125, 0.06118011474609375, 0.07412338256835938, 0.087066650390625, 0.10000991821289062, 0.11295318603515625, 0.12589645385742188, 0.1388397216796875, 0.15178298950195312, 0.16472625732421875, 0.17766952514648438, 0.19061279296875, 0.20355606079101562, 0.21649932861328125, 0.22944259643554688, 0.2423858642578125, 0.2553291320800781, 0.26827239990234375, 0.2812156677246094, 0.294158935546875, 0.3071022033691406, 0.32004547119140625, 0.3329887390136719, 0.3459320068359375, 0.3588752746582031, 0.37181854248046875, 0.3847618103027344, 0.397705078125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 7.0, 5.0, 4.0, 3.0, 6.0, 13.0, 12.0, 16.0, 14.0, 24.0, 26.0, 17.0, 36.0, 33.0, 33.0, 44.0, 45.0, 35.0, 40.0, 41.0, 43.0, 43.0, 63.0, 39.0, 51.0, 40.0, 40.0, 31.0, 39.0, 25.0, 15.0, 13.0, 14.0, 13.0, 15.0, 16.0, 13.0, 8.0, 9.0, 3.0, 5.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.71728515625, -0.6948699951171875, -0.672454833984375, -0.6500396728515625, -0.62762451171875, -0.6052093505859375, -0.582794189453125, -0.5603790283203125, -0.5379638671875, -0.5155487060546875, -0.493133544921875, -0.4707183837890625, -0.44830322265625, -0.4258880615234375, -0.403472900390625, -0.3810577392578125, -0.358642578125, -0.3362274169921875, -0.313812255859375, -0.2913970947265625, -0.26898193359375, -0.2465667724609375, -0.224151611328125, -0.2017364501953125, -0.1793212890625, -0.1569061279296875, -0.134490966796875, -0.1120758056640625, -0.08966064453125, -0.0672454833984375, -0.044830322265625, -0.0224151611328125, 0.0, 0.0224151611328125, 0.044830322265625, 0.0672454833984375, 0.08966064453125, 0.1120758056640625, 0.134490966796875, 0.1569061279296875, 0.1793212890625, 0.2017364501953125, 0.224151611328125, 0.2465667724609375, 0.26898193359375, 0.2913970947265625, 0.313812255859375, 0.3362274169921875, 0.358642578125, 0.3810577392578125, 0.403472900390625, 0.4258880615234375, 0.44830322265625, 0.4707183837890625, 0.493133544921875, 0.5155487060546875, 0.5379638671875, 0.5603790283203125, 0.582794189453125, 0.6052093505859375, 0.62762451171875, 0.6500396728515625, 0.672454833984375, 0.6948699951171875, 0.71728515625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 9.0, 7.0, 21.0, 27.0, 34.0, 50.0, 82.0, 100.0, 156.0, 258.0, 403.0, 678.0, 1243.0, 2598.0, 5867.0, 15841.0, 48934.0, 169517.0, 475092.0, 229292.0, 64182.0, 20272.0, 7335.0, 3096.0, 1504.0, 765.0, 445.0, 246.0, 172.0, 95.0, 69.0, 52.0, 24.0, 24.0, 19.0, 16.0, 4.0, 10.0, 2.0, 5.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6103515625, -0.5904159545898438, -0.5704803466796875, -0.5505447387695312, -0.530609130859375, -0.5106735229492188, -0.4907379150390625, -0.47080230712890625, -0.45086669921875, -0.43093109130859375, -0.4109954833984375, -0.39105987548828125, -0.371124267578125, -0.35118865966796875, -0.3312530517578125, -0.31131744384765625, -0.2913818359375, -0.27144622802734375, -0.2515106201171875, -0.23157501220703125, -0.211639404296875, -0.19170379638671875, -0.1717681884765625, -0.15183258056640625, -0.13189697265625, -0.11196136474609375, -0.0920257568359375, -0.07209014892578125, -0.052154541015625, -0.03221893310546875, -0.0122833251953125, 0.00765228271484375, 0.027587890625, 0.04752349853515625, 0.0674591064453125, 0.08739471435546875, 0.107330322265625, 0.12726593017578125, 0.1472015380859375, 0.16713714599609375, 0.18707275390625, 0.20700836181640625, 0.2269439697265625, 0.24687957763671875, 0.266815185546875, 0.28675079345703125, 0.3066864013671875, 0.32662200927734375, 0.3465576171875, 0.36649322509765625, 0.3864288330078125, 0.40636444091796875, 0.426300048828125, 0.44623565673828125, 0.4661712646484375, 0.48610687255859375, 0.50604248046875, 0.5259780883789062, 0.5459136962890625, 0.5658493041992188, 0.585784912109375, 0.6057205200195312, 0.6256561279296875, 0.6455917358398438, 0.66552734375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 5.0, 5.0, 8.0, 14.0, 9.0, 12.0, 18.0, 18.0, 23.0, 31.0, 35.0, 32.0, 35.0, 42.0, 50.0, 51.0, 50.0, 55.0, 55.0, 44.0, 38.0, 42.0, 34.0, 34.0, 37.0, 39.0, 29.0, 25.0, 32.0, 20.0, 25.0, 14.0, 4.0, 7.0, 6.0, 5.0, 3.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.583984375, -1.5337371826171875, -1.483489990234375, -1.4332427978515625, -1.38299560546875, -1.3327484130859375, -1.282501220703125, -1.2322540283203125, -1.1820068359375, -1.1317596435546875, -1.081512451171875, -1.0312652587890625, -0.98101806640625, -0.9307708740234375, -0.880523681640625, -0.8302764892578125, -0.780029296875, -0.7297821044921875, -0.679534912109375, -0.6292877197265625, -0.57904052734375, -0.5287933349609375, -0.478546142578125, -0.4282989501953125, -0.3780517578125, -0.3278045654296875, -0.277557373046875, -0.2273101806640625, -0.17706298828125, -0.1268157958984375, -0.076568603515625, -0.0263214111328125, 0.02392578125, 0.0741729736328125, 0.124420166015625, 0.1746673583984375, 0.22491455078125, 0.2751617431640625, 0.325408935546875, 0.3756561279296875, 0.4259033203125, 0.4761505126953125, 0.526397705078125, 0.5766448974609375, 0.62689208984375, 0.6771392822265625, 0.727386474609375, 0.7776336669921875, 0.827880859375, 0.8781280517578125, 0.928375244140625, 0.9786224365234375, 1.02886962890625, 1.0791168212890625, 1.129364013671875, 1.1796112060546875, 1.2298583984375, 1.2801055908203125, 1.330352783203125, 1.3805999755859375, 1.43084716796875, 1.4810943603515625, 1.531341552734375, 1.5815887451171875, 1.6318359375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 3.0, 10.0, 9.0, 11.0, 31.0, 31.0, 42.0, 73.0, 73.0, 121.0, 204.0, 271.0, 459.0, 747.0, 1351.0, 2339.0, 4663.0, 10122.0, 23346.0, 64980.0, 235714.0, 476161.0, 148383.0, 45838.0, 17196.0, 7663.0, 3814.0, 1962.0, 1129.0, 645.0, 395.0, 265.0, 170.0, 108.0, 61.0, 44.0, 38.0, 15.0, 23.0, 10.0, 12.0, 10.0, 9.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1422119140625, -0.13781356811523438, -0.13341522216796875, -0.12901687622070312, -0.1246185302734375, -0.12022018432617188, -0.11582183837890625, -0.11142349243164062, -0.107025146484375, -0.10262680053710938, -0.09822845458984375, -0.09383010864257812, -0.0894317626953125, -0.08503341674804688, -0.08063507080078125, -0.07623672485351562, -0.07183837890625, -0.06744003295898438, -0.06304168701171875, -0.058643341064453125, -0.0542449951171875, -0.049846649169921875, -0.04544830322265625, -0.041049957275390625, -0.036651611328125, -0.032253265380859375, -0.02785491943359375, -0.023456573486328125, -0.0190582275390625, -0.014659881591796875, -0.01026153564453125, -0.005863189697265625, -0.00146484375, 0.002933502197265625, 0.00733184814453125, 0.011730194091796875, 0.0161285400390625, 0.020526885986328125, 0.02492523193359375, 0.029323577880859375, 0.033721923828125, 0.038120269775390625, 0.04251861572265625, 0.046916961669921875, 0.0513153076171875, 0.055713653564453125, 0.06011199951171875, 0.06451034545898438, 0.06890869140625, 0.07330703735351562, 0.07770538330078125, 0.08210372924804688, 0.0865020751953125, 0.09090042114257812, 0.09529876708984375, 0.09969711303710938, 0.104095458984375, 0.10849380493164062, 0.11289215087890625, 0.11729049682617188, 0.1216888427734375, 0.12608718872070312, 0.13048553466796875, 0.13488388061523438, 0.1392822265625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 6.0, 5.0, 5.0, 11.0, 10.0, 23.0, 17.0, 29.0, 32.0, 60.0, 94.0, 135.0, 181.0, 100.0, 73.0, 51.0, 39.0, 36.0, 17.0, 18.0, 14.0, 13.0, 6.0, 8.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013494491577148438, -0.00013016164302825928, -0.00012537837028503418, -0.00012059509754180908, -0.00011581182479858398, -0.00011102855205535889, -0.00010624527931213379, -0.00010146200656890869, -9.66787338256836e-05, -9.18954610824585e-05, -8.71121883392334e-05, -8.23289155960083e-05, -7.75456428527832e-05, -7.27623701095581e-05, -6.797909736633301e-05, -6.319582462310791e-05, -5.841255187988281e-05, -5.3629279136657715e-05, -4.884600639343262e-05, -4.406273365020752e-05, -3.927946090698242e-05, -3.4496188163757324e-05, -2.9712915420532227e-05, -2.492964267730713e-05, -2.014636993408203e-05, -1.5363097190856934e-05, -1.0579824447631836e-05, -5.796551704406738e-06, -1.0132789611816406e-06, 3.769993782043457e-06, 8.553266525268555e-06, 1.3336539268493652e-05, 1.811981201171875e-05, 2.2903084754943848e-05, 2.7686357498168945e-05, 3.246963024139404e-05, 3.725290298461914e-05, 4.203617572784424e-05, 4.6819448471069336e-05, 5.1602721214294434e-05, 5.638599395751953e-05, 6.116926670074463e-05, 6.595253944396973e-05, 7.073581218719482e-05, 7.551908493041992e-05, 8.030235767364502e-05, 8.508563041687012e-05, 8.986890316009521e-05, 9.465217590332031e-05, 9.943544864654541e-05, 0.00010421872138977051, 0.0001090019941329956, 0.0001137852668762207, 0.0001185685396194458, 0.0001233518123626709, 0.000128135085105896, 0.0001329183578491211, 0.0001377016305923462, 0.0001424849033355713, 0.0001472681760787964, 0.00015205144882202148, 0.00015683472156524658, 0.00016161799430847168, 0.00016640126705169678, 0.00017118453979492188]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 2.0, 8.0, 13.0, 8.0, 6.0, 14.0, 17.0, 33.0, 62.0, 117.0, 186.0, 440.0, 1051.0, 3239.0, 13769.0, 103624.0, 760750.0, 141917.0, 17167.0, 3898.0, 1234.0, 485.0, 232.0, 101.0, 49.0, 40.0, 20.0, 12.0, 9.0, 11.0, 7.0, 6.0, 3.0, 7.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-0.386962890625, -0.3771820068359375, -0.367401123046875, -0.3576202392578125, -0.34783935546875, -0.3380584716796875, -0.328277587890625, -0.3184967041015625, -0.3087158203125, -0.2989349365234375, -0.289154052734375, -0.2793731689453125, -0.26959228515625, -0.2598114013671875, -0.250030517578125, -0.2402496337890625, -0.23046875, -0.2206878662109375, -0.210906982421875, -0.2011260986328125, -0.19134521484375, -0.1815643310546875, -0.171783447265625, -0.1620025634765625, -0.1522216796875, -0.1424407958984375, -0.132659912109375, -0.1228790283203125, -0.11309814453125, -0.1033172607421875, -0.093536376953125, -0.0837554931640625, -0.073974609375, -0.0641937255859375, -0.054412841796875, -0.0446319580078125, -0.03485107421875, -0.0250701904296875, -0.015289306640625, -0.0055084228515625, 0.0042724609375, 0.0140533447265625, 0.023834228515625, 0.0336151123046875, 0.04339599609375, 0.0531768798828125, 0.062957763671875, 0.0727386474609375, 0.08251953125, 0.0923004150390625, 0.102081298828125, 0.1118621826171875, 0.12164306640625, 0.1314239501953125, 0.141204833984375, 0.1509857177734375, 0.1607666015625, 0.1705474853515625, 0.180328369140625, 0.1901092529296875, 0.19989013671875, 0.2096710205078125, 0.219451904296875, 0.2292327880859375, 0.239013671875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 6.0, 6.0, 10.0, 5.0, 8.0, 6.0, 11.0, 13.0, 24.0, 20.0, 28.0, 41.0, 52.0, 55.0, 66.0, 72.0, 91.0, 77.0, 87.0, 57.0, 53.0, 41.0, 32.0, 28.0, 25.0, 13.0, 20.0, 12.0, 9.0, 7.0, 6.0, 5.0, 6.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.06622314453125, -0.06446170806884766, -0.06270027160644531, -0.06093883514404297, -0.059177398681640625, -0.05741596221923828, -0.05565452575683594, -0.053893089294433594, -0.05213165283203125, -0.050370216369628906, -0.04860877990722656, -0.04684734344482422, -0.045085906982421875, -0.04332447052001953, -0.04156303405761719, -0.039801597595214844, -0.0380401611328125, -0.036278724670410156, -0.03451728820800781, -0.03275585174560547, -0.030994415283203125, -0.02923297882080078, -0.027471542358398438, -0.025710105895996094, -0.02394866943359375, -0.022187232971191406, -0.020425796508789062, -0.01866436004638672, -0.016902923583984375, -0.015141487121582031, -0.013380050659179688, -0.011618614196777344, -0.009857177734375, -0.008095741271972656, -0.0063343048095703125, -0.004572868347167969, -0.002811431884765625, -0.0010499954223632812, 0.0007114410400390625, 0.0024728775024414062, 0.00423431396484375, 0.005995750427246094, 0.0077571868896484375, 0.009518623352050781, 0.011280059814453125, 0.013041496276855469, 0.014802932739257812, 0.016564369201660156, 0.0183258056640625, 0.020087242126464844, 0.021848678588867188, 0.02361011505126953, 0.025371551513671875, 0.02713298797607422, 0.028894424438476562, 0.030655860900878906, 0.03241729736328125, 0.034178733825683594, 0.03594017028808594, 0.03770160675048828, 0.039463043212890625, 0.04122447967529297, 0.04298591613769531, 0.044747352600097656, 0.0465087890625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 13.0, 29.0, 45.0, 108.0, 186.0, 268.0, 169.0, 99.0, 58.0, 19.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6685404777526855, -2.583641767501831, -2.4987430572509766, -2.413844108581543, -2.3289453983306885, -2.244046688079834, -2.1591479778289795, -2.074249267578125, -1.989350438117981, -1.9044517278671265, -1.8195528984069824, -1.734654188156128, -1.6497554779052734, -1.5648566484451294, -1.479957938194275, -1.3950591087341309, -1.3101603984832764, -1.2252616882324219, -1.1403628587722778, -1.0554641485214233, -0.9705653786659241, -0.8856666088104248, -0.8007678985595703, -0.715869128704071, -0.6309703588485718, -0.5460715889930725, -0.46117284893989563, -0.37627410888671875, -0.2913753390312195, -0.20647656917572021, -0.12157785892486572, -0.036679089069366455, 0.04821968078613281, 0.1331184357404709, 0.21801719069480896, 0.30291593074798584, 0.3878147006034851, 0.4727134704589844, 0.5576121807098389, 0.6425109505653381, 0.7274097204208374, 0.8123084902763367, 0.8972072601318359, 0.9821059703826904, 1.067004680633545, 1.151903510093689, 1.2368022203445435, 1.3217010498046875, 1.406599760055542, 1.4914984703063965, 1.5763972997665405, 1.661296010017395, 1.746194839477539, 1.8310935497283936, 1.915992259979248, 2.0008909702301025, 2.085789680480957, 2.1706883907318115, 2.255587100982666, 2.3404860496520996, 2.425384759902954, 2.5102834701538086, 2.595182180404663, 2.6800808906555176, 2.764979839324951]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 7.0, 1.0, 9.0, 8.0, 6.0, 9.0, 9.0, 22.0, 8.0, 16.0, 22.0, 15.0, 17.0, 28.0, 28.0, 36.0, 36.0, 36.0, 45.0, 23.0, 38.0, 33.0, 46.0, 38.0, 40.0, 42.0, 32.0, 33.0, 44.0, 26.0, 28.0, 27.0, 27.0, 25.0, 21.0, 20.0, 11.0, 17.0, 12.0, 10.0, 12.0, 8.0, 6.0, 5.0, 5.0, 9.0, 3.0, 4.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5722605586051941, -0.5532446503639221, -0.5342288017272949, -0.515212893486023, -0.49619701504707336, -0.4771811366081238, -0.4581652283668518, -0.4391493499279022, -0.42013347148895264, -0.40111759305000305, -0.3821016848087311, -0.3630858063697815, -0.3440699279308319, -0.3250540494918823, -0.30603814125061035, -0.28702226281166077, -0.2680063545703888, -0.24899046123027802, -0.22997458279132843, -0.21095868945121765, -0.19194281101226807, -0.1729269176721573, -0.1539110243320465, -0.13489514589309692, -0.11587925255298615, -0.09686336666345596, -0.07784748077392578, -0.058831587433815, -0.03981570154428482, -0.02079981565475464, -0.0017839223146438599, 0.017231956124305725, 0.036247849464416504, 0.055263735353946686, 0.07427962124347687, 0.09329551458358765, 0.11231140047311783, 0.131327286362648, 0.1503431797027588, 0.16935905814170837, 0.18837495148181915, 0.20739084482192993, 0.22640672326087952, 0.2454226166009903, 0.2644385099411011, 0.28345438838005066, 0.30247026681900024, 0.3214861750602722, 0.3405020534992218, 0.3595179319381714, 0.37853384017944336, 0.39754971861839294, 0.41656559705734253, 0.4355815052986145, 0.4545973837375641, 0.47361326217651367, 0.49262917041778564, 0.5116450786590576, 0.5306609272956848, 0.5496768355369568, 0.5686927437782288, 0.587708592414856, 0.6067245006561279, 0.6257404088973999, 0.6447562575340271]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 5.0, 10.0, 11.0, 9.0, 35.0, 29.0, 50.0, 91.0, 133.0, 220.0, 285.0, 417.0, 678.0, 1131.0, 1914.0, 3648.0, 7258.0, 16128.0, 47153.0, 227644.0, 602791.0, 90321.0, 26761.0, 10152.0, 5090.0, 2687.0, 1441.0, 866.0, 559.0, 338.0, 212.0, 162.0, 117.0, 62.0, 51.0, 31.0, 17.0, 14.0, 11.0, 5.0, 7.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.935546875, -0.9065322875976562, -0.8775177001953125, -0.8485031127929688, -0.819488525390625, -0.7904739379882812, -0.7614593505859375, -0.7324447631835938, -0.70343017578125, -0.6744155883789062, -0.6454010009765625, -0.6163864135742188, -0.587371826171875, -0.5583572387695312, -0.5293426513671875, -0.5003280639648438, -0.4713134765625, -0.44229888916015625, -0.4132843017578125, -0.38426971435546875, -0.355255126953125, -0.32624053955078125, -0.2972259521484375, -0.26821136474609375, -0.23919677734375, -0.21018218994140625, -0.1811676025390625, -0.15215301513671875, -0.123138427734375, -0.09412384033203125, -0.0651092529296875, -0.03609466552734375, -0.007080078125, 0.02193450927734375, 0.0509490966796875, 0.07996368408203125, 0.108978271484375, 0.13799285888671875, 0.1670074462890625, 0.19602203369140625, 0.22503662109375, 0.25405120849609375, 0.2830657958984375, 0.31208038330078125, 0.341094970703125, 0.37010955810546875, 0.3991241455078125, 0.42813873291015625, 0.4571533203125, 0.48616790771484375, 0.5151824951171875, 0.5441970825195312, 0.573211669921875, 0.6022262573242188, 0.6312408447265625, 0.6602554321289062, 0.68927001953125, 0.7182846069335938, 0.7472991943359375, 0.7763137817382812, 0.805328369140625, 0.8343429565429688, 0.8633575439453125, 0.8923721313476562, 0.92138671875]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 2.0, 7.0, 11.0, 9.0, 7.0, 9.0, 12.0, 12.0, 21.0, 17.0, 12.0, 23.0, 32.0, 29.0, 31.0, 42.0, 41.0, 46.0, 47.0, 61.0, 62.0, 62.0, 49.0, 39.0, 46.0, 44.0, 25.0, 30.0, 24.0, 36.0, 13.0, 15.0, 15.0, 10.0, 11.0, 8.0, 6.0, 5.0, 9.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-4.36328125, -4.2236328125, -4.083984375, -3.9443359375, -3.8046875, -3.6650390625, -3.525390625, -3.3857421875, -3.24609375, -3.1064453125, -2.966796875, -2.8271484375, -2.6875, -2.5478515625, -2.408203125, -2.2685546875, -2.12890625, -1.9892578125, -1.849609375, -1.7099609375, -1.5703125, -1.4306640625, -1.291015625, -1.1513671875, -1.01171875, -0.8720703125, -0.732421875, -0.5927734375, -0.453125, -0.3134765625, -0.173828125, -0.0341796875, 0.10546875, 0.2451171875, 0.384765625, 0.5244140625, 0.6640625, 0.8037109375, 0.943359375, 1.0830078125, 1.22265625, 1.3623046875, 1.501953125, 1.6416015625, 1.78125, 1.9208984375, 2.060546875, 2.2001953125, 2.33984375, 2.4794921875, 2.619140625, 2.7587890625, 2.8984375, 3.0380859375, 3.177734375, 3.3173828125, 3.45703125, 3.5966796875, 3.736328125, 3.8759765625, 4.015625, 4.1552734375, 4.294921875, 4.4345703125, 4.57421875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 9.0, 8.0, 7.0, 7.0, 6.0, 16.0, 19.0, 19.0, 20.0, 22.0, 35.0, 38.0, 49.0, 66.0, 93.0, 109.0, 215.0, 468.0, 1372.0, 5561.0, 42980.0, 895651.0, 89831.0, 8674.0, 1753.0, 591.0, 263.0, 155.0, 103.0, 75.0, 64.0, 47.0, 43.0, 34.0, 25.0, 19.0, 18.0, 19.0, 12.0, 10.0, 8.0, 6.0, 4.0, 8.0, 6.0, 7.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2421875, -2.168975830078125, -2.09576416015625, -2.022552490234375, -1.9493408203125, -1.876129150390625, -1.80291748046875, -1.729705810546875, -1.656494140625, -1.583282470703125, -1.51007080078125, -1.436859130859375, -1.3636474609375, -1.290435791015625, -1.21722412109375, -1.144012451171875, -1.07080078125, -0.997589111328125, -0.92437744140625, -0.851165771484375, -0.7779541015625, -0.704742431640625, -0.63153076171875, -0.558319091796875, -0.485107421875, -0.411895751953125, -0.33868408203125, -0.265472412109375, -0.1922607421875, -0.119049072265625, -0.04583740234375, 0.027374267578125, 0.1005859375, 0.173797607421875, 0.24700927734375, 0.320220947265625, 0.3934326171875, 0.466644287109375, 0.53985595703125, 0.613067626953125, 0.686279296875, 0.759490966796875, 0.83270263671875, 0.905914306640625, 0.9791259765625, 1.052337646484375, 1.12554931640625, 1.198760986328125, 1.27197265625, 1.345184326171875, 1.41839599609375, 1.491607666015625, 1.5648193359375, 1.638031005859375, 1.71124267578125, 1.784454345703125, 1.857666015625, 1.930877685546875, 2.00408935546875, 2.077301025390625, 2.1505126953125, 2.223724365234375, 2.29693603515625, 2.370147705078125, 2.443359375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 9.0, 6.0, 6.0, 6.0, 5.0, 4.0, 13.0, 12.0, 14.0, 9.0, 13.0, 22.0, 19.0, 22.0, 26.0, 33.0, 33.0, 39.0, 40.0, 50.0, 47.0, 44.0, 50.0, 41.0, 41.0, 37.0, 40.0, 27.0, 35.0, 29.0, 25.0, 26.0, 24.0, 26.0, 22.0, 18.0, 14.0, 14.0, 10.0, 4.0, 9.0, 7.0, 7.0, 3.0, 5.0, 4.0, 7.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.59375, -3.476409912109375, -3.35906982421875, -3.241729736328125, -3.1243896484375, -3.007049560546875, -2.88970947265625, -2.772369384765625, -2.655029296875, -2.537689208984375, -2.42034912109375, -2.303009033203125, -2.1856689453125, -2.068328857421875, -1.95098876953125, -1.833648681640625, -1.71630859375, -1.598968505859375, -1.48162841796875, -1.364288330078125, -1.2469482421875, -1.129608154296875, -1.01226806640625, -0.894927978515625, -0.777587890625, -0.660247802734375, -0.54290771484375, -0.425567626953125, -0.3082275390625, -0.190887451171875, -0.07354736328125, 0.043792724609375, 0.1611328125, 0.278472900390625, 0.39581298828125, 0.513153076171875, 0.6304931640625, 0.747833251953125, 0.86517333984375, 0.982513427734375, 1.099853515625, 1.217193603515625, 1.33453369140625, 1.451873779296875, 1.5692138671875, 1.686553955078125, 1.80389404296875, 1.921234130859375, 2.03857421875, 2.155914306640625, 2.27325439453125, 2.390594482421875, 2.5079345703125, 2.625274658203125, 2.74261474609375, 2.859954833984375, 2.977294921875, 3.094635009765625, 3.21197509765625, 3.329315185546875, 3.4466552734375, 3.563995361328125, 3.68133544921875, 3.798675537109375, 3.916015625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 8.0, 7.0, 9.0, 16.0, 27.0, 43.0, 64.0, 85.0, 159.0, 257.0, 535.0, 1128.0, 2568.0, 7233.0, 57368.0, 944491.0, 25461.0, 5174.0, 1964.0, 877.0, 459.0, 223.0, 135.0, 97.0, 56.0, 32.0, 13.0, 14.0, 14.0, 10.0, 5.0, 3.0, 7.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54638671875, -0.5304832458496094, -0.5145797729492188, -0.4986763000488281, -0.4827728271484375, -0.4668693542480469, -0.45096588134765625, -0.4350624084472656, -0.419158935546875, -0.4032554626464844, -0.38735198974609375, -0.3714485168457031, -0.3555450439453125, -0.3396415710449219, -0.32373809814453125, -0.3078346252441406, -0.29193115234375, -0.2760276794433594, -0.26012420654296875, -0.24422073364257812, -0.2283172607421875, -0.21241378784179688, -0.19651031494140625, -0.18060684204101562, -0.164703369140625, -0.14879989624023438, -0.13289642333984375, -0.11699295043945312, -0.1010894775390625, -0.08518600463867188, -0.06928253173828125, -0.053379058837890625, -0.0374755859375, -0.021572113037109375, -0.00566864013671875, 0.010234832763671875, 0.0261383056640625, 0.042041778564453125, 0.05794525146484375, 0.07384872436523438, 0.089752197265625, 0.10565567016601562, 0.12155914306640625, 0.13746261596679688, 0.1533660888671875, 0.16926956176757812, 0.18517303466796875, 0.20107650756835938, 0.21697998046875, 0.23288345336914062, 0.24878692626953125, 0.2646903991699219, 0.2805938720703125, 0.2964973449707031, 0.31240081787109375, 0.3283042907714844, 0.344207763671875, 0.3601112365722656, 0.37601470947265625, 0.3919181823730469, 0.4078216552734375, 0.4237251281738281, 0.43962860107421875, 0.4555320739746094, 0.471435546875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 11.0, 12.0, 19.0, 58.0, 132.0, 567.0, 112.0, 34.0, 15.0, 13.0, 8.0, 4.0, 6.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.587671279907227e-05, -7.338542491197586e-05, -7.089413702487946e-05, -6.840284913778305e-05, -6.591156125068665e-05, -6.342027336359024e-05, -6.0928985476493835e-05, -5.843769758939743e-05, -5.5946409702301025e-05, -5.345512181520462e-05, -5.0963833928108215e-05, -4.847254604101181e-05, -4.5981258153915405e-05, -4.3489970266819e-05, -4.0998682379722595e-05, -3.850739449262619e-05, -3.6016106605529785e-05, -3.352481871843338e-05, -3.1033530831336975e-05, -2.854224294424057e-05, -2.6050955057144165e-05, -2.355966717004776e-05, -2.1068379282951355e-05, -1.857709139585495e-05, -1.6085803508758545e-05, -1.359451562166214e-05, -1.1103227734565735e-05, -8.61193984746933e-06, -6.120651960372925e-06, -3.6293640732765198e-06, -1.1380761861801147e-06, 1.3532117009162903e-06, 3.844499588012695e-06, 6.3357874751091e-06, 8.827075362205505e-06, 1.131836324930191e-05, 1.3809651136398315e-05, 1.630093902349472e-05, 1.8792226910591125e-05, 2.128351479768753e-05, 2.3774802684783936e-05, 2.626609057188034e-05, 2.8757378458976746e-05, 3.124866634607315e-05, 3.3739954233169556e-05, 3.623124212026596e-05, 3.8722530007362366e-05, 4.121381789445877e-05, 4.3705105781555176e-05, 4.619639366865158e-05, 4.8687681555747986e-05, 5.117896944284439e-05, 5.3670257329940796e-05, 5.61615452170372e-05, 5.8652833104133606e-05, 6.114412099123001e-05, 6.363540887832642e-05, 6.612669676542282e-05, 6.861798465251923e-05, 7.110927253961563e-05, 7.360056042671204e-05, 7.609184831380844e-05, 7.858313620090485e-05, 8.107442408800125e-05, 8.356571197509766e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 9.0, 17.0, 26.0, 40.0, 72.0, 105.0, 217.0, 374.0, 843.0, 2119.0, 7977.0, 410545.0, 614332.0, 8082.0, 2016.0, 806.0, 412.0, 214.0, 117.0, 87.0, 46.0, 27.0, 15.0, 18.0, 7.0, 5.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.685546875, -0.6653900146484375, -0.645233154296875, -0.6250762939453125, -0.60491943359375, -0.5847625732421875, -0.564605712890625, -0.5444488525390625, -0.5242919921875, -0.5041351318359375, -0.483978271484375, -0.4638214111328125, -0.44366455078125, -0.4235076904296875, -0.403350830078125, -0.3831939697265625, -0.363037109375, -0.3428802490234375, -0.322723388671875, -0.3025665283203125, -0.28240966796875, -0.2622528076171875, -0.242095947265625, -0.2219390869140625, -0.2017822265625, -0.1816253662109375, -0.161468505859375, -0.1413116455078125, -0.12115478515625, -0.1009979248046875, -0.080841064453125, -0.0606842041015625, -0.04052734375, -0.0203704833984375, -0.000213623046875, 0.0199432373046875, 0.04010009765625, 0.0602569580078125, 0.080413818359375, 0.1005706787109375, 0.1207275390625, 0.1408843994140625, 0.161041259765625, 0.1811981201171875, 0.20135498046875, 0.2215118408203125, 0.241668701171875, 0.2618255615234375, 0.281982421875, 0.3021392822265625, 0.322296142578125, 0.3424530029296875, 0.36260986328125, 0.3827667236328125, 0.402923583984375, 0.4230804443359375, 0.4432373046875, 0.4633941650390625, 0.483551025390625, 0.5037078857421875, 0.52386474609375, 0.5440216064453125, 0.564178466796875, 0.5843353271484375, 0.6044921875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 3.0, 11.0, 7.0, 21.0, 38.0, 69.0, 475.0, 247.0, 54.0, 39.0, 17.0, 7.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.232421875, -0.22464752197265625, -0.2168731689453125, -0.20909881591796875, -0.201324462890625, -0.19355010986328125, -0.1857757568359375, -0.17800140380859375, -0.17022705078125, -0.16245269775390625, -0.1546783447265625, -0.14690399169921875, -0.139129638671875, -0.13135528564453125, -0.1235809326171875, -0.11580657958984375, -0.1080322265625, -0.10025787353515625, -0.0924835205078125, -0.08470916748046875, -0.076934814453125, -0.06916046142578125, -0.0613861083984375, -0.05361175537109375, -0.04583740234375, -0.03806304931640625, -0.0302886962890625, -0.02251434326171875, -0.014739990234375, -0.00696563720703125, 0.0008087158203125, 0.00858306884765625, 0.016357421875, 0.02413177490234375, 0.0319061279296875, 0.03968048095703125, 0.047454833984375, 0.05522918701171875, 0.0630035400390625, 0.07077789306640625, 0.07855224609375, 0.08632659912109375, 0.0941009521484375, 0.10187530517578125, 0.109649658203125, 0.11742401123046875, 0.1251983642578125, 0.13297271728515625, 0.1407470703125, 0.14852142333984375, 0.1562957763671875, 0.16407012939453125, 0.171844482421875, 0.17961883544921875, 0.1873931884765625, 0.19516754150390625, 0.20294189453125, 0.21071624755859375, 0.2184906005859375, 0.22626495361328125, 0.234039306640625, 0.24181365966796875, 0.2495880126953125, 0.25736236572265625, 0.26513671875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 20.0, 95.0, 338.0, 409.0, 130.0, 20.0, 3.0, 2.0], "bins": [-17.6982421875, -17.39818572998047, -17.098129272460938, -16.79807472229004, -16.498018264770508, -16.197961807250977, -15.897905349731445, -15.59784984588623, -15.2977933883667, -14.997736930847168, -14.697681427001953, -14.397624969482422, -14.097569465637207, -13.797513008117676, -13.497457504272461, -13.19740104675293, -12.897344589233398, -12.597288131713867, -12.297232627868652, -11.997176170349121, -11.697120666503906, -11.397064208984375, -11.097007751464844, -10.796952247619629, -10.496896743774414, -10.196840286254883, -9.896784782409668, -9.596728324890137, -9.296672821044922, -8.99661636352539, -8.69655990600586, -8.396504402160645, -8.096447944641113, -7.79639196395874, -7.496335983276367, -7.196279525756836, -6.896223545074463, -6.59616756439209, -6.296111583709717, -5.996055603027344, -5.6959991455078125, -5.3959431648254395, -5.095887184143066, -4.795830726623535, -4.495774745941162, -4.195718765258789, -3.895662784576416, -3.595606565475464, -3.2955503463745117, -2.9954943656921387, -2.6954381465911865, -2.3953821659088135, -2.0953259468078613, -1.7952699661254883, -1.4952139854431152, -1.195157766342163, -0.8951019048690796, -0.595045804977417, -0.29498976469039917, 0.005066275596618652, 0.30512237548828125, 0.6051784753799438, 0.9052344560623169, 1.205290675163269, 1.505346655845642]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 6.0, 3.0, 6.0, 8.0, 8.0, 11.0, 18.0, 11.0, 22.0, 21.0, 27.0, 24.0, 23.0, 29.0, 33.0, 44.0, 23.0, 40.0, 43.0, 38.0, 53.0, 53.0, 44.0, 41.0, 49.0, 41.0, 30.0, 39.0, 38.0, 25.0, 24.0, 21.0, 15.0, 14.0, 12.0, 11.0, 16.0, 9.0, 5.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.079907417297363, -6.875357151031494, -6.670806884765625, -6.466256141662598, -6.2617058753967285, -6.057155609130859, -5.85260534286499, -5.648055076599121, -5.443504333496094, -5.238954067230225, -5.0344038009643555, -4.829853057861328, -4.625302791595459, -4.42075252532959, -4.216202259063721, -4.011651992797852, -3.8071017265319824, -3.6025514602661133, -3.398000955581665, -3.193450689315796, -2.9889001846313477, -2.7843499183654785, -2.5797996520996094, -2.3752493858337402, -2.170698881149292, -1.9661484956741333, -1.7615981101989746, -1.5570478439331055, -1.3524974584579468, -1.147947072982788, -0.943396806716919, -0.7388464212417603, -0.5342965126037598, -0.32974615693092346, -0.12519580125808716, 0.07935452461242676, 0.28390491008758545, 0.48845529556274414, 0.6930055618286133, 0.897555947303772, 1.1021063327789307, 1.3066567182540894, 1.511207103729248, 1.7157573699951172, 1.9203077554702759, 2.1248581409454346, 2.3294084072113037, 2.533958911895752, 2.738509178161621, 2.9430594444274902, 3.1476099491119385, 3.3521602153778076, 3.556710720062256, 3.761260986328125, 3.965811252593994, 4.170361518859863, 4.374912261962891, 4.57946252822876, 4.784012794494629, 4.988563537597656, 5.193113803863525, 5.3976640701293945, 5.602214336395264, 5.806764602661133, 6.011314868927002]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 10.0, 4.0, 8.0, 13.0, 10.0, 25.0, 23.0, 33.0, 65.0, 83.0, 162.0, 310.0, 606.0, 1253.0, 2667.0, 5957.0, 17282.0, 134652.0, 2299903.0, 1626333.0, 79241.0, 14458.0, 5626.0, 2707.0, 1247.0, 697.0, 357.0, 191.0, 122.0, 91.0, 42.0, 23.0, 14.0, 12.0, 22.0, 8.0, 6.0, 5.0, 5.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.8447265625, -1.79034423828125, -1.7359619140625, -1.68157958984375, -1.627197265625, -1.57281494140625, -1.5184326171875, -1.46405029296875, -1.40966796875, -1.35528564453125, -1.3009033203125, -1.24652099609375, -1.192138671875, -1.13775634765625, -1.0833740234375, -1.02899169921875, -0.974609375, -0.92022705078125, -0.8658447265625, -0.81146240234375, -0.757080078125, -0.70269775390625, -0.6483154296875, -0.59393310546875, -0.53955078125, -0.48516845703125, -0.4307861328125, -0.37640380859375, -0.322021484375, -0.26763916015625, -0.2132568359375, -0.15887451171875, -0.1044921875, -0.05010986328125, 0.0042724609375, 0.05865478515625, 0.113037109375, 0.16741943359375, 0.2218017578125, 0.27618408203125, 0.33056640625, 0.38494873046875, 0.4393310546875, 0.49371337890625, 0.548095703125, 0.60247802734375, 0.6568603515625, 0.71124267578125, 0.765625, 0.82000732421875, 0.8743896484375, 0.92877197265625, 0.983154296875, 1.03753662109375, 1.0919189453125, 1.14630126953125, 1.20068359375, 1.25506591796875, 1.3094482421875, 1.36383056640625, 1.418212890625, 1.47259521484375, 1.5269775390625, 1.58135986328125, 1.6357421875]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 0.0, 4.0, 3.0, 3.0, 11.0, 8.0, 15.0, 15.0, 9.0, 24.0, 18.0, 24.0, 24.0, 39.0, 45.0, 35.0, 45.0, 48.0, 45.0, 38.0, 44.0, 60.0, 44.0, 56.0, 35.0, 37.0, 38.0, 27.0, 37.0, 27.0, 23.0, 16.0, 22.0, 23.0, 11.0, 9.0, 13.0, 3.0, 9.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7587890625, -0.7324447631835938, -0.7061004638671875, -0.6797561645507812, -0.653411865234375, -0.6270675659179688, -0.6007232666015625, -0.5743789672851562, -0.54803466796875, -0.5216903686523438, -0.4953460693359375, -0.46900177001953125, -0.442657470703125, -0.41631317138671875, -0.3899688720703125, -0.36362457275390625, -0.3372802734375, -0.31093597412109375, -0.2845916748046875, -0.25824737548828125, -0.231903076171875, -0.20555877685546875, -0.1792144775390625, -0.15287017822265625, -0.12652587890625, -0.10018157958984375, -0.0738372802734375, -0.04749298095703125, -0.021148681640625, 0.00519561767578125, 0.0315399169921875, 0.05788421630859375, 0.084228515625, 0.11057281494140625, 0.1369171142578125, 0.16326141357421875, 0.189605712890625, 0.21595001220703125, 0.2422943115234375, 0.26863861083984375, 0.29498291015625, 0.32132720947265625, 0.3476715087890625, 0.37401580810546875, 0.400360107421875, 0.42670440673828125, 0.4530487060546875, 0.47939300537109375, 0.5057373046875, 0.5320816040039062, 0.5584259033203125, 0.5847702026367188, 0.611114501953125, 0.6374588012695312, 0.6638031005859375, 0.6901473999023438, 0.71649169921875, 0.7428359985351562, 0.7691802978515625, 0.7955245971679688, 0.821868896484375, 0.8482131958007812, 0.8745574951171875, 0.9009017944335938, 0.92724609375]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 11.0, 6.0, 9.0, 14.0, 41.0, 112.0, 1255.0, 4192232.0, 422.0, 82.0, 32.0, 13.0, 12.0, 9.0, 6.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.578125, -17.783447265625, -16.98876953125, -16.194091796875, -15.3994140625, -14.604736328125, -13.81005859375, -13.015380859375, -12.220703125, -11.426025390625, -10.63134765625, -9.836669921875, -9.0419921875, -8.247314453125, -7.45263671875, -6.657958984375, -5.86328125, -5.068603515625, -4.27392578125, -3.479248046875, -2.6845703125, -1.889892578125, -1.09521484375, -0.300537109375, 0.494140625, 1.288818359375, 2.08349609375, 2.878173828125, 3.6728515625, 4.467529296875, 5.26220703125, 6.056884765625, 6.8515625, 7.646240234375, 8.44091796875, 9.235595703125, 10.0302734375, 10.824951171875, 11.61962890625, 12.414306640625, 13.208984375, 14.003662109375, 14.79833984375, 15.593017578125, 16.3876953125, 17.182373046875, 17.97705078125, 18.771728515625, 19.56640625, 20.361083984375, 21.15576171875, 21.950439453125, 22.7451171875, 23.539794921875, 24.33447265625, 25.129150390625, 25.923828125, 26.718505859375, 27.51318359375, 28.307861328125, 29.1025390625, 29.897216796875, 30.69189453125, 31.486572265625, 32.28125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 8.0, 7.0, 9.0, 7.0, 14.0, 17.0, 29.0, 31.0, 49.0, 79.0, 142.0, 304.0, 734.0, 1134.0, 736.0, 333.0, 148.0, 86.0, 65.0, 41.0, 24.0, 26.0, 10.0, 11.0, 4.0, 7.0, 5.0, 3.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.578125, -0.5627288818359375, -0.547332763671875, -0.5319366455078125, -0.51654052734375, -0.5011444091796875, -0.485748291015625, -0.4703521728515625, -0.4549560546875, -0.4395599365234375, -0.424163818359375, -0.4087677001953125, -0.39337158203125, -0.3779754638671875, -0.362579345703125, -0.3471832275390625, -0.331787109375, -0.3163909912109375, -0.300994873046875, -0.2855987548828125, -0.27020263671875, -0.2548065185546875, -0.239410400390625, -0.2240142822265625, -0.2086181640625, -0.1932220458984375, -0.177825927734375, -0.1624298095703125, -0.14703369140625, -0.1316375732421875, -0.116241455078125, -0.1008453369140625, -0.08544921875, -0.0700531005859375, -0.054656982421875, -0.0392608642578125, -0.02386474609375, -0.0084686279296875, 0.006927490234375, 0.0223236083984375, 0.0377197265625, 0.0531158447265625, 0.068511962890625, 0.0839080810546875, 0.09930419921875, 0.1147003173828125, 0.130096435546875, 0.1454925537109375, 0.160888671875, 0.1762847900390625, 0.191680908203125, 0.2070770263671875, 0.22247314453125, 0.2378692626953125, 0.253265380859375, 0.2686614990234375, 0.2840576171875, 0.2994537353515625, 0.314849853515625, 0.3302459716796875, 0.34564208984375, 0.3610382080078125, 0.376434326171875, 0.3918304443359375, 0.4072265625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 5.0, 5.0, 6.0, 11.0, 15.0, 12.0, 22.0, 23.0, 21.0, 39.0, 51.0, 64.0, 73.0, 83.0, 80.0, 105.0, 74.0, 64.0, 54.0, 37.0, 28.0, 25.0, 26.0, 19.0, 19.0, 9.0, 4.0, 6.0, 7.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.18211829662323, -1.1478058099746704, -1.1134932041168213, -1.0791807174682617, -1.0448682308197021, -1.0105557441711426, -0.9762431979179382, -0.9419306516647339, -0.9076181650161743, -0.8733056783676147, -0.8389931321144104, -0.804680585861206, -0.7703680992126465, -0.7360556125640869, -0.7017430663108826, -0.6674305200576782, -0.6331180334091187, -0.5988055467605591, -0.5644930005073547, -0.5301804542541504, -0.4958679676055908, -0.46155545115470886, -0.4272429347038269, -0.39293041825294495, -0.358617901802063, -0.32430538535118103, -0.2899928689002991, -0.2556803524494171, -0.22136783599853516, -0.1870553195476532, -0.15274280309677124, -0.11843028664588928, -0.08411788940429688, -0.04980537295341492, -0.015492856502532959, 0.018819659948349, 0.05313217639923096, 0.08744469285011292, 0.12175720930099487, 0.15606972575187683, 0.1903822422027588, 0.22469475865364075, 0.2590072751045227, 0.29331979155540466, 0.3276323080062866, 0.3619448244571686, 0.39625734090805054, 0.4305698573589325, 0.46488237380981445, 0.4991948902606964, 0.5335074067115784, 0.5678199529647827, 0.6021324396133423, 0.6364449262619019, 0.6707574725151062, 0.7050700187683105, 0.7393825054168701, 0.7736949920654297, 0.808007538318634, 0.8423200845718384, 0.876632571220398, 0.9109450578689575, 0.9452576041221619, 0.9795701503753662, 1.0138826370239258]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 1.0, 6.0, 6.0, 7.0, 11.0, 19.0, 15.0, 18.0, 15.0, 17.0, 28.0, 29.0, 39.0, 40.0, 40.0, 34.0, 31.0, 42.0, 38.0, 56.0, 55.0, 52.0, 44.0, 46.0, 39.0, 31.0, 31.0, 34.0, 31.0, 27.0, 19.0, 16.0, 17.0, 15.0, 12.0, 10.0, 10.0, 4.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9027748107910156, -0.8754429221153259, -0.8481109738349915, -0.8207790851593018, -0.7934471964836121, -0.7661153078079224, -0.7387833595275879, -0.7114514708518982, -0.6841195821762085, -0.6567876935005188, -0.6294557452201843, -0.6021238565444946, -0.5747919678688049, -0.5474600791931152, -0.5201281309127808, -0.49279624223709106, -0.465464323759079, -0.4381324052810669, -0.4108005166053772, -0.3834685981273651, -0.3561367094516754, -0.32880479097366333, -0.30147290229797363, -0.27414098381996155, -0.24680908024311066, -0.21947717666625977, -0.19214527308940887, -0.16481336951255798, -0.1374814510345459, -0.11014954745769501, -0.08281764388084412, -0.055485740303993225, -0.028153836727142334, -0.0008219312876462936, 0.026509974151849747, 0.053841881453990936, 0.08117378503084183, 0.10850569605827332, 0.1358375996351242, 0.1631695032119751, 0.190501406788826, 0.21783331036567688, 0.24516521394252777, 0.27249711751937866, 0.29982903599739075, 0.32716095447540283, 0.35449284315109253, 0.3818247318267822, 0.4091566503047943, 0.4364885687828064, 0.4638204574584961, 0.4911523759365082, 0.5184842944145203, 0.54581618309021, 0.5731480717658997, 0.6004799604415894, 0.6278119087219238, 0.6551437973976135, 0.682475745677948, 0.7098076343536377, 0.7371395230293274, 0.7644714117050171, 0.7918033599853516, 0.8191352486610413, 0.846467137336731]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 20.0, 16.0, 26.0, 38.0, 62.0, 95.0, 142.0, 226.0, 423.0, 645.0, 995.0, 1615.0, 2716.0, 4771.0, 9139.0, 19271.0, 45571.0, 119927.0, 335140.0, 314787.0, 111633.0, 43090.0, 18149.0, 8658.0, 4555.0, 2687.0, 1615.0, 910.0, 597.0, 366.0, 239.0, 164.0, 87.0, 68.0, 44.0, 24.0, 15.0, 5.0, 7.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.38330078125, -0.3709220886230469, -0.35854339599609375, -0.3461647033691406, -0.3337860107421875, -0.3214073181152344, -0.30902862548828125, -0.2966499328613281, -0.284271240234375, -0.2718925476074219, -0.25951385498046875, -0.24713516235351562, -0.2347564697265625, -0.22237777709960938, -0.20999908447265625, -0.19762039184570312, -0.18524169921875, -0.17286300659179688, -0.16048431396484375, -0.14810562133789062, -0.1357269287109375, -0.12334823608398438, -0.11096954345703125, -0.09859085083007812, -0.086212158203125, -0.07383346557617188, -0.06145477294921875, -0.049076080322265625, -0.0366973876953125, -0.024318695068359375, -0.01194000244140625, 0.000438690185546875, 0.0128173828125, 0.025196075439453125, 0.03757476806640625, 0.049953460693359375, 0.0623321533203125, 0.07471084594726562, 0.08708953857421875, 0.09946823120117188, 0.111846923828125, 0.12422561645507812, 0.13660430908203125, 0.14898300170898438, 0.1613616943359375, 0.17374038696289062, 0.18611907958984375, 0.19849777221679688, 0.21087646484375, 0.22325515747070312, 0.23563385009765625, 0.24801254272460938, 0.2603912353515625, 0.2727699279785156, 0.28514862060546875, 0.2975273132324219, 0.309906005859375, 0.3222846984863281, 0.33466339111328125, 0.3470420837402344, 0.3594207763671875, 0.3717994689941406, 0.38417816162109375, 0.3965568542480469, 0.408935546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 1.0, 4.0, 3.0, 5.0, 7.0, 7.0, 16.0, 13.0, 18.0, 15.0, 23.0, 27.0, 38.0, 33.0, 43.0, 42.0, 41.0, 64.0, 41.0, 50.0, 77.0, 72.0, 38.0, 51.0, 31.0, 39.0, 41.0, 31.0, 25.0, 22.0, 21.0, 12.0, 17.0, 7.0, 13.0, 7.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59326171875, -0.572021484375, -0.55078125, -0.529541015625, -0.50830078125, -0.487060546875, -0.4658203125, -0.444580078125, -0.42333984375, -0.402099609375, -0.380859375, -0.359619140625, -0.33837890625, -0.317138671875, -0.2958984375, -0.274658203125, -0.25341796875, -0.232177734375, -0.2109375, -0.189697265625, -0.16845703125, -0.147216796875, -0.1259765625, -0.104736328125, -0.08349609375, -0.062255859375, -0.041015625, -0.019775390625, 0.00146484375, 0.022705078125, 0.0439453125, 0.065185546875, 0.08642578125, 0.107666015625, 0.12890625, 0.150146484375, 0.17138671875, 0.192626953125, 0.2138671875, 0.235107421875, 0.25634765625, 0.277587890625, 0.298828125, 0.320068359375, 0.34130859375, 0.362548828125, 0.3837890625, 0.405029296875, 0.42626953125, 0.447509765625, 0.46875, 0.489990234375, 0.51123046875, 0.532470703125, 0.5537109375, 0.574951171875, 0.59619140625, 0.617431640625, 0.638671875, 0.659912109375, 0.68115234375, 0.702392578125, 0.7236328125, 0.744873046875, 0.76611328125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 4.0, 7.0, 5.0, 4.0, 4.0, 14.0, 14.0, 17.0, 28.0, 43.0, 41.0, 69.0, 106.0, 198.0, 292.0, 513.0, 960.0, 1886.0, 4221.0, 10768.0, 31842.0, 112604.0, 415984.0, 339779.0, 87531.0, 25491.0, 8856.0, 3541.0, 1629.0, 840.0, 482.0, 264.0, 176.0, 103.0, 81.0, 58.0, 21.0, 21.0, 23.0, 9.0, 11.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.362548828125, -0.3485527038574219, -0.33455657958984375, -0.3205604553222656, -0.3065643310546875, -0.2925682067871094, -0.27857208251953125, -0.2645759582519531, -0.250579833984375, -0.23658370971679688, -0.22258758544921875, -0.20859146118164062, -0.1945953369140625, -0.18059921264648438, -0.16660308837890625, -0.15260696411132812, -0.13861083984375, -0.12461471557617188, -0.11061859130859375, -0.09662246704101562, -0.0826263427734375, -0.06863021850585938, -0.05463409423828125, -0.040637969970703125, -0.026641845703125, -0.012645721435546875, 0.00135040283203125, 0.015346527099609375, 0.0293426513671875, 0.043338775634765625, 0.05733489990234375, 0.07133102416992188, 0.0853271484375, 0.09932327270507812, 0.11331939697265625, 0.12731552124023438, 0.1413116455078125, 0.15530776977539062, 0.16930389404296875, 0.18330001831054688, 0.197296142578125, 0.21129226684570312, 0.22528839111328125, 0.23928451538085938, 0.2532806396484375, 0.2672767639160156, 0.28127288818359375, 0.2952690124511719, 0.30926513671875, 0.3232612609863281, 0.33725738525390625, 0.3512535095214844, 0.3652496337890625, 0.3792457580566406, 0.39324188232421875, 0.4072380065917969, 0.421234130859375, 0.4352302551269531, 0.44922637939453125, 0.4632225036621094, 0.4772186279296875, 0.4912147521972656, 0.5052108764648438, 0.5192070007324219, 0.533203125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 4.0, 9.0, 9.0, 11.0, 13.0, 17.0, 19.0, 22.0, 24.0, 34.0, 14.0, 38.0, 37.0, 44.0, 36.0, 39.0, 52.0, 43.0, 42.0, 54.0, 53.0, 51.0, 42.0, 42.0, 35.0, 31.0, 24.0, 27.0, 23.0, 16.0, 15.0, 17.0, 14.0, 12.0, 8.0, 4.0, 11.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.203125, -1.1669769287109375, -1.130828857421875, -1.0946807861328125, -1.05853271484375, -1.0223846435546875, -0.986236572265625, -0.9500885009765625, -0.9139404296875, -0.8777923583984375, -0.841644287109375, -0.8054962158203125, -0.76934814453125, -0.7332000732421875, -0.697052001953125, -0.6609039306640625, -0.624755859375, -0.5886077880859375, -0.552459716796875, -0.5163116455078125, -0.48016357421875, -0.4440155029296875, -0.407867431640625, -0.3717193603515625, -0.3355712890625, -0.2994232177734375, -0.263275146484375, -0.2271270751953125, -0.19097900390625, -0.1548309326171875, -0.118682861328125, -0.0825347900390625, -0.04638671875, -0.0102386474609375, 0.025909423828125, 0.0620574951171875, 0.09820556640625, 0.1343536376953125, 0.170501708984375, 0.2066497802734375, 0.2427978515625, 0.2789459228515625, 0.315093994140625, 0.3512420654296875, 0.38739013671875, 0.4235382080078125, 0.459686279296875, 0.4958343505859375, 0.531982421875, 0.5681304931640625, 0.604278564453125, 0.6404266357421875, 0.67657470703125, 0.7127227783203125, 0.748870849609375, 0.7850189208984375, 0.8211669921875, 0.8573150634765625, 0.893463134765625, 0.9296112060546875, 0.96575927734375, 1.0019073486328125, 1.038055419921875, 1.0742034912109375, 1.1103515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 6.0, 4.0, 9.0, 13.0, 15.0, 31.0, 42.0, 72.0, 99.0, 129.0, 240.0, 400.0, 580.0, 1064.0, 1947.0, 4093.0, 8964.0, 23950.0, 89336.0, 517381.0, 312763.0, 56466.0, 17051.0, 6676.0, 3186.0, 1697.0, 896.0, 531.0, 346.0, 165.0, 114.0, 98.0, 76.0, 25.0, 25.0, 18.0, 16.0, 11.0, 10.0, 7.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.136962890625, -0.13303184509277344, -0.12910079956054688, -0.1251697540283203, -0.12123870849609375, -0.11730766296386719, -0.11337661743164062, -0.10944557189941406, -0.1055145263671875, -0.10158348083496094, -0.09765243530273438, -0.09372138977050781, -0.08979034423828125, -0.08585929870605469, -0.08192825317382812, -0.07799720764160156, -0.074066162109375, -0.07013511657714844, -0.06620407104492188, -0.06227302551269531, -0.05834197998046875, -0.05441093444824219, -0.050479888916015625, -0.04654884338378906, -0.0426177978515625, -0.03868675231933594, -0.034755706787109375, -0.030824661254882812, -0.02689361572265625, -0.022962570190429688, -0.019031524658203125, -0.015100479125976562, -0.01116943359375, -0.0072383880615234375, -0.003307342529296875, 0.0006237030029296875, 0.00455474853515625, 0.008485794067382812, 0.012416839599609375, 0.016347885131835938, 0.0202789306640625, 0.024209976196289062, 0.028141021728515625, 0.03207206726074219, 0.03600311279296875, 0.03993415832519531, 0.043865203857421875, 0.04779624938964844, 0.051727294921875, 0.05565834045410156, 0.059589385986328125, 0.06352043151855469, 0.06745147705078125, 0.07138252258300781, 0.07531356811523438, 0.07924461364746094, 0.0831756591796875, 0.08710670471191406, 0.09103775024414062, 0.09496879577636719, 0.09889984130859375, 0.10283088684082031, 0.10676193237304688, 0.11069297790527344, 0.1146240234375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 5.0, 5.0, 10.0, 10.0, 19.0, 36.0, 57.0, 87.0, 206.0, 222.0, 139.0, 67.0, 44.0, 28.0, 22.0, 11.0, 8.0, 5.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014293193817138672, -0.00013820268213748932, -0.00013347342610359192, -0.00012874417006969452, -0.00012401491403579712, -0.00011928565800189972, -0.00011455640196800232, -0.00010982714593410492, -0.00010509788990020752, -0.00010036863386631012, -9.563937783241272e-05, -9.091012179851532e-05, -8.618086576461792e-05, -8.145160973072052e-05, -7.672235369682312e-05, -7.199309766292572e-05, -6.726384162902832e-05, -6.253458559513092e-05, -5.780532956123352e-05, -5.307607352733612e-05, -4.834681749343872e-05, -4.361756145954132e-05, -3.888830542564392e-05, -3.415904939174652e-05, -2.942979335784912e-05, -2.470053732395172e-05, -1.997128129005432e-05, -1.5242025256156921e-05, -1.0512769222259521e-05, -5.783513188362122e-06, -1.0542571544647217e-06, 3.6749988794326782e-06, 8.404254913330078e-06, 1.3133510947227478e-05, 1.7862766981124878e-05, 2.2592023015022278e-05, 2.7321279048919678e-05, 3.205053508281708e-05, 3.677979111671448e-05, 4.150904715061188e-05, 4.623830318450928e-05, 5.096755921840668e-05, 5.569681525230408e-05, 6.042607128620148e-05, 6.515532732009888e-05, 6.988458335399628e-05, 7.461383938789368e-05, 7.934309542179108e-05, 8.407235145568848e-05, 8.880160748958588e-05, 9.353086352348328e-05, 9.826011955738068e-05, 0.00010298937559127808, 0.00010771863162517548, 0.00011244788765907288, 0.00011717714369297028, 0.00012190639972686768, 0.00012663565576076508, 0.00013136491179466248, 0.00013609416782855988, 0.00014082342386245728, 0.00014555267989635468, 0.00015028193593025208, 0.00015501119196414948, 0.00015974044799804688]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 4.0, 0.0, 6.0, 4.0, 6.0, 11.0, 15.0, 25.0, 36.0, 95.0, 378.0, 3778.0, 362844.0, 675811.0, 4887.0, 457.0, 104.0, 41.0, 17.0, 10.0, 5.0, 5.0, 3.0, 7.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.57666015625, -0.5606613159179688, -0.5446624755859375, -0.5286636352539062, -0.512664794921875, -0.49666595458984375, -0.4806671142578125, -0.46466827392578125, -0.44866943359375, -0.43267059326171875, -0.4166717529296875, -0.40067291259765625, -0.384674072265625, -0.36867523193359375, -0.3526763916015625, -0.33667755126953125, -0.3206787109375, -0.30467987060546875, -0.2886810302734375, -0.27268218994140625, -0.256683349609375, -0.24068450927734375, -0.2246856689453125, -0.20868682861328125, -0.19268798828125, -0.17668914794921875, -0.1606903076171875, -0.14469146728515625, -0.128692626953125, -0.11269378662109375, -0.0966949462890625, -0.08069610595703125, -0.064697265625, -0.04869842529296875, -0.0326995849609375, -0.01670074462890625, -0.000701904296875, 0.01529693603515625, 0.0312957763671875, 0.04729461669921875, 0.06329345703125, 0.07929229736328125, 0.0952911376953125, 0.11128997802734375, 0.127288818359375, 0.14328765869140625, 0.1592864990234375, 0.17528533935546875, 0.1912841796875, 0.20728302001953125, 0.2232818603515625, 0.23928070068359375, 0.255279541015625, 0.27127838134765625, 0.2872772216796875, 0.30327606201171875, 0.31927490234375, 0.33527374267578125, 0.3512725830078125, 0.36727142333984375, 0.383270263671875, 0.39926910400390625, 0.4152679443359375, 0.43126678466796875, 0.447265625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 5.0, 3.0, 9.0, 11.0, 13.0, 11.0, 17.0, 26.0, 28.0, 31.0, 56.0, 57.0, 72.0, 95.0, 103.0, 101.0, 82.0, 68.0, 44.0, 39.0, 30.0, 29.0, 17.0, 12.0, 11.0, 8.0, 2.0, 2.0, 4.0, 2.0, 2.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.038238525390625, -0.03713035583496094, -0.036022186279296875, -0.03491401672363281, -0.03380584716796875, -0.03269767761230469, -0.031589508056640625, -0.030481338500976562, -0.0293731689453125, -0.028264999389648438, -0.027156829833984375, -0.026048660278320312, -0.02494049072265625, -0.023832321166992188, -0.022724151611328125, -0.021615982055664062, -0.0205078125, -0.019399642944335938, -0.018291473388671875, -0.017183303833007812, -0.01607513427734375, -0.014966964721679688, -0.013858795166015625, -0.012750625610351562, -0.0116424560546875, -0.010534286499023438, -0.009426116943359375, -0.008317947387695312, -0.00720977783203125, -0.0061016082763671875, -0.004993438720703125, -0.0038852691650390625, -0.002777099609375, -0.0016689300537109375, -0.000560760498046875, 0.0005474090576171875, 0.00165557861328125, 0.0027637481689453125, 0.003871917724609375, 0.0049800872802734375, 0.0060882568359375, 0.0071964263916015625, 0.008304595947265625, 0.009412765502929688, 0.01052093505859375, 0.011629104614257812, 0.012737274169921875, 0.013845443725585938, 0.01495361328125, 0.016061782836914062, 0.017169952392578125, 0.018278121948242188, 0.01938629150390625, 0.020494461059570312, 0.021602630615234375, 0.022710800170898438, 0.0238189697265625, 0.024927139282226562, 0.026035308837890625, 0.027143478393554688, 0.02825164794921875, 0.029359817504882812, 0.030467987060546875, 0.03157615661621094, 0.032684326171875]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 4.0, 2.0, 5.0, 4.0, 8.0, 12.0, 15.0, 28.0, 22.0, 49.0, 64.0, 110.0, 118.0, 134.0, 144.0, 104.0, 54.0, 34.0, 33.0, 14.0, 12.0, 9.0, 13.0, 9.0, 0.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.387607455253601, -1.3575772047042847, -1.3275469541549683, -1.2975167036056519, -1.2674864530563354, -1.2374560832977295, -1.207425832748413, -1.1773955821990967, -1.1473653316497803, -1.1173350811004639, -1.0873048305511475, -1.057274580001831, -1.0272443294525146, -0.9972140192985535, -0.9671837687492371, -0.9371535181999207, -0.9071232676506042, -0.8770930171012878, -0.8470627665519714, -0.8170324563980103, -0.7870022058486938, -0.7569719552993774, -0.726941704750061, -0.6969114542007446, -0.6668812036514282, -0.6368509531021118, -0.6068207025527954, -0.576790452003479, -0.5467601418495178, -0.5167298913002014, -0.486699640750885, -0.4566693902015686, -0.4266391396522522, -0.3966088891029358, -0.366578608751297, -0.3365483582019806, -0.3065180778503418, -0.2764878273010254, -0.24645757675170898, -0.21642731130123138, -0.18639704585075378, -0.15636678040027618, -0.12633651494979858, -0.09630626440048218, -0.06627599895000458, -0.03624573349952698, -0.006215482950210571, 0.02381478250026703, 0.05384504795074463, 0.08387531340122223, 0.11390557140111923, 0.14393582940101624, 0.17396609485149384, 0.20399636030197144, 0.23402661085128784, 0.26405686140060425, 0.29408714175224304, 0.32411739230155945, 0.35414767265319824, 0.38417792320251465, 0.41420817375183105, 0.44423845410346985, 0.47426870465278625, 0.504298985004425, 0.5343292355537415]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 3.0, 9.0, 8.0, 9.0, 12.0, 24.0, 22.0, 24.0, 44.0, 32.0, 61.0, 54.0, 54.0, 58.0, 67.0, 77.0, 62.0, 76.0, 48.0, 47.0, 41.0, 44.0, 32.0, 23.0, 24.0, 17.0, 14.0, 9.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5779840350151062, -0.5522323846817017, -0.5264807343482971, -0.5007290840148926, -0.47497737407684326, -0.4492257237434387, -0.4234740734100342, -0.39772242307662964, -0.3719707429409027, -0.34621909260749817, -0.32046741247177124, -0.2947157621383667, -0.26896411180496216, -0.24321243166923523, -0.2174607813358307, -0.19170911610126495, -0.16595745086669922, -0.14020578563213348, -0.11445412784814835, -0.08870247006416321, -0.06295080482959747, -0.03719913959503174, -0.011447489261627197, 0.014304175972938538, 0.04005584120750427, 0.06580750644207001, 0.09155916422605515, 0.11731082201004028, 0.14306248724460602, 0.16881415247917175, 0.1945658028125763, 0.22031746804714203, 0.246069073677063, 0.27182072401046753, 0.29757240414619446, 0.323324054479599, 0.3490757346153259, 0.37482738494873047, 0.400579035282135, 0.42633068561553955, 0.4520823657512665, 0.477834016084671, 0.503585696220398, 0.5293373465538025, 0.555088996887207, 0.5808407068252563, 0.6065922975540161, 0.6323440074920654, 0.65809565782547, 0.6838473081588745, 0.709598958492279, 0.7353506088256836, 0.7611023187637329, 0.7868539690971375, 0.812605619430542, 0.8383572697639465, 0.8641089200973511, 0.8898605704307556, 0.9156122207641602, 0.9413639307022095, 0.967115581035614, 0.9928672313690186, 1.0186188220977783, 1.0443705320358276, 1.070122241973877]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 8.0, 6.0, 7.0, 17.0, 16.0, 19.0, 37.0, 32.0, 43.0, 90.0, 131.0, 242.0, 393.0, 714.0, 1396.0, 2914.0, 6897.0, 19594.0, 92511.0, 713508.0, 166407.0, 27210.0, 8936.0, 3634.0, 1701.0, 884.0, 466.0, 269.0, 145.0, 107.0, 68.0, 42.0, 32.0, 16.0, 16.0, 19.0, 8.0, 9.0, 1.0, 2.0, 5.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.630859375, -0.60882568359375, -0.5867919921875, -0.56475830078125, -0.542724609375, -0.52069091796875, -0.4986572265625, -0.47662353515625, -0.45458984375, -0.43255615234375, -0.4105224609375, -0.38848876953125, -0.366455078125, -0.34442138671875, -0.3223876953125, -0.30035400390625, -0.2783203125, -0.25628662109375, -0.2342529296875, -0.21221923828125, -0.190185546875, -0.16815185546875, -0.1461181640625, -0.12408447265625, -0.10205078125, -0.08001708984375, -0.0579833984375, -0.03594970703125, -0.013916015625, 0.00811767578125, 0.0301513671875, 0.05218505859375, 0.07421875, 0.09625244140625, 0.1182861328125, 0.14031982421875, 0.162353515625, 0.18438720703125, 0.2064208984375, 0.22845458984375, 0.25048828125, 0.27252197265625, 0.2945556640625, 0.31658935546875, 0.338623046875, 0.36065673828125, 0.3826904296875, 0.40472412109375, 0.4267578125, 0.44879150390625, 0.4708251953125, 0.49285888671875, 0.514892578125, 0.53692626953125, 0.5589599609375, 0.58099365234375, 0.60302734375, 0.62506103515625, 0.6470947265625, 0.66912841796875, 0.691162109375, 0.71319580078125, 0.7352294921875, 0.75726318359375, 0.779296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 6.0, 6.0, 6.0, 10.0, 17.0, 17.0, 12.0, 21.0, 26.0, 23.0, 37.0, 41.0, 41.0, 45.0, 51.0, 57.0, 60.0, 62.0, 65.0, 59.0, 52.0, 55.0, 37.0, 34.0, 24.0, 31.0, 16.0, 22.0, 17.0, 15.0, 8.0, 6.0, 6.0, 7.0, 6.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7099609375, -1.6418609619140625, -1.573760986328125, -1.5056610107421875, -1.43756103515625, -1.3694610595703125, -1.301361083984375, -1.2332611083984375, -1.1651611328125, -1.0970611572265625, -1.028961181640625, -0.9608612060546875, -0.89276123046875, -0.8246612548828125, -0.756561279296875, -0.6884613037109375, -0.620361328125, -0.5522613525390625, -0.484161376953125, -0.4160614013671875, -0.34796142578125, -0.2798614501953125, -0.211761474609375, -0.1436614990234375, -0.0755615234375, -0.0074615478515625, 0.060638427734375, 0.1287384033203125, 0.19683837890625, 0.2649383544921875, 0.333038330078125, 0.4011383056640625, 0.46923828125, 0.5373382568359375, 0.605438232421875, 0.6735382080078125, 0.74163818359375, 0.8097381591796875, 0.877838134765625, 0.9459381103515625, 1.0140380859375, 1.0821380615234375, 1.150238037109375, 1.2183380126953125, 1.28643798828125, 1.3545379638671875, 1.422637939453125, 1.4907379150390625, 1.558837890625, 1.6269378662109375, 1.695037841796875, 1.7631378173828125, 1.83123779296875, 1.8993377685546875, 1.967437744140625, 2.0355377197265625, 2.1036376953125, 2.1717376708984375, 2.239837646484375, 2.3079376220703125, 2.37603759765625, 2.4441375732421875, 2.512237548828125, 2.5803375244140625, 2.6484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 1.0, 3.0, 8.0, 7.0, 7.0, 8.0, 10.0, 12.0, 19.0, 25.0, 33.0, 27.0, 47.0, 54.0, 60.0, 86.0, 153.0, 679.0, 1016858.0, 29690.0, 296.0, 114.0, 80.0, 62.0, 37.0, 41.0, 27.0, 22.0, 14.0, 21.0, 10.0, 11.0, 6.0, 12.0, 3.0, 1.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.7421875, -6.54290771484375, -6.3436279296875, -6.14434814453125, -5.945068359375, -5.74578857421875, -5.5465087890625, -5.34722900390625, -5.14794921875, -4.94866943359375, -4.7493896484375, -4.55010986328125, -4.350830078125, -4.15155029296875, -3.9522705078125, -3.75299072265625, -3.5537109375, -3.35443115234375, -3.1551513671875, -2.95587158203125, -2.756591796875, -2.55731201171875, -2.3580322265625, -2.15875244140625, -1.95947265625, -1.76019287109375, -1.5609130859375, -1.36163330078125, -1.162353515625, -0.96307373046875, -0.7637939453125, -0.56451416015625, -0.365234375, -0.16595458984375, 0.0333251953125, 0.23260498046875, 0.431884765625, 0.63116455078125, 0.8304443359375, 1.02972412109375, 1.22900390625, 1.42828369140625, 1.6275634765625, 1.82684326171875, 2.026123046875, 2.22540283203125, 2.4246826171875, 2.62396240234375, 2.8232421875, 3.02252197265625, 3.2218017578125, 3.42108154296875, 3.620361328125, 3.81964111328125, 4.0189208984375, 4.21820068359375, 4.41748046875, 4.61676025390625, 4.8160400390625, 5.01531982421875, 5.214599609375, 5.41387939453125, 5.6131591796875, 5.81243896484375, 6.01171875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 6.0, 9.0, 5.0, 12.0, 12.0, 13.0, 18.0, 20.0, 31.0, 33.0, 40.0, 36.0, 47.0, 63.0, 44.0, 70.0, 70.0, 54.0, 58.0, 51.0, 55.0, 40.0, 34.0, 35.0, 25.0, 22.0, 17.0, 20.0, 14.0, 7.0, 11.0, 8.0, 4.0, 3.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.654296875, -2.5758056640625, -2.497314453125, -2.4188232421875, -2.34033203125, -2.2618408203125, -2.183349609375, -2.1048583984375, -2.0263671875, -1.9478759765625, -1.869384765625, -1.7908935546875, -1.71240234375, -1.6339111328125, -1.555419921875, -1.4769287109375, -1.3984375, -1.3199462890625, -1.241455078125, -1.1629638671875, -1.08447265625, -1.0059814453125, -0.927490234375, -0.8489990234375, -0.7705078125, -0.6920166015625, -0.613525390625, -0.5350341796875, -0.45654296875, -0.3780517578125, -0.299560546875, -0.2210693359375, -0.142578125, -0.0640869140625, 0.014404296875, 0.0928955078125, 0.17138671875, 0.2498779296875, 0.328369140625, 0.4068603515625, 0.4853515625, 0.5638427734375, 0.642333984375, 0.7208251953125, 0.79931640625, 0.8778076171875, 0.956298828125, 1.0347900390625, 1.11328125, 1.1917724609375, 1.270263671875, 1.3487548828125, 1.42724609375, 1.5057373046875, 1.584228515625, 1.6627197265625, 1.7412109375, 1.8197021484375, 1.898193359375, 1.9766845703125, 2.05517578125, 2.1336669921875, 2.212158203125, 2.2906494140625, 2.369140625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 2.0, 3.0, 12.0, 18.0, 24.0, 34.0, 75.0, 210.0, 510.0, 1650.0, 8389.0, 263164.0, 761856.0, 9779.0, 1839.0, 565.0, 218.0, 84.0, 35.0, 21.0, 9.0, 7.0, 8.0, 8.0, 3.0, 4.0, 3.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.4296875, -1.38641357421875, -1.3431396484375, -1.29986572265625, -1.256591796875, -1.21331787109375, -1.1700439453125, -1.12677001953125, -1.08349609375, -1.04022216796875, -0.9969482421875, -0.95367431640625, -0.910400390625, -0.86712646484375, -0.8238525390625, -0.78057861328125, -0.7373046875, -0.69403076171875, -0.6507568359375, -0.60748291015625, -0.564208984375, -0.52093505859375, -0.4776611328125, -0.43438720703125, -0.39111328125, -0.34783935546875, -0.3045654296875, -0.26129150390625, -0.218017578125, -0.17474365234375, -0.1314697265625, -0.08819580078125, -0.044921875, -0.00164794921875, 0.0416259765625, 0.08489990234375, 0.128173828125, 0.17144775390625, 0.2147216796875, 0.25799560546875, 0.30126953125, 0.34454345703125, 0.3878173828125, 0.43109130859375, 0.474365234375, 0.51763916015625, 0.5609130859375, 0.60418701171875, 0.6474609375, 0.69073486328125, 0.7340087890625, 0.77728271484375, 0.820556640625, 0.86383056640625, 0.9071044921875, 0.95037841796875, 0.99365234375, 1.03692626953125, 1.0802001953125, 1.12347412109375, 1.166748046875, 1.21002197265625, 1.2532958984375, 1.29656982421875, 1.33984375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 7.0, 10.0, 16.0, 20.0, 39.0, 76.0, 447.0, 251.0, 36.0, 35.0, 18.0, 16.0, 6.0, 5.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.572505950927734e-05, -9.153783321380615e-05, -8.735060691833496e-05, -8.316338062286377e-05, -7.897615432739258e-05, -7.478892803192139e-05, -7.06017017364502e-05, -6.6414475440979e-05, -6.222724914550781e-05, -5.804002285003662e-05, -5.385279655456543e-05, -4.966557025909424e-05, -4.547834396362305e-05, -4.1291117668151855e-05, -3.7103891372680664e-05, -3.291666507720947e-05, -2.872943878173828e-05, -2.454221248626709e-05, -2.03549861907959e-05, -1.6167759895324707e-05, -1.1980533599853516e-05, -7.793307304382324e-06, -3.606081008911133e-06, 5.811452865600586e-07, 4.76837158203125e-06, 8.955597877502441e-06, 1.3142824172973633e-05, 1.7330050468444824e-05, 2.1517276763916016e-05, 2.5704503059387207e-05, 2.98917293548584e-05, 3.407895565032959e-05, 3.826618194580078e-05, 4.245340824127197e-05, 4.6640634536743164e-05, 5.0827860832214355e-05, 5.501508712768555e-05, 5.920231342315674e-05, 6.338953971862793e-05, 6.757676601409912e-05, 7.176399230957031e-05, 7.59512186050415e-05, 8.01384449005127e-05, 8.432567119598389e-05, 8.851289749145508e-05, 9.270012378692627e-05, 9.688735008239746e-05, 0.00010107457637786865, 0.00010526180267333984, 0.00010944902896881104, 0.00011363625526428223, 0.00011782348155975342, 0.00012201070785522461, 0.0001261979341506958, 0.000130385160446167, 0.00013457238674163818, 0.00013875961303710938, 0.00014294683933258057, 0.00014713406562805176, 0.00015132129192352295, 0.00015550851821899414, 0.00015969574451446533, 0.00016388297080993652, 0.00016807019710540771, 0.0001722574234008789]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 2.0, 4.0, 6.0, 7.0, 12.0, 14.0, 12.0, 20.0, 34.0, 101.0, 511.0, 5873.0, 975877.0, 63523.0, 2058.0, 300.0, 77.0, 23.0, 15.0, 20.0, 10.0, 6.0, 6.0, 8.0, 6.0, 6.0, 6.0, 2.0, 8.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.287109375, -2.22662353515625, -2.1661376953125, -2.10565185546875, -2.045166015625, -1.98468017578125, -1.9241943359375, -1.86370849609375, -1.80322265625, -1.74273681640625, -1.6822509765625, -1.62176513671875, -1.561279296875, -1.50079345703125, -1.4403076171875, -1.37982177734375, -1.3193359375, -1.25885009765625, -1.1983642578125, -1.13787841796875, -1.077392578125, -1.01690673828125, -0.9564208984375, -0.89593505859375, -0.83544921875, -0.77496337890625, -0.7144775390625, -0.65399169921875, -0.593505859375, -0.53302001953125, -0.4725341796875, -0.41204833984375, -0.3515625, -0.29107666015625, -0.2305908203125, -0.17010498046875, -0.109619140625, -0.04913330078125, 0.0113525390625, 0.07183837890625, 0.13232421875, 0.19281005859375, 0.2532958984375, 0.31378173828125, 0.374267578125, 0.43475341796875, 0.4952392578125, 0.55572509765625, 0.6162109375, 0.67669677734375, 0.7371826171875, 0.79766845703125, 0.858154296875, 0.91864013671875, 0.9791259765625, 1.03961181640625, 1.10009765625, 1.16058349609375, 1.2210693359375, 1.28155517578125, 1.342041015625, 1.40252685546875, 1.4630126953125, 1.52349853515625, 1.583984375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 0.0, 8.0, 5.0, 6.0, 7.0, 4.0, 6.0, 11.0, 11.0, 15.0, 12.0, 12.0, 29.0, 57.0, 99.0, 264.0, 206.0, 96.0, 43.0, 19.0, 20.0, 14.0, 10.0, 8.0, 13.0, 7.0, 6.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1787109375, -0.17230224609375, -0.1658935546875, -0.15948486328125, -0.153076171875, -0.14666748046875, -0.1402587890625, -0.13385009765625, -0.12744140625, -0.12103271484375, -0.1146240234375, -0.10821533203125, -0.101806640625, -0.09539794921875, -0.0889892578125, -0.08258056640625, -0.076171875, -0.06976318359375, -0.0633544921875, -0.05694580078125, -0.050537109375, -0.04412841796875, -0.0377197265625, -0.03131103515625, -0.02490234375, -0.01849365234375, -0.0120849609375, -0.00567626953125, 0.000732421875, 0.00714111328125, 0.0135498046875, 0.01995849609375, 0.0263671875, 0.03277587890625, 0.0391845703125, 0.04559326171875, 0.052001953125, 0.05841064453125, 0.0648193359375, 0.07122802734375, 0.07763671875, 0.08404541015625, 0.0904541015625, 0.09686279296875, 0.103271484375, 0.10968017578125, 0.1160888671875, 0.12249755859375, 0.12890625, 0.13531494140625, 0.1417236328125, 0.14813232421875, 0.154541015625, 0.16094970703125, 0.1673583984375, 0.17376708984375, 0.18017578125, 0.18658447265625, 0.1929931640625, 0.19940185546875, 0.205810546875, 0.21221923828125, 0.2186279296875, 0.22503662109375, 0.2314453125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 10.0, 46.0, 122.0, 449.0, 287.0, 74.0, 20.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5340017080307007, -1.306362271308899, -1.0787227153778076, -0.8510832786560059, -0.6234438419342041, -0.39580440521240234, -0.16816484928131104, 0.05947458744049072, 0.2871140241622925, 0.5147534608840942, 0.7423929572105408, 0.9700324535369873, 1.197671890258789, 1.4253113269805908, 1.6529508829116821, 1.8805903196334839, 2.108229637145996, 2.335869073867798, 2.5635085105895996, 2.7911481857299805, 3.018787384033203, 3.246427059173584, 3.4740664958953857, 3.7017059326171875, 3.9293456077575684, 4.156985282897949, 4.384624481201172, 4.612264156341553, 4.839903354644775, 5.067543029785156, 5.295182228088379, 5.52282190322876, 5.750461578369141, 5.9781012535095215, 6.205740451812744, 6.433380126953125, 6.661019325256348, 6.8886590003967285, 7.116298675537109, 7.343937873840332, 7.571577072143555, 7.7992167472839355, 8.026856422424316, 8.254495620727539, 8.482134819030762, 8.709774017333984, 8.937414169311523, 9.165053367614746, 9.392692565917969, 9.620331764221191, 9.84797191619873, 10.075611114501953, 10.303250312805176, 10.530889511108398, 10.758529663085938, 10.98616886138916, 11.2138090133667, 11.441448211669922, 11.669088363647461, 11.896727561950684, 12.124366760253906, 12.352005958557129, 12.579646110534668, 12.80728530883789, 13.034924507141113]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 6.0, 7.0, 9.0, 15.0, 13.0, 17.0, 13.0, 16.0, 17.0, 18.0, 19.0, 25.0, 27.0, 26.0, 29.0, 30.0, 31.0, 41.0, 38.0, 44.0, 40.0, 36.0, 38.0, 37.0, 41.0, 45.0, 36.0, 37.0, 34.0, 28.0, 35.0, 21.0, 22.0, 13.0, 16.0, 17.0, 3.0, 12.0, 6.0, 10.0, 6.0, 7.0, 7.0, 3.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.6897172927856445, -2.6114749908447266, -2.5332324504852295, -2.4549901485443115, -2.3767476081848145, -2.2985053062438965, -2.2202630043029785, -2.1420204639434814, -2.0637781620025635, -1.985535740852356, -1.9072933197021484, -1.8290510177612305, -1.750808596611023, -1.6725661754608154, -1.594323754310608, -1.5160813331604004, -1.4378389120101929, -1.3595964908599854, -1.2813540697097778, -1.2031116485595703, -1.1248693466186523, -1.0466269254684448, -0.9683845043182373, -0.8901421427726746, -0.811899721622467, -0.7336573004722595, -0.6554149389266968, -0.5771725177764893, -0.4989301264286041, -0.420687735080719, -0.3424453139305115, -0.26420295238494873, -0.1859605312347412, -0.10771813243627548, -0.029475733637809753, 0.04876667261123657, 0.1270090639591217, 0.20525145530700684, 0.28349387645721436, 0.3617362380027771, 0.4399786591529846, 0.5182210803031921, 0.5964634418487549, 0.6747058629989624, 0.7529482841491699, 0.8311906456947327, 0.9094330668449402, 0.9876754283905029, 1.0659178495407104, 1.144160270690918, 1.2224026918411255, 1.300645112991333, 1.378887414932251, 1.4571298360824585, 1.535372257232666, 1.613614559173584, 1.691857099533081, 1.7700995206832886, 1.848341941833496, 1.926584243774414, 2.004826784133911, 2.083069086074829, 2.161311626434326, 2.239553928375244, 2.317796230316162]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 4.0, 6.0, 16.0, 26.0, 25.0, 35.0, 62.0, 145.0, 318.0, 1354.0, 10124.0, 1093963.0, 3069249.0, 16108.0, 2001.0, 428.0, 152.0, 87.0, 51.0, 33.0, 28.0, 20.0, 9.0, 15.0, 5.0, 3.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.66796875, -4.53863525390625, -4.4093017578125, -4.27996826171875, -4.150634765625, -4.02130126953125, -3.8919677734375, -3.76263427734375, -3.63330078125, -3.50396728515625, -3.3746337890625, -3.24530029296875, -3.115966796875, -2.98663330078125, -2.8572998046875, -2.72796630859375, -2.5986328125, -2.46929931640625, -2.3399658203125, -2.21063232421875, -2.081298828125, -1.95196533203125, -1.8226318359375, -1.69329833984375, -1.56396484375, -1.43463134765625, -1.3052978515625, -1.17596435546875, -1.046630859375, -0.91729736328125, -0.7879638671875, -0.65863037109375, -0.529296875, -0.39996337890625, -0.2706298828125, -0.14129638671875, -0.011962890625, 0.11737060546875, 0.2467041015625, 0.37603759765625, 0.50537109375, 0.63470458984375, 0.7640380859375, 0.89337158203125, 1.022705078125, 1.15203857421875, 1.2813720703125, 1.41070556640625, 1.5400390625, 1.66937255859375, 1.7987060546875, 1.92803955078125, 2.057373046875, 2.18670654296875, 2.3160400390625, 2.44537353515625, 2.57470703125, 2.70404052734375, 2.8333740234375, 2.96270751953125, 3.092041015625, 3.22137451171875, 3.3507080078125, 3.48004150390625, 3.609375]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 6.0, 4.0, 8.0, 7.0, 7.0, 17.0, 14.0, 25.0, 17.0, 21.0, 32.0, 30.0, 33.0, 40.0, 42.0, 42.0, 32.0, 50.0, 48.0, 46.0, 50.0, 44.0, 38.0, 33.0, 35.0, 34.0, 27.0, 44.0, 31.0, 28.0, 20.0, 13.0, 16.0, 19.0, 12.0, 11.0, 5.0, 7.0, 3.0, 5.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6240234375, -0.6037979125976562, -0.5835723876953125, -0.5633468627929688, -0.543121337890625, -0.5228958129882812, -0.5026702880859375, -0.48244476318359375, -0.46221923828125, -0.44199371337890625, -0.4217681884765625, -0.40154266357421875, -0.381317138671875, -0.36109161376953125, -0.3408660888671875, -0.32064056396484375, -0.3004150390625, -0.28018951416015625, -0.2599639892578125, -0.23973846435546875, -0.219512939453125, -0.19928741455078125, -0.1790618896484375, -0.15883636474609375, -0.13861083984375, -0.11838531494140625, -0.0981597900390625, -0.07793426513671875, -0.057708740234375, -0.03748321533203125, -0.0172576904296875, 0.00296783447265625, 0.023193359375, 0.04341888427734375, 0.0636444091796875, 0.08386993408203125, 0.104095458984375, 0.12432098388671875, 0.1445465087890625, 0.16477203369140625, 0.18499755859375, 0.20522308349609375, 0.2254486083984375, 0.24567413330078125, 0.265899658203125, 0.28612518310546875, 0.3063507080078125, 0.32657623291015625, 0.3468017578125, 0.36702728271484375, 0.3872528076171875, 0.40747833251953125, 0.427703857421875, 0.44792938232421875, 0.4681549072265625, 0.48838043212890625, 0.50860595703125, 0.5288314819335938, 0.5490570068359375, 0.5692825317382812, 0.589508056640625, 0.6097335815429688, 0.6299591064453125, 0.6501846313476562, 0.67041015625]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 7.0, 8.0, 19.0, 29.0, 101.0, 307.0, 3158.0, 4175546.0, 14403.0, 502.0, 123.0, 48.0, 21.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.0234375, -14.69427490234375, -14.3651123046875, -14.03594970703125, -13.706787109375, -13.37762451171875, -13.0484619140625, -12.71929931640625, -12.39013671875, -12.06097412109375, -11.7318115234375, -11.40264892578125, -11.073486328125, -10.74432373046875, -10.4151611328125, -10.08599853515625, -9.7568359375, -9.42767333984375, -9.0985107421875, -8.76934814453125, -8.440185546875, -8.11102294921875, -7.7818603515625, -7.45269775390625, -7.12353515625, -6.79437255859375, -6.4652099609375, -6.13604736328125, -5.806884765625, -5.47772216796875, -5.1485595703125, -4.81939697265625, -4.490234375, -4.16107177734375, -3.8319091796875, -3.50274658203125, -3.173583984375, -2.84442138671875, -2.5152587890625, -2.18609619140625, -1.85693359375, -1.52777099609375, -1.1986083984375, -0.86944580078125, -0.540283203125, -0.21112060546875, 0.1180419921875, 0.44720458984375, 0.7763671875, 1.10552978515625, 1.4346923828125, 1.76385498046875, 2.093017578125, 2.42218017578125, 2.7513427734375, 3.08050537109375, 3.40966796875, 3.73883056640625, 4.0679931640625, 4.39715576171875, 4.726318359375, 5.05548095703125, 5.3846435546875, 5.71380615234375, 6.04296875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 5.0, 1.0, 4.0, 3.0, 7.0, 5.0, 9.0, 12.0, 9.0, 15.0, 13.0, 27.0, 32.0, 24.0, 54.0, 75.0, 84.0, 146.0, 240.0, 334.0, 514.0, 670.0, 554.0, 435.0, 249.0, 144.0, 85.0, 69.0, 50.0, 44.0, 26.0, 19.0, 17.0, 15.0, 15.0, 13.0, 10.0, 5.0, 6.0, 7.0, 4.0, 5.0, 2.0, 3.0, 6.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27783203125, -0.2681465148925781, -0.25846099853515625, -0.24877548217773438, -0.2390899658203125, -0.22940444946289062, -0.21971893310546875, -0.21003341674804688, -0.200347900390625, -0.19066238403320312, -0.18097686767578125, -0.17129135131835938, -0.1616058349609375, -0.15192031860351562, -0.14223480224609375, -0.13254928588867188, -0.12286376953125, -0.11317825317382812, -0.10349273681640625, -0.09380722045898438, -0.0841217041015625, -0.07443618774414062, -0.06475067138671875, -0.055065155029296875, -0.045379638671875, -0.035694122314453125, -0.02600860595703125, -0.016323089599609375, -0.0066375732421875, 0.003047943115234375, 0.01273345947265625, 0.022418975830078125, 0.0321044921875, 0.041790008544921875, 0.05147552490234375, 0.061161041259765625, 0.0708465576171875, 0.08053207397460938, 0.09021759033203125, 0.09990310668945312, 0.109588623046875, 0.11927413940429688, 0.12895965576171875, 0.13864517211914062, 0.1483306884765625, 0.15801620483398438, 0.16770172119140625, 0.17738723754882812, 0.18707275390625, 0.19675827026367188, 0.20644378662109375, 0.21612930297851562, 0.2258148193359375, 0.23550033569335938, 0.24518585205078125, 0.2548713684082031, 0.264556884765625, 0.2742424011230469, 0.28392791748046875, 0.2936134338378906, 0.3032989501953125, 0.3129844665527344, 0.32266998291015625, 0.3323554992675781, 0.342041015625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 6.0, 7.0, 3.0, 4.0, 5.0, 19.0, 18.0, 32.0, 23.0, 35.0, 41.0, 65.0, 76.0, 92.0, 116.0, 115.0, 81.0, 60.0, 44.0, 34.0, 36.0, 15.0, 16.0, 14.0, 10.0, 10.0, 5.0, 4.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8767918348312378, -0.8426021933555603, -0.8084125518798828, -0.7742229104042053, -0.7400332689285278, -0.7058435678482056, -0.6716539263725281, -0.6374642848968506, -0.6032746434211731, -0.5690850019454956, -0.5348953604698181, -0.5007057189941406, -0.46651604771614075, -0.43232640624046326, -0.3981367349624634, -0.3639470934867859, -0.3297574520111084, -0.2955678105354309, -0.2613781690597534, -0.22718849778175354, -0.19299885630607605, -0.15880921483039856, -0.12461955845355988, -0.09042990207672119, -0.0562402606010437, -0.022050611674785614, 0.012139037251472473, 0.04632868617773056, 0.08051833510398865, 0.11470797657966614, 0.14889763295650482, 0.1830872893333435, 0.21727705001831055, 0.25146669149398804, 0.2856563329696655, 0.3198460042476654, 0.3540356457233429, 0.3882252871990204, 0.42241495847702026, 0.45660459995269775, 0.49079424142837524, 0.5249838829040527, 0.5591735243797302, 0.5933631658554077, 0.62755286693573, 0.6617424488067627, 0.695932149887085, 0.7301217913627625, 0.7643114328384399, 0.7985010743141174, 0.8326907157897949, 0.8668803572654724, 0.9010699987411499, 0.9352596998214722, 0.9694493412971497, 1.0036389827728271, 1.0378286838531494, 1.0720183849334717, 1.1062079668045044, 1.1403976678848267, 1.1745872497558594, 1.2087769508361816, 1.2429665327072144, 1.2771562337875366, 1.3113458156585693]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 6.0, 2.0, 9.0, 8.0, 7.0, 8.0, 9.0, 11.0, 15.0, 15.0, 20.0, 23.0, 28.0, 40.0, 25.0, 31.0, 31.0, 34.0, 42.0, 37.0, 33.0, 37.0, 39.0, 35.0, 45.0, 42.0, 36.0, 46.0, 39.0, 32.0, 23.0, 25.0, 27.0, 16.0, 16.0, 17.0, 22.0, 17.0, 6.0, 13.0, 11.0, 8.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6731864213943481, -0.6533223390579224, -0.6334582567214966, -0.6135942339897156, -0.5937301516532898, -0.573866069316864, -0.5540019869804382, -0.5341379046440125, -0.5142738819122314, -0.49440979957580566, -0.47454574704170227, -0.4546816647052765, -0.4348176121711731, -0.4149535298347473, -0.39508944749832153, -0.37522536516189575, -0.35536128282546997, -0.3354972004890442, -0.3156331479549408, -0.295769065618515, -0.2759050130844116, -0.25604093074798584, -0.23617684841156006, -0.21631278097629547, -0.19644871354103088, -0.1765846461057663, -0.1567205786705017, -0.13685649633407593, -0.11699242889881134, -0.09712836146354675, -0.07726428657770157, -0.057400211691856384, -0.03753608465194702, -0.017672013491392136, 0.0021920576691627502, 0.022056128829717636, 0.04192019999027252, 0.06178426742553711, 0.0816483423113823, 0.10151241719722748, 0.12137648463249207, 0.14124055206775665, 0.16110461950302124, 0.18096870183944702, 0.2008327692747116, 0.2206968367099762, 0.24056091904640198, 0.26042497158050537, 0.28028905391693115, 0.30015313625335693, 0.3200171887874603, 0.3398812711238861, 0.3597453236579895, 0.3796094059944153, 0.39947348833084106, 0.41933757066726685, 0.43920162320137024, 0.459065705537796, 0.4789297580718994, 0.4987938404083252, 0.518657922744751, 0.5385220050811768, 0.5583860278129578, 0.5782501101493835, 0.5981141924858093]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 4.0, 7.0, 5.0, 2.0, 3.0, 8.0, 9.0, 5.0, 6.0, 19.0, 25.0, 38.0, 72.0, 185.0, 793.0, 4707.0, 42615.0, 815226.0, 170453.0, 12007.0, 1755.0, 333.0, 96.0, 41.0, 15.0, 22.0, 18.0, 15.0, 10.0, 11.0, 7.0, 10.0, 6.0, 5.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95068359375, -0.9175949096679688, -0.8845062255859375, -0.8514175415039062, -0.818328857421875, -0.7852401733398438, -0.7521514892578125, -0.7190628051757812, -0.68597412109375, -0.6528854370117188, -0.6197967529296875, -0.5867080688476562, -0.553619384765625, -0.5205307006835938, -0.4874420166015625, -0.45435333251953125, -0.4212646484375, -0.38817596435546875, -0.3550872802734375, -0.32199859619140625, -0.288909912109375, -0.25582122802734375, -0.2227325439453125, -0.18964385986328125, -0.15655517578125, -0.12346649169921875, -0.0903778076171875, -0.05728912353515625, -0.024200439453125, 0.00888824462890625, 0.0419769287109375, 0.07506561279296875, 0.108154296875, 0.14124298095703125, 0.1743316650390625, 0.20742034912109375, 0.240509033203125, 0.27359771728515625, 0.3066864013671875, 0.33977508544921875, 0.37286376953125, 0.40595245361328125, 0.4390411376953125, 0.47212982177734375, 0.505218505859375, 0.5383071899414062, 0.5713958740234375, 0.6044845581054688, 0.6375732421875, 0.6706619262695312, 0.7037506103515625, 0.7368392944335938, 0.769927978515625, 0.8030166625976562, 0.8361053466796875, 0.8691940307617188, 0.90228271484375, 0.9353713989257812, 0.9684600830078125, 1.0015487670898438, 1.034637451171875, 1.0677261352539062, 1.1008148193359375, 1.1339035034179688, 1.1669921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 8.0, 8.0, 11.0, 15.0, 27.0, 43.0, 57.0, 72.0, 75.0, 77.0, 86.0, 94.0, 90.0, 81.0, 72.0, 52.0, 35.0, 40.0, 23.0, 18.0, 12.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.22265625, -1.1961479187011719, -1.1696395874023438, -1.1431312561035156, -1.1166229248046875, -1.0901145935058594, -1.0636062622070312, -1.0370979309082031, -1.010589599609375, -0.9840812683105469, -0.9575729370117188, -0.9310646057128906, -0.9045562744140625, -0.8780479431152344, -0.8515396118164062, -0.8250312805175781, -0.79852294921875, -0.7720146179199219, -0.7455062866210938, -0.7189979553222656, -0.6924896240234375, -0.6659812927246094, -0.6394729614257812, -0.6129646301269531, -0.586456298828125, -0.5599479675292969, -0.5334396362304688, -0.5069313049316406, -0.4804229736328125, -0.4539146423339844, -0.42740631103515625, -0.4008979797363281, -0.3743896484375, -0.3478813171386719, -0.32137298583984375, -0.2948646545410156, -0.2683563232421875, -0.24184799194335938, -0.21533966064453125, -0.18883132934570312, -0.162322998046875, -0.13581466674804688, -0.10930633544921875, -0.08279800415039062, -0.0562896728515625, -0.029781341552734375, -0.00327301025390625, 0.023235321044921875, 0.04974365234375, 0.07625198364257812, 0.10276031494140625, 0.12926864624023438, 0.1557769775390625, 0.18228530883789062, 0.20879364013671875, 0.23530197143554688, 0.261810302734375, 0.2883186340332031, 0.31482696533203125, 0.3413352966308594, 0.3678436279296875, 0.3943519592285156, 0.42086029052734375, 0.4473686218261719, 0.473876953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 3.0, 12.0, 7.0, 8.0, 23.0, 27.0, 51.0, 103.0, 202.0, 368.0, 770.0, 1645.0, 3771.0, 10655.0, 36825.0, 196679.0, 633079.0, 123721.0, 26790.0, 8177.0, 3015.0, 1307.0, 651.0, 285.0, 146.0, 83.0, 50.0, 25.0, 20.0, 14.0, 13.0, 11.0, 5.0, 6.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.466552734375, -0.45372772216796875, -0.4409027099609375, -0.42807769775390625, -0.415252685546875, -0.40242767333984375, -0.3896026611328125, -0.37677764892578125, -0.36395263671875, -0.35112762451171875, -0.3383026123046875, -0.32547760009765625, -0.312652587890625, -0.29982757568359375, -0.2870025634765625, -0.27417755126953125, -0.2613525390625, -0.24852752685546875, -0.2357025146484375, -0.22287750244140625, -0.210052490234375, -0.19722747802734375, -0.1844024658203125, -0.17157745361328125, -0.15875244140625, -0.14592742919921875, -0.1331024169921875, -0.12027740478515625, -0.107452392578125, -0.09462738037109375, -0.0818023681640625, -0.06897735595703125, -0.05615234375, -0.04332733154296875, -0.0305023193359375, -0.01767730712890625, -0.004852294921875, 0.00797271728515625, 0.0207977294921875, 0.03362274169921875, 0.04644775390625, 0.05927276611328125, 0.0720977783203125, 0.08492279052734375, 0.097747802734375, 0.11057281494140625, 0.1233978271484375, 0.13622283935546875, 0.1490478515625, 0.16187286376953125, 0.1746978759765625, 0.18752288818359375, 0.200347900390625, 0.21317291259765625, 0.2259979248046875, 0.23882293701171875, 0.25164794921875, 0.26447296142578125, 0.2772979736328125, 0.29012298583984375, 0.302947998046875, 0.31577301025390625, 0.3285980224609375, 0.34142303466796875, 0.354248046875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 6.0, 7.0, 9.0, 10.0, 16.0, 12.0, 15.0, 23.0, 23.0, 33.0, 35.0, 24.0, 34.0, 63.0, 47.0, 42.0, 33.0, 37.0, 36.0, 47.0, 42.0, 47.0, 47.0, 38.0, 30.0, 32.0, 37.0, 28.0, 26.0, 20.0, 12.0, 21.0, 7.0, 12.0, 6.0, 8.0, 4.0, 6.0, 3.0, 1.0, 3.0, 4.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.80419921875, -0.7798538208007812, -0.7555084228515625, -0.7311630249023438, -0.706817626953125, -0.6824722290039062, -0.6581268310546875, -0.6337814331054688, -0.60943603515625, -0.5850906372070312, -0.5607452392578125, -0.5363998413085938, -0.512054443359375, -0.48770904541015625, -0.4633636474609375, -0.43901824951171875, -0.4146728515625, -0.39032745361328125, -0.3659820556640625, -0.34163665771484375, -0.317291259765625, -0.29294586181640625, -0.2686004638671875, -0.24425506591796875, -0.21990966796875, -0.19556427001953125, -0.1712188720703125, -0.14687347412109375, -0.122528076171875, -0.09818267822265625, -0.0738372802734375, -0.04949188232421875, -0.025146484375, -0.00080108642578125, 0.0235443115234375, 0.04788970947265625, 0.072235107421875, 0.09658050537109375, 0.1209259033203125, 0.14527130126953125, 0.16961669921875, 0.19396209716796875, 0.2183074951171875, 0.24265289306640625, 0.266998291015625, 0.29134368896484375, 0.3156890869140625, 0.34003448486328125, 0.3643798828125, 0.38872528076171875, 0.4130706787109375, 0.43741607666015625, 0.461761474609375, 0.48610687255859375, 0.5104522705078125, 0.5347976684570312, 0.55914306640625, 0.5834884643554688, 0.6078338623046875, 0.6321792602539062, 0.656524658203125, 0.6808700561523438, 0.7052154541015625, 0.7295608520507812, 0.75390625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 8.0, 5.0, 10.0, 13.0, 13.0, 19.0, 43.0, 44.0, 102.0, 114.0, 171.0, 288.0, 460.0, 752.0, 1283.0, 2358.0, 4549.0, 11017.0, 42233.0, 569126.0, 363882.0, 33031.0, 9685.0, 4048.0, 2143.0, 1226.0, 699.0, 423.0, 257.0, 170.0, 131.0, 75.0, 55.0, 40.0, 15.0, 17.0, 14.0, 5.0, 9.0, 10.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.186279296875, -0.1807880401611328, -0.17529678344726562, -0.16980552673339844, -0.16431427001953125, -0.15882301330566406, -0.15333175659179688, -0.1478404998779297, -0.1423492431640625, -0.1368579864501953, -0.13136672973632812, -0.12587547302246094, -0.12038421630859375, -0.11489295959472656, -0.10940170288085938, -0.10391044616699219, -0.098419189453125, -0.09292793273925781, -0.08743667602539062, -0.08194541931152344, -0.07645416259765625, -0.07096290588378906, -0.06547164916992188, -0.05998039245605469, -0.0544891357421875, -0.04899787902832031, -0.043506622314453125, -0.03801536560058594, -0.03252410888671875, -0.027032852172851562, -0.021541595458984375, -0.016050338745117188, -0.01055908203125, -0.0050678253173828125, 0.000423431396484375, 0.0059146881103515625, 0.01140594482421875, 0.016897201538085938, 0.022388458251953125, 0.027879714965820312, 0.0333709716796875, 0.03886222839355469, 0.044353485107421875, 0.04984474182128906, 0.05533599853515625, 0.06082725524902344, 0.06631851196289062, 0.07180976867675781, 0.077301025390625, 0.08279228210449219, 0.08828353881835938, 0.09377479553222656, 0.09926605224609375, 0.10475730895996094, 0.11024856567382812, 0.11573982238769531, 0.1212310791015625, 0.1267223358154297, 0.13221359252929688, 0.13770484924316406, 0.14319610595703125, 0.14868736267089844, 0.15417861938476562, 0.1596698760986328, 0.1651611328125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 13.0, 7.0, 14.0, 21.0, 43.0, 75.0, 155.0, 287.0, 180.0, 71.0, 54.0, 23.0, 15.0, 11.0, 11.0, 3.0, 2.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.551908493041992e-05, -7.122848182916641e-05, -6.69378787279129e-05, -6.26472756266594e-05, -5.8356672525405884e-05, -5.4066069424152374e-05, -4.9775466322898865e-05, -4.5484863221645355e-05, -4.1194260120391846e-05, -3.6903657019138336e-05, -3.261305391788483e-05, -2.8322450816631317e-05, -2.4031847715377808e-05, -1.9741244614124298e-05, -1.545064151287079e-05, -1.1160038411617279e-05, -6.8694353103637695e-06, -2.57883220911026e-06, 1.7117708921432495e-06, 6.002373993396759e-06, 1.0292977094650269e-05, 1.4583580195903778e-05, 1.8874183297157288e-05, 2.3164786398410797e-05, 2.7455389499664307e-05, 3.1745992600917816e-05, 3.6036595702171326e-05, 4.0327198803424835e-05, 4.4617801904678345e-05, 4.8908405005931854e-05, 5.3199008107185364e-05, 5.748961120843887e-05, 6.178021430969238e-05, 6.607081741094589e-05, 7.03614205121994e-05, 7.465202361345291e-05, 7.894262671470642e-05, 8.323322981595993e-05, 8.752383291721344e-05, 9.181443601846695e-05, 9.610503911972046e-05, 0.00010039564222097397, 0.00010468624532222748, 0.00010897684842348099, 0.0001132674515247345, 0.000117558054625988, 0.00012184865772724152, 0.00012613926082849503, 0.00013042986392974854, 0.00013472046703100204, 0.00013901107013225555, 0.00014330167323350906, 0.00014759227633476257, 0.00015188287943601608, 0.0001561734825372696, 0.0001604640856385231, 0.0001647546887397766, 0.00016904529184103012, 0.00017333589494228363, 0.00017762649804353714, 0.00018191710114479065, 0.00018620770424604416, 0.00019049830734729767, 0.00019478891044855118, 0.0001990795135498047]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 11.0, 6.0, 5.0, 23.0, 25.0, 42.0, 80.0, 117.0, 218.0, 362.0, 639.0, 1124.0, 2592.0, 7609.0, 56994.0, 910768.0, 55468.0, 7314.0, 2463.0, 1149.0, 643.0, 337.0, 212.0, 118.0, 82.0, 62.0, 29.0, 19.0, 7.0, 8.0, 5.0, 4.0, 7.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.309326171875, -0.3000907897949219, -0.29085540771484375, -0.2816200256347656, -0.2723846435546875, -0.2631492614746094, -0.25391387939453125, -0.24467849731445312, -0.235443115234375, -0.22620773315429688, -0.21697235107421875, -0.20773696899414062, -0.1985015869140625, -0.18926620483398438, -0.18003082275390625, -0.17079544067382812, -0.16156005859375, -0.15232467651367188, -0.14308929443359375, -0.13385391235351562, -0.1246185302734375, -0.11538314819335938, -0.10614776611328125, -0.09691238403320312, -0.087677001953125, -0.07844161987304688, -0.06920623779296875, -0.059970855712890625, -0.0507354736328125, -0.041500091552734375, -0.03226470947265625, -0.023029327392578125, -0.0137939453125, -0.004558563232421875, 0.00467681884765625, 0.013912200927734375, 0.0231475830078125, 0.032382965087890625, 0.04161834716796875, 0.050853729248046875, 0.060089111328125, 0.06932449340820312, 0.07855987548828125, 0.08779525756835938, 0.0970306396484375, 0.10626602172851562, 0.11550140380859375, 0.12473678588867188, 0.13397216796875, 0.14320755004882812, 0.15244293212890625, 0.16167831420898438, 0.1709136962890625, 0.18014907836914062, 0.18938446044921875, 0.19861984252929688, 0.207855224609375, 0.21709060668945312, 0.22632598876953125, 0.23556137084960938, 0.2447967529296875, 0.2540321350097656, 0.26326751708984375, 0.2725028991699219, 0.28173828125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 6.0, 2.0, 5.0, 5.0, 20.0, 22.0, 32.0, 68.0, 144.0, 226.0, 211.0, 127.0, 42.0, 26.0, 20.0, 18.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.0748291015625, -0.07299947738647461, -0.07116985321044922, -0.06934022903442383, -0.06751060485839844, -0.06568098068237305, -0.06385135650634766, -0.062021732330322266, -0.060192108154296875, -0.058362483978271484, -0.056532859802246094, -0.0547032356262207, -0.05287361145019531, -0.05104398727416992, -0.04921436309814453, -0.04738473892211914, -0.04555511474609375, -0.04372549057006836, -0.04189586639404297, -0.04006624221801758, -0.03823661804199219, -0.0364069938659668, -0.034577369689941406, -0.032747745513916016, -0.030918121337890625, -0.029088497161865234, -0.027258872985839844, -0.025429248809814453, -0.023599624633789062, -0.021770000457763672, -0.01994037628173828, -0.01811075210571289, -0.0162811279296875, -0.01445150375366211, -0.012621879577636719, -0.010792255401611328, -0.008962631225585938, -0.007133007049560547, -0.005303382873535156, -0.0034737586975097656, -0.001644134521484375, 0.00018548965454101562, 0.0020151138305664062, 0.003844738006591797, 0.0056743621826171875, 0.007503986358642578, 0.009333610534667969, 0.01116323471069336, 0.01299285888671875, 0.01482248306274414, 0.01665210723876953, 0.018481731414794922, 0.020311355590820312, 0.022140979766845703, 0.023970603942871094, 0.025800228118896484, 0.027629852294921875, 0.029459476470947266, 0.031289100646972656, 0.03311872482299805, 0.03494834899902344, 0.03677797317504883, 0.03860759735107422, 0.04043722152709961, 0.042266845703125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 8.0, 11.0, 23.0, 77.0, 147.0, 336.0, 232.0, 89.0, 46.0, 22.0, 8.0, 8.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.740212619304657, -0.6771643161773682, -0.6141160726547241, -0.5510677695274353, -0.48801949620246887, -0.42497122287750244, -0.3619229197502136, -0.2988746464252472, -0.23582637310028076, -0.17277809977531433, -0.1097298115491867, -0.04668152332305908, 0.01636675000190735, 0.07941502332687378, 0.1424633264541626, 0.20551159977912903, 0.26855987310409546, 0.3316081464290619, 0.3946564197540283, 0.45770472288131714, 0.520753026008606, 0.58380126953125, 0.6468495726585388, 0.7098978757858276, 0.7729461193084717, 0.8359944224357605, 0.8990426659584045, 0.9620909690856934, 1.0251392126083374, 1.0881874561309814, 1.151235818862915, 1.214284062385559, 1.2773323059082031, 1.3403805494308472, 1.4034289121627808, 1.4664771556854248, 1.5295253992080688, 1.592573642730713, 1.6556220054626465, 1.7186702489852905, 1.7817184925079346, 1.8447667360305786, 1.9078150987625122, 1.9708633422851562, 2.03391170501709, 2.0969598293304443, 2.160008192062378, 2.2230565547943115, 2.286104679107666, 2.3491530418395996, 2.412201166152954, 2.4752495288848877, 2.5382978916168213, 2.601346015930176, 2.6643943786621094, 2.727442741394043, 2.7904911041259766, 2.85353946685791, 2.9165875911712646, 2.9796359539031982, 3.042684316635132, 3.1057324409484863, 3.16878080368042, 3.2318291664123535, 3.294877290725708]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 7.0, 9.0, 10.0, 20.0, 32.0, 39.0, 43.0, 68.0, 89.0, 63.0, 91.0, 80.0, 93.0, 90.0, 72.0, 52.0, 39.0, 36.0, 23.0, 18.0, 17.0, 8.0, 4.0, 2.0, 6.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1846389770507812, -1.159031867980957, -1.1334247589111328, -1.1078176498413086, -1.0822104215621948, -1.0566033124923706, -1.0309962034225464, -1.0053890943527222, -0.979781985282898, -0.9541748762130737, -0.9285677075386047, -0.9029605984687805, -0.8773534893989563, -0.8517463207244873, -0.8261392116546631, -0.8005321025848389, -0.7749249935150146, -0.7493178844451904, -0.7237107157707214, -0.6981036067008972, -0.672496497631073, -0.646889328956604, -0.6212822198867798, -0.5956751108169556, -0.5700679421424866, -0.5444608330726624, -0.5188536643981934, -0.49324655532836914, -0.4676394462585449, -0.4420323073863983, -0.4164251685142517, -0.3908180594444275, -0.36521095037460327, -0.33960381150245667, -0.31399670243263245, -0.28838956356048584, -0.2627824544906616, -0.23717531561851501, -0.2115681916475296, -0.1859610676765442, -0.16035394370555878, -0.13474681973457336, -0.10913969576358795, -0.08353256434202194, -0.05792544037103653, -0.03231830894947052, -0.006711184978485107, 0.018895938992500305, 0.04450306296348572, 0.07011018693447113, 0.09571731090545654, 0.12132444232702255, 0.14693155884742737, 0.17253869771957397, 0.1981458216905594, 0.2237529456615448, 0.2493600696325302, 0.2749671936035156, 0.30057433247566223, 0.32618144154548645, 0.35178858041763306, 0.3773956894874573, 0.4030028283596039, 0.4286099672317505, 0.4542170763015747]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 3.0, 4.0, 2.0, 2.0, 11.0, 16.0, 70.0, 159.0, 564.0, 2410.0, 16719.0, 532923.0, 476576.0, 15814.0, 2367.0, 602.0, 171.0, 61.0, 27.0, 10.0, 5.0, 3.0, 5.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.09765625, -2.0377044677734375, -1.977752685546875, -1.9178009033203125, -1.85784912109375, -1.7978973388671875, -1.737945556640625, -1.6779937744140625, -1.6180419921875, -1.5580902099609375, -1.498138427734375, -1.4381866455078125, -1.37823486328125, -1.3182830810546875, -1.258331298828125, -1.1983795166015625, -1.138427734375, -1.0784759521484375, -1.018524169921875, -0.9585723876953125, -0.89862060546875, -0.8386688232421875, -0.778717041015625, -0.7187652587890625, -0.6588134765625, -0.5988616943359375, -0.538909912109375, -0.4789581298828125, -0.41900634765625, -0.3590545654296875, -0.299102783203125, -0.2391510009765625, -0.17919921875, -0.1192474365234375, -0.059295654296875, 0.0006561279296875, 0.06060791015625, 0.1205596923828125, 0.180511474609375, 0.2404632568359375, 0.3004150390625, 0.3603668212890625, 0.420318603515625, 0.4802703857421875, 0.54022216796875, 0.6001739501953125, 0.660125732421875, 0.7200775146484375, 0.780029296875, 0.8399810791015625, 0.899932861328125, 0.9598846435546875, 1.01983642578125, 1.0797882080078125, 1.139739990234375, 1.1996917724609375, 1.2596435546875, 1.3195953369140625, 1.379547119140625, 1.4394989013671875, 1.49945068359375, 1.5594024658203125, 1.619354248046875, 1.6793060302734375, 1.7392578125]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 9.0, 7.0, 8.0, 9.0, 19.0, 20.0, 14.0, 30.0, 33.0, 49.0, 71.0, 48.0, 67.0, 64.0, 73.0, 75.0, 76.0, 71.0, 64.0, 44.0, 30.0, 36.0, 21.0, 24.0, 17.0, 8.0, 8.0, 8.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.779296875, -1.7383346557617188, -1.6973724365234375, -1.6564102172851562, -1.615447998046875, -1.5744857788085938, -1.5335235595703125, -1.4925613403320312, -1.45159912109375, -1.4106369018554688, -1.3696746826171875, -1.3287124633789062, -1.287750244140625, -1.2467880249023438, -1.2058258056640625, -1.1648635864257812, -1.1239013671875, -1.0829391479492188, -1.0419769287109375, -1.0010147094726562, -0.960052490234375, -0.9190902709960938, -0.8781280517578125, -0.8371658325195312, -0.79620361328125, -0.7552413940429688, -0.7142791748046875, -0.6733169555664062, -0.632354736328125, -0.5913925170898438, -0.5504302978515625, -0.5094680786132812, -0.468505859375, -0.42754364013671875, -0.3865814208984375, -0.34561920166015625, -0.304656982421875, -0.26369476318359375, -0.2227325439453125, -0.18177032470703125, -0.14080810546875, -0.09984588623046875, -0.0588836669921875, -0.01792144775390625, 0.023040771484375, 0.06400299072265625, 0.1049652099609375, 0.14592742919921875, 0.1868896484375, 0.22785186767578125, 0.2688140869140625, 0.30977630615234375, 0.350738525390625, 0.39170074462890625, 0.4326629638671875, 0.47362518310546875, 0.51458740234375, 0.5555496215820312, 0.5965118408203125, 0.6374740600585938, 0.678436279296875, 0.7193984985351562, 0.7603607177734375, 0.8013229370117188, 0.84228515625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 6.0, 6.0, 9.0, 7.0, 6.0, 17.0, 18.0, 22.0, 20.0, 28.0, 39.0, 51.0, 41.0, 64.0, 86.0, 192.0, 821.0, 22365.0, 1011844.0, 11734.0, 622.0, 158.0, 77.0, 71.0, 40.0, 43.0, 26.0, 29.0, 24.0, 15.0, 22.0, 14.0, 4.0, 8.0, 7.0, 3.0, 9.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.5, -3.388641357421875, -3.27728271484375, -3.165924072265625, -3.0545654296875, -2.943206787109375, -2.83184814453125, -2.720489501953125, -2.609130859375, -2.497772216796875, -2.38641357421875, -2.275054931640625, -2.1636962890625, -2.052337646484375, -1.94097900390625, -1.829620361328125, -1.71826171875, -1.606903076171875, -1.49554443359375, -1.384185791015625, -1.2728271484375, -1.161468505859375, -1.05010986328125, -0.938751220703125, -0.827392578125, -0.716033935546875, -0.60467529296875, -0.493316650390625, -0.3819580078125, -0.270599365234375, -0.15924072265625, -0.047882080078125, 0.0634765625, 0.174835205078125, 0.28619384765625, 0.397552490234375, 0.5089111328125, 0.620269775390625, 0.73162841796875, 0.842987060546875, 0.954345703125, 1.065704345703125, 1.17706298828125, 1.288421630859375, 1.3997802734375, 1.511138916015625, 1.62249755859375, 1.733856201171875, 1.84521484375, 1.956573486328125, 2.06793212890625, 2.179290771484375, 2.2906494140625, 2.402008056640625, 2.51336669921875, 2.624725341796875, 2.736083984375, 2.847442626953125, 2.95880126953125, 3.070159912109375, 3.1815185546875, 3.292877197265625, 3.40423583984375, 3.515594482421875, 3.626953125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 6.0, 3.0, 4.0, 8.0, 5.0, 9.0, 10.0, 14.0, 9.0, 27.0, 14.0, 27.0, 25.0, 35.0, 42.0, 47.0, 39.0, 38.0, 49.0, 54.0, 39.0, 56.0, 33.0, 40.0, 47.0, 38.0, 27.0, 31.0, 23.0, 35.0, 35.0, 29.0, 19.0, 16.0, 21.0, 15.0, 7.0, 9.0, 7.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.95068359375, -0.9230422973632812, -0.8954010009765625, -0.8677597045898438, -0.840118408203125, -0.8124771118164062, -0.7848358154296875, -0.7571945190429688, -0.72955322265625, -0.7019119262695312, -0.6742706298828125, -0.6466293334960938, -0.618988037109375, -0.5913467407226562, -0.5637054443359375, -0.5360641479492188, -0.5084228515625, -0.48078155517578125, -0.4531402587890625, -0.42549896240234375, -0.397857666015625, -0.37021636962890625, -0.3425750732421875, -0.31493377685546875, -0.28729248046875, -0.25965118408203125, -0.2320098876953125, -0.20436859130859375, -0.176727294921875, -0.14908599853515625, -0.1214447021484375, -0.09380340576171875, -0.066162109375, -0.03852081298828125, -0.0108795166015625, 0.01676177978515625, 0.044403076171875, 0.07204437255859375, 0.0996856689453125, 0.12732696533203125, 0.15496826171875, 0.18260955810546875, 0.2102508544921875, 0.23789215087890625, 0.265533447265625, 0.29317474365234375, 0.3208160400390625, 0.34845733642578125, 0.3760986328125, 0.40373992919921875, 0.4313812255859375, 0.45902252197265625, 0.486663818359375, 0.5143051147460938, 0.5419464111328125, 0.5695877075195312, 0.59722900390625, 0.6248703002929688, 0.6525115966796875, 0.6801528930664062, 0.707794189453125, 0.7354354858398438, 0.7630767822265625, 0.7907180786132812, 0.818359375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 1.0, 1.0, 3.0, 3.0, 10.0, 10.0, 11.0, 14.0, 31.0, 25.0, 85.0, 168.0, 316.0, 813.0, 2443.0, 11268.0, 261889.0, 750019.0, 16774.0, 2917.0, 918.0, 380.0, 212.0, 98.0, 56.0, 37.0, 18.0, 11.0, 7.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5927734375, -0.570892333984375, -0.54901123046875, -0.527130126953125, -0.5052490234375, -0.483367919921875, -0.46148681640625, -0.439605712890625, -0.417724609375, -0.395843505859375, -0.37396240234375, -0.352081298828125, -0.3302001953125, -0.308319091796875, -0.28643798828125, -0.264556884765625, -0.24267578125, -0.220794677734375, -0.19891357421875, -0.177032470703125, -0.1551513671875, -0.133270263671875, -0.11138916015625, -0.089508056640625, -0.067626953125, -0.045745849609375, -0.02386474609375, -0.001983642578125, 0.0198974609375, 0.041778564453125, 0.06365966796875, 0.085540771484375, 0.107421875, 0.129302978515625, 0.15118408203125, 0.173065185546875, 0.1949462890625, 0.216827392578125, 0.23870849609375, 0.260589599609375, 0.282470703125, 0.304351806640625, 0.32623291015625, 0.348114013671875, 0.3699951171875, 0.391876220703125, 0.41375732421875, 0.435638427734375, 0.45751953125, 0.479400634765625, 0.50128173828125, 0.523162841796875, 0.5450439453125, 0.566925048828125, 0.58880615234375, 0.610687255859375, 0.632568359375, 0.654449462890625, 0.67633056640625, 0.698211669921875, 0.7200927734375, 0.741973876953125, 0.76385498046875, 0.785736083984375, 0.8076171875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 8.0, 9.0, 4.0, 14.0, 11.0, 32.0, 28.0, 68.0, 110.0, 208.0, 242.0, 111.0, 57.0, 41.0, 26.0, 10.0, 8.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.624792098999023e-05, -8.392054587602615e-05, -8.159317076206207e-05, -7.926579564809799e-05, -7.693842053413391e-05, -7.461104542016983e-05, -7.228367030620575e-05, -6.995629519224167e-05, -6.762892007827759e-05, -6.530154496431351e-05, -6.297416985034943e-05, -6.0646794736385345e-05, -5.8319419622421265e-05, -5.5992044508457184e-05, -5.36646693944931e-05, -5.133729428052902e-05, -4.900991916656494e-05, -4.668254405260086e-05, -4.435516893863678e-05, -4.20277938246727e-05, -3.970041871070862e-05, -3.737304359674454e-05, -3.5045668482780457e-05, -3.2718293368816376e-05, -3.0390918254852295e-05, -2.8063543140888214e-05, -2.5736168026924133e-05, -2.3408792912960052e-05, -2.108141779899597e-05, -1.875404268503189e-05, -1.642666757106781e-05, -1.409929245710373e-05, -1.1771917343139648e-05, -9.444542229175568e-06, -7.117167115211487e-06, -4.789792001247406e-06, -2.462416887283325e-06, -1.3504177331924438e-07, 2.1923333406448364e-06, 4.519708454608917e-06, 6.847083568572998e-06, 9.174458682537079e-06, 1.150183379650116e-05, 1.382920891046524e-05, 1.615658402442932e-05, 1.8483959138393402e-05, 2.0811334252357483e-05, 2.3138709366321564e-05, 2.5466084480285645e-05, 2.7793459594249725e-05, 3.0120834708213806e-05, 3.244820982217789e-05, 3.477558493614197e-05, 3.710296005010605e-05, 3.943033516407013e-05, 4.175771027803421e-05, 4.408508539199829e-05, 4.641246050596237e-05, 4.873983561992645e-05, 5.1067210733890533e-05, 5.3394585847854614e-05, 5.5721960961818695e-05, 5.8049336075782776e-05, 6.037671118974686e-05, 6.270408630371094e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 8.0, 3.0, 5.0, 8.0, 20.0, 28.0, 32.0, 63.0, 95.0, 206.0, 412.0, 983.0, 2876.0, 12104.0, 122522.0, 858005.0, 41285.0, 6672.0, 1819.0, 737.0, 306.0, 149.0, 74.0, 48.0, 44.0, 19.0, 12.0, 7.0, 6.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41357421875, -0.3965606689453125, -0.379547119140625, -0.3625335693359375, -0.34552001953125, -0.3285064697265625, -0.311492919921875, -0.2944793701171875, -0.2774658203125, -0.2604522705078125, -0.243438720703125, -0.2264251708984375, -0.20941162109375, -0.1923980712890625, -0.175384521484375, -0.1583709716796875, -0.141357421875, -0.1243438720703125, -0.107330322265625, -0.0903167724609375, -0.07330322265625, -0.0562896728515625, -0.039276123046875, -0.0222625732421875, -0.0052490234375, 0.0117645263671875, 0.028778076171875, 0.0457916259765625, 0.06280517578125, 0.0798187255859375, 0.096832275390625, 0.1138458251953125, 0.130859375, 0.1478729248046875, 0.164886474609375, 0.1819000244140625, 0.19891357421875, 0.2159271240234375, 0.232940673828125, 0.2499542236328125, 0.2669677734375, 0.2839813232421875, 0.300994873046875, 0.3180084228515625, 0.33502197265625, 0.3520355224609375, 0.369049072265625, 0.3860626220703125, 0.403076171875, 0.4200897216796875, 0.437103271484375, 0.4541168212890625, 0.47113037109375, 0.4881439208984375, 0.505157470703125, 0.5221710205078125, 0.5391845703125, 0.5561981201171875, 0.573211669921875, 0.5902252197265625, 0.60723876953125, 0.6242523193359375, 0.641265869140625, 0.6582794189453125, 0.67529296875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 9.0, 4.0, 13.0, 17.0, 23.0, 24.0, 42.0, 48.0, 79.0, 149.0, 193.0, 123.0, 66.0, 64.0, 29.0, 31.0, 13.0, 12.0, 12.0, 7.0, 7.0, 4.0, 5.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1610107421875, -0.15619468688964844, -0.15137863159179688, -0.1465625762939453, -0.14174652099609375, -0.1369304656982422, -0.13211441040039062, -0.12729835510253906, -0.1224822998046875, -0.11766624450683594, -0.11285018920898438, -0.10803413391113281, -0.10321807861328125, -0.09840202331542969, -0.09358596801757812, -0.08876991271972656, -0.083953857421875, -0.07913780212402344, -0.07432174682617188, -0.06950569152832031, -0.06468963623046875, -0.05987358093261719, -0.055057525634765625, -0.05024147033691406, -0.0454254150390625, -0.04060935974121094, -0.035793304443359375, -0.030977249145507812, -0.02616119384765625, -0.021345138549804688, -0.016529083251953125, -0.011713027954101562, -0.00689697265625, -0.0020809173583984375, 0.002735137939453125, 0.0075511932373046875, 0.01236724853515625, 0.017183303833007812, 0.021999359130859375, 0.026815414428710938, 0.0316314697265625, 0.03644752502441406, 0.041263580322265625, 0.04607963562011719, 0.05089569091796875, 0.05571174621582031, 0.060527801513671875, 0.06534385681152344, 0.070159912109375, 0.07497596740722656, 0.07979202270507812, 0.08460807800292969, 0.08942413330078125, 0.09424018859863281, 0.09905624389648438, 0.10387229919433594, 0.1086883544921875, 0.11350440979003906, 0.11832046508789062, 0.12313652038574219, 0.12795257568359375, 0.1327686309814453, 0.13758468627929688, 0.14240074157714844, 0.147216796875]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 21.0, 77.0, 281.0, 425.0, 153.0, 34.0, 15.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.611502647399902, -10.416038513183594, -10.220574378967285, -10.025110244750977, -9.829647064208984, -9.634182929992676, -9.438718795776367, -9.243254661560059, -9.04779052734375, -8.852326393127441, -8.656862258911133, -8.461398124694824, -8.265934944152832, -8.070470809936523, -7.875006675720215, -7.679542541503906, -7.484078407287598, -7.288614273071289, -7.093150615692139, -6.89768648147583, -6.7022223472595215, -6.506758213043213, -6.3112945556640625, -6.115830421447754, -5.9203667640686035, -5.724902629852295, -5.5294389724731445, -5.333974838256836, -5.138510704040527, -4.943046569824219, -4.747582912445068, -4.55211877822876, -4.356654644012451, -4.161190509796143, -3.965726613998413, -3.7702627182006836, -3.574798583984375, -3.3793346881866455, -3.183870792388916, -2.9884066581726074, -2.792942523956299, -2.5974786281585693, -2.4020144939422607, -2.2065505981445312, -2.0110864639282227, -1.8156225681304932, -1.6201585531234741, -1.424694538116455, -1.2292306423187256, -1.0337666273117065, -0.8383026123046875, -0.6428386569023132, -0.4473746418952942, -0.25191062688827515, -0.05644667148590088, 0.13901734352111816, 0.3344813585281372, 0.5299453735351562, 0.7254093885421753, 0.9208733439445496, 1.1163372993469238, 1.3118014335632324, 1.507265329360962, 1.702729344367981, 1.898193359375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 2.0, 11.0, 9.0, 8.0, 13.0, 16.0, 22.0, 25.0, 40.0, 35.0, 35.0, 35.0, 41.0, 39.0, 54.0, 44.0, 47.0, 49.0, 63.0, 44.0, 44.0, 43.0, 37.0, 39.0, 37.0, 32.0, 21.0, 31.0, 12.0, 11.0, 19.0, 13.0, 11.0, 2.0, 7.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.689207673072815, -1.6446982622146606, -1.6001887321472168, -1.5556793212890625, -1.5111699104309082, -1.4666603803634644, -1.42215096950531, -1.3776414394378662, -1.333132028579712, -1.2886226177215576, -1.2441130876541138, -1.1996036767959595, -1.1550941467285156, -1.1105847358703613, -1.066075325012207, -1.0215659141540527, -0.9770563840866089, -0.9325469136238098, -0.8880374431610107, -0.8435280323028564, -0.7990185618400574, -0.7545090913772583, -0.709999680519104, -0.6654902100563049, -0.6209807395935059, -0.5764712691307068, -0.5319617986679077, -0.4874523878097534, -0.44294291734695435, -0.3984334468841553, -0.3539240062236786, -0.3094145655632019, -0.2649049758911133, -0.2203955203294754, -0.17588606476783752, -0.13137660920619965, -0.08686715364456177, -0.04235769808292389, 0.0021517574787139893, 0.046661198139190674, 0.09117066860198975, 0.13568012416362762, 0.1801895797252655, 0.22469903528690338, 0.26920849084854126, 0.31371796131134033, 0.358227401971817, 0.4027368426322937, 0.4472463130950928, 0.49175578355789185, 0.5362652540206909, 0.5807746648788452, 0.6252841353416443, 0.6697936058044434, 0.7143030166625977, 0.7588124871253967, 0.8033219575881958, 0.8478314280509949, 0.892340898513794, 0.9368503093719482, 0.9813597798347473, 1.0258692502975464, 1.0703786611557007, 1.1148881912231445, 1.1593976020812988]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 9.0, 8.0, 17.0, 22.0, 46.0, 63.0, 78.0, 141.0, 316.0, 1733.0, 22702.0, 4005653.0, 157868.0, 4493.0, 635.0, 190.0, 106.0, 58.0, 48.0, 34.0, 24.0, 13.0, 8.0, 5.0, 7.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.158203125, -3.035186767578125, -2.91217041015625, -2.789154052734375, -2.6661376953125, -2.543121337890625, -2.42010498046875, -2.297088623046875, -2.174072265625, -2.051055908203125, -1.92803955078125, -1.805023193359375, -1.6820068359375, -1.558990478515625, -1.43597412109375, -1.312957763671875, -1.18994140625, -1.066925048828125, -0.94390869140625, -0.820892333984375, -0.6978759765625, -0.574859619140625, -0.45184326171875, -0.328826904296875, -0.205810546875, -0.082794189453125, 0.04022216796875, 0.163238525390625, 0.2862548828125, 0.409271240234375, 0.53228759765625, 0.655303955078125, 0.7783203125, 0.901336669921875, 1.02435302734375, 1.147369384765625, 1.2703857421875, 1.393402099609375, 1.51641845703125, 1.639434814453125, 1.762451171875, 1.885467529296875, 2.00848388671875, 2.131500244140625, 2.2545166015625, 2.377532958984375, 2.50054931640625, 2.623565673828125, 2.74658203125, 2.869598388671875, 2.99261474609375, 3.115631103515625, 3.2386474609375, 3.361663818359375, 3.48468017578125, 3.607696533203125, 3.730712890625, 3.853729248046875, 3.97674560546875, 4.099761962890625, 4.2227783203125, 4.345794677734375, 4.46881103515625, 4.591827392578125, 4.71484375]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 11.0, 5.0, 17.0, 13.0, 17.0, 21.0, 23.0, 20.0, 25.0, 34.0, 44.0, 35.0, 36.0, 51.0, 41.0, 59.0, 55.0, 56.0, 48.0, 47.0, 42.0, 50.0, 31.0, 33.0, 31.0, 29.0, 23.0, 30.0, 16.0, 20.0, 5.0, 10.0, 8.0, 8.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.74853515625, -0.7276229858398438, -0.7067108154296875, -0.6857986450195312, -0.664886474609375, -0.6439743041992188, -0.6230621337890625, -0.6021499633789062, -0.58123779296875, -0.5603256225585938, -0.5394134521484375, -0.5185012817382812, -0.497589111328125, -0.47667694091796875, -0.4557647705078125, -0.43485260009765625, -0.4139404296875, -0.39302825927734375, -0.3721160888671875, -0.35120391845703125, -0.330291748046875, -0.30937957763671875, -0.2884674072265625, -0.26755523681640625, -0.24664306640625, -0.22573089599609375, -0.2048187255859375, -0.18390655517578125, -0.162994384765625, -0.14208221435546875, -0.1211700439453125, -0.10025787353515625, -0.079345703125, -0.05843353271484375, -0.0375213623046875, -0.01660919189453125, 0.004302978515625, 0.02521514892578125, 0.0461273193359375, 0.06703948974609375, 0.08795166015625, 0.10886383056640625, 0.1297760009765625, 0.15068817138671875, 0.171600341796875, 0.19251251220703125, 0.2134246826171875, 0.23433685302734375, 0.2552490234375, 0.27616119384765625, 0.2970733642578125, 0.31798553466796875, 0.338897705078125, 0.35980987548828125, 0.3807220458984375, 0.40163421630859375, 0.42254638671875, 0.44345855712890625, 0.4643707275390625, 0.48528289794921875, 0.506195068359375, 0.5271072387695312, 0.5480194091796875, 0.5689315795898438, 0.58984375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 2.0, 2.0, 4.0, 8.0, 2.0, 8.0, 11.0, 9.0, 15.0, 13.0, 45.0, 66.0, 118.0, 268.0, 696.0, 2569.0, 17513.0, 1489528.0, 2658215.0, 21216.0, 2716.0, 697.0, 272.0, 126.0, 59.0, 36.0, 17.0, 7.0, 7.0, 3.0, 3.0, 6.0, 3.0, 5.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.37109375, -2.29931640625, -2.2275390625, -2.15576171875, -2.083984375, -2.01220703125, -1.9404296875, -1.86865234375, -1.796875, -1.72509765625, -1.6533203125, -1.58154296875, -1.509765625, -1.43798828125, -1.3662109375, -1.29443359375, -1.22265625, -1.15087890625, -1.0791015625, -1.00732421875, -0.935546875, -0.86376953125, -0.7919921875, -0.72021484375, -0.6484375, -0.57666015625, -0.5048828125, -0.43310546875, -0.361328125, -0.28955078125, -0.2177734375, -0.14599609375, -0.07421875, -0.00244140625, 0.0693359375, 0.14111328125, 0.212890625, 0.28466796875, 0.3564453125, 0.42822265625, 0.5, 0.57177734375, 0.6435546875, 0.71533203125, 0.787109375, 0.85888671875, 0.9306640625, 1.00244140625, 1.07421875, 1.14599609375, 1.2177734375, 1.28955078125, 1.361328125, 1.43310546875, 1.5048828125, 1.57666015625, 1.6484375, 1.72021484375, 1.7919921875, 1.86376953125, 1.935546875, 2.00732421875, 2.0791015625, 2.15087890625, 2.22265625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 7.0, 6.0, 6.0, 8.0, 21.0, 22.0, 20.0, 28.0, 41.0, 51.0, 81.0, 128.0, 217.0, 391.0, 592.0, 774.0, 647.0, 376.0, 223.0, 133.0, 85.0, 62.0, 44.0, 21.0, 23.0, 16.0, 10.0, 10.0, 5.0, 9.0, 4.0, 1.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.27685546875, -0.26747894287109375, -0.2581024169921875, -0.24872589111328125, -0.239349365234375, -0.22997283935546875, -0.2205963134765625, -0.21121978759765625, -0.20184326171875, -0.19246673583984375, -0.1830902099609375, -0.17371368408203125, -0.164337158203125, -0.15496063232421875, -0.1455841064453125, -0.13620758056640625, -0.1268310546875, -0.11745452880859375, -0.1080780029296875, -0.09870147705078125, -0.089324951171875, -0.07994842529296875, -0.0705718994140625, -0.06119537353515625, -0.05181884765625, -0.04244232177734375, -0.0330657958984375, -0.02368927001953125, -0.014312744140625, -0.00493621826171875, 0.0044403076171875, 0.01381683349609375, 0.023193359375, 0.03256988525390625, 0.0419464111328125, 0.05132293701171875, 0.060699462890625, 0.07007598876953125, 0.0794525146484375, 0.08882904052734375, 0.09820556640625, 0.10758209228515625, 0.1169586181640625, 0.12633514404296875, 0.135711669921875, 0.14508819580078125, 0.1544647216796875, 0.16384124755859375, 0.1732177734375, 0.18259429931640625, 0.1919708251953125, 0.20134735107421875, 0.210723876953125, 0.22010040283203125, 0.2294769287109375, 0.23885345458984375, 0.24822998046875, 0.25760650634765625, 0.2669830322265625, 0.27635955810546875, 0.285736083984375, 0.29511260986328125, 0.3044891357421875, 0.31386566162109375, 0.3232421875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 7.0, 10.0, 22.0, 25.0, 43.0, 77.0, 88.0, 140.0, 155.0, 135.0, 115.0, 53.0, 46.0, 33.0, 22.0, 13.0, 4.0, 4.0, 2.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9143352508544922, -0.8651582598686218, -0.8159813284873962, -0.7668043375015259, -0.7176273465156555, -0.6684503555297852, -0.6192734241485596, -0.5700964331626892, -0.5209194421768188, -0.4717424809932709, -0.4225654900074005, -0.37338852882385254, -0.3242115378379822, -0.2750345766544342, -0.22585761547088623, -0.17668062448501587, -0.12750369310379028, -0.07832671701908112, -0.029149748384952545, 0.020027220249176025, 0.06920419633388519, 0.11838117241859436, 0.16755813360214233, 0.2167351245880127, 0.26591208577156067, 0.31508904695510864, 0.364266037940979, 0.413442999124527, 0.46261996030807495, 0.5117969512939453, 0.5609738826751709, 0.610150933265686, 0.6593278646469116, 0.708504855632782, 0.7576817870140076, 0.8068587779998779, 0.8560357689857483, 0.9052127599716187, 0.9543896913528442, 1.0035667419433594, 1.052743673324585, 1.1019206047058105, 1.1510976552963257, 1.2002745866775513, 1.2494515180587769, 1.298628568649292, 1.3478055000305176, 1.3969824314117432, 1.4461593627929688, 1.4953362941741943, 1.5445133447647095, 1.593690276145935, 1.6428672075271606, 1.6920442581176758, 1.7412211894989014, 1.790398120880127, 1.839575171470642, 1.8887521028518677, 1.9379291534423828, 1.9871060848236084, 2.036283016204834, 2.0854599475860596, 2.134636878967285, 2.18381404876709, 2.2329909801483154]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 6.0, 9.0, 9.0, 12.0, 12.0, 15.0, 17.0, 19.0, 23.0, 27.0, 35.0, 41.0, 47.0, 28.0, 30.0, 39.0, 40.0, 52.0, 46.0, 45.0, 43.0, 34.0, 31.0, 37.0, 40.0, 36.0, 36.0, 33.0, 14.0, 38.0, 29.0, 15.0, 8.0, 14.0, 11.0, 7.0, 7.0, 7.0, 3.0, 3.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.7121543288230896, -0.6915651559829712, -0.670975923538208, -0.6503867506980896, -0.6297975778579712, -0.609208345413208, -0.5886191725730896, -0.5680299997329712, -0.547440767288208, -0.5268515944480896, -0.5062623620033264, -0.485673189163208, -0.4650839865207672, -0.4444947838783264, -0.423905611038208, -0.4033164083957672, -0.3827272057533264, -0.3621380031108856, -0.3415488004684448, -0.3209596276283264, -0.3003704249858856, -0.2797812223434448, -0.2591920495033264, -0.23860284686088562, -0.21801364421844482, -0.19742444157600403, -0.17683525383472443, -0.15624606609344482, -0.13565686345100403, -0.11506766825914383, -0.09447847306728363, -0.07388928532600403, -0.05330002307891846, -0.03271082788705826, -0.012121632695198059, 0.00846756249666214, 0.02905675768852234, 0.04964595288038254, 0.07023514807224274, 0.09082433581352234, 0.11141353845596313, 0.13200274109840393, 0.15259192883968353, 0.17318111658096313, 0.19377031922340393, 0.21435952186584473, 0.23494870960712433, 0.25553789734840393, 0.2761270999908447, 0.2967163026332855, 0.3173055052757263, 0.3378946781158447, 0.3584838807582855, 0.3790730834007263, 0.3996622562408447, 0.4202514588832855, 0.4408406615257263, 0.4614298641681671, 0.4820190668106079, 0.5026082396507263, 0.5231974124908447, 0.5437866449356079, 0.5643758177757263, 0.5849649906158447, 0.6055542230606079]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 7.0, 6.0, 14.0, 19.0, 18.0, 57.0, 161.0, 720.0, 4311.0, 39314.0, 931308.0, 65395.0, 5950.0, 980.0, 165.0, 45.0, 30.0, 16.0, 5.0, 6.0, 8.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.935546875, -0.9016265869140625, -0.867706298828125, -0.8337860107421875, -0.79986572265625, -0.7659454345703125, -0.732025146484375, -0.6981048583984375, -0.6641845703125, -0.6302642822265625, -0.596343994140625, -0.5624237060546875, -0.52850341796875, -0.4945831298828125, -0.460662841796875, -0.4267425537109375, -0.392822265625, -0.3589019775390625, -0.324981689453125, -0.2910614013671875, -0.25714111328125, -0.2232208251953125, -0.189300537109375, -0.1553802490234375, -0.1214599609375, -0.0875396728515625, -0.053619384765625, -0.0196990966796875, 0.01422119140625, 0.0481414794921875, 0.082061767578125, 0.1159820556640625, 0.14990234375, 0.1838226318359375, 0.217742919921875, 0.2516632080078125, 0.28558349609375, 0.3195037841796875, 0.353424072265625, 0.3873443603515625, 0.4212646484375, 0.4551849365234375, 0.489105224609375, 0.5230255126953125, 0.55694580078125, 0.5908660888671875, 0.624786376953125, 0.6587066650390625, 0.692626953125, 0.7265472412109375, 0.760467529296875, 0.7943878173828125, 0.82830810546875, 0.8622283935546875, 0.896148681640625, 0.9300689697265625, 0.9639892578125, 0.9979095458984375, 1.031829833984375, 1.0657501220703125, 1.09967041015625, 1.1335906982421875, 1.167510986328125, 1.2014312744140625, 1.2353515625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 4.0, 8.0, 5.0, 13.0, 13.0, 31.0, 17.0, 28.0, 43.0, 44.0, 45.0, 51.0, 49.0, 60.0, 48.0, 59.0, 60.0, 45.0, 57.0, 50.0, 45.0, 48.0, 39.0, 32.0, 25.0, 24.0, 9.0, 14.0, 6.0, 7.0, 12.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.6494140625, -0.6334114074707031, -0.6174087524414062, -0.6014060974121094, -0.5854034423828125, -0.5694007873535156, -0.5533981323242188, -0.5373954772949219, -0.521392822265625, -0.5053901672363281, -0.48938751220703125, -0.4733848571777344, -0.4573822021484375, -0.4413795471191406, -0.42537689208984375, -0.4093742370605469, -0.39337158203125, -0.3773689270019531, -0.36136627197265625, -0.3453636169433594, -0.3293609619140625, -0.3133583068847656, -0.29735565185546875, -0.2813529968261719, -0.265350341796875, -0.24934768676757812, -0.23334503173828125, -0.21734237670898438, -0.2013397216796875, -0.18533706665039062, -0.16933441162109375, -0.15333175659179688, -0.1373291015625, -0.12132644653320312, -0.10532379150390625, -0.08932113647460938, -0.0733184814453125, -0.057315826416015625, -0.04131317138671875, -0.025310516357421875, -0.009307861328125, 0.006694793701171875, 0.02269744873046875, 0.038700103759765625, 0.0547027587890625, 0.07070541381835938, 0.08670806884765625, 0.10271072387695312, 0.11871337890625, 0.13471603393554688, 0.15071868896484375, 0.16672134399414062, 0.1827239990234375, 0.19872665405273438, 0.21472930908203125, 0.23073196411132812, 0.246734619140625, 0.2627372741699219, 0.27873992919921875, 0.2947425842285156, 0.3107452392578125, 0.3267478942871094, 0.34275054931640625, 0.3587532043457031, 0.374755859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 7.0, 10.0, 11.0, 16.0, 37.0, 64.0, 83.0, 169.0, 280.0, 571.0, 1095.0, 2431.0, 6002.0, 17706.0, 75479.0, 497030.0, 368393.0, 55289.0, 14594.0, 5006.0, 2126.0, 1000.0, 484.0, 275.0, 149.0, 94.0, 65.0, 28.0, 16.0, 11.0, 12.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.303955078125, -0.29499053955078125, -0.2860260009765625, -0.27706146240234375, -0.268096923828125, -0.25913238525390625, -0.2501678466796875, -0.24120330810546875, -0.23223876953125, -0.22327423095703125, -0.2143096923828125, -0.20534515380859375, -0.196380615234375, -0.18741607666015625, -0.1784515380859375, -0.16948699951171875, -0.1605224609375, -0.15155792236328125, -0.1425933837890625, -0.13362884521484375, -0.124664306640625, -0.11569976806640625, -0.1067352294921875, -0.09777069091796875, -0.08880615234375, -0.07984161376953125, -0.0708770751953125, -0.06191253662109375, -0.052947998046875, -0.04398345947265625, -0.0350189208984375, -0.02605438232421875, -0.01708984375, -0.00812530517578125, 0.0008392333984375, 0.00980377197265625, 0.018768310546875, 0.02773284912109375, 0.0366973876953125, 0.04566192626953125, 0.05462646484375, 0.06359100341796875, 0.0725555419921875, 0.08152008056640625, 0.090484619140625, 0.09944915771484375, 0.1084136962890625, 0.11737823486328125, 0.1263427734375, 0.13530731201171875, 0.1442718505859375, 0.15323638916015625, 0.162200927734375, 0.17116546630859375, 0.1801300048828125, 0.18909454345703125, 0.19805908203125, 0.20702362060546875, 0.2159881591796875, 0.22495269775390625, 0.233917236328125, 0.24288177490234375, 0.2518463134765625, 0.26081085205078125, 0.269775390625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 6.0, 5.0, 4.0, 7.0, 7.0, 9.0, 10.0, 14.0, 15.0, 24.0, 18.0, 26.0, 26.0, 24.0, 22.0, 24.0, 34.0, 39.0, 47.0, 48.0, 42.0, 54.0, 52.0, 46.0, 43.0, 29.0, 35.0, 31.0, 40.0, 31.0, 26.0, 19.0, 23.0, 18.0, 18.0, 19.0, 13.0, 11.0, 7.0, 7.0, 6.0, 4.0, 10.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6796875, -0.65838623046875, -0.6370849609375, -0.61578369140625, -0.594482421875, -0.57318115234375, -0.5518798828125, -0.53057861328125, -0.50927734375, -0.48797607421875, -0.4666748046875, -0.44537353515625, -0.424072265625, -0.40277099609375, -0.3814697265625, -0.36016845703125, -0.3388671875, -0.31756591796875, -0.2962646484375, -0.27496337890625, -0.253662109375, -0.23236083984375, -0.2110595703125, -0.18975830078125, -0.16845703125, -0.14715576171875, -0.1258544921875, -0.10455322265625, -0.083251953125, -0.06195068359375, -0.0406494140625, -0.01934814453125, 0.001953125, 0.02325439453125, 0.0445556640625, 0.06585693359375, 0.087158203125, 0.10845947265625, 0.1297607421875, 0.15106201171875, 0.17236328125, 0.19366455078125, 0.2149658203125, 0.23626708984375, 0.257568359375, 0.27886962890625, 0.3001708984375, 0.32147216796875, 0.3427734375, 0.36407470703125, 0.3853759765625, 0.40667724609375, 0.427978515625, 0.44927978515625, 0.4705810546875, 0.49188232421875, 0.51318359375, 0.53448486328125, 0.5557861328125, 0.57708740234375, 0.598388671875, 0.61968994140625, 0.6409912109375, 0.66229248046875, 0.68359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 2.0, 2.0, 3.0, 4.0, 9.0, 6.0, 5.0, 15.0, 4.0, 18.0, 22.0, 35.0, 47.0, 75.0, 101.0, 136.0, 190.0, 331.0, 414.0, 681.0, 1053.0, 1620.0, 2601.0, 4179.0, 7128.0, 12850.0, 24706.0, 52972.0, 134391.0, 321822.0, 280379.0, 109201.0, 44156.0, 21350.0, 11227.0, 6320.0, 3806.0, 2250.0, 1501.0, 970.0, 629.0, 451.0, 274.0, 178.0, 149.0, 95.0, 51.0, 36.0, 31.0, 21.0, 21.0, 6.0, 14.0, 8.0, 2.0, 7.0, 5.0, 1.0, 3.0, 2.0, 3.0], "bins": [-0.03997802734375, -0.038762569427490234, -0.03754711151123047, -0.0363316535949707, -0.03511619567871094, -0.03390073776245117, -0.032685279846191406, -0.03146982192993164, -0.030254364013671875, -0.02903890609741211, -0.027823448181152344, -0.026607990264892578, -0.025392532348632812, -0.024177074432373047, -0.02296161651611328, -0.021746158599853516, -0.02053070068359375, -0.019315242767333984, -0.01809978485107422, -0.016884326934814453, -0.015668869018554688, -0.014453411102294922, -0.013237953186035156, -0.01202249526977539, -0.010807037353515625, -0.00959157943725586, -0.008376121520996094, -0.007160663604736328, -0.0059452056884765625, -0.004729747772216797, -0.0035142898559570312, -0.0022988319396972656, -0.0010833740234375, 0.00013208389282226562, 0.0013475418090820312, 0.002562999725341797, 0.0037784576416015625, 0.004993915557861328, 0.006209373474121094, 0.007424831390380859, 0.008640289306640625, 0.00985574722290039, 0.011071205139160156, 0.012286663055419922, 0.013502120971679688, 0.014717578887939453, 0.01593303680419922, 0.017148494720458984, 0.01836395263671875, 0.019579410552978516, 0.02079486846923828, 0.022010326385498047, 0.023225784301757812, 0.024441242218017578, 0.025656700134277344, 0.02687215805053711, 0.028087615966796875, 0.02930307388305664, 0.030518531799316406, 0.03173398971557617, 0.03294944763183594, 0.0341649055480957, 0.03538036346435547, 0.036595821380615234, 0.037811279296875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 5.0, 7.0, 9.0, 18.0, 23.0, 28.0, 55.0, 59.0, 121.0, 161.0, 170.0, 136.0, 71.0, 35.0, 22.0, 18.0, 13.0, 4.0, 9.0, 7.0, 7.0, 5.0, 4.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0650367736816406e-05, -3.89590859413147e-05, -3.726780414581299e-05, -3.557652235031128e-05, -3.388524055480957e-05, -3.219395875930786e-05, -3.0502676963806152e-05, -2.8811395168304443e-05, -2.7120113372802734e-05, -2.5428831577301025e-05, -2.3737549781799316e-05, -2.2046267986297607e-05, -2.03549861907959e-05, -1.866370439529419e-05, -1.697242259979248e-05, -1.528114080429077e-05, -1.3589859008789062e-05, -1.1898577213287354e-05, -1.0207295417785645e-05, -8.516013622283936e-06, -6.8247318267822266e-06, -5.133450031280518e-06, -3.4421682357788086e-06, -1.7508864402770996e-06, -5.960464477539063e-08, 1.6316771507263184e-06, 3.3229589462280273e-06, 5.014240741729736e-06, 6.705522537231445e-06, 8.396804332733154e-06, 1.0088086128234863e-05, 1.1779367923736572e-05, 1.3470649719238281e-05, 1.516193151473999e-05, 1.68532133102417e-05, 1.8544495105743408e-05, 2.0235776901245117e-05, 2.1927058696746826e-05, 2.3618340492248535e-05, 2.5309622287750244e-05, 2.7000904083251953e-05, 2.8692185878753662e-05, 3.038346767425537e-05, 3.207474946975708e-05, 3.376603126525879e-05, 3.54573130607605e-05, 3.714859485626221e-05, 3.8839876651763916e-05, 4.0531158447265625e-05, 4.2222440242767334e-05, 4.391372203826904e-05, 4.560500383377075e-05, 4.729628562927246e-05, 4.898756742477417e-05, 5.067884922027588e-05, 5.237013101577759e-05, 5.40614128112793e-05, 5.5752694606781006e-05, 5.7443976402282715e-05, 5.9135258197784424e-05, 6.082653999328613e-05, 6.251782178878784e-05, 6.420910358428955e-05, 6.590038537979126e-05, 6.759166717529297e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 7.0, 12.0, 11.0, 20.0, 66.0, 173.0, 816.0, 5592.0, 101636.0, 909208.0, 27561.0, 2731.0, 469.0, 132.0, 45.0, 24.0, 12.0, 7.0, 11.0, 3.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.28271484375, -0.27533721923828125, -0.2679595947265625, -0.26058197021484375, -0.253204345703125, -0.24582672119140625, -0.2384490966796875, -0.23107147216796875, -0.22369384765625, -0.21631622314453125, -0.2089385986328125, -0.20156097412109375, -0.194183349609375, -0.18680572509765625, -0.1794281005859375, -0.17205047607421875, -0.1646728515625, -0.15729522705078125, -0.1499176025390625, -0.14253997802734375, -0.135162353515625, -0.12778472900390625, -0.1204071044921875, -0.11302947998046875, -0.10565185546875, -0.09827423095703125, -0.0908966064453125, -0.08351898193359375, -0.076141357421875, -0.06876373291015625, -0.0613861083984375, -0.05400848388671875, -0.046630859375, -0.03925323486328125, -0.0318756103515625, -0.02449798583984375, -0.017120361328125, -0.00974273681640625, -0.0023651123046875, 0.00501251220703125, 0.01239013671875, 0.01976776123046875, 0.0271453857421875, 0.03452301025390625, 0.041900634765625, 0.04927825927734375, 0.0566558837890625, 0.06403350830078125, 0.0714111328125, 0.07878875732421875, 0.0861663818359375, 0.09354400634765625, 0.100921630859375, 0.10829925537109375, 0.1156768798828125, 0.12305450439453125, 0.13043212890625, 0.13780975341796875, 0.1451873779296875, 0.15256500244140625, 0.159942626953125, 0.16732025146484375, 0.1746978759765625, 0.18207550048828125, 0.189453125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 11.0, 9.0, 9.0, 10.0, 15.0, 22.0, 32.0, 34.0, 58.0, 72.0, 94.0, 104.0, 97.0, 96.0, 85.0, 61.0, 49.0, 34.0, 22.0, 19.0, 19.0, 14.0, 3.0, 9.0, 5.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0205078125, -0.019870519638061523, -0.019233226776123047, -0.01859593391418457, -0.017958641052246094, -0.017321348190307617, -0.01668405532836914, -0.016046762466430664, -0.015409469604492188, -0.014772176742553711, -0.014134883880615234, -0.013497591018676758, -0.012860298156738281, -0.012223005294799805, -0.011585712432861328, -0.010948419570922852, -0.010311126708984375, -0.009673833847045898, -0.009036540985107422, -0.008399248123168945, -0.007761955261230469, -0.007124662399291992, -0.006487369537353516, -0.005850076675415039, -0.0052127838134765625, -0.004575490951538086, -0.003938198089599609, -0.003300905227661133, -0.0026636123657226562, -0.0020263195037841797, -0.0013890266418457031, -0.0007517337799072266, -0.00011444091796875, 0.0005228519439697266, 0.0011601448059082031, 0.0017974376678466797, 0.0024347305297851562, 0.003072023391723633, 0.0037093162536621094, 0.004346609115600586, 0.0049839019775390625, 0.005621194839477539, 0.006258487701416016, 0.006895780563354492, 0.007533073425292969, 0.008170366287231445, 0.008807659149169922, 0.009444952011108398, 0.010082244873046875, 0.010719537734985352, 0.011356830596923828, 0.011994123458862305, 0.012631416320800781, 0.013268709182739258, 0.013906002044677734, 0.014543294906616211, 0.015180587768554688, 0.015817880630493164, 0.01645517349243164, 0.017092466354370117, 0.017729759216308594, 0.01836705207824707, 0.019004344940185547, 0.019641637802124023, 0.0202789306640625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 18.0, 79.0, 315.0, 441.0, 120.0, 25.0, 8.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8653119206428528, -0.770869791507721, -0.6764277219772339, -0.581985592842102, -0.4875434637069702, -0.3931013345718384, -0.2986592650413513, -0.20421713590621948, -0.10977500677108765, -0.015332892537117004, 0.07910922169685364, 0.17355132102966309, 0.2679934501647949, 0.36243557929992676, 0.4568776488304138, 0.5513197779655457, 0.6457619071006775, 0.7402040362358093, 0.8346461057662964, 0.9290882349014282, 1.02353036403656, 1.117972493171692, 1.2124145030975342, 1.306856632232666, 1.4012987613677979, 1.4957408905029297, 1.5901830196380615, 1.6846251487731934, 1.7790672779083252, 1.873509407043457, 1.9679514169692993, 2.0623936653137207, 2.1568355560302734, 2.2512776851654053, 2.345719814300537, 2.440161943435669, 2.534604072570801, 2.6290462017059326, 2.7234883308410645, 2.817930221557617, 2.912372589111328, 3.00681471824646, 3.101256847381592, 3.1956989765167236, 3.2901411056518555, 3.3845832347869873, 3.479025363922119, 3.573467254638672, 3.6679093837738037, 3.7623515129089355, 3.8567936420440674, 3.951235771179199, 4.045677661895752, 4.140120029449463, 4.234561920166016, 4.329004287719727, 4.423446178436279, 4.517888069152832, 4.612330436706543, 4.706772327423096, 4.801214694976807, 4.895656585693359, 4.99009895324707, 5.084540843963623, 5.178983211517334]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 6.0, 6.0, 9.0, 13.0, 18.0, 22.0, 16.0, 31.0, 35.0, 44.0, 44.0, 42.0, 44.0, 56.0, 62.0, 55.0, 62.0, 39.0, 49.0, 42.0, 47.0, 39.0, 39.0, 44.0, 33.0, 28.0, 17.0, 8.0, 13.0, 10.0, 9.0, 10.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.5836512446403503, -0.5690324306488037, -0.5544136166572571, -0.5397948026657104, -0.5251759886741638, -0.5105571746826172, -0.49593839049339294, -0.4813195765018463, -0.4667007625102997, -0.45208194851875305, -0.4374631345272064, -0.4228443503379822, -0.40822553634643555, -0.3936067223548889, -0.3789879083633423, -0.36436909437179565, -0.349750280380249, -0.3351314663887024, -0.32051265239715576, -0.30589383840560913, -0.2912750542163849, -0.27665624022483826, -0.2620374262332916, -0.247418612241745, -0.23279982805252075, -0.21818101406097412, -0.20356221497058868, -0.18894340097904205, -0.17432458698749542, -0.15970578789710999, -0.14508697390556335, -0.13046815991401672, -0.11584934592247009, -0.10123053938150406, -0.08661172538995743, -0.0719929188489914, -0.05737410858273506, -0.04275529831647873, -0.028136491775512695, -0.013517677783966064, 0.0011011287569999695, 0.015719939023256302, 0.030338747426867485, 0.04495755583047867, 0.059576366096735, 0.07419517636299133, 0.08881398290395737, 0.103432796895504, 0.11805160343647003, 0.13267041742801666, 0.1472892165184021, 0.16190803050994873, 0.17652684450149536, 0.191145658493042, 0.20576445758342743, 0.22038327157497406, 0.2350020706653595, 0.24962088465690613, 0.26423969864845276, 0.278858482837677, 0.29347729682922363, 0.30809611082077026, 0.3227149248123169, 0.3373337388038635, 0.35195255279541016]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 4.0, 2.0, 1.0, 7.0, 11.0, 6.0, 12.0, 22.0, 41.0, 82.0, 172.0, 377.0, 895.0, 2360.0, 6424.0, 21574.0, 99738.0, 651750.0, 213474.0, 36121.0, 9737.0, 3473.0, 1300.0, 532.0, 221.0, 107.0, 52.0, 23.0, 11.0, 9.0, 6.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94287109375, -0.9140243530273438, -0.8851776123046875, -0.8563308715820312, -0.827484130859375, -0.7986373901367188, -0.7697906494140625, -0.7409439086914062, -0.71209716796875, -0.6832504272460938, -0.6544036865234375, -0.6255569458007812, -0.596710205078125, -0.5678634643554688, -0.5390167236328125, -0.5101699829101562, -0.4813232421875, -0.45247650146484375, -0.4236297607421875, -0.39478302001953125, -0.365936279296875, -0.33708953857421875, -0.3082427978515625, -0.27939605712890625, -0.25054931640625, -0.22170257568359375, -0.1928558349609375, -0.16400909423828125, -0.135162353515625, -0.10631561279296875, -0.0774688720703125, -0.04862213134765625, -0.019775390625, 0.00907135009765625, 0.0379180908203125, 0.06676483154296875, 0.095611572265625, 0.12445831298828125, 0.1533050537109375, 0.18215179443359375, 0.21099853515625, 0.23984527587890625, 0.2686920166015625, 0.29753875732421875, 0.326385498046875, 0.35523223876953125, 0.3840789794921875, 0.41292572021484375, 0.4417724609375, 0.47061920166015625, 0.4994659423828125, 0.5283126831054688, 0.557159423828125, 0.5860061645507812, 0.6148529052734375, 0.6436996459960938, 0.67254638671875, 0.7013931274414062, 0.7302398681640625, 0.7590866088867188, 0.787933349609375, 0.8167800903320312, 0.8456268310546875, 0.8744735717773438, 0.9033203125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 7.0, 2.0, 7.0, 5.0, 11.0, 9.0, 17.0, 17.0, 23.0, 23.0, 36.0, 39.0, 31.0, 49.0, 47.0, 60.0, 56.0, 58.0, 70.0, 55.0, 57.0, 49.0, 45.0, 38.0, 33.0, 39.0, 23.0, 17.0, 26.0, 17.0, 8.0, 13.0, 5.0, 7.0, 4.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.109375, -1.079345703125, -1.04931640625, -1.019287109375, -0.9892578125, -0.959228515625, -0.92919921875, -0.899169921875, -0.869140625, -0.839111328125, -0.80908203125, -0.779052734375, -0.7490234375, -0.718994140625, -0.68896484375, -0.658935546875, -0.62890625, -0.598876953125, -0.56884765625, -0.538818359375, -0.5087890625, -0.478759765625, -0.44873046875, -0.418701171875, -0.388671875, -0.358642578125, -0.32861328125, -0.298583984375, -0.2685546875, -0.238525390625, -0.20849609375, -0.178466796875, -0.1484375, -0.118408203125, -0.08837890625, -0.058349609375, -0.0283203125, 0.001708984375, 0.03173828125, 0.061767578125, 0.091796875, 0.121826171875, 0.15185546875, 0.181884765625, 0.2119140625, 0.241943359375, 0.27197265625, 0.302001953125, 0.33203125, 0.362060546875, 0.39208984375, 0.422119140625, 0.4521484375, 0.482177734375, 0.51220703125, 0.542236328125, 0.572265625, 0.602294921875, 0.63232421875, 0.662353515625, 0.6923828125, 0.722412109375, 0.75244140625, 0.782470703125, 0.8125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 6.0, 5.0, 8.0, 5.0, 7.0, 10.0, 16.0, 19.0, 16.0, 26.0, 29.0, 32.0, 42.0, 46.0, 77.0, 107.0, 168.0, 417.0, 2674.0, 64246.0, 957400.0, 20918.0, 1338.0, 334.0, 158.0, 87.0, 74.0, 60.0, 41.0, 40.0, 32.0, 14.0, 17.0, 14.0, 15.0, 9.0, 9.0, 9.0, 13.0, 8.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.24609375, -2.174468994140625, -2.10284423828125, -2.031219482421875, -1.9595947265625, -1.887969970703125, -1.81634521484375, -1.744720458984375, -1.673095703125, -1.601470947265625, -1.52984619140625, -1.458221435546875, -1.3865966796875, -1.314971923828125, -1.24334716796875, -1.171722412109375, -1.10009765625, -1.028472900390625, -0.95684814453125, -0.885223388671875, -0.8135986328125, -0.741973876953125, -0.67034912109375, -0.598724365234375, -0.527099609375, -0.455474853515625, -0.38385009765625, -0.312225341796875, -0.2406005859375, -0.168975830078125, -0.09735107421875, -0.025726318359375, 0.0458984375, 0.117523193359375, 0.18914794921875, 0.260772705078125, 0.3323974609375, 0.404022216796875, 0.47564697265625, 0.547271728515625, 0.618896484375, 0.690521240234375, 0.76214599609375, 0.833770751953125, 0.9053955078125, 0.977020263671875, 1.04864501953125, 1.120269775390625, 1.19189453125, 1.263519287109375, 1.33514404296875, 1.406768798828125, 1.4783935546875, 1.550018310546875, 1.62164306640625, 1.693267822265625, 1.764892578125, 1.836517333984375, 1.90814208984375, 1.979766845703125, 2.0513916015625, 2.123016357421875, 2.19464111328125, 2.266265869140625, 2.337890625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 4.0, 1.0, 4.0, 4.0, 4.0, 8.0, 12.0, 7.0, 15.0, 11.0, 23.0, 12.0, 19.0, 18.0, 24.0, 23.0, 38.0, 35.0, 28.0, 37.0, 39.0, 39.0, 49.0, 33.0, 52.0, 41.0, 45.0, 51.0, 41.0, 32.0, 32.0, 33.0, 31.0, 24.0, 26.0, 18.0, 15.0, 8.0, 11.0, 13.0, 11.0, 6.0, 6.0, 7.0, 8.0, 3.0, 0.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.62744140625, -0.6047515869140625, -0.582061767578125, -0.5593719482421875, -0.53668212890625, -0.5139923095703125, -0.491302490234375, -0.4686126708984375, -0.4459228515625, -0.4232330322265625, -0.400543212890625, -0.3778533935546875, -0.35516357421875, -0.3324737548828125, -0.309783935546875, -0.2870941162109375, -0.264404296875, -0.2417144775390625, -0.219024658203125, -0.1963348388671875, -0.17364501953125, -0.1509552001953125, -0.128265380859375, -0.1055755615234375, -0.0828857421875, -0.0601959228515625, -0.037506103515625, -0.0148162841796875, 0.00787353515625, 0.0305633544921875, 0.053253173828125, 0.0759429931640625, 0.0986328125, 0.1213226318359375, 0.144012451171875, 0.1667022705078125, 0.18939208984375, 0.2120819091796875, 0.234771728515625, 0.2574615478515625, 0.2801513671875, 0.3028411865234375, 0.325531005859375, 0.3482208251953125, 0.37091064453125, 0.3936004638671875, 0.416290283203125, 0.4389801025390625, 0.461669921875, 0.4843597412109375, 0.507049560546875, 0.5297393798828125, 0.55242919921875, 0.5751190185546875, 0.597808837890625, 0.6204986572265625, 0.6431884765625, 0.6658782958984375, 0.688568115234375, 0.7112579345703125, 0.73394775390625, 0.7566375732421875, 0.779327392578125, 0.8020172119140625, 0.82470703125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 6.0, 0.0, 3.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 4.0, 3.0, 10.0, 21.0, 31.0, 38.0, 79.0, 131.0, 278.0, 548.0, 1204.0, 3299.0, 12407.0, 90313.0, 796654.0, 122023.0, 15235.0, 3711.0, 1270.0, 616.0, 287.0, 150.0, 91.0, 49.0, 33.0, 15.0, 9.0, 9.0, 7.0, 6.0, 5.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.328125, -0.3186302185058594, -0.30913543701171875, -0.2996406555175781, -0.2901458740234375, -0.2806510925292969, -0.27115631103515625, -0.2616615295410156, -0.252166748046875, -0.24267196655273438, -0.23317718505859375, -0.22368240356445312, -0.2141876220703125, -0.20469284057617188, -0.19519805908203125, -0.18570327758789062, -0.17620849609375, -0.16671371459960938, -0.15721893310546875, -0.14772415161132812, -0.1382293701171875, -0.12873458862304688, -0.11923980712890625, -0.10974502563476562, -0.100250244140625, -0.09075546264648438, -0.08126068115234375, -0.07176589965820312, -0.0622711181640625, -0.052776336669921875, -0.04328155517578125, -0.033786773681640625, -0.0242919921875, -0.014797210693359375, -0.00530242919921875, 0.004192352294921875, 0.0136871337890625, 0.023181915283203125, 0.03267669677734375, 0.042171478271484375, 0.051666259765625, 0.061161041259765625, 0.07065582275390625, 0.08015060424804688, 0.0896453857421875, 0.09914016723632812, 0.10863494873046875, 0.11812973022460938, 0.12762451171875, 0.13711929321289062, 0.14661407470703125, 0.15610885620117188, 0.1656036376953125, 0.17509841918945312, 0.18459320068359375, 0.19408798217773438, 0.203582763671875, 0.21307754516601562, 0.22257232666015625, 0.23206710815429688, 0.2415618896484375, 0.2510566711425781, 0.26055145263671875, 0.2700462341308594, 0.279541015625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 7.0, 11.0, 14.0, 25.0, 46.0, 73.0, 188.0, 283.0, 158.0, 80.0, 43.0, 33.0, 21.0, 13.0, 6.0, 6.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.955862045288086e-05, -6.759818643331528e-05, -6.56377524137497e-05, -6.367731839418411e-05, -6.171688437461853e-05, -5.975645035505295e-05, -5.7796016335487366e-05, -5.5835582315921783e-05, -5.38751482963562e-05, -5.191471427679062e-05, -4.995428025722504e-05, -4.7993846237659454e-05, -4.603341221809387e-05, -4.407297819852829e-05, -4.211254417896271e-05, -4.0152110159397125e-05, -3.819167613983154e-05, -3.623124212026596e-05, -3.427080810070038e-05, -3.2310374081134796e-05, -3.0349940061569214e-05, -2.838950604200363e-05, -2.642907202243805e-05, -2.4468638002872467e-05, -2.2508203983306885e-05, -2.0547769963741302e-05, -1.858733594417572e-05, -1.6626901924610138e-05, -1.4666467905044556e-05, -1.2706033885478973e-05, -1.0745599865913391e-05, -8.785165846347809e-06, -6.8247318267822266e-06, -4.864297807216644e-06, -2.903863787651062e-06, -9.434297680854797e-07, 1.0170042514801025e-06, 2.977438271045685e-06, 4.937872290611267e-06, 6.898306310176849e-06, 8.858740329742432e-06, 1.0819174349308014e-05, 1.2779608368873596e-05, 1.4740042388439178e-05, 1.670047640800476e-05, 1.8660910427570343e-05, 2.0621344447135925e-05, 2.2581778466701508e-05, 2.454221248626709e-05, 2.6502646505832672e-05, 2.8463080525398254e-05, 3.0423514544963837e-05, 3.238394856452942e-05, 3.4344382584095e-05, 3.6304816603660583e-05, 3.8265250623226166e-05, 4.022568464279175e-05, 4.218611866235733e-05, 4.414655268192291e-05, 4.6106986701488495e-05, 4.806742072105408e-05, 5.002785474061966e-05, 5.198828876018524e-05, 5.3948722779750824e-05, 5.5909156799316406e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 9.0, 10.0, 20.0, 16.0, 38.0, 63.0, 115.0, 243.0, 489.0, 1150.0, 3799.0, 23596.0, 554629.0, 437965.0, 20652.0, 3642.0, 1095.0, 456.0, 256.0, 117.0, 68.0, 43.0, 30.0, 13.0, 4.0, 6.0, 4.0, 7.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.42431640625, -0.4121818542480469, -0.40004730224609375, -0.3879127502441406, -0.3757781982421875, -0.3636436462402344, -0.35150909423828125, -0.3393745422363281, -0.327239990234375, -0.3151054382324219, -0.30297088623046875, -0.2908363342285156, -0.2787017822265625, -0.2665672302246094, -0.25443267822265625, -0.24229812622070312, -0.23016357421875, -0.21802902221679688, -0.20589447021484375, -0.19375991821289062, -0.1816253662109375, -0.16949081420898438, -0.15735626220703125, -0.14522171020507812, -0.133087158203125, -0.12095260620117188, -0.10881805419921875, -0.09668350219726562, -0.0845489501953125, -0.07241439819335938, -0.06027984619140625, -0.048145294189453125, -0.0360107421875, -0.023876190185546875, -0.01174163818359375, 0.000392913818359375, 0.0125274658203125, 0.024662017822265625, 0.03679656982421875, 0.048931121826171875, 0.061065673828125, 0.07320022583007812, 0.08533477783203125, 0.09746932983398438, 0.1096038818359375, 0.12173843383789062, 0.13387298583984375, 0.14600753784179688, 0.15814208984375, 0.17027664184570312, 0.18241119384765625, 0.19454574584960938, 0.2066802978515625, 0.21881484985351562, 0.23094940185546875, 0.24308395385742188, 0.255218505859375, 0.2673530578613281, 0.27948760986328125, 0.2916221618652344, 0.3037567138671875, 0.3158912658691406, 0.32802581787109375, 0.3401603698730469, 0.352294921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 9.0, 5.0, 16.0, 18.0, 28.0, 28.0, 50.0, 54.0, 70.0, 125.0, 121.0, 121.0, 93.0, 67.0, 40.0, 44.0, 29.0, 30.0, 10.0, 6.0, 10.0, 8.0, 6.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.090576171875, -0.0873727798461914, -0.08416938781738281, -0.08096599578857422, -0.07776260375976562, -0.07455921173095703, -0.07135581970214844, -0.06815242767333984, -0.06494903564453125, -0.061745643615722656, -0.05854225158691406, -0.05533885955810547, -0.052135467529296875, -0.04893207550048828, -0.04572868347167969, -0.042525291442871094, -0.0393218994140625, -0.036118507385253906, -0.03291511535644531, -0.02971172332763672, -0.026508331298828125, -0.02330493927001953, -0.020101547241210938, -0.016898155212402344, -0.01369476318359375, -0.010491371154785156, -0.0072879791259765625, -0.004084587097167969, -0.000881195068359375, 0.0023221969604492188, 0.0055255889892578125, 0.008728981018066406, 0.011932373046875, 0.015135765075683594, 0.018339157104492188, 0.02154254913330078, 0.024745941162109375, 0.02794933319091797, 0.031152725219726562, 0.034356117248535156, 0.03755950927734375, 0.040762901306152344, 0.04396629333496094, 0.04716968536376953, 0.050373077392578125, 0.05357646942138672, 0.05677986145019531, 0.059983253479003906, 0.0631866455078125, 0.0663900375366211, 0.06959342956542969, 0.07279682159423828, 0.07600021362304688, 0.07920360565185547, 0.08240699768066406, 0.08561038970947266, 0.08881378173828125, 0.09201717376708984, 0.09522056579589844, 0.09842395782470703, 0.10162734985351562, 0.10483074188232422, 0.10803413391113281, 0.1112375259399414, 0.11444091796875]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 5.0, 23.0, 20.0, 40.0, 68.0, 115.0, 114.0, 169.0, 156.0, 119.0, 60.0, 47.0, 25.0, 20.0, 7.0, 6.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2506989240646362, -1.1903655529022217, -1.1300321817398071, -1.0696988105773926, -1.009365439414978, -0.9490320682525635, -0.8886986970901489, -0.8283653259277344, -0.7680319547653198, -0.7076985836029053, -0.6473652124404907, -0.5870318412780762, -0.5266984701156616, -0.46636509895324707, -0.4060317277908325, -0.34569835662841797, -0.2853649854660034, -0.22503161430358887, -0.16469824314117432, -0.10436487197875977, -0.044031500816345215, 0.016301870346069336, 0.07663524150848389, 0.13696861267089844, 0.197301983833313, 0.25763535499572754, 0.3179687261581421, 0.37830209732055664, 0.4386354684829712, 0.49896883964538574, 0.5593022108078003, 0.6196355819702148, 0.6799688339233398, 0.7403022050857544, 0.800635576248169, 0.8609689474105835, 0.921302318572998, 0.9816356897354126, 1.0419690608978271, 1.1023024320602417, 1.1626358032226562, 1.2229691743850708, 1.2833025455474854, 1.3436359167099, 1.4039692878723145, 1.464302659034729, 1.5246360301971436, 1.584969401359558, 1.6453027725219727, 1.7056361436843872, 1.7659695148468018, 1.8263028860092163, 1.8866362571716309, 1.9469696283340454, 2.00730299949646, 2.067636489868164, 2.127969741821289, 2.188302993774414, 2.248636484146118, 2.3089699745178223, 2.3693032264709473, 2.4296364784240723, 2.4899699687957764, 2.5503034591674805, 2.6106367111206055]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 3.0, 5.0, 9.0, 8.0, 8.0, 11.0, 13.0, 19.0, 28.0, 25.0, 32.0, 34.0, 36.0, 31.0, 48.0, 42.0, 32.0, 47.0, 48.0, 36.0, 47.0, 43.0, 56.0, 44.0, 47.0, 29.0, 36.0, 27.0, 27.0, 19.0, 21.0, 19.0, 12.0, 13.0, 18.0, 7.0, 4.0, 5.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0], "bins": [-1.6092500686645508, -1.5667966604232788, -1.5243432521820068, -1.4818898439407349, -1.439436435699463, -1.3969831466674805, -1.354529619216919, -1.3120763301849365, -1.2696229219436646, -1.2271695137023926, -1.1847161054611206, -1.1422626972198486, -1.0998092889785767, -1.0573558807373047, -1.0149025917053223, -0.9724491834640503, -0.9299957156181335, -0.8875423073768616, -0.8450888991355896, -0.8026355504989624, -0.7601821422576904, -0.7177287340164185, -0.6752753257751465, -0.6328219175338745, -0.5903685092926025, -0.5479151010513306, -0.5054616928100586, -0.463008314371109, -0.4205549359321594, -0.37810152769088745, -0.3356481194496155, -0.2931947410106659, -0.2507413625717163, -0.20828796923160553, -0.16583457589149475, -0.12338116765022278, -0.080927774310112, -0.03847438097000122, 0.003979027271270752, 0.04643240571022034, 0.08888581395149231, 0.1313392072916031, 0.17379260063171387, 0.21624600887298584, 0.2586994171142578, 0.3011527955532074, 0.34360620379447937, 0.38605958223342896, 0.4285129904747009, 0.4709663987159729, 0.5134198069572449, 0.5558731555938721, 0.598326563835144, 0.640779972076416, 0.683233380317688, 0.72568678855896, 0.7681401968002319, 0.8105936050415039, 0.8530470132827759, 0.8955004215240479, 0.937953770160675, 0.980407178401947, 1.0228605270385742, 1.0653139352798462, 1.1077673435211182]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 8.0, 16.0, 26.0, 55.0, 101.0, 420.0, 1819.0, 14191.0, 2519875.0, 1642499.0, 12642.0, 1950.0, 387.0, 140.0, 52.0, 32.0, 21.0, 16.0, 7.0, 5.0, 5.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.23828125, -3.145660400390625, -3.05303955078125, -2.960418701171875, -2.8677978515625, -2.775177001953125, -2.68255615234375, -2.589935302734375, -2.497314453125, -2.404693603515625, -2.31207275390625, -2.219451904296875, -2.1268310546875, -2.034210205078125, -1.94158935546875, -1.848968505859375, -1.75634765625, -1.663726806640625, -1.57110595703125, -1.478485107421875, -1.3858642578125, -1.293243408203125, -1.20062255859375, -1.108001708984375, -1.015380859375, -0.922760009765625, -0.83013916015625, -0.737518310546875, -0.6448974609375, -0.552276611328125, -0.45965576171875, -0.367034912109375, -0.2744140625, -0.181793212890625, -0.08917236328125, 0.003448486328125, 0.0960693359375, 0.188690185546875, 0.28131103515625, 0.373931884765625, 0.466552734375, 0.559173583984375, 0.65179443359375, 0.744415283203125, 0.8370361328125, 0.929656982421875, 1.02227783203125, 1.114898681640625, 1.20751953125, 1.300140380859375, 1.39276123046875, 1.485382080078125, 1.5780029296875, 1.670623779296875, 1.76324462890625, 1.855865478515625, 1.948486328125, 2.041107177734375, 2.13372802734375, 2.226348876953125, 2.3189697265625, 2.411590576171875, 2.50421142578125, 2.596832275390625, 2.689453125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 9.0, 13.0, 16.0, 19.0, 21.0, 25.0, 39.0, 50.0, 56.0, 57.0, 55.0, 77.0, 71.0, 65.0, 75.0, 66.0, 59.0, 54.0, 46.0, 36.0, 24.0, 21.0, 9.0, 16.0, 9.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99267578125, -0.9677047729492188, -0.9427337646484375, -0.9177627563476562, -0.892791748046875, -0.8678207397460938, -0.8428497314453125, -0.8178787231445312, -0.79290771484375, -0.7679367065429688, -0.7429656982421875, -0.7179946899414062, -0.693023681640625, -0.6680526733398438, -0.6430816650390625, -0.6181106567382812, -0.5931396484375, -0.5681686401367188, -0.5431976318359375, -0.5182266235351562, -0.493255615234375, -0.46828460693359375, -0.4433135986328125, -0.41834259033203125, -0.39337158203125, -0.36840057373046875, -0.3434295654296875, -0.31845855712890625, -0.293487548828125, -0.26851654052734375, -0.2435455322265625, -0.21857452392578125, -0.193603515625, -0.16863250732421875, -0.1436614990234375, -0.11869049072265625, -0.093719482421875, -0.06874847412109375, -0.0437774658203125, -0.01880645751953125, 0.00616455078125, 0.03113555908203125, 0.0561065673828125, 0.08107757568359375, 0.106048583984375, 0.13101959228515625, 0.1559906005859375, 0.18096160888671875, 0.2059326171875, 0.23090362548828125, 0.2558746337890625, 0.28084564208984375, 0.305816650390625, 0.33078765869140625, 0.3557586669921875, 0.38072967529296875, 0.40570068359375, 0.43067169189453125, 0.4556427001953125, 0.48061370849609375, 0.505584716796875, 0.5305557250976562, 0.5555267333984375, 0.5804977416992188, 0.60546875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 6.0, 5.0, 12.0, 13.0, 14.0, 9.0, 22.0, 46.0, 54.0, 84.0, 139.0, 217.0, 415.0, 1017.0, 3731.0, 23063.0, 709918.0, 3399770.0, 47031.0, 5989.0, 1482.0, 557.0, 258.0, 149.0, 86.0, 65.0, 36.0, 28.0, 22.0, 16.0, 12.0, 10.0, 2.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4306640625, -1.384735107421875, -1.33880615234375, -1.292877197265625, -1.2469482421875, -1.201019287109375, -1.15509033203125, -1.109161376953125, -1.063232421875, -1.017303466796875, -0.97137451171875, -0.925445556640625, -0.8795166015625, -0.833587646484375, -0.78765869140625, -0.741729736328125, -0.69580078125, -0.649871826171875, -0.60394287109375, -0.558013916015625, -0.5120849609375, -0.466156005859375, -0.42022705078125, -0.374298095703125, -0.328369140625, -0.282440185546875, -0.23651123046875, -0.190582275390625, -0.1446533203125, -0.098724365234375, -0.05279541015625, -0.006866455078125, 0.0390625, 0.084991455078125, 0.13092041015625, 0.176849365234375, 0.2227783203125, 0.268707275390625, 0.31463623046875, 0.360565185546875, 0.406494140625, 0.452423095703125, 0.49835205078125, 0.544281005859375, 0.5902099609375, 0.636138916015625, 0.68206787109375, 0.727996826171875, 0.77392578125, 0.819854736328125, 0.86578369140625, 0.911712646484375, 0.9576416015625, 1.003570556640625, 1.04949951171875, 1.095428466796875, 1.141357421875, 1.187286376953125, 1.23321533203125, 1.279144287109375, 1.3250732421875, 1.371002197265625, 1.41693115234375, 1.462860107421875, 1.5087890625]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 6.0, 7.0, 12.0, 19.0, 28.0, 39.0, 82.0, 139.0, 285.0, 633.0, 1189.0, 876.0, 345.0, 169.0, 95.0, 49.0, 43.0, 19.0, 19.0, 8.0, 10.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.415283203125, -0.4029541015625, -0.390625, -0.3782958984375, -0.365966796875, -0.3536376953125, -0.34130859375, -0.3289794921875, -0.316650390625, -0.3043212890625, -0.2919921875, -0.2796630859375, -0.267333984375, -0.2550048828125, -0.24267578125, -0.2303466796875, -0.218017578125, -0.2056884765625, -0.193359375, -0.1810302734375, -0.168701171875, -0.1563720703125, -0.14404296875, -0.1317138671875, -0.119384765625, -0.1070556640625, -0.0947265625, -0.0823974609375, -0.070068359375, -0.0577392578125, -0.04541015625, -0.0330810546875, -0.020751953125, -0.0084228515625, 0.00390625, 0.0162353515625, 0.028564453125, 0.0408935546875, 0.05322265625, 0.0655517578125, 0.077880859375, 0.0902099609375, 0.1025390625, 0.1148681640625, 0.127197265625, 0.1395263671875, 0.15185546875, 0.1641845703125, 0.176513671875, 0.1888427734375, 0.201171875, 0.2135009765625, 0.225830078125, 0.2381591796875, 0.25048828125, 0.2628173828125, 0.275146484375, 0.2874755859375, 0.2998046875, 0.3121337890625, 0.324462890625, 0.3367919921875, 0.34912109375, 0.3614501953125, 0.373779296875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 12.0, 18.0, 38.0, 51.0, 86.0, 146.0, 183.0, 194.0, 126.0, 67.0, 34.0, 22.0, 13.0, 6.0, 7.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7321183681488037, -0.6793529391288757, -0.6265875101089478, -0.573822021484375, -0.5210566520690918, -0.46829119324684143, -0.41552573442459106, -0.3627603054046631, -0.3099948763847351, -0.25722944736480713, -0.20446400344371796, -0.15169855952262878, -0.0989331305027008, -0.04616770148277283, 0.006597757339477539, 0.05936318635940552, 0.1121286153793335, 0.16489404439926147, 0.21765948832035065, 0.2704249322414398, 0.3231903612613678, 0.3759557902812958, 0.42872124910354614, 0.4814866781234741, 0.5342521071434021, 0.5870175361633301, 0.6397829651832581, 0.692548394203186, 0.7453138828277588, 0.798079252243042, 0.8508447408676147, 0.9036101698875427, 0.9563755989074707, 1.0091410875320435, 1.0619064569473267, 1.1146719455718994, 1.1674373149871826, 1.2202028036117554, 1.2729682922363281, 1.3257336616516113, 1.3784990310668945, 1.4312645196914673, 1.4840298891067505, 1.5367953777313232, 1.5895607471466064, 1.6423262357711792, 1.695091724395752, 1.7478570938110352, 1.800622582435608, 1.8533880710601807, 1.9061534404754639, 1.9589189291000366, 2.0116844177246094, 2.0644497871398926, 2.117215156555176, 2.169980525970459, 2.2227461338043213, 2.2755115032196045, 2.328277111053467, 2.38104248046875, 2.433807849884033, 2.4865732192993164, 2.5393388271331787, 2.592104196548462, 2.644869565963745]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 5.0, 6.0, 8.0, 9.0, 7.0, 18.0, 25.0, 28.0, 26.0, 33.0, 37.0, 49.0, 52.0, 53.0, 57.0, 64.0, 58.0, 74.0, 60.0, 49.0, 40.0, 42.0, 33.0, 39.0, 34.0, 26.0, 21.0, 15.0, 6.0, 10.0, 6.0, 8.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7617505788803101, -0.7377254366874695, -0.7137002944946289, -0.6896751523017883, -0.6656500101089478, -0.6416248679161072, -0.6175997257232666, -0.593574583530426, -0.5695494413375854, -0.5455242991447449, -0.5214991569519043, -0.4974740147590637, -0.47344887256622314, -0.44942373037338257, -0.425398588180542, -0.4013734459877014, -0.37734827399253845, -0.3533231317996979, -0.3292979896068573, -0.3052728474140167, -0.28124770522117615, -0.25722256302833557, -0.2331974059343338, -0.20917226374149323, -0.18514712154865265, -0.16112197935581207, -0.1370968371629715, -0.11307168751955032, -0.08904654532670975, -0.06502140313386917, -0.040996253490448, -0.016971111297607422, 0.007054030895233154, 0.03107917495071888, 0.055104319006204605, 0.07912946492433548, 0.10315460711717606, 0.12717974185943604, 0.1512048989534378, 0.17523004114627838, 0.19925518333911896, 0.22328032553195953, 0.2473054677248001, 0.2713306248188019, 0.29535576701164246, 0.31938090920448303, 0.3434060513973236, 0.3674311935901642, 0.39145633578300476, 0.41548147797584534, 0.4395066201686859, 0.4635317623615265, 0.48755690455436707, 0.51158207654953, 0.5356072187423706, 0.5596323609352112, 0.5836575031280518, 0.6076826453208923, 0.6317077875137329, 0.6557329297065735, 0.6797580718994141, 0.7037832140922546, 0.7278083562850952, 0.7518334984779358, 0.7758586406707764]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 4.0, 9.0, 11.0, 17.0, 21.0, 48.0, 55.0, 116.0, 311.0, 809.0, 3065.0, 18656.0, 187226.0, 722733.0, 100777.0, 11403.0, 2185.0, 658.0, 204.0, 111.0, 43.0, 35.0, 25.0, 13.0, 7.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2357177734375, -0.22741127014160156, -0.21910476684570312, -0.2107982635498047, -0.20249176025390625, -0.1941852569580078, -0.18587875366210938, -0.17757225036621094, -0.1692657470703125, -0.16095924377441406, -0.15265274047851562, -0.1443462371826172, -0.13603973388671875, -0.1277332305908203, -0.11942672729492188, -0.11112022399902344, -0.102813720703125, -0.09450721740722656, -0.08620071411132812, -0.07789421081542969, -0.06958770751953125, -0.06128120422363281, -0.052974700927734375, -0.04466819763183594, -0.0363616943359375, -0.028055191040039062, -0.019748687744140625, -0.011442184448242188, -0.00313568115234375, 0.0051708221435546875, 0.013477325439453125, 0.021783828735351562, 0.03009033203125, 0.03839683532714844, 0.046703338623046875, 0.05500984191894531, 0.06331634521484375, 0.07162284851074219, 0.07992935180664062, 0.08823585510253906, 0.0965423583984375, 0.10484886169433594, 0.11315536499023438, 0.12146186828613281, 0.12976837158203125, 0.1380748748779297, 0.14638137817382812, 0.15468788146972656, 0.162994384765625, 0.17130088806152344, 0.17960739135742188, 0.1879138946533203, 0.19622039794921875, 0.2045269012451172, 0.21283340454101562, 0.22113990783691406, 0.2294464111328125, 0.23775291442871094, 0.24605941772460938, 0.2543659210205078, 0.26267242431640625, 0.2709789276123047, 0.2792854309082031, 0.28759193420410156, 0.2958984375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 9.0, 16.0, 11.0, 24.0, 36.0, 48.0, 60.0, 73.0, 84.0, 96.0, 102.0, 93.0, 79.0, 70.0, 47.0, 42.0, 48.0, 29.0, 11.0, 9.0, 8.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91552734375, -0.8916854858398438, -0.8678436279296875, -0.8440017700195312, -0.820159912109375, -0.7963180541992188, -0.7724761962890625, -0.7486343383789062, -0.72479248046875, -0.7009506225585938, -0.6771087646484375, -0.6532669067382812, -0.629425048828125, -0.6055831909179688, -0.5817413330078125, -0.5578994750976562, -0.5340576171875, -0.5102157592773438, -0.4863739013671875, -0.46253204345703125, -0.438690185546875, -0.41484832763671875, -0.3910064697265625, -0.36716461181640625, -0.34332275390625, -0.31948089599609375, -0.2956390380859375, -0.27179718017578125, -0.247955322265625, -0.22411346435546875, -0.2002716064453125, -0.17642974853515625, -0.152587890625, -0.12874603271484375, -0.1049041748046875, -0.08106231689453125, -0.057220458984375, -0.03337860107421875, -0.0095367431640625, 0.01430511474609375, 0.03814697265625, 0.06198883056640625, 0.0858306884765625, 0.10967254638671875, 0.133514404296875, 0.15735626220703125, 0.1811981201171875, 0.20503997802734375, 0.2288818359375, 0.25272369384765625, 0.2765655517578125, 0.30040740966796875, 0.324249267578125, 0.34809112548828125, 0.3719329833984375, 0.39577484130859375, 0.41961669921875, 0.44345855712890625, 0.4673004150390625, 0.49114227294921875, 0.514984130859375, 0.5388259887695312, 0.5626678466796875, 0.5865097045898438, 0.6103515625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 6.0, 10.0, 10.0, 13.0, 24.0, 35.0, 61.0, 128.0, 184.0, 299.0, 680.0, 1417.0, 3947.0, 13169.0, 55323.0, 274765.0, 516057.0, 141012.0, 29207.0, 7497.0, 2489.0, 1085.0, 478.0, 273.0, 143.0, 89.0, 49.0, 29.0, 29.0, 15.0, 10.0, 3.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.193603515625, -0.18854713439941406, -0.18349075317382812, -0.1784343719482422, -0.17337799072265625, -0.1683216094970703, -0.16326522827148438, -0.15820884704589844, -0.1531524658203125, -0.14809608459472656, -0.14303970336914062, -0.1379833221435547, -0.13292694091796875, -0.1278705596923828, -0.12281417846679688, -0.11775779724121094, -0.112701416015625, -0.10764503479003906, -0.10258865356445312, -0.09753227233886719, -0.09247589111328125, -0.08741950988769531, -0.08236312866210938, -0.07730674743652344, -0.0722503662109375, -0.06719398498535156, -0.062137603759765625, -0.05708122253417969, -0.05202484130859375, -0.04696846008300781, -0.041912078857421875, -0.03685569763183594, -0.03179931640625, -0.026742935180664062, -0.021686553955078125, -0.016630172729492188, -0.01157379150390625, -0.0065174102783203125, -0.001461029052734375, 0.0035953521728515625, 0.0086517333984375, 0.013708114624023438, 0.018764495849609375, 0.023820877075195312, 0.02887725830078125, 0.03393363952636719, 0.038990020751953125, 0.04404640197753906, 0.049102783203125, 0.05415916442871094, 0.059215545654296875, 0.06427192687988281, 0.06932830810546875, 0.07438468933105469, 0.07944107055664062, 0.08449745178222656, 0.0895538330078125, 0.09461021423339844, 0.09966659545898438, 0.10472297668457031, 0.10977935791015625, 0.11483573913574219, 0.11989212036132812, 0.12494850158691406, 0.1300048828125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 6.0, 2.0, 10.0, 9.0, 6.0, 12.0, 17.0, 18.0, 27.0, 24.0, 23.0, 25.0, 17.0, 34.0, 36.0, 40.0, 43.0, 37.0, 45.0, 60.0, 45.0, 45.0, 58.0, 54.0, 47.0, 37.0, 28.0, 26.0, 37.0, 21.0, 25.0, 21.0, 19.0, 10.0, 9.0, 11.0, 10.0, 2.0, 1.0, 1.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65283203125, -0.6292190551757812, -0.6056060791015625, -0.5819931030273438, -0.558380126953125, -0.5347671508789062, -0.5111541748046875, -0.48754119873046875, -0.46392822265625, -0.44031524658203125, -0.4167022705078125, -0.39308929443359375, -0.369476318359375, -0.34586334228515625, -0.3222503662109375, -0.29863739013671875, -0.2750244140625, -0.25141143798828125, -0.2277984619140625, -0.20418548583984375, -0.180572509765625, -0.15695953369140625, -0.1333465576171875, -0.10973358154296875, -0.08612060546875, -0.06250762939453125, -0.0388946533203125, -0.01528167724609375, 0.008331298828125, 0.03194427490234375, 0.0555572509765625, 0.07917022705078125, 0.102783203125, 0.12639617919921875, 0.1500091552734375, 0.17362213134765625, 0.197235107421875, 0.22084808349609375, 0.2444610595703125, 0.26807403564453125, 0.29168701171875, 0.31529998779296875, 0.3389129638671875, 0.36252593994140625, 0.386138916015625, 0.40975189208984375, 0.4333648681640625, 0.45697784423828125, 0.4805908203125, 0.5042037963867188, 0.5278167724609375, 0.5514297485351562, 0.575042724609375, 0.5986557006835938, 0.6222686767578125, 0.6458816528320312, 0.66949462890625, 0.6931076049804688, 0.7167205810546875, 0.7403335571289062, 0.763946533203125, 0.7875595092773438, 0.8111724853515625, 0.8347854614257812, 0.8583984375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 6.0, 7.0, 10.0, 13.0, 23.0, 38.0, 67.0, 118.0, 160.0, 310.0, 544.0, 1059.0, 2104.0, 5011.0, 13291.0, 42873.0, 167786.0, 484776.0, 241581.0, 59449.0, 17571.0, 6420.0, 2629.0, 1254.0, 624.0, 307.0, 183.0, 119.0, 61.0, 43.0, 33.0, 27.0, 13.0, 7.0, 9.0, 8.0, 2.0, 1.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.035247802734375, -0.03401660919189453, -0.03278541564941406, -0.031554222106933594, -0.030323028564453125, -0.029091835021972656, -0.027860641479492188, -0.02662944793701172, -0.02539825439453125, -0.02416706085205078, -0.022935867309570312, -0.021704673767089844, -0.020473480224609375, -0.019242286682128906, -0.018011093139648438, -0.01677989959716797, -0.0155487060546875, -0.014317512512207031, -0.013086318969726562, -0.011855125427246094, -0.010623931884765625, -0.009392738342285156, -0.008161544799804688, -0.006930351257324219, -0.00569915771484375, -0.004467964172363281, -0.0032367706298828125, -0.0020055770874023438, -0.000774383544921875, 0.00045680999755859375, 0.0016880035400390625, 0.0029191970825195312, 0.004150390625, 0.005381584167480469, 0.0066127777099609375, 0.007843971252441406, 0.009075164794921875, 0.010306358337402344, 0.011537551879882812, 0.012768745422363281, 0.01399993896484375, 0.015231132507324219, 0.016462326049804688, 0.017693519592285156, 0.018924713134765625, 0.020155906677246094, 0.021387100219726562, 0.02261829376220703, 0.0238494873046875, 0.02508068084716797, 0.026311874389648438, 0.027543067932128906, 0.028774261474609375, 0.030005455017089844, 0.031236648559570312, 0.03246784210205078, 0.03369903564453125, 0.03493022918701172, 0.03616142272949219, 0.037392616271972656, 0.038623809814453125, 0.039855003356933594, 0.04108619689941406, 0.04231739044189453, 0.043548583984375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 6.0, 9.0, 5.0, 10.0, 11.0, 14.0, 12.0, 29.0, 29.0, 43.0, 44.0, 60.0, 71.0, 79.0, 80.0, 85.0, 89.0, 67.0, 64.0, 41.0, 33.0, 27.0, 15.0, 16.0, 6.0, 13.0, 7.0, 8.0, 1.0, 7.0, 5.0, 3.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9729137420654297e-05, -1.9126571714878082e-05, -1.8524006009101868e-05, -1.7921440303325653e-05, -1.731887459754944e-05, -1.6716308891773224e-05, -1.611374318599701e-05, -1.5511177480220795e-05, -1.490861177444458e-05, -1.4306046068668365e-05, -1.3703480362892151e-05, -1.3100914657115936e-05, -1.2498348951339722e-05, -1.1895783245563507e-05, -1.1293217539787292e-05, -1.0690651834011078e-05, -1.0088086128234863e-05, -9.485520422458649e-06, -8.882954716682434e-06, -8.28038901090622e-06, -7.677823305130005e-06, -7.07525759935379e-06, -6.472691893577576e-06, -5.870126187801361e-06, -5.2675604820251465e-06, -4.664994776248932e-06, -4.062429070472717e-06, -3.4598633646965027e-06, -2.857297658920288e-06, -2.2547319531440735e-06, -1.6521662473678589e-06, -1.0496005415916443e-06, -4.470348358154297e-07, 1.555308699607849e-07, 7.580965757369995e-07, 1.3606622815132141e-06, 1.9632279872894287e-06, 2.5657936930656433e-06, 3.168359398841858e-06, 3.7709251046180725e-06, 4.373490810394287e-06, 4.976056516170502e-06, 5.578622221946716e-06, 6.181187927722931e-06, 6.7837536334991455e-06, 7.38631933927536e-06, 7.988885045051575e-06, 8.59145075082779e-06, 9.194016456604004e-06, 9.796582162380219e-06, 1.0399147868156433e-05, 1.1001713573932648e-05, 1.1604279279708862e-05, 1.2206844985485077e-05, 1.2809410691261292e-05, 1.3411976397037506e-05, 1.401454210281372e-05, 1.4617107808589935e-05, 1.521967351436615e-05, 1.5822239220142365e-05, 1.642480492591858e-05, 1.7027370631694794e-05, 1.7629936337471008e-05, 1.8232502043247223e-05, 1.8835067749023438e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 9.0, 11.0, 18.0, 9.0, 20.0, 26.0, 37.0, 76.0, 109.0, 157.0, 315.0, 661.0, 1418.0, 3677.0, 10345.0, 33034.0, 122139.0, 414254.0, 334197.0, 89139.0, 25420.0, 8067.0, 2901.0, 1216.0, 576.0, 297.0, 153.0, 92.0, 59.0, 40.0, 32.0, 18.0, 8.0, 12.0, 6.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037994384765625, -0.03676414489746094, -0.035533905029296875, -0.03430366516113281, -0.03307342529296875, -0.03184318542480469, -0.030612945556640625, -0.029382705688476562, -0.0281524658203125, -0.026922225952148438, -0.025691986083984375, -0.024461746215820312, -0.02323150634765625, -0.022001266479492188, -0.020771026611328125, -0.019540786743164062, -0.018310546875, -0.017080307006835938, -0.015850067138671875, -0.014619827270507812, -0.01338958740234375, -0.012159347534179688, -0.010929107666015625, -0.009698867797851562, -0.0084686279296875, -0.0072383880615234375, -0.006008148193359375, -0.0047779083251953125, -0.00354766845703125, -0.0023174285888671875, -0.001087188720703125, 0.0001430511474609375, 0.001373291015625, 0.0026035308837890625, 0.003833770751953125, 0.0050640106201171875, 0.00629425048828125, 0.0075244903564453125, 0.008754730224609375, 0.009984970092773438, 0.0112152099609375, 0.012445449829101562, 0.013675689697265625, 0.014905929565429688, 0.01613616943359375, 0.017366409301757812, 0.018596649169921875, 0.019826889038085938, 0.02105712890625, 0.022287368774414062, 0.023517608642578125, 0.024747848510742188, 0.02597808837890625, 0.027208328247070312, 0.028438568115234375, 0.029668807983398438, 0.0308990478515625, 0.03212928771972656, 0.033359527587890625, 0.03458976745605469, 0.03582000732421875, 0.03705024719238281, 0.038280487060546875, 0.03951072692871094, 0.040740966796875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 2.0, 2.0, 6.0, 6.0, 4.0, 12.0, 9.0, 14.0, 12.0, 13.0, 20.0, 25.0, 22.0, 24.0, 28.0, 41.0, 40.0, 32.0, 52.0, 45.0, 54.0, 57.0, 46.0, 54.0, 50.0, 39.0, 38.0, 36.0, 30.0, 34.0, 19.0, 35.0, 18.0, 22.0, 12.0, 6.0, 8.0, 8.0, 8.0, 8.0, 4.0, 5.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005889892578125, -0.0056498050689697266, -0.005409717559814453, -0.00516963005065918, -0.004929542541503906, -0.004689455032348633, -0.004449367523193359, -0.004209280014038086, -0.0039691925048828125, -0.003729104995727539, -0.0034890174865722656, -0.003248929977416992, -0.0030088424682617188, -0.0027687549591064453, -0.002528667449951172, -0.0022885799407958984, -0.002048492431640625, -0.0018084049224853516, -0.0015683174133300781, -0.0013282299041748047, -0.0010881423950195312, -0.0008480548858642578, -0.0006079673767089844, -0.00036787986755371094, -0.0001277923583984375, 0.00011229515075683594, 0.0003523826599121094, 0.0005924701690673828, 0.0008325576782226562, 0.0010726451873779297, 0.0013127326965332031, 0.0015528202056884766, 0.00179290771484375, 0.0020329952239990234, 0.002273082733154297, 0.0025131702423095703, 0.0027532577514648438, 0.002993345260620117, 0.0032334327697753906, 0.003473520278930664, 0.0037136077880859375, 0.003953695297241211, 0.004193782806396484, 0.004433870315551758, 0.004673957824707031, 0.004914045333862305, 0.005154132843017578, 0.0053942203521728516, 0.005634307861328125, 0.0058743953704833984, 0.006114482879638672, 0.006354570388793945, 0.006594657897949219, 0.006834745407104492, 0.007074832916259766, 0.007314920425415039, 0.0075550079345703125, 0.007795095443725586, 0.00803518295288086, 0.008275270462036133, 0.008515357971191406, 0.00875544548034668, 0.008995532989501953, 0.009235620498657227, 0.0094757080078125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 7.0, 9.0, 136.0, 629.0, 209.0, 23.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.817451536655426, -0.6943567991256714, -0.5712620615959167, -0.4481672942638397, -0.3250725567340851, -0.20197778940200806, -0.07888305187225342, 0.04421168565750122, 0.16730642318725586, 0.2904011607170105, 0.41349589824676514, 0.5365906953811646, 0.6596853733062744, 0.7827801704406738, 0.9058749079704285, 1.028969645500183, 1.152064323425293, 1.2751591205596924, 1.3982537984848022, 1.5213485956192017, 1.6444432735443115, 1.767538070678711, 1.8906328678131104, 2.0137276649475098, 2.13682222366333, 2.2599170207977295, 2.383011817932129, 2.506106376647949, 2.6292011737823486, 2.752295970916748, 2.8753907680511475, 2.998485565185547, 3.1215803623199463, 3.2446751594543457, 3.367769956588745, 3.4908645153045654, 3.613959312438965, 3.7370541095733643, 3.8601489067077637, 3.983243465423584, 4.1063385009765625, 4.229433059692383, 4.352528095245361, 4.475622653961182, 4.59871768951416, 4.7218122482299805, 4.844906806945801, 4.968001842498779, 5.0910964012146, 5.21419095993042, 5.337285995483398, 5.460380554199219, 5.583475589752197, 5.706570148468018, 5.829664707183838, 5.952759742736816, 6.075854301452637, 6.198948860168457, 6.3220438957214355, 6.445138454437256, 6.568233489990234, 6.691328048706055, 6.814422607421875, 6.9375176429748535, 7.060612201690674]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 10.0, 8.0, 14.0, 13.0, 29.0, 34.0, 46.0, 45.0, 70.0, 59.0, 84.0, 87.0, 95.0, 76.0, 65.0, 59.0, 52.0, 56.0, 37.0, 22.0, 13.0, 12.0, 6.0, 8.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7214376330375671, -0.700748860836029, -0.6800601482391357, -0.6593713760375977, -0.6386826038360596, -0.6179938912391663, -0.5973051190376282, -0.5766164064407349, -0.5559276342391968, -0.5352388620376587, -0.5145501494407654, -0.4938613772392273, -0.4731726348400116, -0.4524838924407959, -0.4317951202392578, -0.4111063778400421, -0.3904176354408264, -0.3697288930416107, -0.349040150642395, -0.32835137844085693, -0.30766263604164124, -0.28697389364242554, -0.26628512144088745, -0.24559637904167175, -0.22490763664245605, -0.20421889424324036, -0.18353013694286346, -0.16284137964248657, -0.14215263724327087, -0.12146388739347458, -0.10077513754367828, -0.08008638024330139, -0.05939757823944092, -0.03870882838964462, -0.018020078539848328, 0.0026686713099479675, 0.023357421159744263, 0.04404617100954056, 0.06473492085933685, 0.08542367815971375, 0.10611242055892944, 0.12680116295814514, 0.14748992025852203, 0.16817867755889893, 0.18886741995811462, 0.20955616235733032, 0.23024491965770721, 0.2509336769580841, 0.2716224193572998, 0.2923111617565155, 0.3129999041557312, 0.3336886763572693, 0.354377418756485, 0.3750661611557007, 0.39575493335723877, 0.41644367575645447, 0.43713241815567017, 0.45782116055488586, 0.47850990295410156, 0.49919867515563965, 0.5198874473571777, 0.540576159954071, 0.5612649321556091, 0.5819536447525024, 0.6026424169540405]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 1.0, 5.0, 6.0, 8.0, 9.0, 23.0, 40.0, 40.0, 62.0, 115.0, 154.0, 305.0, 537.0, 1043.0, 2063.0, 4408.0, 10267.0, 28611.0, 105765.0, 467628.0, 322866.0, 69141.0, 20541.0, 7810.0, 3511.0, 1611.0, 862.0, 468.0, 268.0, 141.0, 84.0, 49.0, 40.0, 26.0, 17.0, 8.0, 8.0, 4.0, 0.0, 4.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.5224609375, -0.5060577392578125, -0.489654541015625, -0.4732513427734375, -0.45684814453125, -0.4404449462890625, -0.424041748046875, -0.4076385498046875, -0.3912353515625, -0.3748321533203125, -0.358428955078125, -0.3420257568359375, -0.32562255859375, -0.3092193603515625, -0.292816162109375, -0.2764129638671875, -0.260009765625, -0.2436065673828125, -0.227203369140625, -0.2108001708984375, -0.19439697265625, -0.1779937744140625, -0.161590576171875, -0.1451873779296875, -0.1287841796875, -0.1123809814453125, -0.095977783203125, -0.0795745849609375, -0.06317138671875, -0.0467681884765625, -0.030364990234375, -0.0139617919921875, 0.00244140625, 0.0188446044921875, 0.035247802734375, 0.0516510009765625, 0.06805419921875, 0.0844573974609375, 0.100860595703125, 0.1172637939453125, 0.1336669921875, 0.1500701904296875, 0.166473388671875, 0.1828765869140625, 0.19927978515625, 0.2156829833984375, 0.232086181640625, 0.2484893798828125, 0.264892578125, 0.2812957763671875, 0.297698974609375, 0.3141021728515625, 0.33050537109375, 0.3469085693359375, 0.363311767578125, 0.3797149658203125, 0.3961181640625, 0.4125213623046875, 0.428924560546875, 0.4453277587890625, 0.46173095703125, 0.4781341552734375, 0.494537353515625, 0.5109405517578125, 0.52734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 6.0, 5.0, 14.0, 10.0, 12.0, 15.0, 24.0, 22.0, 25.0, 23.0, 36.0, 36.0, 41.0, 45.0, 52.0, 57.0, 57.0, 47.0, 61.0, 45.0, 46.0, 41.0, 40.0, 36.0, 28.0, 32.0, 30.0, 26.0, 21.0, 15.0, 18.0, 3.0, 6.0, 6.0, 4.0, 4.0, 2.0, 5.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6865234375, -0.6639404296875, -0.641357421875, -0.6187744140625, -0.59619140625, -0.5736083984375, -0.551025390625, -0.5284423828125, -0.505859375, -0.4832763671875, -0.460693359375, -0.4381103515625, -0.41552734375, -0.3929443359375, -0.370361328125, -0.3477783203125, -0.3251953125, -0.3026123046875, -0.280029296875, -0.2574462890625, -0.23486328125, -0.2122802734375, -0.189697265625, -0.1671142578125, -0.14453125, -0.1219482421875, -0.099365234375, -0.0767822265625, -0.05419921875, -0.0316162109375, -0.009033203125, 0.0135498046875, 0.0361328125, 0.0587158203125, 0.081298828125, 0.1038818359375, 0.12646484375, 0.1490478515625, 0.171630859375, 0.1942138671875, 0.216796875, 0.2393798828125, 0.261962890625, 0.2845458984375, 0.30712890625, 0.3297119140625, 0.352294921875, 0.3748779296875, 0.3974609375, 0.4200439453125, 0.442626953125, 0.4652099609375, 0.48779296875, 0.5103759765625, 0.532958984375, 0.5555419921875, 0.578125, 0.6007080078125, 0.623291015625, 0.6458740234375, 0.66845703125, 0.6910400390625, 0.713623046875, 0.7362060546875, 0.7587890625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 11.0, 7.0, 17.0, 19.0, 31.0, 27.0, 42.0, 51.0, 57.0, 75.0, 108.0, 149.0, 210.0, 369.0, 798.0, 2357.0, 9494.0, 72195.0, 810344.0, 132982.0, 13752.0, 3160.0, 997.0, 421.0, 228.0, 161.0, 112.0, 81.0, 68.0, 47.0, 37.0, 25.0, 30.0, 20.0, 19.0, 11.0, 8.0, 9.0, 9.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0263671875, -0.9958267211914062, -0.9652862548828125, -0.9347457885742188, -0.904205322265625, -0.8736648559570312, -0.8431243896484375, -0.8125839233398438, -0.78204345703125, -0.7515029907226562, -0.7209625244140625, -0.6904220581054688, -0.659881591796875, -0.6293411254882812, -0.5988006591796875, -0.5682601928710938, -0.5377197265625, -0.5071792602539062, -0.4766387939453125, -0.44609832763671875, -0.415557861328125, -0.38501739501953125, -0.3544769287109375, -0.32393646240234375, -0.29339599609375, -0.26285552978515625, -0.2323150634765625, -0.20177459716796875, -0.171234130859375, -0.14069366455078125, -0.1101531982421875, -0.07961273193359375, -0.049072265625, -0.01853179931640625, 0.0120086669921875, 0.04254913330078125, 0.073089599609375, 0.10363006591796875, 0.1341705322265625, 0.16471099853515625, 0.19525146484375, 0.22579193115234375, 0.2563323974609375, 0.28687286376953125, 0.317413330078125, 0.34795379638671875, 0.3784942626953125, 0.40903472900390625, 0.4395751953125, 0.47011566162109375, 0.5006561279296875, 0.5311965942382812, 0.561737060546875, 0.5922775268554688, 0.6228179931640625, 0.6533584594726562, 0.68389892578125, 0.7144393920898438, 0.7449798583984375, 0.7755203247070312, 0.806060791015625, 0.8366012573242188, 0.8671417236328125, 0.8976821899414062, 0.92822265625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 6.0, 10.0, 21.0, 15.0, 14.0, 16.0, 31.0, 21.0, 24.0, 22.0, 27.0, 30.0, 31.0, 43.0, 42.0, 45.0, 39.0, 38.0, 38.0, 33.0, 36.0, 39.0, 32.0, 35.0, 43.0, 39.0, 34.0, 27.0, 19.0, 21.0, 19.0, 22.0, 13.0, 11.0, 11.0, 10.0, 9.0, 13.0, 9.0, 3.0, 1.0, 1.0, 3.0, 0.0, 5.0, 1.0, 1.0, 1.0], "bins": [-0.6552734375, -0.6362380981445312, -0.6172027587890625, -0.5981674194335938, -0.579132080078125, -0.5600967407226562, -0.5410614013671875, -0.5220260620117188, -0.50299072265625, -0.48395538330078125, -0.4649200439453125, -0.44588470458984375, -0.426849365234375, -0.40781402587890625, -0.3887786865234375, -0.36974334716796875, -0.3507080078125, -0.33167266845703125, -0.3126373291015625, -0.29360198974609375, -0.274566650390625, -0.25553131103515625, -0.2364959716796875, -0.21746063232421875, -0.19842529296875, -0.17938995361328125, -0.1603546142578125, -0.14131927490234375, -0.122283935546875, -0.10324859619140625, -0.0842132568359375, -0.06517791748046875, -0.046142578125, -0.02710723876953125, -0.0080718994140625, 0.01096343994140625, 0.029998779296875, 0.04903411865234375, 0.0680694580078125, 0.08710479736328125, 0.10614013671875, 0.12517547607421875, 0.1442108154296875, 0.16324615478515625, 0.182281494140625, 0.20131683349609375, 0.2203521728515625, 0.23938751220703125, 0.2584228515625, 0.27745819091796875, 0.2964935302734375, 0.31552886962890625, 0.334564208984375, 0.35359954833984375, 0.3726348876953125, 0.39167022705078125, 0.41070556640625, 0.42974090576171875, 0.4487762451171875, 0.46781158447265625, 0.486846923828125, 0.5058822631835938, 0.5249176025390625, 0.5439529418945312, 0.56298828125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 8.0, 7.0, 16.0, 22.0, 40.0, 74.0, 160.0, 326.0, 748.0, 2194.0, 9248.0, 89825.0, 883259.0, 52675.0, 6923.0, 1837.0, 613.0, 272.0, 148.0, 75.0, 35.0, 22.0, 13.0, 9.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5634765625, -0.5495338439941406, -0.5355911254882812, -0.5216484069824219, -0.5077056884765625, -0.4937629699707031, -0.47982025146484375, -0.4658775329589844, -0.451934814453125, -0.4379920959472656, -0.42404937744140625, -0.4101066589355469, -0.3961639404296875, -0.3822212219238281, -0.36827850341796875, -0.3543357849121094, -0.34039306640625, -0.3264503479003906, -0.31250762939453125, -0.2985649108886719, -0.2846221923828125, -0.2706794738769531, -0.25673675537109375, -0.24279403686523438, -0.228851318359375, -0.21490859985351562, -0.20096588134765625, -0.18702316284179688, -0.1730804443359375, -0.15913772583007812, -0.14519500732421875, -0.13125228881835938, -0.1173095703125, -0.10336685180664062, -0.08942413330078125, -0.07548141479492188, -0.0615386962890625, -0.047595977783203125, -0.03365325927734375, -0.019710540771484375, -0.005767822265625, 0.008174896240234375, 0.02211761474609375, 0.036060333251953125, 0.0500030517578125, 0.06394577026367188, 0.07788848876953125, 0.09183120727539062, 0.10577392578125, 0.11971664428710938, 0.13365936279296875, 0.14760208129882812, 0.1615447998046875, 0.17548751831054688, 0.18943023681640625, 0.20337295532226562, 0.217315673828125, 0.23125839233398438, 0.24520111083984375, 0.2591438293457031, 0.2730865478515625, 0.2870292663574219, 0.30097198486328125, 0.3149147033691406, 0.328857421875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 8.0, 16.0, 26.0, 49.0, 80.0, 183.0, 245.0, 209.0, 85.0, 47.0, 10.0, 15.0, 4.0, 7.0, 8.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8995018005371094e-05, -4.672631621360779e-05, -4.445761442184448e-05, -4.218891263008118e-05, -3.992021083831787e-05, -3.7651509046554565e-05, -3.538280725479126e-05, -3.3114105463027954e-05, -3.084540367126465e-05, -2.8576701879501343e-05, -2.6308000087738037e-05, -2.403929829597473e-05, -2.1770596504211426e-05, -1.950189471244812e-05, -1.7233192920684814e-05, -1.4964491128921509e-05, -1.2695789337158203e-05, -1.0427087545394897e-05, -8.158385753631592e-06, -5.889683961868286e-06, -3.6209821701049805e-06, -1.3522803783416748e-06, 9.164214134216309e-07, 3.1851232051849365e-06, 5.453824996948242e-06, 7.722526788711548e-06, 9.991228580474854e-06, 1.225993037223816e-05, 1.4528632164001465e-05, 1.679733395576477e-05, 1.9066035747528076e-05, 2.1334737539291382e-05, 2.3603439331054688e-05, 2.5872141122817993e-05, 2.81408429145813e-05, 3.0409544706344604e-05, 3.267824649810791e-05, 3.4946948289871216e-05, 3.721565008163452e-05, 3.948435187339783e-05, 4.175305366516113e-05, 4.402175545692444e-05, 4.6290457248687744e-05, 4.855915904045105e-05, 5.0827860832214355e-05, 5.309656262397766e-05, 5.536526441574097e-05, 5.763396620750427e-05, 5.990266799926758e-05, 6.217136979103088e-05, 6.444007158279419e-05, 6.67087733745575e-05, 6.89774751663208e-05, 7.12461769580841e-05, 7.351487874984741e-05, 7.578358054161072e-05, 7.805228233337402e-05, 8.032098412513733e-05, 8.258968591690063e-05, 8.485838770866394e-05, 8.712708950042725e-05, 8.939579129219055e-05, 9.166449308395386e-05, 9.393319487571716e-05, 9.620189666748047e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 5.0, 6.0, 5.0, 8.0, 13.0, 14.0, 27.0, 48.0, 87.0, 274.0, 729.0, 2917.0, 20946.0, 806946.0, 204852.0, 9143.0, 1656.0, 486.0, 192.0, 80.0, 42.0, 30.0, 14.0, 11.0, 12.0, 6.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.324951171875, -0.3093452453613281, -0.29373931884765625, -0.2781333923339844, -0.2625274658203125, -0.24692153930664062, -0.23131561279296875, -0.21570968627929688, -0.200103759765625, -0.18449783325195312, -0.16889190673828125, -0.15328598022460938, -0.1376800537109375, -0.12207412719726562, -0.10646820068359375, -0.09086227416992188, -0.07525634765625, -0.059650421142578125, -0.04404449462890625, -0.028438568115234375, -0.0128326416015625, 0.002773284912109375, 0.01837921142578125, 0.033985137939453125, 0.049591064453125, 0.06519699096679688, 0.08080291748046875, 0.09640884399414062, 0.1120147705078125, 0.12762069702148438, 0.14322662353515625, 0.15883255004882812, 0.1744384765625, 0.19004440307617188, 0.20565032958984375, 0.22125625610351562, 0.2368621826171875, 0.2524681091308594, 0.26807403564453125, 0.2836799621582031, 0.299285888671875, 0.3148918151855469, 0.33049774169921875, 0.3461036682128906, 0.3617095947265625, 0.3773155212402344, 0.39292144775390625, 0.4085273742675781, 0.42413330078125, 0.4397392272949219, 0.45534515380859375, 0.4709510803222656, 0.4865570068359375, 0.5021629333496094, 0.5177688598632812, 0.5333747863769531, 0.548980712890625, 0.5645866394042969, 0.5801925659179688, 0.5957984924316406, 0.6114044189453125, 0.6270103454589844, 0.6426162719726562, 0.6582221984863281, 0.673828125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 7.0, 3.0, 5.0, 8.0, 18.0, 13.0, 14.0, 34.0, 65.0, 57.0, 99.0, 116.0, 103.0, 109.0, 95.0, 79.0, 42.0, 40.0, 26.0, 18.0, 11.0, 4.0, 7.0, 9.0, 7.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.146728515625, -0.1432971954345703, -0.13986587524414062, -0.13643455505371094, -0.13300323486328125, -0.12957191467285156, -0.12614059448242188, -0.12270927429199219, -0.1192779541015625, -0.11584663391113281, -0.11241531372070312, -0.10898399353027344, -0.10555267333984375, -0.10212135314941406, -0.09869003295898438, -0.09525871276855469, -0.091827392578125, -0.08839607238769531, -0.08496475219726562, -0.08153343200683594, -0.07810211181640625, -0.07467079162597656, -0.07123947143554688, -0.06780815124511719, -0.0643768310546875, -0.06094551086425781, -0.057514190673828125, -0.05408287048339844, -0.05065155029296875, -0.04722023010253906, -0.043788909912109375, -0.04035758972167969, -0.03692626953125, -0.03349494934082031, -0.030063629150390625, -0.026632308959960938, -0.02320098876953125, -0.019769668579101562, -0.016338348388671875, -0.012907028198242188, -0.0094757080078125, -0.0060443878173828125, -0.002613067626953125, 0.0008182525634765625, 0.00424957275390625, 0.0076808929443359375, 0.011112213134765625, 0.014543533325195312, 0.017974853515625, 0.021406173706054688, 0.024837493896484375, 0.028268814086914062, 0.03170013427734375, 0.03513145446777344, 0.038562774658203125, 0.04199409484863281, 0.0454254150390625, 0.04885673522949219, 0.052288055419921875, 0.05571937561035156, 0.05915069580078125, 0.06258201599121094, 0.06601333618164062, 0.06944465637207031, 0.0728759765625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 12.0, 22.0, 42.0, 49.0, 90.0, 129.0, 173.0, 165.0, 114.0, 67.0, 57.0, 32.0, 18.0, 9.0, 10.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4202715158462524, -1.3635207414627075, -1.306769847869873, -1.2500190734863281, -1.1932682991027832, -1.1365175247192383, -1.0797667503356934, -1.0230158567428589, -0.966265082359314, -0.909514307975769, -0.8527634739875793, -0.7960126399993896, -0.7392618656158447, -0.6825110912322998, -0.6257602572441101, -0.5690094232559204, -0.5122586488723755, -0.4555078446865082, -0.39875704050064087, -0.34200623631477356, -0.28525543212890625, -0.22850462794303894, -0.17175382375717163, -0.11500301957130432, -0.05825221538543701, -0.0015014111995697021, 0.05524939298629761, 0.11200019717216492, 0.16875100135803223, 0.22550180554389954, 0.28225260972976685, 0.33900341391563416, 0.395754337310791, 0.4525051414966583, 0.5092559456825256, 0.5660067796707153, 0.6227575540542603, 0.6795083284378052, 0.7362591624259949, 0.7930099964141846, 0.8497607707977295, 0.9065115451812744, 0.9632623791694641, 1.0200132131576538, 1.0767639875411987, 1.1335147619247437, 1.1902656555175781, 1.247016429901123, 1.303767204284668, 1.360517978668213, 1.4172687530517578, 1.4740196466445923, 1.5307704210281372, 1.5875211954116821, 1.6442720890045166, 1.7010228633880615, 1.7577736377716064, 1.8145244121551514, 1.8712751865386963, 1.9280260801315308, 1.9847768545150757, 2.04152774810791, 2.098278522491455, 2.155029296875, 2.211780071258545]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 5.0, 4.0, 9.0, 8.0, 12.0, 9.0, 16.0, 21.0, 30.0, 26.0, 25.0, 24.0, 37.0, 38.0, 47.0, 53.0, 38.0, 43.0, 49.0, 39.0, 61.0, 49.0, 43.0, 44.0, 37.0, 35.0, 31.0, 28.0, 24.0, 20.0, 21.0, 18.0, 9.0, 15.0, 8.0, 10.0, 6.0, 4.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2263832092285156, -1.1879488229751587, -1.1495144367218018, -1.1110800504684448, -1.072645664215088, -1.034211277961731, -0.995776891708374, -0.9573425054550171, -0.9189081192016602, -0.8804737329483032, -0.8420393466949463, -0.8036049604415894, -0.7651705741882324, -0.7267361879348755, -0.6883018016815186, -0.6498674154281616, -0.6114329695701599, -0.572998583316803, -0.534564197063446, -0.4961298108100891, -0.4576954245567322, -0.41926103830337524, -0.3808266222476959, -0.342392235994339, -0.30395784974098206, -0.2655234634876251, -0.2270890772342682, -0.18865467607975006, -0.15022028982639313, -0.1117859035730362, -0.07335150241851807, -0.03491711616516113, 0.0035172700881958008, 0.04195166006684303, 0.08038605004549026, 0.1188204437494278, 0.15725483000278473, 0.19568921625614166, 0.2341236174106598, 0.2725580036640167, 0.31099238991737366, 0.3494267761707306, 0.3878611624240875, 0.42629557847976685, 0.4647299647331238, 0.5031643509864807, 0.5415987372398376, 0.5800331234931946, 0.6184675097465515, 0.6569018959999084, 0.6953362822532654, 0.7337706685066223, 0.7722050547599792, 0.8106394410133362, 0.8490738868713379, 0.8875082731246948, 0.9259426593780518, 0.9643770456314087, 1.0028114318847656, 1.0412458181381226, 1.0796802043914795, 1.1181145906448364, 1.1565489768981934, 1.1949833631515503, 1.2334177494049072]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 6.0, 6.0, 11.0, 7.0, 15.0, 31.0, 49.0, 94.0, 130.0, 427.0, 1663.0, 11939.0, 1704246.0, 2460075.0, 13086.0, 1722.0, 409.0, 143.0, 68.0, 44.0, 27.0, 15.0, 13.0, 12.0, 6.0, 4.0, 6.0, 1.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.40234375, -2.322357177734375, -2.24237060546875, -2.162384033203125, -2.0823974609375, -2.002410888671875, -1.92242431640625, -1.842437744140625, -1.762451171875, -1.682464599609375, -1.60247802734375, -1.522491455078125, -1.4425048828125, -1.362518310546875, -1.28253173828125, -1.202545166015625, -1.12255859375, -1.042572021484375, -0.96258544921875, -0.882598876953125, -0.8026123046875, -0.722625732421875, -0.64263916015625, -0.562652587890625, -0.482666015625, -0.402679443359375, -0.32269287109375, -0.242706298828125, -0.1627197265625, -0.082733154296875, -0.00274658203125, 0.077239990234375, 0.1572265625, 0.237213134765625, 0.31719970703125, 0.397186279296875, 0.4771728515625, 0.557159423828125, 0.63714599609375, 0.717132568359375, 0.797119140625, 0.877105712890625, 0.95709228515625, 1.037078857421875, 1.1170654296875, 1.197052001953125, 1.27703857421875, 1.357025146484375, 1.43701171875, 1.516998291015625, 1.59698486328125, 1.676971435546875, 1.7569580078125, 1.836944580078125, 1.91693115234375, 1.996917724609375, 2.076904296875, 2.156890869140625, 2.23687744140625, 2.316864013671875, 2.3968505859375, 2.476837158203125, 2.55682373046875, 2.636810302734375, 2.716796875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 9.0, 10.0, 8.0, 17.0, 19.0, 21.0, 30.0, 24.0, 36.0, 40.0, 55.0, 36.0, 70.0, 69.0, 73.0, 54.0, 78.0, 56.0, 48.0, 38.0, 42.0, 44.0, 40.0, 28.0, 18.0, 13.0, 12.0, 2.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51708984375, -0.49542999267578125, -0.4737701416015625, -0.45211029052734375, -0.430450439453125, -0.40879058837890625, -0.3871307373046875, -0.36547088623046875, -0.34381103515625, -0.32215118408203125, -0.3004913330078125, -0.27883148193359375, -0.257171630859375, -0.23551177978515625, -0.2138519287109375, -0.19219207763671875, -0.1705322265625, -0.14887237548828125, -0.1272125244140625, -0.10555267333984375, -0.083892822265625, -0.06223297119140625, -0.0405731201171875, -0.01891326904296875, 0.00274658203125, 0.02440643310546875, 0.0460662841796875, 0.06772613525390625, 0.089385986328125, 0.11104583740234375, 0.1327056884765625, 0.15436553955078125, 0.176025390625, 0.19768524169921875, 0.2193450927734375, 0.24100494384765625, 0.262664794921875, 0.28432464599609375, 0.3059844970703125, 0.32764434814453125, 0.34930419921875, 0.37096405029296875, 0.3926239013671875, 0.41428375244140625, 0.435943603515625, 0.45760345458984375, 0.4792633056640625, 0.5009231567382812, 0.5225830078125, 0.5442428588867188, 0.5659027099609375, 0.5875625610351562, 0.609222412109375, 0.6308822631835938, 0.6525421142578125, 0.6742019653320312, 0.69586181640625, 0.7175216674804688, 0.7391815185546875, 0.7608413696289062, 0.782501220703125, 0.8041610717773438, 0.8258209228515625, 0.8474807739257812, 0.869140625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 7.0, 6.0, 8.0, 5.0, 29.0, 32.0, 41.0, 78.0, 151.0, 245.0, 522.0, 1201.0, 3366.0, 14090.0, 120907.0, 3619734.0, 398244.0, 26941.0, 5451.0, 1667.0, 741.0, 323.0, 197.0, 97.0, 71.0, 43.0, 26.0, 17.0, 12.0, 10.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 5.0, 2.0], "bins": [-1.353515625, -1.3210372924804688, -1.2885589599609375, -1.2560806274414062, -1.223602294921875, -1.1911239624023438, -1.1586456298828125, -1.1261672973632812, -1.09368896484375, -1.0612106323242188, -1.0287322998046875, -0.9962539672851562, -0.963775634765625, -0.9312973022460938, -0.8988189697265625, -0.8663406372070312, -0.8338623046875, -0.8013839721679688, -0.7689056396484375, -0.7364273071289062, -0.703948974609375, -0.6714706420898438, -0.6389923095703125, -0.6065139770507812, -0.57403564453125, -0.5415573120117188, -0.5090789794921875, -0.47660064697265625, -0.444122314453125, -0.41164398193359375, -0.3791656494140625, -0.34668731689453125, -0.314208984375, -0.28173065185546875, -0.2492523193359375, -0.21677398681640625, -0.184295654296875, -0.15181732177734375, -0.1193389892578125, -0.08686065673828125, -0.05438232421875, -0.02190399169921875, 0.0105743408203125, 0.04305267333984375, 0.075531005859375, 0.10800933837890625, 0.1404876708984375, 0.17296600341796875, 0.2054443359375, 0.23792266845703125, 0.2704010009765625, 0.30287933349609375, 0.335357666015625, 0.36783599853515625, 0.4003143310546875, 0.43279266357421875, 0.46527099609375, 0.49774932861328125, 0.5302276611328125, 0.5627059936523438, 0.595184326171875, 0.6276626586914062, 0.6601409912109375, 0.6926193237304688, 0.72509765625]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 10.0, 8.0, 10.0, 12.0, 12.0, 26.0, 35.0, 44.0, 61.0, 78.0, 124.0, 205.0, 330.0, 509.0, 672.0, 594.0, 459.0, 345.0, 166.0, 107.0, 57.0, 63.0, 37.0, 32.0, 20.0, 13.0, 12.0, 5.0, 5.0, 5.0, 6.0, 6.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2467041015625, -0.24019622802734375, -0.2336883544921875, -0.22718048095703125, -0.220672607421875, -0.21416473388671875, -0.2076568603515625, -0.20114898681640625, -0.19464111328125, -0.18813323974609375, -0.1816253662109375, -0.17511749267578125, -0.168609619140625, -0.16210174560546875, -0.1555938720703125, -0.14908599853515625, -0.142578125, -0.13607025146484375, -0.1295623779296875, -0.12305450439453125, -0.116546630859375, -0.11003875732421875, -0.1035308837890625, -0.09702301025390625, -0.09051513671875, -0.08400726318359375, -0.0774993896484375, -0.07099151611328125, -0.064483642578125, -0.05797576904296875, -0.0514678955078125, -0.04496002197265625, -0.0384521484375, -0.03194427490234375, -0.0254364013671875, -0.01892852783203125, -0.012420654296875, -0.00591278076171875, 0.0005950927734375, 0.00710296630859375, 0.01361083984375, 0.02011871337890625, 0.0266265869140625, 0.03313446044921875, 0.039642333984375, 0.04615020751953125, 0.0526580810546875, 0.05916595458984375, 0.065673828125, 0.07218170166015625, 0.0786895751953125, 0.08519744873046875, 0.091705322265625, 0.09821319580078125, 0.1047210693359375, 0.11122894287109375, 0.11773681640625, 0.12424468994140625, 0.1307525634765625, 0.13726043701171875, 0.143768310546875, 0.15027618408203125, 0.1567840576171875, 0.16329193115234375, 0.1697998046875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 15.0, 6.0, 23.0, 51.0, 104.0, 136.0, 213.0, 193.0, 100.0, 79.0, 36.0, 20.0, 17.0, 9.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9311900734901428, -0.8792020082473755, -0.8272139430046082, -0.7752258777618408, -0.7232378125190735, -0.6712497472763062, -0.6192616820335388, -0.5672736167907715, -0.5152855515480042, -0.4632974863052368, -0.4113094210624695, -0.35932135581970215, -0.3073332905769348, -0.2553452253341675, -0.20335716009140015, -0.1513690948486328, -0.09938102960586548, -0.047392964363098145, 0.0045951008796691895, 0.05658316612243652, 0.10857123136520386, 0.1605592966079712, 0.21254736185073853, 0.26453542709350586, 0.3165234923362732, 0.3685115575790405, 0.42049962282180786, 0.4724876880645752, 0.5244757533073425, 0.5764638185501099, 0.6284518837928772, 0.6804399490356445, 0.7324280738830566, 0.784416139125824, 0.8364042043685913, 0.8883922696113586, 0.940380334854126, 0.9923684000968933, 1.0443564653396606, 1.0963444709777832, 1.1483325958251953, 1.2003207206726074, 1.25230872631073, 1.3042967319488525, 1.3562848567962646, 1.4082729816436768, 1.4602609872817993, 1.5122489929199219, 1.564237117767334, 1.616225242614746, 1.6682132482528687, 1.7202012538909912, 1.7721893787384033, 1.8241775035858154, 1.876165509223938, 1.9281535148620605, 1.9801416397094727, 2.0321297645568848, 2.084117889404297, 2.13610577583313, 2.188093900680542, 2.240082025527954, 2.292069911956787, 2.344058036804199, 2.3960461616516113]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 14.0, 11.0, 15.0, 25.0, 15.0, 24.0, 26.0, 30.0, 33.0, 42.0, 43.0, 60.0, 49.0, 75.0, 44.0, 58.0, 50.0, 61.0, 50.0, 50.0, 38.0, 38.0, 40.0, 26.0, 24.0, 8.0, 10.0, 12.0, 8.0, 9.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.565366268157959, -0.5442867279052734, -0.5232071876525879, -0.5021276473999023, -0.4810481071472168, -0.45996856689453125, -0.4388890564441681, -0.41780951619148254, -0.396729975938797, -0.37565043568611145, -0.3545708954334259, -0.33349138498306274, -0.3124118447303772, -0.29133230447769165, -0.2702527642250061, -0.24917322397232056, -0.228093683719635, -0.20701414346694946, -0.18593460321426392, -0.16485507786273956, -0.14377553761005402, -0.12269599735736847, -0.10161647200584412, -0.08053693175315857, -0.05945739150047302, -0.038377854973077774, -0.017298318445682526, 0.0037812143564224243, 0.02486075460910797, 0.04594029486179352, 0.06701982021331787, 0.08809936046600342, 0.10917896032333374, 0.1302585005760193, 0.15133804082870483, 0.1724175661802292, 0.19349710643291473, 0.21457664668560028, 0.23565617203712463, 0.2567357122898102, 0.2778152525424957, 0.2988947927951813, 0.3199743330478668, 0.34105384349823, 0.3621333837509155, 0.3832129240036011, 0.4042924642562866, 0.42537200450897217, 0.4464515447616577, 0.46753108501434326, 0.4886106252670288, 0.5096901655197144, 0.5307697057723999, 0.5518492460250854, 0.572928786277771, 0.5940083265304565, 0.6150878667831421, 0.6361674070358276, 0.6572469472885132, 0.6783264875411987, 0.6994060277938843, 0.7204855680465698, 0.7415651082992554, 0.7626446485519409, 0.7837241291999817]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 3.0, 6.0, 5.0, 12.0, 22.0, 29.0, 68.0, 185.0, 836.0, 5585.0, 86620.0, 887485.0, 62026.0, 4642.0, 719.0, 156.0, 68.0, 30.0, 13.0, 11.0, 6.0, 7.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3916015625, -0.3787422180175781, -0.36588287353515625, -0.3530235290527344, -0.3401641845703125, -0.3273048400878906, -0.31444549560546875, -0.3015861511230469, -0.288726806640625, -0.2758674621582031, -0.26300811767578125, -0.2501487731933594, -0.2372894287109375, -0.22443008422851562, -0.21157073974609375, -0.19871139526367188, -0.18585205078125, -0.17299270629882812, -0.16013336181640625, -0.14727401733398438, -0.1344146728515625, -0.12155532836914062, -0.10869598388671875, -0.09583663940429688, -0.082977294921875, -0.07011795043945312, -0.05725860595703125, -0.044399261474609375, -0.0315399169921875, -0.018680572509765625, -0.00582122802734375, 0.007038116455078125, 0.0198974609375, 0.032756805419921875, 0.04561614990234375, 0.058475494384765625, 0.0713348388671875, 0.08419418334960938, 0.09705352783203125, 0.10991287231445312, 0.122772216796875, 0.13563156127929688, 0.14849090576171875, 0.16135025024414062, 0.1742095947265625, 0.18706893920898438, 0.19992828369140625, 0.21278762817382812, 0.22564697265625, 0.23850631713867188, 0.25136566162109375, 0.2642250061035156, 0.2770843505859375, 0.2899436950683594, 0.30280303955078125, 0.3156623840332031, 0.328521728515625, 0.3413810729980469, 0.35424041748046875, 0.3670997619628906, 0.3799591064453125, 0.3928184509277344, 0.40567779541015625, 0.4185371398925781, 0.431396484375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 9.0, 9.0, 15.0, 16.0, 11.0, 23.0, 24.0, 30.0, 42.0, 45.0, 47.0, 62.0, 59.0, 65.0, 74.0, 72.0, 55.0, 65.0, 54.0, 48.0, 44.0, 40.0, 25.0, 16.0, 15.0, 11.0, 10.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46826171875, -0.451690673828125, -0.43511962890625, -0.418548583984375, -0.4019775390625, -0.385406494140625, -0.36883544921875, -0.352264404296875, -0.335693359375, -0.319122314453125, -0.30255126953125, -0.285980224609375, -0.2694091796875, -0.252838134765625, -0.23626708984375, -0.219696044921875, -0.203125, -0.186553955078125, -0.16998291015625, -0.153411865234375, -0.1368408203125, -0.120269775390625, -0.10369873046875, -0.087127685546875, -0.070556640625, -0.053985595703125, -0.03741455078125, -0.020843505859375, -0.0042724609375, 0.012298583984375, 0.02886962890625, 0.045440673828125, 0.06201171875, 0.078582763671875, 0.09515380859375, 0.111724853515625, 0.1282958984375, 0.144866943359375, 0.16143798828125, 0.178009033203125, 0.194580078125, 0.211151123046875, 0.22772216796875, 0.244293212890625, 0.2608642578125, 0.277435302734375, 0.29400634765625, 0.310577392578125, 0.3271484375, 0.343719482421875, 0.36029052734375, 0.376861572265625, 0.3934326171875, 0.410003662109375, 0.42657470703125, 0.443145751953125, 0.459716796875, 0.476287841796875, 0.49285888671875, 0.509429931640625, 0.5260009765625, 0.542572021484375, 0.55914306640625, 0.575714111328125, 0.59228515625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 7.0, 7.0, 10.0, 10.0, 13.0, 24.0, 28.0, 42.0, 76.0, 105.0, 173.0, 335.0, 639.0, 1239.0, 2624.0, 5925.0, 15441.0, 48455.0, 184737.0, 467171.0, 229803.0, 60337.0, 18449.0, 6910.0, 2972.0, 1391.0, 688.0, 359.0, 205.0, 138.0, 72.0, 49.0, 43.0, 18.0, 17.0, 7.0, 9.0, 8.0, 5.0, 1.0, 3.0, 2.0, 5.0, 4.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.13525390625, -0.1314525604248047, -0.12765121459960938, -0.12384986877441406, -0.12004852294921875, -0.11624717712402344, -0.11244583129882812, -0.10864448547363281, -0.1048431396484375, -0.10104179382324219, -0.09724044799804688, -0.09343910217285156, -0.08963775634765625, -0.08583641052246094, -0.08203506469726562, -0.07823371887207031, -0.074432373046875, -0.07063102722167969, -0.06682968139648438, -0.06302833557128906, -0.05922698974609375, -0.05542564392089844, -0.051624298095703125, -0.04782295227050781, -0.0440216064453125, -0.04022026062011719, -0.036418914794921875, -0.03261756896972656, -0.02881622314453125, -0.025014877319335938, -0.021213531494140625, -0.017412185668945312, -0.01361083984375, -0.009809494018554688, -0.006008148193359375, -0.0022068023681640625, 0.00159454345703125, 0.0053958892822265625, 0.009197235107421875, 0.012998580932617188, 0.0167999267578125, 0.020601272583007812, 0.024402618408203125, 0.028203964233398438, 0.03200531005859375, 0.03580665588378906, 0.039608001708984375, 0.04340934753417969, 0.047210693359375, 0.05101203918457031, 0.054813385009765625, 0.05861473083496094, 0.06241607666015625, 0.06621742248535156, 0.07001876831054688, 0.07382011413574219, 0.0776214599609375, 0.08142280578613281, 0.08522415161132812, 0.08902549743652344, 0.09282684326171875, 0.09662818908691406, 0.10042953491210938, 0.10423088073730469, 0.1080322265625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 15.0, 8.0, 10.0, 14.0, 15.0, 18.0, 32.0, 36.0, 40.0, 49.0, 48.0, 44.0, 61.0, 70.0, 65.0, 57.0, 70.0, 47.0, 45.0, 34.0, 43.0, 29.0, 34.0, 24.0, 17.0, 13.0, 13.0, 18.0, 9.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.9384765625, -0.9112091064453125, -0.883941650390625, -0.8566741943359375, -0.82940673828125, -0.8021392822265625, -0.774871826171875, -0.7476043701171875, -0.7203369140625, -0.6930694580078125, -0.665802001953125, -0.6385345458984375, -0.61126708984375, -0.5839996337890625, -0.556732177734375, -0.5294647216796875, -0.502197265625, -0.4749298095703125, -0.447662353515625, -0.4203948974609375, -0.39312744140625, -0.3658599853515625, -0.338592529296875, -0.3113250732421875, -0.2840576171875, -0.2567901611328125, -0.229522705078125, -0.2022552490234375, -0.17498779296875, -0.1477203369140625, -0.120452880859375, -0.0931854248046875, -0.06591796875, -0.0386505126953125, -0.011383056640625, 0.0158843994140625, 0.04315185546875, 0.0704193115234375, 0.097686767578125, 0.1249542236328125, 0.1522216796875, 0.1794891357421875, 0.206756591796875, 0.2340240478515625, 0.26129150390625, 0.2885589599609375, 0.315826416015625, 0.3430938720703125, 0.370361328125, 0.3976287841796875, 0.424896240234375, 0.4521636962890625, 0.47943115234375, 0.5066986083984375, 0.533966064453125, 0.5612335205078125, 0.5885009765625, 0.6157684326171875, 0.643035888671875, 0.6703033447265625, 0.69757080078125, 0.7248382568359375, 0.752105712890625, 0.7793731689453125, 0.806640625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 6.0, 4.0, 8.0, 10.0, 23.0, 27.0, 25.0, 57.0, 84.0, 137.0, 197.0, 328.0, 463.0, 863.0, 1585.0, 3201.0, 6741.0, 16556.0, 46946.0, 145980.0, 355625.0, 302010.0, 108192.0, 35287.0, 12941.0, 5454.0, 2490.0, 1317.0, 761.0, 442.0, 276.0, 160.0, 116.0, 68.0, 54.0, 44.0, 21.0, 18.0, 11.0, 10.0, 9.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0238037109375, -0.022917747497558594, -0.022031784057617188, -0.02114582061767578, -0.020259857177734375, -0.01937389373779297, -0.018487930297851562, -0.017601966857910156, -0.01671600341796875, -0.015830039978027344, -0.014944076538085938, -0.014058113098144531, -0.013172149658203125, -0.012286186218261719, -0.011400222778320312, -0.010514259338378906, -0.0096282958984375, -0.008742332458496094, -0.007856369018554688, -0.006970405578613281, -0.006084442138671875, -0.005198478698730469, -0.0043125152587890625, -0.0034265518188476562, -0.00254058837890625, -0.0016546249389648438, -0.0007686614990234375, 0.00011730194091796875, 0.001003265380859375, 0.0018892288208007812, 0.0027751922607421875, 0.0036611557006835938, 0.004547119140625, 0.005433082580566406, 0.0063190460205078125, 0.007205009460449219, 0.008090972900390625, 0.008976936340332031, 0.009862899780273438, 0.010748863220214844, 0.01163482666015625, 0.012520790100097656, 0.013406753540039062, 0.014292716979980469, 0.015178680419921875, 0.01606464385986328, 0.016950607299804688, 0.017836570739746094, 0.0187225341796875, 0.019608497619628906, 0.020494461059570312, 0.02138042449951172, 0.022266387939453125, 0.02315235137939453, 0.024038314819335938, 0.024924278259277344, 0.02581024169921875, 0.026696205139160156, 0.027582168579101562, 0.02846813201904297, 0.029354095458984375, 0.03024005889892578, 0.031126022338867188, 0.032011985778808594, 0.03289794921875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 7.0, 12.0, 14.0, 22.0, 28.0, 34.0, 46.0, 51.0, 66.0, 82.0, 103.0, 95.0, 90.0, 90.0, 64.0, 61.0, 35.0, 21.0, 24.0, 16.0, 10.0, 11.0, 5.0, 7.0, 1.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.7954578399658203e-05, -2.7242116630077362e-05, -2.652965486049652e-05, -2.581719309091568e-05, -2.510473132133484e-05, -2.4392269551753998e-05, -2.3679807782173157e-05, -2.2967346012592316e-05, -2.2254884243011475e-05, -2.1542422473430634e-05, -2.0829960703849792e-05, -2.011749893426895e-05, -1.940503716468811e-05, -1.869257539510727e-05, -1.7980113625526428e-05, -1.7267651855945587e-05, -1.6555190086364746e-05, -1.5842728316783905e-05, -1.5130266547203064e-05, -1.4417804777622223e-05, -1.3705343008041382e-05, -1.299288123846054e-05, -1.22804194688797e-05, -1.1567957699298859e-05, -1.0855495929718018e-05, -1.0143034160137177e-05, -9.430572390556335e-06, -8.718110620975494e-06, -8.005648851394653e-06, -7.293187081813812e-06, -6.580725312232971e-06, -5.86826354265213e-06, -5.155801773071289e-06, -4.443340003490448e-06, -3.730878233909607e-06, -3.018416464328766e-06, -2.305954694747925e-06, -1.5934929251670837e-06, -8.810311555862427e-07, -1.685693860054016e-07, 5.438923835754395e-07, 1.2563541531562805e-06, 1.9688159227371216e-06, 2.6812776923179626e-06, 3.3937394618988037e-06, 4.106201231479645e-06, 4.818663001060486e-06, 5.531124770641327e-06, 6.243586540222168e-06, 6.956048309803009e-06, 7.66851007938385e-06, 8.380971848964691e-06, 9.093433618545532e-06, 9.805895388126373e-06, 1.0518357157707214e-05, 1.1230818927288055e-05, 1.1943280696868896e-05, 1.2655742466449738e-05, 1.3368204236030579e-05, 1.408066600561142e-05, 1.479312777519226e-05, 1.5505589544773102e-05, 1.6218051314353943e-05, 1.6930513083934784e-05, 1.7642974853515625e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 10.0, 2.0, 11.0, 13.0, 15.0, 12.0, 26.0, 38.0, 58.0, 79.0, 130.0, 182.0, 312.0, 492.0, 820.0, 1609.0, 3340.0, 7113.0, 16559.0, 41542.0, 109359.0, 258032.0, 322601.0, 172625.0, 66819.0, 25860.0, 10799.0, 4790.0, 2325.0, 1192.0, 658.0, 393.0, 244.0, 162.0, 120.0, 61.0, 41.0, 32.0, 16.0, 17.0, 10.0, 8.0, 4.0, 9.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.022979736328125, -0.0223085880279541, -0.021637439727783203, -0.020966291427612305, -0.020295143127441406, -0.019623994827270508, -0.01895284652709961, -0.01828169822692871, -0.017610549926757812, -0.016939401626586914, -0.016268253326416016, -0.015597105026245117, -0.014925956726074219, -0.01425480842590332, -0.013583660125732422, -0.012912511825561523, -0.012241363525390625, -0.011570215225219727, -0.010899066925048828, -0.01022791862487793, -0.009556770324707031, -0.008885622024536133, -0.008214473724365234, -0.007543325424194336, -0.0068721771240234375, -0.006201028823852539, -0.005529880523681641, -0.004858732223510742, -0.004187583923339844, -0.0035164356231689453, -0.002845287322998047, -0.0021741390228271484, -0.00150299072265625, -0.0008318424224853516, -0.00016069412231445312, 0.0005104541778564453, 0.0011816024780273438, 0.0018527507781982422, 0.0025238990783691406, 0.003195047378540039, 0.0038661956787109375, 0.004537343978881836, 0.005208492279052734, 0.005879640579223633, 0.006550788879394531, 0.00722193717956543, 0.007893085479736328, 0.008564233779907227, 0.009235382080078125, 0.009906530380249023, 0.010577678680419922, 0.01124882698059082, 0.011919975280761719, 0.012591123580932617, 0.013262271881103516, 0.013933420181274414, 0.014604568481445312, 0.015275716781616211, 0.01594686508178711, 0.016618013381958008, 0.017289161682128906, 0.017960309982299805, 0.018631458282470703, 0.0193026065826416, 0.0199737548828125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 8.0, 4.0, 6.0, 5.0, 13.0, 21.0, 17.0, 19.0, 22.0, 33.0, 45.0, 39.0, 46.0, 45.0, 53.0, 45.0, 62.0, 43.0, 62.0, 66.0, 52.0, 49.0, 38.0, 32.0, 41.0, 23.0, 25.0, 19.0, 17.0, 17.0, 7.0, 6.0, 6.0, 7.0, 2.0, 4.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00606536865234375, -0.005846261978149414, -0.005627155303955078, -0.005408048629760742, -0.005188941955566406, -0.00496983528137207, -0.004750728607177734, -0.0045316219329833984, -0.0043125152587890625, -0.0040934085845947266, -0.0038743019104003906, -0.0036551952362060547, -0.0034360885620117188, -0.003216981887817383, -0.002997875213623047, -0.002778768539428711, -0.002559661865234375, -0.002340555191040039, -0.002121448516845703, -0.0019023418426513672, -0.0016832351684570312, -0.0014641284942626953, -0.0012450218200683594, -0.0010259151458740234, -0.0008068084716796875, -0.0005877017974853516, -0.0003685951232910156, -0.0001494884490966797, 6.961822509765625e-05, 0.0002887248992919922, 0.0005078315734863281, 0.0007269382476806641, 0.000946044921875, 0.001165151596069336, 0.0013842582702636719, 0.0016033649444580078, 0.0018224716186523438, 0.0020415782928466797, 0.0022606849670410156, 0.0024797916412353516, 0.0026988983154296875, 0.0029180049896240234, 0.0031371116638183594, 0.0033562183380126953, 0.0035753250122070312, 0.003794431686401367, 0.004013538360595703, 0.004232645034790039, 0.004451751708984375, 0.004670858383178711, 0.004889965057373047, 0.005109071731567383, 0.005328178405761719, 0.005547285079956055, 0.005766391754150391, 0.0059854984283447266, 0.0062046051025390625, 0.0064237117767333984, 0.006642818450927734, 0.00686192512512207, 0.007081031799316406, 0.007300138473510742, 0.007519245147705078, 0.007738351821899414, 0.00795745849609375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 16.0, 79.0, 518.0, 347.0, 49.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.552289605140686, -0.43884190917015076, -0.3253942131996155, -0.2119465172290802, -0.09849882125854492, 0.014948844909667969, 0.12839657068252563, 0.2418442964553833, 0.3552919626235962, 0.46873965859413147, 0.5821873545646667, 0.6956350803375244, 0.8090827465057373, 0.9225304126739502, 1.035978078842163, 1.1494258642196655, 1.2628735303878784, 1.3763211965560913, 1.4897689819335938, 1.6032166481018066, 1.7166643142700195, 1.8301119804382324, 1.9435596466064453, 2.057007312774658, 2.170454978942871, 2.283902645111084, 2.397350311279297, 2.5107979774475098, 2.6242456436157227, 2.7376933097839355, 2.8511412143707275, 2.9645888805389404, 3.0780367851257324, 3.1914844512939453, 3.304932117462158, 3.418379783630371, 3.531827449798584, 3.645275115966797, 3.758723020553589, 3.8721706867218018, 3.9856183528900146, 4.099066257476807, 4.2125139236450195, 4.325961589813232, 4.439409255981445, 4.552856922149658, 4.666304588317871, 4.779752254486084, 4.893199920654297, 5.00664758682251, 5.120095252990723, 5.2335429191589355, 5.346990585327148, 5.460438251495361, 5.573885917663574, 5.687334060668945, 5.80078125, 5.914228916168213, 6.027676582336426, 6.141124248504639, 6.254571914672852, 6.3680195808410645, 6.481467247009277, 6.594915390014648, 6.708363056182861]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 4.0, 1.0, 4.0, 7.0, 15.0, 19.0, 27.0, 26.0, 34.0, 38.0, 40.0, 69.0, 70.0, 79.0, 73.0, 81.0, 78.0, 70.0, 64.0, 52.0, 54.0, 37.0, 17.0, 14.0, 11.0, 14.0, 8.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5818410515785217, -0.5629381537437439, -0.5440352559089661, -0.5251323580741882, -0.5062295198440552, -0.48732659220695496, -0.4684237241744995, -0.4495208263397217, -0.43061792850494385, -0.411715030670166, -0.3928121328353882, -0.37390926480293274, -0.3550063669681549, -0.3361034691333771, -0.31720060110092163, -0.2982977032661438, -0.27939480543136597, -0.26049190759658813, -0.2415890246629715, -0.22268614172935486, -0.20378324389457703, -0.1848803460597992, -0.16597746312618256, -0.14707458019256592, -0.12817168235778809, -0.10926879197359085, -0.09036590158939362, -0.07146301120519638, -0.052560120820999146, -0.03365723043680191, -0.014754340052604675, 0.004148542881011963, 0.023051440715789795, 0.04195433109998703, 0.060857221484184265, 0.0797601118683815, 0.09866300225257874, 0.11756589263677597, 0.1364687830209732, 0.15537166595458984, 0.17427456378936768, 0.1931774616241455, 0.21208034455776215, 0.23098322749137878, 0.24988612532615662, 0.26878902316093445, 0.2876918911933899, 0.3065947890281677, 0.32549768686294556, 0.3444005846977234, 0.3633034825325012, 0.38220635056495667, 0.4011092483997345, 0.42001214623451233, 0.4389150142669678, 0.4578179121017456, 0.47672080993652344, 0.49562370777130127, 0.5145266056060791, 0.5334295034408569, 0.5523324012756348, 0.5712352395057678, 0.5901381373405457, 0.6090410351753235, 0.6279439330101013]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 7.0, 7.0, 2.0, 11.0, 19.0, 50.0, 77.0, 178.0, 462.0, 1373.0, 4734.0, 31057.0, 679383.0, 310139.0, 16249.0, 3162.0, 980.0, 354.0, 149.0, 69.0, 39.0, 19.0, 13.0, 8.0, 7.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92138671875, -0.8883132934570312, -0.8552398681640625, -0.8221664428710938, -0.789093017578125, -0.7560195922851562, -0.7229461669921875, -0.6898727416992188, -0.65679931640625, -0.6237258911132812, -0.5906524658203125, -0.5575790405273438, -0.524505615234375, -0.49143218994140625, -0.4583587646484375, -0.42528533935546875, -0.3922119140625, -0.35913848876953125, -0.3260650634765625, -0.29299163818359375, -0.259918212890625, -0.22684478759765625, -0.1937713623046875, -0.16069793701171875, -0.12762451171875, -0.09455108642578125, -0.0614776611328125, -0.02840423583984375, 0.004669189453125, 0.03774261474609375, 0.0708160400390625, 0.10388946533203125, 0.136962890625, 0.17003631591796875, 0.2031097412109375, 0.23618316650390625, 0.269256591796875, 0.30233001708984375, 0.3354034423828125, 0.36847686767578125, 0.40155029296875, 0.43462371826171875, 0.4676971435546875, 0.5007705688476562, 0.533843994140625, 0.5669174194335938, 0.5999908447265625, 0.6330642700195312, 0.6661376953125, 0.6992111206054688, 0.7322845458984375, 0.7653579711914062, 0.798431396484375, 0.8315048217773438, 0.8645782470703125, 0.8976516723632812, 0.93072509765625, 0.9637985229492188, 0.9968719482421875, 1.0299453735351562, 1.063018798828125, 1.0960922241210938, 1.1291656494140625, 1.1622390747070312, 1.1953125]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 7.0, 11.0, 13.0, 18.0, 17.0, 23.0, 34.0, 37.0, 29.0, 47.0, 58.0, 57.0, 84.0, 61.0, 75.0, 80.0, 67.0, 55.0, 55.0, 53.0, 40.0, 28.0, 17.0, 11.0, 13.0, 4.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85205078125, -0.8191146850585938, -0.7861785888671875, -0.7532424926757812, -0.720306396484375, -0.6873703002929688, -0.6544342041015625, -0.6214981079101562, -0.58856201171875, -0.5556259155273438, -0.5226898193359375, -0.48975372314453125, -0.456817626953125, -0.42388153076171875, -0.3909454345703125, -0.35800933837890625, -0.3250732421875, -0.29213714599609375, -0.2592010498046875, -0.22626495361328125, -0.193328857421875, -0.16039276123046875, -0.1274566650390625, -0.09452056884765625, -0.06158447265625, -0.02864837646484375, 0.0042877197265625, 0.03722381591796875, 0.070159912109375, 0.10309600830078125, 0.1360321044921875, 0.16896820068359375, 0.201904296875, 0.23484039306640625, 0.2677764892578125, 0.30071258544921875, 0.333648681640625, 0.36658477783203125, 0.3995208740234375, 0.43245697021484375, 0.46539306640625, 0.49832916259765625, 0.5312652587890625, 0.5642013549804688, 0.597137451171875, 0.6300735473632812, 0.6630096435546875, 0.6959457397460938, 0.7288818359375, 0.7618179321289062, 0.7947540283203125, 0.8276901245117188, 0.860626220703125, 0.8935623168945312, 0.9264984130859375, 0.9594345092773438, 0.99237060546875, 1.0253067016601562, 1.0582427978515625, 1.0911788940429688, 1.124114990234375, 1.1570510864257812, 1.1899871826171875, 1.2229232788085938, 1.255859375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 8.0, 11.0, 17.0, 18.0, 21.0, 28.0, 43.0, 61.0, 134.0, 202.0, 414.0, 948.0, 3538.0, 38669.0, 925332.0, 72026.0, 4833.0, 1191.0, 475.0, 237.0, 135.0, 74.0, 41.0, 29.0, 21.0, 14.0, 8.0, 6.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.259765625, -1.221099853515625, -1.18243408203125, -1.143768310546875, -1.1051025390625, -1.066436767578125, -1.02777099609375, -0.989105224609375, -0.950439453125, -0.911773681640625, -0.87310791015625, -0.834442138671875, -0.7957763671875, -0.757110595703125, -0.71844482421875, -0.679779052734375, -0.64111328125, -0.602447509765625, -0.56378173828125, -0.525115966796875, -0.4864501953125, -0.447784423828125, -0.40911865234375, -0.370452880859375, -0.331787109375, -0.293121337890625, -0.25445556640625, -0.215789794921875, -0.1771240234375, -0.138458251953125, -0.09979248046875, -0.061126708984375, -0.0224609375, 0.016204833984375, 0.05487060546875, 0.093536376953125, 0.1322021484375, 0.170867919921875, 0.20953369140625, 0.248199462890625, 0.286865234375, 0.325531005859375, 0.36419677734375, 0.402862548828125, 0.4415283203125, 0.480194091796875, 0.51885986328125, 0.557525634765625, 0.59619140625, 0.634857177734375, 0.67352294921875, 0.712188720703125, 0.7508544921875, 0.789520263671875, 0.82818603515625, 0.866851806640625, 0.905517578125, 0.944183349609375, 0.98284912109375, 1.021514892578125, 1.0601806640625, 1.098846435546875, 1.13751220703125, 1.176177978515625, 1.21484375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 4.0, 5.0, 9.0, 6.0, 6.0, 11.0, 12.0, 17.0, 27.0, 24.0, 26.0, 34.0, 22.0, 42.0, 43.0, 32.0, 55.0, 50.0, 48.0, 61.0, 39.0, 40.0, 46.0, 55.0, 38.0, 34.0, 39.0, 36.0, 27.0, 18.0, 17.0, 21.0, 9.0, 16.0, 8.0, 11.0, 1.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8349609375, -0.8076858520507812, -0.7804107666015625, -0.7531356811523438, -0.725860595703125, -0.6985855102539062, -0.6713104248046875, -0.6440353393554688, -0.61676025390625, -0.5894851684570312, -0.5622100830078125, -0.5349349975585938, -0.507659912109375, -0.48038482666015625, -0.4531097412109375, -0.42583465576171875, -0.3985595703125, -0.37128448486328125, -0.3440093994140625, -0.31673431396484375, -0.289459228515625, -0.26218414306640625, -0.2349090576171875, -0.20763397216796875, -0.18035888671875, -0.15308380126953125, -0.1258087158203125, -0.09853363037109375, -0.071258544921875, -0.04398345947265625, -0.0167083740234375, 0.01056671142578125, 0.037841796875, 0.06511688232421875, 0.0923919677734375, 0.11966705322265625, 0.146942138671875, 0.17421722412109375, 0.2014923095703125, 0.22876739501953125, 0.25604248046875, 0.28331756591796875, 0.3105926513671875, 0.33786773681640625, 0.365142822265625, 0.39241790771484375, 0.4196929931640625, 0.44696807861328125, 0.4742431640625, 0.5015182495117188, 0.5287933349609375, 0.5560684204101562, 0.583343505859375, 0.6106185913085938, 0.6378936767578125, 0.6651687622070312, 0.69244384765625, 0.7197189331054688, 0.7469940185546875, 0.7742691040039062, 0.801544189453125, 0.8288192749023438, 0.8560943603515625, 0.8833694458007812, 0.91064453125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 8.0, 21.0, 33.0, 48.0, 125.0, 320.0, 924.0, 4029.0, 46473.0, 949471.0, 41996.0, 3709.0, 881.0, 292.0, 109.0, 46.0, 27.0, 13.0, 7.0, 5.0, 5.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.59521484375, -0.5784416198730469, -0.5616683959960938, -0.5448951721191406, -0.5281219482421875, -0.5113487243652344, -0.49457550048828125, -0.4778022766113281, -0.461029052734375, -0.4442558288574219, -0.42748260498046875, -0.4107093811035156, -0.3939361572265625, -0.3771629333496094, -0.36038970947265625, -0.3436164855957031, -0.32684326171875, -0.3100700378417969, -0.29329681396484375, -0.2765235900878906, -0.2597503662109375, -0.24297714233398438, -0.22620391845703125, -0.20943069458007812, -0.192657470703125, -0.17588424682617188, -0.15911102294921875, -0.14233779907226562, -0.1255645751953125, -0.10879135131835938, -0.09201812744140625, -0.07524490356445312, -0.0584716796875, -0.041698455810546875, -0.02492523193359375, -0.008152008056640625, 0.0086212158203125, 0.025394439697265625, 0.04216766357421875, 0.058940887451171875, 0.075714111328125, 0.09248733520507812, 0.10926055908203125, 0.12603378295898438, 0.1428070068359375, 0.15958023071289062, 0.17635345458984375, 0.19312667846679688, 0.20989990234375, 0.22667312622070312, 0.24344635009765625, 0.2602195739746094, 0.2769927978515625, 0.2937660217285156, 0.31053924560546875, 0.3273124694824219, 0.344085693359375, 0.3608589172363281, 0.37763214111328125, 0.3944053649902344, 0.4111785888671875, 0.4279518127441406, 0.44472503662109375, 0.4614982604980469, 0.478271484375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 6.0, 8.0, 12.0, 29.0, 55.0, 145.0, 245.0, 225.0, 135.0, 68.0, 19.0, 15.0, 13.0, 7.0, 10.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.598234176635742e-05, -6.384868174791336e-05, -6.17150217294693e-05, -5.958136171102524e-05, -5.744770169258118e-05, -5.5314041674137115e-05, -5.3180381655693054e-05, -5.104672163724899e-05, -4.891306161880493e-05, -4.677940160036087e-05, -4.464574158191681e-05, -4.251208156347275e-05, -4.0378421545028687e-05, -3.8244761526584625e-05, -3.6111101508140564e-05, -3.39774414896965e-05, -3.184378147125244e-05, -2.971012145280838e-05, -2.757646143436432e-05, -2.5442801415920258e-05, -2.3309141397476196e-05, -2.1175481379032135e-05, -1.9041821360588074e-05, -1.6908161342144012e-05, -1.4774501323699951e-05, -1.264084130525589e-05, -1.0507181286811829e-05, -8.373521268367767e-06, -6.239861249923706e-06, -4.106201231479645e-06, -1.9725412130355835e-06, 1.6111880540847778e-07, 2.294778823852539e-06, 4.4284388422966e-06, 6.562098860740662e-06, 8.695758879184723e-06, 1.0829418897628784e-05, 1.2963078916072845e-05, 1.5096738934516907e-05, 1.7230398952960968e-05, 1.936405897140503e-05, 2.149771898984909e-05, 2.3631379008293152e-05, 2.5765039026737213e-05, 2.7898699045181274e-05, 3.0032359063625336e-05, 3.21660190820694e-05, 3.429967910051346e-05, 3.643333911895752e-05, 3.856699913740158e-05, 4.070065915584564e-05, 4.28343191742897e-05, 4.4967979192733765e-05, 4.7101639211177826e-05, 4.923529922962189e-05, 5.136895924806595e-05, 5.350261926651001e-05, 5.563627928495407e-05, 5.776993930339813e-05, 5.9903599321842194e-05, 6.203725934028625e-05, 6.417091935873032e-05, 6.630457937717438e-05, 6.843823939561844e-05, 7.05718994140625e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 3.0, 6.0, 4.0, 7.0, 11.0, 14.0, 19.0, 38.0, 61.0, 119.0, 236.0, 696.0, 3640.0, 41239.0, 944495.0, 52547.0, 4077.0, 809.0, 252.0, 121.0, 51.0, 31.0, 19.0, 16.0, 14.0, 6.0, 8.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56787109375, -0.5523262023925781, -0.5367813110351562, -0.5212364196777344, -0.5056915283203125, -0.4901466369628906, -0.47460174560546875, -0.4590568542480469, -0.443511962890625, -0.4279670715332031, -0.41242218017578125, -0.3968772888183594, -0.3813323974609375, -0.3657875061035156, -0.35024261474609375, -0.3346977233886719, -0.31915283203125, -0.3036079406738281, -0.28806304931640625, -0.2725181579589844, -0.2569732666015625, -0.24142837524414062, -0.22588348388671875, -0.21033859252929688, -0.194793701171875, -0.17924880981445312, -0.16370391845703125, -0.14815902709960938, -0.1326141357421875, -0.11706924438476562, -0.10152435302734375, -0.08597946166992188, -0.0704345703125, -0.054889678955078125, -0.03934478759765625, -0.023799896240234375, -0.0082550048828125, 0.007289886474609375, 0.02283477783203125, 0.038379669189453125, 0.053924560546875, 0.06946945190429688, 0.08501434326171875, 0.10055923461914062, 0.1161041259765625, 0.13164901733398438, 0.14719390869140625, 0.16273880004882812, 0.17828369140625, 0.19382858276367188, 0.20937347412109375, 0.22491836547851562, 0.2404632568359375, 0.2560081481933594, 0.27155303955078125, 0.2870979309082031, 0.302642822265625, 0.3181877136230469, 0.33373260498046875, 0.3492774963378906, 0.3648223876953125, 0.3803672790527344, 0.39591217041015625, 0.4114570617675781, 0.427001953125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 10.0, 6.0, 15.0, 12.0, 21.0, 34.0, 41.0, 74.0, 78.0, 119.0, 121.0, 111.0, 93.0, 77.0, 53.0, 45.0, 27.0, 13.0, 11.0, 10.0, 6.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.112060546875, -0.10871505737304688, -0.10536956787109375, -0.10202407836914062, -0.0986785888671875, -0.09533309936523438, -0.09198760986328125, -0.08864212036132812, -0.085296630859375, -0.08195114135742188, -0.07860565185546875, -0.07526016235351562, -0.0719146728515625, -0.06856918334960938, -0.06522369384765625, -0.061878204345703125, -0.05853271484375, -0.055187225341796875, -0.05184173583984375, -0.048496246337890625, -0.0451507568359375, -0.041805267333984375, -0.03845977783203125, -0.035114288330078125, -0.031768798828125, -0.028423309326171875, -0.02507781982421875, -0.021732330322265625, -0.0183868408203125, -0.015041351318359375, -0.01169586181640625, -0.008350372314453125, -0.0050048828125, -0.001659393310546875, 0.00168609619140625, 0.005031585693359375, 0.0083770751953125, 0.011722564697265625, 0.01506805419921875, 0.018413543701171875, 0.021759033203125, 0.025104522705078125, 0.02845001220703125, 0.031795501708984375, 0.0351409912109375, 0.038486480712890625, 0.04183197021484375, 0.045177459716796875, 0.04852294921875, 0.051868438720703125, 0.05521392822265625, 0.058559417724609375, 0.0619049072265625, 0.06525039672851562, 0.06859588623046875, 0.07194137573242188, 0.075286865234375, 0.07863235473632812, 0.08197784423828125, 0.08532333374023438, 0.0886688232421875, 0.09201431274414062, 0.09535980224609375, 0.09870529174804688, 0.10205078125]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 3.0, 7.0, 12.0, 25.0, 37.0, 84.0, 130.0, 191.0, 187.0, 154.0, 83.0, 41.0, 22.0, 17.0, 7.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.028669595718384, -1.9635827541351318, -1.8984960317611694, -1.8334091901779175, -1.768322467803955, -1.7032356262207031, -1.6381487846374512, -1.5730619430541992, -1.5079752206802368, -1.4428883790969849, -1.3778016567230225, -1.3127148151397705, -1.2476279735565186, -1.1825412511825562, -1.1174544095993042, -1.0523676872253418, -0.9872808456420898, -0.9221940636634827, -0.8571072816848755, -0.7920204401016235, -0.7269336581230164, -0.6618468761444092, -0.5967600345611572, -0.53167325258255, -0.46658647060394287, -0.4014996886253357, -0.33641287684440613, -0.27132606506347656, -0.20623928308486938, -0.1411525011062622, -0.07606568932533264, -0.010978877544403076, 0.0541081428527832, 0.11919493973255157, 0.18428173661231995, 0.24936853349208832, 0.3144553303718567, 0.37954211235046387, 0.44462892413139343, 0.509715735912323, 0.5748025178909302, 0.6398892998695374, 0.7049760818481445, 0.7700629234313965, 0.8351497054100037, 0.9002364873886108, 0.9653233289718628, 1.0304100513458252, 1.0954968929290771, 1.160583734512329, 1.2256704568862915, 1.2907572984695435, 1.3558440208435059, 1.4209308624267578, 1.4860177040100098, 1.5511045455932617, 1.6161912679672241, 1.681278109550476, 1.7463648319244385, 1.8114516735076904, 1.8765385150909424, 1.9416252374649048, 2.006711959838867, 2.071798801422119, 2.136885643005371]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 5.0, 4.0, 8.0, 11.0, 6.0, 12.0, 12.0, 13.0, 23.0, 26.0, 31.0, 23.0, 26.0, 27.0, 22.0, 30.0, 26.0, 32.0, 47.0, 33.0, 40.0, 37.0, 30.0, 26.0, 45.0, 31.0, 38.0, 38.0, 39.0, 41.0, 29.0, 26.0, 21.0, 23.0, 18.0, 15.0, 12.0, 7.0, 11.0, 10.0, 15.0, 6.0, 6.0, 6.0, 3.0, 5.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.162905216217041, -1.1256847381591797, -1.0884641408920288, -1.0512436628341675, -1.0140231847763062, -0.9768026471138, -0.939582109451294, -0.9023616313934326, -0.8651410937309265, -0.8279205560684204, -0.7907000780105591, -0.753479540348053, -0.7162590026855469, -0.6790385246276855, -0.6418179869651794, -0.6045974493026733, -0.567376971244812, -0.5301564335823059, -0.4929359555244446, -0.4557154178619385, -0.41849491000175476, -0.38127440214157104, -0.34405386447906494, -0.3068333566188812, -0.2696128487586975, -0.2323923408985138, -0.19517181813716888, -0.15795129537582397, -0.12073078751564026, -0.08351027965545654, -0.04628975689411163, -0.009069234132766724, 0.028151273727416992, 0.0653717890381813, 0.10259230434894562, 0.13981282711029053, 0.17703333497047424, 0.21425384283065796, 0.25147438049316406, 0.2886948883533478, 0.3259153962135315, 0.3631359040737152, 0.4003564119338989, 0.43757694959640503, 0.47479745745658875, 0.5120179653167725, 0.5492385029792786, 0.5864590406417847, 0.623679518699646, 0.6609000563621521, 0.6981205344200134, 0.7353410720825195, 0.7725615501403809, 0.809782087802887, 0.8470026254653931, 0.8842231035232544, 0.9214436411857605, 0.9586641788482666, 0.9958846569061279, 1.0331051349639893, 1.0703257322311401, 1.1075462102890015, 1.1447666883468628, 1.1819872856140137, 1.219207763671875]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 5.0, 9.0, 10.0, 12.0, 18.0, 38.0, 78.0, 252.0, 776.0, 3620.0, 116087.0, 4041468.0, 28230.0, 2576.0, 676.0, 209.0, 96.0, 44.0, 34.0, 11.0, 5.0, 9.0, 6.0, 4.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7236328125, -1.6465606689453125, -1.569488525390625, -1.4924163818359375, -1.41534423828125, -1.3382720947265625, -1.261199951171875, -1.1841278076171875, -1.1070556640625, -1.0299835205078125, -0.952911376953125, -0.8758392333984375, -0.79876708984375, -0.7216949462890625, -0.644622802734375, -0.5675506591796875, -0.490478515625, -0.4134063720703125, -0.336334228515625, -0.2592620849609375, -0.18218994140625, -0.1051177978515625, -0.028045654296875, 0.0490264892578125, 0.1260986328125, 0.2031707763671875, 0.280242919921875, 0.3573150634765625, 0.43438720703125, 0.5114593505859375, 0.588531494140625, 0.6656036376953125, 0.74267578125, 0.8197479248046875, 0.896820068359375, 0.9738922119140625, 1.05096435546875, 1.1280364990234375, 1.205108642578125, 1.2821807861328125, 1.3592529296875, 1.4363250732421875, 1.513397216796875, 1.5904693603515625, 1.66754150390625, 1.7446136474609375, 1.821685791015625, 1.8987579345703125, 1.975830078125, 2.0529022216796875, 2.129974365234375, 2.2070465087890625, 2.28411865234375, 2.3611907958984375, 2.438262939453125, 2.5153350830078125, 2.5924072265625, 2.6694793701171875, 2.746551513671875, 2.8236236572265625, 2.90069580078125, 2.9777679443359375, 3.054840087890625, 3.1319122314453125, 3.208984375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 7.0, 9.0, 11.0, 10.0, 17.0, 13.0, 18.0, 27.0, 32.0, 42.0, 41.0, 37.0, 42.0, 48.0, 52.0, 52.0, 57.0, 50.0, 60.0, 52.0, 60.0, 48.0, 47.0, 27.0, 34.0, 25.0, 16.0, 22.0, 14.0, 13.0, 4.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59375, -0.5763702392578125, -0.558990478515625, -0.5416107177734375, -0.52423095703125, -0.5068511962890625, -0.489471435546875, -0.4720916748046875, -0.4547119140625, -0.4373321533203125, -0.419952392578125, -0.4025726318359375, -0.38519287109375, -0.3678131103515625, -0.350433349609375, -0.3330535888671875, -0.315673828125, -0.2982940673828125, -0.280914306640625, -0.2635345458984375, -0.24615478515625, -0.2287750244140625, -0.211395263671875, -0.1940155029296875, -0.1766357421875, -0.1592559814453125, -0.141876220703125, -0.1244964599609375, -0.10711669921875, -0.0897369384765625, -0.072357177734375, -0.0549774169921875, -0.03759765625, -0.0202178955078125, -0.002838134765625, 0.0145416259765625, 0.03192138671875, 0.0493011474609375, 0.066680908203125, 0.0840606689453125, 0.1014404296875, 0.1188201904296875, 0.136199951171875, 0.1535797119140625, 0.17095947265625, 0.1883392333984375, 0.205718994140625, 0.2230987548828125, 0.240478515625, 0.2578582763671875, 0.275238037109375, 0.2926177978515625, 0.30999755859375, 0.3273773193359375, 0.344757080078125, 0.3621368408203125, 0.3795166015625, 0.3968963623046875, 0.414276123046875, 0.4316558837890625, 0.44903564453125, 0.4664154052734375, 0.483795166015625, 0.5011749267578125, 0.5185546875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 7.0, 5.0, 10.0, 12.0, 18.0, 29.0, 51.0, 72.0, 132.0, 227.0, 433.0, 1015.0, 2607.0, 10166.0, 86525.0, 3734014.0, 331870.0, 20141.0, 4185.0, 1406.0, 611.0, 316.0, 151.0, 95.0, 76.0, 36.0, 23.0, 14.0, 13.0, 8.0, 3.0, 5.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.94091796875, -0.9069290161132812, -0.8729400634765625, -0.8389511108398438, -0.804962158203125, -0.7709732055664062, -0.7369842529296875, -0.7029953002929688, -0.66900634765625, -0.6350173950195312, -0.6010284423828125, -0.5670394897460938, -0.533050537109375, -0.49906158447265625, -0.4650726318359375, -0.43108367919921875, -0.3970947265625, -0.36310577392578125, -0.3291168212890625, -0.29512786865234375, -0.261138916015625, -0.22714996337890625, -0.1931610107421875, -0.15917205810546875, -0.12518310546875, -0.09119415283203125, -0.0572052001953125, -0.02321624755859375, 0.010772705078125, 0.04476165771484375, 0.0787506103515625, 0.11273956298828125, 0.146728515625, 0.18071746826171875, 0.2147064208984375, 0.24869537353515625, 0.282684326171875, 0.31667327880859375, 0.3506622314453125, 0.38465118408203125, 0.41864013671875, 0.45262908935546875, 0.4866180419921875, 0.5206069946289062, 0.554595947265625, 0.5885848999023438, 0.6225738525390625, 0.6565628051757812, 0.6905517578125, 0.7245407104492188, 0.7585296630859375, 0.7925186157226562, 0.826507568359375, 0.8604965209960938, 0.8944854736328125, 0.9284744262695312, 0.96246337890625, 0.9964523315429688, 1.0304412841796875, 1.0644302368164062, 1.098419189453125, 1.1324081420898438, 1.1663970947265625, 1.2003860473632812, 1.234375]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 9.0, 13.0, 15.0, 25.0, 35.0, 37.0, 80.0, 133.0, 269.0, 556.0, 876.0, 904.0, 527.0, 241.0, 135.0, 82.0, 37.0, 29.0, 20.0, 11.0, 11.0, 8.0, 5.0, 3.0, 0.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.31103515625, -0.3023948669433594, -0.29375457763671875, -0.2851142883300781, -0.2764739990234375, -0.2678337097167969, -0.25919342041015625, -0.2505531311035156, -0.241912841796875, -0.23327255249023438, -0.22463226318359375, -0.21599197387695312, -0.2073516845703125, -0.19871139526367188, -0.19007110595703125, -0.18143081665039062, -0.17279052734375, -0.16415023803710938, -0.15550994873046875, -0.14686965942382812, -0.1382293701171875, -0.12958908081054688, -0.12094879150390625, -0.11230850219726562, -0.103668212890625, -0.09502792358398438, -0.08638763427734375, -0.07774734497070312, -0.0691070556640625, -0.060466766357421875, -0.05182647705078125, -0.043186187744140625, -0.0345458984375, -0.025905609130859375, -0.01726531982421875, -0.008625030517578125, 1.52587890625e-05, 0.008655548095703125, 0.01729583740234375, 0.025936126708984375, 0.034576416015625, 0.043216705322265625, 0.05185699462890625, 0.060497283935546875, 0.0691375732421875, 0.07777786254882812, 0.08641815185546875, 0.09505844116210938, 0.10369873046875, 0.11233901977539062, 0.12097930908203125, 0.12961959838867188, 0.1382598876953125, 0.14690017700195312, 0.15554046630859375, 0.16418075561523438, 0.172821044921875, 0.18146133422851562, 0.19010162353515625, 0.19874191284179688, 0.2073822021484375, 0.21602249145507812, 0.22466278076171875, 0.23330307006835938, 0.241943359375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 5.0, 7.0, 10.0, 20.0, 28.0, 44.0, 64.0, 80.0, 108.0, 124.0, 129.0, 102.0, 88.0, 69.0, 52.0, 17.0, 13.0, 8.0, 11.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6997055411338806, -0.6683148741722107, -0.636924147605896, -0.6055334806442261, -0.5741427540779114, -0.5427520871162415, -0.5113613605499268, -0.47997069358825684, -0.4485799968242645, -0.4171893000602722, -0.3857986032962799, -0.3544079065322876, -0.3230172395706177, -0.291626513004303, -0.26023584604263306, -0.22884514927864075, -0.19745445251464844, -0.16606375575065613, -0.13467305898666382, -0.1032823771238327, -0.0718916803598404, -0.040500983595848083, -0.009110301733016968, 0.022280395030975342, 0.05367109179496765, 0.08506178855895996, 0.11645247787237167, 0.1478431671857834, 0.1792338639497757, 0.210624560713768, 0.24201524257659912, 0.27340593934059143, 0.3047966957092285, 0.3361873924732208, 0.36757808923721313, 0.39896875619888306, 0.43035948276519775, 0.4617501497268677, 0.49314084649086, 0.5245315432548523, 0.555922269821167, 0.5873129367828369, 0.6187036633491516, 0.6500943303108215, 0.6814850568771362, 0.7128757238388062, 0.7442663908004761, 0.7756571173667908, 0.8070477843284607, 0.8384384512901306, 0.8698291778564453, 0.9012198448181152, 0.9326105713844299, 0.9640012383460999, 0.9953919649124146, 1.0267826318740845, 1.0581732988357544, 1.0895639657974243, 1.1209546327590942, 1.1523454189300537, 1.1837360858917236, 1.2151267528533936, 1.2465174198150635, 1.2779080867767334, 1.3092988729476929]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 10.0, 9.0, 4.0, 2.0, 13.0, 9.0, 14.0, 24.0, 25.0, 28.0, 29.0, 32.0, 33.0, 36.0, 33.0, 47.0, 49.0, 44.0, 52.0, 58.0, 56.0, 46.0, 47.0, 43.0, 27.0, 44.0, 26.0, 39.0, 25.0, 19.0, 19.0, 22.0, 9.0, 3.0, 8.0, 8.0, 2.0, 3.0, 4.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.568087100982666, -0.5508230924606323, -0.5335590839385986, -0.5162950754165649, -0.49903109669685364, -0.48176708817481995, -0.46450310945510864, -0.44723910093307495, -0.42997509241104126, -0.41271108388900757, -0.3954470753669739, -0.3781830966472626, -0.3609190881252289, -0.3436550796031952, -0.3263911008834839, -0.3091270923614502, -0.2918630838394165, -0.2745990753173828, -0.2573350667953491, -0.24007108807563782, -0.22280707955360413, -0.20554307103157043, -0.18827907741069794, -0.17101508378982544, -0.15375107526779175, -0.13648706674575806, -0.11922307312488556, -0.10195907205343246, -0.08469507098197937, -0.06743106991052628, -0.05016706883907318, -0.03290306776762009, -0.015639126300811768, 0.001624874770641327, 0.01888887584209442, 0.036152876913547516, 0.05341687798500061, 0.0706808790564537, 0.0879448801279068, 0.1052088811993599, 0.12247288227081299, 0.13973689079284668, 0.15700088441371918, 0.17426487803459167, 0.19152888655662537, 0.20879289507865906, 0.22605688869953156, 0.24332088232040405, 0.26058489084243774, 0.27784889936447144, 0.2951129078865051, 0.31237688660621643, 0.3296408951282501, 0.3469049036502838, 0.3641688823699951, 0.3814328908920288, 0.3986968994140625, 0.4159609079360962, 0.4332249164581299, 0.4504888951778412, 0.4677529036998749, 0.48501691222190857, 0.5022808909416199, 0.5195448994636536, 0.5368089079856873]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 4.0, 10.0, 13.0, 11.0, 21.0, 24.0, 38.0, 36.0, 48.0, 96.0, 130.0, 233.0, 438.0, 908.0, 2320.0, 6577.0, 20707.0, 72908.0, 267041.0, 447933.0, 163474.0, 44807.0, 13212.0, 4342.0, 1600.0, 699.0, 337.0, 183.0, 116.0, 65.0, 47.0, 41.0, 28.0, 21.0, 17.0, 16.0, 8.0, 5.0, 11.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1070556640625, -0.10393524169921875, -0.1008148193359375, -0.09769439697265625, -0.094573974609375, -0.09145355224609375, -0.0883331298828125, -0.08521270751953125, -0.08209228515625, -0.07897186279296875, -0.0758514404296875, -0.07273101806640625, -0.069610595703125, -0.06649017333984375, -0.0633697509765625, -0.06024932861328125, -0.05712890625, -0.05400848388671875, -0.0508880615234375, -0.04776763916015625, -0.044647216796875, -0.04152679443359375, -0.0384063720703125, -0.03528594970703125, -0.03216552734375, -0.02904510498046875, -0.0259246826171875, -0.02280426025390625, -0.019683837890625, -0.01656341552734375, -0.0134429931640625, -0.01032257080078125, -0.0072021484375, -0.00408172607421875, -0.0009613037109375, 0.00215911865234375, 0.005279541015625, 0.00839996337890625, 0.0115203857421875, 0.01464080810546875, 0.01776123046875, 0.02088165283203125, 0.0240020751953125, 0.02712249755859375, 0.030242919921875, 0.03336334228515625, 0.0364837646484375, 0.03960418701171875, 0.042724609375, 0.04584503173828125, 0.0489654541015625, 0.05208587646484375, 0.055206298828125, 0.05832672119140625, 0.0614471435546875, 0.06456756591796875, 0.06768798828125, 0.07080841064453125, 0.0739288330078125, 0.07704925537109375, 0.080169677734375, 0.08329010009765625, 0.0864105224609375, 0.08953094482421875, 0.0926513671875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 9.0, 6.0, 10.0, 17.0, 22.0, 25.0, 26.0, 40.0, 42.0, 48.0, 52.0, 56.0, 84.0, 60.0, 82.0, 66.0, 64.0, 50.0, 55.0, 36.0, 48.0, 27.0, 19.0, 21.0, 14.0, 5.0, 7.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.487060546875, -0.4712333679199219, -0.45540618896484375, -0.4395790100097656, -0.4237518310546875, -0.4079246520996094, -0.39209747314453125, -0.3762702941894531, -0.360443115234375, -0.3446159362792969, -0.32878875732421875, -0.3129615783691406, -0.2971343994140625, -0.2813072204589844, -0.26548004150390625, -0.24965286254882812, -0.23382568359375, -0.21799850463867188, -0.20217132568359375, -0.18634414672851562, -0.1705169677734375, -0.15468978881835938, -0.13886260986328125, -0.12303543090820312, -0.107208251953125, -0.09138107299804688, -0.07555389404296875, -0.059726715087890625, -0.0438995361328125, -0.028072357177734375, -0.01224517822265625, 0.003582000732421875, 0.0194091796875, 0.035236358642578125, 0.05106353759765625, 0.06689071655273438, 0.0827178955078125, 0.09854507446289062, 0.11437225341796875, 0.13019943237304688, 0.146026611328125, 0.16185379028320312, 0.17768096923828125, 0.19350814819335938, 0.2093353271484375, 0.22516250610351562, 0.24098968505859375, 0.2568168640136719, 0.27264404296875, 0.2884712219238281, 0.30429840087890625, 0.3201255798339844, 0.3359527587890625, 0.3517799377441406, 0.36760711669921875, 0.3834342956542969, 0.399261474609375, 0.4150886535644531, 0.43091583251953125, 0.4467430114746094, 0.4625701904296875, 0.4783973693847656, 0.49422454833984375, 0.5100517272949219, 0.52587890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 7.0, 10.0, 5.0, 14.0, 30.0, 33.0, 46.0, 81.0, 80.0, 139.0, 213.0, 336.0, 541.0, 1063.0, 2049.0, 4406.0, 9798.0, 23652.0, 60011.0, 155003.0, 325482.0, 274212.0, 115579.0, 43979.0, 17432.0, 7327.0, 3221.0, 1558.0, 864.0, 472.0, 308.0, 187.0, 133.0, 75.0, 58.0, 44.0, 30.0, 15.0, 16.0, 13.0, 10.0, 5.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0594482421875, -0.057312965393066406, -0.05517768859863281, -0.05304241180419922, -0.050907135009765625, -0.04877185821533203, -0.04663658142089844, -0.044501304626464844, -0.04236602783203125, -0.040230751037597656, -0.03809547424316406, -0.03596019744873047, -0.033824920654296875, -0.03168964385986328, -0.029554367065429688, -0.027419090270996094, -0.0252838134765625, -0.023148536682128906, -0.021013259887695312, -0.01887798309326172, -0.016742706298828125, -0.014607429504394531, -0.012472152709960938, -0.010336875915527344, -0.00820159912109375, -0.006066322326660156, -0.0039310455322265625, -0.0017957687377929688, 0.000339508056640625, 0.0024747848510742188, 0.0046100616455078125, 0.006745338439941406, 0.008880615234375, 0.011015892028808594, 0.013151168823242188, 0.015286445617675781, 0.017421722412109375, 0.01955699920654297, 0.021692276000976562, 0.023827552795410156, 0.02596282958984375, 0.028098106384277344, 0.030233383178710938, 0.03236865997314453, 0.034503936767578125, 0.03663921356201172, 0.03877449035644531, 0.040909767150878906, 0.0430450439453125, 0.045180320739746094, 0.04731559753417969, 0.04945087432861328, 0.051586151123046875, 0.05372142791748047, 0.05585670471191406, 0.057991981506347656, 0.06012725830078125, 0.062262535095214844, 0.06439781188964844, 0.06653308868408203, 0.06866836547851562, 0.07080364227294922, 0.07293891906738281, 0.0750741958618164, 0.07720947265625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 5.0, 2.0, 9.0, 9.0, 9.0, 12.0, 15.0, 15.0, 18.0, 19.0, 24.0, 29.0, 35.0, 56.0, 45.0, 43.0, 44.0, 55.0, 57.0, 64.0, 62.0, 61.0, 45.0, 40.0, 43.0, 36.0, 27.0, 26.0, 19.0, 16.0, 12.0, 21.0, 6.0, 12.0, 7.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7216796875, -0.6975173950195312, -0.6733551025390625, -0.6491928100585938, -0.625030517578125, -0.6008682250976562, -0.5767059326171875, -0.5525436401367188, -0.52838134765625, -0.5042190551757812, -0.4800567626953125, -0.45589447021484375, -0.431732177734375, -0.40756988525390625, -0.3834075927734375, -0.35924530029296875, -0.3350830078125, -0.31092071533203125, -0.2867584228515625, -0.26259613037109375, -0.238433837890625, -0.21427154541015625, -0.1901092529296875, -0.16594696044921875, -0.14178466796875, -0.11762237548828125, -0.0934600830078125, -0.06929779052734375, -0.045135498046875, -0.02097320556640625, 0.0031890869140625, 0.02735137939453125, 0.051513671875, 0.07567596435546875, 0.0998382568359375, 0.12400054931640625, 0.148162841796875, 0.17232513427734375, 0.1964874267578125, 0.22064971923828125, 0.24481201171875, 0.26897430419921875, 0.2931365966796875, 0.31729888916015625, 0.341461181640625, 0.36562347412109375, 0.3897857666015625, 0.41394805908203125, 0.4381103515625, 0.46227264404296875, 0.4864349365234375, 0.5105972290039062, 0.534759521484375, 0.5589218139648438, 0.5830841064453125, 0.6072463989257812, 0.63140869140625, 0.6555709838867188, 0.6797332763671875, 0.7038955688476562, 0.728057861328125, 0.7522201538085938, 0.7763824462890625, 0.8005447387695312, 0.82470703125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 9.0, 11.0, 14.0, 12.0, 26.0, 26.0, 52.0, 74.0, 127.0, 204.0, 354.0, 638.0, 1124.0, 2229.0, 5134.0, 14471.0, 52213.0, 239600.0, 502744.0, 171103.0, 38398.0, 11466.0, 4261.0, 1912.0, 1021.0, 545.0, 278.0, 182.0, 116.0, 62.0, 43.0, 27.0, 21.0, 17.0, 15.0, 7.0, 7.0, 7.0, 5.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0240631103515625, -0.023184537887573242, -0.022305965423583984, -0.021427392959594727, -0.02054882049560547, -0.01967024803161621, -0.018791675567626953, -0.017913103103637695, -0.017034530639648438, -0.01615595817565918, -0.015277385711669922, -0.014398813247680664, -0.013520240783691406, -0.012641668319702148, -0.01176309585571289, -0.010884523391723633, -0.010005950927734375, -0.009127378463745117, -0.00824880599975586, -0.0073702335357666016, -0.006491661071777344, -0.005613088607788086, -0.004734516143798828, -0.0038559436798095703, -0.0029773712158203125, -0.0020987987518310547, -0.0012202262878417969, -0.00034165382385253906, 0.0005369186401367188, 0.0014154911041259766, 0.0022940635681152344, 0.003172636032104492, 0.00405120849609375, 0.004929780960083008, 0.005808353424072266, 0.0066869258880615234, 0.007565498352050781, 0.008444070816040039, 0.009322643280029297, 0.010201215744018555, 0.011079788208007812, 0.01195836067199707, 0.012836933135986328, 0.013715505599975586, 0.014594078063964844, 0.015472650527954102, 0.01635122299194336, 0.017229795455932617, 0.018108367919921875, 0.018986940383911133, 0.01986551284790039, 0.02074408531188965, 0.021622657775878906, 0.022501230239868164, 0.023379802703857422, 0.02425837516784668, 0.025136947631835938, 0.026015520095825195, 0.026894092559814453, 0.02777266502380371, 0.02865123748779297, 0.029529809951782227, 0.030408382415771484, 0.03128695487976074, 0.03216552734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 9.0, 16.0, 12.0, 23.0, 24.0, 68.0, 61.0, 79.0, 106.0, 99.0, 115.0, 103.0, 82.0, 71.0, 28.0, 30.0, 18.0, 14.0, 11.0, 8.0, 4.0, 5.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.704692840576172e-05, -1.6475096344947815e-05, -1.590326428413391e-05, -1.5331432223320007e-05, -1.4759600162506104e-05, -1.41877681016922e-05, -1.3615936040878296e-05, -1.3044103980064392e-05, -1.2472271919250488e-05, -1.1900439858436584e-05, -1.132860779762268e-05, -1.0756775736808777e-05, -1.0184943675994873e-05, -9.61311161518097e-06, -9.041279554367065e-06, -8.469447493553162e-06, -7.897615432739258e-06, -7.325783371925354e-06, -6.75395131111145e-06, -6.182119250297546e-06, -5.610287189483643e-06, -5.038455128669739e-06, -4.466623067855835e-06, -3.894791007041931e-06, -3.3229589462280273e-06, -2.7511268854141235e-06, -2.1792948246002197e-06, -1.607462763786316e-06, -1.0356307029724121e-06, -4.637986421585083e-07, 1.0803341865539551e-07, 6.798654794692993e-07, 1.2516975402832031e-06, 1.823529601097107e-06, 2.3953616619110107e-06, 2.9671937227249146e-06, 3.5390257835388184e-06, 4.110857844352722e-06, 4.682689905166626e-06, 5.25452196598053e-06, 5.826354026794434e-06, 6.398186087608337e-06, 6.970018148422241e-06, 7.541850209236145e-06, 8.113682270050049e-06, 8.685514330863953e-06, 9.257346391677856e-06, 9.82917845249176e-06, 1.0401010513305664e-05, 1.0972842574119568e-05, 1.1544674634933472e-05, 1.2116506695747375e-05, 1.268833875656128e-05, 1.3260170817375183e-05, 1.3832002878189087e-05, 1.440383493900299e-05, 1.4975666999816895e-05, 1.55474990606308e-05, 1.6119331121444702e-05, 1.6691163182258606e-05, 1.726299524307251e-05, 1.7834827303886414e-05, 1.8406659364700317e-05, 1.897849142551422e-05, 1.9550323486328125e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 2.0, 6.0, 9.0, 7.0, 9.0, 15.0, 27.0, 26.0, 46.0, 72.0, 101.0, 150.0, 175.0, 330.0, 516.0, 891.0, 1675.0, 3216.0, 6713.0, 15010.0, 36160.0, 89049.0, 205464.0, 311340.0, 214908.0, 93805.0, 38272.0, 15955.0, 7151.0, 3350.0, 1698.0, 886.0, 520.0, 301.0, 222.0, 134.0, 97.0, 68.0, 39.0, 38.0, 24.0, 21.0, 15.0, 7.0, 12.0, 6.0, 7.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0190582275390625, -0.018489837646484375, -0.01792144775390625, -0.017353057861328125, -0.01678466796875, -0.016216278076171875, -0.01564788818359375, -0.015079498291015625, -0.0145111083984375, -0.013942718505859375, -0.01337432861328125, -0.012805938720703125, -0.012237548828125, -0.011669158935546875, -0.01110076904296875, -0.010532379150390625, -0.0099639892578125, -0.009395599365234375, -0.00882720947265625, -0.008258819580078125, -0.0076904296875, -0.007122039794921875, -0.00655364990234375, -0.005985260009765625, -0.0054168701171875, -0.004848480224609375, -0.00428009033203125, -0.003711700439453125, -0.003143310546875, -0.002574920654296875, -0.00200653076171875, -0.001438140869140625, -0.0008697509765625, -0.000301361083984375, 0.00026702880859375, 0.000835418701171875, 0.00140380859375, 0.001972198486328125, 0.00254058837890625, 0.003108978271484375, 0.0036773681640625, 0.004245758056640625, 0.00481414794921875, 0.005382537841796875, 0.005950927734375, 0.006519317626953125, 0.00708770751953125, 0.007656097412109375, 0.0082244873046875, 0.008792877197265625, 0.00936126708984375, 0.009929656982421875, 0.010498046875, 0.011066436767578125, 0.01163482666015625, 0.012203216552734375, 0.0127716064453125, 0.013339996337890625, 0.01390838623046875, 0.014476776123046875, 0.015045166015625, 0.015613555908203125, 0.01618194580078125, 0.016750335693359375, 0.0173187255859375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 3.0, 4.0, 13.0, 6.0, 9.0, 8.0, 12.0, 11.0, 17.0, 15.0, 14.0, 21.0, 18.0, 33.0, 29.0, 33.0, 38.0, 38.0, 52.0, 60.0, 43.0, 41.0, 51.0, 46.0, 37.0, 37.0, 32.0, 29.0, 37.0, 34.0, 24.0, 25.0, 24.0, 16.0, 13.0, 14.0, 11.0, 12.0, 12.0, 8.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.0054473876953125, -0.005285143852233887, -0.0051229000091552734, -0.00496065616607666, -0.004798412322998047, -0.004636168479919434, -0.00447392463684082, -0.004311680793762207, -0.004149436950683594, -0.0039871931076049805, -0.003824949264526367, -0.003662705421447754, -0.0035004615783691406, -0.0033382177352905273, -0.003175973892211914, -0.0030137300491333008, -0.0028514862060546875, -0.0026892423629760742, -0.002526998519897461, -0.0023647546768188477, -0.0022025108337402344, -0.002040266990661621, -0.0018780231475830078, -0.0017157793045043945, -0.0015535354614257812, -0.001391291618347168, -0.0012290477752685547, -0.0010668039321899414, -0.0009045600891113281, -0.0007423162460327148, -0.0005800724029541016, -0.0004178285598754883, -0.000255584716796875, -9.334087371826172e-05, 6.890296936035156e-05, 0.00023114681243896484, 0.0003933906555175781, 0.0005556344985961914, 0.0007178783416748047, 0.000880122184753418, 0.0010423660278320312, 0.0012046098709106445, 0.0013668537139892578, 0.001529097557067871, 0.0016913414001464844, 0.0018535852432250977, 0.002015829086303711, 0.0021780729293823242, 0.0023403167724609375, 0.0025025606155395508, 0.002664804458618164, 0.0028270483016967773, 0.0029892921447753906, 0.003151535987854004, 0.003313779830932617, 0.0034760236740112305, 0.0036382675170898438, 0.003800511360168457, 0.00396275520324707, 0.004124999046325684, 0.004287242889404297, 0.00444948673248291, 0.0046117305755615234, 0.004773974418640137, 0.00493621826171875]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 30.0, 114.0, 258.0, 363.0, 163.0, 47.0, 20.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8652573227882385, -0.8086316585540771, -0.7520060539245605, -0.6953803896903992, -0.6387547254562378, -0.5821291208267212, -0.5255034565925598, -0.4688778221607208, -0.41225218772888184, -0.35562655329704285, -0.29900091886520386, -0.24237525463104248, -0.1857496201992035, -0.1291239857673645, -0.07249832153320312, -0.015872687101364136, 0.040752947330474854, 0.09737858921289444, 0.15400423109531403, 0.2106298804283142, 0.2672555148601532, 0.3238811492919922, 0.38050681352615356, 0.43713244795799255, 0.49375808238983154, 0.5503837466239929, 0.6070093512535095, 0.6636350154876709, 0.7202606201171875, 0.7768862843513489, 0.8335119485855103, 0.8901375532150269, 0.946763277053833, 1.0033888816833496, 1.0600146055221558, 1.1166402101516724, 1.173265814781189, 1.2298915386199951, 1.2865171432495117, 1.3431427478790283, 1.399768352508545, 1.4563939571380615, 1.5130196809768677, 1.5696452856063843, 1.6262708902359009, 1.682896614074707, 1.7395222187042236, 1.7961478233337402, 1.8527735471725464, 1.909399151802063, 1.9660248756408691, 2.0226504802703857, 2.0792760848999023, 2.135901689529419, 2.1925272941589355, 2.2491531372070312, 2.305778741836548, 2.3624043464660645, 2.419029951095581, 2.4756555557250977, 2.5322813987731934, 2.58890700340271, 2.6455326080322266, 2.702158212661743, 2.7587838172912598]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 5.0, 4.0, 3.0, 9.0, 8.0, 9.0, 14.0, 18.0, 33.0, 34.0, 33.0, 46.0, 42.0, 51.0, 68.0, 61.0, 72.0, 79.0, 61.0, 71.0, 47.0, 41.0, 54.0, 41.0, 21.0, 28.0, 22.0, 7.0, 6.0, 10.0, 5.0, 2.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.501637876033783, -0.4867832660675049, -0.4719286859035492, -0.4570740759372711, -0.44221946597099304, -0.42736488580703735, -0.4125102758407593, -0.3976556658744812, -0.3828010559082031, -0.36794644594192505, -0.35309186577796936, -0.3382372558116913, -0.3233826458454132, -0.3085280656814575, -0.29367345571517944, -0.27881884574890137, -0.2639642655849457, -0.2491096705198288, -0.23425506055355072, -0.21940046548843384, -0.20454585552215576, -0.18969126045703888, -0.174836665391922, -0.15998205542564392, -0.14512746036052704, -0.13027286529541016, -0.11541825532913208, -0.1005636602640152, -0.08570905774831772, -0.07085445523262024, -0.05599986016750336, -0.04114525765180588, -0.0262906551361084, -0.011436054483056068, 0.0034185461699962616, 0.018273144960403442, 0.03312774747610092, 0.0479823499917984, 0.06283694505691528, 0.07769154757261276, 0.09254615008831024, 0.10740075260400772, 0.1222553551197052, 0.13710995018482208, 0.15196454524993896, 0.16681915521621704, 0.18167375028133392, 0.1965283453464508, 0.21138295531272888, 0.22623755037784576, 0.24109216034412384, 0.2559467554092407, 0.2708013653755188, 0.2856559753417969, 0.30051055550575256, 0.31536516547203064, 0.33021974563598633, 0.3450743556022644, 0.3599289357662201, 0.37478354573249817, 0.38963815569877625, 0.40449273586273193, 0.41934734582901, 0.4342019557952881, 0.44905656576156616]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 4.0, 4.0, 21.0, 36.0, 34.0, 56.0, 79.0, 139.0, 222.0, 367.0, 648.0, 1133.0, 2248.0, 5011.0, 12351.0, 36456.0, 144824.0, 535044.0, 229319.0, 52051.0, 16186.0, 6236.0, 2801.0, 1372.0, 753.0, 428.0, 235.0, 160.0, 95.0, 71.0, 38.0, 28.0, 31.0, 14.0, 12.0, 13.0, 5.0, 5.0, 4.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.32470703125, -0.3133697509765625, -0.302032470703125, -0.2906951904296875, -0.27935791015625, -0.2680206298828125, -0.256683349609375, -0.2453460693359375, -0.2340087890625, -0.2226715087890625, -0.211334228515625, -0.1999969482421875, -0.18865966796875, -0.1773223876953125, -0.165985107421875, -0.1546478271484375, -0.143310546875, -0.1319732666015625, -0.120635986328125, -0.1092987060546875, -0.09796142578125, -0.0866241455078125, -0.075286865234375, -0.0639495849609375, -0.0526123046875, -0.0412750244140625, -0.029937744140625, -0.0186004638671875, -0.00726318359375, 0.0040740966796875, 0.015411376953125, 0.0267486572265625, 0.0380859375, 0.0494232177734375, 0.060760498046875, 0.0720977783203125, 0.08343505859375, 0.0947723388671875, 0.106109619140625, 0.1174468994140625, 0.1287841796875, 0.1401214599609375, 0.151458740234375, 0.1627960205078125, 0.17413330078125, 0.1854705810546875, 0.196807861328125, 0.2081451416015625, 0.219482421875, 0.2308197021484375, 0.242156982421875, 0.2534942626953125, 0.26483154296875, 0.2761688232421875, 0.287506103515625, 0.2988433837890625, 0.3101806640625, 0.3215179443359375, 0.332855224609375, 0.3441925048828125, 0.35552978515625, 0.3668670654296875, 0.378204345703125, 0.3895416259765625, 0.40087890625]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 6.0, 5.0, 8.0, 5.0, 11.0, 17.0, 16.0, 25.0, 22.0, 22.0, 28.0, 26.0, 40.0, 55.0, 46.0, 48.0, 58.0, 51.0, 50.0, 50.0, 55.0, 58.0, 46.0, 49.0, 46.0, 25.0, 27.0, 21.0, 20.0, 15.0, 16.0, 7.0, 4.0, 5.0, 6.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.90380859375, -0.8793792724609375, -0.854949951171875, -0.8305206298828125, -0.80609130859375, -0.7816619873046875, -0.757232666015625, -0.7328033447265625, -0.7083740234375, -0.6839447021484375, -0.659515380859375, -0.6350860595703125, -0.61065673828125, -0.5862274169921875, -0.561798095703125, -0.5373687744140625, -0.512939453125, -0.4885101318359375, -0.464080810546875, -0.4396514892578125, -0.41522216796875, -0.3907928466796875, -0.366363525390625, -0.3419342041015625, -0.3175048828125, -0.2930755615234375, -0.268646240234375, -0.2442169189453125, -0.21978759765625, -0.1953582763671875, -0.170928955078125, -0.1464996337890625, -0.1220703125, -0.0976409912109375, -0.073211669921875, -0.0487823486328125, -0.02435302734375, 7.62939453125e-05, 0.024505615234375, 0.0489349365234375, 0.0733642578125, 0.0977935791015625, 0.122222900390625, 0.1466522216796875, 0.17108154296875, 0.1955108642578125, 0.219940185546875, 0.2443695068359375, 0.268798828125, 0.2932281494140625, 0.317657470703125, 0.3420867919921875, 0.36651611328125, 0.3909454345703125, 0.415374755859375, 0.4398040771484375, 0.4642333984375, 0.4886627197265625, 0.513092041015625, 0.5375213623046875, 0.56195068359375, 0.5863800048828125, 0.610809326171875, 0.6352386474609375, 0.65966796875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 8.0, 3.0, 5.0, 11.0, 12.0, 16.0, 19.0, 29.0, 46.0, 57.0, 91.0, 136.0, 278.0, 586.0, 1762.0, 7364.0, 77331.0, 869601.0, 80430.0, 7607.0, 1796.0, 636.0, 260.0, 137.0, 100.0, 64.0, 51.0, 28.0, 16.0, 16.0, 20.0, 6.0, 9.0, 4.0, 5.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.7783203125, -0.7536163330078125, -0.728912353515625, -0.7042083740234375, -0.67950439453125, -0.6548004150390625, -0.630096435546875, -0.6053924560546875, -0.5806884765625, -0.5559844970703125, -0.531280517578125, -0.5065765380859375, -0.48187255859375, -0.4571685791015625, -0.432464599609375, -0.4077606201171875, -0.383056640625, -0.3583526611328125, -0.333648681640625, -0.3089447021484375, -0.28424072265625, -0.2595367431640625, -0.234832763671875, -0.2101287841796875, -0.1854248046875, -0.1607208251953125, -0.136016845703125, -0.1113128662109375, -0.08660888671875, -0.0619049072265625, -0.037200927734375, -0.0124969482421875, 0.01220703125, 0.0369110107421875, 0.061614990234375, 0.0863189697265625, 0.11102294921875, 0.1357269287109375, 0.160430908203125, 0.1851348876953125, 0.2098388671875, 0.2345428466796875, 0.259246826171875, 0.2839508056640625, 0.30865478515625, 0.3333587646484375, 0.358062744140625, 0.3827667236328125, 0.407470703125, 0.4321746826171875, 0.456878662109375, 0.4815826416015625, 0.50628662109375, 0.5309906005859375, 0.555694580078125, 0.5803985595703125, 0.6051025390625, 0.6298065185546875, 0.654510498046875, 0.6792144775390625, 0.70391845703125, 0.7286224365234375, 0.753326416015625, 0.7780303955078125, 0.802734375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 0.0, 8.0, 6.0, 5.0, 6.0, 4.0, 8.0, 11.0, 15.0, 28.0, 25.0, 33.0, 41.0, 33.0, 37.0, 29.0, 53.0, 52.0, 47.0, 47.0, 57.0, 53.0, 58.0, 51.0, 50.0, 50.0, 19.0, 32.0, 21.0, 20.0, 21.0, 16.0, 16.0, 11.0, 11.0, 8.0, 8.0, 5.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.951171875, -0.9241790771484375, -0.897186279296875, -0.8701934814453125, -0.84320068359375, -0.8162078857421875, -0.789215087890625, -0.7622222900390625, -0.7352294921875, -0.7082366943359375, -0.681243896484375, -0.6542510986328125, -0.62725830078125, -0.6002655029296875, -0.573272705078125, -0.5462799072265625, -0.519287109375, -0.4922943115234375, -0.465301513671875, -0.4383087158203125, -0.41131591796875, -0.3843231201171875, -0.357330322265625, -0.3303375244140625, -0.3033447265625, -0.2763519287109375, -0.249359130859375, -0.2223663330078125, -0.19537353515625, -0.1683807373046875, -0.141387939453125, -0.1143951416015625, -0.08740234375, -0.0604095458984375, -0.033416748046875, -0.0064239501953125, 0.02056884765625, 0.0475616455078125, 0.074554443359375, 0.1015472412109375, 0.1285400390625, 0.1555328369140625, 0.182525634765625, 0.2095184326171875, 0.23651123046875, 0.2635040283203125, 0.290496826171875, 0.3174896240234375, 0.344482421875, 0.3714752197265625, 0.398468017578125, 0.4254608154296875, 0.45245361328125, 0.4794464111328125, 0.506439208984375, 0.5334320068359375, 0.5604248046875, 0.5874176025390625, 0.614410400390625, 0.6414031982421875, 0.66839599609375, 0.6953887939453125, 0.722381591796875, 0.7493743896484375, 0.7763671875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 5.0, 4.0, 7.0, 4.0, 11.0, 7.0, 27.0, 25.0, 74.0, 126.0, 284.0, 813.0, 2638.0, 13921.0, 761171.0, 257954.0, 8494.0, 1906.0, 610.0, 224.0, 116.0, 61.0, 33.0, 13.0, 13.0, 6.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.389892578125, -0.37726593017578125, -0.3646392822265625, -0.35201263427734375, -0.339385986328125, -0.32675933837890625, -0.3141326904296875, -0.30150604248046875, -0.28887939453125, -0.27625274658203125, -0.2636260986328125, -0.25099945068359375, -0.238372802734375, -0.22574615478515625, -0.2131195068359375, -0.20049285888671875, -0.1878662109375, -0.17523956298828125, -0.1626129150390625, -0.14998626708984375, -0.137359619140625, -0.12473297119140625, -0.1121063232421875, -0.09947967529296875, -0.08685302734375, -0.07422637939453125, -0.0615997314453125, -0.04897308349609375, -0.036346435546875, -0.02371978759765625, -0.0110931396484375, 0.00153350830078125, 0.01416015625, 0.02678680419921875, 0.0394134521484375, 0.05204010009765625, 0.064666748046875, 0.07729339599609375, 0.0899200439453125, 0.10254669189453125, 0.11517333984375, 0.12779998779296875, 0.1404266357421875, 0.15305328369140625, 0.165679931640625, 0.17830657958984375, 0.1909332275390625, 0.20355987548828125, 0.2161865234375, 0.22881317138671875, 0.2414398193359375, 0.25406646728515625, 0.266693115234375, 0.27931976318359375, 0.2919464111328125, 0.30457305908203125, 0.31719970703125, 0.32982635498046875, 0.3424530029296875, 0.35507965087890625, 0.367706298828125, 0.38033294677734375, 0.3929595947265625, 0.40558624267578125, 0.418212890625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 3.0, 6.0, 12.0, 15.0, 34.0, 51.0, 64.0, 115.0, 173.0, 172.0, 103.0, 98.0, 60.0, 41.0, 17.0, 13.0, 7.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.369020462036133e-05, -4.254840314388275e-05, -4.1406601667404175e-05, -4.02648001909256e-05, -3.912299871444702e-05, -3.7981197237968445e-05, -3.683939576148987e-05, -3.569759428501129e-05, -3.4555792808532715e-05, -3.341399133205414e-05, -3.227218985557556e-05, -3.1130388379096985e-05, -2.9988586902618408e-05, -2.884678542613983e-05, -2.7704983949661255e-05, -2.6563182473182678e-05, -2.54213809967041e-05, -2.4279579520225525e-05, -2.3137778043746948e-05, -2.199597656726837e-05, -2.0854175090789795e-05, -1.9712373614311218e-05, -1.857057213783264e-05, -1.7428770661354065e-05, -1.6286969184875488e-05, -1.5145167708396912e-05, -1.4003366231918335e-05, -1.2861564755439758e-05, -1.1719763278961182e-05, -1.0577961802482605e-05, -9.436160326004028e-06, -8.294358849525452e-06, -7.152557373046875e-06, -6.010755896568298e-06, -4.868954420089722e-06, -3.727152943611145e-06, -2.5853514671325684e-06, -1.4435499906539917e-06, -3.0174851417541504e-07, 8.400529623031616e-07, 1.9818544387817383e-06, 3.123655915260315e-06, 4.265457391738892e-06, 5.407258868217468e-06, 6.549060344696045e-06, 7.690861821174622e-06, 8.832663297653198e-06, 9.974464774131775e-06, 1.1116266250610352e-05, 1.2258067727088928e-05, 1.3399869203567505e-05, 1.4541670680046082e-05, 1.5683472156524658e-05, 1.6825273633003235e-05, 1.796707510948181e-05, 1.9108876585960388e-05, 2.0250678062438965e-05, 2.139247953891754e-05, 2.2534281015396118e-05, 2.3676082491874695e-05, 2.481788396835327e-05, 2.5959685444831848e-05, 2.7101486921310425e-05, 2.8243288397789e-05, 2.9385089874267578e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 5.0, 10.0, 14.0, 12.0, 19.0, 30.0, 61.0, 130.0, 279.0, 808.0, 2836.0, 16044.0, 673291.0, 340279.0, 11238.0, 2335.0, 652.0, 244.0, 112.0, 50.0, 33.0, 15.0, 8.0, 12.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.35498046875, -0.3441963195800781, -0.33341217041015625, -0.3226280212402344, -0.3118438720703125, -0.3010597229003906, -0.29027557373046875, -0.2794914245605469, -0.268707275390625, -0.2579231262207031, -0.24713897705078125, -0.23635482788085938, -0.2255706787109375, -0.21478652954101562, -0.20400238037109375, -0.19321823120117188, -0.18243408203125, -0.17164993286132812, -0.16086578369140625, -0.15008163452148438, -0.1392974853515625, -0.12851333618164062, -0.11772918701171875, -0.10694503784179688, -0.096160888671875, -0.08537673950195312, -0.07459259033203125, -0.06380844116210938, -0.0530242919921875, -0.042240142822265625, -0.03145599365234375, -0.020671844482421875, -0.0098876953125, 0.000896453857421875, 0.01168060302734375, 0.022464752197265625, 0.0332489013671875, 0.044033050537109375, 0.05481719970703125, 0.06560134887695312, 0.076385498046875, 0.08716964721679688, 0.09795379638671875, 0.10873794555664062, 0.1195220947265625, 0.13030624389648438, 0.14109039306640625, 0.15187454223632812, 0.16265869140625, 0.17344284057617188, 0.18422698974609375, 0.19501113891601562, 0.2057952880859375, 0.21657943725585938, 0.22736358642578125, 0.23814773559570312, 0.248931884765625, 0.2597160339355469, 0.27050018310546875, 0.2812843322753906, 0.2920684814453125, 0.3028526306152344, 0.31363677978515625, 0.3244209289550781, 0.335205078125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 3.0, 13.0, 20.0, 28.0, 46.0, 42.0, 48.0, 91.0, 95.0, 113.0, 134.0, 82.0, 66.0, 58.0, 38.0, 22.0, 25.0, 21.0, 5.0, 6.0, 9.0, 2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0809326171875, -0.0784749984741211, -0.07601737976074219, -0.07355976104736328, -0.07110214233398438, -0.06864452362060547, -0.06618690490722656, -0.06372928619384766, -0.06127166748046875, -0.058814048767089844, -0.05635643005371094, -0.05389881134033203, -0.051441192626953125, -0.04898357391357422, -0.04652595520019531, -0.044068336486816406, -0.0416107177734375, -0.039153099060058594, -0.03669548034667969, -0.03423786163330078, -0.031780242919921875, -0.02932262420654297, -0.026865005493164062, -0.024407386779785156, -0.02194976806640625, -0.019492149353027344, -0.017034530639648438, -0.014576911926269531, -0.012119293212890625, -0.009661674499511719, -0.0072040557861328125, -0.004746437072753906, -0.002288818359375, 0.00016880035400390625, 0.0026264190673828125, 0.005084037780761719, 0.007541656494140625, 0.009999275207519531, 0.012456893920898438, 0.014914512634277344, 0.01737213134765625, 0.019829750061035156, 0.022287368774414062, 0.02474498748779297, 0.027202606201171875, 0.02966022491455078, 0.03211784362792969, 0.034575462341308594, 0.0370330810546875, 0.039490699768066406, 0.04194831848144531, 0.04440593719482422, 0.046863555908203125, 0.04932117462158203, 0.05177879333496094, 0.054236412048339844, 0.05669403076171875, 0.059151649475097656, 0.06160926818847656, 0.06406688690185547, 0.06652450561523438, 0.06898212432861328, 0.07143974304199219, 0.0738973617553711, 0.07635498046875]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 1.0, 3.0, 14.0, 13.0, 36.0, 40.0, 78.0, 92.0, 154.0, 159.0, 146.0, 102.0, 55.0, 45.0, 24.0, 16.0, 8.0, 5.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5553004741668701, -1.5075490474700928, -1.459797739982605, -1.4120464324951172, -1.3642950057983398, -1.3165435791015625, -1.2687922716140747, -1.221040964126587, -1.1732895374298096, -1.1255381107330322, -1.0777868032455444, -1.0300354957580566, -0.9822840690612793, -0.9345327019691467, -0.8867813348770142, -0.8390299677848816, -0.791278600692749, -0.7435272336006165, -0.6957758665084839, -0.6480244994163513, -0.6002731323242188, -0.5525217652320862, -0.5047703981399536, -0.45701903104782104, -0.4092676639556885, -0.3615162968635559, -0.31376492977142334, -0.26601356267929077, -0.2182621955871582, -0.17051082849502563, -0.12275946140289307, -0.0750080943107605, -0.02725684642791748, 0.020494520664215088, 0.06824588775634766, 0.11599725484848022, 0.1637486219406128, 0.21149998903274536, 0.25925135612487793, 0.3070027232170105, 0.35475409030914307, 0.40250545740127563, 0.4502568244934082, 0.49800819158554077, 0.5457595586776733, 0.5935109257698059, 0.6412622928619385, 0.689013659954071, 0.7367650270462036, 0.7845163941383362, 0.8322677612304688, 0.8800191283226013, 0.9277704954147339, 0.9755218625068665, 1.023273229598999, 1.0710246562957764, 1.1187759637832642, 1.166527271270752, 1.2142786979675293, 1.2620301246643066, 1.3097814321517944, 1.3575327396392822, 1.4052841663360596, 1.453035593032837, 1.5007869005203247]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 7.0, 11.0, 15.0, 13.0, 13.0, 17.0, 18.0, 27.0, 16.0, 24.0, 18.0, 40.0, 37.0, 28.0, 35.0, 33.0, 27.0, 36.0, 32.0, 35.0, 30.0, 39.0, 40.0, 33.0, 33.0, 33.0, 36.0, 29.0, 31.0, 25.0, 23.0, 19.0, 24.0, 18.0, 21.0, 11.0, 14.0, 11.0, 9.0, 7.0, 6.0, 5.0, 4.0, 2.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0419141054153442, -1.0074104070663452, -0.972906768321991, -0.9384031295776367, -0.9038994312286377, -0.8693957328796387, -0.8348920941352844, -0.8003884553909302, -0.7658847570419312, -0.7313810586929321, -0.6968774199485779, -0.6623737812042236, -0.6278700828552246, -0.5933663845062256, -0.5588627457618713, -0.5243591070175171, -0.48985540866851807, -0.45535174012184143, -0.4208480715751648, -0.38634440302848816, -0.3518407344818115, -0.3173370659351349, -0.28283339738845825, -0.24832972884178162, -0.21382606029510498, -0.17932239174842834, -0.1448187232017517, -0.11031505465507507, -0.07581138610839844, -0.0413077175617218, -0.006804049015045166, 0.02769961953163147, 0.062203288078308105, 0.09670695662498474, 0.13121062517166138, 0.165714293718338, 0.20021796226501465, 0.23472163081169128, 0.2692252993583679, 0.30372896790504456, 0.3382326364517212, 0.3727363049983978, 0.40723997354507446, 0.4417436420917511, 0.47624731063842773, 0.5107510089874268, 0.545254647731781, 0.5797582864761353, 0.6142619848251343, 0.6487656831741333, 0.6832693219184875, 0.7177729606628418, 0.7522766590118408, 0.7867803573608398, 0.8212839961051941, 0.8557876348495483, 0.8902913331985474, 0.9247950315475464, 0.9592986702919006, 0.9938023090362549, 1.028306007385254, 1.062809705734253, 1.097313404083252, 1.1318169832229614, 1.1663206815719604]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 0.0, 3.0, 4.0, 2.0, 9.0, 8.0, 14.0, 18.0, 23.0, 34.0, 63.0, 94.0, 211.0, 439.0, 1064.0, 3054.0, 16104.0, 701109.0, 3405019.0, 56152.0, 7030.0, 2159.0, 873.0, 376.0, 174.0, 98.0, 46.0, 32.0, 22.0, 17.0, 10.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.4951171875, -1.4501190185546875, -1.405120849609375, -1.3601226806640625, -1.31512451171875, -1.2701263427734375, -1.225128173828125, -1.1801300048828125, -1.1351318359375, -1.0901336669921875, -1.045135498046875, -1.0001373291015625, -0.95513916015625, -0.9101409912109375, -0.865142822265625, -0.8201446533203125, -0.775146484375, -0.7301483154296875, -0.685150146484375, -0.6401519775390625, -0.59515380859375, -0.5501556396484375, -0.505157470703125, -0.4601593017578125, -0.4151611328125, -0.3701629638671875, -0.325164794921875, -0.2801666259765625, -0.23516845703125, -0.1901702880859375, -0.145172119140625, -0.1001739501953125, -0.05517578125, -0.0101776123046875, 0.034820556640625, 0.0798187255859375, 0.12481689453125, 0.1698150634765625, 0.214813232421875, 0.2598114013671875, 0.3048095703125, 0.3498077392578125, 0.394805908203125, 0.4398040771484375, 0.48480224609375, 0.5298004150390625, 0.574798583984375, 0.6197967529296875, 0.664794921875, 0.7097930908203125, 0.754791259765625, 0.7997894287109375, 0.84478759765625, 0.8897857666015625, 0.934783935546875, 0.9797821044921875, 1.0247802734375, 1.0697784423828125, 1.114776611328125, 1.1597747802734375, 1.20477294921875, 1.2497711181640625, 1.294769287109375, 1.3397674560546875, 1.384765625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 7.0, 13.0, 9.0, 15.0, 19.0, 29.0, 36.0, 25.0, 45.0, 63.0, 65.0, 57.0, 68.0, 77.0, 60.0, 64.0, 66.0, 65.0, 44.0, 44.0, 33.0, 26.0, 20.0, 10.0, 16.0, 4.0, 6.0, 2.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.70703125, -0.6886024475097656, -0.6701736450195312, -0.6517448425292969, -0.6333160400390625, -0.6148872375488281, -0.5964584350585938, -0.5780296325683594, -0.559600830078125, -0.5411720275878906, -0.5227432250976562, -0.5043144226074219, -0.4858856201171875, -0.4674568176269531, -0.44902801513671875, -0.4305992126464844, -0.41217041015625, -0.3937416076660156, -0.37531280517578125, -0.3568840026855469, -0.3384552001953125, -0.3200263977050781, -0.30159759521484375, -0.2831687927246094, -0.264739990234375, -0.24631118774414062, -0.22788238525390625, -0.20945358276367188, -0.1910247802734375, -0.17259597778320312, -0.15416717529296875, -0.13573837280273438, -0.1173095703125, -0.09888076782226562, -0.08045196533203125, -0.062023162841796875, -0.0435943603515625, -0.025165557861328125, -0.00673675537109375, 0.011692047119140625, 0.030120849609375, 0.048549652099609375, 0.06697845458984375, 0.08540725708007812, 0.1038360595703125, 0.12226486206054688, 0.14069366455078125, 0.15912246704101562, 0.17755126953125, 0.19598007202148438, 0.21440887451171875, 0.23283767700195312, 0.2512664794921875, 0.2696952819824219, 0.28812408447265625, 0.3065528869628906, 0.324981689453125, 0.3434104919433594, 0.36183929443359375, 0.3802680969238281, 0.3986968994140625, 0.4171257019042969, 0.43555450439453125, 0.4539833068847656, 0.472412109375]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 13.0, 22.0, 20.0, 20.0, 48.0, 61.0, 109.0, 157.0, 288.0, 461.0, 947.0, 1939.0, 5080.0, 18834.0, 150455.0, 3562274.0, 409711.0, 31588.0, 7244.0, 2504.0, 1093.0, 571.0, 327.0, 184.0, 105.0, 59.0, 45.0, 26.0, 21.0, 12.0, 6.0, 8.0, 11.0, 3.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.84521484375, -0.820098876953125, -0.79498291015625, -0.769866943359375, -0.7447509765625, -0.719635009765625, -0.69451904296875, -0.669403076171875, -0.644287109375, -0.619171142578125, -0.59405517578125, -0.568939208984375, -0.5438232421875, -0.518707275390625, -0.49359130859375, -0.468475341796875, -0.443359375, -0.418243408203125, -0.39312744140625, -0.368011474609375, -0.3428955078125, -0.317779541015625, -0.29266357421875, -0.267547607421875, -0.242431640625, -0.217315673828125, -0.19219970703125, -0.167083740234375, -0.1419677734375, -0.116851806640625, -0.09173583984375, -0.066619873046875, -0.04150390625, -0.016387939453125, 0.00872802734375, 0.033843994140625, 0.0589599609375, 0.084075927734375, 0.10919189453125, 0.134307861328125, 0.159423828125, 0.184539794921875, 0.20965576171875, 0.234771728515625, 0.2598876953125, 0.285003662109375, 0.31011962890625, 0.335235595703125, 0.3603515625, 0.385467529296875, 0.41058349609375, 0.435699462890625, 0.4608154296875, 0.485931396484375, 0.51104736328125, 0.536163330078125, 0.561279296875, 0.586395263671875, 0.61151123046875, 0.636627197265625, 0.6617431640625, 0.686859130859375, 0.71197509765625, 0.737091064453125, 0.76220703125]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 8.0, 17.0, 11.0, 15.0, 42.0, 54.0, 97.0, 190.0, 409.0, 810.0, 992.0, 672.0, 343.0, 143.0, 96.0, 56.0, 43.0, 24.0, 14.0, 10.0, 5.0, 6.0, 8.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.199951171875, -0.19141769409179688, -0.18288421630859375, -0.17435073852539062, -0.1658172607421875, -0.15728378295898438, -0.14875030517578125, -0.14021682739257812, -0.131683349609375, -0.12314987182617188, -0.11461639404296875, -0.10608291625976562, -0.0975494384765625, -0.08901596069335938, -0.08048248291015625, -0.07194900512695312, -0.06341552734375, -0.054882049560546875, -0.04634857177734375, -0.037815093994140625, -0.0292816162109375, -0.020748138427734375, -0.01221466064453125, -0.003681182861328125, 0.004852294921875, 0.013385772705078125, 0.02191925048828125, 0.030452728271484375, 0.0389862060546875, 0.047519683837890625, 0.05605316162109375, 0.06458663940429688, 0.0731201171875, 0.08165359497070312, 0.09018707275390625, 0.09872055053710938, 0.1072540283203125, 0.11578750610351562, 0.12432098388671875, 0.13285446166992188, 0.141387939453125, 0.14992141723632812, 0.15845489501953125, 0.16698837280273438, 0.1755218505859375, 0.18405532836914062, 0.19258880615234375, 0.20112228393554688, 0.20965576171875, 0.21818923950195312, 0.22672271728515625, 0.23525619506835938, 0.2437896728515625, 0.2523231506347656, 0.26085662841796875, 0.2693901062011719, 0.277923583984375, 0.2864570617675781, 0.29499053955078125, 0.3035240173339844, 0.3120574951171875, 0.3205909729003906, 0.32912445068359375, 0.3376579284667969, 0.34619140625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 8.0, 5.0, 6.0, 13.0, 28.0, 55.0, 104.0, 116.0, 183.0, 159.0, 135.0, 85.0, 36.0, 34.0, 14.0, 7.0, 8.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0781259536743164, -1.039666771888733, -1.0012074708938599, -0.9627482891082764, -0.9242891073226929, -0.8858298659324646, -0.8473706245422363, -0.8089114427566528, -0.7704522609710693, -0.7319930195808411, -0.6935338377952576, -0.6550745964050293, -0.6166154146194458, -0.5781561732292175, -0.5396969318389893, -0.5012377500534058, -0.4627785086631775, -0.4243192970752716, -0.3858600854873657, -0.34740084409713745, -0.30894166231155396, -0.2704824209213257, -0.2320232093334198, -0.19356399774551392, -0.15510478615760803, -0.11664557456970215, -0.07818635553121567, -0.03972713649272919, -0.0012679249048233032, 0.03719128668308258, 0.07565051317214966, 0.11410972476005554, 0.15256893634796143, 0.1910281479358673, 0.2294873595237732, 0.26794660091400146, 0.30640578269958496, 0.34486502408981323, 0.3833242356777191, 0.421783447265625, 0.4602426588535309, 0.49870187044143677, 0.537161111831665, 0.5756202936172485, 0.6140795350074768, 0.6525387167930603, 0.6909979581832886, 0.7294571399688721, 0.7679163813591003, 0.8063756227493286, 0.8448348045349121, 0.8832940459251404, 0.9217532277107239, 0.9602124691009521, 0.9986716508865356, 1.0371308326721191, 1.0755901336669922, 1.1140493154525757, 1.1525086164474487, 1.1909677982330322, 1.2294269800186157, 1.2678861618041992, 1.3063454627990723, 1.3448046445846558, 1.3832638263702393]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 3.0, 7.0, 7.0, 9.0, 9.0, 17.0, 9.0, 14.0, 12.0, 21.0, 28.0, 49.0, 42.0, 36.0, 41.0, 42.0, 53.0, 49.0, 46.0, 42.0, 55.0, 44.0, 44.0, 42.0, 40.0, 44.0, 33.0, 30.0, 24.0, 31.0, 20.0, 13.0, 12.0, 12.0, 7.0, 4.0, 4.0, 7.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4527290165424347, -0.4377433955669403, -0.4227577745914459, -0.40777212381362915, -0.39278650283813477, -0.3778008818626404, -0.362815260887146, -0.3478296399116516, -0.3328440189361572, -0.31785839796066284, -0.30287277698516846, -0.2878871560096741, -0.2729015052318573, -0.2579158842563629, -0.24293026328086853, -0.22794464230537415, -0.21295899152755737, -0.197973370552063, -0.1829877346754074, -0.16800211369991302, -0.15301647782325745, -0.13803085684776306, -0.12304523587226868, -0.1080596074461937, -0.09307397902011871, -0.07808835059404373, -0.06310272216796875, -0.048117101192474365, -0.033131472766399384, -0.018145844340324402, -0.003160223364830017, 0.011825405061244965, 0.02681100368499756, 0.04179663211107254, 0.056782256811857224, 0.0717678815126419, 0.08675350993871689, 0.10173913836479187, 0.11672475934028625, 0.13171038031578064, 0.14669601619243622, 0.1616816371679306, 0.17666727304458618, 0.19165289402008057, 0.20663851499557495, 0.22162415087223053, 0.23660977184772491, 0.2515954077243805, 0.2665810286998749, 0.28156664967536926, 0.29655227065086365, 0.3115379214286804, 0.3265235424041748, 0.3415091633796692, 0.3564947843551636, 0.37148040533065796, 0.38646602630615234, 0.40145164728164673, 0.4164372682571411, 0.4314228892326355, 0.44640854001045227, 0.46139416098594666, 0.47637978196144104, 0.4913654029369354, 0.5063510537147522]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 6.0, 10.0, 8.0, 15.0, 21.0, 47.0, 49.0, 97.0, 184.0, 362.0, 955.0, 3073.0, 14277.0, 96470.0, 568385.0, 312957.0, 41440.0, 7103.0, 1809.0, 631.0, 303.0, 149.0, 76.0, 40.0, 36.0, 22.0, 9.0, 7.0, 6.0, 4.0, 1.0, 0.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.170166015625, -0.1655406951904297, -0.16091537475585938, -0.15629005432128906, -0.15166473388671875, -0.14703941345214844, -0.14241409301757812, -0.1377887725830078, -0.1331634521484375, -0.1285381317138672, -0.12391281127929688, -0.11928749084472656, -0.11466217041015625, -0.11003684997558594, -0.10541152954101562, -0.10078620910644531, -0.096160888671875, -0.09153556823730469, -0.08691024780273438, -0.08228492736816406, -0.07765960693359375, -0.07303428649902344, -0.06840896606445312, -0.06378364562988281, -0.0591583251953125, -0.05453300476074219, -0.049907684326171875, -0.04528236389160156, -0.04065704345703125, -0.03603172302246094, -0.031406402587890625, -0.026781082153320312, -0.02215576171875, -0.017530441284179688, -0.012905120849609375, -0.008279800415039062, -0.00365447998046875, 0.0009708404541015625, 0.005596160888671875, 0.010221481323242188, 0.0148468017578125, 0.019472122192382812, 0.024097442626953125, 0.028722763061523438, 0.03334808349609375, 0.03797340393066406, 0.042598724365234375, 0.04722404479980469, 0.051849365234375, 0.05647468566894531, 0.061100006103515625, 0.06572532653808594, 0.07035064697265625, 0.07497596740722656, 0.07960128784179688, 0.08422660827636719, 0.0888519287109375, 0.09347724914550781, 0.09810256958007812, 0.10272789001464844, 0.10735321044921875, 0.11197853088378906, 0.11660385131835938, 0.12122917175292969, 0.1258544921875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 6.0, 6.0, 5.0, 7.0, 16.0, 12.0, 21.0, 25.0, 25.0, 48.0, 58.0, 36.0, 54.0, 65.0, 54.0, 73.0, 71.0, 55.0, 61.0, 45.0, 54.0, 42.0, 37.0, 39.0, 23.0, 22.0, 10.0, 9.0, 11.0, 7.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.356201171875, -0.3429069519042969, -0.32961273193359375, -0.3163185119628906, -0.3030242919921875, -0.2897300720214844, -0.27643585205078125, -0.2631416320800781, -0.249847412109375, -0.23655319213867188, -0.22325897216796875, -0.20996475219726562, -0.1966705322265625, -0.18337631225585938, -0.17008209228515625, -0.15678787231445312, -0.14349365234375, -0.13019943237304688, -0.11690521240234375, -0.10361099243164062, -0.0903167724609375, -0.07702255249023438, -0.06372833251953125, -0.050434112548828125, -0.037139892578125, -0.023845672607421875, -0.01055145263671875, 0.002742767333984375, 0.0160369873046875, 0.029331207275390625, 0.04262542724609375, 0.055919647216796875, 0.0692138671875, 0.08250808715820312, 0.09580230712890625, 0.10909652709960938, 0.1223907470703125, 0.13568496704101562, 0.14897918701171875, 0.16227340698242188, 0.175567626953125, 0.18886184692382812, 0.20215606689453125, 0.21545028686523438, 0.2287445068359375, 0.24203872680664062, 0.25533294677734375, 0.2686271667480469, 0.28192138671875, 0.2952156066894531, 0.30850982666015625, 0.3218040466308594, 0.3350982666015625, 0.3483924865722656, 0.36168670654296875, 0.3749809265136719, 0.388275146484375, 0.4015693664550781, 0.41486358642578125, 0.4281578063964844, 0.4414520263671875, 0.4547462463378906, 0.46804046630859375, 0.4813346862792969, 0.49462890625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 4.0, 10.0, 12.0, 18.0, 19.0, 27.0, 44.0, 56.0, 68.0, 99.0, 140.0, 226.0, 342.0, 595.0, 1116.0, 2070.0, 3924.0, 8248.0, 17360.0, 38770.0, 87638.0, 187849.0, 286571.0, 218173.0, 106622.0, 47418.0, 21001.0, 9672.0, 4664.0, 2454.0, 1308.0, 750.0, 481.0, 261.0, 168.0, 99.0, 75.0, 44.0, 39.0, 28.0, 24.0, 14.0, 14.0, 8.0, 9.0, 6.0, 5.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.054901123046875, -0.05321788787841797, -0.05153465270996094, -0.049851417541503906, -0.048168182373046875, -0.046484947204589844, -0.04480171203613281, -0.04311847686767578, -0.04143524169921875, -0.03975200653076172, -0.03806877136230469, -0.036385536193847656, -0.034702301025390625, -0.033019065856933594, -0.03133583068847656, -0.02965259552001953, -0.0279693603515625, -0.02628612518310547, -0.024602890014648438, -0.022919654846191406, -0.021236419677734375, -0.019553184509277344, -0.017869949340820312, -0.01618671417236328, -0.01450347900390625, -0.012820243835449219, -0.011137008666992188, -0.009453773498535156, -0.007770538330078125, -0.006087303161621094, -0.0044040679931640625, -0.0027208328247070312, -0.00103759765625, 0.0006456375122070312, 0.0023288726806640625, 0.004012107849121094, 0.005695343017578125, 0.007378578186035156, 0.009061813354492188, 0.010745048522949219, 0.01242828369140625, 0.014111518859863281, 0.015794754028320312, 0.017477989196777344, 0.019161224365234375, 0.020844459533691406, 0.022527694702148438, 0.02421092987060547, 0.0258941650390625, 0.02757740020751953, 0.029260635375976562, 0.030943870544433594, 0.032627105712890625, 0.034310340881347656, 0.03599357604980469, 0.03767681121826172, 0.03936004638671875, 0.04104328155517578, 0.04272651672363281, 0.044409751892089844, 0.046092987060546875, 0.047776222229003906, 0.04945945739746094, 0.05114269256591797, 0.052825927734375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 4.0, 9.0, 6.0, 7.0, 7.0, 11.0, 11.0, 10.0, 16.0, 21.0, 18.0, 20.0, 21.0, 32.0, 37.0, 40.0, 37.0, 37.0, 40.0, 31.0, 45.0, 43.0, 43.0, 34.0, 36.0, 40.0, 51.0, 51.0, 36.0, 28.0, 22.0, 26.0, 21.0, 15.0, 20.0, 12.0, 12.0, 15.0, 8.0, 9.0, 4.0, 3.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.5244140625, -0.5072784423828125, -0.490142822265625, -0.4730072021484375, -0.45587158203125, -0.4387359619140625, -0.421600341796875, -0.4044647216796875, -0.3873291015625, -0.3701934814453125, -0.353057861328125, -0.3359222412109375, -0.31878662109375, -0.3016510009765625, -0.284515380859375, -0.2673797607421875, -0.250244140625, -0.2331085205078125, -0.215972900390625, -0.1988372802734375, -0.18170166015625, -0.1645660400390625, -0.147430419921875, -0.1302947998046875, -0.1131591796875, -0.0960235595703125, -0.078887939453125, -0.0617523193359375, -0.04461669921875, -0.0274810791015625, -0.010345458984375, 0.0067901611328125, 0.02392578125, 0.0410614013671875, 0.058197021484375, 0.0753326416015625, 0.09246826171875, 0.1096038818359375, 0.126739501953125, 0.1438751220703125, 0.1610107421875, 0.1781463623046875, 0.195281982421875, 0.2124176025390625, 0.22955322265625, 0.2466888427734375, 0.263824462890625, 0.2809600830078125, 0.298095703125, 0.3152313232421875, 0.332366943359375, 0.3495025634765625, 0.36663818359375, 0.3837738037109375, 0.400909423828125, 0.4180450439453125, 0.4351806640625, 0.4523162841796875, 0.469451904296875, 0.4865875244140625, 0.50372314453125, 0.5208587646484375, 0.537994384765625, 0.5551300048828125, 0.572265625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 6.0, 8.0, 12.0, 24.0, 37.0, 64.0, 90.0, 154.0, 285.0, 541.0, 991.0, 1941.0, 4465.0, 12059.0, 44690.0, 198392.0, 472241.0, 235894.0, 53220.0, 14072.0, 4877.0, 2141.0, 1055.0, 536.0, 306.0, 172.0, 93.0, 70.0, 35.0, 26.0, 20.0, 8.0, 7.0, 6.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0239715576171875, -0.023160696029663086, -0.022349834442138672, -0.021538972854614258, -0.020728111267089844, -0.01991724967956543, -0.019106388092041016, -0.0182955265045166, -0.017484664916992188, -0.016673803329467773, -0.01586294174194336, -0.015052080154418945, -0.014241218566894531, -0.013430356979370117, -0.012619495391845703, -0.011808633804321289, -0.010997772216796875, -0.010186910629272461, -0.009376049041748047, -0.008565187454223633, -0.007754325866699219, -0.006943464279174805, -0.006132602691650391, -0.0053217411041259766, -0.0045108795166015625, -0.0037000179290771484, -0.0028891563415527344, -0.0020782947540283203, -0.0012674331665039062, -0.0004565715789794922, 0.0003542900085449219, 0.001165151596069336, 0.00197601318359375, 0.002786874771118164, 0.003597736358642578, 0.004408597946166992, 0.005219459533691406, 0.00603032112121582, 0.006841182708740234, 0.0076520442962646484, 0.008462905883789062, 0.009273767471313477, 0.01008462905883789, 0.010895490646362305, 0.011706352233886719, 0.012517213821411133, 0.013328075408935547, 0.014138936996459961, 0.014949798583984375, 0.01576066017150879, 0.016571521759033203, 0.017382383346557617, 0.01819324493408203, 0.019004106521606445, 0.01981496810913086, 0.020625829696655273, 0.021436691284179688, 0.0222475528717041, 0.023058414459228516, 0.02386927604675293, 0.024680137634277344, 0.025490999221801758, 0.026301860809326172, 0.027112722396850586, 0.027923583984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 3.0, 4.0, 5.0, 2.0, 4.0, 6.0, 7.0, 9.0, 13.0, 22.0, 18.0, 22.0, 37.0, 42.0, 39.0, 60.0, 70.0, 71.0, 54.0, 73.0, 79.0, 68.0, 51.0, 40.0, 41.0, 36.0, 31.0, 26.0, 17.0, 15.0, 9.0, 12.0, 5.0, 4.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.68899917602539e-06, -7.360242307186127e-06, -7.031485438346863e-06, -6.702728569507599e-06, -6.373971700668335e-06, -6.045214831829071e-06, -5.716457962989807e-06, -5.387701094150543e-06, -5.058944225311279e-06, -4.730187356472015e-06, -4.4014304876327515e-06, -4.0726736187934875e-06, -3.7439167499542236e-06, -3.4151598811149597e-06, -3.086403012275696e-06, -2.757646143436432e-06, -2.428889274597168e-06, -2.100132405757904e-06, -1.7713755369186401e-06, -1.4426186680793762e-06, -1.1138617992401123e-06, -7.851049304008484e-07, -4.5634806156158447e-07, -1.2759119272232056e-07, 2.0116567611694336e-07, 5.299225449562073e-07, 8.586794137954712e-07, 1.1874362826347351e-06, 1.516193151473999e-06, 1.844950020313263e-06, 2.173706889152527e-06, 2.5024637579917908e-06, 2.8312206268310547e-06, 3.1599774956703186e-06, 3.4887343645095825e-06, 3.8174912333488464e-06, 4.14624810218811e-06, 4.475004971027374e-06, 4.803761839866638e-06, 5.132518708705902e-06, 5.461275577545166e-06, 5.79003244638443e-06, 6.118789315223694e-06, 6.447546184062958e-06, 6.776303052902222e-06, 7.105059921741486e-06, 7.4338167905807495e-06, 7.762573659420013e-06, 8.091330528259277e-06, 8.420087397098541e-06, 8.748844265937805e-06, 9.077601134777069e-06, 9.406358003616333e-06, 9.735114872455597e-06, 1.006387174129486e-05, 1.0392628610134125e-05, 1.0721385478973389e-05, 1.1050142347812653e-05, 1.1378899216651917e-05, 1.170765608549118e-05, 1.2036412954330444e-05, 1.2365169823169708e-05, 1.2693926692008972e-05, 1.3022683560848236e-05, 1.33514404296875e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 6.0, 6.0, 4.0, 7.0, 11.0, 18.0, 31.0, 33.0, 59.0, 82.0, 130.0, 183.0, 273.0, 487.0, 808.0, 1484.0, 3369.0, 7941.0, 20290.0, 54557.0, 147394.0, 297044.0, 289253.0, 139351.0, 52170.0, 19050.0, 7520.0, 3320.0, 1574.0, 812.0, 467.0, 310.0, 145.0, 124.0, 70.0, 49.0, 35.0, 20.0, 22.0, 13.0, 4.0, 6.0, 5.0, 6.0, 3.0, 1.0, 6.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.01873779296875, -0.01815176010131836, -0.01756572723388672, -0.016979694366455078, -0.016393661499023438, -0.015807628631591797, -0.015221595764160156, -0.014635562896728516, -0.014049530029296875, -0.013463497161865234, -0.012877464294433594, -0.012291431427001953, -0.011705398559570312, -0.011119365692138672, -0.010533332824707031, -0.00994729995727539, -0.00936126708984375, -0.00877523422241211, -0.008189201354980469, -0.007603168487548828, -0.0070171356201171875, -0.006431102752685547, -0.005845069885253906, -0.005259037017822266, -0.004673004150390625, -0.004086971282958984, -0.0035009384155273438, -0.002914905548095703, -0.0023288726806640625, -0.0017428398132324219, -0.0011568069458007812, -0.0005707740783691406, 1.52587890625e-05, 0.0006012916564941406, 0.0011873245239257812, 0.0017733573913574219, 0.0023593902587890625, 0.002945423126220703, 0.0035314559936523438, 0.004117488861083984, 0.004703521728515625, 0.005289554595947266, 0.005875587463378906, 0.006461620330810547, 0.0070476531982421875, 0.007633686065673828, 0.008219718933105469, 0.00880575180053711, 0.00939178466796875, 0.00997781753540039, 0.010563850402832031, 0.011149883270263672, 0.011735916137695312, 0.012321949005126953, 0.012907981872558594, 0.013494014739990234, 0.014080047607421875, 0.014666080474853516, 0.015252113342285156, 0.015838146209716797, 0.016424179077148438, 0.017010211944580078, 0.01759624481201172, 0.01818227767944336, 0.018768310546875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 8.0, 5.0, 5.0, 4.0, 10.0, 18.0, 11.0, 18.0, 22.0, 27.0, 25.0, 42.0, 50.0, 45.0, 46.0, 55.0, 56.0, 61.0, 49.0, 54.0, 50.0, 68.0, 42.0, 26.0, 29.0, 25.0, 25.0, 27.0, 22.0, 16.0, 15.0, 11.0, 4.0, 11.0, 7.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0057525634765625, -0.005561530590057373, -0.005370497703552246, -0.005179464817047119, -0.004988431930541992, -0.004797399044036865, -0.004606366157531738, -0.004415333271026611, -0.004224300384521484, -0.004033267498016357, -0.0038422346115112305, -0.0036512017250061035, -0.0034601688385009766, -0.0032691359519958496, -0.0030781030654907227, -0.0028870701789855957, -0.0026960372924804688, -0.002505004405975342, -0.002313971519470215, -0.002122938632965088, -0.001931905746459961, -0.001740872859954834, -0.001549839973449707, -0.00135880708694458, -0.0011677742004394531, -0.0009767413139343262, -0.0007857084274291992, -0.0005946755409240723, -0.0004036426544189453, -0.00021260976791381836, -2.1576881408691406e-05, 0.00016945600509643555, 0.0003604888916015625, 0.0005515217781066895, 0.0007425546646118164, 0.0009335875511169434, 0.0011246204376220703, 0.0013156533241271973, 0.0015066862106323242, 0.0016977190971374512, 0.0018887519836425781, 0.002079784870147705, 0.002270817756652832, 0.002461850643157959, 0.002652883529663086, 0.002843916416168213, 0.00303494930267334, 0.003225982189178467, 0.0034170150756835938, 0.0036080479621887207, 0.0037990808486938477, 0.003990113735198975, 0.0041811466217041016, 0.0043721795082092285, 0.0045632123947143555, 0.004754245281219482, 0.004945278167724609, 0.005136311054229736, 0.005327343940734863, 0.00551837682723999, 0.005709409713745117, 0.005900442600250244, 0.006091475486755371, 0.006282508373260498, 0.006473541259765625]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 5.0, 10.0, 22.0, 43.0, 108.0, 238.0, 252.0, 183.0, 78.0, 30.0, 20.0, 9.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7442717552185059, -0.7094017267227173, -0.6745316386222839, -0.6396615505218506, -0.604791522026062, -0.5699214935302734, -0.5350514054298401, -0.5001813173294067, -0.46531128883361816, -0.4304412305355072, -0.39557117223739624, -0.3607011139392853, -0.3258310556411743, -0.29096099734306335, -0.2560909390449524, -0.22122088074684143, -0.18635082244873047, -0.1514807641506195, -0.11661070585250854, -0.08174064755439758, -0.04687058925628662, -0.01200053095817566, 0.022869527339935303, 0.057739585638046265, 0.09260964393615723, 0.1274797022342682, 0.16234976053237915, 0.1972198188304901, 0.23208987712860107, 0.26695993542671204, 0.301829993724823, 0.33670005202293396, 0.37156999111175537, 0.40644004940986633, 0.4413101077079773, 0.47618016600608826, 0.5110502243041992, 0.5459202527999878, 0.5807903409004211, 0.6156604290008545, 0.6505304574966431, 0.6854004859924316, 0.720270574092865, 0.7551406621932983, 0.7900106906890869, 0.8248807191848755, 0.8597508072853088, 0.8946208953857422, 0.9294909238815308, 0.9643609523773193, 0.9992310404777527, 1.034101128578186, 1.0689711570739746, 1.1038411855697632, 1.1387112140655518, 1.1735813617706299, 1.2084513902664185, 1.243321418762207, 1.2781915664672852, 1.3130615949630737, 1.3479316234588623, 1.3828016519546509, 1.4176716804504395, 1.4525418281555176, 1.4874118566513062]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 4.0, 6.0, 15.0, 10.0, 16.0, 17.0, 23.0, 30.0, 36.0, 57.0, 53.0, 53.0, 60.0, 61.0, 64.0, 54.0, 59.0, 65.0, 46.0, 58.0, 49.0, 30.0, 29.0, 34.0, 19.0, 15.0, 13.0, 7.0, 4.0, 8.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3560403883457184, -0.34330275654792786, -0.33056512475013733, -0.3178274929523468, -0.3050898611545563, -0.29235222935676575, -0.2796146273612976, -0.2668769955635071, -0.25413936376571655, -0.24140173196792603, -0.2286641001701355, -0.21592646837234497, -0.20318883657455444, -0.19045120477676392, -0.17771358788013458, -0.16497595608234406, -0.15223830938339233, -0.1395006775856018, -0.12676304578781128, -0.11402542144060135, -0.10128778964281082, -0.0885501578450203, -0.07581253349781036, -0.06307490170001984, -0.05033726990222931, -0.03759963810443878, -0.024862010031938553, -0.012124381959438324, 0.0006132498383522034, 0.01335088163614273, 0.02608850598335266, 0.03882613778114319, 0.05156373977661133, 0.06430137157440186, 0.07703900337219238, 0.08977662771940231, 0.10251425951719284, 0.11525189131498337, 0.1279895156621933, 0.14072714745998383, 0.15346477925777435, 0.16620241105556488, 0.1789400428533554, 0.19167765974998474, 0.20441529154777527, 0.2171529233455658, 0.22989055514335632, 0.24262818694114685, 0.2553658187389374, 0.2681034505367279, 0.28084108233451843, 0.29357871413230896, 0.3063163459300995, 0.31905397772789, 0.33179157972335815, 0.3445292115211487, 0.3572668433189392, 0.37000447511672974, 0.38274210691452026, 0.3954797387123108, 0.4082173705101013, 0.42095500230789185, 0.4336926341056824, 0.4464302659034729, 0.4591678977012634]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 2.0, 4.0, 4.0, 12.0, 10.0, 12.0, 23.0, 17.0, 54.0, 56.0, 80.0, 140.0, 203.0, 293.0, 429.0, 678.0, 1136.0, 2028.0, 3539.0, 6731.0, 13703.0, 31930.0, 85351.0, 257311.0, 397036.0, 152016.0, 52730.0, 21625.0, 9914.0, 4799.0, 2746.0, 1450.0, 908.0, 519.0, 335.0, 255.0, 156.0, 92.0, 61.0, 35.0, 36.0, 22.0, 21.0, 13.0, 12.0, 5.0, 7.0, 6.0, 5.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2183837890625, -0.2111682891845703, -0.20395278930664062, -0.19673728942871094, -0.18952178955078125, -0.18230628967285156, -0.17509078979492188, -0.1678752899169922, -0.1606597900390625, -0.1534442901611328, -0.14622879028320312, -0.13901329040527344, -0.13179779052734375, -0.12458229064941406, -0.11736679077148438, -0.11015129089355469, -0.102935791015625, -0.09572029113769531, -0.08850479125976562, -0.08128929138183594, -0.07407379150390625, -0.06685829162597656, -0.059642791748046875, -0.05242729187011719, -0.0452117919921875, -0.03799629211425781, -0.030780792236328125, -0.023565292358398438, -0.01634979248046875, -0.009134292602539062, -0.001918792724609375, 0.0052967071533203125, 0.01251220703125, 0.019727706909179688, 0.026943206787109375, 0.03415870666503906, 0.04137420654296875, 0.04858970642089844, 0.055805206298828125, 0.06302070617675781, 0.0702362060546875, 0.07745170593261719, 0.08466720581054688, 0.09188270568847656, 0.09909820556640625, 0.10631370544433594, 0.11352920532226562, 0.12074470520019531, 0.127960205078125, 0.1351757049560547, 0.14239120483398438, 0.14960670471191406, 0.15682220458984375, 0.16403770446777344, 0.17125320434570312, 0.1784687042236328, 0.1856842041015625, 0.1928997039794922, 0.20011520385742188, 0.20733070373535156, 0.21454620361328125, 0.22176170349121094, 0.22897720336914062, 0.2361927032470703, 0.243408203125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 12.0, 4.0, 15.0, 15.0, 16.0, 27.0, 37.0, 47.0, 49.0, 49.0, 50.0, 77.0, 64.0, 59.0, 62.0, 68.0, 57.0, 59.0, 42.0, 45.0, 36.0, 34.0, 20.0, 14.0, 14.0, 4.0, 8.0, 2.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7294921875, -0.7029266357421875, -0.676361083984375, -0.6497955322265625, -0.62322998046875, -0.5966644287109375, -0.570098876953125, -0.5435333251953125, -0.5169677734375, -0.4904022216796875, -0.463836669921875, -0.4372711181640625, -0.41070556640625, -0.3841400146484375, -0.357574462890625, -0.3310089111328125, -0.304443359375, -0.2778778076171875, -0.251312255859375, -0.2247467041015625, -0.19818115234375, -0.1716156005859375, -0.145050048828125, -0.1184844970703125, -0.0919189453125, -0.0653533935546875, -0.038787841796875, -0.0122222900390625, 0.01434326171875, 0.0409088134765625, 0.067474365234375, 0.0940399169921875, 0.12060546875, 0.1471710205078125, 0.173736572265625, 0.2003021240234375, 0.22686767578125, 0.2534332275390625, 0.279998779296875, 0.3065643310546875, 0.3331298828125, 0.3596954345703125, 0.386260986328125, 0.4128265380859375, 0.43939208984375, 0.4659576416015625, 0.492523193359375, 0.5190887451171875, 0.545654296875, 0.5722198486328125, 0.598785400390625, 0.6253509521484375, 0.65191650390625, 0.6784820556640625, 0.705047607421875, 0.7316131591796875, 0.7581787109375, 0.7847442626953125, 0.811309814453125, 0.8378753662109375, 0.86444091796875, 0.8910064697265625, 0.917572021484375, 0.9441375732421875, 0.970703125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 4.0, 2.0, 6.0, 2.0, 8.0, 9.0, 14.0, 13.0, 33.0, 26.0, 52.0, 67.0, 137.0, 175.0, 415.0, 1043.0, 3971.0, 28812.0, 667328.0, 325370.0, 16596.0, 2805.0, 799.0, 325.0, 180.0, 114.0, 61.0, 51.0, 33.0, 20.0, 19.0, 22.0, 15.0, 11.0, 7.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.732421875, -0.71142578125, -0.6904296875, -0.66943359375, -0.6484375, -0.62744140625, -0.6064453125, -0.58544921875, -0.564453125, -0.54345703125, -0.5224609375, -0.50146484375, -0.48046875, -0.45947265625, -0.4384765625, -0.41748046875, -0.396484375, -0.37548828125, -0.3544921875, -0.33349609375, -0.3125, -0.29150390625, -0.2705078125, -0.24951171875, -0.228515625, -0.20751953125, -0.1865234375, -0.16552734375, -0.14453125, -0.12353515625, -0.1025390625, -0.08154296875, -0.060546875, -0.03955078125, -0.0185546875, 0.00244140625, 0.0234375, 0.04443359375, 0.0654296875, 0.08642578125, 0.107421875, 0.12841796875, 0.1494140625, 0.17041015625, 0.19140625, 0.21240234375, 0.2333984375, 0.25439453125, 0.275390625, 0.29638671875, 0.3173828125, 0.33837890625, 0.359375, 0.38037109375, 0.4013671875, 0.42236328125, 0.443359375, 0.46435546875, 0.4853515625, 0.50634765625, 0.52734375, 0.54833984375, 0.5693359375, 0.59033203125, 0.611328125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 4.0, 4.0, 7.0, 5.0, 9.0, 13.0, 14.0, 10.0, 16.0, 19.0, 14.0, 28.0, 23.0, 30.0, 27.0, 43.0, 27.0, 40.0, 39.0, 49.0, 54.0, 49.0, 28.0, 42.0, 28.0, 29.0, 45.0, 26.0, 33.0, 39.0, 27.0, 19.0, 30.0, 19.0, 20.0, 18.0, 15.0, 5.0, 11.0, 8.0, 6.0, 5.0, 4.0, 5.0, 6.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.65185546875, -0.6307601928710938, -0.6096649169921875, -0.5885696411132812, -0.567474365234375, -0.5463790893554688, -0.5252838134765625, -0.5041885375976562, -0.48309326171875, -0.46199798583984375, -0.4409027099609375, -0.41980743408203125, -0.398712158203125, -0.37761688232421875, -0.3565216064453125, -0.33542633056640625, -0.3143310546875, -0.29323577880859375, -0.2721405029296875, -0.25104522705078125, -0.229949951171875, -0.20885467529296875, -0.1877593994140625, -0.16666412353515625, -0.14556884765625, -0.12447357177734375, -0.1033782958984375, -0.08228302001953125, -0.061187744140625, -0.04009246826171875, -0.0189971923828125, 0.00209808349609375, 0.023193359375, 0.04428863525390625, 0.0653839111328125, 0.08647918701171875, 0.107574462890625, 0.12866973876953125, 0.1497650146484375, 0.17086029052734375, 0.19195556640625, 0.21305084228515625, 0.2341461181640625, 0.25524139404296875, 0.276336669921875, 0.29743194580078125, 0.3185272216796875, 0.33962249755859375, 0.3607177734375, 0.38181304931640625, 0.4029083251953125, 0.42400360107421875, 0.445098876953125, 0.46619415283203125, 0.4872894287109375, 0.5083847045898438, 0.52947998046875, 0.5505752563476562, 0.5716705322265625, 0.5927658081054688, 0.613861083984375, 0.6349563598632812, 0.6560516357421875, 0.6771469116210938, 0.6982421875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 5.0, 5.0, 4.0, 7.0, 9.0, 9.0, 17.0, 34.0, 38.0, 53.0, 113.0, 212.0, 515.0, 1319.0, 4510.0, 44514.0, 855820.0, 130851.0, 7546.0, 1743.0, 651.0, 287.0, 127.0, 67.0, 37.0, 24.0, 14.0, 9.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27392578125, -0.26578521728515625, -0.2576446533203125, -0.24950408935546875, -0.241363525390625, -0.23322296142578125, -0.2250823974609375, -0.21694183349609375, -0.20880126953125, -0.20066070556640625, -0.1925201416015625, -0.18437957763671875, -0.176239013671875, -0.16809844970703125, -0.1599578857421875, -0.15181732177734375, -0.1436767578125, -0.13553619384765625, -0.1273956298828125, -0.11925506591796875, -0.111114501953125, -0.10297393798828125, -0.0948333740234375, -0.08669281005859375, -0.07855224609375, -0.07041168212890625, -0.0622711181640625, -0.05413055419921875, -0.045989990234375, -0.03784942626953125, -0.0297088623046875, -0.02156829833984375, -0.013427734375, -0.00528717041015625, 0.0028533935546875, 0.01099395751953125, 0.019134521484375, 0.02727508544921875, 0.0354156494140625, 0.04355621337890625, 0.05169677734375, 0.05983734130859375, 0.0679779052734375, 0.07611846923828125, 0.084259033203125, 0.09239959716796875, 0.1005401611328125, 0.10868072509765625, 0.1168212890625, 0.12496185302734375, 0.1331024169921875, 0.14124298095703125, 0.149383544921875, 0.15752410888671875, 0.1656646728515625, 0.17380523681640625, 0.18194580078125, 0.19008636474609375, 0.1982269287109375, 0.20636749267578125, 0.214508056640625, 0.22264862060546875, 0.2307891845703125, 0.23892974853515625, 0.2470703125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 15.0, 28.0, 55.0, 137.0, 236.0, 249.0, 159.0, 72.0, 34.0, 9.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.848573684692383e-05, -6.668455898761749e-05, -6.488338112831116e-05, -6.308220326900482e-05, -6.128102540969849e-05, -5.947984755039215e-05, -5.7678669691085815e-05, -5.587749183177948e-05, -5.4076313972473145e-05, -5.227513611316681e-05, -5.0473958253860474e-05, -4.867278039455414e-05, -4.68716025352478e-05, -4.507042467594147e-05, -4.326924681663513e-05, -4.1468068957328796e-05, -3.966689109802246e-05, -3.7865713238716125e-05, -3.606453537940979e-05, -3.4263357520103455e-05, -3.246217966079712e-05, -3.0661001801490784e-05, -2.8859823942184448e-05, -2.7058646082878113e-05, -2.5257468223571777e-05, -2.3456290364265442e-05, -2.1655112504959106e-05, -1.985393464565277e-05, -1.8052756786346436e-05, -1.62515789270401e-05, -1.4450401067733765e-05, -1.264922320842743e-05, -1.0848045349121094e-05, -9.046867489814758e-06, -7.245689630508423e-06, -5.444511771202087e-06, -3.643333911895752e-06, -1.8421560525894165e-06, -4.0978193283081055e-08, 1.7601996660232544e-06, 3.56137752532959e-06, 5.362555384635925e-06, 7.163733243942261e-06, 8.964911103248596e-06, 1.0766088962554932e-05, 1.2567266821861267e-05, 1.4368444681167603e-05, 1.6169622540473938e-05, 1.7970800399780273e-05, 1.977197825908661e-05, 2.1573156118392944e-05, 2.337433397769928e-05, 2.5175511837005615e-05, 2.697668969631195e-05, 2.8777867555618286e-05, 3.057904541492462e-05, 3.238022327423096e-05, 3.418140113353729e-05, 3.598257899284363e-05, 3.778375685214996e-05, 3.95849347114563e-05, 4.1386112570762634e-05, 4.318729043006897e-05, 4.4988468289375305e-05, 4.678964614868164e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 3.0, 9.0, 19.0, 15.0, 36.0, 60.0, 157.0, 278.0, 669.0, 1657.0, 5664.0, 52290.0, 864274.0, 111860.0, 7885.0, 2104.0, 859.0, 367.0, 175.0, 71.0, 38.0, 23.0, 12.0, 10.0, 6.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.265380859375, -0.2567100524902344, -0.24803924560546875, -0.23936843872070312, -0.2306976318359375, -0.22202682495117188, -0.21335601806640625, -0.20468521118164062, -0.196014404296875, -0.18734359741210938, -0.17867279052734375, -0.17000198364257812, -0.1613311767578125, -0.15266036987304688, -0.14398956298828125, -0.13531875610351562, -0.12664794921875, -0.11797714233398438, -0.10930633544921875, -0.10063552856445312, -0.0919647216796875, -0.08329391479492188, -0.07462310791015625, -0.06595230102539062, -0.057281494140625, -0.048610687255859375, -0.03993988037109375, -0.031269073486328125, -0.0225982666015625, -0.013927459716796875, -0.00525665283203125, 0.003414154052734375, 0.0120849609375, 0.020755767822265625, 0.02942657470703125, 0.038097381591796875, 0.0467681884765625, 0.055438995361328125, 0.06410980224609375, 0.07278060913085938, 0.081451416015625, 0.09012222290039062, 0.09879302978515625, 0.10746383666992188, 0.1161346435546875, 0.12480545043945312, 0.13347625732421875, 0.14214706420898438, 0.15081787109375, 0.15948867797851562, 0.16815948486328125, 0.17683029174804688, 0.1855010986328125, 0.19417190551757812, 0.20284271240234375, 0.21151351928710938, 0.220184326171875, 0.22885513305664062, 0.23752593994140625, 0.24619674682617188, 0.2548675537109375, 0.2635383605957031, 0.27220916748046875, 0.2808799743652344, 0.28955078125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 8.0, 5.0, 9.0, 17.0, 18.0, 25.0, 29.0, 48.0, 70.0, 57.0, 83.0, 116.0, 118.0, 86.0, 78.0, 59.0, 42.0, 39.0, 22.0, 26.0, 20.0, 10.0, 11.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06317138671875, -0.06114959716796875, -0.0591278076171875, -0.05710601806640625, -0.055084228515625, -0.05306243896484375, -0.0510406494140625, -0.04901885986328125, -0.0469970703125, -0.04497528076171875, -0.0429534912109375, -0.04093170166015625, -0.038909912109375, -0.03688812255859375, -0.0348663330078125, -0.03284454345703125, -0.03082275390625, -0.02880096435546875, -0.0267791748046875, -0.02475738525390625, -0.022735595703125, -0.02071380615234375, -0.0186920166015625, -0.01667022705078125, -0.0146484375, -0.01262664794921875, -0.0106048583984375, -0.00858306884765625, -0.006561279296875, -0.00453948974609375, -0.0025177001953125, -0.00049591064453125, 0.00152587890625, 0.00354766845703125, 0.0055694580078125, 0.00759124755859375, 0.009613037109375, 0.01163482666015625, 0.0136566162109375, 0.01567840576171875, 0.0177001953125, 0.01972198486328125, 0.0217437744140625, 0.02376556396484375, 0.025787353515625, 0.02780914306640625, 0.0298309326171875, 0.03185272216796875, 0.03387451171875, 0.03589630126953125, 0.0379180908203125, 0.03993988037109375, 0.041961669921875, 0.04398345947265625, 0.0460052490234375, 0.04802703857421875, 0.050048828125, 0.05207061767578125, 0.0540924072265625, 0.05611419677734375, 0.058135986328125, 0.06015777587890625, 0.0621795654296875, 0.06420135498046875, 0.06622314453125]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 7.0, 4.0, 3.0, 14.0, 30.0, 47.0, 95.0, 155.0, 186.0, 176.0, 118.0, 94.0, 25.0, 22.0, 16.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1412497758865356, -1.0889570713043213, -1.0366644859313965, -0.9843717813491821, -0.9320791363716125, -0.879786491394043, -0.8274937868118286, -0.775201141834259, -0.7229084968566895, -0.6706158518791199, -0.6183232069015503, -0.5660305023193359, -0.5137378573417664, -0.4614452123641968, -0.4091525375843048, -0.35685986280441284, -0.30456721782684326, -0.2522745728492737, -0.1999818980693817, -0.14768923819065094, -0.09539657831192017, -0.043103933334350586, 0.009188741445541382, 0.06148141622543335, 0.11377406120300293, 0.1660667210817337, 0.21835938096046448, 0.27065205574035645, 0.322944700717926, 0.3752373456954956, 0.4275300204753876, 0.47982269525527954, 0.5321152210235596, 0.5844078660011292, 0.6367005109786987, 0.6889932155609131, 0.7412858605384827, 0.7935785055160522, 0.8458712100982666, 0.8981638550758362, 0.9504565000534058, 1.0027492046356201, 1.055041790008545, 1.1073344945907593, 1.1596271991729736, 1.2119197845458984, 1.2642124891281128, 1.3165051937103271, 1.368797779083252, 1.4210904836654663, 1.4733830690383911, 1.5256757736206055, 1.5779683589935303, 1.6302610635757446, 1.682553768157959, 1.7348463535308838, 1.7871390581130981, 1.8394317626953125, 1.8917243480682373, 1.9440170526504517, 1.996309757232666, 2.048602342605591, 2.1008949279785156, 2.1531877517700195, 2.2054803371429443]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 4.0, 2.0, 6.0, 6.0, 5.0, 4.0, 10.0, 5.0, 10.0, 12.0, 15.0, 21.0, 30.0, 23.0, 20.0, 21.0, 27.0, 25.0, 35.0, 32.0, 36.0, 42.0, 42.0, 44.0, 41.0, 51.0, 43.0, 37.0, 41.0, 42.0, 32.0, 28.0, 29.0, 21.0, 23.0, 21.0, 17.0, 18.0, 12.0, 11.0, 10.0, 10.0, 13.0, 8.0, 3.0, 9.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.8651425838470459, -0.8339269757270813, -0.8027114272117615, -0.7714958190917969, -0.740280270576477, -0.7090646624565125, -0.6778490543365479, -0.646633505821228, -0.6154178977012634, -0.5842022895812988, -0.552986741065979, -0.5217711329460144, -0.4905555546283722, -0.45933997631073, -0.42812439799308777, -0.39690881967544556, -0.36569324135780334, -0.33447766304016113, -0.3032620847225189, -0.2720465064048767, -0.2408308982849121, -0.2096153199672699, -0.17839974164962769, -0.14718414843082428, -0.11596857011318207, -0.08475298434495926, -0.05353740230202675, -0.02232182025909424, 0.00889376550912857, 0.04010935127735138, 0.07132492959499359, 0.102540522813797, 0.1337561011314392, 0.16497167944908142, 0.19618727266788483, 0.22740285098552704, 0.25861844420433044, 0.28983402252197266, 0.32104960083961487, 0.3522651791572571, 0.3834807872772217, 0.4146963655948639, 0.4459119439125061, 0.4771275520324707, 0.5083431005477905, 0.5395587086677551, 0.5707743167877197, 0.6019898653030396, 0.6332054138183594, 0.664421021938324, 0.6956365704536438, 0.7268521785736084, 0.7580677270889282, 0.7892833352088928, 0.8204989433288574, 0.8517144918441772, 0.8829300999641418, 0.9141457080841064, 0.9453612565994263, 0.9765768647193909, 1.0077924728393555, 1.0390080213546753, 1.0702235698699951, 1.1014392375946045, 1.1326547861099243]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 1.0, 5.0, 1.0, 2.0, 2.0, 11.0, 15.0, 19.0, 27.0, 48.0, 106.0, 232.0, 574.0, 1982.0, 8617.0, 186418.0, 3893197.0, 92337.0, 7390.0, 2071.0, 702.0, 271.0, 114.0, 61.0, 39.0, 9.0, 10.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.669921875, -1.62530517578125, -1.5806884765625, -1.53607177734375, -1.491455078125, -1.44683837890625, -1.4022216796875, -1.35760498046875, -1.31298828125, -1.26837158203125, -1.2237548828125, -1.17913818359375, -1.134521484375, -1.08990478515625, -1.0452880859375, -1.00067138671875, -0.9560546875, -0.91143798828125, -0.8668212890625, -0.82220458984375, -0.777587890625, -0.73297119140625, -0.6883544921875, -0.64373779296875, -0.59912109375, -0.55450439453125, -0.5098876953125, -0.46527099609375, -0.420654296875, -0.37603759765625, -0.3314208984375, -0.28680419921875, -0.2421875, -0.19757080078125, -0.1529541015625, -0.10833740234375, -0.063720703125, -0.01910400390625, 0.0255126953125, 0.07012939453125, 0.11474609375, 0.15936279296875, 0.2039794921875, 0.24859619140625, 0.293212890625, 0.33782958984375, 0.3824462890625, 0.42706298828125, 0.4716796875, 0.51629638671875, 0.5609130859375, 0.60552978515625, 0.650146484375, 0.69476318359375, 0.7393798828125, 0.78399658203125, 0.82861328125, 0.87322998046875, 0.9178466796875, 0.96246337890625, 1.007080078125, 1.05169677734375, 1.0963134765625, 1.14093017578125, 1.185546875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 7.0, 3.0, 7.0, 9.0, 18.0, 23.0, 23.0, 36.0, 62.0, 57.0, 86.0, 70.0, 80.0, 91.0, 78.0, 68.0, 68.0, 52.0, 52.0, 30.0, 29.0, 19.0, 11.0, 8.0, 9.0, 1.0, 6.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6904296875, -0.6718482971191406, -0.6532669067382812, -0.6346855163574219, -0.6161041259765625, -0.5975227355957031, -0.5789413452148438, -0.5603599548339844, -0.541778564453125, -0.5231971740722656, -0.5046157836914062, -0.4860343933105469, -0.4674530029296875, -0.4488716125488281, -0.43029022216796875, -0.4117088317871094, -0.39312744140625, -0.3745460510253906, -0.35596466064453125, -0.3373832702636719, -0.3188018798828125, -0.3002204895019531, -0.28163909912109375, -0.2630577087402344, -0.244476318359375, -0.22589492797851562, -0.20731353759765625, -0.18873214721679688, -0.1701507568359375, -0.15156936645507812, -0.13298797607421875, -0.11440658569335938, -0.0958251953125, -0.07724380493164062, -0.05866241455078125, -0.040081024169921875, -0.0214996337890625, -0.002918243408203125, 0.01566314697265625, 0.034244537353515625, 0.052825927734375, 0.07140731811523438, 0.08998870849609375, 0.10857009887695312, 0.1271514892578125, 0.14573287963867188, 0.16431427001953125, 0.18289566040039062, 0.20147705078125, 0.22005844116210938, 0.23863983154296875, 0.2572212219238281, 0.2758026123046875, 0.2943840026855469, 0.31296539306640625, 0.3315467834472656, 0.350128173828125, 0.3687095642089844, 0.38729095458984375, 0.4058723449707031, 0.4244537353515625, 0.4430351257324219, 0.46161651611328125, 0.4801979064941406, 0.498779296875]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 3.0, 6.0, 11.0, 18.0, 34.0, 54.0, 92.0, 186.0, 403.0, 1019.0, 3279.0, 20414.0, 1273973.0, 2861047.0, 27864.0, 3698.0, 1153.0, 510.0, 205.0, 131.0, 72.0, 39.0, 17.0, 12.0, 9.0, 12.0, 3.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80859375, -0.77020263671875, -0.7318115234375, -0.69342041015625, -0.655029296875, -0.61663818359375, -0.5782470703125, -0.53985595703125, -0.50146484375, -0.46307373046875, -0.4246826171875, -0.38629150390625, -0.347900390625, -0.30950927734375, -0.2711181640625, -0.23272705078125, -0.1943359375, -0.15594482421875, -0.1175537109375, -0.07916259765625, -0.040771484375, -0.00238037109375, 0.0360107421875, 0.07440185546875, 0.11279296875, 0.15118408203125, 0.1895751953125, 0.22796630859375, 0.266357421875, 0.30474853515625, 0.3431396484375, 0.38153076171875, 0.419921875, 0.45831298828125, 0.4967041015625, 0.53509521484375, 0.573486328125, 0.61187744140625, 0.6502685546875, 0.68865966796875, 0.72705078125, 0.76544189453125, 0.8038330078125, 0.84222412109375, 0.880615234375, 0.91900634765625, 0.9573974609375, 0.99578857421875, 1.0341796875, 1.07257080078125, 1.1109619140625, 1.14935302734375, 1.187744140625, 1.22613525390625, 1.2645263671875, 1.30291748046875, 1.34130859375, 1.37969970703125, 1.4180908203125, 1.45648193359375, 1.494873046875, 1.53326416015625, 1.5716552734375, 1.61004638671875, 1.6484375]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 6.0, 7.0, 13.0, 12.0, 35.0, 34.0, 59.0, 79.0, 137.0, 267.0, 570.0, 937.0, 837.0, 460.0, 260.0, 127.0, 70.0, 50.0, 39.0, 20.0, 10.0, 12.0, 8.0, 11.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.275390625, -0.26791954040527344, -0.2604484558105469, -0.2529773712158203, -0.24550628662109375, -0.2380352020263672, -0.23056411743164062, -0.22309303283691406, -0.2156219482421875, -0.20815086364746094, -0.20067977905273438, -0.1932086944580078, -0.18573760986328125, -0.1782665252685547, -0.17079544067382812, -0.16332435607910156, -0.155853271484375, -0.14838218688964844, -0.14091110229492188, -0.1334400177001953, -0.12596893310546875, -0.11849784851074219, -0.11102676391601562, -0.10355567932128906, -0.0960845947265625, -0.08861351013183594, -0.08114242553710938, -0.07367134094238281, -0.06620025634765625, -0.05872917175292969, -0.051258087158203125, -0.04378700256347656, -0.03631591796875, -0.028844833374023438, -0.021373748779296875, -0.013902664184570312, -0.00643157958984375, 0.0010395050048828125, 0.008510589599609375, 0.015981674194335938, 0.0234527587890625, 0.030923843383789062, 0.038394927978515625, 0.04586601257324219, 0.05333709716796875, 0.06080818176269531, 0.06827926635742188, 0.07575035095214844, 0.083221435546875, 0.09069252014160156, 0.09816360473632812, 0.10563468933105469, 0.11310577392578125, 0.12057685852050781, 0.12804794311523438, 0.13551902770996094, 0.1429901123046875, 0.15046119689941406, 0.15793228149414062, 0.1654033660888672, 0.17287445068359375, 0.1803455352783203, 0.18781661987304688, 0.19528770446777344, 0.2027587890625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 10.0, 15.0, 8.0, 38.0, 49.0, 71.0, 97.0, 131.0, 128.0, 125.0, 95.0, 73.0, 54.0, 35.0, 36.0, 11.0, 5.0, 10.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9480636119842529, -0.9206008315086365, -0.8931381106376648, -0.8656753301620483, -0.8382126092910767, -0.8107498288154602, -0.7832870483398438, -0.7558243274688721, -0.7283615469932556, -0.7008987665176392, -0.6734360456466675, -0.645973265171051, -0.6185104846954346, -0.5910477638244629, -0.5635849833488464, -0.53612220287323, -0.5086594820022583, -0.48119673132896423, -0.45373398065567017, -0.4262712001800537, -0.39880844950675964, -0.3713456988334656, -0.3438829183578491, -0.31642016768455505, -0.288957417011261, -0.2614946663379669, -0.23403190076351166, -0.2065691351890564, -0.17910638451576233, -0.15164363384246826, -0.124180868268013, -0.09671810269355774, -0.0692552924156189, -0.04179253429174423, -0.014329776167869568, 0.013132981956005096, 0.04059574007987976, 0.06805849075317383, 0.09552125632762909, 0.12298402190208435, 0.15044677257537842, 0.17790952324867249, 0.20537228882312775, 0.232835054397583, 0.2602978050708771, 0.28776055574417114, 0.3152233362197876, 0.34268608689308167, 0.37014883756637573, 0.3976115882396698, 0.42507433891296387, 0.4525371193885803, 0.4799998700618744, 0.5074626207351685, 0.5349254012107849, 0.5623881816864014, 0.589850902557373, 0.6173136830329895, 0.6447764039039612, 0.6722391843795776, 0.6997019052505493, 0.7271646857261658, 0.7546274662017822, 0.7820901870727539, 0.8095529675483704]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 8.0, 3.0, 4.0, 7.0, 7.0, 12.0, 12.0, 14.0, 14.0, 23.0, 24.0, 31.0, 36.0, 27.0, 37.0, 47.0, 49.0, 32.0, 39.0, 39.0, 52.0, 46.0, 40.0, 36.0, 42.0, 48.0, 39.0, 33.0, 29.0, 22.0, 27.0, 28.0, 19.0, 12.0, 14.0, 7.0, 9.0, 7.0, 4.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.3701837360858917, -0.3575890064239502, -0.3449942469596863, -0.33239951729774475, -0.3198047876358032, -0.3072100281715393, -0.2946152985095978, -0.28202056884765625, -0.26942580938339233, -0.2568310797214508, -0.2442363202571869, -0.23164159059524536, -0.21904684603214264, -0.20645210146903992, -0.1938573718070984, -0.18126262724399567, -0.16866788268089294, -0.15607313811779022, -0.1434783935546875, -0.13088366389274597, -0.11828891932964325, -0.10569417476654053, -0.0930994376540184, -0.08050470054149628, -0.06790995597839355, -0.05531521514058113, -0.04272047430276871, -0.030125733464956284, -0.01753099262714386, -0.004936248064041138, 0.0076584890484809875, 0.020253226161003113, 0.03284800052642822, 0.045442741364240646, 0.05803748220205307, 0.0706322193145752, 0.08322696387767792, 0.09582170844078064, 0.10841644555330276, 0.12101118266582489, 0.1336059272289276, 0.14620067179203033, 0.15879541635513306, 0.17139014601707458, 0.1839848905801773, 0.19657963514328003, 0.20917436480522156, 0.22176910936832428, 0.234363853931427, 0.24695859849452972, 0.25955334305763245, 0.272148072719574, 0.2847428321838379, 0.2973375618457794, 0.30993229150772095, 0.32252705097198486, 0.3351217806339264, 0.3477165102958679, 0.36031126976013184, 0.37290599942207336, 0.3855007290840149, 0.3980954885482788, 0.41069021821022034, 0.42328494787216187, 0.4358797073364258]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 4.0, 2.0, 8.0, 11.0, 6.0, 12.0, 10.0, 22.0, 47.0, 72.0, 179.0, 398.0, 1140.0, 3326.0, 13795.0, 116139.0, 760696.0, 132414.0, 14623.0, 3654.0, 1187.0, 423.0, 159.0, 79.0, 40.0, 23.0, 13.0, 8.0, 10.0, 6.0, 12.0, 5.0, 8.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.22705078125, -0.2206592559814453, -0.21426773071289062, -0.20787620544433594, -0.20148468017578125, -0.19509315490722656, -0.18870162963867188, -0.1823101043701172, -0.1759185791015625, -0.1695270538330078, -0.16313552856445312, -0.15674400329589844, -0.15035247802734375, -0.14396095275878906, -0.13756942749023438, -0.1311779022216797, -0.124786376953125, -0.11839485168457031, -0.11200332641601562, -0.10561180114746094, -0.09922027587890625, -0.09282875061035156, -0.08643722534179688, -0.08004570007324219, -0.0736541748046875, -0.06726264953613281, -0.060871124267578125, -0.05447959899902344, -0.04808807373046875, -0.04169654846191406, -0.035305023193359375, -0.028913497924804688, -0.02252197265625, -0.016130447387695312, -0.009738922119140625, -0.0033473968505859375, 0.00304412841796875, 0.009435653686523438, 0.015827178955078125, 0.022218704223632812, 0.0286102294921875, 0.03500175476074219, 0.041393280029296875, 0.04778480529785156, 0.05417633056640625, 0.06056785583496094, 0.06695938110351562, 0.07335090637207031, 0.079742431640625, 0.08613395690917969, 0.09252548217773438, 0.09891700744628906, 0.10530853271484375, 0.11170005798339844, 0.11809158325195312, 0.12448310852050781, 0.1308746337890625, 0.1372661590576172, 0.14365768432617188, 0.15004920959472656, 0.15644073486328125, 0.16283226013183594, 0.16922378540039062, 0.1756153106689453, 0.1820068359375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 11.0, 6.0, 7.0, 16.0, 15.0, 17.0, 23.0, 44.0, 48.0, 44.0, 47.0, 61.0, 58.0, 45.0, 63.0, 59.0, 56.0, 55.0, 43.0, 47.0, 43.0, 36.0, 35.0, 31.0, 18.0, 13.0, 8.0, 9.0, 8.0, 6.0, 6.0, 4.0, 7.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26025390625, -0.24976348876953125, -0.2392730712890625, -0.22878265380859375, -0.218292236328125, -0.20780181884765625, -0.1973114013671875, -0.18682098388671875, -0.17633056640625, -0.16584014892578125, -0.1553497314453125, -0.14485931396484375, -0.134368896484375, -0.12387847900390625, -0.1133880615234375, -0.10289764404296875, -0.0924072265625, -0.08191680908203125, -0.0714263916015625, -0.06093597412109375, -0.050445556640625, -0.03995513916015625, -0.0294647216796875, -0.01897430419921875, -0.00848388671875, 0.00200653076171875, 0.0124969482421875, 0.02298736572265625, 0.033477783203125, 0.04396820068359375, 0.0544586181640625, 0.06494903564453125, 0.075439453125, 0.08592987060546875, 0.0964202880859375, 0.10691070556640625, 0.117401123046875, 0.12789154052734375, 0.1383819580078125, 0.14887237548828125, 0.15936279296875, 0.16985321044921875, 0.1803436279296875, 0.19083404541015625, 0.201324462890625, 0.21181488037109375, 0.2223052978515625, 0.23279571533203125, 0.2432861328125, 0.25377655029296875, 0.2642669677734375, 0.27475738525390625, 0.285247802734375, 0.29573822021484375, 0.3062286376953125, 0.31671905517578125, 0.32720947265625, 0.33769989013671875, 0.3481903076171875, 0.35868072509765625, 0.369171142578125, 0.37966156005859375, 0.3901519775390625, 0.40064239501953125, 0.4111328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 5.0, 11.0, 21.0, 22.0, 31.0, 40.0, 75.0, 102.0, 143.0, 235.0, 366.0, 660.0, 1043.0, 1929.0, 3981.0, 9011.0, 24622.0, 88070.0, 315246.0, 409046.0, 135251.0, 35914.0, 11889.0, 5031.0, 2474.0, 1300.0, 747.0, 460.0, 275.0, 189.0, 116.0, 66.0, 60.0, 38.0, 23.0, 19.0, 11.0, 7.0, 6.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0906982421875, -0.088043212890625, -0.08538818359375, -0.082733154296875, -0.080078125, -0.077423095703125, -0.07476806640625, -0.072113037109375, -0.0694580078125, -0.066802978515625, -0.06414794921875, -0.061492919921875, -0.058837890625, -0.056182861328125, -0.05352783203125, -0.050872802734375, -0.0482177734375, -0.045562744140625, -0.04290771484375, -0.040252685546875, -0.03759765625, -0.034942626953125, -0.03228759765625, -0.029632568359375, -0.0269775390625, -0.024322509765625, -0.02166748046875, -0.019012451171875, -0.016357421875, -0.013702392578125, -0.01104736328125, -0.008392333984375, -0.0057373046875, -0.003082275390625, -0.00042724609375, 0.002227783203125, 0.0048828125, 0.007537841796875, 0.01019287109375, 0.012847900390625, 0.0155029296875, 0.018157958984375, 0.02081298828125, 0.023468017578125, 0.026123046875, 0.028778076171875, 0.03143310546875, 0.034088134765625, 0.0367431640625, 0.039398193359375, 0.04205322265625, 0.044708251953125, 0.04736328125, 0.050018310546875, 0.05267333984375, 0.055328369140625, 0.0579833984375, 0.060638427734375, 0.06329345703125, 0.065948486328125, 0.068603515625, 0.071258544921875, 0.07391357421875, 0.076568603515625, 0.0792236328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 9.0, 3.0, 8.0, 10.0, 17.0, 19.0, 11.0, 18.0, 18.0, 27.0, 27.0, 25.0, 46.0, 46.0, 43.0, 51.0, 51.0, 36.0, 46.0, 46.0, 43.0, 33.0, 40.0, 46.0, 48.0, 37.0, 41.0, 31.0, 22.0, 16.0, 17.0, 19.0, 11.0, 6.0, 5.0, 9.0, 6.0, 3.0, 6.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.583984375, -0.566680908203125, -0.54937744140625, -0.532073974609375, -0.5147705078125, -0.497467041015625, -0.48016357421875, -0.462860107421875, -0.445556640625, -0.428253173828125, -0.41094970703125, -0.393646240234375, -0.3763427734375, -0.359039306640625, -0.34173583984375, -0.324432373046875, -0.30712890625, -0.289825439453125, -0.27252197265625, -0.255218505859375, -0.2379150390625, -0.220611572265625, -0.20330810546875, -0.186004638671875, -0.168701171875, -0.151397705078125, -0.13409423828125, -0.116790771484375, -0.0994873046875, -0.082183837890625, -0.06488037109375, -0.047576904296875, -0.0302734375, -0.012969970703125, 0.00433349609375, 0.021636962890625, 0.0389404296875, 0.056243896484375, 0.07354736328125, 0.090850830078125, 0.108154296875, 0.125457763671875, 0.14276123046875, 0.160064697265625, 0.1773681640625, 0.194671630859375, 0.21197509765625, 0.229278564453125, 0.24658203125, 0.263885498046875, 0.28118896484375, 0.298492431640625, 0.3157958984375, 0.333099365234375, 0.35040283203125, 0.367706298828125, 0.385009765625, 0.402313232421875, 0.41961669921875, 0.436920166015625, 0.4542236328125, 0.471527099609375, 0.48883056640625, 0.506134033203125, 0.5234375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 5.0, 9.0, 16.0, 14.0, 33.0, 43.0, 54.0, 81.0, 131.0, 214.0, 382.0, 677.0, 1378.0, 2977.0, 7206.0, 21174.0, 94362.0, 424977.0, 383616.0, 80181.0, 18870.0, 6431.0, 2801.0, 1325.0, 670.0, 379.0, 202.0, 120.0, 74.0, 45.0, 40.0, 13.0, 17.0, 8.0, 9.0, 8.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0294647216796875, -0.02851271629333496, -0.027560710906982422, -0.026608705520629883, -0.025656700134277344, -0.024704694747924805, -0.023752689361572266, -0.022800683975219727, -0.021848678588867188, -0.02089667320251465, -0.01994466781616211, -0.01899266242980957, -0.01804065704345703, -0.017088651657104492, -0.016136646270751953, -0.015184640884399414, -0.014232635498046875, -0.013280630111694336, -0.012328624725341797, -0.011376619338989258, -0.010424613952636719, -0.00947260856628418, -0.00852060317993164, -0.0075685977935791016, -0.0066165924072265625, -0.0056645870208740234, -0.004712581634521484, -0.0037605762481689453, -0.0028085708618164062, -0.0018565654754638672, -0.0009045600891113281, 4.744529724121094e-05, 0.00099945068359375, 0.001951456069946289, 0.002903461456298828, 0.003855466842651367, 0.004807472229003906, 0.005759477615356445, 0.006711483001708984, 0.0076634883880615234, 0.008615493774414062, 0.009567499160766602, 0.01051950454711914, 0.01147150993347168, 0.012423515319824219, 0.013375520706176758, 0.014327526092529297, 0.015279531478881836, 0.016231536865234375, 0.017183542251586914, 0.018135547637939453, 0.019087553024291992, 0.02003955841064453, 0.02099156379699707, 0.02194356918334961, 0.02289557456970215, 0.023847579956054688, 0.024799585342407227, 0.025751590728759766, 0.026703596115112305, 0.027655601501464844, 0.028607606887817383, 0.029559612274169922, 0.03051161766052246, 0.031463623046875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 2.0, 3.0, 0.0, 3.0, 8.0, 11.0, 6.0, 17.0, 18.0, 32.0, 44.0, 52.0, 70.0, 95.0, 134.0, 113.0, 105.0, 69.0, 70.0, 41.0, 31.0, 27.0, 18.0, 5.0, 9.0, 5.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5139579772949219e-05, -1.4603137969970703e-05, -1.4066696166992188e-05, -1.3530254364013672e-05, -1.2993812561035156e-05, -1.245737075805664e-05, -1.1920928955078125e-05, -1.138448715209961e-05, -1.0848045349121094e-05, -1.0311603546142578e-05, -9.775161743164062e-06, -9.238719940185547e-06, -8.702278137207031e-06, -8.165836334228516e-06, -7.62939453125e-06, -7.092952728271484e-06, -6.556510925292969e-06, -6.020069122314453e-06, -5.4836273193359375e-06, -4.947185516357422e-06, -4.410743713378906e-06, -3.874301910400391e-06, -3.337860107421875e-06, -2.8014183044433594e-06, -2.2649765014648438e-06, -1.7285346984863281e-06, -1.1920928955078125e-06, -6.556510925292969e-07, -1.1920928955078125e-07, 4.172325134277344e-07, 9.5367431640625e-07, 1.4901161193847656e-06, 2.0265579223632812e-06, 2.562999725341797e-06, 3.0994415283203125e-06, 3.635883331298828e-06, 4.172325134277344e-06, 4.708766937255859e-06, 5.245208740234375e-06, 5.781650543212891e-06, 6.318092346191406e-06, 6.854534149169922e-06, 7.3909759521484375e-06, 7.927417755126953e-06, 8.463859558105469e-06, 9.000301361083984e-06, 9.5367431640625e-06, 1.0073184967041016e-05, 1.0609626770019531e-05, 1.1146068572998047e-05, 1.1682510375976562e-05, 1.2218952178955078e-05, 1.2755393981933594e-05, 1.329183578491211e-05, 1.3828277587890625e-05, 1.436471939086914e-05, 1.4901161193847656e-05, 1.5437602996826172e-05, 1.5974044799804688e-05, 1.6510486602783203e-05, 1.704692840576172e-05, 1.7583370208740234e-05, 1.811981201171875e-05, 1.8656253814697266e-05, 1.919269561767578e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 8.0, 10.0, 24.0, 34.0, 49.0, 77.0, 133.0, 215.0, 366.0, 668.0, 1070.0, 1974.0, 4146.0, 9310.0, 27832.0, 109755.0, 400573.0, 359966.0, 91702.0, 24346.0, 8333.0, 3600.0, 1830.0, 999.0, 618.0, 379.0, 203.0, 126.0, 72.0, 41.0, 33.0, 21.0, 13.0, 9.0, 8.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0360107421875, -0.03506159782409668, -0.03411245346069336, -0.03316330909729004, -0.03221416473388672, -0.0312650203704834, -0.030315876007080078, -0.029366731643676758, -0.028417587280273438, -0.027468442916870117, -0.026519298553466797, -0.025570154190063477, -0.024621009826660156, -0.023671865463256836, -0.022722721099853516, -0.021773576736450195, -0.020824432373046875, -0.019875288009643555, -0.018926143646240234, -0.017976999282836914, -0.017027854919433594, -0.016078710556030273, -0.015129566192626953, -0.014180421829223633, -0.013231277465820312, -0.012282133102416992, -0.011332988739013672, -0.010383844375610352, -0.009434700012207031, -0.008485555648803711, -0.007536411285400391, -0.00658726692199707, -0.00563812255859375, -0.00468897819519043, -0.0037398338317871094, -0.002790689468383789, -0.0018415451049804688, -0.0008924007415771484, 5.6743621826171875e-05, 0.0010058879852294922, 0.0019550323486328125, 0.002904176712036133, 0.003853321075439453, 0.0048024654388427734, 0.005751609802246094, 0.006700754165649414, 0.007649898529052734, 0.008599042892456055, 0.009548187255859375, 0.010497331619262695, 0.011446475982666016, 0.012395620346069336, 0.013344764709472656, 0.014293909072875977, 0.015243053436279297, 0.016192197799682617, 0.017141342163085938, 0.018090486526489258, 0.019039630889892578, 0.0199887752532959, 0.02093791961669922, 0.02188706398010254, 0.02283620834350586, 0.02378535270690918, 0.0247344970703125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 5.0, 8.0, 6.0, 11.0, 3.0, 11.0, 18.0, 16.0, 33.0, 36.0, 57.0, 53.0, 67.0, 77.0, 72.0, 69.0, 81.0, 57.0, 61.0, 47.0, 41.0, 33.0, 30.0, 27.0, 21.0, 12.0, 9.0, 3.0, 8.0, 3.0, 3.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.008331298828125, -0.008081316947937012, -0.007831335067749023, -0.007581353187561035, -0.007331371307373047, -0.007081389427185059, -0.00683140754699707, -0.006581425666809082, -0.006331443786621094, -0.0060814619064331055, -0.005831480026245117, -0.005581498146057129, -0.005331516265869141, -0.005081534385681152, -0.004831552505493164, -0.004581570625305176, -0.0043315887451171875, -0.004081606864929199, -0.003831624984741211, -0.0035816431045532227, -0.0033316612243652344, -0.003081679344177246, -0.002831697463989258, -0.0025817155838012695, -0.0023317337036132812, -0.002081751823425293, -0.0018317699432373047, -0.0015817880630493164, -0.0013318061828613281, -0.0010818243026733398, -0.0008318424224853516, -0.0005818605422973633, -0.000331878662109375, -8.189678192138672e-05, 0.00016808509826660156, 0.00041806697845458984, 0.0006680488586425781, 0.0009180307388305664, 0.0011680126190185547, 0.001417994499206543, 0.0016679763793945312, 0.0019179582595825195, 0.002167940139770508, 0.002417922019958496, 0.0026679039001464844, 0.0029178857803344727, 0.003167867660522461, 0.0034178495407104492, 0.0036678314208984375, 0.003917813301086426, 0.004167795181274414, 0.004417777061462402, 0.004667758941650391, 0.004917740821838379, 0.005167722702026367, 0.0054177045822143555, 0.005667686462402344, 0.005917668342590332, 0.00616765022277832, 0.006417632102966309, 0.006667613983154297, 0.006917595863342285, 0.0071675777435302734, 0.007417559623718262, 0.00766754150390625]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 11.0, 34.0, 65.0, 145.0, 214.0, 238.0, 153.0, 79.0, 35.0, 12.0, 4.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.691898763179779, -0.6619037985801697, -0.6319088339805603, -0.6019138693809509, -0.5719189047813416, -0.5419239401817322, -0.5119289755821228, -0.4819340109825134, -0.45193904638290405, -0.4219440817832947, -0.3919491171836853, -0.3619541525840759, -0.33195918798446655, -0.3019642233848572, -0.2719692587852478, -0.24197429418563843, -0.21197932958602905, -0.18198436498641968, -0.1519894003868103, -0.12199443578720093, -0.09199947118759155, -0.06200450658798218, -0.0320095419883728, -0.0020145773887634277, 0.027980387210845947, 0.05797535181045532, 0.0879703164100647, 0.11796528100967407, 0.14796024560928345, 0.17795521020889282, 0.2079501748085022, 0.23794513940811157, 0.2679401636123657, 0.2979351282119751, 0.3279300928115845, 0.35792505741119385, 0.3879200220108032, 0.4179149866104126, 0.447909951210022, 0.47790491580963135, 0.5078998804092407, 0.5378948450088501, 0.5678898096084595, 0.5978847742080688, 0.6278797388076782, 0.6578747034072876, 0.687869668006897, 0.7178646326065063, 0.7478595972061157, 0.7778545618057251, 0.8078495264053345, 0.8378444910049438, 0.8678394556045532, 0.8978344202041626, 0.927829384803772, 0.9578243494033813, 0.9878193140029907, 1.0178142786026, 1.0478092432022095, 1.0778042078018188, 1.1077991724014282, 1.1377941370010376, 1.167789101600647, 1.1977840662002563, 1.2277790307998657]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 4.0, 6.0, 9.0, 13.0, 10.0, 12.0, 19.0, 21.0, 23.0, 47.0, 37.0, 28.0, 45.0, 65.0, 42.0, 46.0, 60.0, 56.0, 52.0, 40.0, 52.0, 47.0, 49.0, 35.0, 38.0, 29.0, 24.0, 14.0, 22.0, 7.0, 7.0, 8.0, 8.0, 5.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2623453438282013, -0.2529442012310028, -0.24354302883148193, -0.23414188623428345, -0.22474072873592377, -0.2153395712375641, -0.2059384137392044, -0.19653725624084473, -0.18713611364364624, -0.17773495614528656, -0.16833379864692688, -0.1589326560497284, -0.1495314985513687, -0.14013034105300903, -0.13072918355464935, -0.12132803350687027, -0.11192686855792999, -0.10252571105957031, -0.09312456101179123, -0.08372340351343155, -0.07432225346565247, -0.06492109596729279, -0.055519938468933105, -0.04611878842115402, -0.03671763092279434, -0.02731647714972496, -0.01791532151401043, -0.008514165878295898, 0.0008869878947734833, 0.010288141667842865, 0.019689299166202545, 0.02909044921398163, 0.03849160671234131, 0.04789276048541069, 0.05729391425848007, 0.06669507175683975, 0.07609622180461884, 0.08549737930297852, 0.0948985368013382, 0.10429968684911728, 0.11370084434747696, 0.12310200184583664, 0.13250315189361572, 0.1419043093919754, 0.15130546689033508, 0.16070660948753357, 0.17010778188705444, 0.17950892448425293, 0.1889100819826126, 0.1983112394809723, 0.20771239697933197, 0.21711355447769165, 0.22651469707489014, 0.23591585457324982, 0.2453170120716095, 0.254718154668808, 0.26411932706832886, 0.27352046966552734, 0.2829216420650482, 0.2923227846622467, 0.3017239570617676, 0.31112509965896606, 0.32052624225616455, 0.3299274146556854, 0.3393285572528839]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 7.0, 8.0, 7.0, 4.0, 14.0, 44.0, 54.0, 85.0, 149.0, 268.0, 568.0, 1301.0, 3526.0, 11035.0, 43254.0, 342061.0, 569590.0, 55920.0, 13728.0, 4134.0, 1447.0, 611.0, 298.0, 175.0, 95.0, 62.0, 27.0, 20.0, 19.0, 16.0, 5.0, 10.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0], "bins": [-0.50244140625, -0.4888916015625, -0.475341796875, -0.4617919921875, -0.4482421875, -0.4346923828125, -0.421142578125, -0.4075927734375, -0.39404296875, -0.3804931640625, -0.366943359375, -0.3533935546875, -0.33984375, -0.3262939453125, -0.312744140625, -0.2991943359375, -0.28564453125, -0.2720947265625, -0.258544921875, -0.2449951171875, -0.2314453125, -0.2178955078125, -0.204345703125, -0.1907958984375, -0.17724609375, -0.1636962890625, -0.150146484375, -0.1365966796875, -0.123046875, -0.1094970703125, -0.095947265625, -0.0823974609375, -0.06884765625, -0.0552978515625, -0.041748046875, -0.0281982421875, -0.0146484375, -0.0010986328125, 0.012451171875, 0.0260009765625, 0.03955078125, 0.0531005859375, 0.066650390625, 0.0802001953125, 0.09375, 0.1072998046875, 0.120849609375, 0.1343994140625, 0.14794921875, 0.1614990234375, 0.175048828125, 0.1885986328125, 0.2021484375, 0.2156982421875, 0.229248046875, 0.2427978515625, 0.25634765625, 0.2698974609375, 0.283447265625, 0.2969970703125, 0.310546875, 0.3240966796875, 0.337646484375, 0.3511962890625, 0.36474609375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 1.0, 6.0, 7.0, 11.0, 9.0, 15.0, 26.0, 13.0, 36.0, 34.0, 30.0, 37.0, 46.0, 37.0, 44.0, 57.0, 53.0, 51.0, 58.0, 48.0, 52.0, 57.0, 37.0, 53.0, 37.0, 17.0, 22.0, 19.0, 12.0, 16.0, 14.0, 6.0, 5.0, 10.0, 5.0, 3.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5498046875, -0.5316925048828125, -0.513580322265625, -0.4954681396484375, -0.47735595703125, -0.4592437744140625, -0.441131591796875, -0.4230194091796875, -0.4049072265625, -0.3867950439453125, -0.368682861328125, -0.3505706787109375, -0.33245849609375, -0.3143463134765625, -0.296234130859375, -0.2781219482421875, -0.260009765625, -0.2418975830078125, -0.223785400390625, -0.2056732177734375, -0.18756103515625, -0.1694488525390625, -0.151336669921875, -0.1332244873046875, -0.1151123046875, -0.0970001220703125, -0.078887939453125, -0.0607757568359375, -0.04266357421875, -0.0245513916015625, -0.006439208984375, 0.0116729736328125, 0.02978515625, 0.0478973388671875, 0.066009521484375, 0.0841217041015625, 0.10223388671875, 0.1203460693359375, 0.138458251953125, 0.1565704345703125, 0.1746826171875, 0.1927947998046875, 0.210906982421875, 0.2290191650390625, 0.24713134765625, 0.2652435302734375, 0.283355712890625, 0.3014678955078125, 0.319580078125, 0.3376922607421875, 0.355804443359375, 0.3739166259765625, 0.39202880859375, 0.4101409912109375, 0.428253173828125, 0.4463653564453125, 0.4644775390625, 0.4825897216796875, 0.500701904296875, 0.5188140869140625, 0.53692626953125, 0.5550384521484375, 0.573150634765625, 0.5912628173828125, 0.609375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 6.0, 6.0, 4.0, 6.0, 7.0, 10.0, 9.0, 12.0, 13.0, 12.0, 19.0, 23.0, 36.0, 42.0, 69.0, 71.0, 116.0, 158.0, 290.0, 605.0, 1836.0, 11212.0, 225697.0, 783161.0, 20809.0, 2648.0, 695.0, 321.0, 183.0, 131.0, 88.0, 59.0, 41.0, 33.0, 25.0, 22.0, 17.0, 21.0, 20.0, 6.0, 2.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6845703125, -0.6583709716796875, -0.632171630859375, -0.6059722900390625, -0.57977294921875, -0.5535736083984375, -0.527374267578125, -0.5011749267578125, -0.4749755859375, -0.4487762451171875, -0.422576904296875, -0.3963775634765625, -0.37017822265625, -0.3439788818359375, -0.317779541015625, -0.2915802001953125, -0.265380859375, -0.2391815185546875, -0.212982177734375, -0.1867828369140625, -0.16058349609375, -0.1343841552734375, -0.108184814453125, -0.0819854736328125, -0.0557861328125, -0.0295867919921875, -0.003387451171875, 0.0228118896484375, 0.04901123046875, 0.0752105712890625, 0.101409912109375, 0.1276092529296875, 0.15380859375, 0.1800079345703125, 0.206207275390625, 0.2324066162109375, 0.25860595703125, 0.2848052978515625, 0.311004638671875, 0.3372039794921875, 0.3634033203125, 0.3896026611328125, 0.415802001953125, 0.4420013427734375, 0.46820068359375, 0.4944000244140625, 0.520599365234375, 0.5467987060546875, 0.572998046875, 0.5991973876953125, 0.625396728515625, 0.6515960693359375, 0.67779541015625, 0.7039947509765625, 0.730194091796875, 0.7563934326171875, 0.7825927734375, 0.8087921142578125, 0.834991455078125, 0.8611907958984375, 0.88739013671875, 0.9135894775390625, 0.939788818359375, 0.9659881591796875, 0.9921875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 8.0, 3.0, 7.0, 14.0, 12.0, 15.0, 10.0, 15.0, 13.0, 21.0, 26.0, 30.0, 26.0, 44.0, 28.0, 38.0, 55.0, 45.0, 67.0, 63.0, 41.0, 46.0, 45.0, 45.0, 32.0, 37.0, 35.0, 21.0, 31.0, 16.0, 19.0, 20.0, 21.0, 17.0, 7.0, 6.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.578125, -0.557525634765625, -0.53692626953125, -0.516326904296875, -0.4957275390625, -0.475128173828125, -0.45452880859375, -0.433929443359375, -0.413330078125, -0.392730712890625, -0.37213134765625, -0.351531982421875, -0.3309326171875, -0.310333251953125, -0.28973388671875, -0.269134521484375, -0.24853515625, -0.227935791015625, -0.20733642578125, -0.186737060546875, -0.1661376953125, -0.145538330078125, -0.12493896484375, -0.104339599609375, -0.083740234375, -0.063140869140625, -0.04254150390625, -0.021942138671875, -0.0013427734375, 0.019256591796875, 0.03985595703125, 0.060455322265625, 0.0810546875, 0.101654052734375, 0.12225341796875, 0.142852783203125, 0.1634521484375, 0.184051513671875, 0.20465087890625, 0.225250244140625, 0.245849609375, 0.266448974609375, 0.28704833984375, 0.307647705078125, 0.3282470703125, 0.348846435546875, 0.36944580078125, 0.390045166015625, 0.41064453125, 0.431243896484375, 0.45184326171875, 0.472442626953125, 0.4930419921875, 0.513641357421875, 0.53424072265625, 0.554840087890625, 0.575439453125, 0.596038818359375, 0.61663818359375, 0.637237548828125, 0.6578369140625, 0.678436279296875, 0.69903564453125, 0.719635009765625, 0.740234375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 13.0, 18.0, 20.0, 34.0, 56.0, 113.0, 183.0, 382.0, 987.0, 5579.0, 634468.0, 399931.0, 4978.0, 979.0, 368.0, 182.0, 97.0, 61.0, 25.0, 28.0, 15.0, 9.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.55224609375, -0.5396881103515625, -0.527130126953125, -0.5145721435546875, -0.50201416015625, -0.4894561767578125, -0.476898193359375, -0.4643402099609375, -0.4517822265625, -0.4392242431640625, -0.426666259765625, -0.4141082763671875, -0.40155029296875, -0.3889923095703125, -0.376434326171875, -0.3638763427734375, -0.351318359375, -0.3387603759765625, -0.326202392578125, -0.3136444091796875, -0.30108642578125, -0.2885284423828125, -0.275970458984375, -0.2634124755859375, -0.2508544921875, -0.2382965087890625, -0.225738525390625, -0.2131805419921875, -0.20062255859375, -0.1880645751953125, -0.175506591796875, -0.1629486083984375, -0.150390625, -0.1378326416015625, -0.125274658203125, -0.1127166748046875, -0.10015869140625, -0.0876007080078125, -0.075042724609375, -0.0624847412109375, -0.0499267578125, -0.0373687744140625, -0.024810791015625, -0.0122528076171875, 0.00030517578125, 0.0128631591796875, 0.025421142578125, 0.0379791259765625, 0.050537109375, 0.0630950927734375, 0.075653076171875, 0.0882110595703125, 0.10076904296875, 0.1133270263671875, 0.125885009765625, 0.1384429931640625, 0.1510009765625, 0.1635589599609375, 0.176116943359375, 0.1886749267578125, 0.20123291015625, 0.2137908935546875, 0.226348876953125, 0.2389068603515625, 0.25146484375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 9.0, 14.0, 20.0, 69.0, 218.0, 505.0, 115.0, 41.0, 11.0, 9.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001373291015625, -0.00013459939509630203, -0.00013186968863010406, -0.0001291399821639061, -0.00012641027569770813, -0.00012368056923151016, -0.0001209508627653122, -0.00011822115629911423, -0.00011549144983291626, -0.00011276174336671829, -0.00011003203690052032, -0.00010730233043432236, -0.00010457262396812439, -0.00010184291750192642, -9.911321103572845e-05, -9.638350456953049e-05, -9.365379810333252e-05, -9.092409163713455e-05, -8.819438517093658e-05, -8.546467870473862e-05, -8.273497223854065e-05, -8.000526577234268e-05, -7.727555930614471e-05, -7.454585283994675e-05, -7.181614637374878e-05, -6.908643990755081e-05, -6.635673344135284e-05, -6.362702697515488e-05, -6.089732050895691e-05, -5.816761404275894e-05, -5.5437907576560974e-05, -5.2708201110363007e-05, -4.997849464416504e-05, -4.724878817796707e-05, -4.4519081711769104e-05, -4.1789375245571136e-05, -3.905966877937317e-05, -3.63299623131752e-05, -3.3600255846977234e-05, -3.0870549380779266e-05, -2.81408429145813e-05, -2.541113644838333e-05, -2.2681429982185364e-05, -1.9951723515987396e-05, -1.722201704978943e-05, -1.4492310583591461e-05, -1.1762604117393494e-05, -9.032897651195526e-06, -6.303191184997559e-06, -3.573484718799591e-06, -8.437782526016235e-07, 1.885928213596344e-06, 4.6156346797943115e-06, 7.345341145992279e-06, 1.0075047612190247e-05, 1.2804754078388214e-05, 1.553446054458618e-05, 1.826416701078415e-05, 2.0993873476982117e-05, 2.3723579943180084e-05, 2.6453286409378052e-05, 2.918299287557602e-05, 3.191269934177399e-05, 3.4642405807971954e-05, 3.737211227416992e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 10.0, 34.0, 53.0, 130.0, 300.0, 1018.0, 11944.0, 1021441.0, 12082.0, 1028.0, 276.0, 105.0, 56.0, 28.0, 23.0, 11.0, 7.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54248046875, -0.5220108032226562, -0.5015411376953125, -0.48107147216796875, -0.460601806640625, -0.44013214111328125, -0.4196624755859375, -0.39919281005859375, -0.37872314453125, -0.35825347900390625, -0.3377838134765625, -0.31731414794921875, -0.296844482421875, -0.27637481689453125, -0.2559051513671875, -0.23543548583984375, -0.2149658203125, -0.19449615478515625, -0.1740264892578125, -0.15355682373046875, -0.133087158203125, -0.11261749267578125, -0.0921478271484375, -0.07167816162109375, -0.05120849609375, -0.03073883056640625, -0.0102691650390625, 0.01020050048828125, 0.030670166015625, 0.05113983154296875, 0.0716094970703125, 0.09207916259765625, 0.112548828125, 0.13301849365234375, 0.1534881591796875, 0.17395782470703125, 0.194427490234375, 0.21489715576171875, 0.2353668212890625, 0.25583648681640625, 0.27630615234375, 0.29677581787109375, 0.3172454833984375, 0.33771514892578125, 0.358184814453125, 0.37865447998046875, 0.3991241455078125, 0.41959381103515625, 0.4400634765625, 0.46053314208984375, 0.4810028076171875, 0.5014724731445312, 0.521942138671875, 0.5424118041992188, 0.5628814697265625, 0.5833511352539062, 0.60382080078125, 0.6242904663085938, 0.6447601318359375, 0.6652297973632812, 0.685699462890625, 0.7061691284179688, 0.7266387939453125, 0.7471084594726562, 0.767578125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 7.0, 16.0, 22.0, 29.0, 51.0, 68.0, 148.0, 294.0, 148.0, 89.0, 51.0, 25.0, 21.0, 11.0, 10.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.140869140625, -0.1373891830444336, -0.1339092254638672, -0.13042926788330078, -0.12694931030273438, -0.12346935272216797, -0.11998939514160156, -0.11650943756103516, -0.11302947998046875, -0.10954952239990234, -0.10606956481933594, -0.10258960723876953, -0.09910964965820312, -0.09562969207763672, -0.09214973449707031, -0.0886697769165039, -0.0851898193359375, -0.0817098617553711, -0.07822990417480469, -0.07474994659423828, -0.07126998901367188, -0.06779003143310547, -0.06431007385253906, -0.060830116271972656, -0.05735015869140625, -0.053870201110839844, -0.05039024353027344, -0.04691028594970703, -0.043430328369140625, -0.03995037078857422, -0.03647041320800781, -0.032990455627441406, -0.029510498046875, -0.026030540466308594, -0.022550582885742188, -0.01907062530517578, -0.015590667724609375, -0.012110710144042969, -0.008630752563476562, -0.005150794982910156, -0.00167083740234375, 0.0018091201782226562, 0.0052890777587890625, 0.008769035339355469, 0.012248992919921875, 0.01572895050048828, 0.019208908081054688, 0.022688865661621094, 0.0261688232421875, 0.029648780822753906, 0.03312873840332031, 0.03660869598388672, 0.040088653564453125, 0.04356861114501953, 0.04704856872558594, 0.050528526306152344, 0.05400848388671875, 0.057488441467285156, 0.06096839904785156, 0.06444835662841797, 0.06792831420898438, 0.07140827178955078, 0.07488822937011719, 0.0783681869506836, 0.08184814453125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 8.0, 9.0, 13.0, 27.0, 36.0, 50.0, 80.0, 111.0, 125.0, 137.0, 111.0, 78.0, 79.0, 55.0, 24.0, 26.0, 15.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1382230520248413, -1.105010747909546, -1.07179856300354, -1.0385863780975342, -1.0053740739822388, -0.9721618294715881, -0.9389495849609375, -0.9057373404502869, -0.8725250959396362, -0.8393128514289856, -0.806100606918335, -0.7728883624076843, -0.7396761178970337, -0.7064638733863831, -0.6732516288757324, -0.6400393843650818, -0.6068271398544312, -0.5736148953437805, -0.5404026508331299, -0.5071904063224792, -0.4739781618118286, -0.440765917301178, -0.40755367279052734, -0.3743414282798767, -0.3411291837692261, -0.30791693925857544, -0.2747046947479248, -0.24149245023727417, -0.20828020572662354, -0.1750679612159729, -0.14185571670532227, -0.10864347219467163, -0.07543134689331055, -0.04221910238265991, -0.009006857872009277, 0.024205386638641357, 0.05741763114929199, 0.09062987565994263, 0.12384212017059326, 0.1570543646812439, 0.19026660919189453, 0.22347885370254517, 0.2566910982131958, 0.28990334272384644, 0.32311558723449707, 0.3563278317451477, 0.38954007625579834, 0.422752320766449, 0.4559645652770996, 0.48917680978775024, 0.5223890542984009, 0.5556012988090515, 0.5888135433197021, 0.6220257878303528, 0.6552380323410034, 0.688450276851654, 0.7216625213623047, 0.7548747658729553, 0.788087010383606, 0.8212992548942566, 0.8545114994049072, 0.8877237439155579, 0.9209359884262085, 0.9541482329368591, 0.9873604774475098]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 10.0, 8.0, 7.0, 13.0, 15.0, 22.0, 9.0, 18.0, 28.0, 26.0, 36.0, 25.0, 30.0, 34.0, 32.0, 40.0, 45.0, 35.0, 41.0, 51.0, 42.0, 31.0, 41.0, 34.0, 40.0, 26.0, 36.0, 44.0, 16.0, 16.0, 12.0, 18.0, 17.0, 12.0, 16.0, 12.0, 7.0, 6.0, 10.0, 6.0, 9.0, 6.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0], "bins": [-0.9578178524971008, -0.9307506680488586, -0.9036834836006165, -0.8766162991523743, -0.8495491147041321, -0.8224819302558899, -0.7954146862030029, -0.7683475017547607, -0.7412803173065186, -0.7142131328582764, -0.6871459484100342, -0.660078763961792, -0.6330115795135498, -0.6059443950653076, -0.5788772106170654, -0.5518100261688232, -0.524742841720581, -0.49767565727233887, -0.4706084728240967, -0.4435412883758545, -0.4164741039276123, -0.3894069194793701, -0.36233970522880554, -0.33527252078056335, -0.30820533633232117, -0.281138151884079, -0.2540709674358368, -0.2270037680864334, -0.19993658363819122, -0.17286939918994904, -0.14580219984054565, -0.11873501539230347, -0.0916677713394165, -0.06460058689117432, -0.03753339499235153, -0.010466203093528748, 0.01660098135471344, 0.04366816580295563, 0.07073536515235901, 0.0978025496006012, 0.12486973404884338, 0.15193691849708557, 0.17900410294532776, 0.20607130229473114, 0.23313848674297333, 0.2602056860923767, 0.2872728705406189, 0.3143400549888611, 0.34140723943710327, 0.36847442388534546, 0.39554160833358765, 0.42260879278182983, 0.449675977230072, 0.4767431616783142, 0.5038104057312012, 0.5308775901794434, 0.5579447746276855, 0.5850119590759277, 0.6120791435241699, 0.6391463279724121, 0.6662135124206543, 0.6932806968688965, 0.7203478813171387, 0.7474150657653809, 0.774482250213623]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 6.0, 5.0, 5.0, 2.0, 5.0, 9.0, 11.0, 15.0, 24.0, 38.0, 61.0, 103.0, 151.0, 262.0, 576.0, 1469.0, 5180.0, 33146.0, 1774142.0, 2329801.0, 40134.0, 6099.0, 1778.0, 602.0, 274.0, 166.0, 79.0, 53.0, 36.0, 21.0, 14.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3427734375, -1.309234619140625, -1.27569580078125, -1.242156982421875, -1.2086181640625, -1.175079345703125, -1.14154052734375, -1.108001708984375, -1.074462890625, -1.040924072265625, -1.00738525390625, -0.973846435546875, -0.9403076171875, -0.906768798828125, -0.87322998046875, -0.839691162109375, -0.80615234375, -0.772613525390625, -0.73907470703125, -0.705535888671875, -0.6719970703125, -0.638458251953125, -0.60491943359375, -0.571380615234375, -0.537841796875, -0.504302978515625, -0.47076416015625, -0.437225341796875, -0.4036865234375, -0.370147705078125, -0.33660888671875, -0.303070068359375, -0.26953125, -0.235992431640625, -0.20245361328125, -0.168914794921875, -0.1353759765625, -0.101837158203125, -0.06829833984375, -0.034759521484375, -0.001220703125, 0.032318115234375, 0.06585693359375, 0.099395751953125, 0.1329345703125, 0.166473388671875, 0.20001220703125, 0.233551025390625, 0.26708984375, 0.300628662109375, 0.33416748046875, 0.367706298828125, 0.4012451171875, 0.434783935546875, 0.46832275390625, 0.501861572265625, 0.535400390625, 0.568939208984375, 0.60247802734375, 0.636016845703125, 0.6695556640625, 0.703094482421875, 0.73663330078125, 0.770172119140625, 0.8037109375]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 7.0, 11.0, 9.0, 5.0, 10.0, 15.0, 17.0, 28.0, 27.0, 35.0, 40.0, 37.0, 49.0, 65.0, 51.0, 59.0, 62.0, 53.0, 63.0, 48.0, 57.0, 39.0, 39.0, 27.0, 34.0, 26.0, 21.0, 13.0, 15.0, 10.0, 8.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.312744140625, -0.3009033203125, -0.2890625, -0.2772216796875, -0.265380859375, -0.2535400390625, -0.24169921875, -0.2298583984375, -0.218017578125, -0.2061767578125, -0.1943359375, -0.1824951171875, -0.170654296875, -0.1588134765625, -0.14697265625, -0.1351318359375, -0.123291015625, -0.1114501953125, -0.099609375, -0.0877685546875, -0.075927734375, -0.0640869140625, -0.05224609375, -0.0404052734375, -0.028564453125, -0.0167236328125, -0.0048828125, 0.0069580078125, 0.018798828125, 0.0306396484375, 0.04248046875, 0.0543212890625, 0.066162109375, 0.0780029296875, 0.08984375, 0.1016845703125, 0.113525390625, 0.1253662109375, 0.13720703125, 0.1490478515625, 0.160888671875, 0.1727294921875, 0.1845703125, 0.1964111328125, 0.208251953125, 0.2200927734375, 0.23193359375, 0.2437744140625, 0.255615234375, 0.2674560546875, 0.279296875, 0.2911376953125, 0.302978515625, 0.3148193359375, 0.32666015625, 0.3385009765625, 0.350341796875, 0.3621826171875, 0.3740234375, 0.3858642578125, 0.397705078125, 0.4095458984375, 0.42138671875, 0.4332275390625, 0.445068359375]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 3.0, 5.0, 3.0, 5.0, 10.0, 12.0, 19.0, 24.0, 32.0, 61.0, 80.0, 144.0, 260.0, 542.0, 1276.0, 4394.0, 25120.0, 1038126.0, 3074041.0, 41197.0, 5852.0, 1640.0, 640.0, 355.0, 156.0, 99.0, 60.0, 33.0, 24.0, 30.0, 12.0, 12.0, 9.0, 8.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6865234375, -0.65545654296875, -0.6243896484375, -0.59332275390625, -0.562255859375, -0.53118896484375, -0.5001220703125, -0.46905517578125, -0.43798828125, -0.40692138671875, -0.3758544921875, -0.34478759765625, -0.313720703125, -0.28265380859375, -0.2515869140625, -0.22052001953125, -0.189453125, -0.15838623046875, -0.1273193359375, -0.09625244140625, -0.065185546875, -0.03411865234375, -0.0030517578125, 0.02801513671875, 0.05908203125, 0.09014892578125, 0.1212158203125, 0.15228271484375, 0.183349609375, 0.21441650390625, 0.2454833984375, 0.27655029296875, 0.3076171875, 0.33868408203125, 0.3697509765625, 0.40081787109375, 0.431884765625, 0.46295166015625, 0.4940185546875, 0.52508544921875, 0.55615234375, 0.58721923828125, 0.6182861328125, 0.64935302734375, 0.680419921875, 0.71148681640625, 0.7425537109375, 0.77362060546875, 0.8046875, 0.83575439453125, 0.8668212890625, 0.89788818359375, 0.928955078125, 0.96002197265625, 0.9910888671875, 1.02215576171875, 1.05322265625, 1.08428955078125, 1.1153564453125, 1.14642333984375, 1.177490234375, 1.20855712890625, 1.2396240234375, 1.27069091796875, 1.3017578125]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 14.0, 14.0, 18.0, 16.0, 37.0, 28.0, 48.0, 72.0, 114.0, 179.0, 293.0, 544.0, 691.0, 726.0, 491.0, 327.0, 159.0, 90.0, 71.0, 28.0, 24.0, 15.0, 15.0, 15.0, 7.0, 4.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1976318359375, -0.1921253204345703, -0.18661880493164062, -0.18111228942871094, -0.17560577392578125, -0.17009925842285156, -0.16459274291992188, -0.1590862274169922, -0.1535797119140625, -0.1480731964111328, -0.14256668090820312, -0.13706016540527344, -0.13155364990234375, -0.12604713439941406, -0.12054061889648438, -0.11503410339355469, -0.109527587890625, -0.10402107238769531, -0.09851455688476562, -0.09300804138183594, -0.08750152587890625, -0.08199501037597656, -0.07648849487304688, -0.07098197937011719, -0.0654754638671875, -0.05996894836425781, -0.054462432861328125, -0.04895591735839844, -0.04344940185546875, -0.03794288635253906, -0.032436370849609375, -0.026929855346679688, -0.02142333984375, -0.015916824340820312, -0.010410308837890625, -0.0049037933349609375, 0.00060272216796875, 0.0061092376708984375, 0.011615753173828125, 0.017122268676757812, 0.0226287841796875, 0.028135299682617188, 0.033641815185546875, 0.03914833068847656, 0.04465484619140625, 0.05016136169433594, 0.055667877197265625, 0.06117439270019531, 0.066680908203125, 0.07218742370605469, 0.07769393920898438, 0.08320045471191406, 0.08870697021484375, 0.09421348571777344, 0.09972000122070312, 0.10522651672363281, 0.1107330322265625, 0.11623954772949219, 0.12174606323242188, 0.12725257873535156, 0.13275909423828125, 0.13826560974121094, 0.14377212524414062, 0.1492786407470703, 0.15478515625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 9.0, 10.0, 15.0, 21.0, 24.0, 50.0, 73.0, 76.0, 101.0, 121.0, 105.0, 106.0, 84.0, 59.0, 55.0, 30.0, 20.0, 16.0, 4.0, 10.0, 7.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6262499690055847, -0.6048156023025513, -0.5833812355995178, -0.5619468688964844, -0.5405125617980957, -0.5190781950950623, -0.4976438283920288, -0.47620946168899536, -0.4547750949859619, -0.43334072828292847, -0.411906361579895, -0.39047202467918396, -0.3690376579761505, -0.34760329127311707, -0.326168954372406, -0.30473458766937256, -0.2833002209663391, -0.26186585426330566, -0.2404315024614334, -0.21899715065956116, -0.1975627839565277, -0.17612841725349426, -0.154694065451622, -0.13325971364974976, -0.11182534694671631, -0.09039098769426346, -0.06895662844181061, -0.04752226918935776, -0.026087909936904907, -0.004653550684452057, 0.016780808568000793, 0.03821516036987305, 0.05964958667755127, 0.08108394593000412, 0.10251830518245697, 0.12395266443490982, 0.14538702368736267, 0.16682139039039612, 0.18825574219226837, 0.20969009399414062, 0.23112446069717407, 0.2525588274002075, 0.27399319410324097, 0.295427531003952, 0.3168618977069855, 0.3382962644100189, 0.35973060131073, 0.3811649680137634, 0.4025993347167969, 0.4240337014198303, 0.44546806812286377, 0.46690240502357483, 0.4883367717266083, 0.5097711086273193, 0.5312054753303528, 0.5526398420333862, 0.5740742087364197, 0.5955085754394531, 0.6169429421424866, 0.63837730884552, 0.6598116159439087, 0.6812459826469421, 0.7026803493499756, 0.724114716053009, 0.7455490827560425]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 6.0, 4.0, 3.0, 8.0, 10.0, 14.0, 10.0, 10.0, 13.0, 20.0, 27.0, 22.0, 15.0, 31.0, 37.0, 44.0, 51.0, 47.0, 45.0, 43.0, 47.0, 53.0, 35.0, 43.0, 31.0, 48.0, 41.0, 41.0, 25.0, 31.0, 18.0, 15.0, 19.0, 18.0, 20.0, 13.0, 14.0, 12.0, 6.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.3579709529876709, -0.34680646657943726, -0.3356419801712036, -0.32447749376296997, -0.31331300735473633, -0.3021485209465027, -0.29098403453826904, -0.2798195481300354, -0.26865506172180176, -0.2574905753135681, -0.24632608890533447, -0.23516160249710083, -0.2239971160888672, -0.21283262968063354, -0.2016681432723999, -0.19050365686416626, -0.17933915555477142, -0.16817466914653778, -0.15701018273830414, -0.1458456963300705, -0.13468120992183685, -0.12351672351360321, -0.11235222965478897, -0.10118774324655533, -0.09002325683832169, -0.07885877043008804, -0.0676942840218544, -0.05652979388833046, -0.04536530748009682, -0.034200821071863174, -0.023036330938339233, -0.01187184453010559, -0.0007073581218719482, 0.010457129217684269, 0.021621616557240486, 0.03278610482811928, 0.04395059123635292, 0.05511507764458656, 0.0662795677781105, 0.07744405418634415, 0.08860854059457779, 0.09977302700281143, 0.11093751341104507, 0.12210200726985931, 0.13326649367809296, 0.1444309800863266, 0.15559546649456024, 0.16675995290279388, 0.17792443931102753, 0.18908892571926117, 0.2002534121274948, 0.21141789853572845, 0.2225823849439621, 0.23374687135219574, 0.24491137266159058, 0.2560758590698242, 0.26724034547805786, 0.2784048318862915, 0.28956931829452515, 0.3007338047027588, 0.31189829111099243, 0.3230627775192261, 0.3342272639274597, 0.34539175033569336, 0.356556236743927]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 8.0, 17.0, 13.0, 22.0, 31.0, 56.0, 122.0, 265.0, 642.0, 1739.0, 5457.0, 20905.0, 257899.0, 703172.0, 45013.0, 8894.0, 2647.0, 882.0, 363.0, 167.0, 85.0, 48.0, 28.0, 17.0, 11.0, 13.0, 5.0, 8.0, 3.0, 7.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.289794921875, -0.2805061340332031, -0.27121734619140625, -0.2619285583496094, -0.2526397705078125, -0.24335098266601562, -0.23406219482421875, -0.22477340698242188, -0.215484619140625, -0.20619583129882812, -0.19690704345703125, -0.18761825561523438, -0.1783294677734375, -0.16904067993164062, -0.15975189208984375, -0.15046310424804688, -0.14117431640625, -0.13188552856445312, -0.12259674072265625, -0.11330795288085938, -0.1040191650390625, -0.09473037719726562, -0.08544158935546875, -0.07615280151367188, -0.066864013671875, -0.057575225830078125, -0.04828643798828125, -0.038997650146484375, -0.0297088623046875, -0.020420074462890625, -0.01113128662109375, -0.001842498779296875, 0.0074462890625, 0.016735076904296875, 0.02602386474609375, 0.035312652587890625, 0.0446014404296875, 0.053890228271484375, 0.06317901611328125, 0.07246780395507812, 0.081756591796875, 0.09104537963867188, 0.10033416748046875, 0.10962295532226562, 0.1189117431640625, 0.12820053100585938, 0.13748931884765625, 0.14677810668945312, 0.15606689453125, 0.16535568237304688, 0.17464447021484375, 0.18393325805664062, 0.1932220458984375, 0.20251083374023438, 0.21179962158203125, 0.22108840942382812, 0.230377197265625, 0.23966598510742188, 0.24895477294921875, 0.2582435607910156, 0.2675323486328125, 0.2768211364746094, 0.28610992431640625, 0.2953987121582031, 0.3046875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 4.0, 4.0, 8.0, 8.0, 12.0, 14.0, 11.0, 21.0, 21.0, 33.0, 28.0, 34.0, 44.0, 59.0, 57.0, 55.0, 48.0, 61.0, 52.0, 54.0, 49.0, 53.0, 46.0, 34.0, 30.0, 29.0, 29.0, 21.0, 19.0, 20.0, 8.0, 14.0, 6.0, 3.0, 5.0, 2.0, 0.0, 3.0, 4.0, 2.0, 0.0, 0.0, 4.0], "bins": [-0.368896484375, -0.35936546325683594, -0.3498344421386719, -0.3403034210205078, -0.33077239990234375, -0.3212413787841797, -0.3117103576660156, -0.30217933654785156, -0.2926483154296875, -0.28311729431152344, -0.2735862731933594, -0.2640552520751953, -0.25452423095703125, -0.2449932098388672, -0.23546218872070312, -0.22593116760253906, -0.216400146484375, -0.20686912536621094, -0.19733810424804688, -0.1878070831298828, -0.17827606201171875, -0.1687450408935547, -0.15921401977539062, -0.14968299865722656, -0.1401519775390625, -0.13062095642089844, -0.12108993530273438, -0.11155891418457031, -0.10202789306640625, -0.09249687194824219, -0.08296585083007812, -0.07343482971191406, -0.06390380859375, -0.05437278747558594, -0.044841766357421875, -0.03531074523925781, -0.02577972412109375, -0.016248703002929688, -0.006717681884765625, 0.0028133392333984375, 0.0123443603515625, 0.021875381469726562, 0.031406402587890625, 0.04093742370605469, 0.05046844482421875, 0.05999946594238281, 0.06953048706054688, 0.07906150817871094, 0.088592529296875, 0.09812355041503906, 0.10765457153320312, 0.11718559265136719, 0.12671661376953125, 0.1362476348876953, 0.14577865600585938, 0.15530967712402344, 0.1648406982421875, 0.17437171936035156, 0.18390274047851562, 0.1934337615966797, 0.20296478271484375, 0.2124958038330078, 0.22202682495117188, 0.23155784606933594, 0.2410888671875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 12.0, 12.0, 33.0, 36.0, 60.0, 121.0, 240.0, 554.0, 1143.0, 2907.0, 9311.0, 40356.0, 279672.0, 590104.0, 97597.0, 17936.0, 5011.0, 1886.0, 774.0, 377.0, 173.0, 106.0, 52.0, 28.0, 21.0, 8.0, 3.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1385498046875, -0.13346481323242188, -0.12837982177734375, -0.12329483032226562, -0.1182098388671875, -0.11312484741210938, -0.10803985595703125, -0.10295486450195312, -0.097869873046875, -0.09278488159179688, -0.08769989013671875, -0.08261489868164062, -0.0775299072265625, -0.07244491577148438, -0.06735992431640625, -0.062274932861328125, -0.05718994140625, -0.052104949951171875, -0.04701995849609375, -0.041934967041015625, -0.0368499755859375, -0.031764984130859375, -0.02667999267578125, -0.021595001220703125, -0.016510009765625, -0.011425018310546875, -0.00634002685546875, -0.001255035400390625, 0.0038299560546875, 0.008914947509765625, 0.01399993896484375, 0.019084930419921875, 0.024169921875, 0.029254913330078125, 0.03433990478515625, 0.039424896240234375, 0.0445098876953125, 0.049594879150390625, 0.05467987060546875, 0.059764862060546875, 0.064849853515625, 0.06993484497070312, 0.07501983642578125, 0.08010482788085938, 0.0851898193359375, 0.09027481079101562, 0.09535980224609375, 0.10044479370117188, 0.10552978515625, 0.11061477661132812, 0.11569976806640625, 0.12078475952148438, 0.1258697509765625, 0.13095474243164062, 0.13603973388671875, 0.14112472534179688, 0.146209716796875, 0.15129470825195312, 0.15637969970703125, 0.16146469116210938, 0.1665496826171875, 0.17163467407226562, 0.17671966552734375, 0.18180465698242188, 0.1868896484375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 2.0, 2.0, 7.0, 8.0, 11.0, 10.0, 19.0, 17.0, 18.0, 20.0, 33.0, 36.0, 41.0, 34.0, 43.0, 49.0, 40.0, 59.0, 44.0, 47.0, 53.0, 37.0, 43.0, 43.0, 46.0, 38.0, 38.0, 34.0, 25.0, 23.0, 15.0, 7.0, 12.0, 6.0, 8.0, 6.0, 7.0, 3.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.548828125, -0.5302047729492188, -0.5115814208984375, -0.49295806884765625, -0.474334716796875, -0.45571136474609375, -0.4370880126953125, -0.41846466064453125, -0.39984130859375, -0.38121795654296875, -0.3625946044921875, -0.34397125244140625, -0.325347900390625, -0.30672454833984375, -0.2881011962890625, -0.26947784423828125, -0.2508544921875, -0.23223114013671875, -0.2136077880859375, -0.19498443603515625, -0.176361083984375, -0.15773773193359375, -0.1391143798828125, -0.12049102783203125, -0.10186767578125, -0.08324432373046875, -0.0646209716796875, -0.04599761962890625, -0.027374267578125, -0.00875091552734375, 0.0098724365234375, 0.02849578857421875, 0.047119140625, 0.06574249267578125, 0.0843658447265625, 0.10298919677734375, 0.121612548828125, 0.14023590087890625, 0.1588592529296875, 0.17748260498046875, 0.19610595703125, 0.21472930908203125, 0.2333526611328125, 0.25197601318359375, 0.270599365234375, 0.28922271728515625, 0.3078460693359375, 0.32646942138671875, 0.3450927734375, 0.36371612548828125, 0.3823394775390625, 0.40096282958984375, 0.419586181640625, 0.43820953369140625, 0.4568328857421875, 0.47545623779296875, 0.49407958984375, 0.5127029418945312, 0.5313262939453125, 0.5499496459960938, 0.568572998046875, 0.5871963500976562, 0.6058197021484375, 0.6244430541992188, 0.64306640625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 10.0, 20.0, 17.0, 36.0, 46.0, 55.0, 115.0, 201.0, 409.0, 744.0, 1776.0, 4142.0, 11670.0, 44173.0, 242268.0, 540233.0, 156746.0, 30897.0, 8871.0, 3343.0, 1411.0, 618.0, 327.0, 176.0, 106.0, 59.0, 23.0, 20.0, 10.0, 9.0, 10.0, 1.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.042022705078125, -0.04092764854431152, -0.03983259201049805, -0.03873753547668457, -0.037642478942871094, -0.03654742240905762, -0.03545236587524414, -0.034357309341430664, -0.03326225280761719, -0.03216719627380371, -0.031072139739990234, -0.029977083206176758, -0.02888202667236328, -0.027786970138549805, -0.026691913604736328, -0.02559685707092285, -0.024501800537109375, -0.0234067440032959, -0.022311687469482422, -0.021216630935668945, -0.02012157440185547, -0.019026517868041992, -0.017931461334228516, -0.01683640480041504, -0.015741348266601562, -0.014646291732788086, -0.01355123519897461, -0.012456178665161133, -0.011361122131347656, -0.01026606559753418, -0.009171009063720703, -0.008075952529907227, -0.00698089599609375, -0.0058858394622802734, -0.004790782928466797, -0.0036957263946533203, -0.0026006698608398438, -0.0015056133270263672, -0.0004105567932128906, 0.0006844997406005859, 0.0017795562744140625, 0.002874612808227539, 0.003969669342041016, 0.005064725875854492, 0.006159782409667969, 0.007254838943481445, 0.008349895477294922, 0.009444952011108398, 0.010540008544921875, 0.011635065078735352, 0.012730121612548828, 0.013825178146362305, 0.014920234680175781, 0.016015291213989258, 0.017110347747802734, 0.01820540428161621, 0.019300460815429688, 0.020395517349243164, 0.02149057388305664, 0.022585630416870117, 0.023680686950683594, 0.02477574348449707, 0.025870800018310547, 0.026965856552124023, 0.0280609130859375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 3.0, 3.0, 3.0, 9.0, 11.0, 18.0, 25.0, 44.0, 35.0, 62.0, 79.0, 86.0, 94.0, 107.0, 94.0, 88.0, 58.0, 51.0, 43.0, 22.0, 14.0, 14.0, 11.0, 5.0, 3.0, 3.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6033649444580078e-05, -1.54813751578331e-05, -1.492910087108612e-05, -1.4376826584339142e-05, -1.3824552297592163e-05, -1.3272278010845184e-05, -1.2720003724098206e-05, -1.2167729437351227e-05, -1.1615455150604248e-05, -1.106318086385727e-05, -1.051090657711029e-05, -9.958632290363312e-06, -9.406358003616333e-06, -8.854083716869354e-06, -8.301809430122375e-06, -7.749535143375397e-06, -7.197260856628418e-06, -6.644986569881439e-06, -6.0927122831344604e-06, -5.540437996387482e-06, -4.988163709640503e-06, -4.435889422893524e-06, -3.883615136146545e-06, -3.3313408493995667e-06, -2.779066562652588e-06, -2.226792275905609e-06, -1.6745179891586304e-06, -1.1222437024116516e-06, -5.699694156646729e-07, -1.7695128917694092e-08, 5.345791578292847e-07, 1.0868534445762634e-06, 1.6391277313232422e-06, 2.191402018070221e-06, 2.7436763048171997e-06, 3.2959505915641785e-06, 3.848224878311157e-06, 4.400499165058136e-06, 4.952773451805115e-06, 5.5050477385520935e-06, 6.057322025299072e-06, 6.609596312046051e-06, 7.16187059879303e-06, 7.714144885540009e-06, 8.266419172286987e-06, 8.818693459033966e-06, 9.370967745780945e-06, 9.923242032527924e-06, 1.0475516319274902e-05, 1.1027790606021881e-05, 1.158006489276886e-05, 1.2132339179515839e-05, 1.2684613466262817e-05, 1.3236887753009796e-05, 1.3789162039756775e-05, 1.4341436326503754e-05, 1.4893710613250732e-05, 1.544598489999771e-05, 1.599825918674469e-05, 1.655053347349167e-05, 1.7102807760238647e-05, 1.7655082046985626e-05, 1.8207356333732605e-05, 1.8759630620479584e-05, 1.9311904907226562e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 5.0, 9.0, 8.0, 10.0, 16.0, 15.0, 25.0, 35.0, 43.0, 47.0, 82.0, 139.0, 230.0, 406.0, 776.0, 1634.0, 3617.0, 10003.0, 30793.0, 119041.0, 396944.0, 348208.0, 95760.0, 25998.0, 8421.0, 3220.0, 1412.0, 728.0, 335.0, 196.0, 120.0, 79.0, 61.0, 34.0, 29.0, 17.0, 11.0, 15.0, 15.0, 7.0, 3.0, 2.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0343017578125, -0.03325986862182617, -0.032217979431152344, -0.031176090240478516, -0.030134201049804688, -0.02909231185913086, -0.02805042266845703, -0.027008533477783203, -0.025966644287109375, -0.024924755096435547, -0.02388286590576172, -0.02284097671508789, -0.021799087524414062, -0.020757198333740234, -0.019715309143066406, -0.018673419952392578, -0.01763153076171875, -0.016589641571044922, -0.015547752380371094, -0.014505863189697266, -0.013463973999023438, -0.01242208480834961, -0.011380195617675781, -0.010338306427001953, -0.009296417236328125, -0.008254528045654297, -0.007212638854980469, -0.006170749664306641, -0.0051288604736328125, -0.004086971282958984, -0.0030450820922851562, -0.002003192901611328, -0.0009613037109375, 8.058547973632812e-05, 0.0011224746704101562, 0.0021643638610839844, 0.0032062530517578125, 0.004248142242431641, 0.005290031433105469, 0.006331920623779297, 0.007373809814453125, 0.008415699005126953, 0.009457588195800781, 0.01049947738647461, 0.011541366577148438, 0.012583255767822266, 0.013625144958496094, 0.014667034149169922, 0.01570892333984375, 0.016750812530517578, 0.017792701721191406, 0.018834590911865234, 0.019876480102539062, 0.02091836929321289, 0.02196025848388672, 0.023002147674560547, 0.024044036865234375, 0.025085926055908203, 0.02612781524658203, 0.02716970443725586, 0.028211593627929688, 0.029253482818603516, 0.030295372009277344, 0.03133726119995117, 0.032379150390625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 7.0, 5.0, 10.0, 6.0, 8.0, 10.0, 10.0, 20.0, 27.0, 40.0, 52.0, 53.0, 69.0, 74.0, 67.0, 86.0, 85.0, 66.0, 67.0, 47.0, 41.0, 34.0, 29.0, 23.0, 12.0, 11.0, 13.0, 9.0, 5.0, 7.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0117950439453125, -0.011431217193603516, -0.011067390441894531, -0.010703563690185547, -0.010339736938476562, -0.009975910186767578, -0.009612083435058594, -0.00924825668334961, -0.008884429931640625, -0.00852060317993164, -0.008156776428222656, -0.007792949676513672, -0.0074291229248046875, -0.007065296173095703, -0.006701469421386719, -0.006337642669677734, -0.00597381591796875, -0.005609989166259766, -0.005246162414550781, -0.004882335662841797, -0.0045185089111328125, -0.004154682159423828, -0.0037908554077148438, -0.0034270286560058594, -0.003063201904296875, -0.0026993751525878906, -0.0023355484008789062, -0.001971721649169922, -0.0016078948974609375, -0.0012440681457519531, -0.0008802413940429688, -0.0005164146423339844, -0.000152587890625, 0.00021123886108398438, 0.0005750656127929688, 0.0009388923645019531, 0.0013027191162109375, 0.0016665458679199219, 0.0020303726196289062, 0.0023941993713378906, 0.002758026123046875, 0.0031218528747558594, 0.0034856796264648438, 0.003849506378173828, 0.0042133331298828125, 0.004577159881591797, 0.004940986633300781, 0.005304813385009766, 0.00566864013671875, 0.006032466888427734, 0.006396293640136719, 0.006760120391845703, 0.0071239471435546875, 0.007487773895263672, 0.007851600646972656, 0.00821542739868164, 0.008579254150390625, 0.00894308090209961, 0.009306907653808594, 0.009670734405517578, 0.010034561157226562, 0.010398387908935547, 0.010762214660644531, 0.011126041412353516, 0.0114898681640625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 5.0, 6.0, 8.0, 21.0, 29.0, 44.0, 73.0, 112.0, 162.0, 146.0, 146.0, 106.0, 62.0, 30.0, 24.0, 14.0, 9.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3167197108268738, -0.2973078489303589, -0.277895987033844, -0.2584841251373291, -0.2390722781419754, -0.2196604162454605, -0.2002485692501068, -0.18083670735359192, -0.16142484545707703, -0.14201298356056213, -0.12260112911462784, -0.10318927466869354, -0.08377741277217865, -0.06436555087566376, -0.04495369642972946, -0.025541841983795166, -0.0061299800872802734, 0.01328187808394432, 0.032693736255168915, 0.05210559442639351, 0.0715174525976181, 0.090929314494133, 0.11034116894006729, 0.1297530233860016, 0.14916488528251648, 0.16857674717903137, 0.18798860907554626, 0.20740045607089996, 0.22681231796741486, 0.24622417986392975, 0.26563602685928345, 0.28504788875579834, 0.304459810256958, 0.3238716721534729, 0.3432835340499878, 0.3626953959465027, 0.3821072578430176, 0.40151911973953247, 0.420930951833725, 0.44034281373023987, 0.45975467562675476, 0.47916653752326965, 0.49857839941978455, 0.517990231513977, 0.5374020934104919, 0.5568139553070068, 0.5762258172035217, 0.5956376791000366, 0.6150495409965515, 0.6344614028930664, 0.6538732647895813, 0.6732851266860962, 0.6926969885826111, 0.712108850479126, 0.7315207123756409, 0.7509325742721558, 0.7703443765640259, 0.7897562384605408, 0.8091681003570557, 0.8285799622535706, 0.8479918241500854, 0.8674036860466003, 0.8868155479431152, 0.9062273502349854, 0.925639271736145]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 8.0, 0.0, 8.0, 9.0, 17.0, 13.0, 10.0, 18.0, 25.0, 35.0, 26.0, 41.0, 44.0, 52.0, 61.0, 55.0, 63.0, 55.0, 56.0, 52.0, 51.0, 46.0, 41.0, 34.0, 31.0, 27.0, 23.0, 24.0, 13.0, 22.0, 12.0, 12.0, 2.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.32876110076904297, -0.3194924592971802, -0.3102238178253174, -0.3009551763534546, -0.2916865348815918, -0.2824179232120514, -0.2731492817401886, -0.2638806402683258, -0.254611998796463, -0.24534335732460022, -0.23607471585273743, -0.22680608928203583, -0.21753744781017303, -0.20826880633831024, -0.19900017976760864, -0.18973153829574585, -0.18046289682388306, -0.17119425535202026, -0.16192561388015747, -0.15265698730945587, -0.14338834583759308, -0.13411970436573029, -0.12485107034444809, -0.1155824363231659, -0.1063137948513031, -0.09704515337944031, -0.08777651935815811, -0.07850788533687592, -0.06923924386501312, -0.05997060611844063, -0.050701968371868134, -0.04143333435058594, -0.032164692878723145, -0.02289605513215065, -0.013627417385578156, -0.004358779639005661, 0.0049098581075668335, 0.014178495854139328, 0.023447133600711823, 0.03271576762199402, 0.04198440909385681, 0.051253046840429306, 0.0605216845870018, 0.069790318608284, 0.07905896008014679, 0.08832760155200958, 0.09759623557329178, 0.10686486959457397, 0.11613351106643677, 0.12540215253829956, 0.13467079401016235, 0.14393942058086395, 0.15320806205272675, 0.16247670352458954, 0.17174533009529114, 0.18101397156715393, 0.19028261303901672, 0.19955125451087952, 0.2088198959827423, 0.2180885225534439, 0.2273571640253067, 0.2366258054971695, 0.2458944320678711, 0.2551630735397339, 0.2644317150115967]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 6.0, 8.0, 8.0, 4.0, 16.0, 18.0, 28.0, 38.0, 74.0, 81.0, 118.0, 180.0, 324.0, 527.0, 986.0, 1903.0, 4050.0, 9725.0, 27038.0, 87634.0, 417301.0, 373462.0, 81825.0, 25895.0, 9214.0, 3963.0, 1836.0, 895.0, 531.0, 282.0, 210.0, 127.0, 69.0, 52.0, 38.0, 27.0, 25.0, 10.0, 12.0, 5.0, 3.0, 3.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.283447265625, -0.2739906311035156, -0.26453399658203125, -0.2550773620605469, -0.2456207275390625, -0.23616409301757812, -0.22670745849609375, -0.21725082397460938, -0.207794189453125, -0.19833755493164062, -0.18888092041015625, -0.17942428588867188, -0.1699676513671875, -0.16051101684570312, -0.15105438232421875, -0.14159774780273438, -0.13214111328125, -0.12268447875976562, -0.11322784423828125, -0.10377120971679688, -0.0943145751953125, -0.08485794067382812, -0.07540130615234375, -0.06594467163085938, -0.056488037109375, -0.047031402587890625, -0.03757476806640625, -0.028118133544921875, -0.0186614990234375, -0.009204864501953125, 0.00025177001953125, 0.009708404541015625, 0.0191650390625, 0.028621673583984375, 0.03807830810546875, 0.047534942626953125, 0.0569915771484375, 0.06644821166992188, 0.07590484619140625, 0.08536148071289062, 0.094818115234375, 0.10427474975585938, 0.11373138427734375, 0.12318801879882812, 0.1326446533203125, 0.14210128784179688, 0.15155792236328125, 0.16101455688476562, 0.17047119140625, 0.17992782592773438, 0.18938446044921875, 0.19884109497070312, 0.2082977294921875, 0.21775436401367188, 0.22721099853515625, 0.23666763305664062, 0.246124267578125, 0.2555809020996094, 0.26503753662109375, 0.2744941711425781, 0.2839508056640625, 0.2934074401855469, 0.30286407470703125, 0.3123207092285156, 0.32177734375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 1.0, 7.0, 12.0, 8.0, 17.0, 6.0, 13.0, 22.0, 24.0, 28.0, 36.0, 38.0, 44.0, 49.0, 52.0, 53.0, 55.0, 51.0, 50.0, 50.0, 52.0, 53.0, 41.0, 39.0, 27.0, 31.0, 23.0, 27.0, 18.0, 11.0, 19.0, 10.0, 8.0, 4.0, 9.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.5478515625, -0.5316963195800781, -0.5155410766601562, -0.4993858337402344, -0.4832305908203125, -0.4670753479003906, -0.45092010498046875, -0.4347648620605469, -0.418609619140625, -0.4024543762207031, -0.38629913330078125, -0.3701438903808594, -0.3539886474609375, -0.3378334045410156, -0.32167816162109375, -0.3055229187011719, -0.28936767578125, -0.2732124328613281, -0.25705718994140625, -0.24090194702148438, -0.2247467041015625, -0.20859146118164062, -0.19243621826171875, -0.17628097534179688, -0.160125732421875, -0.14397048950195312, -0.12781524658203125, -0.11166000366210938, -0.0955047607421875, -0.07934951782226562, -0.06319427490234375, -0.047039031982421875, -0.0308837890625, -0.014728546142578125, 0.00142669677734375, 0.017581939697265625, 0.0337371826171875, 0.049892425537109375, 0.06604766845703125, 0.08220291137695312, 0.098358154296875, 0.11451339721679688, 0.13066864013671875, 0.14682388305664062, 0.1629791259765625, 0.17913436889648438, 0.19528961181640625, 0.21144485473632812, 0.22760009765625, 0.24375534057617188, 0.25991058349609375, 0.2760658264160156, 0.2922210693359375, 0.3083763122558594, 0.32453155517578125, 0.3406867980957031, 0.356842041015625, 0.3729972839355469, 0.38915252685546875, 0.4053077697753906, 0.4214630126953125, 0.4376182556152344, 0.45377349853515625, 0.4699287414550781, 0.486083984375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 6.0, 5.0, 6.0, 5.0, 13.0, 11.0, 18.0, 28.0, 32.0, 37.0, 65.0, 75.0, 152.0, 231.0, 622.0, 3398.0, 148431.0, 882284.0, 11268.0, 1017.0, 332.0, 174.0, 100.0, 69.0, 46.0, 28.0, 25.0, 20.0, 17.0, 12.0, 6.0, 8.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.853515625, -0.8167266845703125, -0.779937744140625, -0.7431488037109375, -0.70635986328125, -0.6695709228515625, -0.632781982421875, -0.5959930419921875, -0.5592041015625, -0.5224151611328125, -0.485626220703125, -0.4488372802734375, -0.41204833984375, -0.3752593994140625, -0.338470458984375, -0.3016815185546875, -0.264892578125, -0.2281036376953125, -0.191314697265625, -0.1545257568359375, -0.11773681640625, -0.0809478759765625, -0.044158935546875, -0.0073699951171875, 0.0294189453125, 0.0662078857421875, 0.102996826171875, 0.1397857666015625, 0.17657470703125, 0.2133636474609375, 0.250152587890625, 0.2869415283203125, 0.32373046875, 0.3605194091796875, 0.397308349609375, 0.4340972900390625, 0.47088623046875, 0.5076751708984375, 0.544464111328125, 0.5812530517578125, 0.6180419921875, 0.6548309326171875, 0.691619873046875, 0.7284088134765625, 0.76519775390625, 0.8019866943359375, 0.838775634765625, 0.8755645751953125, 0.912353515625, 0.9491424560546875, 0.985931396484375, 1.0227203369140625, 1.05950927734375, 1.0962982177734375, 1.133087158203125, 1.1698760986328125, 1.2066650390625, 1.2434539794921875, 1.280242919921875, 1.3170318603515625, 1.35382080078125, 1.3906097412109375, 1.427398681640625, 1.4641876220703125, 1.5009765625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 5.0, 3.0, 5.0, 3.0, 16.0, 11.0, 14.0, 22.0, 32.0, 36.0, 28.0, 37.0, 38.0, 62.0, 63.0, 59.0, 56.0, 59.0, 76.0, 58.0, 49.0, 53.0, 38.0, 38.0, 26.0, 28.0, 21.0, 12.0, 12.0, 9.0, 7.0, 4.0, 9.0, 4.0, 6.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59716796875, -0.5736083984375, -0.550048828125, -0.5264892578125, -0.5029296875, -0.4793701171875, -0.455810546875, -0.4322509765625, -0.40869140625, -0.3851318359375, -0.361572265625, -0.3380126953125, -0.314453125, -0.2908935546875, -0.267333984375, -0.2437744140625, -0.22021484375, -0.1966552734375, -0.173095703125, -0.1495361328125, -0.1259765625, -0.1024169921875, -0.078857421875, -0.0552978515625, -0.03173828125, -0.0081787109375, 0.015380859375, 0.0389404296875, 0.0625, 0.0860595703125, 0.109619140625, 0.1331787109375, 0.15673828125, 0.1802978515625, 0.203857421875, 0.2274169921875, 0.2509765625, 0.2745361328125, 0.298095703125, 0.3216552734375, 0.34521484375, 0.3687744140625, 0.392333984375, 0.4158935546875, 0.439453125, 0.4630126953125, 0.486572265625, 0.5101318359375, 0.53369140625, 0.5572509765625, 0.580810546875, 0.6043701171875, 0.6279296875, 0.6514892578125, 0.675048828125, 0.6986083984375, 0.72216796875, 0.7457275390625, 0.769287109375, 0.7928466796875, 0.81640625, 0.8399658203125, 0.863525390625, 0.8870849609375, 0.91064453125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 3.0, 0.0, 7.0, 7.0, 8.0, 6.0, 13.0, 11.0, 15.0, 25.0, 40.0, 64.0, 138.0, 208.0, 396.0, 847.0, 1842.0, 5714.0, 39182.0, 865648.0, 119764.0, 9676.0, 2629.0, 1110.0, 511.0, 265.0, 139.0, 93.0, 56.0, 33.0, 26.0, 15.0, 12.0, 8.0, 5.0, 8.0, 5.0, 7.0, 5.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2158203125, -0.20741653442382812, -0.19901275634765625, -0.19060897827148438, -0.1822052001953125, -0.17380142211914062, -0.16539764404296875, -0.15699386596679688, -0.148590087890625, -0.14018630981445312, -0.13178253173828125, -0.12337875366210938, -0.1149749755859375, -0.10657119750976562, -0.09816741943359375, -0.08976364135742188, -0.08135986328125, -0.07295608520507812, -0.06455230712890625, -0.056148529052734375, -0.0477447509765625, -0.039340972900390625, -0.03093719482421875, -0.022533416748046875, -0.014129638671875, -0.005725860595703125, 0.00267791748046875, 0.011081695556640625, 0.0194854736328125, 0.027889251708984375, 0.03629302978515625, 0.044696807861328125, 0.0531005859375, 0.061504364013671875, 0.06990814208984375, 0.07831192016601562, 0.0867156982421875, 0.09511947631835938, 0.10352325439453125, 0.11192703247070312, 0.120330810546875, 0.12873458862304688, 0.13713836669921875, 0.14554214477539062, 0.1539459228515625, 0.16234970092773438, 0.17075347900390625, 0.17915725708007812, 0.18756103515625, 0.19596481323242188, 0.20436859130859375, 0.21277236938476562, 0.2211761474609375, 0.22957992553710938, 0.23798370361328125, 0.24638748168945312, 0.254791259765625, 0.2631950378417969, 0.27159881591796875, 0.2800025939941406, 0.2884063720703125, 0.2968101501464844, 0.30521392822265625, 0.3136177062988281, 0.322021484375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 1.0, 3.0, 4.0, 2.0, 2.0, 8.0, 8.0, 17.0, 30.0, 68.0, 179.0, 413.0, 154.0, 57.0, 20.0, 14.0, 6.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.218122482299805e-05, -7.00848177075386e-05, -6.798841059207916e-05, -6.589200347661972e-05, -6.379559636116028e-05, -6.169918924570084e-05, -5.9602782130241394e-05, -5.750637501478195e-05, -5.540996789932251e-05, -5.331356078386307e-05, -5.1217153668403625e-05, -4.912074655294418e-05, -4.702433943748474e-05, -4.49279323220253e-05, -4.283152520656586e-05, -4.0735118091106415e-05, -3.863871097564697e-05, -3.654230386018753e-05, -3.444589674472809e-05, -3.2349489629268646e-05, -3.0253082513809204e-05, -2.8156675398349762e-05, -2.606026828289032e-05, -2.3963861167430878e-05, -2.1867454051971436e-05, -1.9771046936511993e-05, -1.767463982105255e-05, -1.557823270559311e-05, -1.3481825590133667e-05, -1.1385418474674225e-05, -9.289011359214783e-06, -7.1926042437553406e-06, -5.0961971282958984e-06, -2.9997900128364563e-06, -9.033828973770142e-07, 1.193024218082428e-06, 3.28943133354187e-06, 5.385838449001312e-06, 7.482245564460754e-06, 9.578652679920197e-06, 1.1675059795379639e-05, 1.377146691083908e-05, 1.5867874026298523e-05, 1.7964281141757965e-05, 2.0060688257217407e-05, 2.215709537267685e-05, 2.425350248813629e-05, 2.6349909603595734e-05, 2.8446316719055176e-05, 3.054272383451462e-05, 3.263913094997406e-05, 3.47355380654335e-05, 3.6831945180892944e-05, 3.8928352296352386e-05, 4.102475941181183e-05, 4.312116652727127e-05, 4.521757364273071e-05, 4.7313980758190155e-05, 4.94103878736496e-05, 5.150679498910904e-05, 5.360320210456848e-05, 5.5699609220027924e-05, 5.7796016335487366e-05, 5.989242345094681e-05, 6.198883056640625e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 8.0, 4.0, 10.0, 12.0, 28.0, 37.0, 46.0, 104.0, 182.0, 346.0, 656.0, 1328.0, 2811.0, 8712.0, 55712.0, 754919.0, 196531.0, 18845.0, 4487.0, 1790.0, 859.0, 495.0, 239.0, 134.0, 92.0, 45.0, 31.0, 24.0, 18.0, 10.0, 10.0, 5.0, 8.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2266845703125, -0.22015953063964844, -0.21363449096679688, -0.2071094512939453, -0.20058441162109375, -0.1940593719482422, -0.18753433227539062, -0.18100929260253906, -0.1744842529296875, -0.16795921325683594, -0.16143417358398438, -0.1549091339111328, -0.14838409423828125, -0.1418590545654297, -0.13533401489257812, -0.12880897521972656, -0.122283935546875, -0.11575889587402344, -0.10923385620117188, -0.10270881652832031, -0.09618377685546875, -0.08965873718261719, -0.08313369750976562, -0.07660865783691406, -0.0700836181640625, -0.06355857849121094, -0.057033538818359375, -0.05050849914550781, -0.04398345947265625, -0.03745841979980469, -0.030933380126953125, -0.024408340454101562, -0.01788330078125, -0.011358261108398438, -0.004833221435546875, 0.0016918182373046875, 0.00821685791015625, 0.014741897583007812, 0.021266937255859375, 0.027791976928710938, 0.0343170166015625, 0.04084205627441406, 0.047367095947265625, 0.05389213562011719, 0.06041717529296875, 0.06694221496582031, 0.07346725463867188, 0.07999229431152344, 0.086517333984375, 0.09304237365722656, 0.09956741333007812, 0.10609245300292969, 0.11261749267578125, 0.11914253234863281, 0.12566757202148438, 0.13219261169433594, 0.1387176513671875, 0.14524269104003906, 0.15176773071289062, 0.1582927703857422, 0.16481781005859375, 0.1713428497314453, 0.17786788940429688, 0.18439292907714844, 0.19091796875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 0.0, 7.0, 7.0, 13.0, 8.0, 21.0, 24.0, 20.0, 31.0, 33.0, 59.0, 70.0, 127.0, 155.0, 124.0, 77.0, 64.0, 52.0, 32.0, 26.0, 9.0, 16.0, 2.0, 8.0, 6.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0665283203125, -0.06427288055419922, -0.06201744079589844, -0.059762001037597656, -0.057506561279296875, -0.055251121520996094, -0.05299568176269531, -0.05074024200439453, -0.04848480224609375, -0.04622936248779297, -0.04397392272949219, -0.041718482971191406, -0.039463043212890625, -0.037207603454589844, -0.03495216369628906, -0.03269672393798828, -0.0304412841796875, -0.02818584442138672, -0.025930404663085938, -0.023674964904785156, -0.021419525146484375, -0.019164085388183594, -0.016908645629882812, -0.014653205871582031, -0.01239776611328125, -0.010142326354980469, -0.007886886596679688, -0.005631446838378906, -0.003376007080078125, -0.0011205673217773438, 0.0011348724365234375, 0.0033903121948242188, 0.005645751953125, 0.007901191711425781, 0.010156631469726562, 0.012412071228027344, 0.014667510986328125, 0.016922950744628906, 0.019178390502929688, 0.02143383026123047, 0.02368927001953125, 0.02594470977783203, 0.028200149536132812, 0.030455589294433594, 0.032711029052734375, 0.034966468811035156, 0.03722190856933594, 0.03947734832763672, 0.0417327880859375, 0.04398822784423828, 0.04624366760253906, 0.048499107360839844, 0.050754547119140625, 0.053009986877441406, 0.05526542663574219, 0.05752086639404297, 0.05977630615234375, 0.06203174591064453, 0.06428718566894531, 0.0665426254272461, 0.06879806518554688, 0.07105350494384766, 0.07330894470214844, 0.07556438446044922, 0.07781982421875]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 5.0, 20.0, 94.0, 418.0, 370.0, 88.0, 15.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6520538926124573, -0.5211829543113708, -0.39031198620796204, -0.2594410181045532, -0.1285700798034668, 0.002300858497619629, 0.13317185640335083, 0.26404279470443726, 0.3949137330055237, 0.5257846713066101, 0.6566556692123413, 0.7875266075134277, 0.9183975458145142, 1.0492684841156006, 1.1801395416259766, 1.3110103607177734, 1.4418814182281494, 1.5727523565292358, 1.7036232948303223, 1.8344943523406982, 1.9653651714324951, 2.096236228942871, 2.227107048034668, 2.357978105545044, 2.488848924636841, 2.619719982147217, 2.7505908012390137, 2.8814618587493896, 3.0123326778411865, 3.1432037353515625, 3.2740745544433594, 3.4049456119537354, 3.535816192626953, 3.666687250137329, 3.797558069229126, 3.928429126739502, 4.059299945831299, 4.190170764923096, 4.321042060852051, 4.451912879943848, 4.5827836990356445, 4.713654518127441, 4.8445258140563965, 4.975396633148193, 5.10626745223999, 5.237138271331787, 5.368009567260742, 5.498880386352539, 5.629751205444336, 5.760622024536133, 5.891493320465088, 6.022364139556885, 6.153234958648682, 6.2841057777404785, 6.414977073669434, 6.5458478927612305, 6.6767191886901855, 6.807590007781982, 6.9384613037109375, 7.069332122802734, 7.200202941894531, 7.331073760986328, 7.461945056915283, 7.59281587600708, 7.723686695098877]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 5.0, 6.0, 10.0, 7.0, 6.0, 13.0, 13.0, 12.0, 8.0, 22.0, 22.0, 20.0, 28.0, 40.0, 33.0, 37.0, 42.0, 41.0, 43.0, 39.0, 57.0, 34.0, 37.0, 56.0, 42.0, 33.0, 27.0, 37.0, 22.0, 25.0, 27.0, 14.0, 24.0, 20.0, 13.0, 14.0, 16.0, 19.0, 10.0, 10.0, 3.0, 3.0, 8.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.9124016761779785, -0.8852574825286865, -0.8581132292747498, -0.8309690356254578, -0.803824782371521, -0.776680588722229, -0.749536395072937, -0.722392201423645, -0.6952479481697083, -0.6681037545204163, -0.6409595012664795, -0.6138153076171875, -0.5866711139678955, -0.5595268607139587, -0.5323826670646667, -0.50523841381073, -0.478094220161438, -0.4509499967098236, -0.42380577325820923, -0.39666157960891724, -0.36951735615730286, -0.3423731327056885, -0.3152289390563965, -0.2880847156047821, -0.2609404921531677, -0.23379626870155334, -0.20665206015110016, -0.17950785160064697, -0.1523636281490326, -0.1252194046974182, -0.09807519614696503, -0.07093098759651184, -0.04378676414489746, -0.016642548143863678, 0.010501667857170105, 0.03764588385820389, 0.06479009985923767, 0.09193432331085205, 0.11907853186130524, 0.14622274041175842, 0.1733669638633728, 0.20051118731498718, 0.22765539586544037, 0.25479960441589355, 0.28194382786750793, 0.3090880513191223, 0.3362322449684143, 0.3633764684200287, 0.39052069187164307, 0.41766491532325745, 0.4448091387748718, 0.4719533324241638, 0.4990975558757782, 0.5262417793273926, 0.5533859729766846, 0.5805301666259766, 0.6076744198799133, 0.6348186135292053, 0.6619628667831421, 0.6891070604324341, 0.7162512540817261, 0.7433955073356628, 0.7705397009849548, 0.7976839542388916, 0.8248281478881836]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 6.0, 4.0, 4.0, 6.0, 13.0, 20.0, 23.0, 34.0, 52.0, 76.0, 119.0, 225.0, 331.0, 545.0, 998.0, 1715.0, 3538.0, 7700.0, 21466.0, 119056.0, 1604383.0, 2215191.0, 173061.0, 26946.0, 9600.0, 4242.0, 2052.0, 1199.0, 636.0, 396.0, 227.0, 151.0, 84.0, 54.0, 50.0, 25.0, 17.0, 13.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.59521484375, -0.5787200927734375, -0.562225341796875, -0.5457305908203125, -0.52923583984375, -0.5127410888671875, -0.496246337890625, -0.4797515869140625, -0.4632568359375, -0.4467620849609375, -0.430267333984375, -0.4137725830078125, -0.39727783203125, -0.3807830810546875, -0.364288330078125, -0.3477935791015625, -0.331298828125, -0.3148040771484375, -0.298309326171875, -0.2818145751953125, -0.26531982421875, -0.2488250732421875, -0.232330322265625, -0.2158355712890625, -0.1993408203125, -0.1828460693359375, -0.166351318359375, -0.1498565673828125, -0.13336181640625, -0.1168670654296875, -0.100372314453125, -0.0838775634765625, -0.0673828125, -0.0508880615234375, -0.034393310546875, -0.0178985595703125, -0.00140380859375, 0.0150909423828125, 0.031585693359375, 0.0480804443359375, 0.0645751953125, 0.0810699462890625, 0.097564697265625, 0.1140594482421875, 0.13055419921875, 0.1470489501953125, 0.163543701171875, 0.1800384521484375, 0.196533203125, 0.2130279541015625, 0.229522705078125, 0.2460174560546875, 0.26251220703125, 0.2790069580078125, 0.295501708984375, 0.3119964599609375, 0.3284912109375, 0.3449859619140625, 0.361480712890625, 0.3779754638671875, 0.39447021484375, 0.4109649658203125, 0.427459716796875, 0.4439544677734375, 0.46044921875]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 7.0, 2.0, 10.0, 6.0, 8.0, 11.0, 16.0, 28.0, 22.0, 23.0, 26.0, 28.0, 46.0, 39.0, 41.0, 45.0, 44.0, 50.0, 57.0, 42.0, 48.0, 50.0, 37.0, 36.0, 42.0, 39.0, 22.0, 24.0, 21.0, 22.0, 10.0, 23.0, 21.0, 8.0, 5.0, 6.0, 6.0, 7.0, 2.0, 4.0, 3.0, 5.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.257568359375, -0.24895477294921875, -0.2403411865234375, -0.23172760009765625, -0.223114013671875, -0.21450042724609375, -0.2058868408203125, -0.19727325439453125, -0.18865966796875, -0.18004608154296875, -0.1714324951171875, -0.16281890869140625, -0.154205322265625, -0.14559173583984375, -0.1369781494140625, -0.12836456298828125, -0.1197509765625, -0.11113739013671875, -0.1025238037109375, -0.09391021728515625, -0.085296630859375, -0.07668304443359375, -0.0680694580078125, -0.05945587158203125, -0.05084228515625, -0.04222869873046875, -0.0336151123046875, -0.02500152587890625, -0.016387939453125, -0.00777435302734375, 0.0008392333984375, 0.00945281982421875, 0.01806640625, 0.02667999267578125, 0.0352935791015625, 0.04390716552734375, 0.052520751953125, 0.06113433837890625, 0.0697479248046875, 0.07836151123046875, 0.08697509765625, 0.09558868408203125, 0.1042022705078125, 0.11281585693359375, 0.121429443359375, 0.13004302978515625, 0.1386566162109375, 0.14727020263671875, 0.1558837890625, 0.16449737548828125, 0.1731109619140625, 0.18172454833984375, 0.190338134765625, 0.19895172119140625, 0.2075653076171875, 0.21617889404296875, 0.22479248046875, 0.23340606689453125, 0.2420196533203125, 0.25063323974609375, 0.259246826171875, 0.26786041259765625, 0.2764739990234375, 0.28508758544921875, 0.293701171875]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 6.0, 3.0, 10.0, 10.0, 18.0, 16.0, 30.0, 46.0, 61.0, 164.0, 344.0, 909.0, 2903.0, 14628.0, 267454.0, 3823876.0, 73297.0, 7431.0, 1866.0, 622.0, 251.0, 131.0, 63.0, 39.0, 27.0, 23.0, 8.0, 12.0, 5.0, 5.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0673828125, -1.0353546142578125, -1.003326416015625, -0.9712982177734375, -0.93927001953125, -0.9072418212890625, -0.875213623046875, -0.8431854248046875, -0.8111572265625, -0.7791290283203125, -0.747100830078125, -0.7150726318359375, -0.68304443359375, -0.6510162353515625, -0.618988037109375, -0.5869598388671875, -0.554931640625, -0.5229034423828125, -0.490875244140625, -0.4588470458984375, -0.42681884765625, -0.3947906494140625, -0.362762451171875, -0.3307342529296875, -0.2987060546875, -0.2666778564453125, -0.234649658203125, -0.2026214599609375, -0.17059326171875, -0.1385650634765625, -0.106536865234375, -0.0745086669921875, -0.04248046875, -0.0104522705078125, 0.021575927734375, 0.0536041259765625, 0.08563232421875, 0.1176605224609375, 0.149688720703125, 0.1817169189453125, 0.2137451171875, 0.2457733154296875, 0.277801513671875, 0.3098297119140625, 0.34185791015625, 0.3738861083984375, 0.405914306640625, 0.4379425048828125, 0.469970703125, 0.5019989013671875, 0.534027099609375, 0.5660552978515625, 0.59808349609375, 0.6301116943359375, 0.662139892578125, 0.6941680908203125, 0.7261962890625, 0.7582244873046875, 0.790252685546875, 0.8222808837890625, 0.85430908203125, 0.8863372802734375, 0.918365478515625, 0.9503936767578125, 0.982421875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 8.0, 4.0, 8.0, 9.0, 14.0, 18.0, 31.0, 25.0, 51.0, 85.0, 125.0, 218.0, 368.0, 614.0, 755.0, 654.0, 429.0, 220.0, 147.0, 78.0, 59.0, 51.0, 30.0, 19.0, 11.0, 6.0, 9.0, 9.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1708984375, -0.1653118133544922, -0.15972518920898438, -0.15413856506347656, -0.14855194091796875, -0.14296531677246094, -0.13737869262695312, -0.1317920684814453, -0.1262054443359375, -0.12061882019042969, -0.11503219604492188, -0.10944557189941406, -0.10385894775390625, -0.09827232360839844, -0.09268569946289062, -0.08709907531738281, -0.081512451171875, -0.07592582702636719, -0.07033920288085938, -0.06475257873535156, -0.05916595458984375, -0.05357933044433594, -0.047992706298828125, -0.04240608215332031, -0.0368194580078125, -0.031232833862304688, -0.025646209716796875, -0.020059585571289062, -0.01447296142578125, -0.008886337280273438, -0.003299713134765625, 0.0022869110107421875, 0.00787353515625, 0.013460159301757812, 0.019046783447265625, 0.024633407592773438, 0.03022003173828125, 0.03580665588378906, 0.041393280029296875, 0.04697990417480469, 0.0525665283203125, 0.05815315246582031, 0.06373977661132812, 0.06932640075683594, 0.07491302490234375, 0.08049964904785156, 0.08608627319335938, 0.09167289733886719, 0.097259521484375, 0.10284614562988281, 0.10843276977539062, 0.11401939392089844, 0.11960601806640625, 0.12519264221191406, 0.13077926635742188, 0.1363658905029297, 0.1419525146484375, 0.1475391387939453, 0.15312576293945312, 0.15871238708496094, 0.16429901123046875, 0.16988563537597656, 0.17547225952148438, 0.1810588836669922, 0.1866455078125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 1.0, 5.0, 3.0, 3.0, 4.0, 6.0, 16.0, 13.0, 16.0, 23.0, 22.0, 34.0, 23.0, 26.0, 37.0, 42.0, 56.0, 47.0, 69.0, 41.0, 59.0, 62.0, 57.0, 51.0, 46.0, 42.0, 30.0, 28.0, 31.0, 26.0, 11.0, 17.0, 11.0, 6.0, 9.0, 3.0, 9.0, 1.0, 6.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3081919848918915, -0.29761067032814026, -0.28702932596206665, -0.27644801139831543, -0.2658666670322418, -0.2552853524684906, -0.244704008102417, -0.23412269353866577, -0.22354134917259216, -0.21296001970767975, -0.20237869024276733, -0.19179736077785492, -0.1812160313129425, -0.1706347018480301, -0.16005337238311768, -0.14947205781936646, -0.13889072835445404, -0.12830939888954163, -0.11772806942462921, -0.1071467399597168, -0.09656541049480438, -0.08598408102989197, -0.07540275901556015, -0.06482142955064774, -0.05424010008573532, -0.043658770620822906, -0.03307744115591049, -0.022496115416288376, -0.011914785951375961, -0.0013334564864635468, 0.00924786925315857, 0.019829198718070984, 0.0304105281829834, 0.04099185764789581, 0.05157318711280823, 0.062154512852430344, 0.07273584604263306, 0.08331717550754547, 0.09389849752187729, 0.1044798269867897, 0.11506115645170212, 0.12564247846603394, 0.13622380793094635, 0.14680513739585876, 0.15738646686077118, 0.1679677963256836, 0.178549125790596, 0.18913045525550842, 0.19971178472042084, 0.21029311418533325, 0.22087444365024567, 0.23145577311515808, 0.2420371025800705, 0.2526184320449829, 0.26319974660873413, 0.27378109097480774, 0.28436240553855896, 0.2949437201023102, 0.3055250644683838, 0.316106379032135, 0.3266877233982086, 0.33726903796195984, 0.34785038232803345, 0.35843169689178467, 0.3690130412578583]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 5.0, 6.0, 16.0, 16.0, 13.0, 11.0, 20.0, 20.0, 22.0, 28.0, 36.0, 37.0, 32.0, 44.0, 40.0, 37.0, 32.0, 33.0, 48.0, 47.0, 42.0, 39.0, 34.0, 28.0, 43.0, 37.0, 25.0, 34.0, 24.0, 22.0, 25.0, 27.0, 14.0, 9.0, 17.0, 9.0, 6.0, 7.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.34922969341278076, -0.3395542502403259, -0.3298787772655487, -0.32020333409309387, -0.31052789092063904, -0.3008524179458618, -0.291176974773407, -0.28150153160095215, -0.2718260884284973, -0.2621506452560425, -0.25247517228126526, -0.24279972910881042, -0.2331242859363556, -0.22344882786273956, -0.21377336978912354, -0.2040979266166687, -0.19442245364189148, -0.18474699556827545, -0.17507155239582062, -0.1653960943222046, -0.15572065114974976, -0.14604519307613373, -0.1363697350025177, -0.12669429183006287, -0.11701883375644684, -0.10734338313341141, -0.09766793251037598, -0.08799247443675995, -0.07831702381372452, -0.06864157319068909, -0.05896611884236336, -0.04929066449403763, -0.0396152138710022, -0.029939761385321617, -0.020264308899641037, -0.010588856413960457, -0.0009134039282798767, 0.008762046694755554, 0.018437501043081284, 0.028112955391407013, 0.037788406014442444, 0.047463856637477875, 0.057139310985803604, 0.06681476533412933, 0.07649021595716476, 0.0861656665802002, 0.09584112465381622, 0.10551657527685165, 0.11519202589988708, 0.12486747652292252, 0.13454292714595795, 0.14421838521957397, 0.1538938283920288, 0.16356928646564484, 0.17324474453926086, 0.1829201877117157, 0.19259564578533173, 0.20227110385894775, 0.2119465470314026, 0.22162200510501862, 0.23129746317863464, 0.24097290635108948, 0.2506483495235443, 0.26032382249832153, 0.26999926567077637]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 6.0, 3.0, 11.0, 15.0, 22.0, 39.0, 45.0, 111.0, 170.0, 286.0, 566.0, 1082.0, 2261.0, 4893.0, 11670.0, 46057.0, 494701.0, 426095.0, 40603.0, 10923.0, 4539.0, 2170.0, 1032.0, 567.0, 282.0, 179.0, 89.0, 50.0, 29.0, 18.0, 10.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1954345703125, -0.18912315368652344, -0.18281173706054688, -0.1765003204345703, -0.17018890380859375, -0.1638774871826172, -0.15756607055664062, -0.15125465393066406, -0.1449432373046875, -0.13863182067871094, -0.13232040405273438, -0.1260089874267578, -0.11969757080078125, -0.11338615417480469, -0.10707473754882812, -0.10076332092285156, -0.094451904296875, -0.08814048767089844, -0.08182907104492188, -0.07551765441894531, -0.06920623779296875, -0.06289482116699219, -0.056583404541015625, -0.05027198791503906, -0.0439605712890625, -0.03764915466308594, -0.031337738037109375, -0.025026321411132812, -0.01871490478515625, -0.012403488159179688, -0.006092071533203125, 0.0002193450927734375, 0.00653076171875, 0.012842178344726562, 0.019153594970703125, 0.025465011596679688, 0.03177642822265625, 0.03808784484863281, 0.044399261474609375, 0.05071067810058594, 0.0570220947265625, 0.06333351135253906, 0.06964492797851562, 0.07595634460449219, 0.08226776123046875, 0.08857917785644531, 0.09489059448242188, 0.10120201110839844, 0.107513427734375, 0.11382484436035156, 0.12013626098632812, 0.1264476776123047, 0.13275909423828125, 0.1390705108642578, 0.14538192749023438, 0.15169334411621094, 0.1580047607421875, 0.16431617736816406, 0.17062759399414062, 0.1769390106201172, 0.18325042724609375, 0.1895618438720703, 0.19587326049804688, 0.20218467712402344, 0.20849609375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 7.0, 4.0, 13.0, 8.0, 11.0, 9.0, 22.0, 20.0, 17.0, 45.0, 31.0, 32.0, 33.0, 45.0, 37.0, 46.0, 44.0, 41.0, 45.0, 49.0, 38.0, 32.0, 52.0, 41.0, 35.0, 29.0, 23.0, 30.0, 36.0, 20.0, 21.0, 18.0, 15.0, 7.0, 7.0, 9.0, 6.0, 5.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1912841796875, -0.1852264404296875, -0.179168701171875, -0.1731109619140625, -0.16705322265625, -0.1609954833984375, -0.154937744140625, -0.1488800048828125, -0.142822265625, -0.1367645263671875, -0.130706787109375, -0.1246490478515625, -0.11859130859375, -0.1125335693359375, -0.106475830078125, -0.1004180908203125, -0.0943603515625, -0.0883026123046875, -0.082244873046875, -0.0761871337890625, -0.07012939453125, -0.0640716552734375, -0.058013916015625, -0.0519561767578125, -0.0458984375, -0.0398406982421875, -0.033782958984375, -0.0277252197265625, -0.02166748046875, -0.0156097412109375, -0.009552001953125, -0.0034942626953125, 0.0025634765625, 0.0086212158203125, 0.014678955078125, 0.0207366943359375, 0.02679443359375, 0.0328521728515625, 0.038909912109375, 0.0449676513671875, 0.051025390625, 0.0570831298828125, 0.063140869140625, 0.0691986083984375, 0.07525634765625, 0.0813140869140625, 0.087371826171875, 0.0934295654296875, 0.0994873046875, 0.1055450439453125, 0.111602783203125, 0.1176605224609375, 0.12371826171875, 0.1297760009765625, 0.135833740234375, 0.1418914794921875, 0.14794921875, 0.1540069580078125, 0.160064697265625, 0.1661224365234375, 0.17218017578125, 0.1782379150390625, 0.184295654296875, 0.1903533935546875, 0.1964111328125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 9.0, 17.0, 17.0, 18.0, 36.0, 48.0, 108.0, 178.0, 242.0, 389.0, 709.0, 1283.0, 2466.0, 5143.0, 11917.0, 36092.0, 144844.0, 463156.0, 280099.0, 67514.0, 19529.0, 7412.0, 3433.0, 1697.0, 852.0, 526.0, 314.0, 170.0, 115.0, 71.0, 48.0, 27.0, 20.0, 19.0, 10.0, 8.0, 3.0, 6.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0872802734375, -0.08452987670898438, -0.08177947998046875, -0.07902908325195312, -0.0762786865234375, -0.07352828979492188, -0.07077789306640625, -0.06802749633789062, -0.065277099609375, -0.06252670288085938, -0.05977630615234375, -0.057025909423828125, -0.0542755126953125, -0.051525115966796875, -0.04877471923828125, -0.046024322509765625, -0.04327392578125, -0.040523529052734375, -0.03777313232421875, -0.035022735595703125, -0.0322723388671875, -0.029521942138671875, -0.02677154541015625, -0.024021148681640625, -0.021270751953125, -0.018520355224609375, -0.01576995849609375, -0.013019561767578125, -0.0102691650390625, -0.007518768310546875, -0.00476837158203125, -0.002017974853515625, 0.000732421875, 0.003482818603515625, 0.00623321533203125, 0.008983612060546875, 0.0117340087890625, 0.014484405517578125, 0.01723480224609375, 0.019985198974609375, 0.022735595703125, 0.025485992431640625, 0.02823638916015625, 0.030986785888671875, 0.0337371826171875, 0.036487579345703125, 0.03923797607421875, 0.041988372802734375, 0.04473876953125, 0.047489166259765625, 0.05023956298828125, 0.052989959716796875, 0.0557403564453125, 0.058490753173828125, 0.06124114990234375, 0.06399154663085938, 0.066741943359375, 0.06949234008789062, 0.07224273681640625, 0.07499313354492188, 0.0777435302734375, 0.08049392700195312, 0.08324432373046875, 0.08599472045898438, 0.0887451171875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 7.0, 9.0, 3.0, 13.0, 9.0, 17.0, 11.0, 21.0, 24.0, 29.0, 25.0, 41.0, 35.0, 28.0, 54.0, 42.0, 39.0, 38.0, 51.0, 45.0, 48.0, 38.0, 50.0, 45.0, 31.0, 33.0, 30.0, 28.0, 25.0, 13.0, 25.0, 20.0, 9.0, 14.0, 12.0, 10.0, 10.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.39990234375, -0.387969970703125, -0.37603759765625, -0.364105224609375, -0.3521728515625, -0.340240478515625, -0.32830810546875, -0.316375732421875, -0.304443359375, -0.292510986328125, -0.28057861328125, -0.268646240234375, -0.2567138671875, -0.244781494140625, -0.23284912109375, -0.220916748046875, -0.208984375, -0.197052001953125, -0.18511962890625, -0.173187255859375, -0.1612548828125, -0.149322509765625, -0.13739013671875, -0.125457763671875, -0.113525390625, -0.101593017578125, -0.08966064453125, -0.077728271484375, -0.0657958984375, -0.053863525390625, -0.04193115234375, -0.029998779296875, -0.01806640625, -0.006134033203125, 0.00579833984375, 0.017730712890625, 0.0296630859375, 0.041595458984375, 0.05352783203125, 0.065460205078125, 0.077392578125, 0.089324951171875, 0.10125732421875, 0.113189697265625, 0.1251220703125, 0.137054443359375, 0.14898681640625, 0.160919189453125, 0.1728515625, 0.184783935546875, 0.19671630859375, 0.208648681640625, 0.2205810546875, 0.232513427734375, 0.24444580078125, 0.256378173828125, 0.268310546875, 0.280242919921875, 0.29217529296875, 0.304107666015625, 0.3160400390625, 0.327972412109375, 0.33990478515625, 0.351837158203125, 0.36376953125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 6.0, 6.0, 15.0, 13.0, 28.0, 43.0, 59.0, 118.0, 199.0, 362.0, 696.0, 1450.0, 3438.0, 9486.0, 33031.0, 166531.0, 542348.0, 228352.0, 43471.0, 11487.0, 3983.0, 1646.0, 786.0, 420.0, 234.0, 129.0, 79.0, 53.0, 29.0, 14.0, 12.0, 7.0, 6.0, 3.0, 2.0, 6.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03350830078125, -0.03248023986816406, -0.031452178955078125, -0.030424118041992188, -0.02939605712890625, -0.028367996215820312, -0.027339935302734375, -0.026311874389648438, -0.0252838134765625, -0.024255752563476562, -0.023227691650390625, -0.022199630737304688, -0.02117156982421875, -0.020143508911132812, -0.019115447998046875, -0.018087387084960938, -0.017059326171875, -0.016031265258789062, -0.015003204345703125, -0.013975143432617188, -0.01294708251953125, -0.011919021606445312, -0.010890960693359375, -0.009862899780273438, -0.0088348388671875, -0.0078067779541015625, -0.006778717041015625, -0.0057506561279296875, -0.00472259521484375, -0.0036945343017578125, -0.002666473388671875, -0.0016384124755859375, -0.0006103515625, 0.0004177093505859375, 0.001445770263671875, 0.0024738311767578125, 0.00350189208984375, 0.0045299530029296875, 0.005558013916015625, 0.0065860748291015625, 0.0076141357421875, 0.008642196655273438, 0.009670257568359375, 0.010698318481445312, 0.01172637939453125, 0.012754440307617188, 0.013782501220703125, 0.014810562133789062, 0.015838623046875, 0.016866683959960938, 0.017894744873046875, 0.018922805786132812, 0.01995086669921875, 0.020978927612304688, 0.022006988525390625, 0.023035049438476562, 0.0240631103515625, 0.025091171264648438, 0.026119232177734375, 0.027147293090820312, 0.02817535400390625, 0.029203414916992188, 0.030231475830078125, 0.03125953674316406, 0.03228759765625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 8.0, 6.0, 8.0, 7.0, 9.0, 15.0, 33.0, 30.0, 38.0, 60.0, 91.0, 78.0, 86.0, 111.0, 85.0, 85.0, 54.0, 63.0, 36.0, 28.0, 24.0, 13.0, 7.0, 8.0, 8.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.424551010131836e-05, -1.368299126625061e-05, -1.3120472431182861e-05, -1.2557953596115112e-05, -1.1995434761047363e-05, -1.1432915925979614e-05, -1.0870397090911865e-05, -1.0307878255844116e-05, -9.745359420776367e-06, -9.182840585708618e-06, -8.620321750640869e-06, -8.05780291557312e-06, -7.495284080505371e-06, -6.932765245437622e-06, -6.370246410369873e-06, -5.807727575302124e-06, -5.245208740234375e-06, -4.682689905166626e-06, -4.120171070098877e-06, -3.557652235031128e-06, -2.995133399963379e-06, -2.43261456489563e-06, -1.8700957298278809e-06, -1.3075768947601318e-06, -7.450580596923828e-07, -1.825392246246338e-07, 3.7997961044311523e-07, 9.424984455108643e-07, 1.5050172805786133e-06, 2.0675361156463623e-06, 2.6300549507141113e-06, 3.1925737857818604e-06, 3.7550926208496094e-06, 4.317611455917358e-06, 4.880130290985107e-06, 5.4426491260528564e-06, 6.0051679611206055e-06, 6.5676867961883545e-06, 7.1302056312561035e-06, 7.692724466323853e-06, 8.255243301391602e-06, 8.81776213645935e-06, 9.3802809715271e-06, 9.942799806594849e-06, 1.0505318641662598e-05, 1.1067837476730347e-05, 1.1630356311798096e-05, 1.2192875146865845e-05, 1.2755393981933594e-05, 1.3317912817001343e-05, 1.3880431652069092e-05, 1.444295048713684e-05, 1.500546932220459e-05, 1.556798815727234e-05, 1.6130506992340088e-05, 1.6693025827407837e-05, 1.7255544662475586e-05, 1.7818063497543335e-05, 1.8380582332611084e-05, 1.8943101167678833e-05, 1.9505620002746582e-05, 2.006813883781433e-05, 2.063065767288208e-05, 2.119317650794983e-05, 2.1755695343017578e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 4.0, 7.0, 3.0, 6.0, 14.0, 10.0, 22.0, 27.0, 26.0, 49.0, 68.0, 108.0, 162.0, 295.0, 571.0, 1033.0, 2029.0, 4287.0, 10237.0, 28266.0, 97623.0, 357638.0, 385061.0, 109319.0, 31305.0, 11049.0, 4718.0, 2122.0, 1041.0, 596.0, 327.0, 193.0, 118.0, 70.0, 44.0, 26.0, 18.0, 17.0, 12.0, 9.0, 11.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0316162109375, -0.030563831329345703, -0.029511451721191406, -0.02845907211303711, -0.027406692504882812, -0.026354312896728516, -0.02530193328857422, -0.024249553680419922, -0.023197174072265625, -0.022144794464111328, -0.02109241485595703, -0.020040035247802734, -0.018987655639648438, -0.01793527603149414, -0.016882896423339844, -0.015830516815185547, -0.01477813720703125, -0.013725757598876953, -0.012673377990722656, -0.01162099838256836, -0.010568618774414062, -0.009516239166259766, -0.008463859558105469, -0.007411479949951172, -0.006359100341796875, -0.005306720733642578, -0.004254341125488281, -0.0032019615173339844, -0.0021495819091796875, -0.0010972023010253906, -4.482269287109375e-05, 0.0010075569152832031, 0.0020599365234375, 0.003112316131591797, 0.004164695739746094, 0.005217075347900391, 0.0062694549560546875, 0.007321834564208984, 0.008374214172363281, 0.009426593780517578, 0.010478973388671875, 0.011531352996826172, 0.012583732604980469, 0.013636112213134766, 0.014688491821289062, 0.01574087142944336, 0.016793251037597656, 0.017845630645751953, 0.01889801025390625, 0.019950389862060547, 0.021002769470214844, 0.02205514907836914, 0.023107528686523438, 0.024159908294677734, 0.02521228790283203, 0.026264667510986328, 0.027317047119140625, 0.028369426727294922, 0.02942180633544922, 0.030474185943603516, 0.03152656555175781, 0.03257894515991211, 0.033631324768066406, 0.0346837043762207, 0.035736083984375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 5.0, 4.0, 5.0, 5.0, 7.0, 10.0, 9.0, 18.0, 17.0, 26.0, 31.0, 53.0, 54.0, 61.0, 80.0, 68.0, 93.0, 79.0, 89.0, 51.0, 48.0, 39.0, 23.0, 28.0, 16.0, 18.0, 16.0, 6.0, 8.0, 6.0, 5.0, 6.0, 3.0, 4.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.008270263671875, -0.00800621509552002, -0.007742166519165039, -0.007478117942810059, -0.007214069366455078, -0.006950020790100098, -0.006685972213745117, -0.006421923637390137, -0.006157875061035156, -0.005893826484680176, -0.005629777908325195, -0.005365729331970215, -0.005101680755615234, -0.004837632179260254, -0.0045735836029052734, -0.004309535026550293, -0.0040454864501953125, -0.003781437873840332, -0.0035173892974853516, -0.003253340721130371, -0.0029892921447753906, -0.00272524356842041, -0.0024611949920654297, -0.0021971464157104492, -0.0019330978393554688, -0.0016690492630004883, -0.0014050006866455078, -0.0011409521102905273, -0.0008769035339355469, -0.0006128549575805664, -0.00034880638122558594, -8.475780487060547e-05, 0.000179290771484375, 0.00044333934783935547, 0.0007073879241943359, 0.0009714365005493164, 0.0012354850769042969, 0.0014995336532592773, 0.0017635822296142578, 0.0020276308059692383, 0.0022916793823242188, 0.0025557279586791992, 0.0028197765350341797, 0.00308382511138916, 0.0033478736877441406, 0.003611922264099121, 0.0038759708404541016, 0.004140019416809082, 0.0044040679931640625, 0.004668116569519043, 0.0049321651458740234, 0.005196213722229004, 0.005460262298583984, 0.005724310874938965, 0.005988359451293945, 0.006252408027648926, 0.006516456604003906, 0.006780505180358887, 0.007044553756713867, 0.007308602333068848, 0.007572650909423828, 0.007836699485778809, 0.008100748062133789, 0.00836479663848877, 0.00862884521484375]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 11.0, 8.0, 18.0, 12.0, 21.0, 33.0, 32.0, 46.0, 57.0, 60.0, 60.0, 73.0, 65.0, 69.0, 71.0, 69.0, 56.0, 47.0, 37.0, 29.0, 23.0, 32.0, 14.0, 12.0, 13.0, 5.0, 4.0, 9.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.26439544558525085, -0.25705698132514954, -0.2497185468673706, -0.2423800826072693, -0.23504163324832916, -0.22770318388938904, -0.22036471962928772, -0.2130262702703476, -0.20568782091140747, -0.19834937155246735, -0.19101092219352722, -0.1836724579334259, -0.17633400857448578, -0.16899555921554565, -0.16165709495544434, -0.1543186455965042, -0.1469801962375641, -0.13964174687862396, -0.13230329751968384, -0.12496483325958252, -0.1176263839006424, -0.11028793454170227, -0.10294947773218155, -0.09561102092266083, -0.0882725715637207, -0.08093412220478058, -0.07359566539525986, -0.06625720858573914, -0.05891875922679901, -0.05158030614256859, -0.044241853058338165, -0.03690339997410774, -0.029564961791038513, -0.02222650870680809, -0.014888055622577667, -0.007549602538347244, -0.0002111494541168213, 0.007127303630113602, 0.014465756714344025, 0.021804209798574448, 0.02914266288280487, 0.036481115967035294, 0.04381956905126572, 0.05115802213549614, 0.05849647521972656, 0.06583492457866669, 0.07317338138818741, 0.08051183819770813, 0.08785028755664825, 0.09518873691558838, 0.1025271937251091, 0.10986565053462982, 0.11720409989356995, 0.12454254925251007, 0.1318809986114502, 0.1392194628715515, 0.14655791223049164, 0.15389636158943176, 0.16123482584953308, 0.1685732752084732, 0.17591172456741333, 0.18325017392635345, 0.19058862328529358, 0.1979270875453949, 0.20526553690433502]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 0.0, 5.0, 5.0, 6.0, 10.0, 12.0, 9.0, 12.0, 19.0, 19.0, 19.0, 31.0, 23.0, 42.0, 40.0, 48.0, 32.0, 41.0, 28.0, 47.0, 46.0, 55.0, 45.0, 37.0, 34.0, 36.0, 40.0, 31.0, 27.0, 30.0, 32.0, 27.0, 17.0, 24.0, 20.0, 8.0, 14.0, 8.0, 6.0, 5.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1884523332118988, -0.18275634944438934, -0.17706038057804108, -0.17136439681053162, -0.16566841304302216, -0.1599724441766739, -0.15427646040916443, -0.14858049154281616, -0.1428845077753067, -0.13718852400779724, -0.13149255514144897, -0.12579657137393951, -0.12010059505701065, -0.11440461874008179, -0.10870863497257233, -0.10301265865564346, -0.097316674888134, -0.09162069857120514, -0.08592471480369568, -0.08022873848676682, -0.07453276216983795, -0.06883677840232849, -0.06314080208539963, -0.057444825768470764, -0.0517488457262516, -0.04605286568403244, -0.04035688936710358, -0.034660909324884415, -0.028964931145310402, -0.02326895296573639, -0.017572972923517227, -0.011876996606588364, -0.006181016564369202, -0.0004850379191339016, 0.0052109407261013985, 0.010906919836997986, 0.016602898016572, 0.02229887619614601, 0.027994856238365173, 0.03369083255529404, 0.0393868125975132, 0.04508279263973236, 0.050778768956661224, 0.056474748998880386, 0.06217072904109955, 0.06786670535802841, 0.07356268167495728, 0.07925866544246674, 0.0849546417593956, 0.09065061807632446, 0.09634660184383392, 0.10204257816076279, 0.10773855447769165, 0.11343453824520111, 0.11913051456212997, 0.12482649087905884, 0.1305224746465683, 0.13621845841407776, 0.14191442728042603, 0.14761041104793549, 0.15330639481544495, 0.1590023636817932, 0.16469834744930267, 0.17039433121681213, 0.1760903000831604]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 12.0, 11.0, 23.0, 38.0, 68.0, 78.0, 145.0, 276.0, 595.0, 1241.0, 2979.0, 7678.0, 21775.0, 75310.0, 478366.0, 368030.0, 61636.0, 18532.0, 6828.0, 2634.0, 1156.0, 488.0, 283.0, 161.0, 87.0, 38.0, 30.0, 12.0, 14.0, 11.0, 6.0, 3.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.37255859375, -0.3601112365722656, -0.34766387939453125, -0.3352165222167969, -0.3227691650390625, -0.3103218078613281, -0.29787445068359375, -0.2854270935058594, -0.272979736328125, -0.2605323791503906, -0.24808502197265625, -0.23563766479492188, -0.2231903076171875, -0.21074295043945312, -0.19829559326171875, -0.18584823608398438, -0.17340087890625, -0.16095352172851562, -0.14850616455078125, -0.13605880737304688, -0.1236114501953125, -0.11116409301757812, -0.09871673583984375, -0.08626937866210938, -0.073822021484375, -0.061374664306640625, -0.04892730712890625, -0.036479949951171875, -0.0240325927734375, -0.011585235595703125, 0.00086212158203125, 0.013309478759765625, 0.0257568359375, 0.038204193115234375, 0.05065155029296875, 0.06309890747070312, 0.0755462646484375, 0.08799362182617188, 0.10044097900390625, 0.11288833618164062, 0.125335693359375, 0.13778305053710938, 0.15023040771484375, 0.16267776489257812, 0.1751251220703125, 0.18757247924804688, 0.20001983642578125, 0.21246719360351562, 0.22491455078125, 0.23736190795898438, 0.24980926513671875, 0.2622566223144531, 0.2747039794921875, 0.2871513366699219, 0.29959869384765625, 0.3120460510253906, 0.324493408203125, 0.3369407653808594, 0.34938812255859375, 0.3618354797363281, 0.3742828369140625, 0.3867301940917969, 0.39917755126953125, 0.4116249084472656, 0.424072265625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 5.0, 0.0, 3.0, 4.0, 7.0, 8.0, 9.0, 11.0, 11.0, 17.0, 15.0, 20.0, 30.0, 23.0, 28.0, 21.0, 30.0, 39.0, 42.0, 38.0, 49.0, 53.0, 44.0, 39.0, 37.0, 50.0, 28.0, 35.0, 37.0, 34.0, 41.0, 27.0, 23.0, 25.0, 16.0, 19.0, 19.0, 7.0, 13.0, 10.0, 10.0, 7.0, 9.0, 4.0, 2.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.405517578125, -0.39430999755859375, -0.3831024169921875, -0.37189483642578125, -0.360687255859375, -0.34947967529296875, -0.3382720947265625, -0.32706451416015625, -0.31585693359375, -0.30464935302734375, -0.2934417724609375, -0.28223419189453125, -0.271026611328125, -0.25981903076171875, -0.2486114501953125, -0.23740386962890625, -0.2261962890625, -0.21498870849609375, -0.2037811279296875, -0.19257354736328125, -0.181365966796875, -0.17015838623046875, -0.1589508056640625, -0.14774322509765625, -0.13653564453125, -0.12532806396484375, -0.1141204833984375, -0.10291290283203125, -0.091705322265625, -0.08049774169921875, -0.0692901611328125, -0.05808258056640625, -0.046875, -0.03566741943359375, -0.0244598388671875, -0.01325225830078125, -0.002044677734375, 0.00916290283203125, 0.0203704833984375, 0.03157806396484375, 0.04278564453125, 0.05399322509765625, 0.0652008056640625, 0.07640838623046875, 0.087615966796875, 0.09882354736328125, 0.1100311279296875, 0.12123870849609375, 0.1324462890625, 0.14365386962890625, 0.1548614501953125, 0.16606903076171875, 0.177276611328125, 0.18848419189453125, 0.1996917724609375, 0.21089935302734375, 0.22210693359375, 0.23331451416015625, 0.2445220947265625, 0.25572967529296875, 0.266937255859375, 0.27814483642578125, 0.2893524169921875, 0.30055999755859375, 0.311767578125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 2.0, 6.0, 5.0, 4.0, 7.0, 10.0, 15.0, 20.0, 34.0, 46.0, 39.0, 66.0, 106.0, 171.0, 406.0, 813.0, 2220.0, 7198.0, 30664.0, 264768.0, 662741.0, 60834.0, 12566.0, 3496.0, 1136.0, 499.0, 230.0, 143.0, 80.0, 55.0, 44.0, 33.0, 18.0, 21.0, 10.0, 8.0, 10.0, 5.0, 6.0, 3.0, 6.0, 5.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.495361328125, -0.4799766540527344, -0.46459197998046875, -0.4492073059082031, -0.4338226318359375, -0.4184379577636719, -0.40305328369140625, -0.3876686096191406, -0.372283935546875, -0.3568992614746094, -0.34151458740234375, -0.3261299133300781, -0.3107452392578125, -0.2953605651855469, -0.27997589111328125, -0.2645912170410156, -0.24920654296875, -0.23382186889648438, -0.21843719482421875, -0.20305252075195312, -0.1876678466796875, -0.17228317260742188, -0.15689849853515625, -0.14151382446289062, -0.126129150390625, -0.11074447631835938, -0.09535980224609375, -0.07997512817382812, -0.0645904541015625, -0.049205780029296875, -0.03382110595703125, -0.018436431884765625, -0.0030517578125, 0.012332916259765625, 0.02771759033203125, 0.043102264404296875, 0.0584869384765625, 0.07387161254882812, 0.08925628662109375, 0.10464096069335938, 0.120025634765625, 0.13541030883789062, 0.15079498291015625, 0.16617965698242188, 0.1815643310546875, 0.19694900512695312, 0.21233367919921875, 0.22771835327148438, 0.24310302734375, 0.2584877014160156, 0.27387237548828125, 0.2892570495605469, 0.3046417236328125, 0.3200263977050781, 0.33541107177734375, 0.3507957458496094, 0.366180419921875, 0.3815650939941406, 0.39694976806640625, 0.4123344421386719, 0.4277191162109375, 0.4431037902832031, 0.45848846435546875, 0.4738731384277344, 0.4892578125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 2.0, 9.0, 7.0, 15.0, 11.0, 16.0, 11.0, 15.0, 14.0, 20.0, 28.0, 25.0, 30.0, 34.0, 44.0, 33.0, 45.0, 34.0, 44.0, 47.0, 59.0, 44.0, 39.0, 48.0, 54.0, 37.0, 40.0, 30.0, 28.0, 27.0, 18.0, 12.0, 20.0, 13.0, 14.0, 8.0, 5.0, 6.0, 3.0, 3.0, 4.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.33251953125, -0.3195762634277344, -0.30663299560546875, -0.2936897277832031, -0.2807464599609375, -0.2678031921386719, -0.25485992431640625, -0.24191665649414062, -0.228973388671875, -0.21603012084960938, -0.20308685302734375, -0.19014358520507812, -0.1772003173828125, -0.16425704956054688, -0.15131378173828125, -0.13837051391601562, -0.12542724609375, -0.11248397827148438, -0.09954071044921875, -0.08659744262695312, -0.0736541748046875, -0.060710906982421875, -0.04776763916015625, -0.034824371337890625, -0.021881103515625, -0.008937835693359375, 0.00400543212890625, 0.016948699951171875, 0.0298919677734375, 0.042835235595703125, 0.05577850341796875, 0.06872177124023438, 0.0816650390625, 0.09460830688476562, 0.10755157470703125, 0.12049484252929688, 0.1334381103515625, 0.14638137817382812, 0.15932464599609375, 0.17226791381835938, 0.185211181640625, 0.19815444946289062, 0.21109771728515625, 0.22404098510742188, 0.2369842529296875, 0.24992752075195312, 0.26287078857421875, 0.2758140563964844, 0.28875732421875, 0.3017005920410156, 0.31464385986328125, 0.3275871276855469, 0.3405303955078125, 0.3534736633300781, 0.36641693115234375, 0.3793601989746094, 0.392303466796875, 0.4052467346191406, 0.41819000244140625, 0.4311332702636719, 0.4440765380859375, 0.4570198059082031, 0.46996307373046875, 0.4829063415527344, 0.495849609375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 3.0, 8.0, 3.0, 5.0, 7.0, 8.0, 11.0, 29.0, 34.0, 73.0, 128.0, 265.0, 574.0, 1732.0, 7310.0, 61695.0, 771117.0, 186317.0, 14688.0, 2844.0, 911.0, 372.0, 170.0, 89.0, 50.0, 33.0, 28.0, 14.0, 5.0, 10.0, 4.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1512451171875, -0.1471233367919922, -0.14300155639648438, -0.13887977600097656, -0.13475799560546875, -0.13063621520996094, -0.12651443481445312, -0.12239265441894531, -0.1182708740234375, -0.11414909362792969, -0.11002731323242188, -0.10590553283691406, -0.10178375244140625, -0.09766197204589844, -0.09354019165039062, -0.08941841125488281, -0.085296630859375, -0.08117485046386719, -0.07705307006835938, -0.07293128967285156, -0.06880950927734375, -0.06468772888183594, -0.060565948486328125, -0.05644416809082031, -0.0523223876953125, -0.04820060729980469, -0.044078826904296875, -0.03995704650878906, -0.03583526611328125, -0.03171348571777344, -0.027591705322265625, -0.023469924926757812, -0.01934814453125, -0.015226364135742188, -0.011104583740234375, -0.0069828033447265625, -0.00286102294921875, 0.0012607574462890625, 0.005382537841796875, 0.009504318237304688, 0.0136260986328125, 0.017747879028320312, 0.021869659423828125, 0.025991439819335938, 0.03011322021484375, 0.03423500061035156, 0.038356781005859375, 0.04247856140136719, 0.046600341796875, 0.05072212219238281, 0.054843902587890625, 0.05896568298339844, 0.06308746337890625, 0.06720924377441406, 0.07133102416992188, 0.07545280456542969, 0.0795745849609375, 0.08369636535644531, 0.08781814575195312, 0.09193992614746094, 0.09606170654296875, 0.10018348693847656, 0.10430526733398438, 0.10842704772949219, 0.112548828125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 5.0, 3.0, 9.0, 13.0, 16.0, 29.0, 34.0, 34.0, 57.0, 83.0, 91.0, 154.0, 133.0, 89.0, 76.0, 64.0, 30.0, 26.0, 16.0, 12.0, 6.0, 3.0, 3.0, 6.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.09808349609375e-05, -2.043880522251129e-05, -1.9896775484085083e-05, -1.9354745745658875e-05, -1.8812716007232666e-05, -1.8270686268806458e-05, -1.772865653038025e-05, -1.718662679195404e-05, -1.6644597053527832e-05, -1.6102567315101624e-05, -1.5560537576675415e-05, -1.5018507838249207e-05, -1.4476478099822998e-05, -1.393444836139679e-05, -1.3392418622970581e-05, -1.2850388884544373e-05, -1.2308359146118164e-05, -1.1766329407691956e-05, -1.1224299669265747e-05, -1.0682269930839539e-05, -1.014024019241333e-05, -9.598210453987122e-06, -9.056180715560913e-06, -8.514150977134705e-06, -7.972121238708496e-06, -7.430091500282288e-06, -6.888061761856079e-06, -6.346032023429871e-06, -5.804002285003662e-06, -5.261972546577454e-06, -4.719942808151245e-06, -4.177913069725037e-06, -3.635883331298828e-06, -3.0938535928726196e-06, -2.551823854446411e-06, -2.0097941160202026e-06, -1.4677643775939941e-06, -9.257346391677856e-07, -3.8370490074157715e-07, 1.5832483768463135e-07, 7.003545761108398e-07, 1.2423843145370483e-06, 1.7844140529632568e-06, 2.3264437913894653e-06, 2.868473529815674e-06, 3.4105032682418823e-06, 3.952533006668091e-06, 4.494562745094299e-06, 5.036592483520508e-06, 5.578622221946716e-06, 6.120651960372925e-06, 6.662681698799133e-06, 7.204711437225342e-06, 7.74674117565155e-06, 8.288770914077759e-06, 8.830800652503967e-06, 9.372830390930176e-06, 9.914860129356384e-06, 1.0456889867782593e-05, 1.0998919606208801e-05, 1.154094934463501e-05, 1.2082979083061218e-05, 1.2625008821487427e-05, 1.3167038559913635e-05, 1.3709068298339844e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 10.0, 4.0, 5.0, 19.0, 38.0, 60.0, 82.0, 117.0, 198.0, 347.0, 544.0, 1060.0, 2201.0, 5792.0, 22872.0, 191742.0, 713037.0, 88756.0, 13717.0, 4104.0, 1711.0, 916.0, 487.0, 286.0, 176.0, 96.0, 51.0, 46.0, 23.0, 18.0, 10.0, 7.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.153564453125, -0.1493387222290039, -0.1451129913330078, -0.14088726043701172, -0.13666152954101562, -0.13243579864501953, -0.12821006774902344, -0.12398433685302734, -0.11975860595703125, -0.11553287506103516, -0.11130714416503906, -0.10708141326904297, -0.10285568237304688, -0.09862995147705078, -0.09440422058105469, -0.0901784896850586, -0.0859527587890625, -0.0817270278930664, -0.07750129699707031, -0.07327556610107422, -0.06904983520507812, -0.06482410430908203, -0.06059837341308594, -0.056372642517089844, -0.05214691162109375, -0.047921180725097656, -0.04369544982910156, -0.03946971893310547, -0.035243988037109375, -0.03101825714111328, -0.026792526245117188, -0.022566795349121094, -0.018341064453125, -0.014115333557128906, -0.009889602661132812, -0.005663871765136719, -0.001438140869140625, 0.0027875900268554688, 0.0070133209228515625, 0.011239051818847656, 0.01546478271484375, 0.019690513610839844, 0.023916244506835938, 0.02814197540283203, 0.032367706298828125, 0.03659343719482422, 0.04081916809082031, 0.045044898986816406, 0.0492706298828125, 0.053496360778808594, 0.05772209167480469, 0.06194782257080078, 0.06617355346679688, 0.07039928436279297, 0.07462501525878906, 0.07885074615478516, 0.08307647705078125, 0.08730220794677734, 0.09152793884277344, 0.09575366973876953, 0.09997940063476562, 0.10420513153076172, 0.10843086242675781, 0.1126565933227539, 0.11688232421875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 7.0, 15.0, 16.0, 21.0, 19.0, 32.0, 31.0, 42.0, 68.0, 80.0, 110.0, 119.0, 111.0, 66.0, 56.0, 56.0, 26.0, 28.0, 25.0, 12.0, 15.0, 8.0, 6.0, 3.0, 1.0, 4.0, 5.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0457763671875, -0.044361114501953125, -0.04294586181640625, -0.041530609130859375, -0.0401153564453125, -0.038700103759765625, -0.03728485107421875, -0.035869598388671875, -0.034454345703125, -0.033039093017578125, -0.03162384033203125, -0.030208587646484375, -0.0287933349609375, -0.027378082275390625, -0.02596282958984375, -0.024547576904296875, -0.02313232421875, -0.021717071533203125, -0.02030181884765625, -0.018886566162109375, -0.0174713134765625, -0.016056060791015625, -0.01464080810546875, -0.013225555419921875, -0.011810302734375, -0.010395050048828125, -0.00897979736328125, -0.007564544677734375, -0.0061492919921875, -0.004734039306640625, -0.00331878662109375, -0.001903533935546875, -0.00048828125, 0.000926971435546875, 0.00234222412109375, 0.003757476806640625, 0.0051727294921875, 0.006587982177734375, 0.00800323486328125, 0.009418487548828125, 0.010833740234375, 0.012248992919921875, 0.01366424560546875, 0.015079498291015625, 0.0164947509765625, 0.017910003662109375, 0.01932525634765625, 0.020740509033203125, 0.02215576171875, 0.023571014404296875, 0.02498626708984375, 0.026401519775390625, 0.0278167724609375, 0.029232025146484375, 0.03064727783203125, 0.032062530517578125, 0.033477783203125, 0.034893035888671875, 0.03630828857421875, 0.037723541259765625, 0.0391387939453125, 0.040554046630859375, 0.04196929931640625, 0.043384552001953125, 0.0447998046875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 4.0, 9.0, 22.0, 35.0, 65.0, 93.0, 136.0, 131.0, 145.0, 132.0, 89.0, 53.0, 44.0, 28.0, 9.0, 8.0, 2.0, 5.0, 1.0, 2.0], "bins": [-1.6661275625228882, -1.6341406106948853, -1.6021536588668823, -1.5701667070388794, -1.5381797552108765, -1.5061928033828735, -1.4742058515548706, -1.4422187805175781, -1.4102318286895752, -1.3782448768615723, -1.3462579250335693, -1.3142709732055664, -1.2822840213775635, -1.2502970695495605, -1.2183101177215576, -1.1863231658935547, -1.1543362140655518, -1.1223492622375488, -1.090362310409546, -1.058375358581543, -1.02638840675354, -0.9944014549255371, -0.9624144434928894, -0.9304274916648865, -0.8984405398368835, -0.8664535880088806, -0.8344666361808777, -0.8024796843528748, -0.770492672920227, -0.7385057210922241, -0.7065187692642212, -0.6745318174362183, -0.6425447463989258, -0.6105577945709229, -0.5785708427429199, -0.546583890914917, -0.5145969390869141, -0.48260995745658875, -0.4506229758262634, -0.4186360239982605, -0.38664907217025757, -0.35466212034225464, -0.3226751685142517, -0.2906881868839264, -0.25870123505592346, -0.22671428322792053, -0.1947273164987564, -0.16274034976959229, -0.13075339794158936, -0.09876643866300583, -0.0667794793844223, -0.034792520105838776, -0.002805560827255249, 0.02918139100074768, 0.061168357729911804, 0.09315532445907593, 0.12514227628707886, 0.1571292281150818, 0.1891161948442459, 0.22110316157341003, 0.25309011340141296, 0.2850770652294159, 0.3170640468597412, 0.34905099868774414, 0.38103795051574707]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 1.0, 3.0, 5.0, 4.0, 10.0, 10.0, 15.0, 17.0, 18.0, 23.0, 23.0, 25.0, 19.0, 44.0, 38.0, 31.0, 26.0, 24.0, 37.0, 52.0, 26.0, 52.0, 37.0, 37.0, 33.0, 41.0, 35.0, 32.0, 28.0, 33.0, 20.0, 26.0, 28.0, 22.0, 18.0, 23.0, 16.0, 12.0, 18.0, 8.0, 7.0, 7.0, 5.0, 5.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5250296592712402, -0.506401777267456, -0.48777392506599426, -0.46914607286453247, -0.4505181908607483, -0.4318903088569641, -0.4132624566555023, -0.3946346044540405, -0.37600672245025635, -0.35737884044647217, -0.3387509882450104, -0.3201231360435486, -0.3014952540397644, -0.2828673720359802, -0.26423951983451843, -0.24561165273189545, -0.22698378562927246, -0.20835591852664948, -0.1897280514240265, -0.1711001843214035, -0.15247231721878052, -0.13384445011615753, -0.11521658301353455, -0.09658871591091156, -0.07796084880828857, -0.05933298170566559, -0.0407051146030426, -0.022077247500419617, -0.003449380397796631, 0.015178486704826355, 0.03380635380744934, 0.05243422091007233, 0.07106208801269531, 0.0896899551153183, 0.10831782221794128, 0.12694568932056427, 0.14557355642318726, 0.16420142352581024, 0.18282929062843323, 0.2014571577310562, 0.2200850248336792, 0.23871289193630219, 0.25734075903892517, 0.27596861124038696, 0.29459649324417114, 0.3132243752479553, 0.3318522274494171, 0.3504800796508789, 0.3691079616546631, 0.38773584365844727, 0.40636369585990906, 0.42499154806137085, 0.44361943006515503, 0.4622473120689392, 0.480875164270401, 0.4995030164718628, 0.518130898475647, 0.5367587804794312, 0.5553866624832153, 0.5740144848823547, 0.5926423668861389, 0.6112702488899231, 0.6298980712890625, 0.6485259532928467, 0.6671538352966309]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 9.0, 4.0, 8.0, 26.0, 29.0, 32.0, 36.0, 78.0, 185.0, 287.0, 669.0, 1367.0, 3007.0, 8027.0, 33514.0, 824762.0, 3172936.0, 125468.0, 14961.0, 4919.0, 1973.0, 963.0, 464.0, 220.0, 116.0, 58.0, 51.0, 42.0, 16.0, 16.0, 12.0, 10.0, 7.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.66650390625, -0.6470489501953125, -0.627593994140625, -0.6081390380859375, -0.58868408203125, -0.5692291259765625, -0.549774169921875, -0.5303192138671875, -0.5108642578125, -0.4914093017578125, -0.471954345703125, -0.4524993896484375, -0.43304443359375, -0.4135894775390625, -0.394134521484375, -0.3746795654296875, -0.355224609375, -0.3357696533203125, -0.316314697265625, -0.2968597412109375, -0.27740478515625, -0.2579498291015625, -0.238494873046875, -0.2190399169921875, -0.1995849609375, -0.1801300048828125, -0.160675048828125, -0.1412200927734375, -0.12176513671875, -0.1023101806640625, -0.082855224609375, -0.0634002685546875, -0.0439453125, -0.0244903564453125, -0.005035400390625, 0.0144195556640625, 0.03387451171875, 0.0533294677734375, 0.072784423828125, 0.0922393798828125, 0.1116943359375, 0.1311492919921875, 0.150604248046875, 0.1700592041015625, 0.18951416015625, 0.2089691162109375, 0.228424072265625, 0.2478790283203125, 0.267333984375, 0.2867889404296875, 0.306243896484375, 0.3256988525390625, 0.34515380859375, 0.3646087646484375, 0.384063720703125, 0.4035186767578125, 0.4229736328125, 0.4424285888671875, 0.461883544921875, 0.4813385009765625, 0.50079345703125, 0.5202484130859375, 0.539703369140625, 0.5591583251953125, 0.57861328125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 4.0, 3.0, 7.0, 5.0, 7.0, 13.0, 17.0, 26.0, 27.0, 20.0, 21.0, 21.0, 33.0, 25.0, 31.0, 38.0, 57.0, 49.0, 44.0, 35.0, 44.0, 43.0, 43.0, 50.0, 42.0, 35.0, 25.0, 36.0, 28.0, 32.0, 25.0, 22.0, 16.0, 21.0, 14.0, 10.0, 7.0, 7.0, 7.0, 3.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1837158203125, -0.17726898193359375, -0.1708221435546875, -0.16437530517578125, -0.157928466796875, -0.15148162841796875, -0.1450347900390625, -0.13858795166015625, -0.13214111328125, -0.12569427490234375, -0.1192474365234375, -0.11280059814453125, -0.106353759765625, -0.09990692138671875, -0.0934600830078125, -0.08701324462890625, -0.08056640625, -0.07411956787109375, -0.0676727294921875, -0.06122589111328125, -0.054779052734375, -0.04833221435546875, -0.0418853759765625, -0.03543853759765625, -0.02899169921875, -0.02254486083984375, -0.0160980224609375, -0.00965118408203125, -0.003204345703125, 0.00324249267578125, 0.0096893310546875, 0.01613616943359375, 0.0225830078125, 0.02902984619140625, 0.0354766845703125, 0.04192352294921875, 0.048370361328125, 0.05481719970703125, 0.0612640380859375, 0.06771087646484375, 0.07415771484375, 0.08060455322265625, 0.0870513916015625, 0.09349822998046875, 0.099945068359375, 0.10639190673828125, 0.1128387451171875, 0.11928558349609375, 0.125732421875, 0.13217926025390625, 0.1386260986328125, 0.14507293701171875, 0.151519775390625, 0.15796661376953125, 0.1644134521484375, 0.17086029052734375, 0.17730712890625, 0.18375396728515625, 0.1902008056640625, 0.19664764404296875, 0.203094482421875, 0.20954132080078125, 0.2159881591796875, 0.22243499755859375, 0.2288818359375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 6.0, 22.0, 18.0, 46.0, 74.0, 179.0, 461.0, 1618.0, 8253.0, 134374.0, 3949160.0, 90920.0, 6915.0, 1446.0, 447.0, 161.0, 60.0, 46.0, 24.0, 18.0, 10.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88232421875, -0.8513107299804688, -0.8202972412109375, -0.7892837524414062, -0.758270263671875, -0.7272567749023438, -0.6962432861328125, -0.6652297973632812, -0.63421630859375, -0.6032028198242188, -0.5721893310546875, -0.5411758422851562, -0.510162353515625, -0.47914886474609375, -0.4481353759765625, -0.41712188720703125, -0.3861083984375, -0.35509490966796875, -0.3240814208984375, -0.29306793212890625, -0.262054443359375, -0.23104095458984375, -0.2000274658203125, -0.16901397705078125, -0.13800048828125, -0.10698699951171875, -0.0759735107421875, -0.04496002197265625, -0.013946533203125, 0.01706695556640625, 0.0480804443359375, 0.07909393310546875, 0.110107421875, 0.14112091064453125, 0.1721343994140625, 0.20314788818359375, 0.234161376953125, 0.26517486572265625, 0.2961883544921875, 0.32720184326171875, 0.35821533203125, 0.38922882080078125, 0.4202423095703125, 0.45125579833984375, 0.482269287109375, 0.5132827758789062, 0.5442962646484375, 0.5753097534179688, 0.6063232421875, 0.6373367309570312, 0.6683502197265625, 0.6993637084960938, 0.730377197265625, 0.7613906860351562, 0.7924041748046875, 0.8234176635742188, 0.85443115234375, 0.8854446411132812, 0.9164581298828125, 0.9474716186523438, 0.978485107421875, 1.0094985961914062, 1.0405120849609375, 1.0715255737304688, 1.1025390625]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 7.0, 9.0, 16.0, 16.0, 17.0, 21.0, 32.0, 57.0, 89.0, 136.0, 214.0, 375.0, 607.0, 736.0, 652.0, 437.0, 251.0, 131.0, 83.0, 56.0, 34.0, 28.0, 21.0, 14.0, 12.0, 3.0, 7.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.185302734375, -0.18037033081054688, -0.17543792724609375, -0.17050552368164062, -0.1655731201171875, -0.16064071655273438, -0.15570831298828125, -0.15077590942382812, -0.145843505859375, -0.14091110229492188, -0.13597869873046875, -0.13104629516601562, -0.1261138916015625, -0.12118148803710938, -0.11624908447265625, -0.11131668090820312, -0.10638427734375, -0.10145187377929688, -0.09651947021484375, -0.09158706665039062, -0.0866546630859375, -0.08172225952148438, -0.07678985595703125, -0.07185745239257812, -0.066925048828125, -0.061992645263671875, -0.05706024169921875, -0.052127838134765625, -0.0471954345703125, -0.042263031005859375, -0.03733062744140625, -0.032398223876953125, -0.0274658203125, -0.022533416748046875, -0.01760101318359375, -0.012668609619140625, -0.0077362060546875, -0.002803802490234375, 0.00212860107421875, 0.007061004638671875, 0.011993408203125, 0.016925811767578125, 0.02185821533203125, 0.026790618896484375, 0.0317230224609375, 0.036655426025390625, 0.04158782958984375, 0.046520233154296875, 0.05145263671875, 0.056385040283203125, 0.06131744384765625, 0.06624984741210938, 0.0711822509765625, 0.07611465454101562, 0.08104705810546875, 0.08597946166992188, 0.090911865234375, 0.09584426879882812, 0.10077667236328125, 0.10570907592773438, 0.1106414794921875, 0.11557388305664062, 0.12050628662109375, 0.12543869018554688, 0.13037109375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 11.0, 12.0, 14.0, 15.0, 21.0, 25.0, 32.0, 38.0, 42.0, 54.0, 62.0, 70.0, 56.0, 70.0, 74.0, 64.0, 47.0, 56.0, 54.0, 41.0, 30.0, 17.0, 22.0, 17.0, 13.0, 12.0, 10.0, 8.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29683399200439453, -0.2860824465751648, -0.27533093094825745, -0.2645793855190277, -0.25382786989212036, -0.24307632446289062, -0.2323247790336609, -0.22157324850559235, -0.2108217179775238, -0.20007018744945526, -0.18931865692138672, -0.17856711149215698, -0.16781558096408844, -0.1570640504360199, -0.14631250500679016, -0.13556097447872162, -0.12480944395065308, -0.11405791342258453, -0.1033063754439354, -0.09255483746528625, -0.08180330693721771, -0.07105177640914917, -0.06030023843050003, -0.04954870045185089, -0.03879716992378235, -0.028045635670423508, -0.017294101417064667, -0.006542567163705826, 0.004208967089653015, 0.014960501343011856, 0.025712035596370697, 0.036463573575019836, 0.04721510410308838, 0.05796663835644722, 0.06871817260980606, 0.0794697105884552, 0.09022124111652374, 0.10097277164459229, 0.11172430962324142, 0.12247584760189056, 0.1332273781299591, 0.14397890865802765, 0.1547304391860962, 0.16548198461532593, 0.17623351514339447, 0.186985045671463, 0.19773659110069275, 0.2084881216287613, 0.21923965215682983, 0.22999118268489838, 0.24074271321296692, 0.25149425864219666, 0.262245774269104, 0.27299731969833374, 0.2837488651275635, 0.2945004105567932, 0.30525192618370056, 0.3160034716129303, 0.32675498723983765, 0.3375065326690674, 0.3482580780982971, 0.35900959372520447, 0.3697611391544342, 0.38051265478134155, 0.3912642002105713]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 7.0, 7.0, 11.0, 14.0, 15.0, 25.0, 19.0, 23.0, 24.0, 29.0, 33.0, 37.0, 31.0, 40.0, 41.0, 46.0, 41.0, 38.0, 41.0, 35.0, 47.0, 36.0, 34.0, 37.0, 36.0, 33.0, 30.0, 26.0, 26.0, 35.0, 17.0, 20.0, 14.0, 11.0, 7.0, 8.0, 9.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2376996874809265, -0.22973011434078217, -0.22176054120063782, -0.21379095315933228, -0.20582138001918793, -0.19785180687904358, -0.18988221883773804, -0.1819126456975937, -0.17394307255744934, -0.165973499417305, -0.15800392627716064, -0.1500343382358551, -0.14206476509571075, -0.1340951919555664, -0.12612560391426086, -0.11815603077411652, -0.11018645763397217, -0.10221688449382782, -0.09424730390310287, -0.08627772331237793, -0.07830815017223358, -0.07033857703208923, -0.06236899644136429, -0.05439941957592964, -0.046429842710494995, -0.03846026584506035, -0.030490688979625702, -0.022521112114191055, -0.014551535248756409, -0.006581958383321762, 0.0013876184821128845, 0.009357195347547531, 0.017326772212982178, 0.025296349078416824, 0.03326592594385147, 0.04123550280928612, 0.049205079674720764, 0.05717465654015541, 0.06514423340559006, 0.073113813996315, 0.08108338713645935, 0.0890529602766037, 0.09702254086732864, 0.10499212145805359, 0.11296169459819794, 0.12093126773834229, 0.12890085577964783, 0.13687042891979218, 0.14484000205993652, 0.15280957520008087, 0.16077914834022522, 0.16874873638153076, 0.1767183095216751, 0.18468788266181946, 0.192657470703125, 0.20062704384326935, 0.2085966169834137, 0.21656619012355804, 0.2245357632637024, 0.23250535130500793, 0.24047492444515228, 0.24844449758529663, 0.2564140856266022, 0.2643836438655853, 0.27235323190689087]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 6.0, 8.0, 14.0, 29.0, 38.0, 47.0, 67.0, 111.0, 152.0, 273.0, 458.0, 715.0, 1310.0, 2574.0, 4988.0, 10498.0, 25356.0, 115029.0, 594710.0, 226862.0, 38325.0, 13636.0, 6241.0, 3171.0, 1676.0, 906.0, 504.0, 287.0, 176.0, 115.0, 89.0, 46.0, 41.0, 34.0, 19.0, 12.0, 11.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0], "bins": [-0.1278076171875, -0.12441444396972656, -0.12102127075195312, -0.11762809753417969, -0.11423492431640625, -0.11084175109863281, -0.10744857788085938, -0.10405540466308594, -0.1006622314453125, -0.09726905822753906, -0.09387588500976562, -0.09048271179199219, -0.08708953857421875, -0.08369636535644531, -0.08030319213867188, -0.07691001892089844, -0.073516845703125, -0.07012367248535156, -0.06673049926757812, -0.06333732604980469, -0.05994415283203125, -0.05655097961425781, -0.053157806396484375, -0.04976463317871094, -0.0463714599609375, -0.04297828674316406, -0.039585113525390625, -0.03619194030761719, -0.03279876708984375, -0.029405593872070312, -0.026012420654296875, -0.022619247436523438, -0.01922607421875, -0.015832901000976562, -0.012439727783203125, -0.009046554565429688, -0.00565338134765625, -0.0022602081298828125, 0.001132965087890625, 0.0045261383056640625, 0.0079193115234375, 0.011312484741210938, 0.014705657958984375, 0.018098831176757812, 0.02149200439453125, 0.024885177612304688, 0.028278350830078125, 0.03167152404785156, 0.035064697265625, 0.03845787048339844, 0.041851043701171875, 0.04524421691894531, 0.04863739013671875, 0.05203056335449219, 0.055423736572265625, 0.05881690979003906, 0.0622100830078125, 0.06560325622558594, 0.06899642944335938, 0.07238960266113281, 0.07578277587890625, 0.07917594909667969, 0.08256912231445312, 0.08596229553222656, 0.08935546875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 3.0, 6.0, 7.0, 7.0, 11.0, 8.0, 20.0, 23.0, 25.0, 18.0, 24.0, 38.0, 29.0, 41.0, 38.0, 44.0, 41.0, 47.0, 42.0, 46.0, 43.0, 37.0, 44.0, 46.0, 33.0, 34.0, 32.0, 28.0, 28.0, 35.0, 32.0, 18.0, 19.0, 9.0, 14.0, 6.0, 5.0, 6.0, 4.0, 6.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1531982421875, -0.14783668518066406, -0.14247512817382812, -0.1371135711669922, -0.13175201416015625, -0.1263904571533203, -0.12102890014648438, -0.11566734313964844, -0.1103057861328125, -0.10494422912597656, -0.09958267211914062, -0.09422111511230469, -0.08885955810546875, -0.08349800109863281, -0.07813644409179688, -0.07277488708496094, -0.067413330078125, -0.06205177307128906, -0.056690216064453125, -0.05132865905761719, -0.04596710205078125, -0.04060554504394531, -0.035243988037109375, -0.029882431030273438, -0.0245208740234375, -0.019159317016601562, -0.013797760009765625, -0.008436203002929688, -0.00307464599609375, 0.0022869110107421875, 0.007648468017578125, 0.013010025024414062, 0.01837158203125, 0.023733139038085938, 0.029094696044921875, 0.03445625305175781, 0.03981781005859375, 0.04517936706542969, 0.050540924072265625, 0.05590248107910156, 0.0612640380859375, 0.06662559509277344, 0.07198715209960938, 0.07734870910644531, 0.08271026611328125, 0.08807182312011719, 0.09343338012695312, 0.09879493713378906, 0.104156494140625, 0.10951805114746094, 0.11487960815429688, 0.12024116516113281, 0.12560272216796875, 0.1309642791748047, 0.13632583618164062, 0.14168739318847656, 0.1470489501953125, 0.15241050720214844, 0.15777206420898438, 0.1631336212158203, 0.16849517822265625, 0.1738567352294922, 0.17921829223632812, 0.18457984924316406, 0.18994140625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 10.0, 6.0, 16.0, 14.0, 27.0, 48.0, 84.0, 140.0, 240.0, 501.0, 1053.0, 2189.0, 5190.0, 14296.0, 45364.0, 193481.0, 526676.0, 190346.0, 45138.0, 14225.0, 5228.0, 2222.0, 957.0, 505.0, 251.0, 139.0, 92.0, 36.0, 35.0, 11.0, 12.0, 9.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0882568359375, -0.08569812774658203, -0.08313941955566406, -0.0805807113647461, -0.07802200317382812, -0.07546329498291016, -0.07290458679199219, -0.07034587860107422, -0.06778717041015625, -0.06522846221923828, -0.06266975402832031, -0.060111045837402344, -0.057552337646484375, -0.054993629455566406, -0.05243492126464844, -0.04987621307373047, -0.0473175048828125, -0.04475879669189453, -0.04220008850097656, -0.039641380310058594, -0.037082672119140625, -0.034523963928222656, -0.03196525573730469, -0.02940654754638672, -0.02684783935546875, -0.02428913116455078, -0.021730422973632812, -0.019171714782714844, -0.016613006591796875, -0.014054298400878906, -0.011495590209960938, -0.008936882019042969, -0.006378173828125, -0.0038194656372070312, -0.0012607574462890625, 0.0012979507446289062, 0.003856658935546875, 0.006415367126464844, 0.008974075317382812, 0.011532783508300781, 0.01409149169921875, 0.01665019989013672, 0.019208908081054688, 0.021767616271972656, 0.024326324462890625, 0.026885032653808594, 0.029443740844726562, 0.03200244903564453, 0.0345611572265625, 0.03711986541748047, 0.03967857360839844, 0.042237281799316406, 0.044795989990234375, 0.047354698181152344, 0.04991340637207031, 0.05247211456298828, 0.05503082275390625, 0.05758953094482422, 0.06014823913574219, 0.06270694732666016, 0.06526565551757812, 0.0678243637084961, 0.07038307189941406, 0.07294178009033203, 0.07550048828125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 9.0, 8.0, 4.0, 12.0, 15.0, 14.0, 15.0, 23.0, 26.0, 28.0, 24.0, 34.0, 41.0, 37.0, 25.0, 37.0, 40.0, 37.0, 27.0, 56.0, 35.0, 38.0, 50.0, 46.0, 34.0, 30.0, 31.0, 34.0, 24.0, 22.0, 23.0, 15.0, 18.0, 18.0, 12.0, 11.0, 9.0, 5.0, 4.0, 9.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.383056640625, -0.37109375, -0.359130859375, -0.34716796875, -0.335205078125, -0.3232421875, -0.311279296875, -0.29931640625, -0.287353515625, -0.275390625, -0.263427734375, -0.25146484375, -0.239501953125, -0.2275390625, -0.215576171875, -0.20361328125, -0.191650390625, -0.1796875, -0.167724609375, -0.15576171875, -0.143798828125, -0.1318359375, -0.119873046875, -0.10791015625, -0.095947265625, -0.083984375, -0.072021484375, -0.06005859375, -0.048095703125, -0.0361328125, -0.024169921875, -0.01220703125, -0.000244140625, 0.01171875, 0.023681640625, 0.03564453125, 0.047607421875, 0.0595703125, 0.071533203125, 0.08349609375, 0.095458984375, 0.107421875, 0.119384765625, 0.13134765625, 0.143310546875, 0.1552734375, 0.167236328125, 0.17919921875, 0.191162109375, 0.203125, 0.215087890625, 0.22705078125, 0.239013671875, 0.2509765625, 0.262939453125, 0.27490234375, 0.286865234375, 0.298828125, 0.310791015625, 0.32275390625, 0.334716796875, 0.3466796875, 0.358642578125, 0.37060546875, 0.382568359375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 6.0, 15.0, 18.0, 32.0, 53.0, 79.0, 151.0, 283.0, 578.0, 1215.0, 2737.0, 7592.0, 27488.0, 201988.0, 662020.0, 114309.0, 19649.0, 6023.0, 2326.0, 942.0, 481.0, 242.0, 121.0, 72.0, 47.0, 28.0, 23.0, 11.0, 5.0, 4.0, 6.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055145263671875, -0.05366992950439453, -0.05219459533691406, -0.050719261169433594, -0.049243927001953125, -0.047768592834472656, -0.04629325866699219, -0.04481792449951172, -0.04334259033203125, -0.04186725616455078, -0.04039192199707031, -0.038916587829589844, -0.037441253662109375, -0.035965919494628906, -0.03449058532714844, -0.03301525115966797, -0.0315399169921875, -0.03006458282470703, -0.028589248657226562, -0.027113914489746094, -0.025638580322265625, -0.024163246154785156, -0.022687911987304688, -0.02121257781982422, -0.01973724365234375, -0.01826190948486328, -0.016786575317382812, -0.015311241149902344, -0.013835906982421875, -0.012360572814941406, -0.010885238647460938, -0.009409904479980469, -0.0079345703125, -0.006459236145019531, -0.0049839019775390625, -0.0035085678100585938, -0.002033233642578125, -0.0005578994750976562, 0.0009174346923828125, 0.0023927688598632812, 0.00386810302734375, 0.005343437194824219, 0.0068187713623046875, 0.008294105529785156, 0.009769439697265625, 0.011244773864746094, 0.012720108032226562, 0.014195442199707031, 0.0156707763671875, 0.01714611053466797, 0.018621444702148438, 0.020096778869628906, 0.021572113037109375, 0.023047447204589844, 0.024522781372070312, 0.02599811553955078, 0.02747344970703125, 0.02894878387451172, 0.030424118041992188, 0.031899452209472656, 0.033374786376953125, 0.034850120544433594, 0.03632545471191406, 0.03780078887939453, 0.039276123046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 6.0, 15.0, 11.0, 15.0, 37.0, 54.0, 86.0, 100.0, 138.0, 132.0, 123.0, 95.0, 48.0, 35.0, 37.0, 13.0, 14.0, 9.0, 9.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.9742717742919922e-05, -2.898741513490677e-05, -2.8232112526893616e-05, -2.7476809918880463e-05, -2.672150731086731e-05, -2.5966204702854156e-05, -2.5210902094841003e-05, -2.445559948682785e-05, -2.3700296878814697e-05, -2.2944994270801544e-05, -2.218969166278839e-05, -2.1434389054775238e-05, -2.0679086446762085e-05, -1.9923783838748932e-05, -1.916848123073578e-05, -1.8413178622722626e-05, -1.7657876014709473e-05, -1.690257340669632e-05, -1.6147270798683167e-05, -1.5391968190670013e-05, -1.463666558265686e-05, -1.3881362974643707e-05, -1.3126060366630554e-05, -1.2370757758617401e-05, -1.1615455150604248e-05, -1.0860152542591095e-05, -1.0104849934577942e-05, -9.349547326564789e-06, -8.594244718551636e-06, -7.838942110538483e-06, -7.08363950252533e-06, -6.3283368945121765e-06, -5.5730342864990234e-06, -4.81773167848587e-06, -4.062429070472717e-06, -3.307126462459564e-06, -2.551823854446411e-06, -1.796521246433258e-06, -1.041218638420105e-06, -2.859160304069519e-07, 4.6938657760620117e-07, 1.2246891856193542e-06, 1.9799917936325073e-06, 2.7352944016456604e-06, 3.4905970096588135e-06, 4.2458996176719666e-06, 5.00120222568512e-06, 5.756504833698273e-06, 6.511807441711426e-06, 7.267110049724579e-06, 8.022412657737732e-06, 8.777715265750885e-06, 9.533017873764038e-06, 1.0288320481777191e-05, 1.1043623089790344e-05, 1.1798925697803497e-05, 1.255422830581665e-05, 1.3309530913829803e-05, 1.4064833521842957e-05, 1.482013612985611e-05, 1.5575438737869263e-05, 1.6330741345882416e-05, 1.708604395389557e-05, 1.7841346561908722e-05, 1.8596649169921875e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 8.0, 6.0, 17.0, 30.0, 36.0, 57.0, 70.0, 140.0, 220.0, 377.0, 687.0, 1265.0, 2394.0, 4867.0, 10008.0, 22005.0, 56288.0, 154796.0, 328586.0, 279248.0, 113680.0, 41739.0, 16743.0, 7605.0, 3605.0, 1810.0, 954.0, 543.0, 310.0, 190.0, 99.0, 64.0, 42.0, 21.0, 17.0, 8.0, 11.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0215606689453125, -0.02081298828125, -0.0200653076171875, -0.019317626953125, -0.0185699462890625, -0.017822265625, -0.0170745849609375, -0.016326904296875, -0.0155792236328125, -0.01483154296875, -0.0140838623046875, -0.013336181640625, -0.0125885009765625, -0.0118408203125, -0.0110931396484375, -0.010345458984375, -0.0095977783203125, -0.00885009765625, -0.0081024169921875, -0.007354736328125, -0.0066070556640625, -0.005859375, -0.0051116943359375, -0.004364013671875, -0.0036163330078125, -0.00286865234375, -0.0021209716796875, -0.001373291015625, -0.0006256103515625, 0.0001220703125, 0.0008697509765625, 0.001617431640625, 0.0023651123046875, 0.00311279296875, 0.0038604736328125, 0.004608154296875, 0.0053558349609375, 0.006103515625, 0.0068511962890625, 0.007598876953125, 0.0083465576171875, 0.00909423828125, 0.0098419189453125, 0.010589599609375, 0.0113372802734375, 0.0120849609375, 0.0128326416015625, 0.013580322265625, 0.0143280029296875, 0.01507568359375, 0.0158233642578125, 0.016571044921875, 0.0173187255859375, 0.01806640625, 0.0188140869140625, 0.019561767578125, 0.0203094482421875, 0.02105712890625, 0.0218048095703125, 0.022552490234375, 0.0233001708984375, 0.0240478515625, 0.0247955322265625, 0.025543212890625, 0.0262908935546875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 3.0, 5.0, 10.0, 4.0, 9.0, 19.0, 22.0, 15.0, 40.0, 50.0, 47.0, 70.0, 80.0, 81.0, 78.0, 87.0, 72.0, 58.0, 64.0, 40.0, 34.0, 22.0, 18.0, 18.0, 9.0, 13.0, 6.0, 5.0, 3.0, 7.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01059722900390625, -0.010306000709533691, -0.010014772415161133, -0.009723544120788574, -0.009432315826416016, -0.009141087532043457, -0.008849859237670898, -0.00855863094329834, -0.008267402648925781, -0.007976174354553223, -0.007684946060180664, -0.0073937177658081055, -0.007102489471435547, -0.006811261177062988, -0.00652003288269043, -0.006228804588317871, -0.0059375762939453125, -0.005646347999572754, -0.005355119705200195, -0.005063891410827637, -0.004772663116455078, -0.0044814348220825195, -0.004190206527709961, -0.0038989782333374023, -0.0036077499389648438, -0.003316521644592285, -0.0030252933502197266, -0.002734065055847168, -0.0024428367614746094, -0.0021516084671020508, -0.0018603801727294922, -0.0015691518783569336, -0.001277923583984375, -0.0009866952896118164, -0.0006954669952392578, -0.0004042387008666992, -0.00011301040649414062, 0.00017821788787841797, 0.00046944618225097656, 0.0007606744766235352, 0.0010519027709960938, 0.0013431310653686523, 0.001634359359741211, 0.0019255876541137695, 0.002216815948486328, 0.0025080442428588867, 0.0027992725372314453, 0.003090500831604004, 0.0033817291259765625, 0.003672957420349121, 0.00396418571472168, 0.004255414009094238, 0.004546642303466797, 0.0048378705978393555, 0.005129098892211914, 0.005420327186584473, 0.005711555480957031, 0.00600278377532959, 0.0062940120697021484, 0.006585240364074707, 0.006876468658447266, 0.007167696952819824, 0.007458925247192383, 0.007750153541564941, 0.0080413818359375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 4.0, 3.0, 13.0, 16.0, 14.0, 28.0, 34.0, 39.0, 37.0, 44.0, 48.0, 58.0, 60.0, 72.0, 64.0, 72.0, 62.0, 71.0, 50.0, 35.0, 42.0, 34.0, 22.0, 18.0, 15.0, 10.0, 9.0, 9.0, 5.0, 5.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1898532509803772, -0.18336260318756104, -0.17687194049358368, -0.17038129270076752, -0.16389063000679016, -0.157399982213974, -0.15090933442115784, -0.14441867172718048, -0.13792800903320312, -0.13143736124038696, -0.1249466985464096, -0.11845605075359344, -0.11196538805961609, -0.10547474026679993, -0.09898408502340317, -0.09249342978000641, -0.08600278198719025, -0.07951212674379349, -0.07302147150039673, -0.06653082370758057, -0.06004016473889351, -0.05354950949549675, -0.04705885797739029, -0.04056820273399353, -0.03407754749059677, -0.027586892247200012, -0.021096238866448402, -0.014605585485696793, -0.008114930242300034, -0.0016242749989032745, 0.004866376519203186, 0.011357031762599945, 0.017847701907157898, 0.024338357150554657, 0.030829010531306267, 0.03731966391205788, 0.043810319155454636, 0.050300974398851395, 0.056791625916957855, 0.06328228116035461, 0.06977293640375137, 0.07626359164714813, 0.08275424689054489, 0.08924490213394165, 0.09573554992675781, 0.10222621262073517, 0.10871686041355133, 0.11520751565694809, 0.12169817090034485, 0.128188818693161, 0.13467948138713837, 0.14117012917995453, 0.14766079187393188, 0.15415143966674805, 0.1606420874595642, 0.16713275015354156, 0.17362341284751892, 0.18011406064033508, 0.18660472333431244, 0.1930953711271286, 0.19958603382110596, 0.20607668161392212, 0.21256732940673828, 0.21905799210071564, 0.2255486398935318]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 8.0, 8.0, 12.0, 14.0, 19.0, 19.0, 22.0, 30.0, 29.0, 34.0, 29.0, 52.0, 33.0, 54.0, 58.0, 35.0, 41.0, 44.0, 48.0, 42.0, 44.0, 41.0, 43.0, 38.0, 29.0, 36.0, 29.0, 26.0, 20.0, 18.0, 13.0, 9.0, 4.0, 6.0, 7.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16634730994701385, -0.16081269085407257, -0.1552780717611313, -0.14974345266819, -0.14420883357524872, -0.13867421448230743, -0.13313959538936615, -0.12760497629642487, -0.12207035720348358, -0.1165357381105423, -0.11100111901760101, -0.10546649992465973, -0.09993188083171844, -0.09439726173877716, -0.08886264264583588, -0.08332802355289459, -0.07779340445995331, -0.07225878536701202, -0.06672416627407074, -0.061189547181129456, -0.05565492808818817, -0.05012030899524689, -0.0445856899023056, -0.03905107080936432, -0.033516451716423035, -0.02798183262348175, -0.022447213530540466, -0.016912594437599182, -0.011377975344657898, -0.005843356251716614, -0.0003087371587753296, 0.005225881934165955, 0.010760486125946045, 0.01629510521888733, 0.021829724311828613, 0.027364343404769897, 0.03289896249771118, 0.038433581590652466, 0.04396820068359375, 0.049502819776535034, 0.05503743886947632, 0.0605720579624176, 0.06610667705535889, 0.07164129614830017, 0.07717591524124146, 0.08271053433418274, 0.08824515342712402, 0.09377977252006531, 0.09931439161300659, 0.10484901070594788, 0.11038362979888916, 0.11591824889183044, 0.12145286798477173, 0.126987487077713, 0.1325221061706543, 0.13805672526359558, 0.14359134435653687, 0.14912596344947815, 0.15466058254241943, 0.16019520163536072, 0.165729820728302, 0.1712644398212433, 0.17679905891418457, 0.18233367800712585, 0.18786829710006714]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 8.0, 6.0, 15.0, 23.0, 25.0, 43.0, 102.0, 173.0, 309.0, 637.0, 1298.0, 3040.0, 7615.0, 23223.0, 96065.0, 396680.0, 389458.0, 93854.0, 22860.0, 7547.0, 3005.0, 1263.0, 616.0, 298.0, 158.0, 79.0, 57.0, 35.0, 22.0, 18.0, 8.0, 5.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.379638671875, -0.3655738830566406, -0.35150909423828125, -0.3374443054199219, -0.3233795166015625, -0.3093147277832031, -0.29524993896484375, -0.2811851501464844, -0.267120361328125, -0.2530555725097656, -0.23899078369140625, -0.22492599487304688, -0.2108612060546875, -0.19679641723632812, -0.18273162841796875, -0.16866683959960938, -0.15460205078125, -0.14053726196289062, -0.12647247314453125, -0.11240768432617188, -0.0983428955078125, -0.08427810668945312, -0.07021331787109375, -0.056148529052734375, -0.042083740234375, -0.028018951416015625, -0.01395416259765625, 0.000110626220703125, 0.0141754150390625, 0.028240203857421875, 0.04230499267578125, 0.056369781494140625, 0.0704345703125, 0.08449935913085938, 0.09856414794921875, 0.11262893676757812, 0.1266937255859375, 0.14075851440429688, 0.15482330322265625, 0.16888809204101562, 0.182952880859375, 0.19701766967773438, 0.21108245849609375, 0.22514724731445312, 0.2392120361328125, 0.2532768249511719, 0.26734161376953125, 0.2814064025878906, 0.29547119140625, 0.3095359802246094, 0.32360076904296875, 0.3376655578613281, 0.3517303466796875, 0.3657951354980469, 0.37985992431640625, 0.3939247131347656, 0.407989501953125, 0.4220542907714844, 0.43611907958984375, 0.4501838684082031, 0.4642486572265625, 0.4783134460449219, 0.49237823486328125, 0.5064430236816406, 0.5205078125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 6.0, 9.0, 25.0, 13.0, 22.0, 15.0, 32.0, 28.0, 40.0, 42.0, 42.0, 53.0, 47.0, 49.0, 61.0, 46.0, 59.0, 48.0, 48.0, 43.0, 36.0, 35.0, 39.0, 32.0, 30.0, 24.0, 17.0, 15.0, 13.0, 5.0, 7.0, 8.0, 4.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.353271484375, -0.3416404724121094, -0.33000946044921875, -0.3183784484863281, -0.3067474365234375, -0.2951164245605469, -0.28348541259765625, -0.2718544006347656, -0.260223388671875, -0.24859237670898438, -0.23696136474609375, -0.22533035278320312, -0.2136993408203125, -0.20206832885742188, -0.19043731689453125, -0.17880630493164062, -0.16717529296875, -0.15554428100585938, -0.14391326904296875, -0.13228225708007812, -0.1206512451171875, -0.10902023315429688, -0.09738922119140625, -0.08575820922851562, -0.074127197265625, -0.062496185302734375, -0.05086517333984375, -0.039234161376953125, -0.0276031494140625, -0.015972137451171875, -0.00434112548828125, 0.007289886474609375, 0.0189208984375, 0.030551910400390625, 0.04218292236328125, 0.053813934326171875, 0.0654449462890625, 0.07707595825195312, 0.08870697021484375, 0.10033798217773438, 0.111968994140625, 0.12360000610351562, 0.13523101806640625, 0.14686203002929688, 0.1584930419921875, 0.17012405395507812, 0.18175506591796875, 0.19338607788085938, 0.20501708984375, 0.21664810180664062, 0.22827911376953125, 0.23991012573242188, 0.2515411376953125, 0.2631721496582031, 0.27480316162109375, 0.2864341735839844, 0.298065185546875, 0.3096961975097656, 0.32132720947265625, 0.3329582214355469, 0.3445892333984375, 0.3562202453613281, 0.36785125732421875, 0.3794822692871094, 0.39111328125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 6.0, 8.0, 9.0, 19.0, 39.0, 47.0, 80.0, 120.0, 219.0, 339.0, 635.0, 1192.0, 2421.0, 5686.0, 15839.0, 53791.0, 214402.0, 482237.0, 196650.0, 49728.0, 14780.0, 5353.0, 2301.0, 1176.0, 627.0, 332.0, 187.0, 121.0, 72.0, 43.0, 19.0, 12.0, 22.0, 11.0, 9.0, 6.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4619140625, -0.4485130310058594, -0.43511199951171875, -0.4217109680175781, -0.4083099365234375, -0.3949089050292969, -0.38150787353515625, -0.3681068420410156, -0.354705810546875, -0.3413047790527344, -0.32790374755859375, -0.3145027160644531, -0.3011016845703125, -0.2877006530761719, -0.27429962158203125, -0.2608985900878906, -0.24749755859375, -0.23409652709960938, -0.22069549560546875, -0.20729446411132812, -0.1938934326171875, -0.18049240112304688, -0.16709136962890625, -0.15369033813476562, -0.140289306640625, -0.12688827514648438, -0.11348724365234375, -0.10008621215820312, -0.0866851806640625, -0.07328414916992188, -0.05988311767578125, -0.046482086181640625, -0.0330810546875, -0.019680023193359375, -0.00627899169921875, 0.007122039794921875, 0.0205230712890625, 0.033924102783203125, 0.04732513427734375, 0.060726165771484375, 0.074127197265625, 0.08752822875976562, 0.10092926025390625, 0.11433029174804688, 0.1277313232421875, 0.14113235473632812, 0.15453338623046875, 0.16793441772460938, 0.18133544921875, 0.19473648071289062, 0.20813751220703125, 0.22153854370117188, 0.2349395751953125, 0.24834060668945312, 0.26174163818359375, 0.2751426696777344, 0.288543701171875, 0.3019447326660156, 0.31534576416015625, 0.3287467956542969, 0.3421478271484375, 0.3555488586425781, 0.36894989013671875, 0.3823509216308594, 0.395751953125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 0.0, 6.0, 5.0, 15.0, 10.0, 9.0, 9.0, 16.0, 16.0, 24.0, 21.0, 27.0, 30.0, 27.0, 45.0, 50.0, 31.0, 60.0, 40.0, 39.0, 52.0, 46.0, 45.0, 39.0, 42.0, 36.0, 40.0, 43.0, 25.0, 18.0, 22.0, 24.0, 15.0, 15.0, 13.0, 10.0, 9.0, 6.0, 3.0, 3.0, 10.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.335693359375, -0.3252449035644531, -0.31479644775390625, -0.3043479919433594, -0.2938995361328125, -0.2834510803222656, -0.27300262451171875, -0.2625541687011719, -0.252105712890625, -0.24165725708007812, -0.23120880126953125, -0.22076034545898438, -0.2103118896484375, -0.19986343383789062, -0.18941497802734375, -0.17896652221679688, -0.16851806640625, -0.15806961059570312, -0.14762115478515625, -0.13717269897460938, -0.1267242431640625, -0.11627578735351562, -0.10582733154296875, -0.09537887573242188, -0.084930419921875, -0.07448196411132812, -0.06403350830078125, -0.053585052490234375, -0.0431365966796875, -0.032688140869140625, -0.02223968505859375, -0.011791229248046875, -0.0013427734375, 0.009105682373046875, 0.01955413818359375, 0.030002593994140625, 0.0404510498046875, 0.050899505615234375, 0.06134796142578125, 0.07179641723632812, 0.082244873046875, 0.09269332885742188, 0.10314178466796875, 0.11359024047851562, 0.1240386962890625, 0.13448715209960938, 0.14493560791015625, 0.15538406372070312, 0.16583251953125, 0.17628097534179688, 0.18672943115234375, 0.19717788696289062, 0.2076263427734375, 0.21807479858398438, 0.22852325439453125, 0.23897171020507812, 0.249420166015625, 0.2598686218261719, 0.27031707763671875, 0.2807655334472656, 0.2912139892578125, 0.3016624450683594, 0.31211090087890625, 0.3225593566894531, 0.3330078125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 11.0, 4.0, 7.0, 6.0, 4.0, 15.0, 19.0, 30.0, 29.0, 35.0, 60.0, 95.0, 129.0, 224.0, 351.0, 642.0, 1080.0, 1906.0, 3581.0, 6613.0, 13996.0, 32585.0, 82746.0, 211037.0, 394075.0, 177922.0, 68680.0, 27416.0, 12155.0, 5856.0, 3077.0, 1690.0, 966.0, 546.0, 342.0, 196.0, 150.0, 89.0, 52.0, 37.0, 23.0, 21.0, 9.0, 14.0, 14.0, 5.0, 5.0, 7.0, 7.0, 1.0, 0.0, 3.0, 3.0, 1.0], "bins": [-0.06292724609375, -0.06109809875488281, -0.059268951416015625, -0.05743980407714844, -0.05561065673828125, -0.05378150939941406, -0.051952362060546875, -0.05012321472167969, -0.0482940673828125, -0.04646492004394531, -0.044635772705078125, -0.04280662536621094, -0.04097747802734375, -0.03914833068847656, -0.037319183349609375, -0.03549003601074219, -0.033660888671875, -0.03183174133300781, -0.030002593994140625, -0.028173446655273438, -0.02634429931640625, -0.024515151977539062, -0.022686004638671875, -0.020856857299804688, -0.0190277099609375, -0.017198562622070312, -0.015369415283203125, -0.013540267944335938, -0.01171112060546875, -0.009881973266601562, -0.008052825927734375, -0.0062236785888671875, -0.00439453125, -0.0025653839111328125, -0.000736236572265625, 0.0010929107666015625, 0.00292205810546875, 0.0047512054443359375, 0.006580352783203125, 0.008409500122070312, 0.0102386474609375, 0.012067794799804688, 0.013896942138671875, 0.015726089477539062, 0.01755523681640625, 0.019384384155273438, 0.021213531494140625, 0.023042678833007812, 0.024871826171875, 0.026700973510742188, 0.028530120849609375, 0.030359268188476562, 0.03218841552734375, 0.03401756286621094, 0.035846710205078125, 0.03767585754394531, 0.0395050048828125, 0.04133415222167969, 0.043163299560546875, 0.04499244689941406, 0.04682159423828125, 0.04865074157714844, 0.050479888916015625, 0.05230903625488281, 0.05413818359375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 5.0, 8.0, 21.0, 26.0, 39.0, 57.0, 69.0, 72.0, 122.0, 183.0, 92.0, 88.0, 57.0, 54.0, 29.0, 18.0, 19.0, 12.0, 7.0, 10.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2411346435546875e-05, -2.1777115762233734e-05, -2.1142885088920593e-05, -2.0508654415607452e-05, -1.987442374229431e-05, -1.924019306898117e-05, -1.860596239566803e-05, -1.797173172235489e-05, -1.7337501049041748e-05, -1.6703270375728607e-05, -1.6069039702415466e-05, -1.5434809029102325e-05, -1.4800578355789185e-05, -1.4166347682476044e-05, -1.3532117009162903e-05, -1.2897886335849762e-05, -1.2263655662536621e-05, -1.162942498922348e-05, -1.099519431591034e-05, -1.0360963642597198e-05, -9.726732969284058e-06, -9.092502295970917e-06, -8.458271622657776e-06, -7.824040949344635e-06, -7.189810276031494e-06, -6.555579602718353e-06, -5.921348929405212e-06, -5.2871182560920715e-06, -4.652887582778931e-06, -4.01865690946579e-06, -3.384426236152649e-06, -2.750195562839508e-06, -2.115964889526367e-06, -1.4817342162132263e-06, -8.475035429000854e-07, -2.1327286958694458e-07, 4.209578037261963e-07, 1.0551884770393372e-06, 1.689419150352478e-06, 2.323649823665619e-06, 2.9578804969787598e-06, 3.5921111702919006e-06, 4.2263418436050415e-06, 4.860572516918182e-06, 5.494803190231323e-06, 6.129033863544464e-06, 6.763264536857605e-06, 7.397495210170746e-06, 8.031725883483887e-06, 8.665956556797028e-06, 9.300187230110168e-06, 9.93441790342331e-06, 1.056864857673645e-05, 1.1202879250049591e-05, 1.1837109923362732e-05, 1.2471340596675873e-05, 1.3105571269989014e-05, 1.3739801943302155e-05, 1.4374032616615295e-05, 1.5008263289928436e-05, 1.5642493963241577e-05, 1.6276724636554718e-05, 1.691095530986786e-05, 1.7545185983181e-05, 1.817941665649414e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 13.0, 29.0, 20.0, 34.0, 36.0, 70.0, 113.0, 158.0, 227.0, 339.0, 505.0, 842.0, 1465.0, 2611.0, 5404.0, 11781.0, 32163.0, 104408.0, 377768.0, 351455.0, 103623.0, 31882.0, 11857.0, 5120.0, 2545.0, 1511.0, 933.0, 556.0, 342.0, 212.0, 166.0, 115.0, 74.0, 39.0, 43.0, 30.0, 17.0, 10.0, 9.0, 12.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07281494140625, -0.07030391693115234, -0.06779289245605469, -0.06528186798095703, -0.06277084350585938, -0.06025981903076172, -0.05774879455566406, -0.055237770080566406, -0.05272674560546875, -0.050215721130371094, -0.04770469665527344, -0.04519367218017578, -0.042682647705078125, -0.04017162322998047, -0.03766059875488281, -0.035149574279785156, -0.0326385498046875, -0.030127525329589844, -0.027616500854492188, -0.02510547637939453, -0.022594451904296875, -0.02008342742919922, -0.017572402954101562, -0.015061378479003906, -0.01255035400390625, -0.010039329528808594, -0.0075283050537109375, -0.005017280578613281, -0.002506256103515625, 4.76837158203125e-06, 0.0025157928466796875, 0.005026817321777344, 0.007537841796875, 0.010048866271972656, 0.012559890747070312, 0.015070915222167969, 0.017581939697265625, 0.02009296417236328, 0.022603988647460938, 0.025115013122558594, 0.02762603759765625, 0.030137062072753906, 0.03264808654785156, 0.03515911102294922, 0.037670135498046875, 0.04018115997314453, 0.04269218444824219, 0.045203208923339844, 0.0477142333984375, 0.050225257873535156, 0.05273628234863281, 0.05524730682373047, 0.057758331298828125, 0.06026935577392578, 0.06278038024902344, 0.0652914047241211, 0.06780242919921875, 0.0703134536743164, 0.07282447814941406, 0.07533550262451172, 0.07784652709960938, 0.08035755157470703, 0.08286857604980469, 0.08537960052490234, 0.087890625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 3.0, 3.0, 5.0, 7.0, 9.0, 12.0, 24.0, 20.0, 28.0, 34.0, 52.0, 71.0, 88.0, 103.0, 148.0, 102.0, 82.0, 42.0, 44.0, 35.0, 27.0, 19.0, 17.0, 5.0, 6.0, 6.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05755615234375, -0.05576324462890625, -0.0539703369140625, -0.05217742919921875, -0.050384521484375, -0.04859161376953125, -0.0467987060546875, -0.04500579833984375, -0.043212890625, -0.04141998291015625, -0.0396270751953125, -0.03783416748046875, -0.036041259765625, -0.03424835205078125, -0.0324554443359375, -0.03066253662109375, -0.02886962890625, -0.02707672119140625, -0.0252838134765625, -0.02349090576171875, -0.021697998046875, -0.01990509033203125, -0.0181121826171875, -0.01631927490234375, -0.0145263671875, -0.01273345947265625, -0.0109405517578125, -0.00914764404296875, -0.007354736328125, -0.00556182861328125, -0.0037689208984375, -0.00197601318359375, -0.00018310546875, 0.00160980224609375, 0.0034027099609375, 0.00519561767578125, 0.006988525390625, 0.00878143310546875, 0.0105743408203125, 0.01236724853515625, 0.01416015625, 0.01595306396484375, 0.0177459716796875, 0.01953887939453125, 0.021331787109375, 0.02312469482421875, 0.0249176025390625, 0.02671051025390625, 0.02850341796875, 0.03029632568359375, 0.0320892333984375, 0.03388214111328125, 0.035675048828125, 0.03746795654296875, 0.0392608642578125, 0.04105377197265625, 0.0428466796875, 0.04463958740234375, 0.0464324951171875, 0.04822540283203125, 0.050018310546875, 0.05181121826171875, 0.0536041259765625, 0.05539703369140625, 0.05718994140625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 9.0, 13.0, 17.0, 76.0, 145.0, 236.0, 245.0, 152.0, 70.0, 28.0, 9.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6368203163146973, -1.5886907577514648, -1.5405611991882324, -1.492431640625, -1.4443020820617676, -1.3961725234985352, -1.3480429649353027, -1.2999135255813599, -1.2517839670181274, -1.203654408454895, -1.1555248498916626, -1.1073952913284302, -1.0592657327651978, -1.0111362934112549, -0.9630066752433777, -0.91487717628479, -0.8667475581169128, -0.8186179995536804, -0.770488440990448, -0.7223589420318604, -0.6742293834686279, -0.6260998249053955, -0.5779702663421631, -0.5298407077789307, -0.48171117901802063, -0.4335816204547882, -0.3854520916938782, -0.33732253313064575, -0.28919297456741333, -0.2410634458065033, -0.19293388724327087, -0.14480435848236084, -0.09667479991912842, -0.04854525253176689, -0.000415705144405365, 0.04771384596824646, 0.09584338963031769, 0.14397293329238892, 0.19210249185562134, 0.24023202061653137, 0.2883615791797638, 0.3364911377429962, 0.38462066650390625, 0.43275022506713867, 0.4808797836303711, 0.5290093421936035, 0.5771389007568359, 0.6252683997154236, 0.673397958278656, 0.7215275168418884, 0.7696570754051208, 0.8177865743637085, 0.8659161329269409, 0.9140456914901733, 0.9621752500534058, 1.0103048086166382, 1.0584343671798706, 1.106563925743103, 1.1546934843063354, 1.2028230428695679, 1.2509526014328003, 1.2990820407867432, 1.3472115993499756, 1.395341157913208, 1.4434707164764404]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 7.0, 5.0, 9.0, 7.0, 5.0, 18.0, 10.0, 12.0, 11.0, 19.0, 28.0, 22.0, 32.0, 20.0, 31.0, 36.0, 26.0, 46.0, 52.0, 34.0, 45.0, 36.0, 38.0, 32.0, 44.0, 37.0, 42.0, 37.0, 37.0, 30.0, 33.0, 19.0, 17.0, 21.0, 15.0, 21.0, 12.0, 14.0, 12.0, 8.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.4828285574913025, -0.4659769833087921, -0.44912540912628174, -0.43227383494377136, -0.415422260761261, -0.398570716381073, -0.3817191421985626, -0.36486756801605225, -0.34801599383354187, -0.3311644196510315, -0.3143128454685211, -0.29746127128601074, -0.28060972690582275, -0.26375812292099, -0.246906578540802, -0.23005500435829163, -0.21320343017578125, -0.19635185599327087, -0.1795002818107605, -0.16264872252941132, -0.14579714834690094, -0.12894557416439056, -0.11209400743246078, -0.095242440700531, -0.07839086651802063, -0.06153929606080055, -0.044687725603580475, -0.027836155146360397, -0.01098458468914032, 0.005866989493370056, 0.022718556225299835, 0.039570122957229614, 0.056421756744384766, 0.07327333092689514, 0.09012489765882492, 0.1069764643907547, 0.12382803857326508, 0.14067961275577545, 0.15753117203712463, 0.174382746219635, 0.19123432040214539, 0.20808589458465576, 0.22493746876716614, 0.24178902804851532, 0.2586405873298645, 0.27549219131469727, 0.29234373569488525, 0.30919530987739563, 0.326046884059906, 0.3428984582424164, 0.35975003242492676, 0.37660160660743713, 0.3934531807899475, 0.4103047251701355, 0.4271562993526459, 0.44400787353515625, 0.4608594477176666, 0.477711021900177, 0.4945625960826874, 0.5114141702651978, 0.5282657146453857, 0.5451173186302185, 0.5619688630104065, 0.5788204669952393, 0.5956720113754272]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 0.0, 5.0, 8.0, 5.0, 12.0, 8.0, 16.0, 22.0, 32.0, 35.0, 51.0, 62.0, 73.0, 94.0, 111.0, 150.0, 173.0, 235.0, 292.0, 358.0, 522.0, 656.0, 1075.0, 1762.0, 3424.0, 6230.0, 1022313.0, 5154.0, 2755.0, 1446.0, 897.0, 602.0, 418.0, 334.0, 250.0, 216.0, 154.0, 122.0, 109.0, 87.0, 78.0, 57.0, 44.0, 44.0, 25.0, 26.0, 11.0, 16.0, 13.0, 5.0, 7.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.5101166367530823, -0.49481111764907837, -0.47950559854507446, -0.46420007944107056, -0.44889456033706665, -0.43358904123306274, -0.41828352212905884, -0.40297800302505493, -0.387672483921051, -0.3723669648170471, -0.3570614457130432, -0.3417559266090393, -0.3264504075050354, -0.3111448884010315, -0.2958393692970276, -0.2805338501930237, -0.2652283310890198, -0.24992281198501587, -0.23461729288101196, -0.21931177377700806, -0.20400625467300415, -0.18870073556900024, -0.17339521646499634, -0.15808969736099243, -0.1427842080593109, -0.127478688955307, -0.1121731698513031, -0.0968676507472992, -0.08156213164329529, -0.06625661998987198, -0.05095110088586807, -0.035645581781864166, -0.020340055227279663, -0.0050345370545983315, 0.010270981118083, 0.025576498359441757, 0.04088201746344566, 0.05618753284215927, 0.07149305194616318, 0.08679857105016708, 0.10210409015417099, 0.1174096092581749, 0.1327151209115982, 0.1480206400156021, 0.16332615911960602, 0.17863167822360992, 0.19393719732761383, 0.20924271643161774, 0.22454823553562164, 0.23985375463962555, 0.25515925884246826, 0.27046477794647217, 0.2857702970504761, 0.30107581615448, 0.3163813352584839, 0.3316868543624878, 0.3469923734664917, 0.3622978925704956, 0.3776034116744995, 0.3929089307785034, 0.4082144498825073, 0.42351996898651123, 0.43882548809051514, 0.45413100719451904, 0.46943652629852295]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 6.0, 14.0, 12.0, 44.0, 76.0, 134.0, 260.0, 440.0, 977.0, 3176.0, 51460712.0, 2589.0, 855.0, 459.0, 272.0, 129.0, 71.0, 44.0, 19.0, 8.0, 10.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.461135864257812, -13.101757049560547, -12.742379188537598, -12.383000373840332, -12.023622512817383, -11.664243698120117, -11.304864883422852, -10.945487022399902, -10.586109161376953, -10.226730346679688, -9.867352485656738, -9.507973670959473, -9.148595809936523, -8.789216995239258, -8.429838180541992, -8.070460319519043, -7.711081504821777, -7.35170316696167, -6.9923248291015625, -6.632946014404297, -6.273568153381348, -5.914189338684082, -5.554811000823975, -5.195432662963867, -4.83605432510376, -4.476675987243652, -4.117297649383545, -3.7579190731048584, -3.398540735244751, -3.0391623973846436, -2.679783821105957, -2.3204054832458496, -1.9610261917114258, -1.6016478538513184, -1.2422693967819214, -0.8828909397125244, -0.523512601852417, -0.16413426399230957, 0.19524431228637695, 0.5546226501464844, 0.9140009880065918, 1.2733793258666992, 1.6327577829360962, 1.9921362400054932, 2.3515145778656006, 2.710892915725708, 3.0702714920043945, 3.429649829864502, 3.7890281677246094, 4.148406505584717, 4.507784843444824, 4.86716365814209, 5.226541519165039, 5.585920333862305, 5.945298671722412, 6.3046770095825195, 6.664055347442627, 7.023433685302734, 7.382812023162842, 7.742190361022949, 8.101569175720215, 8.460947036743164, 8.82032585144043, 9.179704666137695, 9.539082527160645]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 8.0, 9.0, 10.0, 17.0, 31.0, 43.0, 69.0, 127.0, 175.0, 252.0, 448.0, 716.0, 1230.0, 2018.0, 3539.0, 5622.0, 9967.0, 17205.0, 30138.0, 53068.0, 93071.0, 159083.0, 257784.0, 382826.0, 1025818.0, 3044189.0, 445323.0, 301240.0, 190758.0, 113970.0, 65532.0, 37203.0, 20872.0, 12068.0, 6825.0, 4025.0, 2455.0, 1430.0, 885.0, 530.0, 328.0, 218.0, 123.0, 70.0, 41.0, 32.0, 20.0, 10.0, 8.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.47412109375, -0.45938873291015625, -0.4446563720703125, -0.42992401123046875, -0.415191650390625, -0.40045928955078125, -0.3857269287109375, -0.37099456787109375, -0.35626220703125, -0.34152984619140625, -0.3267974853515625, -0.31206512451171875, -0.297332763671875, -0.28260040283203125, -0.2678680419921875, -0.25313568115234375, -0.2384033203125, -0.22367095947265625, -0.2089385986328125, -0.19420623779296875, -0.179473876953125, -0.16474151611328125, -0.1500091552734375, -0.13527679443359375, -0.12054443359375, -0.10581207275390625, -0.0910797119140625, -0.07634735107421875, -0.061614990234375, -0.04688262939453125, -0.0321502685546875, -0.01741790771484375, -0.002685546875, 0.01204681396484375, 0.0267791748046875, 0.04151153564453125, 0.056243896484375, 0.07097625732421875, 0.0857086181640625, 0.10044097900390625, 0.11517333984375, 0.12990570068359375, 0.1446380615234375, 0.15937042236328125, 0.174102783203125, 0.18883514404296875, 0.2035675048828125, 0.21829986572265625, 0.2330322265625, 0.24776458740234375, 0.2624969482421875, 0.27722930908203125, 0.291961669921875, 0.30669403076171875, 0.3214263916015625, 0.33615875244140625, 0.35089111328125, 0.36562347412109375, 0.3803558349609375, 0.39508819580078125, 0.409820556640625, 0.42455291748046875, 0.4392852783203125, 0.45401763916015625, 0.46875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 3.0, 2.0, 8.0, 8.0, 6.0, 14.0, 18.0, 23.0, 18.0, 25.0, 27.0, 29.0, 33.0, 46.0, 50.0, 47.0, 60.0, 260.0, 835.0, 92.0, 45.0, 61.0, 42.0, 58.0, 40.0, 32.0, 29.0, 22.0, 17.0, 14.0, 19.0, 12.0, 10.0, 4.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.560546875, -3.430206298828125, -3.29986572265625, -3.169525146484375, -3.0391845703125, -2.908843994140625, -2.77850341796875, -2.648162841796875, -2.517822265625, -2.387481689453125, -2.25714111328125, -2.126800537109375, -1.9964599609375, -1.866119384765625, -1.73577880859375, -1.605438232421875, -1.47509765625, -1.344757080078125, -1.21441650390625, -1.084075927734375, -0.9537353515625, -0.823394775390625, -0.69305419921875, -0.562713623046875, -0.432373046875, -0.302032470703125, -0.17169189453125, -0.041351318359375, 0.0889892578125, 0.219329833984375, 0.34967041015625, 0.480010986328125, 0.6103515625, 0.740692138671875, 0.87103271484375, 1.001373291015625, 1.1317138671875, 1.262054443359375, 1.39239501953125, 1.522735595703125, 1.653076171875, 1.783416748046875, 1.91375732421875, 2.044097900390625, 2.1744384765625, 2.304779052734375, 2.43511962890625, 2.565460205078125, 2.69580078125, 2.826141357421875, 2.95648193359375, 3.086822509765625, 3.2171630859375, 3.347503662109375, 3.47784423828125, 3.608184814453125, 3.738525390625, 3.868865966796875, 3.99920654296875, 4.129547119140625, 4.2598876953125, 4.390228271484375, 4.52056884765625, 4.650909423828125, 4.78125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 7.0, 13.0, 31.0, 37.0, 51.0, 86.0, 143.0, 186.0, 360.0, 530.0, 811.0, 1267.0, 2002.0, 3169.0, 5327.0, 8052.0, 13148.0, 20268.0, 31999.0, 49602.0, 75519.0, 111304.0, 159323.0, 217196.0, 277324.0, 361737.0, 2876094.0, 919415.0, 310966.0, 250368.0, 190162.0, 136919.0, 93830.0, 62304.0, 40750.0, 26139.0, 16748.0, 10447.0, 6654.0, 4179.0, 2562.0, 1611.0, 1032.0, 622.0, 403.0, 264.0, 178.0, 107.0, 65.0, 44.0, 26.0, 19.0, 19.0, 8.0, 6.0, 4.0, 0.0, 2.0], "bins": [-0.284912109375, -0.2762184143066406, -0.26752471923828125, -0.2588310241699219, -0.2501373291015625, -0.24144363403320312, -0.23274993896484375, -0.22405624389648438, -0.215362548828125, -0.20666885375976562, -0.19797515869140625, -0.18928146362304688, -0.1805877685546875, -0.17189407348632812, -0.16320037841796875, -0.15450668334960938, -0.14581298828125, -0.13711929321289062, -0.12842559814453125, -0.11973190307617188, -0.1110382080078125, -0.10234451293945312, -0.09365081787109375, -0.08495712280273438, -0.076263427734375, -0.06756973266601562, -0.05887603759765625, -0.050182342529296875, -0.0414886474609375, -0.032794952392578125, -0.02410125732421875, -0.015407562255859375, -0.0067138671875, 0.001979827880859375, 0.01067352294921875, 0.019367218017578125, 0.0280609130859375, 0.036754608154296875, 0.04544830322265625, 0.054141998291015625, 0.062835693359375, 0.07152938842773438, 0.08022308349609375, 0.08891677856445312, 0.0976104736328125, 0.10630416870117188, 0.11499786376953125, 0.12369155883789062, 0.13238525390625, 0.14107894897460938, 0.14977264404296875, 0.15846633911132812, 0.1671600341796875, 0.17585372924804688, 0.18454742431640625, 0.19324111938476562, 0.201934814453125, 0.21062850952148438, 0.21932220458984375, 0.22801589965820312, 0.2367095947265625, 0.24540328979492188, 0.25409698486328125, 0.2627906799316406, 0.271484375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 5.0, 2.0, 8.0, 11.0, 17.0, 16.0, 14.0, 25.0, 19.0, 37.0, 38.0, 40.0, 37.0, 58.0, 65.0, 47.0, 194.0, 886.0, 101.0, 42.0, 50.0, 44.0, 51.0, 31.0, 27.0, 26.0, 30.0, 19.0, 18.0, 16.0, 13.0, 13.0, 6.0, 9.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.568359375, -3.46173095703125, -3.3551025390625, -3.24847412109375, -3.141845703125, -3.03521728515625, -2.9285888671875, -2.82196044921875, -2.71533203125, -2.60870361328125, -2.5020751953125, -2.39544677734375, -2.288818359375, -2.18218994140625, -2.0755615234375, -1.96893310546875, -1.8623046875, -1.75567626953125, -1.6490478515625, -1.54241943359375, -1.435791015625, -1.32916259765625, -1.2225341796875, -1.11590576171875, -1.00927734375, -0.90264892578125, -0.7960205078125, -0.68939208984375, -0.582763671875, -0.47613525390625, -0.3695068359375, -0.26287841796875, -0.15625, -0.04962158203125, 0.0570068359375, 0.16363525390625, 0.270263671875, 0.37689208984375, 0.4835205078125, 0.59014892578125, 0.69677734375, 0.80340576171875, 0.9100341796875, 1.01666259765625, 1.123291015625, 1.22991943359375, 1.3365478515625, 1.44317626953125, 1.5498046875, 1.65643310546875, 1.7630615234375, 1.86968994140625, 1.976318359375, 2.08294677734375, 2.1895751953125, 2.29620361328125, 2.40283203125, 2.50946044921875, 2.6160888671875, 2.72271728515625, 2.829345703125, 2.93597412109375, 3.0426025390625, 3.14923095703125, 3.255859375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 4.0, 6.0, 11.0, 10.0, 8.0, 9.0, 16.0, 29.0, 38.0, 58.0, 66.0, 78.0, 105.0, 128.0, 198.0, 243.0, 341.0, 510.0, 872.0, 1468.0, 2877.0, 5912.0, 14983.0, 42601.0, 117875.0, 5529323.0, 430905.0, 88615.0, 31591.0, 11684.0, 4864.0, 2333.0, 1267.0, 764.0, 494.0, 264.0, 218.0, 155.0, 124.0, 113.0, 68.0, 64.0, 35.0, 20.0, 20.0, 28.0, 12.0, 10.0, 4.0, 4.0, 9.0, 4.0, 3.0, 1.0, 2.0, 1.0], "bins": [-1.396484375, -1.3552398681640625, -1.313995361328125, -1.2727508544921875, -1.23150634765625, -1.1902618408203125, -1.149017333984375, -1.1077728271484375, -1.0665283203125, -1.0252838134765625, -0.984039306640625, -0.9427947998046875, -0.90155029296875, -0.8603057861328125, -0.819061279296875, -0.7778167724609375, -0.736572265625, -0.6953277587890625, -0.654083251953125, -0.6128387451171875, -0.57159423828125, -0.5303497314453125, -0.489105224609375, -0.4478607177734375, -0.4066162109375, -0.3653717041015625, -0.324127197265625, -0.2828826904296875, -0.24163818359375, -0.2003936767578125, -0.159149169921875, -0.1179046630859375, -0.07666015625, -0.0354156494140625, 0.005828857421875, 0.0470733642578125, 0.08831787109375, 0.1295623779296875, 0.170806884765625, 0.2120513916015625, 0.2532958984375, 0.2945404052734375, 0.335784912109375, 0.3770294189453125, 0.41827392578125, 0.4595184326171875, 0.500762939453125, 0.5420074462890625, 0.583251953125, 0.6244964599609375, 0.665740966796875, 0.7069854736328125, 0.74822998046875, 0.7894744873046875, 0.830718994140625, 0.8719635009765625, 0.9132080078125, 0.9544525146484375, 0.995697021484375, 1.0369415283203125, 1.07818603515625, 1.1194305419921875, 1.160675048828125, 1.2019195556640625, 1.2431640625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 9.0, 9.0, 5.0, 11.0, 7.0, 9.0, 15.0, 19.0, 22.0, 22.0, 28.0, 26.0, 41.0, 22.0, 38.0, 30.0, 42.0, 41.0, 45.0, 294.0, 770.0, 77.0, 38.0, 37.0, 43.0, 32.0, 43.0, 35.0, 30.0, 30.0, 27.0, 23.0, 21.0, 11.0, 14.0, 8.0, 9.0, 9.0, 7.0, 6.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.787109375, -2.7034912109375, -2.619873046875, -2.5362548828125, -2.45263671875, -2.3690185546875, -2.285400390625, -2.2017822265625, -2.1181640625, -2.0345458984375, -1.950927734375, -1.8673095703125, -1.78369140625, -1.7000732421875, -1.616455078125, -1.5328369140625, -1.44921875, -1.3656005859375, -1.281982421875, -1.1983642578125, -1.11474609375, -1.0311279296875, -0.947509765625, -0.8638916015625, -0.7802734375, -0.6966552734375, -0.613037109375, -0.5294189453125, -0.44580078125, -0.3621826171875, -0.278564453125, -0.1949462890625, -0.111328125, -0.0277099609375, 0.055908203125, 0.1395263671875, 0.22314453125, 0.3067626953125, 0.390380859375, 0.4739990234375, 0.5576171875, 0.6412353515625, 0.724853515625, 0.8084716796875, 0.89208984375, 0.9757080078125, 1.059326171875, 1.1429443359375, 1.2265625, 1.3101806640625, 1.393798828125, 1.4774169921875, 1.56103515625, 1.6446533203125, 1.728271484375, 1.8118896484375, 1.8955078125, 1.9791259765625, 2.062744140625, 2.1463623046875, 2.22998046875, 2.3135986328125, 2.397216796875, 2.4808349609375, 2.564453125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 6.0, 1.0, 7.0, 4.0, 18.0, 21.0, 30.0, 47.0, 66.0, 97.0, 215.0, 195.0, 98.0, 63.0, 46.0, 36.0, 31.0, 11.0, 3.0, 6.0, 6.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.649308204650879, -13.836520195007324, -13.023733139038086, -12.210945129394531, -11.398158073425293, -10.585370063781738, -9.7725830078125, -8.959794998168945, -8.14700698852539, -7.334219455718994, -6.521431922912598, -5.708643913269043, -4.895856857299805, -4.08306884765625, -3.2702813148498535, -2.457493782043457, -1.6447067260742188, -0.8319191336631775, -0.01913154125213623, 0.7936561107635498, 1.6064436435699463, 2.419231414794922, 3.2320189476013184, 4.044806480407715, 4.857594013214111, 5.670381546020508, 6.483169078826904, 7.295956611633301, 8.108744621276855, 8.921531677246094, 9.734319686889648, 10.547107696533203, 11.359895706176758, 12.172683715820312, 12.98547077178955, 13.798258781433105, 14.611045837402344, 15.423833847045898, 16.236621856689453, 17.049407958984375, 17.86219596862793, 18.674983978271484, 19.48777198791504, 20.30055809020996, 21.113346099853516, 21.92613410949707, 22.738922119140625, 23.551708221435547, 24.364498138427734, 25.17728614807129, 25.990074157714844, 26.802860260009766, 27.61564826965332, 28.428436279296875, 29.24122428894043, 30.054012298583984, 30.866798400878906, 31.67958641052246, 32.492374420166016, 33.30516052246094, 34.117950439453125, 34.93073654174805, 35.74352264404297, 36.556312561035156, 37.36909866333008]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 5.0, 4.0, 13.0, 12.0, 7.0, 15.0, 23.0, 23.0, 29.0, 25.0, 32.0, 58.0, 84.0, 91.0, 142.0, 106.0, 88.0, 48.0, 36.0, 28.0, 24.0, 19.0, 17.0, 19.0, 12.0, 9.0, 7.0, 4.0, 7.0, 2.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-43.04505157470703, -41.72314453125, -40.40123748779297, -39.0793342590332, -37.75742721557617, -36.43552017211914, -35.11361312866211, -33.79170608520508, -32.46980285644531, -31.14789581298828, -29.825990676879883, -28.50408363342285, -27.182178497314453, -25.860271453857422, -24.53836441040039, -23.21645736694336, -21.894550323486328, -20.572643280029297, -19.2507381439209, -17.928831100463867, -16.60692596435547, -15.285018920898438, -13.963111877441406, -12.641205787658691, -11.319299697875977, -9.997393608093262, -8.675487518310547, -7.353580474853516, -6.031674385070801, -4.709768295288086, -3.387861728668213, -2.06595516204834, -0.744049072265625, 0.577857255935669, 1.899763584136963, 3.221669912338257, 4.543576240539551, 5.865482330322266, 7.187388896942139, 8.509295463562012, 9.831201553344727, 11.153107643127441, 12.475013732910156, 13.796920776367188, 15.118826866149902, 16.440732955932617, 17.76263999938965, 19.084545135498047, 20.406452178955078, 21.72835922241211, 23.050264358520508, 24.37217140197754, 25.694076538085938, 27.01598358154297, 28.337890625, 29.65979766845703, 30.98170280456543, 32.30360794067383, 33.62551498413086, 34.94742202758789, 36.26932907104492, 37.59123229980469, 38.91313934326172, 40.23504638671875, 41.55695343017578]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 10.0, 7.0, 6.0, 22.0, 23.0, 23.0, 37.0, 41.0, 74.0, 91.0, 131.0, 194.0, 313.0, 497.0, 870.0, 1597.0, 3123.0, 6814.0, 18794.0, 77610.0, 3672268.0, 349515.0, 39735.0, 12243.0, 4860.0, 2307.0, 1128.0, 690.0, 416.0, 275.0, 161.0, 125.0, 77.0, 59.0, 33.0, 41.0, 23.0, 11.0, 10.0, 6.0, 8.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.10150146484375, -0.09866523742675781, -0.09582901000976562, -0.09299278259277344, -0.09015655517578125, -0.08732032775878906, -0.08448410034179688, -0.08164787292480469, -0.0788116455078125, -0.07597541809082031, -0.07313919067382812, -0.07030296325683594, -0.06746673583984375, -0.06463050842285156, -0.061794281005859375, -0.05895805358886719, -0.056121826171875, -0.05328559875488281, -0.050449371337890625, -0.04761314392089844, -0.04477691650390625, -0.04194068908691406, -0.039104461669921875, -0.03626823425292969, -0.0334320068359375, -0.030595779418945312, -0.027759552001953125, -0.024923324584960938, -0.02208709716796875, -0.019250869750976562, -0.016414642333984375, -0.013578414916992188, -0.0107421875, -0.007905960083007812, -0.005069732666015625, -0.0022335052490234375, 0.00060272216796875, 0.0034389495849609375, 0.006275177001953125, 0.009111404418945312, 0.0119476318359375, 0.014783859252929688, 0.017620086669921875, 0.020456314086914062, 0.02329254150390625, 0.026128768920898438, 0.028964996337890625, 0.03180122375488281, 0.034637451171875, 0.03747367858886719, 0.040309906005859375, 0.04314613342285156, 0.04598236083984375, 0.04881858825683594, 0.051654815673828125, 0.05449104309082031, 0.0573272705078125, 0.06016349792480469, 0.06299972534179688, 0.06583595275878906, 0.06867218017578125, 0.07150840759277344, 0.07434463500976562, 0.07718086242675781, 0.08001708984375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 4.0, 1.0, 3.0, 5.0, 2.0, 4.0, 7.0, 10.0, 12.0, 12.0, 15.0, 17.0, 18.0, 26.0, 36.0, 59.0, 62.0, 163.0, 210.0, 85.0, 43.0, 44.0, 35.0, 22.0, 19.0, 20.0, 10.0, 9.0, 7.0, 7.0, 7.0, 5.0, 3.0, 3.0, 5.0, 5.0, 4.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02532958984375, -0.024565696716308594, -0.023801803588867188, -0.02303791046142578, -0.022274017333984375, -0.02151012420654297, -0.020746231079101562, -0.019982337951660156, -0.01921844482421875, -0.018454551696777344, -0.017690658569335938, -0.01692676544189453, -0.016162872314453125, -0.015398979187011719, -0.014635086059570312, -0.013871192932128906, -0.0131072998046875, -0.012343406677246094, -0.011579513549804688, -0.010815620422363281, -0.010051727294921875, -0.009287834167480469, -0.008523941040039062, -0.007760047912597656, -0.00699615478515625, -0.006232261657714844, -0.0054683685302734375, -0.004704475402832031, -0.003940582275390625, -0.0031766891479492188, -0.0024127960205078125, -0.0016489028930664062, -0.000885009765625, -0.00012111663818359375, 0.0006427764892578125, 0.0014066696166992188, 0.002170562744140625, 0.0029344558715820312, 0.0036983489990234375, 0.004462242126464844, 0.00522613525390625, 0.005990028381347656, 0.0067539215087890625, 0.007517814636230469, 0.008281707763671875, 0.009045600891113281, 0.009809494018554688, 0.010573387145996094, 0.0113372802734375, 0.012101173400878906, 0.012865066528320312, 0.013628959655761719, 0.014392852783203125, 0.015156745910644531, 0.015920639038085938, 0.016684532165527344, 0.01744842529296875, 0.018212318420410156, 0.018976211547851562, 0.01974010467529297, 0.020503997802734375, 0.02126789093017578, 0.022031784057617188, 0.022795677185058594, 0.0235595703125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 10.0, 13.0, 17.0, 22.0, 27.0, 61.0, 85.0, 170.0, 323.0, 954.0, 3051.0, 12367.0, 72813.0, 1129495.0, 2828733.0, 122123.0, 17846.0, 3958.0, 1254.0, 477.0, 203.0, 111.0, 63.0, 38.0, 23.0, 13.0, 8.0, 7.0, 3.0, 1.0, 4.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1063232421875, -0.10329532623291016, -0.10026741027832031, -0.09723949432373047, -0.09421157836914062, -0.09118366241455078, -0.08815574645996094, -0.0851278305053711, -0.08209991455078125, -0.0790719985961914, -0.07604408264160156, -0.07301616668701172, -0.06998825073242188, -0.06696033477783203, -0.06393241882324219, -0.060904502868652344, -0.0578765869140625, -0.054848670959472656, -0.05182075500488281, -0.04879283905029297, -0.045764923095703125, -0.04273700714111328, -0.03970909118652344, -0.036681175231933594, -0.03365325927734375, -0.030625343322753906, -0.027597427368164062, -0.02456951141357422, -0.021541595458984375, -0.01851367950439453, -0.015485763549804688, -0.012457847595214844, -0.009429931640625, -0.006402015686035156, -0.0033740997314453125, -0.00034618377685546875, 0.002681732177734375, 0.005709648132324219, 0.008737564086914062, 0.011765480041503906, 0.01479339599609375, 0.017821311950683594, 0.020849227905273438, 0.02387714385986328, 0.026905059814453125, 0.02993297576904297, 0.03296089172363281, 0.035988807678222656, 0.0390167236328125, 0.042044639587402344, 0.04507255554199219, 0.04810047149658203, 0.051128387451171875, 0.05415630340576172, 0.05718421936035156, 0.060212135314941406, 0.06324005126953125, 0.0662679672241211, 0.06929588317871094, 0.07232379913330078, 0.07535171508789062, 0.07837963104248047, 0.08140754699707031, 0.08443546295166016, 0.08746337890625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 7.0, 8.0, 8.0, 4.0, 19.0, 14.0, 22.0, 27.0, 31.0, 45.0, 52.0, 78.0, 124.0, 197.0, 347.0, 626.0, 985.0, 520.0, 314.0, 172.0, 123.0, 89.0, 86.0, 44.0, 38.0, 31.0, 20.0, 12.0, 11.0, 4.0, 5.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022186279296875, -0.02137613296508789, -0.02056598663330078, -0.019755840301513672, -0.018945693969726562, -0.018135547637939453, -0.017325401306152344, -0.016515254974365234, -0.015705108642578125, -0.014894962310791016, -0.014084815979003906, -0.013274669647216797, -0.012464523315429688, -0.011654376983642578, -0.010844230651855469, -0.01003408432006836, -0.00922393798828125, -0.00841379165649414, -0.007603645324707031, -0.006793498992919922, -0.0059833526611328125, -0.005173206329345703, -0.004363059997558594, -0.0035529136657714844, -0.002742767333984375, -0.0019326210021972656, -0.0011224746704101562, -0.0003123283386230469, 0.0004978179931640625, 0.0013079643249511719, 0.0021181106567382812, 0.0029282569885253906, 0.0037384033203125, 0.004548549652099609, 0.005358695983886719, 0.006168842315673828, 0.0069789886474609375, 0.007789134979248047, 0.008599281311035156, 0.009409427642822266, 0.010219573974609375, 0.011029720306396484, 0.011839866638183594, 0.012650012969970703, 0.013460159301757812, 0.014270305633544922, 0.015080451965332031, 0.01589059829711914, 0.01670074462890625, 0.01751089096069336, 0.01832103729248047, 0.019131183624267578, 0.019941329956054688, 0.020751476287841797, 0.021561622619628906, 0.022371768951416016, 0.023181915283203125, 0.023992061614990234, 0.024802207946777344, 0.025612354278564453, 0.026422500610351562, 0.027232646942138672, 0.02804279327392578, 0.02885293960571289, 0.0296630859375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 10.0, 31.0, 97.0, 258.0, 329.0, 173.0, 68.0, 20.0, 10.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2873302400112152, -0.277182936668396, -0.2670356333255768, -0.25688835978507996, -0.24674105644226074, -0.23659375309944153, -0.22644644975662231, -0.2162991613149643, -0.20615187287330627, -0.19600456953048706, -0.18585728108882904, -0.17570997774600983, -0.1655626893043518, -0.1554153859615326, -0.14526808261871338, -0.13512079417705536, -0.12497349083423615, -0.11482619494199753, -0.10467889904975891, -0.0945315957069397, -0.08438430726528168, -0.07423700392246246, -0.06408970803022385, -0.05394241213798523, -0.04379511624574661, -0.033647820353507996, -0.02350052259862423, -0.013353224843740463, -0.0032059289515018463, 0.006941366940736771, 0.017088666558265686, 0.027235962450504303, 0.03738325834274292, 0.04753055423498154, 0.057677850127220154, 0.06782515347003937, 0.07797244191169739, 0.0881197452545166, 0.09826704114675522, 0.10841433703899384, 0.11856163293123245, 0.12870892882347107, 0.13885623216629028, 0.1490035206079483, 0.15915082395076752, 0.16929811239242554, 0.17944541573524475, 0.18959271907806396, 0.19974000751972198, 0.2098873108625412, 0.22003459930419922, 0.23018190264701843, 0.24032919108867645, 0.2504764795303345, 0.2606237828731537, 0.2707710862159729, 0.2809183895587921, 0.29106569290161133, 0.30121299624443054, 0.31136026978492737, 0.3215075731277466, 0.3316548764705658, 0.341802179813385, 0.35194945335388184, 0.36209675669670105]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 2.0, 2.0, 8.0, 3.0, 8.0, 8.0, 13.0, 16.0, 15.0, 22.0, 25.0, 38.0, 46.0, 46.0, 26.0, 47.0, 57.0, 48.0, 52.0, 65.0, 49.0, 56.0, 38.0, 44.0, 37.0, 31.0, 35.0, 23.0, 29.0, 29.0, 13.0, 22.0, 9.0, 8.0, 6.0, 6.0, 9.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.10206902027130127, -0.09882151335477829, -0.09557400643825531, -0.09232649207115173, -0.08907898515462875, -0.08583147823810577, -0.0825839638710022, -0.07933645695447922, -0.07608895003795624, -0.07284144312143326, -0.06959393620491028, -0.0663464218378067, -0.06309891492128372, -0.05985140800476074, -0.056603897362947464, -0.053356386721134186, -0.050108879804611206, -0.046861372888088226, -0.04361386224627495, -0.04036635160446167, -0.03711884468793869, -0.03387133777141571, -0.030623827129602432, -0.027376318350434303, -0.024128809571266174, -0.020881300792098045, -0.017633792012929916, -0.014386283233761787, -0.011138774454593658, -0.00789126567542553, -0.0046437568962574005, -0.0013962481170892715, 0.0018512606620788574, 0.005098769441246986, 0.008346278220415115, 0.011593786999583244, 0.014841295778751373, 0.018088804557919502, 0.02133631333708763, 0.02458382211625576, 0.02783133089542389, 0.031078839674592018, 0.03432634845376015, 0.037573859095573425, 0.040821366012096405, 0.044068872928619385, 0.04731638357043266, 0.05056389421224594, 0.05381140112876892, 0.0570589080452919, 0.06030641868710518, 0.06355392932891846, 0.06680143624544144, 0.07004894316196442, 0.073296457529068, 0.07654396444559097, 0.07979147136211395, 0.08303897827863693, 0.08628648519515991, 0.08953399956226349, 0.09278150647878647, 0.09602901339530945, 0.09927652776241302, 0.102524034678936, 0.10577154159545898]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 6.0, 15.0, 22.0, 33.0, 46.0, 69.0, 95.0, 172.0, 217.0, 321.0, 485.0, 766.0, 1170.0, 1736.0, 2735.0, 4753.0, 7903.0, 14722.0, 29842.0, 71374.0, 331052.0, 431888.0, 79688.0, 32028.0, 15810.0, 8368.0, 4933.0, 2946.0, 1870.0, 1172.0, 763.0, 492.0, 354.0, 239.0, 150.0, 108.0, 69.0, 47.0, 31.0, 26.0, 11.0, 12.0, 7.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.08416748046875, -0.08176612854003906, -0.07936477661132812, -0.07696342468261719, -0.07456207275390625, -0.07216072082519531, -0.06975936889648438, -0.06735801696777344, -0.0649566650390625, -0.06255531311035156, -0.060153961181640625, -0.05775260925292969, -0.05535125732421875, -0.05294990539550781, -0.050548553466796875, -0.04814720153808594, -0.045745849609375, -0.04334449768066406, -0.040943145751953125, -0.03854179382324219, -0.03614044189453125, -0.03373908996582031, -0.031337738037109375, -0.028936386108398438, -0.0265350341796875, -0.024133682250976562, -0.021732330322265625, -0.019330978393554688, -0.01692962646484375, -0.014528274536132812, -0.012126922607421875, -0.009725570678710938, -0.00732421875, -0.0049228668212890625, -0.002521514892578125, -0.0001201629638671875, 0.00228118896484375, 0.0046825408935546875, 0.007083892822265625, 0.009485244750976562, 0.0118865966796875, 0.014287948608398438, 0.016689300537109375, 0.019090652465820312, 0.02149200439453125, 0.023893356323242188, 0.026294708251953125, 0.028696060180664062, 0.031097412109375, 0.03349876403808594, 0.035900115966796875, 0.03830146789550781, 0.04070281982421875, 0.04310417175292969, 0.045505523681640625, 0.04790687561035156, 0.0503082275390625, 0.05270957946777344, 0.055110931396484375, 0.05751228332519531, 0.05991363525390625, 0.06231498718261719, 0.06471633911132812, 0.06711769104003906, 0.06951904296875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 2.0, 3.0, 3.0, 5.0, 4.0, 8.0, 12.0, 18.0, 19.0, 18.0, 22.0, 33.0, 36.0, 50.0, 77.0, 205.0, 144.0, 79.0, 52.0, 45.0, 30.0, 19.0, 16.0, 12.0, 8.0, 21.0, 4.0, 6.0, 7.0, 7.0, 2.0, 6.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.02667236328125, -0.02595043182373047, -0.025228500366210938, -0.024506568908691406, -0.023784637451171875, -0.023062705993652344, -0.022340774536132812, -0.02161884307861328, -0.02089691162109375, -0.02017498016357422, -0.019453048706054688, -0.018731117248535156, -0.018009185791015625, -0.017287254333496094, -0.016565322875976562, -0.01584339141845703, -0.0151214599609375, -0.014399528503417969, -0.013677597045898438, -0.012955665588378906, -0.012233734130859375, -0.011511802673339844, -0.010789871215820312, -0.010067939758300781, -0.00934600830078125, -0.008624076843261719, -0.007902145385742188, -0.007180213928222656, -0.006458282470703125, -0.005736351013183594, -0.0050144195556640625, -0.004292488098144531, -0.003570556640625, -0.0028486251831054688, -0.0021266937255859375, -0.0014047622680664062, -0.000682830810546875, 3.910064697265625e-05, 0.0007610321044921875, 0.0014829635620117188, 0.00220489501953125, 0.0029268264770507812, 0.0036487579345703125, 0.004370689392089844, 0.005092620849609375, 0.005814552307128906, 0.0065364837646484375, 0.007258415222167969, 0.0079803466796875, 0.008702278137207031, 0.009424209594726562, 0.010146141052246094, 0.010868072509765625, 0.011590003967285156, 0.012311935424804688, 0.013033866882324219, 0.01375579833984375, 0.014477729797363281, 0.015199661254882812, 0.015921592712402344, 0.016643524169921875, 0.017365455627441406, 0.018087387084960938, 0.01880931854248047, 0.01953125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 4.0, 10.0, 9.0, 14.0, 11.0, 26.0, 24.0, 40.0, 59.0, 80.0, 114.0, 182.0, 330.0, 615.0, 1298.0, 3199.0, 9195.0, 31794.0, 140352.0, 547163.0, 243017.0, 49557.0, 13439.0, 4491.0, 1685.0, 764.0, 410.0, 197.0, 144.0, 99.0, 60.0, 47.0, 37.0, 27.0, 11.0, 17.0, 14.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06927490234375, -0.0670156478881836, -0.06475639343261719, -0.06249713897705078, -0.060237884521484375, -0.05797863006591797, -0.05571937561035156, -0.053460121154785156, -0.05120086669921875, -0.048941612243652344, -0.04668235778808594, -0.04442310333251953, -0.042163848876953125, -0.03990459442138672, -0.03764533996582031, -0.035386085510253906, -0.0331268310546875, -0.030867576599121094, -0.028608322143554688, -0.02634906768798828, -0.024089813232421875, -0.02183055877685547, -0.019571304321289062, -0.017312049865722656, -0.01505279541015625, -0.012793540954589844, -0.010534286499023438, -0.008275032043457031, -0.006015777587890625, -0.0037565231323242188, -0.0014972686767578125, 0.0007619857788085938, 0.003021240234375, 0.005280494689941406, 0.0075397491455078125, 0.009799003601074219, 0.012058258056640625, 0.014317512512207031, 0.016576766967773438, 0.018836021423339844, 0.02109527587890625, 0.023354530334472656, 0.025613784790039062, 0.02787303924560547, 0.030132293701171875, 0.03239154815673828, 0.03465080261230469, 0.036910057067871094, 0.0391693115234375, 0.041428565979003906, 0.04368782043457031, 0.04594707489013672, 0.048206329345703125, 0.05046558380126953, 0.05272483825683594, 0.054984092712402344, 0.05724334716796875, 0.059502601623535156, 0.06176185607910156, 0.06402111053466797, 0.06628036499023438, 0.06853961944580078, 0.07079887390136719, 0.0730581283569336, 0.0753173828125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 8.0, 5.0, 2.0, 7.0, 8.0, 15.0, 8.0, 10.0, 19.0, 28.0, 26.0, 25.0, 29.0, 38.0, 41.0, 56.0, 42.0, 47.0, 32.0, 46.0, 42.0, 49.0, 54.0, 35.0, 50.0, 43.0, 27.0, 24.0, 30.0, 31.0, 24.0, 18.0, 14.0, 21.0, 13.0, 12.0, 6.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.087646484375, -0.0846567153930664, -0.08166694641113281, -0.07867717742919922, -0.07568740844726562, -0.07269763946533203, -0.06970787048339844, -0.06671810150146484, -0.06372833251953125, -0.060738563537597656, -0.05774879455566406, -0.05475902557373047, -0.051769256591796875, -0.04877948760986328, -0.04578971862792969, -0.042799949645996094, -0.0398101806640625, -0.036820411682128906, -0.03383064270019531, -0.03084087371826172, -0.027851104736328125, -0.02486133575439453, -0.021871566772460938, -0.018881797790527344, -0.01589202880859375, -0.012902259826660156, -0.009912490844726562, -0.006922721862792969, -0.003932952880859375, -0.0009431838989257812, 0.0020465850830078125, 0.005036354064941406, 0.008026123046875, 0.011015892028808594, 0.014005661010742188, 0.01699542999267578, 0.019985198974609375, 0.02297496795654297, 0.025964736938476562, 0.028954505920410156, 0.03194427490234375, 0.034934043884277344, 0.03792381286621094, 0.04091358184814453, 0.043903350830078125, 0.04689311981201172, 0.04988288879394531, 0.052872657775878906, 0.0558624267578125, 0.058852195739746094, 0.06184196472167969, 0.06483173370361328, 0.06782150268554688, 0.07081127166748047, 0.07380104064941406, 0.07679080963134766, 0.07978057861328125, 0.08277034759521484, 0.08576011657714844, 0.08874988555908203, 0.09173965454101562, 0.09472942352294922, 0.09771919250488281, 0.1007089614868164, 0.10369873046875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 6.0, 8.0, 10.0, 15.0, 33.0, 45.0, 68.0, 100.0, 160.0, 293.0, 553.0, 1132.0, 2901.0, 9478.0, 56323.0, 754507.0, 196603.0, 18425.0, 4517.0, 1717.0, 723.0, 366.0, 215.0, 137.0, 73.0, 46.0, 34.0, 20.0, 13.0, 9.0, 11.0, 3.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07305908203125, -0.07010364532470703, -0.06714820861816406, -0.0641927719116211, -0.061237335205078125, -0.058281898498535156, -0.05532646179199219, -0.05237102508544922, -0.04941558837890625, -0.04646015167236328, -0.04350471496582031, -0.040549278259277344, -0.037593841552734375, -0.034638404846191406, -0.03168296813964844, -0.02872753143310547, -0.0257720947265625, -0.02281665802001953, -0.019861221313476562, -0.016905784606933594, -0.013950347900390625, -0.010994911193847656, -0.008039474487304688, -0.005084037780761719, -0.00212860107421875, 0.0008268356323242188, 0.0037822723388671875, 0.006737709045410156, 0.009693145751953125, 0.012648582458496094, 0.015604019165039062, 0.01855945587158203, 0.021514892578125, 0.02447032928466797, 0.027425765991210938, 0.030381202697753906, 0.033336639404296875, 0.036292076110839844, 0.03924751281738281, 0.04220294952392578, 0.04515838623046875, 0.04811382293701172, 0.05106925964355469, 0.054024696350097656, 0.056980133056640625, 0.059935569763183594, 0.06289100646972656, 0.06584644317626953, 0.0688018798828125, 0.07175731658935547, 0.07471275329589844, 0.0776681900024414, 0.08062362670898438, 0.08357906341552734, 0.08653450012207031, 0.08948993682861328, 0.09244537353515625, 0.09540081024169922, 0.09835624694824219, 0.10131168365478516, 0.10426712036132812, 0.1072225570678711, 0.11017799377441406, 0.11313343048095703, 0.1160888671875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 4.0, 3.0, 3.0, 1.0, 5.0, 5.0, 11.0, 12.0, 13.0, 21.0, 28.0, 33.0, 32.0, 51.0, 55.0, 63.0, 77.0, 59.0, 51.0, 71.0, 59.0, 60.0, 47.0, 46.0, 41.0, 28.0, 22.0, 22.0, 16.0, 14.0, 9.0, 6.0, 14.0, 5.0, 2.0, 3.0, 3.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-4.1961669921875e-05, -4.0629878640174866e-05, -3.929808735847473e-05, -3.79662960767746e-05, -3.663450479507446e-05, -3.530271351337433e-05, -3.3970922231674194e-05, -3.263913094997406e-05, -3.1307339668273926e-05, -2.997554838657379e-05, -2.8643757104873657e-05, -2.7311965823173523e-05, -2.598017454147339e-05, -2.4648383259773254e-05, -2.331659197807312e-05, -2.1984800696372986e-05, -2.065300941467285e-05, -1.9321218132972717e-05, -1.7989426851272583e-05, -1.665763556957245e-05, -1.5325844287872314e-05, -1.399405300617218e-05, -1.2662261724472046e-05, -1.1330470442771912e-05, -9.998679161071777e-06, -8.666887879371643e-06, -7.335096597671509e-06, -6.0033053159713745e-06, -4.67151403427124e-06, -3.339722752571106e-06, -2.0079314708709717e-06, -6.761401891708374e-07, 6.556510925292969e-07, 1.987442374229431e-06, 3.3192336559295654e-06, 4.6510249376297e-06, 5.982816219329834e-06, 7.314607501029968e-06, 8.646398782730103e-06, 9.978190064430237e-06, 1.1309981346130371e-05, 1.2641772627830505e-05, 1.397356390953064e-05, 1.5305355191230774e-05, 1.6637146472930908e-05, 1.7968937754631042e-05, 1.9300729036331177e-05, 2.063252031803131e-05, 2.1964311599731445e-05, 2.329610288143158e-05, 2.4627894163131714e-05, 2.5959685444831848e-05, 2.7291476726531982e-05, 2.8623268008232117e-05, 2.995505928993225e-05, 3.1286850571632385e-05, 3.261864185333252e-05, 3.3950433135032654e-05, 3.528222441673279e-05, 3.661401569843292e-05, 3.794580698013306e-05, 3.927759826183319e-05, 4.0609389543533325e-05, 4.194118082523346e-05, 4.3272972106933594e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 0.0, 5.0, 7.0, 20.0, 19.0, 31.0, 49.0, 78.0, 137.0, 274.0, 509.0, 1241.0, 3416.0, 13541.0, 139384.0, 805082.0, 70595.0, 9544.0, 2710.0, 977.0, 445.0, 207.0, 113.0, 63.0, 27.0, 26.0, 12.0, 12.0, 8.0, 4.0, 4.0, 2.0, 4.0, 1.0, 5.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1275634765625, -0.12415122985839844, -0.12073898315429688, -0.11732673645019531, -0.11391448974609375, -0.11050224304199219, -0.10708999633789062, -0.10367774963378906, -0.1002655029296875, -0.09685325622558594, -0.09344100952148438, -0.09002876281738281, -0.08661651611328125, -0.08320426940917969, -0.07979202270507812, -0.07637977600097656, -0.072967529296875, -0.06955528259277344, -0.06614303588867188, -0.06273078918457031, -0.05931854248046875, -0.05590629577636719, -0.052494049072265625, -0.04908180236816406, -0.0456695556640625, -0.04225730895996094, -0.038845062255859375, -0.03543281555175781, -0.03202056884765625, -0.028608322143554688, -0.025196075439453125, -0.021783828735351562, -0.01837158203125, -0.014959335327148438, -0.011547088623046875, -0.008134841918945312, -0.00472259521484375, -0.0013103485107421875, 0.002101898193359375, 0.0055141448974609375, 0.0089263916015625, 0.012338638305664062, 0.015750885009765625, 0.019163131713867188, 0.02257537841796875, 0.025987625122070312, 0.029399871826171875, 0.03281211853027344, 0.036224365234375, 0.03963661193847656, 0.043048858642578125, 0.04646110534667969, 0.04987335205078125, 0.05328559875488281, 0.056697845458984375, 0.06011009216308594, 0.0635223388671875, 0.06693458557128906, 0.07034683227539062, 0.07375907897949219, 0.07717132568359375, 0.08058357238769531, 0.08399581909179688, 0.08740806579589844, 0.0908203125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 13.0, 5.0, 16.0, 10.0, 9.0, 17.0, 42.0, 51.0, 69.0, 82.0, 81.0, 101.0, 95.0, 89.0, 78.0, 60.0, 52.0, 32.0, 22.0, 24.0, 11.0, 9.0, 5.0, 5.0, 2.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052581787109375, -0.05039072036743164, -0.04819965362548828, -0.04600858688354492, -0.04381752014160156, -0.0416264533996582, -0.039435386657714844, -0.037244319915771484, -0.035053253173828125, -0.032862186431884766, -0.030671119689941406, -0.028480052947998047, -0.026288986206054688, -0.024097919464111328, -0.02190685272216797, -0.01971578598022461, -0.01752471923828125, -0.01533365249633789, -0.013142585754394531, -0.010951519012451172, -0.008760452270507812, -0.006569385528564453, -0.004378318786621094, -0.0021872520446777344, 3.814697265625e-06, 0.0021948814392089844, 0.004385948181152344, 0.006577014923095703, 0.008768081665039062, 0.010959148406982422, 0.013150215148925781, 0.01534128189086914, 0.0175323486328125, 0.01972341537475586, 0.02191448211669922, 0.024105548858642578, 0.026296615600585938, 0.028487682342529297, 0.030678749084472656, 0.032869815826416016, 0.035060882568359375, 0.037251949310302734, 0.039443016052246094, 0.04163408279418945, 0.04382514953613281, 0.04601621627807617, 0.04820728302001953, 0.05039834976196289, 0.05258941650390625, 0.05478048324584961, 0.05697154998779297, 0.05916261672973633, 0.06135368347167969, 0.06354475021362305, 0.0657358169555664, 0.06792688369750977, 0.07011795043945312, 0.07230901718139648, 0.07450008392333984, 0.0766911506652832, 0.07888221740722656, 0.08107328414916992, 0.08326435089111328, 0.08545541763305664, 0.087646484375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 6.0, 11.0, 17.0, 48.0, 95.0, 266.0, 287.0, 146.0, 61.0, 24.0, 16.0, 6.0, 7.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5372573733329773, -0.503674328327179, -0.4700912833213806, -0.4365082383155823, -0.40292519330978394, -0.3693421483039856, -0.33575907349586487, -0.30217602849006653, -0.2685929834842682, -0.23500993847846985, -0.2014268934726715, -0.16784383356571198, -0.13426078855991364, -0.1006777435541153, -0.06709468364715576, -0.03351163864135742, 7.140636444091797e-05, 0.033654455095529556, 0.0672375038266182, 0.10082055628299713, 0.13440360128879547, 0.1679866462945938, 0.20156970620155334, 0.23515275120735168, 0.26873579621315, 0.30231884121894836, 0.3359018862247467, 0.36948496103286743, 0.40306800603866577, 0.4366510510444641, 0.47023409605026245, 0.5038171410560608, 0.5374002456665039, 0.5709832906723022, 0.6045663356781006, 0.6381493806838989, 0.6717324256896973, 0.7053154706954956, 0.738898515701294, 0.7724815607070923, 0.8060646057128906, 0.839647650718689, 0.8732306957244873, 0.9068137407302856, 0.940396785736084, 0.9739798307418823, 1.0075628757476807, 1.041145920753479, 1.0747289657592773, 1.1083120107650757, 1.141895055770874, 1.1754781007766724, 1.2090611457824707, 1.242644190788269, 1.2762272357940674, 1.3098102807998657, 1.3433934450149536, 1.376976490020752, 1.4105595350265503, 1.4441425800323486, 1.477725625038147, 1.5113086700439453, 1.5448917150497437, 1.578474760055542, 1.6120578050613403]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 1.0, 2.0, 5.0, 1.0, 9.0, 4.0, 8.0, 8.0, 11.0, 19.0, 20.0, 45.0, 73.0, 88.0, 118.0, 147.0, 128.0, 96.0, 60.0, 49.0, 34.0, 14.0, 15.0, 12.0, 9.0, 5.0, 5.0, 3.0, 3.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.849938988685608, -1.7947429418563843, -1.7395468950271606, -1.684350848197937, -1.6291548013687134, -1.5739587545394897, -1.5187625885009766, -1.463566541671753, -1.4083704948425293, -1.3531744480133057, -1.297978401184082, -1.2427823543548584, -1.1875863075256348, -1.1323902606964111, -1.0771942138671875, -1.0219981670379639, -0.9668021202087402, -0.9116060733795166, -0.856410026550293, -0.8012139797210693, -0.7460179328918457, -0.6908218860626221, -0.6356257796287537, -0.58042973279953, -0.5252336859703064, -0.47003763914108276, -0.41484159231185913, -0.3596455156803131, -0.3044494688510895, -0.24925342202186584, -0.19405734539031982, -0.1388612985610962, -0.08366537094116211, -0.02846931666135788, 0.02672673761844635, 0.08192279934883118, 0.1371188461780548, 0.19231489300727844, 0.24751096963882446, 0.3027070164680481, 0.35790306329727173, 0.41309911012649536, 0.468295156955719, 0.5234912633895874, 0.578687310218811, 0.6338833570480347, 0.6890794038772583, 0.7442754507064819, 0.7994714975357056, 0.8546675443649292, 0.9098635911941528, 0.9650596380233765, 1.0202556848526, 1.0754517316818237, 1.130647897720337, 1.1858439445495605, 1.2410399913787842, 1.2962360382080078, 1.3514320850372314, 1.406628131866455, 1.4618241786956787, 1.5170202255249023, 1.572216272354126, 1.6274123191833496, 1.6826083660125732]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 7.0, 1.0, 17.0, 17.0, 23.0, 43.0, 61.0, 102.0, 134.0, 240.0, 372.0, 643.0, 1177.0, 2437.0, 5030.0, 12055.0, 37077.0, 204679.0, 3688597.0, 181115.0, 36960.0, 12484.0, 5346.0, 2466.0, 1249.0, 805.0, 464.0, 221.0, 151.0, 104.0, 72.0, 46.0, 39.0, 17.0, 13.0, 3.0, 7.0, 4.0, 0.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.198486328125, -0.1919727325439453, -0.18545913696289062, -0.17894554138183594, -0.17243194580078125, -0.16591835021972656, -0.15940475463867188, -0.1528911590576172, -0.1463775634765625, -0.1398639678955078, -0.13335037231445312, -0.12683677673339844, -0.12032318115234375, -0.11380958557128906, -0.10729598999023438, -0.10078239440917969, -0.094268798828125, -0.08775520324707031, -0.08124160766601562, -0.07472801208496094, -0.06821441650390625, -0.06170082092285156, -0.055187225341796875, -0.04867362976074219, -0.0421600341796875, -0.03564643859863281, -0.029132843017578125, -0.022619247436523438, -0.01610565185546875, -0.009592056274414062, -0.003078460693359375, 0.0034351348876953125, 0.00994873046875, 0.016462326049804688, 0.022975921630859375, 0.029489517211914062, 0.03600311279296875, 0.04251670837402344, 0.049030303955078125, 0.05554389953613281, 0.0620574951171875, 0.06857109069824219, 0.07508468627929688, 0.08159828186035156, 0.08811187744140625, 0.09462547302246094, 0.10113906860351562, 0.10765266418457031, 0.114166259765625, 0.12067985534667969, 0.12719345092773438, 0.13370704650878906, 0.14022064208984375, 0.14673423767089844, 0.15324783325195312, 0.1597614288330078, 0.1662750244140625, 0.1727886199951172, 0.17930221557617188, 0.18581581115722656, 0.19232940673828125, 0.19884300231933594, 0.20535659790039062, 0.2118701934814453, 0.2183837890625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 3.0, 6.0, 4.0, 7.0, 6.0, 9.0, 9.0, 29.0, 22.0, 30.0, 32.0, 49.0, 71.0, 132.0, 131.0, 117.0, 81.0, 56.0, 32.0, 29.0, 34.0, 20.0, 18.0, 11.0, 12.0, 4.0, 6.0, 6.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0210723876953125, -0.020339012145996094, -0.019605636596679688, -0.01887226104736328, -0.018138885498046875, -0.01740550994873047, -0.016672134399414062, -0.015938758850097656, -0.01520538330078125, -0.014472007751464844, -0.013738632202148438, -0.013005256652832031, -0.012271881103515625, -0.011538505554199219, -0.010805130004882812, -0.010071754455566406, -0.00933837890625, -0.008605003356933594, -0.007871627807617188, -0.007138252258300781, -0.006404876708984375, -0.005671501159667969, -0.0049381256103515625, -0.004204750061035156, -0.00347137451171875, -0.0027379989624023438, -0.0020046234130859375, -0.0012712478637695312, -0.000537872314453125, 0.00019550323486328125, 0.0009288787841796875, 0.0016622543334960938, 0.0023956298828125, 0.0031290054321289062, 0.0038623809814453125, 0.004595756530761719, 0.005329132080078125, 0.006062507629394531, 0.0067958831787109375, 0.007529258728027344, 0.00826263427734375, 0.008996009826660156, 0.009729385375976562, 0.010462760925292969, 0.011196136474609375, 0.011929512023925781, 0.012662887573242188, 0.013396263122558594, 0.014129638671875, 0.014863014221191406, 0.015596389770507812, 0.01632976531982422, 0.017063140869140625, 0.01779651641845703, 0.018529891967773438, 0.019263267517089844, 0.01999664306640625, 0.020730018615722656, 0.021463394165039062, 0.02219676971435547, 0.022930145263671875, 0.02366352081298828, 0.024396896362304688, 0.025130271911621094, 0.0258636474609375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 5.0, 1.0, 2.0, 9.0, 8.0, 12.0, 15.0, 27.0, 47.0, 61.0, 112.0, 163.0, 210.0, 405.0, 776.0, 1632.0, 4044.0, 11229.0, 39163.0, 201437.0, 3053336.0, 757107.0, 90818.0, 21507.0, 6930.0, 2693.0, 1138.0, 606.0, 308.0, 162.0, 101.0, 68.0, 43.0, 25.0, 19.0, 12.0, 13.0, 7.0, 6.0, 8.0, 3.0, 3.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.140625, -0.13590240478515625, -0.1311798095703125, -0.12645721435546875, -0.121734619140625, -0.11701202392578125, -0.1122894287109375, -0.10756683349609375, -0.10284423828125, -0.09812164306640625, -0.0933990478515625, -0.08867645263671875, -0.083953857421875, -0.07923126220703125, -0.0745086669921875, -0.06978607177734375, -0.0650634765625, -0.06034088134765625, -0.0556182861328125, -0.05089569091796875, -0.046173095703125, -0.04145050048828125, -0.0367279052734375, -0.03200531005859375, -0.02728271484375, -0.02256011962890625, -0.0178375244140625, -0.01311492919921875, -0.008392333984375, -0.00366973876953125, 0.0010528564453125, 0.00577545166015625, 0.010498046875, 0.01522064208984375, 0.0199432373046875, 0.02466583251953125, 0.029388427734375, 0.03411102294921875, 0.0388336181640625, 0.04355621337890625, 0.04827880859375, 0.05300140380859375, 0.0577239990234375, 0.06244659423828125, 0.067169189453125, 0.07189178466796875, 0.0766143798828125, 0.08133697509765625, 0.0860595703125, 0.09078216552734375, 0.0955047607421875, 0.10022735595703125, 0.104949951171875, 0.10967254638671875, 0.1143951416015625, 0.11911773681640625, 0.12384033203125, 0.12856292724609375, 0.1332855224609375, 0.13800811767578125, 0.142730712890625, 0.14745330810546875, 0.1521759033203125, 0.15689849853515625, 0.16162109375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 9.0, 5.0, 7.0, 13.0, 21.0, 18.0, 39.0, 46.0, 47.0, 80.0, 123.0, 219.0, 392.0, 1174.0, 871.0, 341.0, 213.0, 138.0, 95.0, 64.0, 41.0, 27.0, 19.0, 16.0, 11.0, 6.0, 7.0, 7.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025604248046875, -0.024687767028808594, -0.023771286010742188, -0.02285480499267578, -0.021938323974609375, -0.02102184295654297, -0.020105361938476562, -0.019188880920410156, -0.01827239990234375, -0.017355918884277344, -0.016439437866210938, -0.015522956848144531, -0.014606475830078125, -0.013689994812011719, -0.012773513793945312, -0.011857032775878906, -0.0109405517578125, -0.010024070739746094, -0.009107589721679688, -0.008191108703613281, -0.007274627685546875, -0.006358146667480469, -0.0054416656494140625, -0.004525184631347656, -0.00360870361328125, -0.0026922225952148438, -0.0017757415771484375, -0.0008592605590820312, 5.7220458984375e-05, 0.0009737014770507812, 0.0018901824951171875, 0.0028066635131835938, 0.00372314453125, 0.004639625549316406, 0.0055561065673828125, 0.006472587585449219, 0.007389068603515625, 0.008305549621582031, 0.009222030639648438, 0.010138511657714844, 0.01105499267578125, 0.011971473693847656, 0.012887954711914062, 0.013804435729980469, 0.014720916748046875, 0.01563739776611328, 0.016553878784179688, 0.017470359802246094, 0.0183868408203125, 0.019303321838378906, 0.020219802856445312, 0.02113628387451172, 0.022052764892578125, 0.02296924591064453, 0.023885726928710938, 0.024802207946777344, 0.02571868896484375, 0.026635169982910156, 0.027551651000976562, 0.02846813201904297, 0.029384613037109375, 0.03030109405517578, 0.031217575073242188, 0.032134056091308594, 0.033050537109375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 9.0, 42.0, 109.0, 275.0, 292.0, 178.0, 60.0, 13.0, 6.0, 6.0, 1.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19298139214515686, -0.1829526126384735, -0.17292381823062897, -0.16289502382278442, -0.15286624431610107, -0.14283746480941772, -0.13280867040157318, -0.12277988344430923, -0.11275109648704529, -0.10272230952978134, -0.0926935225725174, -0.08266473561525345, -0.0726359486579895, -0.06260716170072556, -0.05257837474346161, -0.04254958778619766, -0.032520800828933716, -0.02249201387166977, -0.012463226914405823, -0.0024344399571418762, 0.00759434700012207, 0.017623133957386017, 0.027651920914649963, 0.03768070787191391, 0.047709494829177856, 0.0577382817864418, 0.06776706874370575, 0.0777958557009697, 0.08782464265823364, 0.09785342961549759, 0.10788221657276154, 0.11791100353002548, 0.12793979048728943, 0.13796856999397278, 0.14799736440181732, 0.15802615880966187, 0.16805493831634521, 0.17808371782302856, 0.1881125122308731, 0.19814130663871765, 0.208170086145401, 0.21819886565208435, 0.2282276600599289, 0.23825645446777344, 0.2482852339744568, 0.25831401348114014, 0.2683427929878235, 0.2783716022968292, 0.2884003818035126, 0.2984291613101959, 0.30845797061920166, 0.318486750125885, 0.32851552963256836, 0.3385443091392517, 0.34857308864593506, 0.3586018979549408, 0.36863067746162415, 0.3786594569683075, 0.38868826627731323, 0.3987170457839966, 0.40874582529067993, 0.4187746047973633, 0.42880338430404663, 0.43883219361305237, 0.4488609731197357]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 4.0, 16.0, 17.0, 16.0, 22.0, 32.0, 36.0, 43.0, 59.0, 78.0, 66.0, 80.0, 92.0, 77.0, 56.0, 57.0, 46.0, 42.0, 31.0, 28.0, 23.0, 15.0, 14.0, 9.0, 7.0, 7.0, 3.0, 5.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1550167202949524, -0.15049254894256592, -0.14596837759017944, -0.14144420623779297, -0.1369200348854065, -0.13239586353302002, -0.12787169218063354, -0.12334752082824707, -0.1188233494758606, -0.11429917812347412, -0.10977500677108765, -0.10525083541870117, -0.1007266640663147, -0.09620249271392822, -0.09167832136154175, -0.08715415000915527, -0.0826299786567688, -0.07810580730438232, -0.07358163595199585, -0.06905746459960938, -0.0645332932472229, -0.060009121894836426, -0.05548495054244995, -0.05096077919006348, -0.046436607837677, -0.04191243648529053, -0.03738826513290405, -0.03286409378051758, -0.028339922428131104, -0.02381575107574463, -0.019291579723358154, -0.01476740837097168, -0.010243237018585205, -0.0057190656661987305, -0.0011948943138122559, 0.0033292770385742188, 0.007853448390960693, 0.012377619743347168, 0.016901791095733643, 0.021425962448120117, 0.025950133800506592, 0.030474305152893066, 0.03499847650527954, 0.039522647857666016, 0.04404681921005249, 0.048570990562438965, 0.05309516191482544, 0.057619333267211914, 0.06214350461959839, 0.06666767597198486, 0.07119184732437134, 0.07571601867675781, 0.08024019002914429, 0.08476436138153076, 0.08928853273391724, 0.09381270408630371, 0.09833687543869019, 0.10286104679107666, 0.10738521814346313, 0.11190938949584961, 0.11643356084823608, 0.12095773220062256, 0.12548190355300903, 0.1300060749053955, 0.13453024625778198]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 6.0, 4.0, 3.0, 4.0, 7.0, 14.0, 11.0, 17.0, 29.0, 30.0, 40.0, 88.0, 75.0, 135.0, 200.0, 348.0, 499.0, 755.0, 1241.0, 2062.0, 3452.0, 6255.0, 12144.0, 25351.0, 62115.0, 214958.0, 497036.0, 134698.0, 44945.0, 19446.0, 9660.0, 5190.0, 2965.0, 1751.0, 1076.0, 608.0, 423.0, 270.0, 214.0, 120.0, 80.0, 73.0, 41.0, 34.0, 23.0, 14.0, 16.0, 12.0, 4.0, 7.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.10882568359375, -0.1055612564086914, -0.10229682922363281, -0.09903240203857422, -0.09576797485351562, -0.09250354766845703, -0.08923912048339844, -0.08597469329833984, -0.08271026611328125, -0.07944583892822266, -0.07618141174316406, -0.07291698455810547, -0.06965255737304688, -0.06638813018798828, -0.06312370300292969, -0.059859275817871094, -0.0565948486328125, -0.053330421447753906, -0.05006599426269531, -0.04680156707763672, -0.043537139892578125, -0.04027271270751953, -0.03700828552246094, -0.033743858337402344, -0.03047943115234375, -0.027215003967285156, -0.023950576782226562, -0.02068614959716797, -0.017421722412109375, -0.014157295227050781, -0.010892868041992188, -0.007628440856933594, -0.004364013671875, -0.0010995864868164062, 0.0021648406982421875, 0.005429267883300781, 0.008693695068359375, 0.011958122253417969, 0.015222549438476562, 0.018486976623535156, 0.02175140380859375, 0.025015830993652344, 0.028280258178710938, 0.03154468536376953, 0.034809112548828125, 0.03807353973388672, 0.04133796691894531, 0.044602394104003906, 0.0478668212890625, 0.051131248474121094, 0.05439567565917969, 0.05766010284423828, 0.060924530029296875, 0.06418895721435547, 0.06745338439941406, 0.07071781158447266, 0.07398223876953125, 0.07724666595458984, 0.08051109313964844, 0.08377552032470703, 0.08703994750976562, 0.09030437469482422, 0.09356880187988281, 0.0968332290649414, 0.10009765625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 8.0, 4.0, 2.0, 2.0, 5.0, 7.0, 7.0, 8.0, 13.0, 15.0, 14.0, 20.0, 28.0, 44.0, 43.0, 68.0, 100.0, 130.0, 120.0, 85.0, 54.0, 58.0, 35.0, 24.0, 21.0, 13.0, 20.0, 10.0, 12.0, 4.0, 3.0, 4.0, 8.0, 5.0, 1.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0231475830078125, -0.022467374801635742, -0.021787166595458984, -0.021106958389282227, -0.02042675018310547, -0.01974654197692871, -0.019066333770751953, -0.018386125564575195, -0.017705917358398438, -0.01702570915222168, -0.016345500946044922, -0.015665292739868164, -0.014985084533691406, -0.014304876327514648, -0.01362466812133789, -0.012944459915161133, -0.012264251708984375, -0.011584043502807617, -0.01090383529663086, -0.010223627090454102, -0.009543418884277344, -0.008863210678100586, -0.008183002471923828, -0.00750279426574707, -0.0068225860595703125, -0.006142377853393555, -0.005462169647216797, -0.004781961441040039, -0.004101753234863281, -0.0034215450286865234, -0.0027413368225097656, -0.002061128616333008, -0.00138092041015625, -0.0007007122039794922, -2.0503997802734375e-05, 0.0006597042083740234, 0.0013399124145507812, 0.002020120620727539, 0.002700328826904297, 0.0033805370330810547, 0.0040607452392578125, 0.00474095344543457, 0.005421161651611328, 0.006101369857788086, 0.006781578063964844, 0.0074617862701416016, 0.00814199447631836, 0.008822202682495117, 0.009502410888671875, 0.010182619094848633, 0.01086282730102539, 0.011543035507202148, 0.012223243713378906, 0.012903451919555664, 0.013583660125732422, 0.01426386833190918, 0.014944076538085938, 0.015624284744262695, 0.016304492950439453, 0.01698470115661621, 0.01766490936279297, 0.018345117568969727, 0.019025325775146484, 0.019705533981323242, 0.0203857421875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 1.0, 11.0, 9.0, 10.0, 17.0, 18.0, 40.0, 62.0, 82.0, 140.0, 217.0, 406.0, 749.0, 1468.0, 3274.0, 9272.0, 33653.0, 187660.0, 605458.0, 161643.0, 30181.0, 8129.0, 3005.0, 1385.0, 673.0, 375.0, 228.0, 145.0, 73.0, 53.0, 41.0, 20.0, 17.0, 5.0, 12.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.097900390625, -0.09478759765625, -0.0916748046875, -0.08856201171875, -0.08544921875, -0.08233642578125, -0.0792236328125, -0.07611083984375, -0.072998046875, -0.06988525390625, -0.0667724609375, -0.06365966796875, -0.060546875, -0.05743408203125, -0.0543212890625, -0.05120849609375, -0.048095703125, -0.04498291015625, -0.0418701171875, -0.03875732421875, -0.03564453125, -0.03253173828125, -0.0294189453125, -0.02630615234375, -0.023193359375, -0.02008056640625, -0.0169677734375, -0.01385498046875, -0.0107421875, -0.00762939453125, -0.0045166015625, -0.00140380859375, 0.001708984375, 0.00482177734375, 0.0079345703125, 0.01104736328125, 0.01416015625, 0.01727294921875, 0.0203857421875, 0.02349853515625, 0.026611328125, 0.02972412109375, 0.0328369140625, 0.03594970703125, 0.0390625, 0.04217529296875, 0.0452880859375, 0.04840087890625, 0.051513671875, 0.05462646484375, 0.0577392578125, 0.06085205078125, 0.06396484375, 0.06707763671875, 0.0701904296875, 0.07330322265625, 0.076416015625, 0.07952880859375, 0.0826416015625, 0.08575439453125, 0.0888671875, 0.09197998046875, 0.0950927734375, 0.09820556640625, 0.101318359375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 5.0, 3.0, 3.0, 4.0, 5.0, 10.0, 13.0, 22.0, 19.0, 37.0, 28.0, 30.0, 41.0, 58.0, 46.0, 59.0, 50.0, 70.0, 56.0, 54.0, 49.0, 49.0, 49.0, 50.0, 36.0, 33.0, 32.0, 27.0, 21.0, 8.0, 13.0, 12.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.09783935546875, -0.09509849548339844, -0.09235763549804688, -0.08961677551269531, -0.08687591552734375, -0.08413505554199219, -0.08139419555664062, -0.07865333557128906, -0.0759124755859375, -0.07317161560058594, -0.07043075561523438, -0.06768989562988281, -0.06494903564453125, -0.06220817565917969, -0.059467315673828125, -0.05672645568847656, -0.053985595703125, -0.05124473571777344, -0.048503875732421875, -0.04576301574707031, -0.04302215576171875, -0.04028129577636719, -0.037540435791015625, -0.03479957580566406, -0.0320587158203125, -0.029317855834960938, -0.026576995849609375, -0.023836135864257812, -0.02109527587890625, -0.018354415893554688, -0.015613555908203125, -0.012872695922851562, -0.0101318359375, -0.0073909759521484375, -0.004650115966796875, -0.0019092559814453125, 0.00083160400390625, 0.0035724639892578125, 0.006313323974609375, 0.009054183959960938, 0.0117950439453125, 0.014535903930664062, 0.017276763916015625, 0.020017623901367188, 0.02275848388671875, 0.025499343872070312, 0.028240203857421875, 0.030981063842773438, 0.033721923828125, 0.03646278381347656, 0.039203643798828125, 0.04194450378417969, 0.04468536376953125, 0.04742622375488281, 0.050167083740234375, 0.05290794372558594, 0.0556488037109375, 0.05838966369628906, 0.061130523681640625, 0.06387138366699219, 0.06661224365234375, 0.06935310363769531, 0.07209396362304688, 0.07483482360839844, 0.07757568359375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 8.0, 11.0, 13.0, 20.0, 24.0, 32.0, 50.0, 87.0, 145.0, 220.0, 392.0, 816.0, 1822.0, 4952.0, 17845.0, 135905.0, 763815.0, 99894.0, 14932.0, 4301.0, 1616.0, 794.0, 339.0, 187.0, 108.0, 63.0, 54.0, 29.0, 29.0, 22.0, 8.0, 9.0, 3.0, 4.0, 5.0, 1.0, 0.0, 3.0, 3.0], "bins": [-0.21875, -0.2134714126586914, -0.2081928253173828, -0.20291423797607422, -0.19763565063476562, -0.19235706329345703, -0.18707847595214844, -0.18179988861083984, -0.17652130126953125, -0.17124271392822266, -0.16596412658691406, -0.16068553924560547, -0.15540695190429688, -0.15012836456298828, -0.1448497772216797, -0.1395711898803711, -0.1342926025390625, -0.1290140151977539, -0.12373542785644531, -0.11845684051513672, -0.11317825317382812, -0.10789966583251953, -0.10262107849121094, -0.09734249114990234, -0.09206390380859375, -0.08678531646728516, -0.08150672912597656, -0.07622814178466797, -0.07094955444335938, -0.06567096710205078, -0.06039237976074219, -0.055113792419433594, -0.049835205078125, -0.044556617736816406, -0.03927803039550781, -0.03399944305419922, -0.028720855712890625, -0.02344226837158203, -0.018163681030273438, -0.012885093688964844, -0.00760650634765625, -0.0023279190063476562, 0.0029506683349609375, 0.008229255676269531, 0.013507843017578125, 0.01878643035888672, 0.024065017700195312, 0.029343605041503906, 0.0346221923828125, 0.039900779724121094, 0.04517936706542969, 0.05045795440673828, 0.055736541748046875, 0.06101512908935547, 0.06629371643066406, 0.07157230377197266, 0.07685089111328125, 0.08212947845458984, 0.08740806579589844, 0.09268665313720703, 0.09796524047851562, 0.10324382781982422, 0.10852241516113281, 0.1138010025024414, 0.11907958984375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 3.0, 1.0, 4.0, 6.0, 17.0, 25.0, 30.0, 49.0, 63.0, 84.0, 111.0, 123.0, 109.0, 106.0, 81.0, 57.0, 46.0, 32.0, 23.0, 16.0, 3.0, 5.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011849403381347656, -0.00011452659964561462, -0.00011055916547775269, -0.00010659173130989075, -0.00010262429714202881, -9.865686297416687e-05, -9.468942880630493e-05, -9.072199463844299e-05, -8.675456047058105e-05, -8.278712630271912e-05, -7.881969213485718e-05, -7.485225796699524e-05, -7.08848237991333e-05, -6.691738963127136e-05, -6.294995546340942e-05, -5.8982521295547485e-05, -5.501508712768555e-05, -5.104765295982361e-05, -4.708021879196167e-05, -4.311278462409973e-05, -3.914535045623779e-05, -3.5177916288375854e-05, -3.1210482120513916e-05, -2.7243047952651978e-05, -2.327561378479004e-05, -1.93081796169281e-05, -1.5340745449066162e-05, -1.1373311281204224e-05, -7.405877113342285e-06, -3.4384429454803467e-06, 5.289912223815918e-07, 4.49642539024353e-06, 8.463859558105469e-06, 1.2431293725967407e-05, 1.6398727893829346e-05, 2.0366162061691284e-05, 2.4333596229553223e-05, 2.830103039741516e-05, 3.22684645652771e-05, 3.623589873313904e-05, 4.0203332901000977e-05, 4.4170767068862915e-05, 4.8138201236724854e-05, 5.210563540458679e-05, 5.607306957244873e-05, 6.004050374031067e-05, 6.400793790817261e-05, 6.797537207603455e-05, 7.194280624389648e-05, 7.591024041175842e-05, 7.987767457962036e-05, 8.38451087474823e-05, 8.781254291534424e-05, 9.177997708320618e-05, 9.574741125106812e-05, 9.971484541893005e-05, 0.00010368227958679199, 0.00010764971375465393, 0.00011161714792251587, 0.00011558458209037781, 0.00011955201625823975, 0.00012351945042610168, 0.00012748688459396362, 0.00013145431876182556, 0.0001354217529296875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 6.0, 3.0, 3.0, 4.0, 5.0, 7.0, 21.0, 22.0, 20.0, 26.0, 47.0, 68.0, 132.0, 197.0, 320.0, 614.0, 1446.0, 3277.0, 10297.0, 48882.0, 414320.0, 490756.0, 59444.0, 11965.0, 3557.0, 1467.0, 720.0, 337.0, 203.0, 130.0, 81.0, 40.0, 35.0, 28.0, 23.0, 16.0, 9.0, 9.0, 9.0, 5.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12548828125, -0.12157249450683594, -0.11765670776367188, -0.11374092102050781, -0.10982513427734375, -0.10590934753417969, -0.10199356079101562, -0.09807777404785156, -0.0941619873046875, -0.09024620056152344, -0.08633041381835938, -0.08241462707519531, -0.07849884033203125, -0.07458305358886719, -0.07066726684570312, -0.06675148010253906, -0.062835693359375, -0.05891990661621094, -0.055004119873046875, -0.05108833312988281, -0.04717254638671875, -0.04325675964355469, -0.039340972900390625, -0.03542518615722656, -0.0315093994140625, -0.027593612670898438, -0.023677825927734375, -0.019762039184570312, -0.01584625244140625, -0.011930465698242188, -0.008014678955078125, -0.0040988922119140625, -0.00018310546875, 0.0037326812744140625, 0.007648468017578125, 0.011564254760742188, 0.01548004150390625, 0.019395828247070312, 0.023311614990234375, 0.027227401733398438, 0.0311431884765625, 0.03505897521972656, 0.038974761962890625, 0.04289054870605469, 0.04680633544921875, 0.05072212219238281, 0.054637908935546875, 0.05855369567871094, 0.062469482421875, 0.06638526916503906, 0.07030105590820312, 0.07421684265136719, 0.07813262939453125, 0.08204841613769531, 0.08596420288085938, 0.08987998962402344, 0.0937957763671875, 0.09771156311035156, 0.10162734985351562, 0.10554313659667969, 0.10945892333984375, 0.11337471008300781, 0.11729049682617188, 0.12120628356933594, 0.1251220703125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 6.0, 12.0, 13.0, 20.0, 20.0, 20.0, 46.0, 57.0, 74.0, 104.0, 117.0, 89.0, 95.0, 72.0, 58.0, 42.0, 27.0, 32.0, 18.0, 22.0, 13.0, 5.0, 5.0, 9.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0653076171875, -0.06297492980957031, -0.060642242431640625, -0.05830955505371094, -0.05597686767578125, -0.05364418029785156, -0.051311492919921875, -0.04897880554199219, -0.0466461181640625, -0.04431343078613281, -0.041980743408203125, -0.03964805603027344, -0.03731536865234375, -0.03498268127441406, -0.032649993896484375, -0.030317306518554688, -0.027984619140625, -0.025651931762695312, -0.023319244384765625, -0.020986557006835938, -0.01865386962890625, -0.016321182250976562, -0.013988494873046875, -0.011655807495117188, -0.0093231201171875, -0.0069904327392578125, -0.004657745361328125, -0.0023250579833984375, 7.62939453125e-06, 0.0023403167724609375, 0.004673004150390625, 0.0070056915283203125, 0.00933837890625, 0.011671066284179688, 0.014003753662109375, 0.016336441040039062, 0.01866912841796875, 0.021001815795898438, 0.023334503173828125, 0.025667190551757812, 0.0279998779296875, 0.030332565307617188, 0.032665252685546875, 0.03499794006347656, 0.03733062744140625, 0.03966331481933594, 0.041996002197265625, 0.04432868957519531, 0.046661376953125, 0.04899406433105469, 0.051326751708984375, 0.05365943908691406, 0.05599212646484375, 0.05832481384277344, 0.060657501220703125, 0.06299018859863281, 0.0653228759765625, 0.06765556335449219, 0.06998825073242188, 0.07232093811035156, 0.07465362548828125, 0.07698631286621094, 0.07931900024414062, 0.08165168762207031, 0.083984375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 13.0, 40.0, 152.0, 438.0, 266.0, 65.0, 16.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.279052972793579, -1.2293123006820679, -1.1795716285705566, -1.1298309564590454, -1.0800902843475342, -1.030349612236023, -0.9806089997291565, -0.9308683276176453, -0.881127655506134, -0.8313869833946228, -0.7816463112831116, -0.7319056987762451, -0.6821650266647339, -0.6324243545532227, -0.5826836824417114, -0.5329430103302002, -0.48320233821868896, -0.43346166610717773, -0.3837209939956665, -0.33398035168647766, -0.28423967957496643, -0.2344990074634552, -0.18475836515426636, -0.13501769304275513, -0.0852770209312439, -0.03553635627031326, 0.01420430839061737, 0.06394496560096741, 0.11368563771247864, 0.16342630982398987, 0.2131669521331787, 0.26290762424468994, 0.3126484155654907, 0.36238908767700195, 0.4121297597885132, 0.461870402097702, 0.5116111040115356, 0.5613517761230469, 0.6110923886299133, 0.6608330607414246, 0.7105737328529358, 0.760314404964447, 0.8100550770759583, 0.8597956895828247, 0.9095363616943359, 0.9592770338058472, 1.0090177059173584, 1.0587583780288696, 1.1084990501403809, 1.158239722251892, 1.2079803943634033, 1.2577210664749146, 1.3074617385864258, 1.357202410697937, 1.4069430828094482, 1.45668363571167, 1.5064244270324707, 1.556165099143982, 1.6059057712554932, 1.6556464433670044, 1.7053871154785156, 1.7551277875900269, 1.804868459701538, 1.8546090126037598, 1.904349684715271]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 1.0, 3.0, 3.0, 5.0, 4.0, 6.0, 11.0, 12.0, 14.0, 15.0, 19.0, 27.0, 38.0, 47.0, 52.0, 60.0, 72.0, 68.0, 80.0, 63.0, 69.0, 63.0, 46.0, 53.0, 36.0, 32.0, 30.0, 17.0, 15.0, 11.0, 5.0, 2.0, 6.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.6587620973587036, -0.6381540894508362, -0.6175460815429688, -0.5969380736351013, -0.5763300657272339, -0.5557220578193665, -0.535114049911499, -0.5145059823989868, -0.4938980042934418, -0.47328999638557434, -0.4526819884777069, -0.4320739805698395, -0.41146594285964966, -0.3908579349517822, -0.3702499270439148, -0.34964191913604736, -0.32903391122817993, -0.3084259033203125, -0.28781789541244507, -0.26720988750457764, -0.246601864695549, -0.22599385678768158, -0.20538583397865295, -0.18477782607078552, -0.1641698181629181, -0.14356181025505066, -0.12295379489660263, -0.1023457795381546, -0.08173777163028717, -0.06112976372241974, -0.04052174836397171, -0.01991373300552368, 0.00069427490234375, 0.02130228653550148, 0.04191029816865921, 0.06251831352710724, 0.08312632143497467, 0.1037343293428421, 0.12434234470129013, 0.14495036005973816, 0.1655583679676056, 0.18616637587547302, 0.20677438378334045, 0.22738240659236908, 0.2479904145002365, 0.26859843730926514, 0.28920644521713257, 0.309814453125, 0.33042246103286743, 0.35103046894073486, 0.3716384768486023, 0.3922464847564697, 0.41285449266433716, 0.4334625005722046, 0.4540705382823944, 0.47467854619026184, 0.4952865540981293, 0.5158945918083191, 0.5365025997161865, 0.557110607624054, 0.5777186155319214, 0.5983266234397888, 0.6189346313476562, 0.6395426392555237, 0.6601506471633911]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 9.0, 6.0, 15.0, 18.0, 36.0, 32.0, 52.0, 57.0, 67.0, 102.0, 147.0, 163.0, 273.0, 341.0, 421.0, 594.0, 940.0, 1339.0, 2120.0, 3652.0, 6864.0, 14459.0, 38972.0, 182900.0, 3590924.0, 265041.0, 47462.0, 17002.0, 8115.0, 4293.0, 2522.0, 1576.0, 1099.0, 778.0, 544.0, 387.0, 252.0, 173.0, 153.0, 98.0, 71.0, 49.0, 48.0, 40.0, 22.0, 17.0, 9.0, 22.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.1978759765625, -0.19161033630371094, -0.18534469604492188, -0.1790790557861328, -0.17281341552734375, -0.1665477752685547, -0.16028213500976562, -0.15401649475097656, -0.1477508544921875, -0.14148521423339844, -0.13521957397460938, -0.1289539337158203, -0.12268829345703125, -0.11642265319824219, -0.11015701293945312, -0.10389137268066406, -0.097625732421875, -0.09136009216308594, -0.08509445190429688, -0.07882881164550781, -0.07256317138671875, -0.06629753112792969, -0.060031890869140625, -0.05376625061035156, -0.0475006103515625, -0.04123497009277344, -0.034969329833984375, -0.028703689575195312, -0.02243804931640625, -0.016172409057617188, -0.009906768798828125, -0.0036411285400390625, 0.00262451171875, 0.008890151977539062, 0.015155792236328125, 0.021421432495117188, 0.02768707275390625, 0.03395271301269531, 0.040218353271484375, 0.04648399353027344, 0.0527496337890625, 0.05901527404785156, 0.06528091430664062, 0.07154655456542969, 0.07781219482421875, 0.08407783508300781, 0.09034347534179688, 0.09660911560058594, 0.102874755859375, 0.10914039611816406, 0.11540603637695312, 0.12167167663574219, 0.12793731689453125, 0.1342029571533203, 0.14046859741210938, 0.14673423767089844, 0.1529998779296875, 0.15926551818847656, 0.16553115844726562, 0.1717967987060547, 0.17806243896484375, 0.1843280792236328, 0.19059371948242188, 0.19685935974121094, 0.203125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 8.0, 2.0, 7.0, 4.0, 5.0, 5.0, 9.0, 21.0, 15.0, 22.0, 47.0, 46.0, 49.0, 75.0, 104.0, 120.0, 109.0, 90.0, 47.0, 49.0, 33.0, 29.0, 23.0, 13.0, 15.0, 12.0, 6.0, 3.0, 9.0, 6.0, 7.0, 1.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0202789306640625, -0.019596576690673828, -0.018914222717285156, -0.018231868743896484, -0.017549514770507812, -0.01686716079711914, -0.01618480682373047, -0.015502452850341797, -0.014820098876953125, -0.014137744903564453, -0.013455390930175781, -0.01277303695678711, -0.012090682983398438, -0.011408329010009766, -0.010725975036621094, -0.010043621063232422, -0.00936126708984375, -0.008678913116455078, -0.007996559143066406, -0.007314205169677734, -0.0066318511962890625, -0.005949497222900391, -0.005267143249511719, -0.004584789276123047, -0.003902435302734375, -0.003220081329345703, -0.0025377273559570312, -0.0018553733825683594, -0.0011730194091796875, -0.0004906654357910156, 0.00019168853759765625, 0.0008740425109863281, 0.001556396484375, 0.002238750457763672, 0.0029211044311523438, 0.0036034584045410156, 0.0042858123779296875, 0.004968166351318359, 0.005650520324707031, 0.006332874298095703, 0.007015228271484375, 0.007697582244873047, 0.008379936218261719, 0.00906229019165039, 0.009744644165039062, 0.010426998138427734, 0.011109352111816406, 0.011791706085205078, 0.01247406005859375, 0.013156414031982422, 0.013838768005371094, 0.014521121978759766, 0.015203475952148438, 0.01588582992553711, 0.01656818389892578, 0.017250537872314453, 0.017932891845703125, 0.018615245819091797, 0.01929759979248047, 0.01997995376586914, 0.020662307739257812, 0.021344661712646484, 0.022027015686035156, 0.022709369659423828, 0.0233917236328125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 6.0, 11.0, 13.0, 28.0, 40.0, 70.0, 100.0, 187.0, 463.0, 1279.0, 4400.0, 21362.0, 225256.0, 3748624.0, 168311.0, 18094.0, 3897.0, 1200.0, 419.0, 212.0, 97.0, 68.0, 36.0, 36.0, 18.0, 12.0, 8.0, 6.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.309326171875, -0.300079345703125, -0.29083251953125, -0.281585693359375, -0.2723388671875, -0.263092041015625, -0.25384521484375, -0.244598388671875, -0.2353515625, -0.226104736328125, -0.21685791015625, -0.207611083984375, -0.1983642578125, -0.189117431640625, -0.17987060546875, -0.170623779296875, -0.161376953125, -0.152130126953125, -0.14288330078125, -0.133636474609375, -0.1243896484375, -0.115142822265625, -0.10589599609375, -0.096649169921875, -0.08740234375, -0.078155517578125, -0.06890869140625, -0.059661865234375, -0.0504150390625, -0.041168212890625, -0.03192138671875, -0.022674560546875, -0.013427734375, -0.004180908203125, 0.00506591796875, 0.014312744140625, 0.0235595703125, 0.032806396484375, 0.04205322265625, 0.051300048828125, 0.060546875, 0.069793701171875, 0.07904052734375, 0.088287353515625, 0.0975341796875, 0.106781005859375, 0.11602783203125, 0.125274658203125, 0.134521484375, 0.143768310546875, 0.15301513671875, 0.162261962890625, 0.1715087890625, 0.180755615234375, 0.19000244140625, 0.199249267578125, 0.20849609375, 0.217742919921875, 0.22698974609375, 0.236236572265625, 0.2454833984375, 0.254730224609375, 0.26397705078125, 0.273223876953125, 0.282470703125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 3.0, 7.0, 14.0, 13.0, 25.0, 31.0, 42.0, 42.0, 108.0, 173.0, 330.0, 827.0, 1440.0, 438.0, 221.0, 115.0, 78.0, 50.0, 30.0, 24.0, 12.0, 8.0, 9.0, 12.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.034027099609375, -0.0327754020690918, -0.031523704528808594, -0.03027200698852539, -0.029020309448242188, -0.027768611907958984, -0.02651691436767578, -0.025265216827392578, -0.024013519287109375, -0.022761821746826172, -0.02151012420654297, -0.020258426666259766, -0.019006729125976562, -0.01775503158569336, -0.016503334045410156, -0.015251636505126953, -0.01399993896484375, -0.012748241424560547, -0.011496543884277344, -0.01024484634399414, -0.008993148803710938, -0.007741451263427734, -0.006489753723144531, -0.005238056182861328, -0.003986358642578125, -0.002734661102294922, -0.0014829635620117188, -0.00023126602172851562, 0.0010204315185546875, 0.0022721290588378906, 0.0035238265991210938, 0.004775524139404297, 0.0060272216796875, 0.007278919219970703, 0.008530616760253906, 0.00978231430053711, 0.011034011840820312, 0.012285709381103516, 0.013537406921386719, 0.014789104461669922, 0.016040802001953125, 0.017292499542236328, 0.01854419708251953, 0.019795894622802734, 0.021047592163085938, 0.02229928970336914, 0.023550987243652344, 0.024802684783935547, 0.02605438232421875, 0.027306079864501953, 0.028557777404785156, 0.02980947494506836, 0.031061172485351562, 0.032312870025634766, 0.03356456756591797, 0.03481626510620117, 0.036067962646484375, 0.03731966018676758, 0.03857135772705078, 0.039823055267333984, 0.04107475280761719, 0.04232645034790039, 0.043578147888183594, 0.0448298454284668, 0.04608154296875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 6.0, 45.0, 253.0, 526.0, 146.0, 25.0, 8.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17907801270484924, -0.15777893364429474, -0.13647985458374023, -0.11518077552318573, -0.09388169646263123, -0.07258261740207672, -0.05128353834152222, -0.029984459280967712, -0.008685380220413208, 0.012613698840141296, 0.0339127779006958, 0.055211856961250305, 0.07651093602180481, 0.09781001508235931, 0.11910909414291382, 0.14040817320346832, 0.16170725226402283, 0.18300633132457733, 0.20430541038513184, 0.22560448944568634, 0.24690356850624084, 0.26820266246795654, 0.28950172662734985, 0.31080079078674316, 0.33209988474845886, 0.35339897871017456, 0.37469804286956787, 0.3959971070289612, 0.4172962009906769, 0.4385952949523926, 0.4598943591117859, 0.4811934232711792, 0.5024925470352173, 0.5237916111946106, 0.5450906753540039, 0.566389799118042, 0.5876888632774353, 0.6089879274368286, 0.6302870512008667, 0.65158611536026, 0.6728851795196533, 0.6941842436790466, 0.7154833078384399, 0.736782431602478, 0.7580814957618713, 0.7793805599212646, 0.8006796836853027, 0.821978747844696, 0.8432778120040894, 0.8645768761634827, 0.885875940322876, 0.9071750640869141, 0.9284741282463074, 0.9497731924057007, 0.9710723161697388, 0.9923713803291321, 1.0136704444885254, 1.0349695682525635, 1.056268572807312, 1.07756769657135, 1.0988667011260986, 1.1201658248901367, 1.1414649486541748, 1.1627639532089233, 1.1840630769729614]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 9.0, 6.0, 8.0, 15.0, 17.0, 17.0, 29.0, 41.0, 47.0, 50.0, 51.0, 60.0, 67.0, 65.0, 76.0, 79.0, 68.0, 52.0, 47.0, 44.0, 40.0, 26.0, 26.0, 18.0, 13.0, 8.0, 4.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13987332582473755, -0.13462258875370026, -0.12937185168266296, -0.12412110716104507, -0.11887036263942719, -0.11361962556838989, -0.1083688884973526, -0.10311815142631531, -0.09786740690469742, -0.09261666983366013, -0.08736592531204224, -0.08211518824100494, -0.07686445116996765, -0.07161370664834976, -0.06636296957731247, -0.06111222878098488, -0.05586148798465729, -0.0506107471883297, -0.045360006392002106, -0.04010926932096481, -0.03485852852463722, -0.02960778772830963, -0.02435705065727234, -0.019106309860944748, -0.013855569064617157, -0.00860482919961214, -0.0033540893346071243, 0.0018966495990753174, 0.007147390395402908, 0.0123981311917305, 0.017648868262767792, 0.022899609059095383, 0.028150349855422974, 0.033401090651750565, 0.038651831448078156, 0.04390256851911545, 0.04915330931544304, 0.05440405011177063, 0.05965478718280792, 0.06490552425384521, 0.0701562687754631, 0.0754070058465004, 0.08065775036811829, 0.08590848743915558, 0.09115922451019287, 0.09640996903181076, 0.10166070610284805, 0.10691145062446594, 0.11216218769550323, 0.11741292476654053, 0.12266366928815842, 0.1279143989086151, 0.1331651508808136, 0.1384158879518509, 0.14366662502288818, 0.14891736209392548, 0.15416809916496277, 0.15941883623600006, 0.16466957330703735, 0.16992032527923584, 0.17517106235027313, 0.18042179942131042, 0.18567253649234772, 0.190923273563385, 0.1961740255355835]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 8.0, 4.0, 4.0, 6.0, 7.0, 11.0, 29.0, 36.0, 33.0, 55.0, 84.0, 110.0, 195.0, 315.0, 525.0, 864.0, 1412.0, 2577.0, 5307.0, 12258.0, 32483.0, 111144.0, 457812.0, 308831.0, 72156.0, 23634.0, 9300.0, 4211.0, 2071.0, 1181.0, 684.0, 403.0, 283.0, 185.0, 107.0, 77.0, 54.0, 36.0, 22.0, 18.0, 11.0, 9.0, 5.0, 6.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1593017578125, -0.15459442138671875, -0.1498870849609375, -0.14517974853515625, -0.140472412109375, -0.13576507568359375, -0.1310577392578125, -0.12635040283203125, -0.12164306640625, -0.11693572998046875, -0.1122283935546875, -0.10752105712890625, -0.102813720703125, -0.09810638427734375, -0.0933990478515625, -0.08869171142578125, -0.083984375, -0.07927703857421875, -0.0745697021484375, -0.06986236572265625, -0.065155029296875, -0.06044769287109375, -0.0557403564453125, -0.05103302001953125, -0.04632568359375, -0.04161834716796875, -0.0369110107421875, -0.03220367431640625, -0.027496337890625, -0.02278900146484375, -0.0180816650390625, -0.01337432861328125, -0.0086669921875, -0.00395965576171875, 0.0007476806640625, 0.00545501708984375, 0.010162353515625, 0.01486968994140625, 0.0195770263671875, 0.02428436279296875, 0.02899169921875, 0.03369903564453125, 0.0384063720703125, 0.04311370849609375, 0.047821044921875, 0.05252838134765625, 0.0572357177734375, 0.06194305419921875, 0.066650390625, 0.07135772705078125, 0.0760650634765625, 0.08077239990234375, 0.085479736328125, 0.09018707275390625, 0.0948944091796875, 0.09960174560546875, 0.10430908203125, 0.10901641845703125, 0.1137237548828125, 0.11843109130859375, 0.123138427734375, 0.12784576416015625, 0.1325531005859375, 0.13726043701171875, 0.1419677734375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 5.0, 8.0, 5.0, 9.0, 15.0, 10.0, 14.0, 29.0, 19.0, 47.0, 79.0, 83.0, 96.0, 110.0, 97.0, 81.0, 78.0, 48.0, 42.0, 29.0, 22.0, 15.0, 13.0, 10.0, 7.0, 8.0, 2.0, 6.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0192108154296875, -0.018521785736083984, -0.01783275604248047, -0.017143726348876953, -0.016454696655273438, -0.015765666961669922, -0.015076637268066406, -0.01438760757446289, -0.013698577880859375, -0.01300954818725586, -0.012320518493652344, -0.011631488800048828, -0.010942459106445312, -0.010253429412841797, -0.009564399719238281, -0.008875370025634766, -0.00818634033203125, -0.007497310638427734, -0.006808280944824219, -0.006119251251220703, -0.0054302215576171875, -0.004741191864013672, -0.004052162170410156, -0.0033631324768066406, -0.002674102783203125, -0.0019850730895996094, -0.0012960433959960938, -0.0006070137023925781, 8.20159912109375e-05, 0.0007710456848144531, 0.0014600753784179688, 0.0021491050720214844, 0.002838134765625, 0.0035271644592285156, 0.004216194152832031, 0.004905223846435547, 0.0055942535400390625, 0.006283283233642578, 0.006972312927246094, 0.007661342620849609, 0.008350372314453125, 0.00903940200805664, 0.009728431701660156, 0.010417461395263672, 0.011106491088867188, 0.011795520782470703, 0.012484550476074219, 0.013173580169677734, 0.01386260986328125, 0.014551639556884766, 0.015240669250488281, 0.015929698944091797, 0.016618728637695312, 0.017307758331298828, 0.017996788024902344, 0.01868581771850586, 0.019374847412109375, 0.02006387710571289, 0.020752906799316406, 0.021441936492919922, 0.022130966186523438, 0.022819995880126953, 0.02350902557373047, 0.024198055267333984, 0.0248870849609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 3.0, 11.0, 6.0, 14.0, 16.0, 18.0, 27.0, 50.0, 58.0, 100.0, 129.0, 250.0, 390.0, 684.0, 1546.0, 4284.0, 19283.0, 126172.0, 615546.0, 236696.0, 32369.0, 6712.0, 2031.0, 884.0, 483.0, 281.0, 163.0, 101.0, 70.0, 48.0, 27.0, 23.0, 17.0, 15.0, 11.0, 7.0, 3.0, 5.0, 5.0, 1.0, 3.0, 2.0, 3.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1739501953125, -0.16765975952148438, -0.16136932373046875, -0.15507888793945312, -0.1487884521484375, -0.14249801635742188, -0.13620758056640625, -0.12991714477539062, -0.123626708984375, -0.11733627319335938, -0.11104583740234375, -0.10475540161132812, -0.0984649658203125, -0.09217453002929688, -0.08588409423828125, -0.07959365844726562, -0.07330322265625, -0.06701278686523438, -0.06072235107421875, -0.054431915283203125, -0.0481414794921875, -0.041851043701171875, -0.03556060791015625, -0.029270172119140625, -0.022979736328125, -0.016689300537109375, -0.01039886474609375, -0.004108428955078125, 0.0021820068359375, 0.008472442626953125, 0.01476287841796875, 0.021053314208984375, 0.02734375, 0.033634185791015625, 0.03992462158203125, 0.046215057373046875, 0.0525054931640625, 0.058795928955078125, 0.06508636474609375, 0.07137680053710938, 0.077667236328125, 0.08395767211914062, 0.09024810791015625, 0.09653854370117188, 0.1028289794921875, 0.10911941528320312, 0.11540985107421875, 0.12170028686523438, 0.12799072265625, 0.13428115844726562, 0.14057159423828125, 0.14686203002929688, 0.1531524658203125, 0.15944290161132812, 0.16573333740234375, 0.17202377319335938, 0.178314208984375, 0.18460464477539062, 0.19089508056640625, 0.19718551635742188, 0.2034759521484375, 0.20976638793945312, 0.21605682373046875, 0.22234725952148438, 0.2286376953125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 5.0, 6.0, 8.0, 10.0, 4.0, 9.0, 12.0, 29.0, 19.0, 26.0, 21.0, 32.0, 19.0, 34.0, 31.0, 37.0, 49.0, 46.0, 39.0, 48.0, 48.0, 52.0, 44.0, 32.0, 42.0, 36.0, 27.0, 33.0, 34.0, 33.0, 25.0, 19.0, 22.0, 8.0, 11.0, 9.0, 9.0, 9.0, 4.0, 5.0, 6.0, 3.0, 2.0, 4.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07415771484375, -0.07146263122558594, -0.06876754760742188, -0.06607246398925781, -0.06337738037109375, -0.06068229675292969, -0.057987213134765625, -0.05529212951660156, -0.0525970458984375, -0.04990196228027344, -0.047206878662109375, -0.04451179504394531, -0.04181671142578125, -0.03912162780761719, -0.036426544189453125, -0.03373146057128906, -0.031036376953125, -0.028341293334960938, -0.025646209716796875, -0.022951126098632812, -0.02025604248046875, -0.017560958862304688, -0.014865875244140625, -0.012170791625976562, -0.0094757080078125, -0.0067806243896484375, -0.004085540771484375, -0.0013904571533203125, 0.00130462646484375, 0.0039997100830078125, 0.006694793701171875, 0.009389877319335938, 0.0120849609375, 0.014780044555664062, 0.017475128173828125, 0.020170211791992188, 0.02286529541015625, 0.025560379028320312, 0.028255462646484375, 0.030950546264648438, 0.0336456298828125, 0.03634071350097656, 0.039035797119140625, 0.04173088073730469, 0.04442596435546875, 0.04712104797363281, 0.049816131591796875, 0.05251121520996094, 0.055206298828125, 0.05790138244628906, 0.060596466064453125, 0.06329154968261719, 0.06598663330078125, 0.06868171691894531, 0.07137680053710938, 0.07407188415527344, 0.0767669677734375, 0.07946205139160156, 0.08215713500976562, 0.08485221862792969, 0.08754730224609375, 0.09024238586425781, 0.09293746948242188, 0.09563255310058594, 0.09832763671875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 6.0, 5.0, 8.0, 11.0, 17.0, 29.0, 46.0, 62.0, 99.0, 172.0, 382.0, 636.0, 1248.0, 2794.0, 7011.0, 21499.0, 92707.0, 483973.0, 349325.0, 62457.0, 15881.0, 5567.0, 2272.0, 1087.0, 576.0, 272.0, 176.0, 83.0, 58.0, 28.0, 18.0, 17.0, 9.0, 6.0, 6.0, 4.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11090087890625, -0.10730934143066406, -0.10371780395507812, -0.10012626647949219, -0.09653472900390625, -0.09294319152832031, -0.08935165405273438, -0.08576011657714844, -0.0821685791015625, -0.07857704162597656, -0.07498550415039062, -0.07139396667480469, -0.06780242919921875, -0.06421089172363281, -0.060619354248046875, -0.05702781677246094, -0.053436279296875, -0.04984474182128906, -0.046253204345703125, -0.04266166687011719, -0.03907012939453125, -0.03547859191894531, -0.031887054443359375, -0.028295516967773438, -0.0247039794921875, -0.021112442016601562, -0.017520904541015625, -0.013929367065429688, -0.01033782958984375, -0.0067462921142578125, -0.003154754638671875, 0.0004367828369140625, 0.0040283203125, 0.0076198577880859375, 0.011211395263671875, 0.014802932739257812, 0.01839447021484375, 0.021986007690429688, 0.025577545166015625, 0.029169082641601562, 0.0327606201171875, 0.03635215759277344, 0.039943695068359375, 0.04353523254394531, 0.04712677001953125, 0.05071830749511719, 0.054309844970703125, 0.05790138244628906, 0.061492919921875, 0.06508445739746094, 0.06867599487304688, 0.07226753234863281, 0.07585906982421875, 0.07945060729980469, 0.08304214477539062, 0.08663368225097656, 0.0902252197265625, 0.09381675720214844, 0.09740829467773438, 0.10099983215332031, 0.10459136962890625, 0.10818290710449219, 0.11177444458007812, 0.11536598205566406, 0.11895751953125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 9.0, 10.0, 16.0, 19.0, 42.0, 39.0, 42.0, 54.0, 74.0, 85.0, 96.0, 101.0, 90.0, 86.0, 56.0, 53.0, 41.0, 25.0, 26.0, 6.0, 10.0, 6.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.654594421386719e-05, -8.392985910177231e-05, -8.131377398967743e-05, -7.869768887758255e-05, -7.608160376548767e-05, -7.346551865339279e-05, -7.084943354129791e-05, -6.823334842920303e-05, -6.561726331710815e-05, -6.300117820501328e-05, -6.0385093092918396e-05, -5.776900798082352e-05, -5.515292286872864e-05, -5.253683775663376e-05, -4.992075264453888e-05, -4.7304667532444e-05, -4.468858242034912e-05, -4.207249730825424e-05, -3.945641219615936e-05, -3.6840327084064484e-05, -3.4224241971969604e-05, -3.1608156859874725e-05, -2.8992071747779846e-05, -2.6375986635684967e-05, -2.3759901523590088e-05, -2.114381641149521e-05, -1.852773129940033e-05, -1.591164618730545e-05, -1.3295561075210571e-05, -1.0679475963115692e-05, -8.063390851020813e-06, -5.447305738925934e-06, -2.8312206268310547e-06, -2.1513551473617554e-07, 2.4009495973587036e-06, 5.017034709453583e-06, 7.633119821548462e-06, 1.0249204933643341e-05, 1.286529004573822e-05, 1.54813751578331e-05, 1.809746026992798e-05, 2.0713545382022858e-05, 2.3329630494117737e-05, 2.5945715606212616e-05, 2.8561800718307495e-05, 3.1177885830402374e-05, 3.3793970942497253e-05, 3.641005605459213e-05, 3.902614116668701e-05, 4.164222627878189e-05, 4.425831139087677e-05, 4.687439650297165e-05, 4.949048161506653e-05, 5.210656672716141e-05, 5.472265183925629e-05, 5.7338736951351166e-05, 5.9954822063446045e-05, 6.257090717554092e-05, 6.51869922876358e-05, 6.780307739973068e-05, 7.041916251182556e-05, 7.303524762392044e-05, 7.565133273601532e-05, 7.82674178481102e-05, 8.088350296020508e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 6.0, 4.0, 5.0, 3.0, 7.0, 13.0, 10.0, 17.0, 29.0, 58.0, 61.0, 104.0, 167.0, 299.0, 551.0, 1192.0, 3179.0, 10573.0, 46612.0, 358577.0, 537408.0, 68261.0, 14362.0, 4106.0, 1444.0, 661.0, 341.0, 173.0, 113.0, 71.0, 58.0, 36.0, 25.0, 8.0, 11.0, 5.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.142578125, -0.1381378173828125, -0.133697509765625, -0.1292572021484375, -0.12481689453125, -0.1203765869140625, -0.115936279296875, -0.1114959716796875, -0.1070556640625, -0.1026153564453125, -0.098175048828125, -0.0937347412109375, -0.08929443359375, -0.0848541259765625, -0.080413818359375, -0.0759735107421875, -0.071533203125, -0.0670928955078125, -0.062652587890625, -0.0582122802734375, -0.05377197265625, -0.0493316650390625, -0.044891357421875, -0.0404510498046875, -0.0360107421875, -0.0315704345703125, -0.027130126953125, -0.0226898193359375, -0.01824951171875, -0.0138092041015625, -0.009368896484375, -0.0049285888671875, -0.00048828125, 0.0039520263671875, 0.008392333984375, 0.0128326416015625, 0.01727294921875, 0.0217132568359375, 0.026153564453125, 0.0305938720703125, 0.0350341796875, 0.0394744873046875, 0.043914794921875, 0.0483551025390625, 0.05279541015625, 0.0572357177734375, 0.061676025390625, 0.0661163330078125, 0.070556640625, 0.0749969482421875, 0.079437255859375, 0.0838775634765625, 0.08831787109375, 0.0927581787109375, 0.097198486328125, 0.1016387939453125, 0.1060791015625, 0.1105194091796875, 0.114959716796875, 0.1194000244140625, 0.12384033203125, 0.1282806396484375, 0.132720947265625, 0.1371612548828125, 0.1416015625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 6.0, 3.0, 7.0, 6.0, 6.0, 5.0, 4.0, 8.0, 8.0, 6.0, 20.0, 13.0, 23.0, 24.0, 39.0, 27.0, 53.0, 61.0, 59.0, 71.0, 65.0, 66.0, 75.0, 50.0, 49.0, 49.0, 35.0, 27.0, 20.0, 18.0, 15.0, 14.0, 7.0, 14.0, 10.0, 11.0, 6.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.05047607421875, -0.04904937744140625, -0.0476226806640625, -0.04619598388671875, -0.044769287109375, -0.04334259033203125, -0.0419158935546875, -0.04048919677734375, -0.0390625, -0.03763580322265625, -0.0362091064453125, -0.03478240966796875, -0.033355712890625, -0.03192901611328125, -0.0305023193359375, -0.02907562255859375, -0.02764892578125, -0.02622222900390625, -0.0247955322265625, -0.02336883544921875, -0.021942138671875, -0.02051544189453125, -0.0190887451171875, -0.01766204833984375, -0.0162353515625, -0.01480865478515625, -0.0133819580078125, -0.01195526123046875, -0.010528564453125, -0.00910186767578125, -0.0076751708984375, -0.00624847412109375, -0.00482177734375, -0.00339508056640625, -0.0019683837890625, -0.00054168701171875, 0.000885009765625, 0.00231170654296875, 0.0037384033203125, 0.00516510009765625, 0.006591796875, 0.00801849365234375, 0.0094451904296875, 0.01087188720703125, 0.012298583984375, 0.01372528076171875, 0.0151519775390625, 0.01657867431640625, 0.01800537109375, 0.01943206787109375, 0.0208587646484375, 0.02228546142578125, 0.023712158203125, 0.02513885498046875, 0.0265655517578125, 0.02799224853515625, 0.0294189453125, 0.03084564208984375, 0.0322723388671875, 0.03369903564453125, 0.035125732421875, 0.03655242919921875, 0.0379791259765625, 0.03940582275390625, 0.04083251953125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 9.0, 23.0, 92.0, 238.0, 333.0, 188.0, 77.0, 30.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2105929851531982, -1.1513837575912476, -1.0921745300292969, -1.0329654216766357, -0.9737561345100403, -0.9145469665527344, -0.8553377389907837, -0.796128511428833, -0.7369192838668823, -0.6777100563049316, -0.6185008883476257, -0.559291660785675, -0.5000824332237244, -0.44087323546409607, -0.3816640377044678, -0.3224548101425171, -0.2632456421852112, -0.2040364295244217, -0.1448272168636322, -0.0856180191040039, -0.026408806443214417, 0.03280040621757507, 0.09200960397720337, 0.15121883153915405, 0.21042802929878235, 0.26963722705841064, 0.32884645462036133, 0.3880556523799896, 0.4472648501396179, 0.5064740777015686, 0.5656832456588745, 0.6248924732208252, 0.6841017007827759, 0.7433109283447266, 0.8025200963020325, 0.8617293238639832, 0.9209385514259338, 0.9801477193832397, 1.0393569469451904, 1.0985661745071411, 1.1577754020690918, 1.2169846296310425, 1.2761938571929932, 1.3354029655456543, 1.394612193107605, 1.4538214206695557, 1.5130306482315063, 1.572239875793457, 1.6314489841461182, 1.6906582117080688, 1.7498674392700195, 1.8090765476226807, 1.8682857751846313, 1.927495002746582, 1.9867042303085327, 2.0459134578704834, 2.1051228046417236, 2.1643319129943848, 2.223541259765625, 2.282750368118286, 2.3419597148895264, 2.4011688232421875, 2.4603781700134277, 2.519587278366089, 2.57879638671875]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 5.0, 2.0, 8.0, 11.0, 8.0, 14.0, 24.0, 24.0, 33.0, 29.0, 52.0, 42.0, 57.0, 51.0, 46.0, 61.0, 72.0, 55.0, 63.0, 45.0, 44.0, 45.0, 29.0, 25.0, 37.0, 26.0, 25.0, 20.0, 12.0, 10.0, 8.0, 11.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8658173084259033, -0.8387893438339233, -0.8117614388465881, -0.7847334742546082, -0.757705569267273, -0.730677604675293, -0.703649640083313, -0.676621675491333, -0.6495937705039978, -0.6225658059120178, -0.5955379009246826, -0.5685099363327026, -0.5414819717407227, -0.5144540667533875, -0.48742610216140747, -0.4603981673717499, -0.4333702325820923, -0.4063422977924347, -0.3793143630027771, -0.3522863984107971, -0.3252584636211395, -0.29823052883148193, -0.27120256423950195, -0.24417462944984436, -0.21714669466018677, -0.19011875987052917, -0.1630908101797104, -0.1360628604888916, -0.10903492569923401, -0.08200699090957642, -0.05497904121875763, -0.027951091527938843, -0.00092315673828125, 0.02610478550195694, 0.05313272774219513, 0.08016066998243332, 0.10718861222267151, 0.1342165470123291, 0.1612444967031479, 0.18827244639396667, 0.21530038118362427, 0.24232831597328186, 0.26935625076293945, 0.29638421535491943, 0.323412150144577, 0.3504400849342346, 0.3774680495262146, 0.4044959843158722, 0.4315239191055298, 0.4585518538951874, 0.48557978868484497, 0.512607753276825, 0.5396356582641602, 0.5666636228561401, 0.5936915874481201, 0.6207195520401001, 0.6477474570274353, 0.6747754216194153, 0.7018033266067505, 0.7288312911987305, 0.7558592557907104, 0.7828871607780457, 0.8099151253700256, 0.8369430303573608, 0.8639709949493408]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 6.0, 11.0, 16.0, 23.0, 44.0, 72.0, 160.0, 317.0, 807.0, 2650.0, 15186.0, 729545.0, 3420041.0, 20225.0, 3353.0, 966.0, 429.0, 190.0, 92.0, 45.0, 27.0, 32.0, 7.0, 7.0, 6.0, 8.0, 7.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43994140625, -0.42305755615234375, -0.4061737060546875, -0.38928985595703125, -0.372406005859375, -0.35552215576171875, -0.3386383056640625, -0.32175445556640625, -0.30487060546875, -0.28798675537109375, -0.2711029052734375, -0.25421905517578125, -0.237335205078125, -0.22045135498046875, -0.2035675048828125, -0.18668365478515625, -0.1697998046875, -0.15291595458984375, -0.1360321044921875, -0.11914825439453125, -0.102264404296875, -0.08538055419921875, -0.0684967041015625, -0.05161285400390625, -0.03472900390625, -0.01784515380859375, -0.0009613037109375, 0.01592254638671875, 0.032806396484375, 0.04969024658203125, 0.0665740966796875, 0.08345794677734375, 0.100341796875, 0.11722564697265625, 0.1341094970703125, 0.15099334716796875, 0.167877197265625, 0.18476104736328125, 0.2016448974609375, 0.21852874755859375, 0.23541259765625, 0.25229644775390625, 0.2691802978515625, 0.28606414794921875, 0.302947998046875, 0.31983184814453125, 0.3367156982421875, 0.35359954833984375, 0.3704833984375, 0.38736724853515625, 0.4042510986328125, 0.42113494873046875, 0.438018798828125, 0.45490264892578125, 0.4717864990234375, 0.48867034912109375, 0.50555419921875, 0.5224380493164062, 0.5393218994140625, 0.5562057495117188, 0.573089599609375, 0.5899734497070312, 0.6068572998046875, 0.6237411499023438, 0.640625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 6.0, 11.0, 8.0, 17.0, 34.0, 33.0, 60.0, 74.0, 81.0, 86.0, 97.0, 105.0, 80.0, 80.0, 50.0, 55.0, 40.0, 20.0, 15.0, 13.0, 6.0, 7.0, 2.0, 6.0, 4.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0219879150390625, -0.021027803421020508, -0.020067691802978516, -0.019107580184936523, -0.01814746856689453, -0.01718735694885254, -0.016227245330810547, -0.015267133712768555, -0.014307022094726562, -0.01334691047668457, -0.012386798858642578, -0.011426687240600586, -0.010466575622558594, -0.009506464004516602, -0.00854635238647461, -0.007586240768432617, -0.006626129150390625, -0.005666017532348633, -0.004705905914306641, -0.0037457942962646484, -0.0027856826782226562, -0.001825571060180664, -0.0008654594421386719, 9.465217590332031e-05, 0.0010547637939453125, 0.0020148754119873047, 0.002974987030029297, 0.003935098648071289, 0.004895210266113281, 0.0058553218841552734, 0.006815433502197266, 0.007775545120239258, 0.00873565673828125, 0.009695768356323242, 0.010655879974365234, 0.011615991592407227, 0.012576103210449219, 0.013536214828491211, 0.014496326446533203, 0.015456438064575195, 0.016416549682617188, 0.01737666130065918, 0.018336772918701172, 0.019296884536743164, 0.020256996154785156, 0.02121710777282715, 0.02217721939086914, 0.023137331008911133, 0.024097442626953125, 0.025057554244995117, 0.02601766586303711, 0.0269777774810791, 0.027937889099121094, 0.028898000717163086, 0.029858112335205078, 0.03081822395324707, 0.03177833557128906, 0.032738447189331055, 0.03369855880737305, 0.03465867042541504, 0.03561878204345703, 0.03657889366149902, 0.037539005279541016, 0.03849911689758301, 0.039459228515625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 2.0, 6.0, 7.0, 12.0, 9.0, 23.0, 27.0, 59.0, 110.0, 189.0, 373.0, 1002.0, 3164.0, 14934.0, 151110.0, 3778657.0, 220913.0, 18511.0, 3430.0, 961.0, 370.0, 183.0, 99.0, 67.0, 20.0, 12.0, 15.0, 10.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3955078125, -0.3857574462890625, -0.376007080078125, -0.3662567138671875, -0.35650634765625, -0.3467559814453125, -0.337005615234375, -0.3272552490234375, -0.3175048828125, -0.3077545166015625, -0.298004150390625, -0.2882537841796875, -0.27850341796875, -0.2687530517578125, -0.259002685546875, -0.2492523193359375, -0.239501953125, -0.2297515869140625, -0.220001220703125, -0.2102508544921875, -0.20050048828125, -0.1907501220703125, -0.180999755859375, -0.1712493896484375, -0.1614990234375, -0.1517486572265625, -0.141998291015625, -0.1322479248046875, -0.12249755859375, -0.1127471923828125, -0.102996826171875, -0.0932464599609375, -0.08349609375, -0.0737457275390625, -0.063995361328125, -0.0542449951171875, -0.04449462890625, -0.0347442626953125, -0.024993896484375, -0.0152435302734375, -0.0054931640625, 0.0042572021484375, 0.014007568359375, 0.0237579345703125, 0.03350830078125, 0.0432586669921875, 0.053009033203125, 0.0627593994140625, 0.072509765625, 0.0822601318359375, 0.092010498046875, 0.1017608642578125, 0.11151123046875, 0.1212615966796875, 0.131011962890625, 0.1407623291015625, 0.1505126953125, 0.1602630615234375, 0.170013427734375, 0.1797637939453125, 0.18951416015625, 0.1992645263671875, 0.209014892578125, 0.2187652587890625, 0.228515625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 8.0, 5.0, 8.0, 19.0, 19.0, 31.0, 39.0, 70.0, 93.0, 118.0, 190.0, 431.0, 1492.0, 754.0, 286.0, 167.0, 113.0, 76.0, 36.0, 32.0, 22.0, 18.0, 10.0, 9.0, 8.0, 4.0, 7.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053497314453125, -0.05211925506591797, -0.05074119567871094, -0.049363136291503906, -0.047985076904296875, -0.046607017517089844, -0.04522895812988281, -0.04385089874267578, -0.04247283935546875, -0.04109477996826172, -0.03971672058105469, -0.038338661193847656, -0.036960601806640625, -0.035582542419433594, -0.03420448303222656, -0.03282642364501953, -0.0314483642578125, -0.03007030487060547, -0.028692245483398438, -0.027314186096191406, -0.025936126708984375, -0.024558067321777344, -0.023180007934570312, -0.02180194854736328, -0.02042388916015625, -0.01904582977294922, -0.017667770385742188, -0.016289710998535156, -0.014911651611328125, -0.013533592224121094, -0.012155532836914062, -0.010777473449707031, -0.0093994140625, -0.008021354675292969, -0.0066432952880859375, -0.005265235900878906, -0.003887176513671875, -0.0025091171264648438, -0.0011310577392578125, 0.00024700164794921875, 0.00162506103515625, 0.0030031204223632812, 0.0043811798095703125, 0.005759239196777344, 0.007137298583984375, 0.008515357971191406, 0.009893417358398438, 0.011271476745605469, 0.0126495361328125, 0.014027595520019531, 0.015405654907226562, 0.016783714294433594, 0.018161773681640625, 0.019539833068847656, 0.020917892456054688, 0.02229595184326172, 0.02367401123046875, 0.02505207061767578, 0.026430130004882812, 0.027808189392089844, 0.029186248779296875, 0.030564308166503906, 0.03194236755371094, 0.03332042694091797, 0.034698486328125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 8.0, 19.0, 69.0, 267.0, 411.0, 174.0, 43.0, 14.0, 3.0, 1.0, 2.0], "bins": [-1.2653367519378662, -1.243304967880249, -1.2212731838226318, -1.1992413997650146, -1.1772096157073975, -1.1551779508590698, -1.1331461668014526, -1.1111143827438354, -1.0890825986862183, -1.067050814628601, -1.0450190305709839, -1.0229872465133667, -1.0009554624557495, -0.9789237380027771, -0.9568919539451599, -0.9348602294921875, -0.9128284454345703, -0.8907966613769531, -0.8687648773193359, -0.8467331528663635, -0.8247013688087463, -0.8026695847511292, -0.780637800693512, -0.7586060762405396, -0.7365742325782776, -0.7145424485206604, -0.6925106644630432, -0.6704789400100708, -0.6484471559524536, -0.6264153718948364, -0.6043835878372192, -0.582351803779602, -0.5603200793266296, -0.5382882952690125, -0.5162565112113953, -0.49422475695610046, -0.47219300270080566, -0.4501612186431885, -0.4281294345855713, -0.4060976803302765, -0.3840659260749817, -0.3620341420173645, -0.3400023877620697, -0.3179706037044525, -0.2959388494491577, -0.2739070653915405, -0.25187528133392334, -0.22984352707862854, -0.20781175792217255, -0.18577998876571655, -0.16374821960926056, -0.14171645045280457, -0.11968467384576797, -0.09765290468931198, -0.07562112808227539, -0.0535893589258194, -0.0315575897693634, -0.00952581875026226, 0.012505952268838882, 0.034537725150585175, 0.05656949430704117, 0.07860126346349716, 0.10063304007053375, 0.12266480922698975, 0.14469657838344574]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 5.0, 3.0, 3.0, 7.0, 11.0, 17.0, 15.0, 13.0, 19.0, 14.0, 25.0, 22.0, 24.0, 25.0, 35.0, 39.0, 42.0, 49.0, 58.0, 44.0, 48.0, 56.0, 58.0, 39.0, 36.0, 33.0, 37.0, 36.0, 26.0, 24.0, 23.0, 22.0, 17.0, 9.0, 16.0, 13.0, 10.0, 9.0, 7.0, 4.0, 2.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.16236263513565063, -0.15772852301597595, -0.15309441089630127, -0.1484602838754654, -0.1438261717557907, -0.13919205963611603, -0.13455794751644135, -0.12992383539676666, -0.1252897083759308, -0.1206555962562561, -0.11602147668600082, -0.11138736456632614, -0.10675324499607086, -0.10211913287639618, -0.0974850207567215, -0.09285090863704681, -0.08821679651737213, -0.08358268439769745, -0.07894856482744217, -0.07431445270776749, -0.06968033313751221, -0.06504622101783752, -0.06041210889816284, -0.05577799305319786, -0.05114387720823288, -0.0465097613632679, -0.04187564551830292, -0.037241533398628235, -0.032607417553663254, -0.027973301708698273, -0.02333918772637844, -0.01870507374405861, -0.014070957899093628, -0.009436842985451221, -0.004802728071808815, -0.00016861315816640854, 0.004465501755475998, 0.009099617600440979, 0.01373373158276081, 0.018367845565080643, 0.023001961410045624, 0.027636077255010605, 0.032270193099975586, 0.03690430521965027, 0.04153842106461525, 0.04617253690958023, 0.05080664902925491, 0.055440764874219894, 0.060074880719184875, 0.06470899283885956, 0.06934311240911484, 0.07397722452878952, 0.0786113440990448, 0.08324545621871948, 0.08787956833839417, 0.09251368045806885, 0.09714780002832413, 0.10178191214799881, 0.10641603171825409, 0.11105014383792877, 0.11568425595760345, 0.12031837552785873, 0.12495248764753342, 0.1295866072177887, 0.13422071933746338]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 6.0, 10.0, 14.0, 13.0, 20.0, 42.0, 70.0, 86.0, 125.0, 195.0, 348.0, 607.0, 1094.0, 2044.0, 4445.0, 10525.0, 32480.0, 117342.0, 402597.0, 339840.0, 92984.0, 26756.0, 9094.0, 3691.0, 1852.0, 925.0, 517.0, 280.0, 195.0, 114.0, 81.0, 47.0, 35.0, 27.0, 16.0, 11.0, 9.0, 7.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1422119140625, -0.13761138916015625, -0.1330108642578125, -0.12841033935546875, -0.123809814453125, -0.11920928955078125, -0.1146087646484375, -0.11000823974609375, -0.10540771484375, -0.10080718994140625, -0.0962066650390625, -0.09160614013671875, -0.087005615234375, -0.08240509033203125, -0.0778045654296875, -0.07320404052734375, -0.068603515625, -0.06400299072265625, -0.0594024658203125, -0.05480194091796875, -0.050201416015625, -0.04560089111328125, -0.0410003662109375, -0.03639984130859375, -0.03179931640625, -0.02719879150390625, -0.0225982666015625, -0.01799774169921875, -0.013397216796875, -0.00879669189453125, -0.0041961669921875, 0.00040435791015625, 0.0050048828125, 0.00960540771484375, 0.0142059326171875, 0.01880645751953125, 0.023406982421875, 0.02800750732421875, 0.0326080322265625, 0.03720855712890625, 0.04180908203125, 0.04640960693359375, 0.0510101318359375, 0.05561065673828125, 0.060211181640625, 0.06481170654296875, 0.0694122314453125, 0.07401275634765625, 0.07861328125, 0.08321380615234375, 0.0878143310546875, 0.09241485595703125, 0.097015380859375, 0.10161590576171875, 0.1062164306640625, 0.11081695556640625, 0.11541748046875, 0.12001800537109375, 0.1246185302734375, 0.12921905517578125, 0.133819580078125, 0.13842010498046875, 0.1430206298828125, 0.14762115478515625, 0.1522216796875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 1.0, 5.0, 7.0, 12.0, 21.0, 33.0, 30.0, 60.0, 78.0, 78.0, 88.0, 90.0, 81.0, 91.0, 96.0, 51.0, 39.0, 32.0, 32.0, 21.0, 14.0, 11.0, 7.0, 6.0, 6.0, 1.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0247039794921875, -0.023755311965942383, -0.022806644439697266, -0.02185797691345215, -0.02090930938720703, -0.019960641860961914, -0.019011974334716797, -0.01806330680847168, -0.017114639282226562, -0.016165971755981445, -0.015217304229736328, -0.014268636703491211, -0.013319969177246094, -0.012371301651000977, -0.01142263412475586, -0.010473966598510742, -0.009525299072265625, -0.008576631546020508, -0.007627964019775391, -0.0066792964935302734, -0.005730628967285156, -0.004781961441040039, -0.003833293914794922, -0.0028846263885498047, -0.0019359588623046875, -0.0009872913360595703, -3.8623809814453125e-05, 0.0009100437164306641, 0.0018587112426757812, 0.0028073787689208984, 0.0037560462951660156, 0.004704713821411133, 0.00565338134765625, 0.006602048873901367, 0.007550716400146484, 0.008499383926391602, 0.009448051452636719, 0.010396718978881836, 0.011345386505126953, 0.01229405403137207, 0.013242721557617188, 0.014191389083862305, 0.015140056610107422, 0.01608872413635254, 0.017037391662597656, 0.017986059188842773, 0.01893472671508789, 0.019883394241333008, 0.020832061767578125, 0.021780729293823242, 0.02272939682006836, 0.023678064346313477, 0.024626731872558594, 0.02557539939880371, 0.026524066925048828, 0.027472734451293945, 0.028421401977539062, 0.02937006950378418, 0.030318737030029297, 0.031267404556274414, 0.03221607208251953, 0.03316473960876465, 0.034113407135009766, 0.03506207466125488, 0.0360107421875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 8.0, 10.0, 11.0, 15.0, 11.0, 29.0, 53.0, 83.0, 121.0, 177.0, 278.0, 426.0, 710.0, 1571.0, 4103.0, 15542.0, 82017.0, 456111.0, 397578.0, 69010.0, 13628.0, 3744.0, 1425.0, 706.0, 409.0, 256.0, 154.0, 125.0, 80.0, 42.0, 38.0, 22.0, 20.0, 10.0, 6.0, 10.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1727294921875, -0.1665496826171875, -0.160369873046875, -0.1541900634765625, -0.14801025390625, -0.1418304443359375, -0.135650634765625, -0.1294708251953125, -0.123291015625, -0.1171112060546875, -0.110931396484375, -0.1047515869140625, -0.09857177734375, -0.0923919677734375, -0.086212158203125, -0.0800323486328125, -0.0738525390625, -0.0676727294921875, -0.061492919921875, -0.0553131103515625, -0.04913330078125, -0.0429534912109375, -0.036773681640625, -0.0305938720703125, -0.0244140625, -0.0182342529296875, -0.012054443359375, -0.0058746337890625, 0.00030517578125, 0.0064849853515625, 0.012664794921875, 0.0188446044921875, 0.0250244140625, 0.0312042236328125, 0.037384033203125, 0.0435638427734375, 0.04974365234375, 0.0559234619140625, 0.062103271484375, 0.0682830810546875, 0.074462890625, 0.0806427001953125, 0.086822509765625, 0.0930023193359375, 0.09918212890625, 0.1053619384765625, 0.111541748046875, 0.1177215576171875, 0.1239013671875, 0.1300811767578125, 0.136260986328125, 0.1424407958984375, 0.14862060546875, 0.1548004150390625, 0.160980224609375, 0.1671600341796875, 0.17333984375, 0.1795196533203125, 0.185699462890625, 0.1918792724609375, 0.19805908203125, 0.2042388916015625, 0.210418701171875, 0.2165985107421875, 0.2227783203125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 8.0, 0.0, 4.0, 7.0, 5.0, 11.0, 11.0, 14.0, 17.0, 18.0, 24.0, 25.0, 24.0, 31.0, 28.0, 33.0, 37.0, 47.0, 46.0, 48.0, 48.0, 46.0, 55.0, 43.0, 55.0, 30.0, 35.0, 33.0, 31.0, 37.0, 20.0, 25.0, 15.0, 16.0, 19.0, 10.0, 12.0, 10.0, 5.0, 11.0, 4.0, 0.0, 3.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.105712890625, -0.1022186279296875, -0.098724365234375, -0.0952301025390625, -0.09173583984375, -0.0882415771484375, -0.084747314453125, -0.0812530517578125, -0.0777587890625, -0.0742645263671875, -0.070770263671875, -0.0672760009765625, -0.06378173828125, -0.0602874755859375, -0.056793212890625, -0.0532989501953125, -0.0498046875, -0.0463104248046875, -0.042816162109375, -0.0393218994140625, -0.03582763671875, -0.0323333740234375, -0.028839111328125, -0.0253448486328125, -0.0218505859375, -0.0183563232421875, -0.014862060546875, -0.0113677978515625, -0.00787353515625, -0.0043792724609375, -0.000885009765625, 0.0026092529296875, 0.006103515625, 0.0095977783203125, 0.013092041015625, 0.0165863037109375, 0.02008056640625, 0.0235748291015625, 0.027069091796875, 0.0305633544921875, 0.0340576171875, 0.0375518798828125, 0.041046142578125, 0.0445404052734375, 0.04803466796875, 0.0515289306640625, 0.055023193359375, 0.0585174560546875, 0.06201171875, 0.0655059814453125, 0.069000244140625, 0.0724945068359375, 0.07598876953125, 0.0794830322265625, 0.082977294921875, 0.0864715576171875, 0.0899658203125, 0.0934600830078125, 0.096954345703125, 0.1004486083984375, 0.10394287109375, 0.1074371337890625, 0.110931396484375, 0.1144256591796875, 0.117919921875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 4.0, 6.0, 12.0, 14.0, 16.0, 23.0, 52.0, 80.0, 125.0, 175.0, 259.0, 505.0, 893.0, 1627.0, 3148.0, 6202.0, 14028.0, 33621.0, 91838.0, 308287.0, 392924.0, 119879.0, 42142.0, 17073.0, 7556.0, 3699.0, 1870.0, 1020.0, 553.0, 357.0, 214.0, 129.0, 73.0, 56.0, 20.0, 25.0, 19.0, 13.0, 9.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06939697265625, -0.0670928955078125, -0.064788818359375, -0.0624847412109375, -0.0601806640625, -0.0578765869140625, -0.055572509765625, -0.0532684326171875, -0.05096435546875, -0.0486602783203125, -0.046356201171875, -0.0440521240234375, -0.041748046875, -0.0394439697265625, -0.037139892578125, -0.0348358154296875, -0.03253173828125, -0.0302276611328125, -0.027923583984375, -0.0256195068359375, -0.0233154296875, -0.0210113525390625, -0.018707275390625, -0.0164031982421875, -0.01409912109375, -0.0117950439453125, -0.009490966796875, -0.0071868896484375, -0.0048828125, -0.0025787353515625, -0.000274658203125, 0.0020294189453125, 0.00433349609375, 0.0066375732421875, 0.008941650390625, 0.0112457275390625, 0.0135498046875, 0.0158538818359375, 0.018157958984375, 0.0204620361328125, 0.02276611328125, 0.0250701904296875, 0.027374267578125, 0.0296783447265625, 0.031982421875, 0.0342864990234375, 0.036590576171875, 0.0388946533203125, 0.04119873046875, 0.0435028076171875, 0.045806884765625, 0.0481109619140625, 0.0504150390625, 0.0527191162109375, 0.055023193359375, 0.0573272705078125, 0.05963134765625, 0.0619354248046875, 0.064239501953125, 0.0665435791015625, 0.06884765625, 0.0711517333984375, 0.073455810546875, 0.0757598876953125, 0.07806396484375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 11.0, 13.0, 18.0, 41.0, 72.0, 74.0, 88.0, 123.0, 141.0, 93.0, 84.0, 76.0, 47.0, 42.0, 22.0, 11.0, 9.0, 8.0, 5.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.465217590332031e-05, -9.172502905130386e-05, -8.879788219928741e-05, -8.587073534727097e-05, -8.294358849525452e-05, -8.001644164323807e-05, -7.708929479122162e-05, -7.416214793920517e-05, -7.123500108718872e-05, -6.830785423517227e-05, -6.538070738315582e-05, -6.245356053113937e-05, -5.9526413679122925e-05, -5.6599266827106476e-05, -5.367211997509003e-05, -5.074497312307358e-05, -4.781782627105713e-05, -4.489067941904068e-05, -4.196353256702423e-05, -3.903638571500778e-05, -3.610923886299133e-05, -3.3182092010974884e-05, -3.0254945158958435e-05, -2.7327798306941986e-05, -2.4400651454925537e-05, -2.1473504602909088e-05, -1.854635775089264e-05, -1.561921089887619e-05, -1.2692064046859741e-05, -9.764917194843292e-06, -6.837770342826843e-06, -3.910623490810394e-06, -9.834766387939453e-07, 1.9436702132225037e-06, 4.870817065238953e-06, 7.797963917255402e-06, 1.072511076927185e-05, 1.36522576212883e-05, 1.657940447330475e-05, 1.9506551325321198e-05, 2.2433698177337646e-05, 2.5360845029354095e-05, 2.8287991881370544e-05, 3.1215138733386993e-05, 3.414228558540344e-05, 3.706943243741989e-05, 3.999657928943634e-05, 4.292372614145279e-05, 4.585087299346924e-05, 4.877801984548569e-05, 5.1705166697502136e-05, 5.4632313549518585e-05, 5.7559460401535034e-05, 6.048660725355148e-05, 6.341375410556793e-05, 6.634090095758438e-05, 6.926804780960083e-05, 7.219519466161728e-05, 7.512234151363373e-05, 7.804948836565018e-05, 8.097663521766663e-05, 8.390378206968307e-05, 8.683092892169952e-05, 8.975807577371597e-05, 9.268522262573242e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 8.0, 16.0, 13.0, 20.0, 31.0, 37.0, 42.0, 83.0, 110.0, 183.0, 291.0, 476.0, 840.0, 1809.0, 4367.0, 13768.0, 54590.0, 311771.0, 541155.0, 87177.0, 20869.0, 6021.0, 2305.0, 1017.0, 573.0, 343.0, 193.0, 138.0, 83.0, 43.0, 41.0, 38.0, 22.0, 19.0, 11.0, 6.0, 6.0, 8.0, 3.0, 6.0, 4.0, 4.0, 0.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.1197509765625, -0.1160268783569336, -0.11230278015136719, -0.10857868194580078, -0.10485458374023438, -0.10113048553466797, -0.09740638732910156, -0.09368228912353516, -0.08995819091796875, -0.08623409271240234, -0.08250999450683594, -0.07878589630126953, -0.07506179809570312, -0.07133769989013672, -0.06761360168457031, -0.0638895034790039, -0.0601654052734375, -0.056441307067871094, -0.05271720886230469, -0.04899311065673828, -0.045269012451171875, -0.04154491424560547, -0.03782081604003906, -0.034096717834472656, -0.03037261962890625, -0.026648521423339844, -0.022924423217773438, -0.01920032501220703, -0.015476226806640625, -0.011752128601074219, -0.008028030395507812, -0.004303932189941406, -0.000579833984375, 0.0031442642211914062, 0.0068683624267578125, 0.010592460632324219, 0.014316558837890625, 0.01804065704345703, 0.021764755249023438, 0.025488853454589844, 0.02921295166015625, 0.032937049865722656, 0.03666114807128906, 0.04038524627685547, 0.044109344482421875, 0.04783344268798828, 0.05155754089355469, 0.055281639099121094, 0.0590057373046875, 0.0627298355102539, 0.06645393371582031, 0.07017803192138672, 0.07390213012695312, 0.07762622833251953, 0.08135032653808594, 0.08507442474365234, 0.08879852294921875, 0.09252262115478516, 0.09624671936035156, 0.09997081756591797, 0.10369491577148438, 0.10741901397705078, 0.11114311218261719, 0.1148672103881836, 0.11859130859375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 4.0, 4.0, 10.0, 7.0, 19.0, 12.0, 12.0, 26.0, 34.0, 28.0, 46.0, 63.0, 106.0, 89.0, 107.0, 100.0, 65.0, 62.0, 44.0, 30.0, 27.0, 22.0, 19.0, 12.0, 14.0, 5.0, 7.0, 7.0, 4.0, 4.0, 3.0, 0.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0689697265625, -0.06684303283691406, -0.06471633911132812, -0.06258964538574219, -0.06046295166015625, -0.05833625793457031, -0.056209564208984375, -0.05408287048339844, -0.0519561767578125, -0.04982948303222656, -0.047702789306640625, -0.04557609558105469, -0.04344940185546875, -0.04132270812988281, -0.039196014404296875, -0.03706932067871094, -0.034942626953125, -0.03281593322753906, -0.030689239501953125, -0.028562545776367188, -0.02643585205078125, -0.024309158325195312, -0.022182464599609375, -0.020055770874023438, -0.0179290771484375, -0.015802383422851562, -0.013675689697265625, -0.011548995971679688, -0.00942230224609375, -0.0072956085205078125, -0.005168914794921875, -0.0030422210693359375, -0.00091552734375, 0.0012111663818359375, 0.003337860107421875, 0.0054645538330078125, 0.00759124755859375, 0.009717941284179688, 0.011844635009765625, 0.013971328735351562, 0.0160980224609375, 0.018224716186523438, 0.020351409912109375, 0.022478103637695312, 0.02460479736328125, 0.026731491088867188, 0.028858184814453125, 0.030984878540039062, 0.033111572265625, 0.03523826599121094, 0.037364959716796875, 0.03949165344238281, 0.04161834716796875, 0.04374504089355469, 0.045871734619140625, 0.04799842834472656, 0.0501251220703125, 0.05225181579589844, 0.054378509521484375, 0.05650520324707031, 0.05863189697265625, 0.06075859069824219, 0.06288528442382812, 0.06501197814941406, 0.067138671875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 6.0, 5.0, 6.0, 11.0, 23.0, 35.0, 57.0, 87.0, 136.0, 166.0, 174.0, 118.0, 82.0, 38.0, 20.0, 13.0, 8.0, 8.0, 5.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2780095338821411, -1.2444459199905396, -1.210882306098938, -1.1773186922073364, -1.1437550783157349, -1.1101914644241333, -1.0766278505325317, -1.0430642366409302, -1.0095006227493286, -0.975937008857727, -0.9423733949661255, -0.9088097810745239, -0.8752461671829224, -0.8416825532913208, -0.8081189393997192, -0.7745553255081177, -0.7409917116165161, -0.7074280977249146, -0.673864483833313, -0.6403008699417114, -0.6067372560501099, -0.5731736421585083, -0.5396100282669067, -0.5060464143753052, -0.4724828004837036, -0.43891918659210205, -0.4053555727005005, -0.3717919588088989, -0.33822834491729736, -0.3046647310256958, -0.27110111713409424, -0.23753750324249268, -0.2039739489555359, -0.17041033506393433, -0.13684672117233276, -0.1032831072807312, -0.06971949338912964, -0.036155879497528076, -0.0025922656059265137, 0.03097134828567505, 0.06453496217727661, 0.09809857606887817, 0.13166218996047974, 0.1652258038520813, 0.19878941774368286, 0.23235303163528442, 0.265916645526886, 0.29948025941848755, 0.3330438733100891, 0.3666074872016907, 0.40017110109329224, 0.4337347149848938, 0.46729832887649536, 0.5008619427680969, 0.5344255566596985, 0.5679891705513, 0.6015527844429016, 0.6351163983345032, 0.6686800122261047, 0.7022436261177063, 0.7358072400093079, 0.7693708539009094, 0.802934467792511, 0.8364980816841125, 0.8700616955757141]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 5.0, 7.0, 5.0, 11.0, 13.0, 11.0, 13.0, 21.0, 24.0, 24.0, 17.0, 35.0, 29.0, 34.0, 39.0, 45.0, 43.0, 45.0, 46.0, 42.0, 38.0, 49.0, 37.0, 37.0, 35.0, 35.0, 29.0, 38.0, 22.0, 18.0, 21.0, 25.0, 21.0, 11.0, 10.0, 12.0, 9.0, 10.0, 6.0, 4.0, 2.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6594053506851196, -0.6379721164703369, -0.6165388822555542, -0.5951056480407715, -0.5736724138259888, -0.552239179611206, -0.5308059453964233, -0.5093727111816406, -0.4879395067691803, -0.4665062725543976, -0.44507303833961487, -0.42363983392715454, -0.4022065997123718, -0.3807733654975891, -0.3593401312828064, -0.3379068970680237, -0.31647366285324097, -0.29504042863845825, -0.27360719442367554, -0.2521739602088928, -0.2307407408952713, -0.2093075066804886, -0.18787428736686707, -0.16644105315208435, -0.14500781893730164, -0.12357458472251892, -0.1021413579583168, -0.08070813119411469, -0.05927489697933197, -0.037841662764549255, -0.016408443450927734, 0.0050247907638549805, 0.02645808458328247, 0.04789131507277489, 0.0693245455622673, 0.09075777232646942, 0.11219100654125214, 0.13362424075603485, 0.15505746006965637, 0.1764906942844391, 0.1979239284992218, 0.21935716271400452, 0.24079039692878723, 0.26222360134124756, 0.2836568355560303, 0.305090069770813, 0.3265233039855957, 0.3479565382003784, 0.36938977241516113, 0.39082300662994385, 0.41225624084472656, 0.4336894750595093, 0.455122709274292, 0.4765559434890747, 0.49798914790153503, 0.5194224119186401, 0.5408556461334229, 0.5622888803482056, 0.5837221145629883, 0.605155348777771, 0.6265885829925537, 0.6480218172073364, 0.6694550514221191, 0.6908882856369019, 0.7123214602470398]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 13.0, 12.0, 15.0, 30.0, 45.0, 62.0, 99.0, 155.0, 192.0, 378.0, 630.0, 1106.0, 2273.0, 5360.0, 15761.0, 70049.0, 2651013.0, 1354962.0, 65962.0, 15461.0, 5448.0, 2368.0, 1180.0, 578.0, 397.0, 232.0, 154.0, 103.0, 68.0, 57.0, 28.0, 17.0, 16.0, 16.0, 11.0, 11.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.196533203125, -0.19038772583007812, -0.18424224853515625, -0.17809677124023438, -0.1719512939453125, -0.16580581665039062, -0.15966033935546875, -0.15351486206054688, -0.147369384765625, -0.14122390747070312, -0.13507843017578125, -0.12893295288085938, -0.1227874755859375, -0.11664199829101562, -0.11049652099609375, -0.10435104370117188, -0.09820556640625, -0.09206008911132812, -0.08591461181640625, -0.07976913452148438, -0.0736236572265625, -0.06747817993164062, -0.06133270263671875, -0.055187225341796875, -0.049041748046875, -0.042896270751953125, -0.03675079345703125, -0.030605316162109375, -0.0244598388671875, -0.018314361572265625, -0.01216888427734375, -0.006023406982421875, 0.0001220703125, 0.006267547607421875, 0.01241302490234375, 0.018558502197265625, 0.0247039794921875, 0.030849456787109375, 0.03699493408203125, 0.043140411376953125, 0.049285888671875, 0.055431365966796875, 0.06157684326171875, 0.06772232055664062, 0.0738677978515625, 0.08001327514648438, 0.08615875244140625, 0.09230422973632812, 0.09844970703125, 0.10459518432617188, 0.11074066162109375, 0.11688613891601562, 0.1230316162109375, 0.12917709350585938, 0.13532257080078125, 0.14146804809570312, 0.147613525390625, 0.15375900268554688, 0.15990447998046875, 0.16604995727539062, 0.1721954345703125, 0.17834091186523438, 0.18448638916015625, 0.19063186645507812, 0.19677734375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 6.0, 11.0, 11.0, 10.0, 19.0, 23.0, 34.0, 32.0, 49.0, 43.0, 57.0, 62.0, 62.0, 75.0, 64.0, 72.0, 64.0, 65.0, 49.0, 38.0, 35.0, 25.0, 21.0, 19.0, 11.0, 6.0, 15.0, 5.0, 8.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0238037109375, -0.02289104461669922, -0.021978378295898438, -0.021065711975097656, -0.020153045654296875, -0.019240379333496094, -0.018327713012695312, -0.01741504669189453, -0.01650238037109375, -0.015589714050292969, -0.014677047729492188, -0.013764381408691406, -0.012851715087890625, -0.011939048767089844, -0.011026382446289062, -0.010113716125488281, -0.0092010498046875, -0.008288383483886719, -0.0073757171630859375, -0.006463050842285156, -0.005550384521484375, -0.004637718200683594, -0.0037250518798828125, -0.0028123855590820312, -0.00189971923828125, -0.0009870529174804688, -7.43865966796875e-05, 0.0008382797241210938, 0.001750946044921875, 0.0026636123657226562, 0.0035762786865234375, 0.004488945007324219, 0.005401611328125, 0.006314277648925781, 0.0072269439697265625, 0.008139610290527344, 0.009052276611328125, 0.009964942932128906, 0.010877609252929688, 0.011790275573730469, 0.01270294189453125, 0.013615608215332031, 0.014528274536132812, 0.015440940856933594, 0.016353607177734375, 0.017266273498535156, 0.018178939819335938, 0.01909160614013672, 0.0200042724609375, 0.02091693878173828, 0.021829605102539062, 0.022742271423339844, 0.023654937744140625, 0.024567604064941406, 0.025480270385742188, 0.02639293670654297, 0.02730560302734375, 0.02821826934814453, 0.029130935668945312, 0.030043601989746094, 0.030956268310546875, 0.031868934631347656, 0.03278160095214844, 0.03369426727294922, 0.03460693359375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 7.0, 9.0, 6.0, 12.0, 25.0, 35.0, 59.0, 96.0, 153.0, 284.0, 517.0, 1005.0, 2167.0, 5221.0, 14986.0, 54312.0, 354763.0, 3409758.0, 280800.0, 46965.0, 13575.0, 5039.0, 2142.0, 1048.0, 540.0, 291.0, 159.0, 90.0, 79.0, 38.0, 23.0, 22.0, 13.0, 11.0, 8.0, 7.0, 8.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1531982421875, -0.14832687377929688, -0.14345550537109375, -0.13858413696289062, -0.1337127685546875, -0.12884140014648438, -0.12397003173828125, -0.11909866333007812, -0.114227294921875, -0.10935592651367188, -0.10448455810546875, -0.09961318969726562, -0.0947418212890625, -0.08987045288085938, -0.08499908447265625, -0.08012771606445312, -0.07525634765625, -0.07038497924804688, -0.06551361083984375, -0.060642242431640625, -0.0557708740234375, -0.050899505615234375, -0.04602813720703125, -0.041156768798828125, -0.036285400390625, -0.031414031982421875, -0.02654266357421875, -0.021671295166015625, -0.0167999267578125, -0.011928558349609375, -0.00705718994140625, -0.002185821533203125, 0.002685546875, 0.007556915283203125, 0.01242828369140625, 0.017299652099609375, 0.0221710205078125, 0.027042388916015625, 0.03191375732421875, 0.036785125732421875, 0.041656494140625, 0.046527862548828125, 0.05139923095703125, 0.056270599365234375, 0.0611419677734375, 0.06601333618164062, 0.07088470458984375, 0.07575607299804688, 0.08062744140625, 0.08549880981445312, 0.09037017822265625, 0.09524154663085938, 0.1001129150390625, 0.10498428344726562, 0.10985565185546875, 0.11472702026367188, 0.119598388671875, 0.12446975708007812, 0.12934112548828125, 0.13421249389648438, 0.1390838623046875, 0.14395523071289062, 0.14882659912109375, 0.15369796752929688, 0.1585693359375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 1.0, 5.0, 10.0, 17.0, 26.0, 25.0, 37.0, 59.0, 82.0, 118.0, 183.0, 424.0, 1514.0, 763.0, 300.0, 181.0, 90.0, 58.0, 42.0, 24.0, 22.0, 22.0, 19.0, 8.0, 12.0, 7.0, 2.0, 5.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035430908203125, -0.03410625457763672, -0.03278160095214844, -0.031456947326660156, -0.030132293701171875, -0.028807640075683594, -0.027482986450195312, -0.02615833282470703, -0.02483367919921875, -0.02350902557373047, -0.022184371948242188, -0.020859718322753906, -0.019535064697265625, -0.018210411071777344, -0.016885757446289062, -0.015561103820800781, -0.0142364501953125, -0.012911796569824219, -0.011587142944335938, -0.010262489318847656, -0.008937835693359375, -0.007613182067871094, -0.0062885284423828125, -0.004963874816894531, -0.00363922119140625, -0.0023145675659179688, -0.0009899139404296875, 0.00033473968505859375, 0.001659393310546875, 0.0029840469360351562, 0.0043087005615234375, 0.005633354187011719, 0.0069580078125, 0.008282661437988281, 0.009607315063476562, 0.010931968688964844, 0.012256622314453125, 0.013581275939941406, 0.014905929565429688, 0.01623058319091797, 0.01755523681640625, 0.01887989044189453, 0.020204544067382812, 0.021529197692871094, 0.022853851318359375, 0.024178504943847656, 0.025503158569335938, 0.02682781219482422, 0.0281524658203125, 0.02947711944580078, 0.030801773071289062, 0.032126426696777344, 0.033451080322265625, 0.034775733947753906, 0.03610038757324219, 0.03742504119873047, 0.03874969482421875, 0.04007434844970703, 0.04139900207519531, 0.042723655700683594, 0.044048309326171875, 0.045372962951660156, 0.04669761657714844, 0.04802227020263672, 0.049346923828125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 8.0, 16.0, 64.0, 295.0, 434.0, 148.0, 39.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5539562702178955, -0.5278787016868591, -0.5018011927604675, -0.47572362422943115, -0.4496460556983948, -0.4235685169696808, -0.3974909782409668, -0.3714134097099304, -0.34533587098121643, -0.31925833225250244, -0.29318076372146606, -0.2671032249927521, -0.2410256713628769, -0.2149481177330017, -0.18887057900428772, -0.16279302537441254, -0.13671547174453735, -0.11063791811466217, -0.08456037193536758, -0.058482825756073, -0.032405272126197815, -0.006327718496322632, 0.019749820232391357, 0.04582737386226654, 0.07190492749214172, 0.0979824811220169, 0.12406002730131149, 0.15013757348060608, 0.17621512711048126, 0.20229268074035645, 0.22837021946907043, 0.2544477581977844, 0.2805253267288208, 0.3066028654575348, 0.33268043398857117, 0.35875797271728516, 0.38483554124832153, 0.4109130799770355, 0.4369906187057495, 0.4630681872367859, 0.4891457259654999, 0.5152232646942139, 0.5413008332252502, 0.5673784017562866, 0.5934559106826782, 0.6195334792137146, 0.645611047744751, 0.6716885566711426, 0.697766125202179, 0.7238436937332153, 0.7499212026596069, 0.7759987711906433, 0.8020763397216797, 0.8281538486480713, 0.8542314171791077, 0.880308985710144, 0.9063864946365356, 0.932464063167572, 0.9585415720939636, 0.984619140625, 1.0106966495513916, 1.0367742776870728, 1.0628517866134644, 1.088929295539856, 1.115006923675537]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 3.0, 7.0, 7.0, 9.0, 17.0, 16.0, 18.0, 25.0, 18.0, 12.0, 35.0, 39.0, 29.0, 36.0, 40.0, 52.0, 59.0, 48.0, 57.0, 46.0, 47.0, 51.0, 45.0, 44.0, 41.0, 29.0, 28.0, 26.0, 27.0, 22.0, 17.0, 12.0, 11.0, 10.0, 6.0, 8.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15133535861968994, -0.1461365967988968, -0.14093783497810364, -0.1357390582561493, -0.13054029643535614, -0.125341534614563, -0.12014277279376984, -0.11494401097297668, -0.10974524170160294, -0.10454647988080978, -0.09934771060943604, -0.09414894878864288, -0.08895018696784973, -0.08375141769647598, -0.07855265587568283, -0.07335388660430908, -0.06815512478351593, -0.06295636296272278, -0.05775759369134903, -0.05255883187055588, -0.04736006632447243, -0.04216130077838898, -0.036962538957595825, -0.031763773411512375, -0.026565007865428925, -0.021366242319345474, -0.016167478635907173, -0.010968714021146297, -0.005769949406385422, -0.0005711838603019714, 0.00462757982313633, 0.00982634350657463, 0.015025109052658081, 0.02022387459874153, 0.025422638282179832, 0.030621401965618134, 0.035820167511701584, 0.041018933057785034, 0.046217694878578186, 0.051416460424661636, 0.05661522597074509, 0.06181399151682854, 0.06701275706291199, 0.07221151888370514, 0.07741028070449829, 0.08260904997587204, 0.08780781179666519, 0.09300658106803894, 0.09820534288883209, 0.10340410470962524, 0.10860287398099899, 0.11380163580179214, 0.1190004050731659, 0.12419916689395905, 0.1293979287147522, 0.13459669053554535, 0.1397954523563385, 0.14499421417713165, 0.1501929759979248, 0.15539175271987915, 0.1605905145406723, 0.16578927636146545, 0.1709880381822586, 0.17618680000305176, 0.1813855767250061]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 6.0, 9.0, 13.0, 26.0, 37.0, 47.0, 49.0, 91.0, 139.0, 192.0, 271.0, 471.0, 710.0, 1170.0, 1929.0, 3364.0, 6255.0, 11652.0, 23011.0, 46273.0, 98074.0, 202375.0, 299399.0, 181019.0, 86797.0, 41144.0, 20205.0, 10296.0, 5588.0, 3198.0, 1743.0, 1106.0, 668.0, 385.0, 258.0, 173.0, 119.0, 95.0, 55.0, 41.0, 31.0, 19.0, 15.0, 17.0, 9.0, 3.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0789794921875, -0.07646560668945312, -0.07395172119140625, -0.07143783569335938, -0.0689239501953125, -0.06641006469726562, -0.06389617919921875, -0.061382293701171875, -0.058868408203125, -0.056354522705078125, -0.05384063720703125, -0.051326751708984375, -0.0488128662109375, -0.046298980712890625, -0.04378509521484375, -0.041271209716796875, -0.03875732421875, -0.036243438720703125, -0.03372955322265625, -0.031215667724609375, -0.0287017822265625, -0.026187896728515625, -0.02367401123046875, -0.021160125732421875, -0.018646240234375, -0.016132354736328125, -0.01361846923828125, -0.011104583740234375, -0.0085906982421875, -0.006076812744140625, -0.00356292724609375, -0.001049041748046875, 0.00146484375, 0.003978729248046875, 0.00649261474609375, 0.009006500244140625, 0.0115203857421875, 0.014034271240234375, 0.01654815673828125, 0.019062042236328125, 0.021575927734375, 0.024089813232421875, 0.02660369873046875, 0.029117584228515625, 0.0316314697265625, 0.034145355224609375, 0.03665924072265625, 0.039173126220703125, 0.04168701171875, 0.044200897216796875, 0.04671478271484375, 0.049228668212890625, 0.0517425537109375, 0.054256439208984375, 0.05677032470703125, 0.059284210205078125, 0.061798095703125, 0.06431198120117188, 0.06682586669921875, 0.06933975219726562, 0.0718536376953125, 0.07436752319335938, 0.07688140869140625, 0.07939529418945312, 0.0819091796875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 9.0, 11.0, 15.0, 15.0, 15.0, 13.0, 29.0, 34.0, 43.0, 42.0, 53.0, 64.0, 56.0, 63.0, 67.0, 66.0, 57.0, 43.0, 71.0, 43.0, 35.0, 38.0, 23.0, 17.0, 11.0, 13.0, 14.0, 9.0, 9.0, 5.0, 5.0, 0.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0227203369140625, -0.021863698959350586, -0.021007061004638672, -0.020150423049926758, -0.019293785095214844, -0.01843714714050293, -0.017580509185791016, -0.0167238712310791, -0.015867233276367188, -0.015010595321655273, -0.01415395736694336, -0.013297319412231445, -0.012440681457519531, -0.011584043502807617, -0.010727405548095703, -0.009870767593383789, -0.009014129638671875, -0.008157491683959961, -0.007300853729248047, -0.006444215774536133, -0.005587577819824219, -0.004730939865112305, -0.0038743019104003906, -0.0030176639556884766, -0.0021610260009765625, -0.0013043880462646484, -0.0004477500915527344, 0.0004088878631591797, 0.0012655258178710938, 0.002122163772583008, 0.002978801727294922, 0.003835439682006836, 0.00469207763671875, 0.005548715591430664, 0.006405353546142578, 0.007261991500854492, 0.008118629455566406, 0.00897526741027832, 0.009831905364990234, 0.010688543319702148, 0.011545181274414062, 0.012401819229125977, 0.01325845718383789, 0.014115095138549805, 0.014971733093261719, 0.015828371047973633, 0.016685009002685547, 0.01754164695739746, 0.018398284912109375, 0.01925492286682129, 0.020111560821533203, 0.020968198776245117, 0.02182483673095703, 0.022681474685668945, 0.02353811264038086, 0.024394750595092773, 0.025251388549804688, 0.0261080265045166, 0.026964664459228516, 0.02782130241394043, 0.028677940368652344, 0.029534578323364258, 0.030391216278076172, 0.031247854232788086, 0.0321044921875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 4.0, 3.0, 6.0, 8.0, 10.0, 19.0, 26.0, 28.0, 38.0, 69.0, 86.0, 114.0, 149.0, 243.0, 330.0, 534.0, 936.0, 1629.0, 3729.0, 9606.0, 30429.0, 110373.0, 366191.0, 365029.0, 110905.0, 30372.0, 9702.0, 3711.0, 1732.0, 885.0, 553.0, 330.0, 214.0, 174.0, 110.0, 75.0, 65.0, 33.0, 28.0, 22.0, 21.0, 8.0, 8.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.122802734375, -0.11908149719238281, -0.11536026000976562, -0.11163902282714844, -0.10791778564453125, -0.10419654846191406, -0.10047531127929688, -0.09675407409667969, -0.0930328369140625, -0.08931159973144531, -0.08559036254882812, -0.08186912536621094, -0.07814788818359375, -0.07442665100097656, -0.07070541381835938, -0.06698417663574219, -0.063262939453125, -0.05954170227050781, -0.055820465087890625, -0.05209922790527344, -0.04837799072265625, -0.04465675354003906, -0.040935516357421875, -0.03721427917480469, -0.0334930419921875, -0.029771804809570312, -0.026050567626953125, -0.022329330444335938, -0.01860809326171875, -0.014886856079101562, -0.011165618896484375, -0.0074443817138671875, -0.00372314453125, -1.9073486328125e-06, 0.003719329833984375, 0.0074405670166015625, 0.01116180419921875, 0.014883041381835938, 0.018604278564453125, 0.022325515747070312, 0.0260467529296875, 0.029767990112304688, 0.033489227294921875, 0.03721046447753906, 0.04093170166015625, 0.04465293884277344, 0.048374176025390625, 0.05209541320800781, 0.055816650390625, 0.05953788757324219, 0.06325912475585938, 0.06698036193847656, 0.07070159912109375, 0.07442283630371094, 0.07814407348632812, 0.08186531066894531, 0.0855865478515625, 0.08930778503417969, 0.09302902221679688, 0.09675025939941406, 0.10047149658203125, 0.10419273376464844, 0.10791397094726562, 0.11163520812988281, 0.1153564453125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 1.0, 2.0, 7.0, 8.0, 12.0, 13.0, 14.0, 13.0, 12.0, 33.0, 28.0, 32.0, 29.0, 40.0, 38.0, 48.0, 57.0, 45.0, 54.0, 51.0, 55.0, 50.0, 47.0, 43.0, 38.0, 32.0, 33.0, 37.0, 21.0, 24.0, 16.0, 14.0, 13.0, 11.0, 5.0, 4.0, 7.0, 3.0, 4.0, 1.0, 6.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1390380859375, -0.13510990142822266, -0.1311817169189453, -0.12725353240966797, -0.12332534790039062, -0.11939716339111328, -0.11546897888183594, -0.1115407943725586, -0.10761260986328125, -0.1036844253540039, -0.09975624084472656, -0.09582805633544922, -0.09189987182617188, -0.08797168731689453, -0.08404350280761719, -0.08011531829833984, -0.0761871337890625, -0.07225894927978516, -0.06833076477050781, -0.06440258026123047, -0.060474395751953125, -0.05654621124267578, -0.05261802673339844, -0.048689842224121094, -0.04476165771484375, -0.040833473205566406, -0.03690528869628906, -0.03297710418701172, -0.029048919677734375, -0.02512073516845703, -0.021192550659179688, -0.017264366149902344, -0.013336181640625, -0.009407997131347656, -0.0054798126220703125, -0.0015516281127929688, 0.002376556396484375, 0.006304740905761719, 0.010232925415039062, 0.014161109924316406, 0.01808929443359375, 0.022017478942871094, 0.025945663452148438, 0.02987384796142578, 0.033802032470703125, 0.03773021697998047, 0.04165840148925781, 0.045586585998535156, 0.0495147705078125, 0.053442955017089844, 0.05737113952636719, 0.06129932403564453, 0.06522750854492188, 0.06915569305419922, 0.07308387756347656, 0.0770120620727539, 0.08094024658203125, 0.0848684310913086, 0.08879661560058594, 0.09272480010986328, 0.09665298461914062, 0.10058116912841797, 0.10450935363769531, 0.10843753814697266, 0.11236572265625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 11.0, 15.0, 12.0, 24.0, 24.0, 43.0, 67.0, 109.0, 189.0, 397.0, 826.0, 1959.0, 5302.0, 16946.0, 69285.0, 380389.0, 457268.0, 85426.0, 20012.0, 6087.0, 2229.0, 923.0, 439.0, 238.0, 110.0, 78.0, 47.0, 23.0, 15.0, 8.0, 12.0, 12.0, 7.0, 8.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.07647705078125, -0.07423210144042969, -0.07198715209960938, -0.06974220275878906, -0.06749725341796875, -0.06525230407714844, -0.06300735473632812, -0.06076240539550781, -0.0585174560546875, -0.05627250671386719, -0.054027557373046875, -0.05178260803222656, -0.04953765869140625, -0.04729270935058594, -0.045047760009765625, -0.04280281066894531, -0.040557861328125, -0.03831291198730469, -0.036067962646484375, -0.03382301330566406, -0.03157806396484375, -0.029333114624023438, -0.027088165283203125, -0.024843215942382812, -0.0225982666015625, -0.020353317260742188, -0.018108367919921875, -0.015863418579101562, -0.01361846923828125, -0.011373519897460938, -0.009128570556640625, -0.0068836212158203125, -0.004638671875, -0.0023937225341796875, -0.000148773193359375, 0.0020961761474609375, 0.00434112548828125, 0.0065860748291015625, 0.008831024169921875, 0.011075973510742188, 0.0133209228515625, 0.015565872192382812, 0.017810821533203125, 0.020055770874023438, 0.02230072021484375, 0.024545669555664062, 0.026790618896484375, 0.029035568237304688, 0.031280517578125, 0.03352546691894531, 0.035770416259765625, 0.03801536560058594, 0.04026031494140625, 0.04250526428222656, 0.044750213623046875, 0.04699516296386719, 0.0492401123046875, 0.05148506164550781, 0.053730010986328125, 0.05597496032714844, 0.05821990966796875, 0.06046485900878906, 0.06270980834960938, 0.06495475769042969, 0.06719970703125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 2.0, 4.0, 4.0, 4.0, 7.0, 8.0, 12.0, 14.0, 18.0, 23.0, 37.0, 44.0, 50.0, 48.0, 69.0, 66.0, 79.0, 85.0, 70.0, 67.0, 55.0, 50.0, 39.0, 36.0, 24.0, 21.0, 23.0, 8.0, 12.0, 6.0, 4.0, 5.0, 5.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.9723854064941406e-05, -5.8113597333431244e-05, -5.650334060192108e-05, -5.489308387041092e-05, -5.328282713890076e-05, -5.1672570407390594e-05, -5.006231367588043e-05, -4.845205694437027e-05, -4.684180021286011e-05, -4.5231543481349945e-05, -4.362128674983978e-05, -4.201103001832962e-05, -4.040077328681946e-05, -3.8790516555309296e-05, -3.718025982379913e-05, -3.557000309228897e-05, -3.395974636077881e-05, -3.2349489629268646e-05, -3.0739232897758484e-05, -2.912897616624832e-05, -2.751871943473816e-05, -2.5908462703227997e-05, -2.4298205971717834e-05, -2.2687949240207672e-05, -2.107769250869751e-05, -1.9467435777187347e-05, -1.7857179045677185e-05, -1.6246922314167023e-05, -1.463666558265686e-05, -1.3026408851146698e-05, -1.1416152119636536e-05, -9.805895388126373e-06, -8.195638656616211e-06, -6.585381925106049e-06, -4.975125193595886e-06, -3.364868462085724e-06, -1.7546117305755615e-06, -1.4435499906539917e-07, 1.4659017324447632e-06, 3.0761584639549255e-06, 4.686415195465088e-06, 6.29667192697525e-06, 7.906928658485413e-06, 9.517185389995575e-06, 1.1127442121505737e-05, 1.27376988530159e-05, 1.4347955584526062e-05, 1.5958212316036224e-05, 1.7568469047546387e-05, 1.917872577905655e-05, 2.078898251056671e-05, 2.2399239242076874e-05, 2.4009495973587036e-05, 2.56197527050972e-05, 2.723000943660736e-05, 2.8840266168117523e-05, 3.0450522899627686e-05, 3.206077963113785e-05, 3.367103636264801e-05, 3.528129309415817e-05, 3.6891549825668335e-05, 3.85018065571785e-05, 4.011206328868866e-05, 4.172232002019882e-05, 4.3332576751708984e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 8.0, 3.0, 8.0, 13.0, 10.0, 21.0, 38.0, 60.0, 115.0, 236.0, 600.0, 1762.0, 7426.0, 57076.0, 749038.0, 210089.0, 17157.0, 3174.0, 967.0, 381.0, 177.0, 95.0, 45.0, 26.0, 12.0, 9.0, 9.0, 6.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.136474609375, -0.13265514373779297, -0.12883567810058594, -0.1250162124633789, -0.12119674682617188, -0.11737728118896484, -0.11355781555175781, -0.10973834991455078, -0.10591888427734375, -0.10209941864013672, -0.09827995300292969, -0.09446048736572266, -0.09064102172851562, -0.0868215560913086, -0.08300209045410156, -0.07918262481689453, -0.0753631591796875, -0.07154369354248047, -0.06772422790527344, -0.0639047622680664, -0.060085296630859375, -0.056265830993652344, -0.05244636535644531, -0.04862689971923828, -0.04480743408203125, -0.04098796844482422, -0.03716850280761719, -0.033349037170410156, -0.029529571533203125, -0.025710105895996094, -0.021890640258789062, -0.01807117462158203, -0.014251708984375, -0.010432243347167969, -0.0066127777099609375, -0.0027933120727539062, 0.001026153564453125, 0.004845619201660156, 0.008665084838867188, 0.012484550476074219, 0.01630401611328125, 0.02012348175048828, 0.023942947387695312, 0.027762413024902344, 0.031581878662109375, 0.035401344299316406, 0.03922080993652344, 0.04304027557373047, 0.0468597412109375, 0.05067920684814453, 0.05449867248535156, 0.058318138122558594, 0.062137603759765625, 0.06595706939697266, 0.06977653503417969, 0.07359600067138672, 0.07741546630859375, 0.08123493194580078, 0.08505439758300781, 0.08887386322021484, 0.09269332885742188, 0.0965127944946289, 0.10033226013183594, 0.10415172576904297, 0.10797119140625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 8.0, 9.0, 15.0, 9.0, 11.0, 21.0, 35.0, 40.0, 56.0, 83.0, 96.0, 134.0, 124.0, 92.0, 83.0, 57.0, 36.0, 26.0, 19.0, 14.0, 6.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04364013671875, -0.041728973388671875, -0.03981781005859375, -0.037906646728515625, -0.0359954833984375, -0.034084320068359375, -0.03217315673828125, -0.030261993408203125, -0.028350830078125, -0.026439666748046875, -0.02452850341796875, -0.022617340087890625, -0.0207061767578125, -0.018795013427734375, -0.01688385009765625, -0.014972686767578125, -0.0130615234375, -0.011150360107421875, -0.00923919677734375, -0.007328033447265625, -0.0054168701171875, -0.003505706787109375, -0.00159454345703125, 0.000316619873046875, 0.002227783203125, 0.004138946533203125, 0.00605010986328125, 0.007961273193359375, 0.0098724365234375, 0.011783599853515625, 0.01369476318359375, 0.015605926513671875, 0.01751708984375, 0.019428253173828125, 0.02133941650390625, 0.023250579833984375, 0.0251617431640625, 0.027072906494140625, 0.02898406982421875, 0.030895233154296875, 0.032806396484375, 0.034717559814453125, 0.03662872314453125, 0.038539886474609375, 0.0404510498046875, 0.042362213134765625, 0.04427337646484375, 0.046184539794921875, 0.048095703125, 0.050006866455078125, 0.05191802978515625, 0.053829193115234375, 0.0557403564453125, 0.057651519775390625, 0.05956268310546875, 0.061473846435546875, 0.063385009765625, 0.06529617309570312, 0.06720733642578125, 0.06911849975585938, 0.0710296630859375, 0.07294082641601562, 0.07485198974609375, 0.07676315307617188, 0.07867431640625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 7.0, 5.0, 5.0, 3.0, 11.0, 26.0, 34.0, 46.0, 85.0, 104.0, 149.0, 156.0, 119.0, 86.0, 68.0, 40.0, 24.0, 12.0, 7.0, 4.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5689632296562195, -0.5446256995201111, -0.5202881693840027, -0.4959506094455719, -0.4716130793094635, -0.4472755193710327, -0.4229379892349243, -0.3986004590988159, -0.3742629289627075, -0.3499253988265991, -0.32558783888816833, -0.30125030875205994, -0.27691277861595154, -0.25257521867752075, -0.22823768854141235, -0.20390015840530396, -0.17956259846687317, -0.15522505342960358, -0.13088752329349518, -0.10654997825622559, -0.08221244066953659, -0.057874903082847595, -0.033537358045578, -0.009199827909469604, 0.015137717127799988, 0.03947525471448898, 0.06381279230117798, 0.08815033733844757, 0.11248787492513657, 0.13682541251182556, 0.16116295754909515, 0.18550048768520355, 0.20983803272247314, 0.23417557775974274, 0.25851312279701233, 0.2828506529331207, 0.3071881830692291, 0.3315257430076599, 0.3558632731437683, 0.3802008032798767, 0.4045383334159851, 0.4288758635520935, 0.4532134234905243, 0.4775509536266327, 0.5018885135650635, 0.5262260437011719, 0.5505635738372803, 0.5749011039733887, 0.5992386341094971, 0.6235761642456055, 0.6479136943817139, 0.6722512245178223, 0.6965888142585754, 0.7209263443946838, 0.7452638745307922, 0.7696014046669006, 0.7939389944076538, 0.8182765245437622, 0.8426140546798706, 0.866951584815979, 0.8912891745567322, 0.9156267046928406, 0.939964234828949, 0.9643017649650574, 0.9886392951011658]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 6.0, 2.0, 4.0, 7.0, 8.0, 9.0, 11.0, 11.0, 17.0, 22.0, 23.0, 19.0, 16.0, 32.0, 34.0, 28.0, 39.0, 33.0, 40.0, 40.0, 34.0, 38.0, 42.0, 44.0, 48.0, 45.0, 49.0, 29.0, 41.0, 31.0, 32.0, 28.0, 22.0, 17.0, 17.0, 11.0, 10.0, 12.0, 6.0, 9.0, 8.0, 5.0, 6.0, 3.0, 6.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.6068695187568665, -0.5884832739830017, -0.5700969696044922, -0.5517107248306274, -0.5333244800567627, -0.5149381756782532, -0.4965519309043884, -0.4781656563282013, -0.45977938175201416, -0.441393107175827, -0.4230068624019623, -0.40462058782577515, -0.386234313249588, -0.3678480386734009, -0.34946179389953613, -0.331075519323349, -0.31268927454948425, -0.2943029999732971, -0.2759167551994324, -0.25753048062324524, -0.2391442060470581, -0.22075794637203217, -0.20237168669700623, -0.1839854121208191, -0.16559915244579315, -0.1472128927707672, -0.12882661819458008, -0.11044035851955414, -0.0920540913939476, -0.07366782426834106, -0.055281564593315125, -0.03689529001712799, -0.01850903034210205, -0.00012276507914066315, 0.018263500183820724, 0.03664976358413696, 0.0550360307097435, 0.07342229783535004, 0.09180855751037598, 0.11019483208656311, 0.12858109176158905, 0.146967351436615, 0.16535362601280212, 0.18373988568782806, 0.202126145362854, 0.22051241993904114, 0.23889867961406708, 0.257284939289093, 0.27567121386528015, 0.2940574884414673, 0.31244373321533203, 0.33083000779151917, 0.3492162823677063, 0.36760252714157104, 0.3859888017177582, 0.4043750762939453, 0.42276132106781006, 0.4411475956439972, 0.45953384041786194, 0.4779201149940491, 0.4963063895702362, 0.5146926641464233, 0.5330789089202881, 0.5514651536941528, 0.5698514580726624]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 0.0, 0.0, 3.0, 4.0, 2.0, 8.0, 7.0, 11.0, 10.0, 20.0, 25.0, 46.0, 55.0, 110.0, 164.0, 282.0, 483.0, 886.0, 1504.0, 3277.0, 7949.0, 24573.0, 116143.0, 3633027.0, 339589.0, 43697.0, 12693.0, 4867.0, 2197.0, 1065.0, 636.0, 372.0, 230.0, 139.0, 81.0, 42.0, 34.0, 21.0, 17.0, 4.0, 3.0, 9.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1634521484375, -0.15860366821289062, -0.15375518798828125, -0.14890670776367188, -0.1440582275390625, -0.13920974731445312, -0.13436126708984375, -0.12951278686523438, -0.124664306640625, -0.11981582641601562, -0.11496734619140625, -0.11011886596679688, -0.1052703857421875, -0.10042190551757812, -0.09557342529296875, -0.09072494506835938, -0.08587646484375, -0.08102798461914062, -0.07617950439453125, -0.07133102416992188, -0.0664825439453125, -0.061634063720703125, -0.05678558349609375, -0.051937103271484375, -0.047088623046875, -0.042240142822265625, -0.03739166259765625, -0.032543182373046875, -0.0276947021484375, -0.022846221923828125, -0.01799774169921875, -0.013149261474609375, -0.00830078125, -0.003452301025390625, 0.00139617919921875, 0.006244659423828125, 0.0110931396484375, 0.015941619873046875, 0.02079010009765625, 0.025638580322265625, 0.030487060546875, 0.035335540771484375, 0.04018402099609375, 0.045032501220703125, 0.0498809814453125, 0.054729461669921875, 0.05957794189453125, 0.06442642211914062, 0.06927490234375, 0.07412338256835938, 0.07897186279296875, 0.08382034301757812, 0.0886688232421875, 0.09351730346679688, 0.09836578369140625, 0.10321426391601562, 0.108062744140625, 0.11291122436523438, 0.11775970458984375, 0.12260818481445312, 0.1274566650390625, 0.13230514526367188, 0.13715362548828125, 0.14200210571289062, 0.1468505859375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 7.0, 9.0, 10.0, 15.0, 14.0, 11.0, 17.0, 30.0, 28.0, 43.0, 32.0, 53.0, 42.0, 54.0, 59.0, 47.0, 62.0, 60.0, 59.0, 51.0, 47.0, 38.0, 40.0, 35.0, 30.0, 25.0, 18.0, 14.0, 14.0, 9.0, 8.0, 7.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0238189697265625, -0.023005962371826172, -0.022192955017089844, -0.021379947662353516, -0.020566940307617188, -0.01975393295288086, -0.01894092559814453, -0.018127918243408203, -0.017314910888671875, -0.016501903533935547, -0.01568889617919922, -0.01487588882446289, -0.014062881469726562, -0.013249874114990234, -0.012436866760253906, -0.011623859405517578, -0.01081085205078125, -0.009997844696044922, -0.009184837341308594, -0.008371829986572266, -0.0075588226318359375, -0.006745815277099609, -0.005932807922363281, -0.005119800567626953, -0.004306793212890625, -0.003493785858154297, -0.0026807785034179688, -0.0018677711486816406, -0.0010547637939453125, -0.00024175643920898438, 0.0005712509155273438, 0.0013842582702636719, 0.002197265625, 0.003010272979736328, 0.0038232803344726562, 0.004636287689208984, 0.0054492950439453125, 0.006262302398681641, 0.007075309753417969, 0.007888317108154297, 0.008701324462890625, 0.009514331817626953, 0.010327339172363281, 0.01114034652709961, 0.011953353881835938, 0.012766361236572266, 0.013579368591308594, 0.014392375946044922, 0.01520538330078125, 0.016018390655517578, 0.016831398010253906, 0.017644405364990234, 0.018457412719726562, 0.01927042007446289, 0.02008342742919922, 0.020896434783935547, 0.021709442138671875, 0.022522449493408203, 0.02333545684814453, 0.02414846420288086, 0.024961471557617188, 0.025774478912353516, 0.026587486267089844, 0.027400493621826172, 0.0282135009765625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 10.0, 4.0, 11.0, 15.0, 22.0, 36.0, 38.0, 66.0, 84.0, 168.0, 424.0, 1838.0, 15464.0, 865479.0, 3283964.0, 22980.0, 2658.0, 574.0, 194.0, 94.0, 47.0, 32.0, 27.0, 14.0, 14.0, 7.0, 9.0, 5.0, 2.0, 4.0, 0.0, 5.0], "bins": [-0.5107421875, -0.49965476989746094, -0.4885673522949219, -0.4774799346923828, -0.46639251708984375, -0.4553050994873047, -0.4442176818847656, -0.43313026428222656, -0.4220428466796875, -0.41095542907714844, -0.3998680114746094, -0.3887805938720703, -0.37769317626953125, -0.3666057586669922, -0.3555183410644531, -0.34443092346191406, -0.333343505859375, -0.32225608825683594, -0.3111686706542969, -0.3000812530517578, -0.28899383544921875, -0.2779064178466797, -0.2668190002441406, -0.25573158264160156, -0.2446441650390625, -0.23355674743652344, -0.22246932983398438, -0.2113819122314453, -0.20029449462890625, -0.1892070770263672, -0.17811965942382812, -0.16703224182128906, -0.15594482421875, -0.14485740661621094, -0.13376998901367188, -0.12268257141113281, -0.11159515380859375, -0.10050773620605469, -0.08942031860351562, -0.07833290100097656, -0.0672454833984375, -0.05615806579589844, -0.045070648193359375, -0.03398323059082031, -0.02289581298828125, -0.011808395385742188, -0.000720977783203125, 0.010366439819335938, 0.021453857421875, 0.03254127502441406, 0.043628692626953125, 0.05471611022949219, 0.06580352783203125, 0.07689094543457031, 0.08797836303710938, 0.09906578063964844, 0.1101531982421875, 0.12124061584472656, 0.13232803344726562, 0.1434154510498047, 0.15450286865234375, 0.1655902862548828, 0.17667770385742188, 0.18776512145996094, 0.1988525390625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 5.0, 6.0, 12.0, 31.0, 67.0, 110.0, 328.0, 1890.0, 1113.0, 253.0, 123.0, 50.0, 37.0, 16.0, 13.0, 8.0, 2.0, 5.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.107177734375, -0.10473775863647461, -0.10229778289794922, -0.09985780715942383, -0.09741783142089844, -0.09497785568237305, -0.09253787994384766, -0.09009790420532227, -0.08765792846679688, -0.08521795272827148, -0.0827779769897461, -0.0803380012512207, -0.07789802551269531, -0.07545804977416992, -0.07301807403564453, -0.07057809829711914, -0.06813812255859375, -0.06569814682006836, -0.06325817108154297, -0.06081819534301758, -0.05837821960449219, -0.0559382438659668, -0.053498268127441406, -0.051058292388916016, -0.048618316650390625, -0.046178340911865234, -0.043738365173339844, -0.04129838943481445, -0.03885841369628906, -0.03641843795776367, -0.03397846221923828, -0.03153848648071289, -0.0290985107421875, -0.02665853500366211, -0.02421855926513672, -0.021778583526611328, -0.019338607788085938, -0.016898632049560547, -0.014458656311035156, -0.012018680572509766, -0.009578704833984375, -0.007138729095458984, -0.004698753356933594, -0.002258777618408203, 0.0001811981201171875, 0.002621173858642578, 0.005061149597167969, 0.007501125335693359, 0.00994110107421875, 0.01238107681274414, 0.014821052551269531, 0.017261028289794922, 0.019701004028320312, 0.022140979766845703, 0.024580955505371094, 0.027020931243896484, 0.029460906982421875, 0.031900882720947266, 0.034340858459472656, 0.03678083419799805, 0.03922080993652344, 0.04166078567504883, 0.04410076141357422, 0.04654073715209961, 0.048980712890625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 8.0, 14.0, 32.0, 69.0, 161.0, 241.0, 232.0, 138.0, 65.0, 31.0, 13.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2084607481956482, -0.19439680874347687, -0.18033288419246674, -0.1662689447402954, -0.15220502018928528, -0.13814108073711395, -0.12407714873552322, -0.1100132167339325, -0.09594928473234177, -0.08188535273075104, -0.06782142072916031, -0.05375748500227928, -0.03969355300068855, -0.025629617273807526, -0.011565685272216797, 0.002498246729373932, 0.01656217873096466, 0.03062611073255539, 0.04469004273414612, 0.058753978461027145, 0.07281790673732758, 0.0868818461894989, 0.10094577819108963, 0.11500971019268036, 0.12907364964485168, 0.143137589097023, 0.15720151364803314, 0.17126545310020447, 0.1853293776512146, 0.19939331710338593, 0.21345725655555725, 0.22752118110656738, 0.24158510565757751, 0.25564903020858765, 0.26971298456192017, 0.2837769091129303, 0.29784083366394043, 0.31190478801727295, 0.3259687125682831, 0.3400326371192932, 0.35409656167030334, 0.3681604862213135, 0.382224440574646, 0.39628836512565613, 0.41035228967666626, 0.4244162440299988, 0.4384801685810089, 0.45254409313201904, 0.46660804748535156, 0.4806719720363617, 0.4947359263896942, 0.5087998509407043, 0.5228638052940369, 0.5369277000427246, 0.5509916543960571, 0.5650556087493896, 0.5791195034980774, 0.5931834578514099, 0.6072473526000977, 0.6213113069534302, 0.6353752613067627, 0.6494391560554504, 0.663503110408783, 0.6775670051574707, 0.6916309595108032]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 7.0, 5.0, 8.0, 9.0, 14.0, 7.0, 15.0, 17.0, 15.0, 26.0, 24.0, 29.0, 28.0, 35.0, 34.0, 36.0, 48.0, 42.0, 40.0, 38.0, 33.0, 33.0, 39.0, 32.0, 42.0, 30.0, 46.0, 28.0, 35.0, 30.0, 24.0, 25.0, 23.0, 13.0, 19.0, 20.0, 10.0, 11.0, 10.0, 7.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1454206109046936, -0.14092865586280823, -0.13643671572208405, -0.13194476068019867, -0.1274528205394745, -0.12296086549758911, -0.11846891045570374, -0.11397696286439896, -0.10948501527309418, -0.1049930676817894, -0.10050112009048462, -0.09600916504859924, -0.09151721745729446, -0.08702526986598969, -0.08253331482410431, -0.07804136723279953, -0.07354941964149475, -0.06905747205018997, -0.06456552445888519, -0.06007356941699982, -0.05558162182569504, -0.05108967423439026, -0.04659772291779518, -0.042105771601200104, -0.037613824009895325, -0.033121876418590546, -0.028629925101995468, -0.02413797564804554, -0.01964602619409561, -0.015154076740145683, -0.010662127286195755, -0.0061701759696006775, -0.0016782283782958984, 0.00281372107565403, 0.007305670529603958, 0.011797619983553886, 0.016289569437503815, 0.020781518891453743, 0.02527346834540367, 0.02976541966199875, 0.03425736725330353, 0.03874931484460831, 0.043241266161203384, 0.04773321747779846, 0.05222516506910324, 0.05671711266040802, 0.0612090639770031, 0.06570101529359818, 0.07019296288490295, 0.07468491047620773, 0.07917685806751251, 0.08366881310939789, 0.08816076070070267, 0.09265270829200745, 0.09714466333389282, 0.1016366109251976, 0.10612855851650238, 0.11062050610780716, 0.11511245369911194, 0.11960440874099731, 0.1240963563323021, 0.12858830392360687, 0.13308025896549225, 0.13757219910621643, 0.1420641541481018]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 10.0, 14.0, 24.0, 34.0, 39.0, 85.0, 146.0, 232.0, 400.0, 712.0, 1333.0, 2923.0, 6059.0, 13817.0, 33547.0, 88164.0, 229902.0, 366251.0, 186139.0, 69983.0, 27295.0, 11410.0, 4947.0, 2404.0, 1171.0, 652.0, 355.0, 209.0, 105.0, 84.0, 33.0, 27.0, 15.0, 9.0, 8.0, 7.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.102294921875, -0.09923076629638672, -0.09616661071777344, -0.09310245513916016, -0.09003829956054688, -0.0869741439819336, -0.08390998840332031, -0.08084583282470703, -0.07778167724609375, -0.07471752166748047, -0.07165336608886719, -0.0685892105102539, -0.06552505493164062, -0.062460899353027344, -0.05939674377441406, -0.05633258819580078, -0.0532684326171875, -0.05020427703857422, -0.04714012145996094, -0.044075965881347656, -0.041011810302734375, -0.037947654724121094, -0.03488349914550781, -0.03181934356689453, -0.02875518798828125, -0.02569103240966797, -0.022626876831054688, -0.019562721252441406, -0.016498565673828125, -0.013434410095214844, -0.010370254516601562, -0.007306098937988281, -0.004241943359375, -0.0011777877807617188, 0.0018863677978515625, 0.004950523376464844, 0.008014678955078125, 0.011078834533691406, 0.014142990112304688, 0.01720714569091797, 0.02027130126953125, 0.02333545684814453, 0.026399612426757812, 0.029463768005371094, 0.032527923583984375, 0.035592079162597656, 0.03865623474121094, 0.04172039031982422, 0.0447845458984375, 0.04784870147705078, 0.05091285705566406, 0.053977012634277344, 0.057041168212890625, 0.060105323791503906, 0.06316947937011719, 0.06623363494873047, 0.06929779052734375, 0.07236194610595703, 0.07542610168457031, 0.0784902572631836, 0.08155441284179688, 0.08461856842041016, 0.08768272399902344, 0.09074687957763672, 0.09381103515625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 0.0, 4.0, 6.0, 6.0, 7.0, 7.0, 8.0, 17.0, 19.0, 12.0, 22.0, 28.0, 42.0, 44.0, 41.0, 48.0, 44.0, 55.0, 50.0, 38.0, 55.0, 57.0, 65.0, 57.0, 44.0, 29.0, 29.0, 26.0, 35.0, 20.0, 23.0, 16.0, 13.0, 9.0, 7.0, 7.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0224761962890625, -0.021669626235961914, -0.020863056182861328, -0.020056486129760742, -0.019249916076660156, -0.01844334602355957, -0.017636775970458984, -0.0168302059173584, -0.016023635864257812, -0.015217065811157227, -0.01441049575805664, -0.013603925704956055, -0.012797355651855469, -0.011990785598754883, -0.011184215545654297, -0.010377645492553711, -0.009571075439453125, -0.008764505386352539, -0.007957935333251953, -0.007151365280151367, -0.006344795227050781, -0.005538225173950195, -0.004731655120849609, -0.0039250850677490234, -0.0031185150146484375, -0.0023119449615478516, -0.0015053749084472656, -0.0006988048553466797, 0.00010776519775390625, 0.0009143352508544922, 0.0017209053039550781, 0.002527475357055664, 0.00333404541015625, 0.004140615463256836, 0.004947185516357422, 0.005753755569458008, 0.006560325622558594, 0.00736689567565918, 0.008173465728759766, 0.008980035781860352, 0.009786605834960938, 0.010593175888061523, 0.01139974594116211, 0.012206315994262695, 0.013012886047363281, 0.013819456100463867, 0.014626026153564453, 0.015432596206665039, 0.016239166259765625, 0.01704573631286621, 0.017852306365966797, 0.018658876419067383, 0.01946544647216797, 0.020272016525268555, 0.02107858657836914, 0.021885156631469727, 0.022691726684570312, 0.0234982967376709, 0.024304866790771484, 0.02511143684387207, 0.025918006896972656, 0.026724576950073242, 0.027531147003173828, 0.028337717056274414, 0.029144287109375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 5.0, 8.0, 7.0, 7.0, 25.0, 49.0, 65.0, 75.0, 92.0, 112.0, 220.0, 345.0, 542.0, 897.0, 1972.0, 4789.0, 16474.0, 68894.0, 315020.0, 476619.0, 122181.0, 27266.0, 7213.0, 2580.0, 1235.0, 677.0, 403.0, 234.0, 167.0, 116.0, 83.0, 44.0, 44.0, 19.0, 20.0, 20.0, 10.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10650634765625, -0.10243892669677734, -0.09837150573730469, -0.09430408477783203, -0.09023666381835938, -0.08616924285888672, -0.08210182189941406, -0.0780344009399414, -0.07396697998046875, -0.0698995590209961, -0.06583213806152344, -0.06176471710205078, -0.057697296142578125, -0.05362987518310547, -0.04956245422363281, -0.045495033264160156, -0.0414276123046875, -0.037360191345214844, -0.03329277038574219, -0.02922534942626953, -0.025157928466796875, -0.02109050750732422, -0.017023086547851562, -0.012955665588378906, -0.00888824462890625, -0.004820823669433594, -0.0007534027099609375, 0.0033140182495117188, 0.007381439208984375, 0.011448860168457031, 0.015516281127929688, 0.019583702087402344, 0.023651123046875, 0.027718544006347656, 0.03178596496582031, 0.03585338592529297, 0.039920806884765625, 0.04398822784423828, 0.04805564880371094, 0.052123069763183594, 0.05619049072265625, 0.060257911682128906, 0.06432533264160156, 0.06839275360107422, 0.07246017456054688, 0.07652759552001953, 0.08059501647949219, 0.08466243743896484, 0.0887298583984375, 0.09279727935791016, 0.09686470031738281, 0.10093212127685547, 0.10499954223632812, 0.10906696319580078, 0.11313438415527344, 0.1172018051147461, 0.12126922607421875, 0.1253366470336914, 0.12940406799316406, 0.13347148895263672, 0.13753890991210938, 0.14160633087158203, 0.1456737518310547, 0.14974117279052734, 0.15380859375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 5.0, 8.0, 7.0, 11.0, 14.0, 14.0, 13.0, 13.0, 14.0, 19.0, 31.0, 28.0, 40.0, 27.0, 35.0, 42.0, 52.0, 33.0, 52.0, 44.0, 48.0, 39.0, 42.0, 37.0, 43.0, 54.0, 43.0, 27.0, 22.0, 21.0, 21.0, 20.0, 10.0, 20.0, 16.0, 5.0, 8.0, 6.0, 6.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.089599609375, -0.0863351821899414, -0.08307075500488281, -0.07980632781982422, -0.07654190063476562, -0.07327747344970703, -0.07001304626464844, -0.06674861907958984, -0.06348419189453125, -0.060219764709472656, -0.05695533752441406, -0.05369091033935547, -0.050426483154296875, -0.04716205596923828, -0.04389762878417969, -0.040633201599121094, -0.0373687744140625, -0.034104347229003906, -0.030839920043945312, -0.02757549285888672, -0.024311065673828125, -0.02104663848876953, -0.017782211303710938, -0.014517784118652344, -0.01125335693359375, -0.007988929748535156, -0.0047245025634765625, -0.0014600753784179688, 0.001804351806640625, 0.005068778991699219, 0.008333206176757812, 0.011597633361816406, 0.014862060546875, 0.018126487731933594, 0.021390914916992188, 0.02465534210205078, 0.027919769287109375, 0.03118419647216797, 0.03444862365722656, 0.037713050842285156, 0.04097747802734375, 0.044241905212402344, 0.04750633239746094, 0.05077075958251953, 0.054035186767578125, 0.05729961395263672, 0.06056404113769531, 0.0638284683227539, 0.0670928955078125, 0.0703573226928711, 0.07362174987792969, 0.07688617706298828, 0.08015060424804688, 0.08341503143310547, 0.08667945861816406, 0.08994388580322266, 0.09320831298828125, 0.09647274017333984, 0.09973716735839844, 0.10300159454345703, 0.10626602172851562, 0.10953044891357422, 0.11279487609863281, 0.1160593032836914, 0.11932373046875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 6.0, 11.0, 16.0, 35.0, 34.0, 73.0, 195.0, 459.0, 1340.0, 5019.0, 25110.0, 199132.0, 685038.0, 111106.0, 15962.0, 3349.0, 996.0, 362.0, 148.0, 70.0, 33.0, 23.0, 16.0, 8.0, 3.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.085205078125, -0.082489013671875, -0.07977294921875, -0.077056884765625, -0.0743408203125, -0.071624755859375, -0.06890869140625, -0.066192626953125, -0.0634765625, -0.060760498046875, -0.05804443359375, -0.055328369140625, -0.0526123046875, -0.049896240234375, -0.04718017578125, -0.044464111328125, -0.041748046875, -0.039031982421875, -0.03631591796875, -0.033599853515625, -0.0308837890625, -0.028167724609375, -0.02545166015625, -0.022735595703125, -0.02001953125, -0.017303466796875, -0.01458740234375, -0.011871337890625, -0.0091552734375, -0.006439208984375, -0.00372314453125, -0.001007080078125, 0.001708984375, 0.004425048828125, 0.00714111328125, 0.009857177734375, 0.0125732421875, 0.015289306640625, 0.01800537109375, 0.020721435546875, 0.0234375, 0.026153564453125, 0.02886962890625, 0.031585693359375, 0.0343017578125, 0.037017822265625, 0.03973388671875, 0.042449951171875, 0.045166015625, 0.047882080078125, 0.05059814453125, 0.053314208984375, 0.0560302734375, 0.058746337890625, 0.06146240234375, 0.064178466796875, 0.06689453125, 0.069610595703125, 0.07232666015625, 0.075042724609375, 0.0777587890625, 0.080474853515625, 0.08319091796875, 0.085906982421875, 0.088623046875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 13.0, 13.0, 18.0, 31.0, 48.0, 52.0, 76.0, 103.0, 130.0, 146.0, 101.0, 89.0, 61.0, 32.0, 31.0, 21.0, 13.0, 17.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.814168930053711e-05, -7.554329931735992e-05, -7.294490933418274e-05, -7.034651935100555e-05, -6.774812936782837e-05, -6.514973938465118e-05, -6.2551349401474e-05, -5.9952959418296814e-05, -5.735456943511963e-05, -5.4756179451942444e-05, -5.215778946876526e-05, -4.9559399485588074e-05, -4.696100950241089e-05, -4.4362619519233704e-05, -4.176422953605652e-05, -3.9165839552879333e-05, -3.656744956970215e-05, -3.396905958652496e-05, -3.137066960334778e-05, -2.8772279620170593e-05, -2.6173889636993408e-05, -2.3575499653816223e-05, -2.0977109670639038e-05, -1.8378719687461853e-05, -1.5780329704284668e-05, -1.3181939721107483e-05, -1.0583549737930298e-05, -7.985159754753113e-06, -5.386769771575928e-06, -2.7883797883987427e-06, -1.8998980522155762e-07, 2.4084001779556274e-06, 5.0067901611328125e-06, 7.6051801443099976e-06, 1.0203570127487183e-05, 1.2801960110664368e-05, 1.5400350093841553e-05, 1.7998740077018738e-05, 2.0597130060195923e-05, 2.3195520043373108e-05, 2.5793910026550293e-05, 2.8392300009727478e-05, 3.099068999290466e-05, 3.358907997608185e-05, 3.618746995925903e-05, 3.878585994243622e-05, 4.13842499256134e-05, 4.398263990879059e-05, 4.6581029891967773e-05, 4.917941987514496e-05, 5.1777809858322144e-05, 5.437619984149933e-05, 5.6974589824676514e-05, 5.95729798078537e-05, 6.217136979103088e-05, 6.476975977420807e-05, 6.736814975738525e-05, 6.996653974056244e-05, 7.256492972373962e-05, 7.516331970691681e-05, 7.7761709690094e-05, 8.036009967327118e-05, 8.295848965644836e-05, 8.555687963962555e-05, 8.815526962280273e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 1.0, 7.0, 4.0, 6.0, 8.0, 9.0, 15.0, 12.0, 32.0, 45.0, 52.0, 74.0, 120.0, 187.0, 362.0, 659.0, 1309.0, 2793.0, 8148.0, 30201.0, 164490.0, 615813.0, 178234.0, 31843.0, 8223.0, 3007.0, 1299.0, 618.0, 381.0, 207.0, 118.0, 95.0, 51.0, 32.0, 18.0, 21.0, 19.0, 12.0, 5.0, 9.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048858642578125, -0.04694414138793945, -0.045029640197753906, -0.04311513900756836, -0.04120063781738281, -0.039286136627197266, -0.03737163543701172, -0.03545713424682617, -0.033542633056640625, -0.03162813186645508, -0.02971363067626953, -0.027799129486083984, -0.025884628295898438, -0.02397012710571289, -0.022055625915527344, -0.020141124725341797, -0.01822662353515625, -0.016312122344970703, -0.014397621154785156, -0.01248311996459961, -0.010568618774414062, -0.008654117584228516, -0.006739616394042969, -0.004825115203857422, -0.002910614013671875, -0.0009961128234863281, 0.0009183883666992188, 0.0028328895568847656, 0.0047473907470703125, 0.006661891937255859, 0.008576393127441406, 0.010490894317626953, 0.0124053955078125, 0.014319896697998047, 0.016234397888183594, 0.01814889907836914, 0.020063400268554688, 0.021977901458740234, 0.02389240264892578, 0.025806903839111328, 0.027721405029296875, 0.029635906219482422, 0.03155040740966797, 0.033464908599853516, 0.03537940979003906, 0.03729391098022461, 0.039208412170410156, 0.0411229133605957, 0.04303741455078125, 0.0449519157409668, 0.046866416931152344, 0.04878091812133789, 0.05069541931152344, 0.052609920501708984, 0.05452442169189453, 0.05643892288208008, 0.058353424072265625, 0.06026792526245117, 0.06218242645263672, 0.06409692764282227, 0.06601142883300781, 0.06792593002319336, 0.0698404312133789, 0.07175493240356445, 0.07366943359375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 8.0, 5.0, 8.0, 11.0, 19.0, 16.0, 25.0, 41.0, 44.0, 61.0, 65.0, 80.0, 97.0, 85.0, 90.0, 79.0, 55.0, 40.0, 48.0, 33.0, 23.0, 17.0, 12.0, 9.0, 7.0, 4.0, 5.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.038116455078125, -0.03685426712036133, -0.035592079162597656, -0.034329891204833984, -0.03306770324707031, -0.03180551528930664, -0.03054332733154297, -0.029281139373779297, -0.028018951416015625, -0.026756763458251953, -0.02549457550048828, -0.02423238754272461, -0.022970199584960938, -0.021708011627197266, -0.020445823669433594, -0.019183635711669922, -0.01792144775390625, -0.016659259796142578, -0.015397071838378906, -0.014134883880615234, -0.012872695922851562, -0.01161050796508789, -0.010348320007324219, -0.009086132049560547, -0.007823944091796875, -0.006561756134033203, -0.005299568176269531, -0.004037380218505859, -0.0027751922607421875, -0.0015130043029785156, -0.00025081634521484375, 0.0010113716125488281, 0.0022735595703125, 0.003535747528076172, 0.004797935485839844, 0.006060123443603516, 0.0073223114013671875, 0.00858449935913086, 0.009846687316894531, 0.011108875274658203, 0.012371063232421875, 0.013633251190185547, 0.014895439147949219, 0.01615762710571289, 0.017419815063476562, 0.018682003021240234, 0.019944190979003906, 0.021206378936767578, 0.02246856689453125, 0.023730754852294922, 0.024992942810058594, 0.026255130767822266, 0.027517318725585938, 0.02877950668334961, 0.03004169464111328, 0.03130388259887695, 0.032566070556640625, 0.0338282585144043, 0.03509044647216797, 0.03635263442993164, 0.03761482238769531, 0.038877010345458984, 0.040139198303222656, 0.04140138626098633, 0.04266357421875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 4.0, 13.0, 29.0, 67.0, 109.0, 170.0, 202.0, 181.0, 121.0, 60.0, 27.0, 13.0, 5.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3740830421447754, -0.3383066654205322, -0.3025302588939667, -0.2667538821697235, -0.23097749054431915, -0.1952010989189148, -0.15942472219467163, -0.12364831566810608, -0.08787193894386292, -0.052095551043748856, -0.016319163143634796, 0.019457221031188965, 0.05523361265659332, 0.09101000428199768, 0.12678638100624084, 0.1625627875328064, 0.19833916425704956, 0.23411555588245392, 0.2698919475078583, 0.30566832423210144, 0.341444730758667, 0.37722110748291016, 0.4129974842071533, 0.44877389073371887, 0.48455026745796204, 0.5203266739845276, 0.5561030507087708, 0.5918794274330139, 0.6276558041572571, 0.663432240486145, 0.6992086172103882, 0.7349849939346313, 0.7707613706588745, 0.8065377473831177, 0.8423141241073608, 0.878090500831604, 0.9138669371604919, 0.9496433138847351, 0.9854196906089783, 1.0211961269378662, 1.0569725036621094, 1.0927488803863525, 1.1285252571105957, 1.1643016338348389, 1.200078010559082, 1.2358543872833252, 1.2716307640075684, 1.307407259941101, 1.3431835174560547, 1.3789598941802979, 1.414736270904541, 1.4505126476287842, 1.4862890243530273, 1.5220654010772705, 1.5578417778015137, 1.5936182737350464, 1.6293946504592896, 1.6651710271835327, 1.7009474039077759, 1.736723780632019, 1.7725001573562622, 1.808276653289795, 1.844053030014038, 1.8798294067382812, 1.9156057834625244]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 5.0, 5.0, 5.0, 10.0, 14.0, 12.0, 20.0, 20.0, 18.0, 34.0, 25.0, 33.0, 32.0, 35.0, 42.0, 38.0, 47.0, 43.0, 45.0, 46.0, 55.0, 41.0, 40.0, 47.0, 38.0, 30.0, 29.0, 24.0, 23.0, 31.0, 22.0, 16.0, 12.0, 11.0, 9.0, 13.0, 5.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.5758402347564697, -0.5574343800544739, -0.5390284657478333, -0.5206226110458374, -0.5022166967391968, -0.4838108420372009, -0.4654049575328827, -0.44699907302856445, -0.4285931885242462, -0.410187304019928, -0.39178141951560974, -0.3733755350112915, -0.35496968030929565, -0.33656376600265503, -0.3181579113006592, -0.29975202679634094, -0.2813461422920227, -0.26294025778770447, -0.24453437328338623, -0.2261285036802292, -0.20772261917591095, -0.1893167346715927, -0.17091086506843567, -0.15250498056411743, -0.1340990960597992, -0.11569321155548096, -0.09728733450174332, -0.07888145744800568, -0.06047557294368744, -0.0420696884393692, -0.02366381138563156, -0.005257934331893921, 0.013148009777069092, 0.03155389055609703, 0.04995977133512497, 0.06836564838886261, 0.08677153289318085, 0.10517741739749908, 0.12358329445123672, 0.14198917150497437, 0.1603950560092926, 0.17880094051361084, 0.19720682501792908, 0.21561269462108612, 0.23401857912540436, 0.2524244785308838, 0.27083033323287964, 0.2892362177371979, 0.3076421022415161, 0.32604798674583435, 0.3444538712501526, 0.3628597557544708, 0.38126564025878906, 0.3996714949607849, 0.41807737946510315, 0.4364832639694214, 0.4548891484737396, 0.47329503297805786, 0.4917009174823761, 0.5101068019866943, 0.5285126566886902, 0.5469185709953308, 0.5653244256973267, 0.5837303400039673, 0.6021361947059631]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 5.0, 8.0, 8.0, 14.0, 26.0, 27.0, 35.0, 68.0, 68.0, 132.0, 205.0, 356.0, 543.0, 845.0, 1569.0, 2896.0, 5814.0, 13914.0, 39427.0, 170138.0, 3232404.0, 603934.0, 79945.0, 23270.0, 9081.0, 4316.0, 2251.0, 1193.0, 653.0, 411.0, 244.0, 159.0, 117.0, 57.0, 44.0, 32.0, 19.0, 17.0, 14.0, 7.0, 9.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1297607421875, -0.12602901458740234, -0.12229728698730469, -0.11856555938720703, -0.11483383178710938, -0.11110210418701172, -0.10737037658691406, -0.1036386489868164, -0.09990692138671875, -0.0961751937866211, -0.09244346618652344, -0.08871173858642578, -0.08498001098632812, -0.08124828338623047, -0.07751655578613281, -0.07378482818603516, -0.0700531005859375, -0.06632137298583984, -0.06258964538574219, -0.05885791778564453, -0.055126190185546875, -0.05139446258544922, -0.04766273498535156, -0.043931007385253906, -0.04019927978515625, -0.036467552185058594, -0.03273582458496094, -0.02900409698486328, -0.025272369384765625, -0.02154064178466797, -0.017808914184570312, -0.014077186584472656, -0.010345458984375, -0.006613731384277344, -0.0028820037841796875, 0.0008497238159179688, 0.004581451416015625, 0.008313179016113281, 0.012044906616210938, 0.015776634216308594, 0.01950836181640625, 0.023240089416503906, 0.026971817016601562, 0.03070354461669922, 0.034435272216796875, 0.03816699981689453, 0.04189872741699219, 0.045630455017089844, 0.0493621826171875, 0.053093910217285156, 0.05682563781738281, 0.06055736541748047, 0.06428909301757812, 0.06802082061767578, 0.07175254821777344, 0.0754842758178711, 0.07921600341796875, 0.0829477310180664, 0.08667945861816406, 0.09041118621826172, 0.09414291381835938, 0.09787464141845703, 0.10160636901855469, 0.10533809661865234, 0.10906982421875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 5.0, 4.0, 10.0, 7.0, 11.0, 13.0, 11.0, 11.0, 20.0, 27.0, 26.0, 35.0, 39.0, 47.0, 40.0, 46.0, 43.0, 52.0, 35.0, 50.0, 63.0, 37.0, 72.0, 38.0, 38.0, 44.0, 29.0, 25.0, 22.0, 16.0, 26.0, 10.0, 9.0, 10.0, 11.0, 4.0, 7.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.020782470703125, -0.020015954971313477, -0.019249439239501953, -0.01848292350769043, -0.017716407775878906, -0.016949892044067383, -0.01618337631225586, -0.015416860580444336, -0.014650344848632812, -0.013883829116821289, -0.013117313385009766, -0.012350797653198242, -0.011584281921386719, -0.010817766189575195, -0.010051250457763672, -0.009284734725952148, -0.008518218994140625, -0.0077517032623291016, -0.006985187530517578, -0.006218671798706055, -0.005452156066894531, -0.004685640335083008, -0.003919124603271484, -0.003152608871459961, -0.0023860931396484375, -0.001619577407836914, -0.0008530616760253906, -8.654594421386719e-05, 0.0006799697875976562, 0.0014464855194091797, 0.002213001251220703, 0.0029795169830322266, 0.00374603271484375, 0.0045125484466552734, 0.005279064178466797, 0.00604557991027832, 0.006812095642089844, 0.007578611373901367, 0.00834512710571289, 0.009111642837524414, 0.009878158569335938, 0.010644674301147461, 0.011411190032958984, 0.012177705764770508, 0.012944221496582031, 0.013710737228393555, 0.014477252960205078, 0.015243768692016602, 0.016010284423828125, 0.01677680015563965, 0.017543315887451172, 0.018309831619262695, 0.01907634735107422, 0.019842863082885742, 0.020609378814697266, 0.02137589454650879, 0.022142410278320312, 0.022908926010131836, 0.02367544174194336, 0.024441957473754883, 0.025208473205566406, 0.02597498893737793, 0.026741504669189453, 0.027508020401000977, 0.0282745361328125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 9.0, 12.0, 14.0, 21.0, 45.0, 83.0, 118.0, 219.0, 603.0, 2507.0, 21351.0, 1492518.0, 2647651.0, 25087.0, 2894.0, 643.0, 260.0, 102.0, 58.0, 38.0, 23.0, 15.0, 4.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.423583984375, -0.41396331787109375, -0.4043426513671875, -0.39472198486328125, -0.385101318359375, -0.37548065185546875, -0.3658599853515625, -0.35623931884765625, -0.34661865234375, -0.33699798583984375, -0.3273773193359375, -0.31775665283203125, -0.308135986328125, -0.29851531982421875, -0.2888946533203125, -0.27927398681640625, -0.2696533203125, -0.26003265380859375, -0.2504119873046875, -0.24079132080078125, -0.231170654296875, -0.22154998779296875, -0.2119293212890625, -0.20230865478515625, -0.19268798828125, -0.18306732177734375, -0.1734466552734375, -0.16382598876953125, -0.154205322265625, -0.14458465576171875, -0.1349639892578125, -0.12534332275390625, -0.11572265625, -0.10610198974609375, -0.0964813232421875, -0.08686065673828125, -0.077239990234375, -0.06761932373046875, -0.0579986572265625, -0.04837799072265625, -0.03875732421875, -0.02913665771484375, -0.0195159912109375, -0.00989532470703125, -0.000274658203125, 0.00934600830078125, 0.0189666748046875, 0.02858734130859375, 0.0382080078125, 0.04782867431640625, 0.0574493408203125, 0.06707000732421875, 0.076690673828125, 0.08631134033203125, 0.0959320068359375, 0.10555267333984375, 0.11517333984375, 0.12479400634765625, 0.1344146728515625, 0.14403533935546875, 0.153656005859375, 0.16327667236328125, 0.1728973388671875, 0.18251800537109375, 0.192138671875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 11.0, 39.0, 38.0, 72.0, 117.0, 299.0, 678.0, 1764.0, 548.0, 231.0, 111.0, 59.0, 30.0, 22.0, 15.0, 17.0, 5.0, 4.0, 3.0, 5.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1043701171875, -0.10172557830810547, -0.09908103942871094, -0.0964365005493164, -0.09379196166992188, -0.09114742279052734, -0.08850288391113281, -0.08585834503173828, -0.08321380615234375, -0.08056926727294922, -0.07792472839355469, -0.07528018951416016, -0.07263565063476562, -0.0699911117553711, -0.06734657287597656, -0.06470203399658203, -0.0620574951171875, -0.05941295623779297, -0.05676841735839844, -0.054123878479003906, -0.051479339599609375, -0.048834800720214844, -0.04619026184082031, -0.04354572296142578, -0.04090118408203125, -0.03825664520263672, -0.03561210632324219, -0.032967567443847656, -0.030323028564453125, -0.027678489685058594, -0.025033950805664062, -0.02238941192626953, -0.019744873046875, -0.01710033416748047, -0.014455795288085938, -0.011811256408691406, -0.009166717529296875, -0.006522178649902344, -0.0038776397705078125, -0.0012331008911132812, 0.00141143798828125, 0.004055976867675781, 0.0067005157470703125, 0.009345054626464844, 0.011989593505859375, 0.014634132385253906, 0.017278671264648438, 0.01992321014404297, 0.0225677490234375, 0.02521228790283203, 0.027856826782226562, 0.030501365661621094, 0.033145904541015625, 0.035790443420410156, 0.03843498229980469, 0.04107952117919922, 0.04372406005859375, 0.04636859893798828, 0.04901313781738281, 0.051657676696777344, 0.054302215576171875, 0.056946754455566406, 0.05959129333496094, 0.06223583221435547, 0.06488037109375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 7.0, 8.0, 34.0, 55.0, 113.0, 167.0, 191.0, 184.0, 123.0, 61.0, 32.0, 18.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.887373685836792, -0.8696142435073853, -0.8518548607826233, -0.8340954780578613, -0.8163360357284546, -0.7985765933990479, -0.7808172106742859, -0.7630578279495239, -0.7452983856201172, -0.7275389432907104, -0.7097795605659485, -0.6920201778411865, -0.6742607355117798, -0.656501293182373, -0.6387419104576111, -0.6209825277328491, -0.6032230854034424, -0.5854636430740356, -0.5677042603492737, -0.5499448776245117, -0.532185435295105, -0.5144259929656982, -0.4966666102409363, -0.47890719771385193, -0.4611477851867676, -0.4433883726596832, -0.4256289601325989, -0.4078695476055145, -0.3901101350784302, -0.3723507225513458, -0.3545913100242615, -0.3368318974971771, -0.319072425365448, -0.30131301283836365, -0.2835536003112793, -0.26579418778419495, -0.2480347752571106, -0.23027536273002625, -0.2125159502029419, -0.19475653767585754, -0.1769971251487732, -0.15923771262168884, -0.1414783000946045, -0.12371888756752014, -0.10595947504043579, -0.08820006251335144, -0.07044064998626709, -0.05268123745918274, -0.03492182493209839, -0.017162412405014038, 0.0005970001220703125, 0.018356412649154663, 0.036115825176239014, 0.053875237703323364, 0.07163465023040771, 0.08939406275749207, 0.10715347528457642, 0.12491288781166077, 0.14267230033874512, 0.16043171286582947, 0.17819112539291382, 0.19595053791999817, 0.21370995044708252, 0.23146936297416687, 0.24922877550125122]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 9.0, 7.0, 11.0, 16.0, 20.0, 26.0, 19.0, 27.0, 36.0, 31.0, 36.0, 39.0, 50.0, 43.0, 57.0, 55.0, 60.0, 55.0, 51.0, 45.0, 48.0, 38.0, 44.0, 36.0, 31.0, 26.0, 21.0, 20.0, 8.0, 12.0, 15.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.33886516094207764, -0.3301357924938202, -0.32140642404556274, -0.3126770555973053, -0.30394768714904785, -0.295218288898468, -0.28648892045021057, -0.2777595520019531, -0.2690301835536957, -0.26030081510543823, -0.2515714466571808, -0.24284206330776215, -0.2341126948595047, -0.22538332641124725, -0.2166539430618286, -0.20792457461357117, -0.19919520616531372, -0.19046583771705627, -0.18173646926879883, -0.1730070859193802, -0.16427771747112274, -0.1555483490228653, -0.14681896567344666, -0.1380895972251892, -0.12936022877693176, -0.12063086032867432, -0.11190148442983627, -0.10317210853099823, -0.09444274008274078, -0.08571337163448334, -0.0769839957356453, -0.06825461983680725, -0.059525251388549805, -0.05079587921500206, -0.042066507041454315, -0.03333713486790657, -0.024607762694358826, -0.01587839052081108, -0.007149018347263336, 0.0015803538262844086, 0.010309725999832153, 0.019039098173379898, 0.027768470346927643, 0.03649784252047539, 0.04522721469402313, 0.05395658686757088, 0.06268595904111862, 0.07141533493995667, 0.08014470338821411, 0.08887407183647156, 0.0976034477353096, 0.10633282363414764, 0.11506219208240509, 0.12379156053066254, 0.13252094388008118, 0.14125031232833862, 0.14997968077659607, 0.15870904922485352, 0.16743841767311096, 0.1761678010225296, 0.18489716947078705, 0.1936265379190445, 0.20235592126846313, 0.21108528971672058, 0.21981465816497803]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 9.0, 12.0, 13.0, 20.0, 28.0, 42.0, 63.0, 143.0, 218.0, 455.0, 1057.0, 3155.0, 9534.0, 33429.0, 134208.0, 532904.0, 251313.0, 58331.0, 15764.0, 4794.0, 1723.0, 682.0, 283.0, 157.0, 79.0, 47.0, 30.0, 25.0, 14.0, 11.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16357421875, -0.1582469940185547, -0.15291976928710938, -0.14759254455566406, -0.14226531982421875, -0.13693809509277344, -0.13161087036132812, -0.1262836456298828, -0.1209564208984375, -0.11562919616699219, -0.11030197143554688, -0.10497474670410156, -0.09964752197265625, -0.09432029724121094, -0.08899307250976562, -0.08366584777832031, -0.078338623046875, -0.07301139831542969, -0.06768417358398438, -0.06235694885253906, -0.05702972412109375, -0.05170249938964844, -0.046375274658203125, -0.04104804992675781, -0.0357208251953125, -0.030393600463867188, -0.025066375732421875, -0.019739151000976562, -0.01441192626953125, -0.009084701538085938, -0.003757476806640625, 0.0015697479248046875, 0.00689697265625, 0.012224197387695312, 0.017551422119140625, 0.022878646850585938, 0.02820587158203125, 0.03353309631347656, 0.038860321044921875, 0.04418754577636719, 0.0495147705078125, 0.05484199523925781, 0.060169219970703125, 0.06549644470214844, 0.07082366943359375, 0.07615089416503906, 0.08147811889648438, 0.08680534362792969, 0.092132568359375, 0.09745979309082031, 0.10278701782226562, 0.10811424255371094, 0.11344146728515625, 0.11876869201660156, 0.12409591674804688, 0.1294231414794922, 0.1347503662109375, 0.1400775909423828, 0.14540481567382812, 0.15073204040527344, 0.15605926513671875, 0.16138648986816406, 0.16671371459960938, 0.1720409393310547, 0.1773681640625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 1.0, 3.0, 5.0, 9.0, 9.0, 9.0, 21.0, 19.0, 24.0, 21.0, 31.0, 32.0, 32.0, 41.0, 42.0, 45.0, 64.0, 37.0, 50.0, 52.0, 57.0, 35.0, 43.0, 36.0, 42.0, 43.0, 29.0, 36.0, 29.0, 14.0, 20.0, 13.0, 13.0, 12.0, 10.0, 2.0, 3.0, 3.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.022735595703125, -0.021979808807373047, -0.021224021911621094, -0.02046823501586914, -0.019712448120117188, -0.018956661224365234, -0.01820087432861328, -0.017445087432861328, -0.016689300537109375, -0.015933513641357422, -0.015177726745605469, -0.014421939849853516, -0.013666152954101562, -0.01291036605834961, -0.012154579162597656, -0.011398792266845703, -0.01064300537109375, -0.009887218475341797, -0.009131431579589844, -0.00837564468383789, -0.0076198577880859375, -0.006864070892333984, -0.006108283996582031, -0.005352497100830078, -0.004596710205078125, -0.003840923309326172, -0.0030851364135742188, -0.0023293495178222656, -0.0015735626220703125, -0.0008177757263183594, -6.198883056640625e-05, 0.0006937980651855469, 0.0014495849609375, 0.002205371856689453, 0.0029611587524414062, 0.0037169456481933594, 0.0044727325439453125, 0.005228519439697266, 0.005984306335449219, 0.006740093231201172, 0.007495880126953125, 0.008251667022705078, 0.009007453918457031, 0.009763240814208984, 0.010519027709960938, 0.01127481460571289, 0.012030601501464844, 0.012786388397216797, 0.01354217529296875, 0.014297962188720703, 0.015053749084472656, 0.01580953598022461, 0.016565322875976562, 0.017321109771728516, 0.01807689666748047, 0.018832683563232422, 0.019588470458984375, 0.020344257354736328, 0.02110004425048828, 0.021855831146240234, 0.022611618041992188, 0.02336740493774414, 0.024123191833496094, 0.024878978729248047, 0.025634765625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 12.0, 9.0, 13.0, 19.0, 36.0, 49.0, 79.0, 143.0, 204.0, 393.0, 663.0, 1198.0, 2698.0, 7775.0, 30163.0, 160099.0, 600739.0, 194326.0, 35498.0, 8427.0, 2953.0, 1334.0, 723.0, 399.0, 222.0, 132.0, 83.0, 42.0, 31.0, 26.0, 19.0, 12.0, 11.0, 6.0, 4.0, 2.0, 2.0, 2.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1611328125, -0.15618324279785156, -0.15123367309570312, -0.1462841033935547, -0.14133453369140625, -0.1363849639892578, -0.13143539428710938, -0.12648582458496094, -0.1215362548828125, -0.11658668518066406, -0.11163711547851562, -0.10668754577636719, -0.10173797607421875, -0.09678840637207031, -0.09183883666992188, -0.08688926696777344, -0.081939697265625, -0.07699012756347656, -0.07204055786132812, -0.06709098815917969, -0.06214141845703125, -0.05719184875488281, -0.052242279052734375, -0.04729270935058594, -0.0423431396484375, -0.03739356994628906, -0.032444000244140625, -0.027494430541992188, -0.02254486083984375, -0.017595291137695312, -0.012645721435546875, -0.0076961517333984375, -0.00274658203125, 0.0022029876708984375, 0.007152557373046875, 0.012102127075195312, 0.01705169677734375, 0.022001266479492188, 0.026950836181640625, 0.03190040588378906, 0.0368499755859375, 0.04179954528808594, 0.046749114990234375, 0.05169868469238281, 0.05664825439453125, 0.06159782409667969, 0.06654739379882812, 0.07149696350097656, 0.076446533203125, 0.08139610290527344, 0.08634567260742188, 0.09129524230957031, 0.09624481201171875, 0.10119438171386719, 0.10614395141601562, 0.11109352111816406, 0.1160430908203125, 0.12099266052246094, 0.12594223022460938, 0.1308917999267578, 0.13584136962890625, 0.1407909393310547, 0.14574050903320312, 0.15069007873535156, 0.1556396484375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 4.0, 5.0, 8.0, 7.0, 12.0, 19.0, 25.0, 27.0, 34.0, 44.0, 53.0, 59.0, 57.0, 60.0, 50.0, 65.0, 64.0, 74.0, 44.0, 36.0, 49.0, 57.0, 35.0, 27.0, 18.0, 15.0, 14.0, 14.0, 9.0, 6.0, 8.0, 5.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1534423828125, -0.14836692810058594, -0.14329147338867188, -0.1382160186767578, -0.13314056396484375, -0.1280651092529297, -0.12298965454101562, -0.11791419982910156, -0.1128387451171875, -0.10776329040527344, -0.10268783569335938, -0.09761238098144531, -0.09253692626953125, -0.08746147155761719, -0.08238601684570312, -0.07731056213378906, -0.072235107421875, -0.06715965270996094, -0.062084197998046875, -0.05700874328613281, -0.05193328857421875, -0.04685783386230469, -0.041782379150390625, -0.03670692443847656, -0.0316314697265625, -0.026556015014648438, -0.021480560302734375, -0.016405105590820312, -0.01132965087890625, -0.0062541961669921875, -0.001178741455078125, 0.0038967132568359375, 0.00897216796875, 0.014047622680664062, 0.019123077392578125, 0.024198532104492188, 0.02927398681640625, 0.03434944152832031, 0.039424896240234375, 0.04450035095214844, 0.0495758056640625, 0.05465126037597656, 0.059726715087890625, 0.06480216979980469, 0.06987762451171875, 0.07495307922363281, 0.08002853393554688, 0.08510398864746094, 0.090179443359375, 0.09525489807128906, 0.10033035278320312, 0.10540580749511719, 0.11048126220703125, 0.11555671691894531, 0.12063217163085938, 0.12570762634277344, 0.1307830810546875, 0.13585853576660156, 0.14093399047851562, 0.1460094451904297, 0.15108489990234375, 0.1561603546142578, 0.16123580932617188, 0.16631126403808594, 0.17138671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 4.0, 7.0, 9.0, 8.0, 15.0, 12.0, 24.0, 43.0, 54.0, 86.0, 129.0, 200.0, 302.0, 549.0, 1008.0, 2048.0, 4927.0, 15675.0, 84839.0, 700337.0, 199235.0, 26005.0, 7247.0, 2726.0, 1306.0, 660.0, 404.0, 216.0, 144.0, 100.0, 67.0, 60.0, 28.0, 24.0, 23.0, 13.0, 11.0, 5.0, 2.0, 5.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.088623046875, -0.08488082885742188, -0.08113861083984375, -0.07739639282226562, -0.0736541748046875, -0.06991195678710938, -0.06616973876953125, -0.062427520751953125, -0.058685302734375, -0.054943084716796875, -0.05120086669921875, -0.047458648681640625, -0.0437164306640625, -0.039974212646484375, -0.03623199462890625, -0.032489776611328125, -0.02874755859375, -0.025005340576171875, -0.02126312255859375, -0.017520904541015625, -0.0137786865234375, -0.010036468505859375, -0.00629425048828125, -0.002552032470703125, 0.001190185546875, 0.004932403564453125, 0.00867462158203125, 0.012416839599609375, 0.0161590576171875, 0.019901275634765625, 0.02364349365234375, 0.027385711669921875, 0.0311279296875, 0.034870147705078125, 0.03861236572265625, 0.042354583740234375, 0.0460968017578125, 0.049839019775390625, 0.05358123779296875, 0.057323455810546875, 0.061065673828125, 0.06480789184570312, 0.06855010986328125, 0.07229232788085938, 0.0760345458984375, 0.07977676391601562, 0.08351898193359375, 0.08726119995117188, 0.09100341796875, 0.09474563598632812, 0.09848785400390625, 0.10223007202148438, 0.1059722900390625, 0.10971450805664062, 0.11345672607421875, 0.11719894409179688, 0.120941162109375, 0.12468338012695312, 0.12842559814453125, 0.13216781616210938, 0.1359100341796875, 0.13965225219726562, 0.14339447021484375, 0.14713668823242188, 0.15087890625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 11.0, 8.0, 7.0, 16.0, 11.0, 12.0, 25.0, 31.0, 41.0, 60.0, 67.0, 74.0, 87.0, 65.0, 72.0, 68.0, 68.0, 64.0, 47.0, 37.0, 32.0, 19.0, 16.0, 15.0, 10.0, 5.0, 9.0, 3.0, 6.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.319450378417969e-05, -7.109809666872025e-05, -6.90016895532608e-05, -6.690528243780136e-05, -6.480887532234192e-05, -6.271246820688248e-05, -6.0616061091423035e-05, -5.851965397596359e-05, -5.642324686050415e-05, -5.432683974504471e-05, -5.2230432629585266e-05, -5.0134025514125824e-05, -4.803761839866638e-05, -4.594121128320694e-05, -4.38448041677475e-05, -4.1748397052288055e-05, -3.965198993682861e-05, -3.755558282136917e-05, -3.545917570590973e-05, -3.336276859045029e-05, -3.1266361474990845e-05, -2.9169954359531403e-05, -2.707354724407196e-05, -2.497714012861252e-05, -2.2880733013153076e-05, -2.0784325897693634e-05, -1.8687918782234192e-05, -1.659151166677475e-05, -1.4495104551315308e-05, -1.2398697435855865e-05, -1.0302290320396423e-05, -8.205883204936981e-06, -6.109476089477539e-06, -4.013068974018097e-06, -1.9166618585586548e-06, 1.7974525690078735e-07, 2.2761523723602295e-06, 4.372559487819672e-06, 6.468966603279114e-06, 8.565373718738556e-06, 1.0661780834197998e-05, 1.275818794965744e-05, 1.4854595065116882e-05, 1.6951002180576324e-05, 1.9047409296035767e-05, 2.114381641149521e-05, 2.324022352695465e-05, 2.5336630642414093e-05, 2.7433037757873535e-05, 2.9529444873332977e-05, 3.162585198879242e-05, 3.372225910425186e-05, 3.5818666219711304e-05, 3.7915073335170746e-05, 4.001148045063019e-05, 4.210788756608963e-05, 4.420429468154907e-05, 4.6300701797008514e-05, 4.8397108912467957e-05, 5.04935160279274e-05, 5.258992314338684e-05, 5.468633025884628e-05, 5.6782737374305725e-05, 5.887914448976517e-05, 6.097555160522461e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 6.0, 3.0, 7.0, 3.0, 11.0, 11.0, 14.0, 30.0, 26.0, 48.0, 84.0, 131.0, 214.0, 330.0, 658.0, 1352.0, 3177.0, 8565.0, 33503.0, 361351.0, 573787.0, 47590.0, 10603.0, 3760.0, 1535.0, 719.0, 403.0, 211.0, 143.0, 95.0, 57.0, 39.0, 23.0, 17.0, 8.0, 14.0, 9.0, 4.0, 4.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11639404296875, -0.11287689208984375, -0.1093597412109375, -0.10584259033203125, -0.102325439453125, -0.09880828857421875, -0.0952911376953125, -0.09177398681640625, -0.0882568359375, -0.08473968505859375, -0.0812225341796875, -0.07770538330078125, -0.074188232421875, -0.07067108154296875, -0.0671539306640625, -0.06363677978515625, -0.06011962890625, -0.05660247802734375, -0.0530853271484375, -0.04956817626953125, -0.046051025390625, -0.04253387451171875, -0.0390167236328125, -0.03549957275390625, -0.031982421875, -0.02846527099609375, -0.0249481201171875, -0.02143096923828125, -0.017913818359375, -0.01439666748046875, -0.0108795166015625, -0.00736236572265625, -0.00384521484375, -0.00032806396484375, 0.0031890869140625, 0.00670623779296875, 0.010223388671875, 0.01374053955078125, 0.0172576904296875, 0.02077484130859375, 0.0242919921875, 0.02780914306640625, 0.0313262939453125, 0.03484344482421875, 0.038360595703125, 0.04187774658203125, 0.0453948974609375, 0.04891204833984375, 0.05242919921875, 0.05594635009765625, 0.0594635009765625, 0.06298065185546875, 0.066497802734375, 0.07001495361328125, 0.0735321044921875, 0.07704925537109375, 0.08056640625, 0.08408355712890625, 0.0876007080078125, 0.09111785888671875, 0.094635009765625, 0.09815216064453125, 0.1016693115234375, 0.10518646240234375, 0.10870361328125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 7.0, 11.0, 6.0, 19.0, 27.0, 25.0, 66.0, 67.0, 121.0, 173.0, 146.0, 94.0, 71.0, 45.0, 29.0, 28.0, 17.0, 13.0, 4.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08807373046875, -0.085479736328125, -0.0828857421875, -0.080291748046875, -0.07769775390625, -0.075103759765625, -0.072509765625, -0.069915771484375, -0.06732177734375, -0.064727783203125, -0.0621337890625, -0.059539794921875, -0.05694580078125, -0.054351806640625, -0.0517578125, -0.049163818359375, -0.04656982421875, -0.043975830078125, -0.0413818359375, -0.038787841796875, -0.03619384765625, -0.033599853515625, -0.031005859375, -0.028411865234375, -0.02581787109375, -0.023223876953125, -0.0206298828125, -0.018035888671875, -0.01544189453125, -0.012847900390625, -0.01025390625, -0.007659912109375, -0.00506591796875, -0.002471923828125, 0.0001220703125, 0.002716064453125, 0.00531005859375, 0.007904052734375, 0.010498046875, 0.013092041015625, 0.01568603515625, 0.018280029296875, 0.0208740234375, 0.023468017578125, 0.02606201171875, 0.028656005859375, 0.03125, 0.033843994140625, 0.03643798828125, 0.039031982421875, 0.0416259765625, 0.044219970703125, 0.04681396484375, 0.049407958984375, 0.052001953125, 0.054595947265625, 0.05718994140625, 0.059783935546875, 0.0623779296875, 0.064971923828125, 0.06756591796875, 0.070159912109375, 0.07275390625, 0.075347900390625, 0.07794189453125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 9.0, 13.0, 25.0, 64.0, 111.0, 207.0, 193.0, 175.0, 94.0, 62.0, 28.0, 13.0, 8.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2362054586410522, -1.1895357370376587, -1.1428661346435547, -1.0961964130401611, -1.0495268106460571, -1.0028570890426636, -0.9561874270439148, -0.909517765045166, -0.8628481030464172, -0.8161784410476685, -0.7695087790489197, -0.7228391170501709, -0.6761693954467773, -0.6294997930526733, -0.5828300714492798, -0.536160409450531, -0.4894907474517822, -0.44282108545303345, -0.39615142345428467, -0.3494817316532135, -0.3028120696544647, -0.25614240765571594, -0.20947271585464478, -0.162803053855896, -0.11613339185714722, -0.06946372240781784, -0.022794052958488464, 0.02387562394142151, 0.07054528594017029, 0.11721494793891907, 0.16388463973999023, 0.210554301738739, 0.2572239637374878, 0.3038936257362366, 0.35056328773498535, 0.3972329795360565, 0.4439026415348053, 0.4905723035335541, 0.5372419953346252, 0.583911657333374, 0.6305813193321228, 0.6772509813308716, 0.7239206433296204, 0.7705903053283691, 0.8172600269317627, 0.8639296293258667, 0.9105993509292603, 0.957269012928009, 1.0039386749267578, 1.0506083965301514, 1.0972779989242554, 1.143947720527649, 1.190617322921753, 1.2372870445251465, 1.28395676612854, 1.330626368522644, 1.377295970916748, 1.4239656925201416, 1.4706352949142456, 1.5173050165176392, 1.5639746189117432, 1.6106443405151367, 1.6573140621185303, 1.7039836645126343, 1.7506533861160278]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 3.0, 4.0, 4.0, 5.0, 8.0, 14.0, 7.0, 22.0, 15.0, 22.0, 34.0, 26.0, 22.0, 31.0, 31.0, 35.0, 42.0, 39.0, 41.0, 56.0, 50.0, 43.0, 54.0, 49.0, 37.0, 42.0, 30.0, 34.0, 27.0, 24.0, 27.0, 28.0, 12.0, 12.0, 14.0, 16.0, 6.0, 10.0, 10.0, 7.0, 2.0, 3.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.763144314289093, -0.741420567035675, -0.7196968197822571, -0.6979730725288391, -0.6762493848800659, -0.654525637626648, -0.63280189037323, -0.611078143119812, -0.589354395866394, -0.5676306486129761, -0.5459069013595581, -0.5241831541061401, -0.5024594068527222, -0.4807356894016266, -0.459011971950531, -0.43728822469711304, -0.41556447744369507, -0.3938407301902771, -0.37211698293685913, -0.35039326548576355, -0.3286695182323456, -0.3069457709789276, -0.28522205352783203, -0.26349830627441406, -0.2417745590209961, -0.22005081176757812, -0.19832707941532135, -0.17660334706306458, -0.1548795998096466, -0.13315585255622864, -0.11143212020397186, -0.08970838785171509, -0.06798464059829712, -0.04626090079545975, -0.024537160992622375, -0.0028134211897850037, 0.018910318613052368, 0.04063405841588974, 0.06235779821872711, 0.08408153057098389, 0.10580527782440186, 0.12752902507781982, 0.1492527574300766, 0.17097648978233337, 0.19270023703575134, 0.2144239842891693, 0.2361477166414261, 0.25787144899368286, 0.27959519624710083, 0.3013189435005188, 0.32304269075393677, 0.34476640820503235, 0.3664901554584503, 0.3882139027118683, 0.40993762016296387, 0.43166136741638184, 0.4533851146697998, 0.4751088619232178, 0.49683260917663574, 0.5185563564300537, 0.5402801036834717, 0.5620037913322449, 0.5837275385856628, 0.6054512858390808, 0.6271750330924988]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 11.0, 6.0, 11.0, 9.0, 12.0, 15.0, 24.0, 20.0, 57.0, 59.0, 77.0, 133.0, 169.0, 251.0, 370.0, 543.0, 828.0, 1466.0, 2372.0, 4175.0, 8034.0, 16961.0, 43740.0, 178132.0, 3435755.0, 388248.0, 66754.0, 23066.0, 10170.0, 5115.0, 2908.0, 1689.0, 1053.0, 655.0, 409.0, 307.0, 173.0, 151.0, 98.0, 83.0, 47.0, 33.0, 23.0, 23.0, 14.0, 9.0, 9.0, 5.0, 4.0, 4.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.107421875, -0.10391998291015625, -0.1004180908203125, -0.09691619873046875, -0.093414306640625, -0.08991241455078125, -0.0864105224609375, -0.08290863037109375, -0.07940673828125, -0.07590484619140625, -0.0724029541015625, -0.06890106201171875, -0.065399169921875, -0.06189727783203125, -0.0583953857421875, -0.05489349365234375, -0.0513916015625, -0.04788970947265625, -0.0443878173828125, -0.04088592529296875, -0.037384033203125, -0.03388214111328125, -0.0303802490234375, -0.02687835693359375, -0.02337646484375, -0.01987457275390625, -0.0163726806640625, -0.01287078857421875, -0.009368896484375, -0.00586700439453125, -0.0023651123046875, 0.00113677978515625, 0.004638671875, 0.00814056396484375, 0.0116424560546875, 0.01514434814453125, 0.018646240234375, 0.02214813232421875, 0.0256500244140625, 0.02915191650390625, 0.03265380859375, 0.03615570068359375, 0.0396575927734375, 0.04315948486328125, 0.046661376953125, 0.05016326904296875, 0.0536651611328125, 0.05716705322265625, 0.0606689453125, 0.06417083740234375, 0.0676727294921875, 0.07117462158203125, 0.074676513671875, 0.07817840576171875, 0.0816802978515625, 0.08518218994140625, 0.08868408203125, 0.09218597412109375, 0.0956878662109375, 0.09918975830078125, 0.102691650390625, 0.10619354248046875, 0.1096954345703125, 0.11319732666015625, 0.11669921875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 13.0, 6.0, 8.0, 10.0, 18.0, 27.0, 20.0, 28.0, 37.0, 27.0, 22.0, 34.0, 53.0, 55.0, 53.0, 50.0, 58.0, 29.0, 43.0, 41.0, 51.0, 49.0, 41.0, 40.0, 34.0, 25.0, 21.0, 22.0, 10.0, 11.0, 12.0, 10.0, 11.0, 8.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.023895263671875, -0.023090362548828125, -0.02228546142578125, -0.021480560302734375, -0.0206756591796875, -0.019870758056640625, -0.01906585693359375, -0.018260955810546875, -0.0174560546875, -0.016651153564453125, -0.01584625244140625, -0.015041351318359375, -0.0142364501953125, -0.013431549072265625, -0.01262664794921875, -0.011821746826171875, -0.011016845703125, -0.010211944580078125, -0.00940704345703125, -0.008602142333984375, -0.0077972412109375, -0.006992340087890625, -0.00618743896484375, -0.005382537841796875, -0.00457763671875, -0.003772735595703125, -0.00296783447265625, -0.002162933349609375, -0.0013580322265625, -0.000553131103515625, 0.00025177001953125, 0.001056671142578125, 0.001861572265625, 0.002666473388671875, 0.00347137451171875, 0.004276275634765625, 0.0050811767578125, 0.005886077880859375, 0.00669097900390625, 0.007495880126953125, 0.00830078125, 0.009105682373046875, 0.00991058349609375, 0.010715484619140625, 0.0115203857421875, 0.012325286865234375, 0.01313018798828125, 0.013935089111328125, 0.014739990234375, 0.015544891357421875, 0.01634979248046875, 0.017154693603515625, 0.0179595947265625, 0.018764495849609375, 0.01956939697265625, 0.020374298095703125, 0.02117919921875, 0.021984100341796875, 0.02278900146484375, 0.023593902587890625, 0.0243988037109375, 0.025203704833984375, 0.02600860595703125, 0.026813507080078125, 0.027618408203125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 1.0, 8.0, 7.0, 22.0, 27.0, 33.0, 47.0, 100.0, 171.0, 311.0, 716.0, 1989.0, 8170.0, 56427.0, 3529340.0, 559708.0, 29017.0, 5372.0, 1566.0, 559.0, 288.0, 172.0, 88.0, 51.0, 27.0, 23.0, 17.0, 8.0, 7.0, 5.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33349609375, -0.3244457244873047, -0.3153953552246094, -0.30634498596191406, -0.29729461669921875, -0.28824424743652344, -0.2791938781738281, -0.2701435089111328, -0.2610931396484375, -0.2520427703857422, -0.24299240112304688, -0.23394203186035156, -0.22489166259765625, -0.21584129333496094, -0.20679092407226562, -0.1977405548095703, -0.188690185546875, -0.1796398162841797, -0.17058944702148438, -0.16153907775878906, -0.15248870849609375, -0.14343833923339844, -0.13438796997070312, -0.1253376007080078, -0.1162872314453125, -0.10723686218261719, -0.09818649291992188, -0.08913612365722656, -0.08008575439453125, -0.07103538513183594, -0.061985015869140625, -0.05293464660644531, -0.04388427734375, -0.03483390808105469, -0.025783538818359375, -0.016733169555664062, -0.00768280029296875, 0.0013675689697265625, 0.010417938232421875, 0.019468307495117188, 0.0285186767578125, 0.03756904602050781, 0.046619415283203125, 0.05566978454589844, 0.06472015380859375, 0.07377052307128906, 0.08282089233398438, 0.09187126159667969, 0.100921630859375, 0.10997200012207031, 0.11902236938476562, 0.12807273864746094, 0.13712310791015625, 0.14617347717285156, 0.15522384643554688, 0.1642742156982422, 0.1733245849609375, 0.1823749542236328, 0.19142532348632812, 0.20047569274902344, 0.20952606201171875, 0.21857643127441406, 0.22762680053710938, 0.2366771697998047, 0.2457275390625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 10.0, 12.0, 16.0, 44.0, 68.0, 107.0, 257.0, 1304.0, 1639.0, 310.0, 141.0, 64.0, 36.0, 26.0, 14.0, 10.0, 2.0, 6.0, 5.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10064697265625, -0.09750652313232422, -0.09436607360839844, -0.09122562408447266, -0.08808517456054688, -0.0849447250366211, -0.08180427551269531, -0.07866382598876953, -0.07552337646484375, -0.07238292694091797, -0.06924247741699219, -0.0661020278930664, -0.06296157836914062, -0.059821128845214844, -0.05668067932128906, -0.05354022979736328, -0.0503997802734375, -0.04725933074951172, -0.04411888122558594, -0.040978431701660156, -0.037837982177734375, -0.034697532653808594, -0.03155708312988281, -0.02841663360595703, -0.02527618408203125, -0.02213573455810547, -0.018995285034179688, -0.015854835510253906, -0.012714385986328125, -0.009573936462402344, -0.0064334869384765625, -0.0032930374145507812, -0.000152587890625, 0.0029878616333007812, 0.0061283111572265625, 0.009268760681152344, 0.012409210205078125, 0.015549659729003906, 0.018690109252929688, 0.02183055877685547, 0.02497100830078125, 0.02811145782470703, 0.03125190734863281, 0.034392356872558594, 0.037532806396484375, 0.040673255920410156, 0.04381370544433594, 0.04695415496826172, 0.0500946044921875, 0.05323505401611328, 0.05637550354003906, 0.059515953063964844, 0.06265640258789062, 0.0657968521118164, 0.06893730163574219, 0.07207775115966797, 0.07521820068359375, 0.07835865020751953, 0.08149909973144531, 0.0846395492553711, 0.08777999877929688, 0.09092044830322266, 0.09406089782714844, 0.09720134735107422, 0.100341796875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 11.0, 23.0, 29.0, 55.0, 88.0, 152.0, 185.0, 155.0, 124.0, 81.0, 52.0, 24.0, 12.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.548175573348999, -0.5317947864532471, -0.5154139995574951, -0.49903321266174316, -0.4826524257659912, -0.46627163887023926, -0.4498908817768097, -0.43351009488105774, -0.4171293079853058, -0.40074852108955383, -0.3843677341938019, -0.3679869472980499, -0.35160619020462036, -0.3352254033088684, -0.31884461641311646, -0.3024638295173645, -0.28608304262161255, -0.2697022557258606, -0.25332146883010864, -0.23694069683551788, -0.22055990993976593, -0.20417912304401398, -0.18779835104942322, -0.17141756415367126, -0.1550367772579193, -0.13865599036216736, -0.122275210916996, -0.10589443147182465, -0.08951364457607269, -0.07313285768032074, -0.056752078235149384, -0.04037129878997803, -0.0239904522895813, -0.007609669119119644, 0.00877111405134201, 0.025151897221803665, 0.04153268039226532, 0.05791346728801727, 0.07429424673318863, 0.09067502617835999, 0.10705581307411194, 0.12343659996986389, 0.13981738686561584, 0.1561981588602066, 0.17257894575595856, 0.1889597326517105, 0.20534050464630127, 0.22172129154205322, 0.23810207843780518, 0.25448286533355713, 0.2708636522293091, 0.28724443912506104, 0.303625226020813, 0.32000601291656494, 0.3363867700099945, 0.35276755690574646, 0.3691483438014984, 0.38552913069725037, 0.4019099175930023, 0.4182907044887543, 0.43467146158218384, 0.4510522484779358, 0.46743303537368774, 0.4838138222694397, 0.5001946091651917]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 5.0, 3.0, 2.0, 4.0, 3.0, 4.0, 6.0, 7.0, 10.0, 10.0, 9.0, 18.0, 15.0, 21.0, 16.0, 12.0, 21.0, 18.0, 25.0, 25.0, 21.0, 22.0, 30.0, 39.0, 35.0, 26.0, 32.0, 31.0, 36.0, 35.0, 25.0, 29.0, 24.0, 33.0, 30.0, 41.0, 31.0, 32.0, 34.0, 27.0, 13.0, 18.0, 15.0, 14.0, 13.0, 14.0, 16.0, 12.0, 13.0, 6.0, 3.0, 6.0, 4.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.17574048042297363, -0.1703668087720871, -0.16499315202236176, -0.15961948037147522, -0.15424582362174988, -0.14887215197086334, -0.1434984803199768, -0.13812482357025146, -0.13275116682052612, -0.1273774951696396, -0.12200383841991425, -0.11663016676902771, -0.11125651001930237, -0.10588283836841583, -0.1005091741681099, -0.09513550996780396, -0.08976183831691742, -0.08438817411661148, -0.07901450991630554, -0.073640838265419, -0.06826718151569366, -0.06289350986480713, -0.05751984566450119, -0.05214618146419525, -0.04677251726388931, -0.041398853063583374, -0.036025188863277435, -0.030651520937681198, -0.02527785673737526, -0.01990419253706932, -0.014530524611473083, -0.009156860411167145, -0.003783196210861206, 0.0015904689207673073, 0.006964134052395821, 0.012337800115346909, 0.017711464315652847, 0.023085128515958786, 0.028458796441555023, 0.03383246064186096, 0.0392061248421669, 0.04457978904247284, 0.04995345324277878, 0.055327121168375015, 0.060700785368680954, 0.0660744458436966, 0.07144811749458313, 0.07682178169488907, 0.08219544589519501, 0.08756911009550095, 0.09294277429580688, 0.09831644594669342, 0.10369010269641876, 0.1090637743473053, 0.11443743854761124, 0.11981110274791718, 0.1251847743988037, 0.13055844604969025, 0.1359321027994156, 0.14130577445030212, 0.14667943120002747, 0.152053102850914, 0.15742677450180054, 0.16280043125152588, 0.16817408800125122]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 9.0, 12.0, 10.0, 14.0, 19.0, 49.0, 58.0, 68.0, 98.0, 148.0, 229.0, 373.0, 528.0, 868.0, 1283.0, 2076.0, 3251.0, 5304.0, 8896.0, 14797.0, 25464.0, 44707.0, 80797.0, 151192.0, 257682.0, 202762.0, 107315.0, 58898.0, 33389.0, 19409.0, 11096.0, 6666.0, 4072.0, 2494.0, 1550.0, 994.0, 637.0, 456.0, 266.0, 177.0, 148.0, 95.0, 53.0, 43.0, 23.0, 31.0, 14.0, 15.0, 10.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0748291015625, -0.07239437103271484, -0.06995964050292969, -0.06752490997314453, -0.06509017944335938, -0.06265544891357422, -0.06022071838378906, -0.057785987854003906, -0.05535125732421875, -0.052916526794433594, -0.05048179626464844, -0.04804706573486328, -0.045612335205078125, -0.04317760467529297, -0.04074287414550781, -0.038308143615722656, -0.0358734130859375, -0.033438682556152344, -0.031003952026367188, -0.02856922149658203, -0.026134490966796875, -0.02369976043701172, -0.021265029907226562, -0.018830299377441406, -0.01639556884765625, -0.013960838317871094, -0.011526107788085938, -0.009091377258300781, -0.006656646728515625, -0.004221916198730469, -0.0017871856689453125, 0.0006475448608398438, 0.003082275390625, 0.005517005920410156, 0.007951736450195312, 0.010386466979980469, 0.012821197509765625, 0.015255928039550781, 0.017690658569335938, 0.020125389099121094, 0.02256011962890625, 0.024994850158691406, 0.027429580688476562, 0.02986431121826172, 0.032299041748046875, 0.03473377227783203, 0.03716850280761719, 0.039603233337402344, 0.0420379638671875, 0.044472694396972656, 0.04690742492675781, 0.04934215545654297, 0.051776885986328125, 0.05421161651611328, 0.05664634704589844, 0.059081077575683594, 0.06151580810546875, 0.0639505386352539, 0.06638526916503906, 0.06881999969482422, 0.07125473022460938, 0.07368946075439453, 0.07612419128417969, 0.07855892181396484, 0.08099365234375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 6.0, 6.0, 13.0, 5.0, 12.0, 17.0, 25.0, 17.0, 36.0, 34.0, 36.0, 38.0, 38.0, 45.0, 42.0, 59.0, 64.0, 52.0, 48.0, 41.0, 51.0, 38.0, 43.0, 33.0, 34.0, 27.0, 26.0, 19.0, 19.0, 16.0, 9.0, 19.0, 10.0, 4.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0289764404296875, -0.028099775314331055, -0.02722311019897461, -0.026346445083618164, -0.02546977996826172, -0.024593114852905273, -0.023716449737548828, -0.022839784622192383, -0.021963119506835938, -0.021086454391479492, -0.020209789276123047, -0.0193331241607666, -0.018456459045410156, -0.01757979393005371, -0.016703128814697266, -0.01582646369934082, -0.014949798583984375, -0.01407313346862793, -0.013196468353271484, -0.012319803237915039, -0.011443138122558594, -0.010566473007202148, -0.009689807891845703, -0.008813142776489258, -0.007936477661132812, -0.007059812545776367, -0.006183147430419922, -0.0053064823150634766, -0.004429817199707031, -0.003553152084350586, -0.0026764869689941406, -0.0017998218536376953, -0.00092315673828125, -4.649162292480469e-05, 0.0008301734924316406, 0.001706838607788086, 0.0025835037231445312, 0.0034601688385009766, 0.004336833953857422, 0.005213499069213867, 0.0060901641845703125, 0.006966829299926758, 0.007843494415283203, 0.008720159530639648, 0.009596824645996094, 0.010473489761352539, 0.011350154876708984, 0.01222681999206543, 0.013103485107421875, 0.01398015022277832, 0.014856815338134766, 0.01573348045349121, 0.016610145568847656, 0.0174868106842041, 0.018363475799560547, 0.019240140914916992, 0.020116806030273438, 0.020993471145629883, 0.021870136260986328, 0.022746801376342773, 0.02362346649169922, 0.024500131607055664, 0.02537679672241211, 0.026253461837768555, 0.027130126953125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 7.0, 8.0, 6.0, 19.0, 21.0, 34.0, 30.0, 56.0, 63.0, 87.0, 114.0, 119.0, 215.0, 307.0, 486.0, 719.0, 1236.0, 2518.0, 6826.0, 23396.0, 99421.0, 451407.0, 356800.0, 75475.0, 18092.0, 5508.0, 2227.0, 1116.0, 674.0, 444.0, 309.0, 219.0, 168.0, 107.0, 72.0, 59.0, 55.0, 26.0, 31.0, 20.0, 14.0, 12.0, 8.0, 8.0, 10.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1510009765625, -0.1462688446044922, -0.14153671264648438, -0.13680458068847656, -0.13207244873046875, -0.12734031677246094, -0.12260818481445312, -0.11787605285644531, -0.1131439208984375, -0.10841178894042969, -0.10367965698242188, -0.09894752502441406, -0.09421539306640625, -0.08948326110839844, -0.08475112915039062, -0.08001899719238281, -0.075286865234375, -0.07055473327636719, -0.06582260131835938, -0.06109046936035156, -0.05635833740234375, -0.05162620544433594, -0.046894073486328125, -0.04216194152832031, -0.0374298095703125, -0.03269767761230469, -0.027965545654296875, -0.023233413696289062, -0.01850128173828125, -0.013769149780273438, -0.009037017822265625, -0.0043048858642578125, 0.00042724609375, 0.0051593780517578125, 0.009891510009765625, 0.014623641967773438, 0.01935577392578125, 0.024087905883789062, 0.028820037841796875, 0.03355216979980469, 0.0382843017578125, 0.04301643371582031, 0.047748565673828125, 0.05248069763183594, 0.05721282958984375, 0.06194496154785156, 0.06667709350585938, 0.07140922546386719, 0.076141357421875, 0.08087348937988281, 0.08560562133789062, 0.09033775329589844, 0.09506988525390625, 0.09980201721191406, 0.10453414916992188, 0.10926628112792969, 0.1139984130859375, 0.11873054504394531, 0.12346267700195312, 0.12819480895996094, 0.13292694091796875, 0.13765907287597656, 0.14239120483398438, 0.1471233367919922, 0.15185546875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 7.0, 7.0, 7.0, 13.0, 16.0, 12.0, 18.0, 17.0, 18.0, 23.0, 20.0, 30.0, 25.0, 38.0, 41.0, 34.0, 33.0, 41.0, 52.0, 42.0, 37.0, 38.0, 43.0, 38.0, 46.0, 36.0, 31.0, 30.0, 28.0, 30.0, 30.0, 23.0, 17.0, 13.0, 12.0, 9.0, 16.0, 7.0, 7.0, 5.0, 4.0, 2.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.127197265625, -0.12349224090576172, -0.11978721618652344, -0.11608219146728516, -0.11237716674804688, -0.1086721420288086, -0.10496711730957031, -0.10126209259033203, -0.09755706787109375, -0.09385204315185547, -0.09014701843261719, -0.0864419937133789, -0.08273696899414062, -0.07903194427490234, -0.07532691955566406, -0.07162189483642578, -0.0679168701171875, -0.06421184539794922, -0.06050682067871094, -0.056801795959472656, -0.053096771240234375, -0.049391746520996094, -0.04568672180175781, -0.04198169708251953, -0.03827667236328125, -0.03457164764404297, -0.030866622924804688, -0.027161598205566406, -0.023456573486328125, -0.019751548767089844, -0.016046524047851562, -0.012341499328613281, -0.008636474609375, -0.004931449890136719, -0.0012264251708984375, 0.0024785995483398438, 0.006183624267578125, 0.009888648986816406, 0.013593673706054688, 0.01729869842529297, 0.02100372314453125, 0.02470874786376953, 0.028413772583007812, 0.032118797302246094, 0.035823822021484375, 0.039528846740722656, 0.04323387145996094, 0.04693889617919922, 0.0506439208984375, 0.05434894561767578, 0.05805397033691406, 0.061758995056152344, 0.06546401977539062, 0.0691690444946289, 0.07287406921386719, 0.07657909393310547, 0.08028411865234375, 0.08398914337158203, 0.08769416809082031, 0.0913991928100586, 0.09510421752929688, 0.09880924224853516, 0.10251426696777344, 0.10621929168701172, 0.10992431640625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 8.0, 14.0, 18.0, 26.0, 58.0, 84.0, 147.0, 243.0, 463.0, 897.0, 1927.0, 4495.0, 11791.0, 37726.0, 168259.0, 557905.0, 199515.0, 42744.0, 13151.0, 4863.0, 2108.0, 976.0, 508.0, 263.0, 145.0, 75.0, 48.0, 35.0, 15.0, 8.0, 12.0, 11.0, 8.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07574462890625, -0.07309150695800781, -0.07043838500976562, -0.06778526306152344, -0.06513214111328125, -0.06247901916503906, -0.059825897216796875, -0.05717277526855469, -0.0545196533203125, -0.05186653137207031, -0.049213409423828125, -0.04656028747558594, -0.04390716552734375, -0.04125404357910156, -0.038600921630859375, -0.03594779968261719, -0.033294677734375, -0.030641555786132812, -0.027988433837890625, -0.025335311889648438, -0.02268218994140625, -0.020029067993164062, -0.017375946044921875, -0.014722824096679688, -0.0120697021484375, -0.009416580200195312, -0.006763458251953125, -0.0041103363037109375, -0.00145721435546875, 0.0011959075927734375, 0.003849029541015625, 0.0065021514892578125, 0.0091552734375, 0.011808395385742188, 0.014461517333984375, 0.017114639282226562, 0.01976776123046875, 0.022420883178710938, 0.025074005126953125, 0.027727127075195312, 0.0303802490234375, 0.03303337097167969, 0.035686492919921875, 0.03833961486816406, 0.04099273681640625, 0.04364585876464844, 0.046298980712890625, 0.04895210266113281, 0.051605224609375, 0.05425834655761719, 0.056911468505859375, 0.05956459045410156, 0.06221771240234375, 0.06487083435058594, 0.06752395629882812, 0.07017707824707031, 0.0728302001953125, 0.07548332214355469, 0.07813644409179688, 0.08078956604003906, 0.08344268798828125, 0.08609580993652344, 0.08874893188476562, 0.09140205383300781, 0.09405517578125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 5.0, 6.0, 8.0, 14.0, 18.0, 18.0, 22.0, 37.0, 39.0, 50.0, 51.0, 57.0, 63.0, 64.0, 82.0, 60.0, 60.0, 63.0, 48.0, 47.0, 38.0, 20.0, 30.0, 30.0, 19.0, 11.0, 10.0, 5.0, 3.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.220008850097656e-05, -4.048086702823639e-05, -3.8761645555496216e-05, -3.704242408275604e-05, -3.532320261001587e-05, -3.3603981137275696e-05, -3.188475966453552e-05, -3.016553819179535e-05, -2.8446316719055176e-05, -2.6727095246315002e-05, -2.500787377357483e-05, -2.3288652300834656e-05, -2.1569430828094482e-05, -1.985020935535431e-05, -1.8130987882614136e-05, -1.6411766409873962e-05, -1.4692544937133789e-05, -1.2973323464393616e-05, -1.1254101991653442e-05, -9.534880518913269e-06, -7.815659046173096e-06, -6.096437573432922e-06, -4.377216100692749e-06, -2.6579946279525757e-06, -9.387731552124023e-07, 7.80448317527771e-07, 2.4996697902679443e-06, 4.218891263008118e-06, 5.938112735748291e-06, 7.657334208488464e-06, 9.376555681228638e-06, 1.1095777153968811e-05, 1.2814998626708984e-05, 1.4534220099449158e-05, 1.625344157218933e-05, 1.7972663044929504e-05, 1.9691884517669678e-05, 2.141110599040985e-05, 2.3130327463150024e-05, 2.4849548935890198e-05, 2.656877040863037e-05, 2.8287991881370544e-05, 3.0007213354110718e-05, 3.172643482685089e-05, 3.3445656299591064e-05, 3.516487777233124e-05, 3.688409924507141e-05, 3.8603320717811584e-05, 4.032254219055176e-05, 4.204176366329193e-05, 4.3760985136032104e-05, 4.548020660877228e-05, 4.719942808151245e-05, 4.8918649554252625e-05, 5.06378710269928e-05, 5.235709249973297e-05, 5.4076313972473145e-05, 5.579553544521332e-05, 5.751475691795349e-05, 5.9233978390693665e-05, 6.095319986343384e-05, 6.267242133617401e-05, 6.439164280891418e-05, 6.611086428165436e-05, 6.783008575439453e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 9.0, 4.0, 10.0, 12.0, 19.0, 32.0, 35.0, 53.0, 75.0, 129.0, 164.0, 267.0, 470.0, 877.0, 1814.0, 4547.0, 13858.0, 54879.0, 348403.0, 511859.0, 81789.0, 18717.0, 5866.0, 2240.0, 1019.0, 521.0, 304.0, 201.0, 123.0, 74.0, 55.0, 41.0, 32.0, 20.0, 12.0, 7.0, 4.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07958984375, -0.07685661315917969, -0.07412338256835938, -0.07139015197753906, -0.06865692138671875, -0.06592369079589844, -0.06319046020507812, -0.06045722961425781, -0.0577239990234375, -0.05499076843261719, -0.052257537841796875, -0.04952430725097656, -0.04679107666015625, -0.04405784606933594, -0.041324615478515625, -0.03859138488769531, -0.035858154296875, -0.03312492370605469, -0.030391693115234375, -0.027658462524414062, -0.02492523193359375, -0.022192001342773438, -0.019458770751953125, -0.016725540161132812, -0.0139923095703125, -0.011259078979492188, -0.008525848388671875, -0.0057926177978515625, -0.00305938720703125, -0.0003261566162109375, 0.002407073974609375, 0.0051403045654296875, 0.00787353515625, 0.010606765747070312, 0.013339996337890625, 0.016073226928710938, 0.01880645751953125, 0.021539688110351562, 0.024272918701171875, 0.027006149291992188, 0.0297393798828125, 0.03247261047363281, 0.035205841064453125, 0.03793907165527344, 0.04067230224609375, 0.04340553283691406, 0.046138763427734375, 0.04887199401855469, 0.051605224609375, 0.05433845520019531, 0.057071685791015625, 0.05980491638183594, 0.06253814697265625, 0.06527137756347656, 0.06800460815429688, 0.07073783874511719, 0.0734710693359375, 0.07620429992675781, 0.07893753051757812, 0.08167076110839844, 0.08440399169921875, 0.08713722229003906, 0.08987045288085938, 0.09260368347167969, 0.0953369140625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 1.0, 13.0, 8.0, 8.0, 8.0, 19.0, 21.0, 35.0, 31.0, 35.0, 63.0, 79.0, 78.0, 92.0, 105.0, 79.0, 78.0, 49.0, 49.0, 38.0, 19.0, 15.0, 12.0, 15.0, 9.0, 5.0, 4.0, 3.0, 4.0, 5.0, 2.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.059661865234375, -0.05780172348022461, -0.05594158172607422, -0.05408143997192383, -0.05222129821777344, -0.05036115646362305, -0.048501014709472656, -0.046640872955322266, -0.044780731201171875, -0.042920589447021484, -0.041060447692871094, -0.0392003059387207, -0.03734016418457031, -0.03548002243041992, -0.03361988067626953, -0.03175973892211914, -0.02989959716796875, -0.02803945541381836, -0.02617931365966797, -0.024319171905517578, -0.022459030151367188, -0.020598888397216797, -0.018738746643066406, -0.016878604888916016, -0.015018463134765625, -0.013158321380615234, -0.011298179626464844, -0.009438037872314453, -0.0075778961181640625, -0.005717754364013672, -0.0038576126098632812, -0.0019974708557128906, -0.0001373291015625, 0.0017228126525878906, 0.0035829544067382812, 0.005443096160888672, 0.0073032379150390625, 0.009163379669189453, 0.011023521423339844, 0.012883663177490234, 0.014743804931640625, 0.016603946685791016, 0.018464088439941406, 0.020324230194091797, 0.022184371948242188, 0.024044513702392578, 0.02590465545654297, 0.02776479721069336, 0.02962493896484375, 0.03148508071899414, 0.03334522247314453, 0.03520536422729492, 0.03706550598144531, 0.0389256477355957, 0.040785789489746094, 0.042645931243896484, 0.044506072998046875, 0.046366214752197266, 0.048226356506347656, 0.05008649826049805, 0.05194664001464844, 0.05380678176879883, 0.05566692352294922, 0.05752706527709961, 0.05938720703125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 8.0, 26.0, 52.0, 100.0, 178.0, 189.0, 187.0, 125.0, 70.0, 36.0, 13.0, 11.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.8133844137191772, -1.7654263973236084, -1.717468500137329, -1.6695106029510498, -1.621552586555481, -1.573594570159912, -1.5256366729736328, -1.4776787757873535, -1.4297207593917847, -1.3817627429962158, -1.3338048458099365, -1.2858469486236572, -1.2378889322280884, -1.1899309158325195, -1.1419730186462402, -1.094015121459961, -1.046057105064392, -0.998099148273468, -0.950141191482544, -0.9021832346916199, -0.8542252779006958, -0.8062673211097717, -0.7583093643188477, -0.7103514075279236, -0.6623934507369995, -0.6144354939460754, -0.5664775371551514, -0.5185195803642273, -0.4705616235733032, -0.42260366678237915, -0.3746457099914551, -0.326687753200531, -0.2787296772003174, -0.2307717204093933, -0.18281376361846924, -0.13485580682754517, -0.0868978500366211, -0.03893989324569702, 0.00901806354522705, 0.05697602033615112, 0.1049339771270752, 0.15289193391799927, 0.20084989070892334, 0.2488078474998474, 0.2967658042907715, 0.34472376108169556, 0.39268171787261963, 0.4406396746635437, 0.4885976314544678, 0.5365555882453918, 0.5845135450363159, 0.63247150182724, 0.6804294586181641, 0.7283874154090881, 0.7763453722000122, 0.8243033289909363, 0.8722612857818604, 0.9202192425727844, 0.9681771993637085, 1.0161352157592773, 1.0640931129455566, 1.112051010131836, 1.1600090265274048, 1.2079670429229736, 1.255924940109253]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 7.0, 8.0, 7.0, 7.0, 7.0, 9.0, 5.0, 16.0, 14.0, 23.0, 16.0, 22.0, 29.0, 19.0, 29.0, 29.0, 34.0, 54.0, 32.0, 24.0, 39.0, 41.0, 39.0, 43.0, 42.0, 42.0, 40.0, 31.0, 43.0, 25.0, 23.0, 29.0, 21.0, 31.0, 16.0, 22.0, 15.0, 16.0, 7.0, 14.0, 5.0, 7.0, 6.0, 4.0, 2.0, 5.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.646960437297821, -0.6269792914390564, -0.6069981455802917, -0.5870169997215271, -0.5670359134674072, -0.5470547676086426, -0.5270736217498779, -0.5070924758911133, -0.48711133003234863, -0.467130184173584, -0.44714903831481934, -0.4271679222583771, -0.4071867763996124, -0.3872056305408478, -0.3672245144844055, -0.34724336862564087, -0.3272622227668762, -0.3072810769081116, -0.2872999310493469, -0.26731881499290466, -0.24733766913414001, -0.22735652327537537, -0.2073753923177719, -0.18739426136016846, -0.1674131155014038, -0.14743196964263916, -0.1274508386850357, -0.10746970027685165, -0.0874885618686676, -0.06750742346048355, -0.0475262850522995, -0.027545154094696045, -0.007563948631286621, 0.01241718977689743, 0.03239832818508148, 0.05237946659326553, 0.07236060500144958, 0.09234174340963364, 0.11232288181781769, 0.13230401277542114, 0.1522851586341858, 0.17226630449295044, 0.1922474354505539, 0.21222856640815735, 0.232209712266922, 0.25219085812568665, 0.2721719741821289, 0.29215312004089355, 0.3121342658996582, 0.33211541175842285, 0.3520965576171875, 0.37207767367362976, 0.3920588195323944, 0.41203996539115906, 0.4320210814476013, 0.45200222730636597, 0.4719833731651306, 0.49196451902389526, 0.5119456648826599, 0.5319268107414246, 0.5519078969955444, 0.5718890428543091, 0.5918701887130737, 0.6118513345718384, 0.631832480430603]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 7.0, 13.0, 15.0, 14.0, 29.0, 33.0, 64.0, 71.0, 137.0, 170.0, 265.0, 436.0, 704.0, 1161.0, 2074.0, 3739.0, 7716.0, 18809.0, 52989.0, 232675.0, 3371801.0, 387146.0, 70670.0, 23130.0, 9610.0, 4602.0, 2451.0, 1366.0, 862.0, 463.0, 312.0, 232.0, 154.0, 95.0, 86.0, 56.0, 42.0, 30.0, 17.0, 8.0, 6.0, 4.0, 5.0, 2.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.114990234375, -0.11123466491699219, -0.10747909545898438, -0.10372352600097656, -0.09996795654296875, -0.09621238708496094, -0.09245681762695312, -0.08870124816894531, -0.0849456787109375, -0.08119010925292969, -0.07743453979492188, -0.07367897033691406, -0.06992340087890625, -0.06616783142089844, -0.062412261962890625, -0.05865669250488281, -0.054901123046875, -0.05114555358886719, -0.047389984130859375, -0.04363441467285156, -0.03987884521484375, -0.03612327575683594, -0.032367706298828125, -0.028612136840820312, -0.0248565673828125, -0.021100997924804688, -0.017345428466796875, -0.013589859008789062, -0.00983428955078125, -0.0060787200927734375, -0.002323150634765625, 0.0014324188232421875, 0.00518798828125, 0.008943557739257812, 0.012699127197265625, 0.016454696655273438, 0.02021026611328125, 0.023965835571289062, 0.027721405029296875, 0.03147697448730469, 0.0352325439453125, 0.03898811340332031, 0.042743682861328125, 0.04649925231933594, 0.05025482177734375, 0.05401039123535156, 0.057765960693359375, 0.06152153015136719, 0.065277099609375, 0.06903266906738281, 0.07278823852539062, 0.07654380798339844, 0.08029937744140625, 0.08405494689941406, 0.08781051635742188, 0.09156608581542969, 0.0953216552734375, 0.09907722473144531, 0.10283279418945312, 0.10658836364746094, 0.11034393310546875, 0.11409950256347656, 0.11785507202148438, 0.12161064147949219, 0.1253662109375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 11.0, 6.0, 11.0, 13.0, 19.0, 23.0, 31.0, 18.0, 41.0, 49.0, 40.0, 65.0, 60.0, 53.0, 54.0, 44.0, 63.0, 47.0, 56.0, 41.0, 45.0, 42.0, 31.0, 32.0, 26.0, 13.0, 16.0, 12.0, 15.0, 10.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0243072509765625, -0.023263216018676758, -0.022219181060791016, -0.021175146102905273, -0.02013111114501953, -0.01908707618713379, -0.018043041229248047, -0.016999006271362305, -0.015954971313476562, -0.01491093635559082, -0.013866901397705078, -0.012822866439819336, -0.011778831481933594, -0.010734796524047852, -0.00969076156616211, -0.008646726608276367, -0.007602691650390625, -0.006558656692504883, -0.005514621734619141, -0.0044705867767333984, -0.0034265518188476562, -0.002382516860961914, -0.0013384819030761719, -0.0002944469451904297, 0.0007495880126953125, 0.0017936229705810547, 0.002837657928466797, 0.003881692886352539, 0.004925727844238281, 0.0059697628021240234, 0.007013797760009766, 0.008057832717895508, 0.00910186767578125, 0.010145902633666992, 0.011189937591552734, 0.012233972549438477, 0.013278007507324219, 0.014322042465209961, 0.015366077423095703, 0.016410112380981445, 0.017454147338867188, 0.01849818229675293, 0.019542217254638672, 0.020586252212524414, 0.021630287170410156, 0.0226743221282959, 0.02371835708618164, 0.024762392044067383, 0.025806427001953125, 0.026850461959838867, 0.02789449691772461, 0.02893853187561035, 0.029982566833496094, 0.031026601791381836, 0.03207063674926758, 0.03311467170715332, 0.03415870666503906, 0.035202741622924805, 0.03624677658081055, 0.03729081153869629, 0.03833484649658203, 0.03937888145446777, 0.040422916412353516, 0.04146695137023926, 0.042510986328125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 8.0, 7.0, 16.0, 24.0, 32.0, 63.0, 101.0, 159.0, 323.0, 591.0, 1485.0, 4545.0, 22073.0, 230034.0, 3750998.0, 159739.0, 17547.0, 3881.0, 1369.0, 564.0, 327.0, 157.0, 98.0, 63.0, 36.0, 18.0, 11.0, 2.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2359619140625, -0.22736167907714844, -0.21876144409179688, -0.2101612091064453, -0.20156097412109375, -0.1929607391357422, -0.18436050415039062, -0.17576026916503906, -0.1671600341796875, -0.15855979919433594, -0.14995956420898438, -0.1413593292236328, -0.13275909423828125, -0.12415885925292969, -0.11555862426757812, -0.10695838928222656, -0.098358154296875, -0.08975791931152344, -0.08115768432617188, -0.07255744934082031, -0.06395721435546875, -0.05535697937011719, -0.046756744384765625, -0.03815650939941406, -0.0295562744140625, -0.020956039428710938, -0.012355804443359375, -0.0037555694580078125, 0.00484466552734375, 0.013444900512695312, 0.022045135498046875, 0.030645370483398438, 0.03924560546875, 0.04784584045410156, 0.056446075439453125, 0.06504631042480469, 0.07364654541015625, 0.08224678039550781, 0.09084701538085938, 0.09944725036621094, 0.1080474853515625, 0.11664772033691406, 0.12524795532226562, 0.1338481903076172, 0.14244842529296875, 0.1510486602783203, 0.15964889526367188, 0.16824913024902344, 0.176849365234375, 0.18544960021972656, 0.19404983520507812, 0.2026500701904297, 0.21125030517578125, 0.2198505401611328, 0.22845077514648438, 0.23705101013183594, 0.2456512451171875, 0.25425148010253906, 0.2628517150878906, 0.2714519500732422, 0.28005218505859375, 0.2886524200439453, 0.2972526550292969, 0.30585289001464844, 0.314453125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 6.0, 2.0, 1.0, 9.0, 15.0, 13.0, 19.0, 36.0, 32.0, 61.0, 96.0, 146.0, 326.0, 897.0, 1385.0, 454.0, 201.0, 131.0, 76.0, 47.0, 47.0, 19.0, 18.0, 11.0, 10.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07666015625, -0.07394027709960938, -0.07122039794921875, -0.06850051879882812, -0.0657806396484375, -0.06306076049804688, -0.06034088134765625, -0.057621002197265625, -0.054901123046875, -0.052181243896484375, -0.04946136474609375, -0.046741485595703125, -0.0440216064453125, -0.041301727294921875, -0.03858184814453125, -0.035861968994140625, -0.03314208984375, -0.030422210693359375, -0.02770233154296875, -0.024982452392578125, -0.0222625732421875, -0.019542694091796875, -0.01682281494140625, -0.014102935791015625, -0.011383056640625, -0.008663177490234375, -0.00594329833984375, -0.003223419189453125, -0.0005035400390625, 0.002216339111328125, 0.00493621826171875, 0.007656097412109375, 0.0103759765625, 0.013095855712890625, 0.01581573486328125, 0.018535614013671875, 0.0212554931640625, 0.023975372314453125, 0.02669525146484375, 0.029415130615234375, 0.032135009765625, 0.034854888916015625, 0.03757476806640625, 0.040294647216796875, 0.0430145263671875, 0.045734405517578125, 0.04845428466796875, 0.051174163818359375, 0.05389404296875, 0.056613922119140625, 0.05933380126953125, 0.062053680419921875, 0.0647735595703125, 0.06749343872070312, 0.07021331787109375, 0.07293319702148438, 0.075653076171875, 0.07837295532226562, 0.08109283447265625, 0.08381271362304688, 0.0865325927734375, 0.08925247192382812, 0.09197235107421875, 0.09469223022460938, 0.097412109375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 8.0, 8.0, 46.0, 224.0, 376.0, 252.0, 73.0, 19.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3516697883605957, -1.3043086528778076, -1.256947636604309, -1.209586501121521, -1.1622254848480225, -1.1148643493652344, -1.0675033330917358, -1.0201421976089478, -0.9727811813354492, -0.9254201054573059, -0.8780590295791626, -0.8306979537010193, -0.783336877822876, -0.7359758019447327, -0.6886147260665894, -0.6412535905838013, -0.593892514705658, -0.5465314388275146, -0.49917036294937134, -0.451809287071228, -0.4044482111930847, -0.3570871353149414, -0.3097260296344757, -0.2623649537563324, -0.2150038778781891, -0.16764280200004578, -0.12028171867132187, -0.07292063534259796, -0.02555955946445465, 0.02180151641368866, 0.06916260719299316, 0.11652368307113647, 0.16388475894927979, 0.2112458348274231, 0.2586069107055664, 0.3059679865837097, 0.353329062461853, 0.40069013833999634, 0.44805124402046204, 0.49541231989860535, 0.5427733659744263, 0.5901344418525696, 0.6374955177307129, 0.6848565936088562, 0.7322176694869995, 0.7795787453651428, 0.8269398212432861, 0.8743009567260742, 0.9216620326042175, 0.9690231084823608, 1.016384243965149, 1.0637452602386475, 1.1111063957214355, 1.158467411994934, 1.2058285474777222, 1.2531895637512207, 1.3005506992340088, 1.3479118347167969, 1.3952728509902954, 1.4426339864730835, 1.489995002746582, 1.5373561382293701, 1.5847171545028687, 1.6320782899856567, 1.6794393062591553]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 4.0, 10.0, 12.0, 17.0, 19.0, 16.0, 24.0, 33.0, 28.0, 29.0, 42.0, 46.0, 30.0, 46.0, 50.0, 50.0, 46.0, 40.0, 55.0, 42.0, 48.0, 41.0, 48.0, 40.0, 19.0, 37.0, 14.0, 19.0, 18.0, 18.0, 10.0, 13.0, 9.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.3421061038970947, -0.3330096900463104, -0.3239132761955261, -0.31481683254241943, -0.30572041869163513, -0.29662400484085083, -0.28752759099006653, -0.2784311771392822, -0.26933473348617554, -0.26023831963539124, -0.25114190578460693, -0.24204547703266144, -0.23294904828071594, -0.22385263442993164, -0.21475622057914734, -0.20565979182720184, -0.19656337797641754, -0.18746696412563324, -0.17837053537368774, -0.16927412152290344, -0.16017769277095795, -0.15108127892017365, -0.14198485016822815, -0.13288843631744385, -0.12379201501607895, -0.11469559371471405, -0.10559917241334915, -0.09650275111198425, -0.08740633726119995, -0.07830990850925446, -0.06921349465847015, -0.060117073357105255, -0.051020652055740356, -0.04192423075437546, -0.03282780945301056, -0.02373139187693596, -0.01463497057557106, -0.0055385492742061615, 0.0035578683018684387, 0.012654289603233337, 0.021750710904598236, 0.030847132205963135, 0.03994355350732803, 0.049039971083402634, 0.05813639238476753, 0.06723281741142273, 0.07632923126220703, 0.08542565256357193, 0.09452207386493683, 0.10361849516630173, 0.11271491646766663, 0.12181133031845093, 0.13090775907039642, 0.14000417292118073, 0.14910060167312622, 0.15819701552391052, 0.16729342937469482, 0.17638984322547913, 0.18548627197742462, 0.19458268582820892, 0.20367911458015442, 0.21277552843093872, 0.22187194228172302, 0.23096837103366852, 0.240064799785614]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 11.0, 16.0, 10.0, 36.0, 25.0, 69.0, 84.0, 122.0, 180.0, 257.0, 421.0, 690.0, 1123.0, 1903.0, 3245.0, 6077.0, 11504.0, 24368.0, 55263.0, 170549.0, 532327.0, 144193.0, 49640.0, 22167.0, 10742.0, 5745.0, 3070.0, 1768.0, 1072.0, 638.0, 401.0, 264.0, 185.0, 114.0, 86.0, 54.0, 35.0, 31.0, 19.0, 19.0, 6.0, 7.0, 8.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.130126953125, -0.1262359619140625, -0.122344970703125, -0.1184539794921875, -0.11456298828125, -0.1106719970703125, -0.106781005859375, -0.1028900146484375, -0.0989990234375, -0.0951080322265625, -0.091217041015625, -0.0873260498046875, -0.08343505859375, -0.0795440673828125, -0.075653076171875, -0.0717620849609375, -0.06787109375, -0.0639801025390625, -0.060089111328125, -0.0561981201171875, -0.05230712890625, -0.0484161376953125, -0.044525146484375, -0.0406341552734375, -0.0367431640625, -0.0328521728515625, -0.028961181640625, -0.0250701904296875, -0.02117919921875, -0.0172882080078125, -0.013397216796875, -0.0095062255859375, -0.005615234375, -0.0017242431640625, 0.002166748046875, 0.0060577392578125, 0.00994873046875, 0.0138397216796875, 0.017730712890625, 0.0216217041015625, 0.0255126953125, 0.0294036865234375, 0.033294677734375, 0.0371856689453125, 0.04107666015625, 0.0449676513671875, 0.048858642578125, 0.0527496337890625, 0.056640625, 0.0605316162109375, 0.064422607421875, 0.0683135986328125, 0.07220458984375, 0.0760955810546875, 0.079986572265625, 0.0838775634765625, 0.0877685546875, 0.0916595458984375, 0.095550537109375, 0.0994415283203125, 0.10333251953125, 0.1072235107421875, 0.111114501953125, 0.1150054931640625, 0.118896484375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 5.0, 5.0, 11.0, 11.0, 17.0, 17.0, 19.0, 22.0, 21.0, 39.0, 26.0, 39.0, 31.0, 50.0, 45.0, 43.0, 58.0, 56.0, 38.0, 49.0, 47.0, 52.0, 44.0, 37.0, 40.0, 27.0, 22.0, 25.0, 21.0, 19.0, 10.0, 14.0, 10.0, 10.0, 5.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0289306640625, -0.02801990509033203, -0.027109146118164062, -0.026198387145996094, -0.025287628173828125, -0.024376869201660156, -0.023466110229492188, -0.02255535125732422, -0.02164459228515625, -0.02073383331298828, -0.019823074340820312, -0.018912315368652344, -0.018001556396484375, -0.017090797424316406, -0.016180038452148438, -0.015269279479980469, -0.0143585205078125, -0.013447761535644531, -0.012537002563476562, -0.011626243591308594, -0.010715484619140625, -0.009804725646972656, -0.008893966674804688, -0.007983207702636719, -0.00707244873046875, -0.006161689758300781, -0.0052509307861328125, -0.004340171813964844, -0.003429412841796875, -0.0025186538696289062, -0.0016078948974609375, -0.0006971359252929688, 0.000213623046875, 0.0011243820190429688, 0.0020351409912109375, 0.0029458999633789062, 0.003856658935546875, 0.004767417907714844, 0.0056781768798828125, 0.006588935852050781, 0.00749969482421875, 0.008410453796386719, 0.009321212768554688, 0.010231971740722656, 0.011142730712890625, 0.012053489685058594, 0.012964248657226562, 0.013875007629394531, 0.0147857666015625, 0.01569652557373047, 0.016607284545898438, 0.017518043518066406, 0.018428802490234375, 0.019339561462402344, 0.020250320434570312, 0.02116107940673828, 0.02207183837890625, 0.02298259735107422, 0.023893356323242188, 0.024804115295410156, 0.025714874267578125, 0.026625633239746094, 0.027536392211914062, 0.02844715118408203, 0.02935791015625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 7.0, 4.0, 3.0, 9.0, 8.0, 17.0, 13.0, 20.0, 28.0, 40.0, 48.0, 93.0, 100.0, 121.0, 170.0, 268.0, 339.0, 582.0, 858.0, 1686.0, 3811.0, 10707.0, 42327.0, 253634.0, 620608.0, 82761.0, 19013.0, 5672.0, 2255.0, 1182.0, 678.0, 409.0, 308.0, 219.0, 156.0, 101.0, 91.0, 52.0, 36.0, 40.0, 24.0, 17.0, 16.0, 5.0, 5.0, 5.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.16259765625, -0.15738868713378906, -0.15217971801757812, -0.1469707489013672, -0.14176177978515625, -0.1365528106689453, -0.13134384155273438, -0.12613487243652344, -0.1209259033203125, -0.11571693420410156, -0.11050796508789062, -0.10529899597167969, -0.10009002685546875, -0.09488105773925781, -0.08967208862304688, -0.08446311950683594, -0.079254150390625, -0.07404518127441406, -0.06883621215820312, -0.06362724304199219, -0.05841827392578125, -0.05320930480957031, -0.048000335693359375, -0.04279136657714844, -0.0375823974609375, -0.03237342834472656, -0.027164459228515625, -0.021955490112304688, -0.01674652099609375, -0.011537551879882812, -0.006328582763671875, -0.0011196136474609375, 0.00408935546875, 0.009298324584960938, 0.014507293701171875, 0.019716262817382812, 0.02492523193359375, 0.030134201049804688, 0.035343170166015625, 0.04055213928222656, 0.0457611083984375, 0.05097007751464844, 0.056179046630859375, 0.06138801574707031, 0.06659698486328125, 0.07180595397949219, 0.07701492309570312, 0.08222389221191406, 0.087432861328125, 0.09264183044433594, 0.09785079956054688, 0.10305976867675781, 0.10826873779296875, 0.11347770690917969, 0.11868667602539062, 0.12389564514160156, 0.1291046142578125, 0.13431358337402344, 0.13952255249023438, 0.1447315216064453, 0.14994049072265625, 0.1551494598388672, 0.16035842895507812, 0.16556739807128906, 0.1707763671875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 6.0, 9.0, 15.0, 13.0, 21.0, 23.0, 27.0, 23.0, 33.0, 35.0, 34.0, 43.0, 44.0, 48.0, 49.0, 58.0, 62.0, 64.0, 62.0, 42.0, 34.0, 42.0, 26.0, 36.0, 26.0, 26.0, 20.0, 20.0, 13.0, 14.0, 10.0, 3.0, 4.0, 4.0, 5.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.140380859375, -0.13614463806152344, -0.13190841674804688, -0.1276721954345703, -0.12343597412109375, -0.11919975280761719, -0.11496353149414062, -0.11072731018066406, -0.1064910888671875, -0.10225486755371094, -0.09801864624023438, -0.09378242492675781, -0.08954620361328125, -0.08530998229980469, -0.08107376098632812, -0.07683753967285156, -0.072601318359375, -0.06836509704589844, -0.06412887573242188, -0.05989265441894531, -0.05565643310546875, -0.05142021179199219, -0.047183990478515625, -0.04294776916503906, -0.0387115478515625, -0.03447532653808594, -0.030239105224609375, -0.026002883911132812, -0.02176666259765625, -0.017530441284179688, -0.013294219970703125, -0.009057998657226562, -0.00482177734375, -0.0005855560302734375, 0.003650665283203125, 0.007886886596679688, 0.01212310791015625, 0.016359329223632812, 0.020595550537109375, 0.024831771850585938, 0.0290679931640625, 0.03330421447753906, 0.037540435791015625, 0.04177665710449219, 0.04601287841796875, 0.05024909973144531, 0.054485321044921875, 0.05872154235839844, 0.062957763671875, 0.06719398498535156, 0.07143020629882812, 0.07566642761230469, 0.07990264892578125, 0.08413887023925781, 0.08837509155273438, 0.09261131286621094, 0.0968475341796875, 0.10108375549316406, 0.10531997680664062, 0.10955619812011719, 0.11379241943359375, 0.11802864074707031, 0.12226486206054688, 0.12650108337402344, 0.1307373046875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 5.0, 7.0, 13.0, 12.0, 18.0, 34.0, 58.0, 71.0, 124.0, 275.0, 500.0, 1265.0, 3686.0, 12594.0, 61200.0, 796465.0, 141542.0, 21616.0, 5669.0, 1849.0, 759.0, 337.0, 182.0, 99.0, 63.0, 41.0, 22.0, 13.0, 11.0, 6.0, 8.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1558837890625, -0.15139007568359375, -0.1468963623046875, -0.14240264892578125, -0.137908935546875, -0.13341522216796875, -0.1289215087890625, -0.12442779541015625, -0.11993408203125, -0.11544036865234375, -0.1109466552734375, -0.10645294189453125, -0.101959228515625, -0.09746551513671875, -0.0929718017578125, -0.08847808837890625, -0.083984375, -0.07949066162109375, -0.0749969482421875, -0.07050323486328125, -0.066009521484375, -0.06151580810546875, -0.0570220947265625, -0.05252838134765625, -0.04803466796875, -0.04354095458984375, -0.0390472412109375, -0.03455352783203125, -0.030059814453125, -0.02556610107421875, -0.0210723876953125, -0.01657867431640625, -0.0120849609375, -0.00759124755859375, -0.0030975341796875, 0.00139617919921875, 0.005889892578125, 0.01038360595703125, 0.0148773193359375, 0.01937103271484375, 0.02386474609375, 0.02835845947265625, 0.0328521728515625, 0.03734588623046875, 0.041839599609375, 0.04633331298828125, 0.0508270263671875, 0.05532073974609375, 0.059814453125, 0.06430816650390625, 0.0688018798828125, 0.07329559326171875, 0.077789306640625, 0.08228302001953125, 0.0867767333984375, 0.09127044677734375, 0.09576416015625, 0.10025787353515625, 0.1047515869140625, 0.10924530029296875, 0.113739013671875, 0.11823272705078125, 0.1227264404296875, 0.12722015380859375, 0.1317138671875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 5.0, 4.0, 6.0, 16.0, 22.0, 27.0, 44.0, 63.0, 84.0, 108.0, 116.0, 146.0, 103.0, 75.0, 43.0, 43.0, 25.0, 21.0, 19.0, 9.0, 4.0, 8.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.00011807680130004883, -0.00011532846838235855, -0.00011258013546466827, -0.000109831802546978, -0.00010708346962928772, -0.00010433513671159744, -0.00010158680379390717, -9.883847087621689e-05, -9.609013795852661e-05, -9.334180504083633e-05, -9.059347212314606e-05, -8.784513920545578e-05, -8.50968062877655e-05, -8.234847337007523e-05, -7.960014045238495e-05, -7.685180753469467e-05, -7.41034746170044e-05, -7.135514169931412e-05, -6.860680878162384e-05, -6.585847586393356e-05, -6.311014294624329e-05, -6.036181002855301e-05, -5.761347711086273e-05, -5.4865144193172455e-05, -5.211681127548218e-05, -4.93684783577919e-05, -4.6620145440101624e-05, -4.3871812522411346e-05, -4.112347960472107e-05, -3.837514668703079e-05, -3.5626813769340515e-05, -3.287848085165024e-05, -3.013014793395996e-05, -2.7381815016269684e-05, -2.4633482098579407e-05, -2.188514918088913e-05, -1.9136816263198853e-05, -1.6388483345508575e-05, -1.3640150427818298e-05, -1.0891817510128021e-05, -8.143484592437744e-06, -5.395151674747467e-06, -2.64681875705719e-06, 1.0151416063308716e-07, 2.8498470783233643e-06, 5.598179996013641e-06, 8.346512913703918e-06, 1.1094845831394196e-05, 1.3843178749084473e-05, 1.659151166677475e-05, 1.9339844584465027e-05, 2.2088177502155304e-05, 2.483651041984558e-05, 2.7584843337535858e-05, 3.0333176255226135e-05, 3.308150917291641e-05, 3.582984209060669e-05, 3.8578175008296967e-05, 4.1326507925987244e-05, 4.407484084367752e-05, 4.68231737613678e-05, 4.9571506679058075e-05, 5.231983959674835e-05, 5.506817251443863e-05, 5.7816505432128906e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 9.0, 5.0, 7.0, 15.0, 11.0, 23.0, 20.0, 35.0, 44.0, 81.0, 102.0, 185.0, 278.0, 454.0, 841.0, 1839.0, 4911.0, 16165.0, 71741.0, 778610.0, 136304.0, 24936.0, 7018.0, 2433.0, 1059.0, 520.0, 283.0, 166.0, 137.0, 84.0, 67.0, 48.0, 33.0, 19.0, 19.0, 11.0, 11.0, 4.0, 11.0, 4.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.090087890625, -0.08657646179199219, -0.08306503295898438, -0.07955360412597656, -0.07604217529296875, -0.07253074645996094, -0.06901931762695312, -0.06550788879394531, -0.0619964599609375, -0.05848503112792969, -0.054973602294921875, -0.05146217346191406, -0.04795074462890625, -0.04443931579589844, -0.040927886962890625, -0.03741645812988281, -0.033905029296875, -0.030393600463867188, -0.026882171630859375, -0.023370742797851562, -0.01985931396484375, -0.016347885131835938, -0.012836456298828125, -0.009325027465820312, -0.0058135986328125, -0.0023021697998046875, 0.001209259033203125, 0.0047206878662109375, 0.00823211669921875, 0.011743545532226562, 0.015254974365234375, 0.018766403198242188, 0.02227783203125, 0.025789260864257812, 0.029300689697265625, 0.03281211853027344, 0.03632354736328125, 0.03983497619628906, 0.043346405029296875, 0.04685783386230469, 0.0503692626953125, 0.05388069152832031, 0.057392120361328125, 0.06090354919433594, 0.06441497802734375, 0.06792640686035156, 0.07143783569335938, 0.07494926452636719, 0.078460693359375, 0.08197212219238281, 0.08548355102539062, 0.08899497985839844, 0.09250640869140625, 0.09601783752441406, 0.09952926635742188, 0.10304069519042969, 0.1065521240234375, 0.11006355285644531, 0.11357498168945312, 0.11708641052246094, 0.12059783935546875, 0.12410926818847656, 0.12762069702148438, 0.1311321258544922, 0.1346435546875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 7.0, 5.0, 3.0, 2.0, 7.0, 10.0, 13.0, 17.0, 16.0, 30.0, 38.0, 65.0, 146.0, 193.0, 163.0, 91.0, 55.0, 37.0, 20.0, 7.0, 13.0, 13.0, 14.0, 5.0, 5.0, 2.0, 3.0, 3.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.07171630859375, -0.0693807601928711, -0.06704521179199219, -0.06470966339111328, -0.062374114990234375, -0.06003856658935547, -0.05770301818847656, -0.055367469787597656, -0.05303192138671875, -0.050696372985839844, -0.04836082458496094, -0.04602527618408203, -0.043689727783203125, -0.04135417938232422, -0.03901863098144531, -0.036683082580566406, -0.0343475341796875, -0.032011985778808594, -0.029676437377929688, -0.02734088897705078, -0.025005340576171875, -0.02266979217529297, -0.020334243774414062, -0.017998695373535156, -0.01566314697265625, -0.013327598571777344, -0.010992050170898438, -0.008656501770019531, -0.006320953369140625, -0.003985404968261719, -0.0016498565673828125, 0.0006856918334960938, 0.003021240234375, 0.005356788635253906, 0.0076923370361328125, 0.010027885437011719, 0.012363433837890625, 0.014698982238769531, 0.017034530639648438, 0.019370079040527344, 0.02170562744140625, 0.024041175842285156, 0.026376724243164062, 0.02871227264404297, 0.031047821044921875, 0.03338336944580078, 0.03571891784667969, 0.038054466247558594, 0.0403900146484375, 0.042725563049316406, 0.04506111145019531, 0.04739665985107422, 0.049732208251953125, 0.05206775665283203, 0.05440330505371094, 0.056738853454589844, 0.05907440185546875, 0.061409950256347656, 0.06374549865722656, 0.06608104705810547, 0.06841659545898438, 0.07075214385986328, 0.07308769226074219, 0.0754232406616211, 0.0777587890625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 10.0, 11.0, 42.0, 104.0, 167.0, 219.0, 215.0, 131.0, 67.0, 26.0, 5.0, 1.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9758763313293457, -1.9248700141906738, -1.873863697052002, -1.82285737991333, -1.7718510627746582, -1.7208447456359863, -1.6698384284973145, -1.6188321113586426, -1.5678257942199707, -1.5168194770812988, -1.465813159942627, -1.414806842803955, -1.3638005256652832, -1.3127942085266113, -1.2617878913879395, -1.2107815742492676, -1.1597752571105957, -1.1087689399719238, -1.057762622833252, -1.00675630569458, -0.9557499885559082, -0.9047436714172363, -0.8537373542785645, -0.8027310371398926, -0.7517248392105103, -0.7007185220718384, -0.6497122049331665, -0.5987058877944946, -0.5476995706558228, -0.49669328331947327, -0.4456869661808014, -0.3946806490421295, -0.34367430210113525, -0.2926679849624634, -0.2416616678237915, -0.19065536558628082, -0.13964904844760895, -0.08864274621009827, -0.03763642907142639, 0.013369888067245483, 0.06437620520591736, 0.11538252234458923, 0.1663888394832611, 0.2173951417207718, 0.26840144395828247, 0.31940776109695435, 0.3704140782356262, 0.4214203953742981, 0.47242671251296997, 0.5234330296516418, 0.5744393467903137, 0.6254456639289856, 0.6764519810676575, 0.7274582386016846, 0.7784645557403564, 0.8294708728790283, 0.8804771900177002, 0.9314835071563721, 0.982489824295044, 1.0334961414337158, 1.0845024585723877, 1.1355087757110596, 1.1865150928497314, 1.2375214099884033, 1.2885277271270752]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 3.0, 6.0, 5.0, 2.0, 11.0, 11.0, 5.0, 7.0, 7.0, 18.0, 15.0, 15.0, 22.0, 22.0, 21.0, 36.0, 41.0, 36.0, 38.0, 34.0, 34.0, 38.0, 45.0, 41.0, 36.0, 23.0, 43.0, 39.0, 37.0, 27.0, 26.0, 29.0, 24.0, 27.0, 30.0, 23.0, 20.0, 17.0, 15.0, 11.0, 11.0, 13.0, 11.0, 4.0, 3.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.4881681203842163, -0.47227415442466736, -0.4563801884651184, -0.44048619270324707, -0.4245922267436981, -0.40869826078414917, -0.39280426502227783, -0.3769102990627289, -0.36101633310317993, -0.345122367143631, -0.32922840118408203, -0.3133344054222107, -0.29744043946266174, -0.2815464735031128, -0.26565247774124146, -0.2497585117816925, -0.23386454582214355, -0.2179705798625946, -0.20207659900188446, -0.18618261814117432, -0.17028865218162537, -0.15439468622207642, -0.13850070536136627, -0.12260673195123672, -0.10671275854110718, -0.09081878513097763, -0.07492481172084808, -0.059030838310718536, -0.04313686490058899, -0.027242891490459442, -0.011348918080329895, 0.004545055329799652, 0.0204390287399292, 0.036333002150058746, 0.05222697556018829, 0.06812094897031784, 0.08401492238044739, 0.09990889579057693, 0.11580286920070648, 0.13169685006141663, 0.14759081602096558, 0.16348478198051453, 0.17937876284122467, 0.19527274370193481, 0.21116670966148376, 0.22706067562103271, 0.24295465648174286, 0.258848637342453, 0.27474260330200195, 0.2906365692615509, 0.30653053522109985, 0.3224245309829712, 0.33831849694252014, 0.3542124629020691, 0.37010645866394043, 0.3860004246234894, 0.40189439058303833, 0.4177883565425873, 0.43368232250213623, 0.44957631826400757, 0.4654702842235565, 0.48136425018310547, 0.4972582459449768, 0.5131521821022034, 0.5290461778640747]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 8.0, 11.0, 5.0, 15.0, 25.0, 43.0, 48.0, 77.0, 94.0, 150.0, 334.0, 540.0, 1260.0, 2668.0, 6349.0, 18458.0, 75574.0, 2718853.0, 1274535.0, 67522.0, 16782.0, 5928.0, 2470.0, 1155.0, 571.0, 303.0, 155.0, 117.0, 57.0, 58.0, 27.0, 27.0, 16.0, 14.0, 8.0, 6.0, 7.0, 3.0, 4.0, 2.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18115234375, -0.17581939697265625, -0.1704864501953125, -0.16515350341796875, -0.159820556640625, -0.15448760986328125, -0.1491546630859375, -0.14382171630859375, -0.13848876953125, -0.13315582275390625, -0.1278228759765625, -0.12248992919921875, -0.117156982421875, -0.11182403564453125, -0.1064910888671875, -0.10115814208984375, -0.0958251953125, -0.09049224853515625, -0.0851593017578125, -0.07982635498046875, -0.074493408203125, -0.06916046142578125, -0.0638275146484375, -0.05849456787109375, -0.05316162109375, -0.04782867431640625, -0.0424957275390625, -0.03716278076171875, -0.031829833984375, -0.02649688720703125, -0.0211639404296875, -0.01583099365234375, -0.010498046875, -0.00516510009765625, 0.0001678466796875, 0.00550079345703125, 0.010833740234375, 0.01616668701171875, 0.0214996337890625, 0.02683258056640625, 0.03216552734375, 0.03749847412109375, 0.0428314208984375, 0.04816436767578125, 0.053497314453125, 0.05883026123046875, 0.0641632080078125, 0.06949615478515625, 0.0748291015625, 0.08016204833984375, 0.0854949951171875, 0.09082794189453125, 0.096160888671875, 0.10149383544921875, 0.1068267822265625, 0.11215972900390625, 0.11749267578125, 0.12282562255859375, 0.1281585693359375, 0.13349151611328125, 0.138824462890625, 0.14415740966796875, 0.1494903564453125, 0.15482330322265625, 0.16015625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 4.0, 5.0, 3.0, 3.0, 9.0, 11.0, 10.0, 19.0, 21.0, 21.0, 18.0, 24.0, 32.0, 42.0, 40.0, 44.0, 38.0, 41.0, 44.0, 37.0, 55.0, 58.0, 46.0, 51.0, 48.0, 42.0, 37.0, 36.0, 26.0, 28.0, 14.0, 18.0, 17.0, 18.0, 7.0, 9.0, 9.0, 4.0, 0.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0295867919921875, -0.028638839721679688, -0.027690887451171875, -0.026742935180664062, -0.02579498291015625, -0.024847030639648438, -0.023899078369140625, -0.022951126098632812, -0.022003173828125, -0.021055221557617188, -0.020107269287109375, -0.019159317016601562, -0.01821136474609375, -0.017263412475585938, -0.016315460205078125, -0.015367507934570312, -0.0144195556640625, -0.013471603393554688, -0.012523651123046875, -0.011575698852539062, -0.01062774658203125, -0.009679794311523438, -0.008731842041015625, -0.0077838897705078125, -0.0068359375, -0.0058879852294921875, -0.004940032958984375, -0.0039920806884765625, -0.00304412841796875, -0.0020961761474609375, -0.001148223876953125, -0.0002002716064453125, 0.0007476806640625, 0.0016956329345703125, 0.002643585205078125, 0.0035915374755859375, 0.00453948974609375, 0.0054874420166015625, 0.006435394287109375, 0.0073833465576171875, 0.008331298828125, 0.009279251098632812, 0.010227203369140625, 0.011175155639648438, 0.01212310791015625, 0.013071060180664062, 0.014019012451171875, 0.014966964721679688, 0.0159149169921875, 0.016862869262695312, 0.017810821533203125, 0.018758773803710938, 0.01970672607421875, 0.020654678344726562, 0.021602630615234375, 0.022550582885742188, 0.02349853515625, 0.024446487426757812, 0.025394439697265625, 0.026342391967773438, 0.02729034423828125, 0.028238296508789062, 0.029186248779296875, 0.030134201049804688, 0.0310821533203125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 12.0, 14.0, 19.0, 35.0, 42.0, 72.0, 123.0, 205.0, 395.0, 890.0, 2873.0, 18266.0, 703775.0, 3433722.0, 28182.0, 3659.0, 1028.0, 400.0, 208.0, 113.0, 83.0, 54.0, 34.0, 20.0, 18.0, 14.0, 5.0, 3.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5029296875, -0.4900627136230469, -0.47719573974609375, -0.4643287658691406, -0.4514617919921875, -0.4385948181152344, -0.42572784423828125, -0.4128608703613281, -0.399993896484375, -0.3871269226074219, -0.37425994873046875, -0.3613929748535156, -0.3485260009765625, -0.3356590270996094, -0.32279205322265625, -0.3099250793457031, -0.29705810546875, -0.2841911315917969, -0.27132415771484375, -0.2584571838378906, -0.2455902099609375, -0.23272323608398438, -0.21985626220703125, -0.20698928833007812, -0.194122314453125, -0.18125534057617188, -0.16838836669921875, -0.15552139282226562, -0.1426544189453125, -0.12978744506835938, -0.11692047119140625, -0.10405349731445312, -0.0911865234375, -0.07831954956054688, -0.06545257568359375, -0.052585601806640625, -0.0397186279296875, -0.026851654052734375, -0.01398468017578125, -0.001117706298828125, 0.011749267578125, 0.024616241455078125, 0.03748321533203125, 0.050350189208984375, 0.0632171630859375, 0.07608413696289062, 0.08895111083984375, 0.10181808471679688, 0.11468505859375, 0.12755203247070312, 0.14041900634765625, 0.15328598022460938, 0.1661529541015625, 0.17901992797851562, 0.19188690185546875, 0.20475387573242188, 0.217620849609375, 0.23048782348632812, 0.24335479736328125, 0.2562217712402344, 0.2690887451171875, 0.2819557189941406, 0.29482269287109375, 0.3076896667480469, 0.320556640625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 7.0, 9.0, 11.0, 13.0, 25.0, 60.0, 104.0, 319.0, 1926.0, 1123.0, 244.0, 112.0, 44.0, 36.0, 15.0, 11.0, 5.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1856689453125, -0.1814422607421875, -0.177215576171875, -0.1729888916015625, -0.16876220703125, -0.1645355224609375, -0.160308837890625, -0.1560821533203125, -0.15185546875, -0.1476287841796875, -0.143402099609375, -0.1391754150390625, -0.13494873046875, -0.1307220458984375, -0.126495361328125, -0.1222686767578125, -0.1180419921875, -0.1138153076171875, -0.109588623046875, -0.1053619384765625, -0.10113525390625, -0.0969085693359375, -0.092681884765625, -0.0884552001953125, -0.084228515625, -0.0800018310546875, -0.075775146484375, -0.0715484619140625, -0.06732177734375, -0.0630950927734375, -0.058868408203125, -0.0546417236328125, -0.0504150390625, -0.0461883544921875, -0.041961669921875, -0.0377349853515625, -0.03350830078125, -0.0292816162109375, -0.025054931640625, -0.0208282470703125, -0.0166015625, -0.0123748779296875, -0.008148193359375, -0.0039215087890625, 0.00030517578125, 0.0045318603515625, 0.008758544921875, 0.0129852294921875, 0.0172119140625, 0.0214385986328125, 0.025665283203125, 0.0298919677734375, 0.03411865234375, 0.0383453369140625, 0.042572021484375, 0.0467987060546875, 0.051025390625, 0.0552520751953125, 0.059478759765625, 0.0637054443359375, 0.06793212890625, 0.0721588134765625, 0.076385498046875, 0.0806121826171875, 0.0848388671875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 9.0, 3.0, 7.0, 12.0, 28.0, 59.0, 168.0, 333.0, 262.0, 101.0, 22.0, 7.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.1944665908813477, -2.155172109603882, -2.115877628326416, -2.07658314704895, -2.0372886657714844, -1.9979941844940186, -1.9586997032165527, -1.919405221939087, -1.880110740661621, -1.8408162593841553, -1.8015217781066895, -1.7622272968292236, -1.7229328155517578, -1.683638334274292, -1.6443438529968262, -1.6050493717193604, -1.565755009651184, -1.5264605283737183, -1.4871660470962524, -1.4478715658187866, -1.4085770845413208, -1.369282603263855, -1.3299881219863892, -1.290693759918213, -1.251399278640747, -1.2121047973632812, -1.1728103160858154, -1.1335158348083496, -1.0942213535308838, -1.054926872253418, -1.0156323909759521, -0.9763379693031311, -0.9370435476303101, -0.8977490663528442, -0.8584545850753784, -0.8191601037979126, -0.7798656225204468, -0.740571141242981, -0.7012767195701599, -0.6619822382926941, -0.6226877570152283, -0.5833932757377625, -0.5440987944602966, -0.5048043131828308, -0.4655098617076874, -0.42621538043022156, -0.3869209289550781, -0.3476264476776123, -0.3083319664001465, -0.26903748512268066, -0.22974301874637604, -0.1904485523700714, -0.1511540710926056, -0.11185958981513977, -0.07256512343883514, -0.03327065706253052, 0.006023824214935303, 0.045318298041820526, 0.08461277186870575, 0.12390724569559097, 0.1632017195224762, 0.20249620079994202, 0.24179066717624664, 0.28108513355255127, 0.3203796148300171]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 7.0, 4.0, 9.0, 7.0, 16.0, 16.0, 16.0, 24.0, 23.0, 18.0, 44.0, 35.0, 36.0, 41.0, 36.0, 48.0, 42.0, 50.0, 40.0, 50.0, 57.0, 39.0, 41.0, 39.0, 44.0, 24.0, 38.0, 21.0, 21.0, 28.0, 15.0, 19.0, 14.0, 12.0, 7.0, 6.0, 7.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.3971271514892578, -0.3860683739185333, -0.37500959634780884, -0.36395084857940674, -0.35289207100868225, -0.34183329343795776, -0.33077454566955566, -0.3197157680988312, -0.3086569905281067, -0.2975982129573822, -0.2865394353866577, -0.2754806876182556, -0.26442191004753113, -0.25336313247680664, -0.24230436980724335, -0.23124560713768005, -0.22018682956695557, -0.20912805199623108, -0.19806928932666779, -0.1870105266571045, -0.17595174908638, -0.16489297151565552, -0.15383420884609222, -0.14277544617652893, -0.13171666860580444, -0.12065789848566055, -0.10959912836551666, -0.09854035824537277, -0.08748158812522888, -0.07642281800508499, -0.0653640478849411, -0.05430527776479721, -0.04324650764465332, -0.03218773752450943, -0.02112896740436554, -0.01007019728422165, 0.0009885728359222412, 0.012047342956066132, 0.023106113076210022, 0.03416488319635391, 0.0452236533164978, 0.05628242343664169, 0.06734119355678558, 0.07839996367692947, 0.08945873379707336, 0.10051750391721725, 0.11157627403736115, 0.12263504415750504, 0.13369381427764893, 0.1447525918483734, 0.1558113545179367, 0.1668701171875, 0.1779288947582245, 0.18898767232894897, 0.20004643499851227, 0.21110519766807556, 0.22216397523880005, 0.23322275280952454, 0.24428151547908783, 0.2553402781486511, 0.2663990557193756, 0.2774578332901001, 0.2885165810585022, 0.2995753586292267, 0.31063413619995117]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 1.0, 8.0, 3.0, 5.0, 9.0, 11.0, 19.0, 22.0, 23.0, 37.0, 43.0, 67.0, 92.0, 135.0, 223.0, 355.0, 542.0, 995.0, 1666.0, 3079.0, 5930.0, 11402.0, 23915.0, 56239.0, 180791.0, 477148.0, 180985.0, 56369.0, 23867.0, 11454.0, 5783.0, 3050.0, 1742.0, 934.0, 563.0, 344.0, 216.0, 138.0, 88.0, 61.0, 48.0, 41.0, 21.0, 22.0, 14.0, 11.0, 8.0, 9.0, 4.0, 8.0, 6.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0], "bins": [-0.10113525390625, -0.0980234146118164, -0.09491157531738281, -0.09179973602294922, -0.08868789672851562, -0.08557605743408203, -0.08246421813964844, -0.07935237884521484, -0.07624053955078125, -0.07312870025634766, -0.07001686096191406, -0.06690502166748047, -0.06379318237304688, -0.06068134307861328, -0.05756950378417969, -0.054457664489746094, -0.0513458251953125, -0.048233985900878906, -0.04512214660644531, -0.04201030731201172, -0.038898468017578125, -0.03578662872314453, -0.03267478942871094, -0.029562950134277344, -0.02645111083984375, -0.023339271545410156, -0.020227432250976562, -0.01711559295654297, -0.014003753662109375, -0.010891914367675781, -0.0077800750732421875, -0.004668235778808594, -0.001556396484375, 0.0015554428100585938, 0.0046672821044921875, 0.007779121398925781, 0.010890960693359375, 0.014002799987792969, 0.017114639282226562, 0.020226478576660156, 0.02333831787109375, 0.026450157165527344, 0.029561996459960938, 0.03267383575439453, 0.035785675048828125, 0.03889751434326172, 0.04200935363769531, 0.045121192932128906, 0.0482330322265625, 0.051344871520996094, 0.05445671081542969, 0.05756855010986328, 0.060680389404296875, 0.06379222869873047, 0.06690406799316406, 0.07001590728759766, 0.07312774658203125, 0.07623958587646484, 0.07935142517089844, 0.08246326446533203, 0.08557510375976562, 0.08868694305419922, 0.09179878234863281, 0.0949106216430664, 0.0980224609375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 2.0, 2.0, 9.0, 5.0, 14.0, 10.0, 11.0, 15.0, 14.0, 15.0, 19.0, 30.0, 27.0, 27.0, 29.0, 30.0, 34.0, 28.0, 35.0, 30.0, 43.0, 36.0, 46.0, 36.0, 46.0, 47.0, 43.0, 37.0, 31.0, 25.0, 27.0, 24.0, 27.0, 20.0, 16.0, 18.0, 15.0, 14.0, 10.0, 12.0, 8.0, 7.0, 6.0, 4.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.02996826171875, -0.029040813446044922, -0.028113365173339844, -0.027185916900634766, -0.026258468627929688, -0.02533102035522461, -0.02440357208251953, -0.023476123809814453, -0.022548675537109375, -0.021621227264404297, -0.02069377899169922, -0.01976633071899414, -0.018838882446289062, -0.017911434173583984, -0.016983985900878906, -0.016056537628173828, -0.01512908935546875, -0.014201641082763672, -0.013274192810058594, -0.012346744537353516, -0.011419296264648438, -0.01049184799194336, -0.009564399719238281, -0.008636951446533203, -0.007709503173828125, -0.006782054901123047, -0.005854606628417969, -0.004927158355712891, -0.0039997100830078125, -0.0030722618103027344, -0.0021448135375976562, -0.0012173652648925781, -0.0002899169921875, 0.0006375312805175781, 0.0015649795532226562, 0.0024924278259277344, 0.0034198760986328125, 0.004347324371337891, 0.005274772644042969, 0.006202220916748047, 0.007129669189453125, 0.008057117462158203, 0.008984565734863281, 0.00991201400756836, 0.010839462280273438, 0.011766910552978516, 0.012694358825683594, 0.013621807098388672, 0.01454925537109375, 0.015476703643798828, 0.016404151916503906, 0.017331600189208984, 0.018259048461914062, 0.01918649673461914, 0.02011394500732422, 0.021041393280029297, 0.021968841552734375, 0.022896289825439453, 0.02382373809814453, 0.02475118637084961, 0.025678634643554688, 0.026606082916259766, 0.027533531188964844, 0.028460979461669922, 0.029388427734375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 6.0, 10.0, 7.0, 13.0, 19.0, 15.0, 17.0, 25.0, 41.0, 66.0, 88.0, 182.0, 262.0, 449.0, 901.0, 1929.0, 5260.0, 17451.0, 78168.0, 807341.0, 104741.0, 20841.0, 6043.0, 2334.0, 1056.0, 489.0, 313.0, 143.0, 111.0, 60.0, 46.0, 36.0, 29.0, 11.0, 10.0, 11.0, 5.0, 5.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0], "bins": [-0.2418212890625, -0.2346172332763672, -0.22741317749023438, -0.22020912170410156, -0.21300506591796875, -0.20580101013183594, -0.19859695434570312, -0.1913928985595703, -0.1841888427734375, -0.1769847869873047, -0.16978073120117188, -0.16257667541503906, -0.15537261962890625, -0.14816856384277344, -0.14096450805664062, -0.1337604522705078, -0.126556396484375, -0.11935234069824219, -0.11214828491210938, -0.10494422912597656, -0.09774017333984375, -0.09053611755371094, -0.08333206176757812, -0.07612800598144531, -0.0689239501953125, -0.06171989440917969, -0.054515838623046875, -0.04731178283691406, -0.04010772705078125, -0.03290367126464844, -0.025699615478515625, -0.018495559692382812, -0.01129150390625, -0.0040874481201171875, 0.003116607666015625, 0.010320663452148438, 0.01752471923828125, 0.024728775024414062, 0.031932830810546875, 0.03913688659667969, 0.0463409423828125, 0.05354499816894531, 0.060749053955078125, 0.06795310974121094, 0.07515716552734375, 0.08236122131347656, 0.08956527709960938, 0.09676933288574219, 0.103973388671875, 0.11117744445800781, 0.11838150024414062, 0.12558555603027344, 0.13278961181640625, 0.13999366760253906, 0.14719772338867188, 0.1544017791748047, 0.1616058349609375, 0.1688098907470703, 0.17601394653320312, 0.18321800231933594, 0.19042205810546875, 0.19762611389160156, 0.20483016967773438, 0.2120342254638672, 0.21923828125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 2.0, 0.0, 3.0, 8.0, 6.0, 7.0, 5.0, 10.0, 15.0, 33.0, 44.0, 66.0, 48.0, 67.0, 78.0, 82.0, 90.0, 76.0, 81.0, 75.0, 55.0, 36.0, 39.0, 14.0, 13.0, 9.0, 7.0, 7.0, 9.0, 6.0, 5.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.271240234375, -0.26287841796875, -0.2545166015625, -0.24615478515625, -0.23779296875, -0.22943115234375, -0.2210693359375, -0.21270751953125, -0.204345703125, -0.19598388671875, -0.1876220703125, -0.17926025390625, -0.1708984375, -0.16253662109375, -0.1541748046875, -0.14581298828125, -0.137451171875, -0.12908935546875, -0.1207275390625, -0.11236572265625, -0.10400390625, -0.09564208984375, -0.0872802734375, -0.07891845703125, -0.070556640625, -0.06219482421875, -0.0538330078125, -0.04547119140625, -0.037109375, -0.02874755859375, -0.0203857421875, -0.01202392578125, -0.003662109375, 0.00469970703125, 0.0130615234375, 0.02142333984375, 0.02978515625, 0.03814697265625, 0.0465087890625, 0.05487060546875, 0.063232421875, 0.07159423828125, 0.0799560546875, 0.08831787109375, 0.0966796875, 0.10504150390625, 0.1134033203125, 0.12176513671875, 0.130126953125, 0.13848876953125, 0.1468505859375, 0.15521240234375, 0.16357421875, 0.17193603515625, 0.1802978515625, 0.18865966796875, 0.197021484375, 0.20538330078125, 0.2137451171875, 0.22210693359375, 0.23046875, 0.23883056640625, 0.2471923828125, 0.25555419921875, 0.263916015625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 2.0, 7.0, 7.0, 6.0, 16.0, 20.0, 35.0, 33.0, 61.0, 108.0, 172.0, 249.0, 477.0, 771.0, 1286.0, 2311.0, 4561.0, 10911.0, 34098.0, 262206.0, 653270.0, 51444.0, 14343.0, 5643.0, 2770.0, 1489.0, 884.0, 504.0, 313.0, 213.0, 120.0, 74.0, 40.0, 38.0, 23.0, 14.0, 8.0, 11.0, 7.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.10986328125, -0.10664558410644531, -0.10342788696289062, -0.10021018981933594, -0.09699249267578125, -0.09377479553222656, -0.09055709838867188, -0.08733940124511719, -0.0841217041015625, -0.08090400695800781, -0.07768630981445312, -0.07446861267089844, -0.07125091552734375, -0.06803321838378906, -0.06481552124023438, -0.06159782409667969, -0.058380126953125, -0.05516242980957031, -0.051944732666015625, -0.04872703552246094, -0.04550933837890625, -0.04229164123535156, -0.039073944091796875, -0.03585624694824219, -0.0326385498046875, -0.029420852661132812, -0.026203155517578125, -0.022985458374023438, -0.01976776123046875, -0.016550064086914062, -0.013332366943359375, -0.010114669799804688, -0.00689697265625, -0.0036792755126953125, -0.000461578369140625, 0.0027561187744140625, 0.00597381591796875, 0.009191513061523438, 0.012409210205078125, 0.015626907348632812, 0.0188446044921875, 0.022062301635742188, 0.025279998779296875, 0.028497695922851562, 0.03171539306640625, 0.03493309020996094, 0.038150787353515625, 0.04136848449707031, 0.044586181640625, 0.04780387878417969, 0.051021575927734375, 0.05423927307128906, 0.05745697021484375, 0.06067466735839844, 0.06389236450195312, 0.06711006164550781, 0.0703277587890625, 0.07354545593261719, 0.07676315307617188, 0.07998085021972656, 0.08319854736328125, 0.08641624450683594, 0.08963394165039062, 0.09285163879394531, 0.0960693359375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 3.0, 6.0, 6.0, 2.0, 11.0, 19.0, 19.0, 32.0, 24.0, 47.0, 47.0, 51.0, 83.0, 81.0, 73.0, 90.0, 82.0, 61.0, 56.0, 51.0, 43.0, 28.0, 20.0, 21.0, 11.0, 7.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-6.252527236938477e-05, -6.0549937188625336e-05, -5.8574602007865906e-05, -5.6599266827106476e-05, -5.4623931646347046e-05, -5.2648596465587616e-05, -5.0673261284828186e-05, -4.8697926104068756e-05, -4.6722590923309326e-05, -4.4747255742549896e-05, -4.2771920561790466e-05, -4.0796585381031036e-05, -3.8821250200271606e-05, -3.6845915019512177e-05, -3.4870579838752747e-05, -3.289524465799332e-05, -3.091990947723389e-05, -2.8944574296474457e-05, -2.6969239115715027e-05, -2.4993903934955597e-05, -2.3018568754196167e-05, -2.1043233573436737e-05, -1.9067898392677307e-05, -1.7092563211917877e-05, -1.5117228031158447e-05, -1.3141892850399017e-05, -1.1166557669639587e-05, -9.191222488880157e-06, -7.2158873081207275e-06, -5.240552127361298e-06, -3.2652169466018677e-06, -1.2898817658424377e-06, 6.854534149169922e-07, 2.660788595676422e-06, 4.636123776435852e-06, 6.611458957195282e-06, 8.586794137954712e-06, 1.0562129318714142e-05, 1.2537464499473572e-05, 1.4512799680233002e-05, 1.648813486099243e-05, 1.846347004175186e-05, 2.043880522251129e-05, 2.241414040327072e-05, 2.438947558403015e-05, 2.636481076478958e-05, 2.834014594554901e-05, 3.031548112630844e-05, 3.229081630706787e-05, 3.42661514878273e-05, 3.624148666858673e-05, 3.821682184934616e-05, 4.019215703010559e-05, 4.216749221086502e-05, 4.414282739162445e-05, 4.611816257238388e-05, 4.809349775314331e-05, 5.006883293390274e-05, 5.204416811466217e-05, 5.40195032954216e-05, 5.599483847618103e-05, 5.797017365694046e-05, 5.994550883769989e-05, 6.192084401845932e-05, 6.389617919921875e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 4.0, 10.0, 11.0, 19.0, 18.0, 24.0, 37.0, 51.0, 82.0, 154.0, 209.0, 404.0, 711.0, 1455.0, 2973.0, 7242.0, 22237.0, 112134.0, 802762.0, 70029.0, 16652.0, 5965.0, 2582.0, 1208.0, 635.0, 336.0, 180.0, 120.0, 86.0, 58.0, 44.0, 33.0, 22.0, 12.0, 5.0, 5.0, 10.0, 2.0, 6.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.1033935546875, -0.10009956359863281, -0.09680557250976562, -0.09351158142089844, -0.09021759033203125, -0.08692359924316406, -0.08362960815429688, -0.08033561706542969, -0.0770416259765625, -0.07374763488769531, -0.07045364379882812, -0.06715965270996094, -0.06386566162109375, -0.06057167053222656, -0.057277679443359375, -0.05398368835449219, -0.050689697265625, -0.04739570617675781, -0.044101715087890625, -0.04080772399902344, -0.03751373291015625, -0.03421974182128906, -0.030925750732421875, -0.027631759643554688, -0.0243377685546875, -0.021043777465820312, -0.017749786376953125, -0.014455795288085938, -0.01116180419921875, -0.007867813110351562, -0.004573822021484375, -0.0012798309326171875, 0.00201416015625, 0.0053081512451171875, 0.008602142333984375, 0.011896133422851562, 0.01519012451171875, 0.018484115600585938, 0.021778106689453125, 0.025072097778320312, 0.0283660888671875, 0.03166007995605469, 0.034954071044921875, 0.03824806213378906, 0.04154205322265625, 0.04483604431152344, 0.048130035400390625, 0.05142402648925781, 0.054718017578125, 0.05801200866699219, 0.061305999755859375, 0.06459999084472656, 0.06789398193359375, 0.07118797302246094, 0.07448196411132812, 0.07777595520019531, 0.0810699462890625, 0.08436393737792969, 0.08765792846679688, 0.09095191955566406, 0.09424591064453125, 0.09753990173339844, 0.10083389282226562, 0.10412788391113281, 0.107421875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 7.0, 2.0, 6.0, 5.0, 3.0, 6.0, 7.0, 7.0, 9.0, 20.0, 15.0, 22.0, 48.0, 106.0, 209.0, 224.0, 123.0, 59.0, 31.0, 14.0, 13.0, 9.0, 13.0, 8.0, 4.0, 3.0, 4.0, 3.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.096923828125, -0.09407806396484375, -0.0912322998046875, -0.08838653564453125, -0.085540771484375, -0.08269500732421875, -0.0798492431640625, -0.07700347900390625, -0.07415771484375, -0.07131195068359375, -0.0684661865234375, -0.06562042236328125, -0.062774658203125, -0.05992889404296875, -0.0570831298828125, -0.05423736572265625, -0.0513916015625, -0.04854583740234375, -0.0457000732421875, -0.04285430908203125, -0.040008544921875, -0.03716278076171875, -0.0343170166015625, -0.03147125244140625, -0.02862548828125, -0.02577972412109375, -0.0229339599609375, -0.02008819580078125, -0.017242431640625, -0.01439666748046875, -0.0115509033203125, -0.00870513916015625, -0.005859375, -0.00301361083984375, -0.0001678466796875, 0.00267791748046875, 0.005523681640625, 0.00836944580078125, 0.0112152099609375, 0.01406097412109375, 0.01690673828125, 0.01975250244140625, 0.0225982666015625, 0.02544403076171875, 0.028289794921875, 0.03113555908203125, 0.0339813232421875, 0.03682708740234375, 0.0396728515625, 0.04251861572265625, 0.0453643798828125, 0.04821014404296875, 0.051055908203125, 0.05390167236328125, 0.0567474365234375, 0.05959320068359375, 0.06243896484375, 0.06528472900390625, 0.0681304931640625, 0.07097625732421875, 0.073822021484375, 0.07666778564453125, 0.0795135498046875, 0.08235931396484375, 0.085205078125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 11.0, 29.0, 114.0, 293.0, 311.0, 163.0, 59.0, 16.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9813679456710815, -0.9007859230041504, -0.8202039003372192, -0.7396219372749329, -0.6590399146080017, -0.5784578919410706, -0.4978758990764618, -0.417293906211853, -0.3367118835449219, -0.2561298608779907, -0.17554786801338196, -0.094965860247612, -0.014383852481842041, 0.06619817018508911, 0.14678016304969788, 0.22736215591430664, 0.3079441785812378, 0.38852620124816895, 0.4691081941127777, 0.5496901869773865, 0.6302722096443176, 0.7108542323112488, 0.7914361953735352, 0.8720182180404663, 0.9526002407073975, 1.0331822633743286, 1.1137642860412598, 1.194346308708191, 1.274928331375122, 1.3555102348327637, 1.4360922574996948, 1.516674280166626, 1.5972561836242676, 1.6778382062911987, 1.7584202289581299, 1.839002251625061, 1.9195842742919922, 2.000166177749634, 2.0807483196258545, 2.161330223083496, 2.241912364959717, 2.3224942684173584, 2.403076410293579, 2.4836583137512207, 2.5642404556274414, 2.644822359085083, 2.7254045009613037, 2.8059864044189453, 2.886568307876587, 2.9671502113342285, 3.047732353210449, 3.128314256668091, 3.2088963985443115, 3.289478302001953, 3.370060443878174, 3.4506423473358154, 3.531224250793457, 3.6118061542510986, 3.6923882961273193, 3.772970199584961, 3.8535523414611816, 3.9341342449188232, 4.014716148376465, 4.0952982902526855, 4.175880432128906]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 2.0, 6.0, 12.0, 16.0, 14.0, 7.0, 22.0, 13.0, 15.0, 25.0, 20.0, 19.0, 24.0, 18.0, 22.0, 32.0, 29.0, 41.0, 36.0, 42.0, 45.0, 27.0, 38.0, 40.0, 48.0, 37.0, 41.0, 30.0, 34.0, 24.0, 15.0, 19.0, 26.0, 30.0, 20.0, 12.0, 19.0, 10.0, 17.0, 9.0, 12.0, 9.0, 5.0, 5.0, 3.0, 4.0, 1.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.6211733818054199, -0.6012370586395264, -0.5813007354736328, -0.5613644123077393, -0.5414280891418457, -0.5214917659759521, -0.5015554428100586, -0.4816191494464874, -0.46168282628059387, -0.4417465031147003, -0.42181017994880676, -0.4018738567829132, -0.38193756341934204, -0.3620012402534485, -0.34206491708755493, -0.3221285939216614, -0.3021922707557678, -0.28225594758987427, -0.2623196244239807, -0.24238331615924835, -0.2224469929933548, -0.20251066982746124, -0.18257436156272888, -0.16263803839683533, -0.14270171523094177, -0.12276539206504822, -0.10282907634973526, -0.0828927606344223, -0.06295643746852875, -0.04302011430263519, -0.023083798587322235, -0.0031474828720092773, 0.016788840293884277, 0.036725159734487534, 0.05666147917509079, 0.07659779489040375, 0.0965341180562973, 0.11647044122219086, 0.13640674948692322, 0.15634307265281677, 0.17627939581871033, 0.19621571898460388, 0.21615204215049744, 0.2360883504152298, 0.25602465867996216, 0.2759609818458557, 0.29589730501174927, 0.3158336281776428, 0.3357699513435364, 0.35570627450942993, 0.3756425976753235, 0.39557892084121704, 0.4155152440071106, 0.43545156717300415, 0.4553878605365753, 0.47532418370246887, 0.4952605068683624, 0.5151968002319336, 0.5351331233978271, 0.5550694465637207, 0.5750057697296143, 0.5949420928955078, 0.6148784160614014, 0.6348147392272949, 0.6547510623931885]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 2.0, 3.0, 8.0, 5.0, 10.0, 25.0, 28.0, 52.0, 73.0, 122.0, 180.0, 341.0, 594.0, 1037.0, 1771.0, 3311.0, 6697.0, 15294.0, 45056.0, 274311.0, 3626938.0, 160182.0, 33887.0, 12305.0, 5557.0, 2807.0, 1516.0, 892.0, 544.0, 276.0, 174.0, 105.0, 70.0, 51.0, 15.0, 19.0, 10.0, 10.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.25537109375, -0.24920082092285156, -0.24303054809570312, -0.2368602752685547, -0.23069000244140625, -0.2245197296142578, -0.21834945678710938, -0.21217918395996094, -0.2060089111328125, -0.19983863830566406, -0.19366836547851562, -0.1874980926513672, -0.18132781982421875, -0.1751575469970703, -0.16898727416992188, -0.16281700134277344, -0.156646728515625, -0.15047645568847656, -0.14430618286132812, -0.1381359100341797, -0.13196563720703125, -0.1257953643798828, -0.11962509155273438, -0.11345481872558594, -0.1072845458984375, -0.10111427307128906, -0.09494400024414062, -0.08877372741699219, -0.08260345458984375, -0.07643318176269531, -0.07026290893554688, -0.06409263610839844, -0.05792236328125, -0.05175209045410156, -0.045581817626953125, -0.03941154479980469, -0.03324127197265625, -0.027070999145507812, -0.020900726318359375, -0.014730453491210938, -0.0085601806640625, -0.0023899078369140625, 0.003780364990234375, 0.009950637817382812, 0.01612091064453125, 0.022291183471679688, 0.028461456298828125, 0.03463172912597656, 0.040802001953125, 0.04697227478027344, 0.053142547607421875, 0.05931282043457031, 0.06548309326171875, 0.07165336608886719, 0.07782363891601562, 0.08399391174316406, 0.0901641845703125, 0.09633445739746094, 0.10250473022460938, 0.10867500305175781, 0.11484527587890625, 0.12101554870605469, 0.12718582153320312, 0.13335609436035156, 0.1395263671875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 9.0, 9.0, 15.0, 12.0, 17.0, 19.0, 21.0, 24.0, 17.0, 24.0, 19.0, 32.0, 31.0, 33.0, 34.0, 38.0, 42.0, 37.0, 43.0, 34.0, 38.0, 42.0, 43.0, 35.0, 29.0, 35.0, 32.0, 24.0, 29.0, 24.0, 28.0, 16.0, 17.0, 22.0, 14.0, 8.0, 15.0, 7.0, 6.0, 2.0, 1.0, 2.0, 6.0, 1.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.032196044921875, -0.03123307228088379, -0.030270099639892578, -0.029307126998901367, -0.028344154357910156, -0.027381181716918945, -0.026418209075927734, -0.025455236434936523, -0.024492263793945312, -0.0235292911529541, -0.02256631851196289, -0.02160334587097168, -0.02064037322998047, -0.019677400588989258, -0.018714427947998047, -0.017751455307006836, -0.016788482666015625, -0.015825510025024414, -0.014862537384033203, -0.013899564743041992, -0.012936592102050781, -0.01197361946105957, -0.01101064682006836, -0.010047674179077148, -0.009084701538085938, -0.008121728897094727, -0.007158756256103516, -0.006195783615112305, -0.005232810974121094, -0.004269838333129883, -0.003306865692138672, -0.002343893051147461, -0.00138092041015625, -0.00041794776916503906, 0.0005450248718261719, 0.0015079975128173828, 0.0024709701538085938, 0.0034339427947998047, 0.004396915435791016, 0.0053598880767822266, 0.0063228607177734375, 0.0072858333587646484, 0.00824880599975586, 0.00921177864074707, 0.010174751281738281, 0.011137723922729492, 0.012100696563720703, 0.013063669204711914, 0.014026641845703125, 0.014989614486694336, 0.015952587127685547, 0.016915559768676758, 0.01787853240966797, 0.01884150505065918, 0.01980447769165039, 0.0207674503326416, 0.021730422973632812, 0.022693395614624023, 0.023656368255615234, 0.024619340896606445, 0.025582313537597656, 0.026545286178588867, 0.027508258819580078, 0.02847123146057129, 0.0294342041015625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 7.0, 5.0, 7.0, 12.0, 7.0, 31.0, 40.0, 32.0, 54.0, 102.0, 255.0, 727.0, 2937.0, 35754.0, 4089469.0, 59573.0, 3796.0, 832.0, 263.0, 125.0, 82.0, 50.0, 41.0, 26.0, 21.0, 9.0, 14.0, 0.0, 11.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65576171875, -0.6267013549804688, -0.5976409912109375, -0.5685806274414062, -0.539520263671875, -0.5104598999023438, -0.4813995361328125, -0.45233917236328125, -0.42327880859375, -0.39421844482421875, -0.3651580810546875, -0.33609771728515625, -0.307037353515625, -0.27797698974609375, -0.2489166259765625, -0.21985626220703125, -0.1907958984375, -0.16173553466796875, -0.1326751708984375, -0.10361480712890625, -0.074554443359375, -0.04549407958984375, -0.0164337158203125, 0.01262664794921875, 0.04168701171875, 0.07074737548828125, 0.0998077392578125, 0.12886810302734375, 0.157928466796875, 0.18698883056640625, 0.2160491943359375, 0.24510955810546875, 0.274169921875, 0.30323028564453125, 0.3322906494140625, 0.36135101318359375, 0.390411376953125, 0.41947174072265625, 0.4485321044921875, 0.47759246826171875, 0.50665283203125, 0.5357131958007812, 0.5647735595703125, 0.5938339233398438, 0.622894287109375, 0.6519546508789062, 0.6810150146484375, 0.7100753784179688, 0.7391357421875, 0.7681961059570312, 0.7972564697265625, 0.8263168334960938, 0.855377197265625, 0.8844375610351562, 0.9134979248046875, 0.9425582885742188, 0.97161865234375, 1.0006790161132812, 1.0297393798828125, 1.0587997436523438, 1.087860107421875, 1.1169204711914062, 1.1459808349609375, 1.1750411987304688, 1.2041015625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 12.0, 24.0, 35.0, 97.0, 352.0, 2965.0, 394.0, 100.0, 40.0, 19.0, 19.0, 6.0, 4.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1546630859375, -0.1458415985107422, -0.13702011108398438, -0.12819862365722656, -0.11937713623046875, -0.11055564880371094, -0.10173416137695312, -0.09291267395019531, -0.0840911865234375, -0.07526969909667969, -0.06644821166992188, -0.05762672424316406, -0.04880523681640625, -0.03998374938964844, -0.031162261962890625, -0.022340774536132812, -0.013519287109375, -0.0046977996826171875, 0.004123687744140625, 0.012945175170898438, 0.02176666259765625, 0.030588150024414062, 0.039409637451171875, 0.04823112487792969, 0.0570526123046875, 0.06587409973144531, 0.07469558715820312, 0.08351707458496094, 0.09233856201171875, 0.10116004943847656, 0.10998153686523438, 0.11880302429199219, 0.12762451171875, 0.1364459991455078, 0.14526748657226562, 0.15408897399902344, 0.16291046142578125, 0.17173194885253906, 0.18055343627929688, 0.1893749237060547, 0.1981964111328125, 0.2070178985595703, 0.21583938598632812, 0.22466087341308594, 0.23348236083984375, 0.24230384826660156, 0.2511253356933594, 0.2599468231201172, 0.268768310546875, 0.2775897979736328, 0.2864112854003906, 0.29523277282714844, 0.30405426025390625, 0.31287574768066406, 0.3216972351074219, 0.3305187225341797, 0.3393402099609375, 0.3481616973876953, 0.3569831848144531, 0.36580467224121094, 0.37462615966796875, 0.38344764709472656, 0.3922691345214844, 0.4010906219482422, 0.409912109375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 8.0, 22.0, 24.0, 40.0, 86.0, 119.0, 208.0, 171.0, 125.0, 76.0, 49.0, 28.0, 16.0, 8.0, 4.0, 2.0, 9.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1639801263809204, -1.1332707405090332, -1.1025614738464355, -1.0718520879745483, -1.0411428213119507, -1.0104334354400635, -0.979724109172821, -0.9490147829055786, -0.9183054566383362, -0.8875961303710938, -0.8568868041038513, -0.8261774778366089, -0.7954680919647217, -0.764758825302124, -0.7340494394302368, -0.7033401131629944, -0.672630786895752, -0.6419214606285095, -0.6112121343612671, -0.5805028080940247, -0.5497934818267822, -0.519084095954895, -0.4883747696876526, -0.45766544342041016, -0.4269561171531677, -0.3962467908859253, -0.36553746461868286, -0.33482810854911804, -0.3041187822818756, -0.2734094560146332, -0.24270011484622955, -0.21199077367782593, -0.18128150701522827, -0.15057218074798584, -0.11986283957958221, -0.08915350586175919, -0.05844417214393616, -0.027734845876693726, 0.0029744952917099, 0.033683836460113525, 0.06439316272735596, 0.09510249644517899, 0.12581183016300201, 0.15652117133140564, 0.18723049759864807, 0.2179398238658905, 0.24864916503429413, 0.27935850620269775, 0.3100678324699402, 0.3407771587371826, 0.37148648500442505, 0.40219584107398987, 0.4329051673412323, 0.46361449360847473, 0.49432384967803955, 0.525033175945282, 0.5557425022125244, 0.5864518284797668, 0.6171611547470093, 0.6478704810142517, 0.6785798072814941, 0.7092891931533813, 0.7399985194206238, 0.7707078456878662, 0.8014171719551086]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 6.0, 4.0, 6.0, 9.0, 12.0, 8.0, 8.0, 15.0, 20.0, 16.0, 21.0, 25.0, 24.0, 30.0, 38.0, 38.0, 44.0, 41.0, 47.0, 35.0, 33.0, 59.0, 50.0, 46.0, 42.0, 42.0, 41.0, 24.0, 41.0, 28.0, 30.0, 22.0, 14.0, 15.0, 18.0, 14.0, 6.0, 6.0, 8.0, 5.0, 6.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4577382802963257, -0.44301486015319824, -0.4282914698123932, -0.41356804966926575, -0.3988446295261383, -0.38412123918533325, -0.3693978190422058, -0.35467439889907837, -0.3399509787559509, -0.3252275586128235, -0.31050416827201843, -0.295780748128891, -0.28105732798576355, -0.2663339376449585, -0.25161051750183105, -0.2368870973587036, -0.22216370701789856, -0.2074403017759323, -0.19271688163280487, -0.17799347639083862, -0.16327005624771118, -0.14854665100574493, -0.1338232457637787, -0.11909983307123184, -0.104376420378685, -0.08965300768613815, -0.07492959499359131, -0.06020618975162506, -0.04548277705907822, -0.030759364366531372, -0.016035959124565125, -0.00131254643201828, 0.013410866260528564, 0.02813427709043026, 0.042857687920331955, 0.0575810968875885, 0.07230450958013535, 0.08702792227268219, 0.10175132751464844, 0.11647474020719528, 0.13119815289974213, 0.14592155814170837, 0.16064497828483582, 0.17536838352680206, 0.1900917887687683, 0.20481520891189575, 0.219538614153862, 0.23426201939582825, 0.2489854395389557, 0.26370885968208313, 0.2784322500228882, 0.2931556701660156, 0.30787909030914307, 0.3226025104522705, 0.33732590079307556, 0.352049320936203, 0.36677271127700806, 0.3814961314201355, 0.39621952176094055, 0.410942941904068, 0.42566636204719543, 0.4403897523880005, 0.45511317253112793, 0.46983659267425537, 0.4845600128173828]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 4.0, 7.0, 4.0, 14.0, 14.0, 43.0, 50.0, 91.0, 186.0, 317.0, 592.0, 1261.0, 2903.0, 7308.0, 19841.0, 62455.0, 214376.0, 493058.0, 168203.0, 50396.0, 16575.0, 6107.0, 2452.0, 1123.0, 536.0, 280.0, 156.0, 78.0, 44.0, 38.0, 17.0, 5.0, 10.0, 8.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1715087890625, -0.16475868225097656, -0.15800857543945312, -0.1512584686279297, -0.14450836181640625, -0.1377582550048828, -0.13100814819335938, -0.12425804138183594, -0.1175079345703125, -0.11075782775878906, -0.10400772094726562, -0.09725761413574219, -0.09050750732421875, -0.08375740051269531, -0.07700729370117188, -0.07025718688964844, -0.063507080078125, -0.05675697326660156, -0.050006866455078125, -0.04325675964355469, -0.03650665283203125, -0.029756546020507812, -0.023006439208984375, -0.016256332397460938, -0.0095062255859375, -0.0027561187744140625, 0.003993988037109375, 0.010744094848632812, 0.01749420166015625, 0.024244308471679688, 0.030994415283203125, 0.03774452209472656, 0.04449462890625, 0.05124473571777344, 0.057994842529296875, 0.06474494934082031, 0.07149505615234375, 0.07824516296386719, 0.08499526977539062, 0.09174537658691406, 0.0984954833984375, 0.10524559020996094, 0.11199569702148438, 0.11874580383300781, 0.12549591064453125, 0.1322460174560547, 0.13899612426757812, 0.14574623107910156, 0.152496337890625, 0.15924644470214844, 0.16599655151367188, 0.1727466583251953, 0.17949676513671875, 0.1862468719482422, 0.19299697875976562, 0.19974708557128906, 0.2064971923828125, 0.21324729919433594, 0.21999740600585938, 0.2267475128173828, 0.23349761962890625, 0.2402477264404297, 0.24699783325195312, 0.25374794006347656, 0.260498046875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 7.0, 5.0, 5.0, 7.0, 9.0, 9.0, 12.0, 10.0, 19.0, 18.0, 22.0, 23.0, 27.0, 29.0, 33.0, 27.0, 34.0, 26.0, 34.0, 33.0, 48.0, 34.0, 38.0, 42.0, 37.0, 42.0, 38.0, 36.0, 36.0, 33.0, 37.0, 28.0, 22.0, 24.0, 21.0, 14.0, 17.0, 16.0, 13.0, 7.0, 7.0, 4.0, 7.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.042266845703125, -0.04100465774536133, -0.039742469787597656, -0.038480281829833984, -0.03721809387207031, -0.03595590591430664, -0.03469371795654297, -0.0334315299987793, -0.032169342041015625, -0.030907154083251953, -0.02964496612548828, -0.02838277816772461, -0.027120590209960938, -0.025858402252197266, -0.024596214294433594, -0.023334026336669922, -0.02207183837890625, -0.020809650421142578, -0.019547462463378906, -0.018285274505615234, -0.017023086547851562, -0.01576089859008789, -0.014498710632324219, -0.013236522674560547, -0.011974334716796875, -0.010712146759033203, -0.009449958801269531, -0.00818777084350586, -0.0069255828857421875, -0.005663394927978516, -0.004401206970214844, -0.003139019012451172, -0.0018768310546875, -0.0006146430969238281, 0.0006475448608398438, 0.0019097328186035156, 0.0031719207763671875, 0.004434108734130859, 0.005696296691894531, 0.006958484649658203, 0.008220672607421875, 0.009482860565185547, 0.010745048522949219, 0.01200723648071289, 0.013269424438476562, 0.014531612396240234, 0.015793800354003906, 0.017055988311767578, 0.01831817626953125, 0.019580364227294922, 0.020842552185058594, 0.022104740142822266, 0.023366928100585938, 0.02462911605834961, 0.02589130401611328, 0.027153491973876953, 0.028415679931640625, 0.029677867889404297, 0.03094005584716797, 0.03220224380493164, 0.03346443176269531, 0.034726619720458984, 0.035988807678222656, 0.03725099563598633, 0.03851318359375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 6.0, 5.0, 11.0, 13.0, 17.0, 25.0, 39.0, 41.0, 69.0, 84.0, 118.0, 191.0, 236.0, 346.0, 600.0, 915.0, 1724.0, 3799.0, 10789.0, 44075.0, 250974.0, 606974.0, 95703.0, 20062.0, 5963.0, 2439.0, 1264.0, 688.0, 416.0, 264.0, 208.0, 137.0, 109.0, 63.0, 49.0, 27.0, 24.0, 31.0, 20.0, 6.0, 10.0, 4.0, 8.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.283935546875, -0.2748451232910156, -0.26575469970703125, -0.2566642761230469, -0.2475738525390625, -0.23848342895507812, -0.22939300537109375, -0.22030258178710938, -0.211212158203125, -0.20212173461914062, -0.19303131103515625, -0.18394088745117188, -0.1748504638671875, -0.16576004028320312, -0.15666961669921875, -0.14757919311523438, -0.13848876953125, -0.12939834594726562, -0.12030792236328125, -0.11121749877929688, -0.1021270751953125, -0.09303665161132812, -0.08394622802734375, -0.07485580444335938, -0.065765380859375, -0.056674957275390625, -0.04758453369140625, -0.038494110107421875, -0.0294036865234375, -0.020313262939453125, -0.01122283935546875, -0.002132415771484375, 0.0069580078125, 0.016048431396484375, 0.02513885498046875, 0.034229278564453125, 0.0433197021484375, 0.052410125732421875, 0.06150054931640625, 0.07059097290039062, 0.079681396484375, 0.08877182006835938, 0.09786224365234375, 0.10695266723632812, 0.1160430908203125, 0.12513351440429688, 0.13422393798828125, 0.14331436157226562, 0.15240478515625, 0.16149520874023438, 0.17058563232421875, 0.17967605590820312, 0.1887664794921875, 0.19785690307617188, 0.20694732666015625, 0.21603775024414062, 0.225128173828125, 0.23421859741210938, 0.24330902099609375, 0.2523994445800781, 0.2614898681640625, 0.2705802917480469, 0.27967071533203125, 0.2887611389160156, 0.2978515625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 7.0, 5.0, 15.0, 9.0, 15.0, 13.0, 19.0, 26.0, 25.0, 34.0, 40.0, 48.0, 37.0, 47.0, 61.0, 55.0, 70.0, 58.0, 55.0, 51.0, 42.0, 35.0, 30.0, 29.0, 31.0, 27.0, 21.0, 14.0, 15.0, 12.0, 13.0, 12.0, 4.0, 3.0, 6.0, 3.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.23681640625, -0.22795486450195312, -0.21909332275390625, -0.21023178100585938, -0.2013702392578125, -0.19250869750976562, -0.18364715576171875, -0.17478561401367188, -0.165924072265625, -0.15706253051757812, -0.14820098876953125, -0.13933944702148438, -0.1304779052734375, -0.12161636352539062, -0.11275482177734375, -0.10389328002929688, -0.09503173828125, -0.08617019653320312, -0.07730865478515625, -0.06844711303710938, -0.0595855712890625, -0.050724029541015625, -0.04186248779296875, -0.033000946044921875, -0.024139404296875, -0.015277862548828125, -0.00641632080078125, 0.002445220947265625, 0.0113067626953125, 0.020168304443359375, 0.02902984619140625, 0.037891387939453125, 0.0467529296875, 0.055614471435546875, 0.06447601318359375, 0.07333755493164062, 0.0821990966796875, 0.09106063842773438, 0.09992218017578125, 0.10878372192382812, 0.117645263671875, 0.12650680541992188, 0.13536834716796875, 0.14422988891601562, 0.1530914306640625, 0.16195297241210938, 0.17081451416015625, 0.17967605590820312, 0.18853759765625, 0.19739913940429688, 0.20626068115234375, 0.21512222290039062, 0.2239837646484375, 0.23284530639648438, 0.24170684814453125, 0.2505683898925781, 0.259429931640625, 0.2682914733886719, 0.27715301513671875, 0.2860145568847656, 0.2948760986328125, 0.3037376403808594, 0.31259918212890625, 0.3214607238769531, 0.330322265625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 6.0, 3.0, 16.0, 20.0, 27.0, 56.0, 81.0, 167.0, 345.0, 808.0, 2554.0, 20841.0, 997900.0, 21743.0, 2493.0, 791.0, 311.0, 160.0, 102.0, 46.0, 34.0, 17.0, 9.0, 7.0, 6.0, 9.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8583984375, -0.8342208862304688, -0.8100433349609375, -0.7858657836914062, -0.761688232421875, -0.7375106811523438, -0.7133331298828125, -0.6891555786132812, -0.66497802734375, -0.6408004760742188, -0.6166229248046875, -0.5924453735351562, -0.568267822265625, -0.5440902709960938, -0.5199127197265625, -0.49573516845703125, -0.4715576171875, -0.44738006591796875, -0.4232025146484375, -0.39902496337890625, -0.374847412109375, -0.35066986083984375, -0.3264923095703125, -0.30231475830078125, -0.27813720703125, -0.25395965576171875, -0.2297821044921875, -0.20560455322265625, -0.181427001953125, -0.15724945068359375, -0.1330718994140625, -0.10889434814453125, -0.084716796875, -0.06053924560546875, -0.0363616943359375, -0.01218414306640625, 0.011993408203125, 0.03617095947265625, 0.0603485107421875, 0.08452606201171875, 0.10870361328125, 0.13288116455078125, 0.1570587158203125, 0.18123626708984375, 0.205413818359375, 0.22959136962890625, 0.2537689208984375, 0.27794647216796875, 0.3021240234375, 0.32630157470703125, 0.3504791259765625, 0.37465667724609375, 0.398834228515625, 0.42301177978515625, 0.4471893310546875, 0.47136688232421875, 0.49554443359375, 0.5197219848632812, 0.5438995361328125, 0.5680770874023438, 0.592254638671875, 0.6164321899414062, 0.6406097412109375, 0.6647872924804688, 0.68896484375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 10.0, 15.0, 32.0, 33.0, 44.0, 46.0, 80.0, 107.0, 103.0, 107.0, 126.0, 87.0, 75.0, 35.0, 29.0, 27.0, 17.0, 9.0, 4.0, 8.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0001227855682373047, -0.00011971313506364822, -0.00011664070188999176, -0.0001135682687163353, -0.00011049583554267883, -0.00010742340236902237, -0.0001043509691953659, -0.00010127853602170944, -9.820610284805298e-05, -9.513366967439651e-05, -9.206123650074005e-05, -8.898880332708359e-05, -8.591637015342712e-05, -8.284393697977066e-05, -7.97715038061142e-05, -7.669907063245773e-05, -7.362663745880127e-05, -7.05542042851448e-05, -6.748177111148834e-05, -6.440933793783188e-05, -6.133690476417542e-05, -5.826447159051895e-05, -5.519203841686249e-05, -5.2119605243206024e-05, -4.904717206954956e-05, -4.59747388958931e-05, -4.290230572223663e-05, -3.982987254858017e-05, -3.6757439374923706e-05, -3.368500620126724e-05, -3.061257302761078e-05, -2.7540139853954315e-05, -2.446770668029785e-05, -2.1395273506641388e-05, -1.8322840332984924e-05, -1.525040715932846e-05, -1.2177973985671997e-05, -9.105540812015533e-06, -6.03310763835907e-06, -2.960674464702606e-06, 1.1175870895385742e-07, 3.184191882610321e-06, 6.256625056266785e-06, 9.329058229923248e-06, 1.2401491403579712e-05, 1.5473924577236176e-05, 1.854635775089264e-05, 2.1618790924549103e-05, 2.4691224098205566e-05, 2.776365727186203e-05, 3.0836090445518494e-05, 3.390852361917496e-05, 3.698095679283142e-05, 4.0053389966487885e-05, 4.312582314014435e-05, 4.619825631380081e-05, 4.9270689487457275e-05, 5.234312266111374e-05, 5.54155558347702e-05, 5.8487989008426666e-05, 6.156042218208313e-05, 6.46328553557396e-05, 6.770528852939606e-05, 7.077772170305252e-05, 7.385015487670898e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 5.0, 7.0, 7.0, 12.0, 21.0, 21.0, 41.0, 45.0, 87.0, 135.0, 235.0, 410.0, 1018.0, 2820.0, 11485.0, 326860.0, 685081.0, 14716.0, 3247.0, 1170.0, 488.0, 268.0, 134.0, 76.0, 59.0, 24.0, 21.0, 18.0, 19.0, 10.0, 3.0, 4.0, 4.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.430908203125, -0.4165763854980469, -0.40224456787109375, -0.3879127502441406, -0.3735809326171875, -0.3592491149902344, -0.34491729736328125, -0.3305854797363281, -0.316253662109375, -0.3019218444824219, -0.28759002685546875, -0.2732582092285156, -0.2589263916015625, -0.24459457397460938, -0.23026275634765625, -0.21593093872070312, -0.20159912109375, -0.18726730346679688, -0.17293548583984375, -0.15860366821289062, -0.1442718505859375, -0.12994003295898438, -0.11560821533203125, -0.10127639770507812, -0.086944580078125, -0.07261276245117188, -0.05828094482421875, -0.043949127197265625, -0.0296173095703125, -0.015285491943359375, -0.00095367431640625, 0.013378143310546875, 0.0277099609375, 0.042041778564453125, 0.05637359619140625, 0.07070541381835938, 0.0850372314453125, 0.09936904907226562, 0.11370086669921875, 0.12803268432617188, 0.142364501953125, 0.15669631958007812, 0.17102813720703125, 0.18535995483398438, 0.1996917724609375, 0.21402359008789062, 0.22835540771484375, 0.24268722534179688, 0.25701904296875, 0.2713508605957031, 0.28568267822265625, 0.3000144958496094, 0.3143463134765625, 0.3286781311035156, 0.34300994873046875, 0.3573417663574219, 0.371673583984375, 0.3860054016113281, 0.40033721923828125, 0.4146690368652344, 0.4290008544921875, 0.4433326721191406, 0.45766448974609375, 0.4719963073730469, 0.486328125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 0.0, 5.0, 4.0, 7.0, 6.0, 2.0, 9.0, 16.0, 22.0, 47.0, 62.0, 132.0, 215.0, 190.0, 107.0, 67.0, 44.0, 25.0, 16.0, 1.0, 5.0, 3.0, 3.0, 0.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.310791015625, -0.3018836975097656, -0.29297637939453125, -0.2840690612792969, -0.2751617431640625, -0.2662544250488281, -0.25734710693359375, -0.24843978881835938, -0.239532470703125, -0.23062515258789062, -0.22171783447265625, -0.21281051635742188, -0.2039031982421875, -0.19499588012695312, -0.18608856201171875, -0.17718124389648438, -0.16827392578125, -0.15936660766601562, -0.15045928955078125, -0.14155197143554688, -0.1326446533203125, -0.12373733520507812, -0.11483001708984375, -0.10592269897460938, -0.097015380859375, -0.08810806274414062, -0.07920074462890625, -0.07029342651367188, -0.0613861083984375, -0.052478790283203125, -0.04357147216796875, -0.034664154052734375, -0.0257568359375, -0.016849517822265625, -0.00794219970703125, 0.000965118408203125, 0.0098724365234375, 0.018779754638671875, 0.02768707275390625, 0.036594390869140625, 0.045501708984375, 0.054409027099609375, 0.06331634521484375, 0.07222366333007812, 0.0811309814453125, 0.09003829956054688, 0.09894561767578125, 0.10785293579101562, 0.11676025390625, 0.12566757202148438, 0.13457489013671875, 0.14348220825195312, 0.1523895263671875, 0.16129684448242188, 0.17020416259765625, 0.17911148071289062, 0.188018798828125, 0.19692611694335938, 0.20583343505859375, 0.21474075317382812, 0.2236480712890625, 0.23255538940429688, 0.24146270751953125, 0.2503700256347656, 0.25927734375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 6.0, 16.0, 18.0, 36.0, 88.0, 143.0, 191.0, 182.0, 129.0, 85.0, 55.0, 24.0, 11.0, 8.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7615129947662354, -2.662475347518921, -2.5634377002716064, -2.464400053024292, -2.3653626441955566, -2.266324996948242, -2.1672873497009277, -2.0682497024536133, -1.9692120552062988, -1.8701744079589844, -1.77113676071167, -1.672099232673645, -1.5730615854263306, -1.4740239381790161, -1.3749864101409912, -1.2759487628936768, -1.1769111156463623, -1.0778734683990479, -0.9788358807563782, -0.8797982931137085, -0.780760645866394, -0.6817229986190796, -0.5826854109764099, -0.48364782333374023, -0.3846101760864258, -0.2855725586414337, -0.18653494119644165, -0.08749732375144958, 0.01154029369354248, 0.11057791113853455, 0.2096155285835266, 0.3086531162261963, 0.40769052505493164, 0.5067281723022461, 0.6057657599449158, 0.7048033475875854, 0.8038409948348999, 0.9028786420822144, 1.0019161701202393, 1.1009538173675537, 1.1999914646148682, 1.2990291118621826, 1.398066759109497, 1.497104287147522, 1.5961419343948364, 1.6951795816421509, 1.7942171096801758, 1.8932547569274902, 1.9922924041748047, 2.091330051422119, 2.1903676986694336, 2.289405345916748, 2.3884429931640625, 2.487480401992798, 2.5865180492401123, 2.6855556964874268, 2.784593343734741, 2.8836309909820557, 2.98266863822937, 3.0817062854766846, 3.18074369430542, 3.2797813415527344, 3.378818988800049, 3.4778566360473633, 3.5768942832946777]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 3.0, 4.0, 4.0, 7.0, 6.0, 13.0, 14.0, 15.0, 10.0, 14.0, 19.0, 17.0, 23.0, 33.0, 22.0, 31.0, 34.0, 26.0, 48.0, 39.0, 44.0, 42.0, 34.0, 41.0, 45.0, 45.0, 41.0, 44.0, 40.0, 40.0, 35.0, 19.0, 23.0, 19.0, 18.0, 14.0, 11.0, 6.0, 7.0, 8.0, 8.0, 9.0, 14.0, 4.0, 1.0, 3.0, 0.0, 3.0, 3.0, 0.0, 3.0, 3.0], "bins": [-1.4417780637741089, -1.4001396894454956, -1.3585011959075928, -1.3168628215789795, -1.2752244472503662, -1.2335859537124634, -1.19194757938385, -1.1503090858459473, -1.108670711517334, -1.0670323371887207, -1.0253938436508179, -0.9837554693222046, -0.9421170353889465, -0.9004786014556885, -0.8588402271270752, -0.8172017931938171, -0.7755633592605591, -0.733924925327301, -0.692286491394043, -0.6506481170654297, -0.6090096831321716, -0.5673712491989136, -0.5257328748703003, -0.48409444093704224, -0.4424560070037842, -0.4008175730705261, -0.35917916893959045, -0.3175407648086548, -0.27590233087539673, -0.23426391184329987, -0.192625492811203, -0.15098708868026733, -0.10934877395629883, -0.06771035492420197, -0.026071935892105103, 0.01556648313999176, 0.05720490217208862, 0.09884332120418549, 0.14048174023628235, 0.18212014436721802, 0.22375857830047607, 0.26539701223373413, 0.3070354163646698, 0.34867382049560547, 0.3903122544288635, 0.4319506883621216, 0.47358909249305725, 0.5152274966239929, 0.556865930557251, 0.598504364490509, 0.6401427984237671, 0.6817811727523804, 0.7234196066856384, 0.7650580406188965, 0.8066964149475098, 0.8483348488807678, 0.8899732828140259, 0.9316117167472839, 0.973250150680542, 1.0148885250091553, 1.0565268993377686, 1.0981653928756714, 1.1398037672042847, 1.1814422607421875, 1.2230806350708008]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 8.0, 10.0, 8.0, 19.0, 27.0, 45.0, 41.0, 90.0, 113.0, 189.0, 268.0, 353.0, 615.0, 1126.0, 2172.0, 4697.0, 12432.0, 37876.0, 188206.0, 3652982.0, 227306.0, 41797.0, 13156.0, 5222.0, 2369.0, 1188.0, 692.0, 454.0, 249.0, 173.0, 121.0, 82.0, 64.0, 45.0, 24.0, 24.0, 16.0, 9.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.27392578125, -0.2659950256347656, -0.25806427001953125, -0.2501335144042969, -0.2422027587890625, -0.23427200317382812, -0.22634124755859375, -0.21841049194335938, -0.210479736328125, -0.20254898071289062, -0.19461822509765625, -0.18668746948242188, -0.1787567138671875, -0.17082595825195312, -0.16289520263671875, -0.15496444702148438, -0.14703369140625, -0.13910293579101562, -0.13117218017578125, -0.12324142456054688, -0.1153106689453125, -0.10737991333007812, -0.09944915771484375, -0.09151840209960938, -0.083587646484375, -0.07565689086914062, -0.06772613525390625, -0.059795379638671875, -0.0518646240234375, -0.043933868408203125, -0.03600311279296875, -0.028072357177734375, -0.0201416015625, -0.012210845947265625, -0.00428009033203125, 0.003650665283203125, 0.0115814208984375, 0.019512176513671875, 0.02744293212890625, 0.035373687744140625, 0.043304443359375, 0.051235198974609375, 0.05916595458984375, 0.06709671020507812, 0.0750274658203125, 0.08295822143554688, 0.09088897705078125, 0.09881973266601562, 0.10675048828125, 0.11468124389648438, 0.12261199951171875, 0.13054275512695312, 0.1384735107421875, 0.14640426635742188, 0.15433502197265625, 0.16226577758789062, 0.170196533203125, 0.17812728881835938, 0.18605804443359375, 0.19398880004882812, 0.2019195556640625, 0.20985031127929688, 0.21778106689453125, 0.22571182250976562, 0.233642578125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 8.0, 2.0, 10.0, 10.0, 9.0, 12.0, 11.0, 13.0, 25.0, 20.0, 29.0, 25.0, 40.0, 25.0, 39.0, 40.0, 44.0, 48.0, 38.0, 39.0, 26.0, 37.0, 41.0, 33.0, 34.0, 43.0, 36.0, 35.0, 29.0, 30.0, 18.0, 23.0, 15.0, 21.0, 19.0, 11.0, 8.0, 15.0, 10.0, 5.0, 5.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0404052734375, -0.03900623321533203, -0.03760719299316406, -0.036208152770996094, -0.034809112548828125, -0.033410072326660156, -0.03201103210449219, -0.03061199188232422, -0.02921295166015625, -0.02781391143798828, -0.026414871215820312, -0.025015830993652344, -0.023616790771484375, -0.022217750549316406, -0.020818710327148438, -0.01941967010498047, -0.0180206298828125, -0.01662158966064453, -0.015222549438476562, -0.013823509216308594, -0.012424468994140625, -0.011025428771972656, -0.009626388549804688, -0.008227348327636719, -0.00682830810546875, -0.005429267883300781, -0.0040302276611328125, -0.0026311874389648438, -0.001232147216796875, 0.00016689300537109375, 0.0015659332275390625, 0.0029649734497070312, 0.004364013671875, 0.005763053894042969, 0.0071620941162109375, 0.008561134338378906, 0.009960174560546875, 0.011359214782714844, 0.012758255004882812, 0.014157295227050781, 0.01555633544921875, 0.01695537567138672, 0.018354415893554688, 0.019753456115722656, 0.021152496337890625, 0.022551536560058594, 0.023950576782226562, 0.02534961700439453, 0.0267486572265625, 0.02814769744873047, 0.029546737670898438, 0.030945777893066406, 0.032344818115234375, 0.033743858337402344, 0.03514289855957031, 0.03654193878173828, 0.03794097900390625, 0.03934001922607422, 0.04073905944824219, 0.042138099670410156, 0.043537139892578125, 0.044936180114746094, 0.04633522033691406, 0.04773426055908203, 0.04913330078125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 5.0, 7.0, 13.0, 12.0, 40.0, 36.0, 86.0, 162.0, 264.0, 512.0, 1115.0, 2626.0, 8396.0, 37852.0, 601028.0, 3454243.0, 69087.0, 12425.0, 3665.0, 1353.0, 641.0, 291.0, 188.0, 105.0, 53.0, 34.0, 18.0, 19.0, 10.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47314453125, -0.45795440673828125, -0.4427642822265625, -0.42757415771484375, -0.412384033203125, -0.39719390869140625, -0.3820037841796875, -0.36681365966796875, -0.35162353515625, -0.33643341064453125, -0.3212432861328125, -0.30605316162109375, -0.290863037109375, -0.27567291259765625, -0.2604827880859375, -0.24529266357421875, -0.2301025390625, -0.21491241455078125, -0.1997222900390625, -0.18453216552734375, -0.169342041015625, -0.15415191650390625, -0.1389617919921875, -0.12377166748046875, -0.10858154296875, -0.09339141845703125, -0.0782012939453125, -0.06301116943359375, -0.047821044921875, -0.03263092041015625, -0.0174407958984375, -0.00225067138671875, 0.012939453125, 0.02812957763671875, 0.0433197021484375, 0.05850982666015625, 0.073699951171875, 0.08889007568359375, 0.1040802001953125, 0.11927032470703125, 0.13446044921875, 0.14965057373046875, 0.1648406982421875, 0.18003082275390625, 0.195220947265625, 0.21041107177734375, 0.2256011962890625, 0.24079132080078125, 0.2559814453125, 0.27117156982421875, 0.2863616943359375, 0.30155181884765625, 0.316741943359375, 0.33193206787109375, 0.3471221923828125, 0.36231231689453125, 0.37750244140625, 0.39269256591796875, 0.4078826904296875, 0.42307281494140625, 0.438262939453125, 0.45345306396484375, 0.4686431884765625, 0.48383331298828125, 0.4990234375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 12.0, 6.0, 11.0, 14.0, 22.0, 42.0, 64.0, 89.0, 224.0, 566.0, 2131.0, 457.0, 180.0, 94.0, 52.0, 32.0, 21.0, 15.0, 7.0, 9.0, 4.0, 2.0, 5.0, 1.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1810302734375, -0.1746501922607422, -0.16827011108398438, -0.16189002990722656, -0.15550994873046875, -0.14912986755371094, -0.14274978637695312, -0.1363697052001953, -0.1299896240234375, -0.12360954284667969, -0.11722946166992188, -0.11084938049316406, -0.10446929931640625, -0.09808921813964844, -0.09170913696289062, -0.08532905578613281, -0.078948974609375, -0.07256889343261719, -0.06618881225585938, -0.05980873107910156, -0.05342864990234375, -0.04704856872558594, -0.040668487548828125, -0.03428840637207031, -0.0279083251953125, -0.021528244018554688, -0.015148162841796875, -0.008768081665039062, -0.00238800048828125, 0.0039920806884765625, 0.010372161865234375, 0.016752243041992188, 0.02313232421875, 0.029512405395507812, 0.035892486572265625, 0.04227256774902344, 0.04865264892578125, 0.05503273010253906, 0.061412811279296875, 0.06779289245605469, 0.0741729736328125, 0.08055305480957031, 0.08693313598632812, 0.09331321716308594, 0.09969329833984375, 0.10607337951660156, 0.11245346069335938, 0.11883354187011719, 0.125213623046875, 0.1315937042236328, 0.13797378540039062, 0.14435386657714844, 0.15073394775390625, 0.15711402893066406, 0.16349411010742188, 0.1698741912841797, 0.1762542724609375, 0.1826343536376953, 0.18901443481445312, 0.19539451599121094, 0.20177459716796875, 0.20815467834472656, 0.21453475952148438, 0.2209148406982422, 0.227294921875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 11.0, 22.0, 39.0, 93.0, 192.0, 281.0, 195.0, 104.0, 44.0, 10.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6991891860961914, -2.6360106468200684, -2.5728321075439453, -2.509653329849243, -2.44647479057312, -2.383296251296997, -2.320117712020874, -2.256938934326172, -2.193760395050049, -2.130581855773926, -2.0674033164978027, -2.0042245388031006, -1.9410459995269775, -1.8778674602508545, -1.8146889209747314, -1.7515102624893188, -1.6883317232131958, -1.6251531839370728, -1.5619745254516602, -1.498795986175537, -1.4356173276901245, -1.3724387884140015, -1.3092601299285889, -1.2460815906524658, -1.1829030513763428, -1.1197245121002197, -1.0565458536148071, -0.9933673143386841, -0.9301886558532715, -0.8670101165771484, -0.8038315176963806, -0.7406529188156128, -0.6774741411209106, -0.6142955422401428, -0.551116943359375, -0.48793837428092957, -0.42475977540016174, -0.3615811765193939, -0.2984026074409485, -0.23522400856018066, -0.17204540967941284, -0.10886681824922562, -0.04568822681903839, 0.017490357160568237, 0.08066895604133606, 0.14384755492210388, 0.20702612400054932, 0.27020472288131714, 0.33338332176208496, 0.3965619206428528, 0.4597405195236206, 0.5229190587997437, 0.5860977172851562, 0.6492762565612793, 0.7124548554420471, 0.7756334543228149, 0.8388120532035828, 0.9019906520843506, 0.9651692509651184, 1.0283478498458862, 1.0915263891220093, 1.1547050476074219, 1.217883586883545, 1.281062126159668, 1.3442407846450806]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 9.0, 8.0, 3.0, 7.0, 9.0, 11.0, 11.0, 17.0, 19.0, 22.0, 21.0, 32.0, 39.0, 27.0, 34.0, 30.0, 37.0, 35.0, 48.0, 42.0, 41.0, 41.0, 52.0, 47.0, 43.0, 31.0, 35.0, 31.0, 39.0, 18.0, 32.0, 17.0, 20.0, 14.0, 15.0, 16.0, 15.0, 12.0, 5.0, 5.0, 4.0, 3.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5356293320655823, -0.5192423462867737, -0.5028553605079651, -0.4864684045314789, -0.4700814485549927, -0.4536944627761841, -0.4373074769973755, -0.4209204912185669, -0.4045335352420807, -0.3881465494632721, -0.3717595934867859, -0.3553726077079773, -0.3389856219291687, -0.3225986659526825, -0.3062116801738739, -0.2898247241973877, -0.2734377384185791, -0.2570507526397705, -0.2406637966632843, -0.2242768108844757, -0.2078898400068283, -0.1915028691291809, -0.17511588335037231, -0.15872891247272491, -0.14234194159507751, -0.12595497071743011, -0.10956799238920212, -0.09318101406097412, -0.07679404318332672, -0.06040707230567932, -0.044020093977451324, -0.027633115649223328, -0.011246144771575928, 0.005140829831361771, 0.02152780443429947, 0.03791477903723717, 0.054301753640174866, 0.07068872451782227, 0.08707570284605026, 0.10346268117427826, 0.11984965205192566, 0.13623662292957306, 0.15262359380722046, 0.16901057958602905, 0.18539755046367645, 0.20178452134132385, 0.21817150712013245, 0.23455847799777985, 0.25094544887542725, 0.26733243465423584, 0.28371939063072205, 0.30010637640953064, 0.31649333238601685, 0.33288031816482544, 0.34926730394363403, 0.3656542897224426, 0.38204124569892883, 0.3984282314777374, 0.41481518745422363, 0.4312021732330322, 0.4475891590118408, 0.463976114988327, 0.4803631007671356, 0.4967500567436218, 0.5131370425224304]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 7.0, 11.0, 11.0, 24.0, 56.0, 72.0, 137.0, 234.0, 458.0, 967.0, 2085.0, 4656.0, 10878.0, 27256.0, 70405.0, 180527.0, 340878.0, 244586.0, 100176.0, 38469.0, 15067.0, 6299.0, 2796.0, 1220.0, 597.0, 300.0, 154.0, 82.0, 80.0, 21.0, 19.0, 11.0, 11.0, 8.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1949462890625, -0.18932533264160156, -0.18370437622070312, -0.1780834197998047, -0.17246246337890625, -0.1668415069580078, -0.16122055053710938, -0.15559959411621094, -0.1499786376953125, -0.14435768127441406, -0.13873672485351562, -0.1331157684326172, -0.12749481201171875, -0.12187385559082031, -0.11625289916992188, -0.11063194274902344, -0.105010986328125, -0.09939002990722656, -0.09376907348632812, -0.08814811706542969, -0.08252716064453125, -0.07690620422363281, -0.07128524780273438, -0.06566429138183594, -0.0600433349609375, -0.05442237854003906, -0.048801422119140625, -0.04318046569824219, -0.03755950927734375, -0.03193855285644531, -0.026317596435546875, -0.020696640014648438, -0.01507568359375, -0.009454727172851562, -0.003833770751953125, 0.0017871856689453125, 0.00740814208984375, 0.013029098510742188, 0.018650054931640625, 0.024271011352539062, 0.0298919677734375, 0.03551292419433594, 0.041133880615234375, 0.04675483703613281, 0.05237579345703125, 0.05799674987792969, 0.06361770629882812, 0.06923866271972656, 0.074859619140625, 0.08048057556152344, 0.08610153198242188, 0.09172248840332031, 0.09734344482421875, 0.10296440124511719, 0.10858535766601562, 0.11420631408691406, 0.1198272705078125, 0.12544822692871094, 0.13106918334960938, 0.1366901397705078, 0.14231109619140625, 0.1479320526123047, 0.15355300903320312, 0.15917396545410156, 0.164794921875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 6.0, 3.0, 4.0, 5.0, 10.0, 8.0, 13.0, 17.0, 17.0, 22.0, 22.0, 26.0, 20.0, 35.0, 33.0, 37.0, 30.0, 39.0, 24.0, 45.0, 38.0, 44.0, 56.0, 40.0, 48.0, 38.0, 43.0, 31.0, 42.0, 22.0, 25.0, 22.0, 24.0, 19.0, 19.0, 11.0, 13.0, 10.0, 8.0, 15.0, 3.0, 4.0, 6.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.052001953125, -0.0504145622253418, -0.048827171325683594, -0.04723978042602539, -0.04565238952636719, -0.044064998626708984, -0.04247760772705078, -0.04089021682739258, -0.039302825927734375, -0.03771543502807617, -0.03612804412841797, -0.034540653228759766, -0.03295326232910156, -0.03136587142944336, -0.029778480529785156, -0.028191089630126953, -0.02660369873046875, -0.025016307830810547, -0.023428916931152344, -0.02184152603149414, -0.020254135131835938, -0.018666744232177734, -0.01707935333251953, -0.015491962432861328, -0.013904571533203125, -0.012317180633544922, -0.010729789733886719, -0.009142398834228516, -0.0075550079345703125, -0.005967617034912109, -0.004380226135253906, -0.002792835235595703, -0.0012054443359375, 0.0003819465637207031, 0.0019693374633789062, 0.0035567283630371094, 0.0051441192626953125, 0.006731510162353516, 0.008318901062011719, 0.009906291961669922, 0.011493682861328125, 0.013081073760986328, 0.014668464660644531, 0.016255855560302734, 0.017843246459960938, 0.01943063735961914, 0.021018028259277344, 0.022605419158935547, 0.02419281005859375, 0.025780200958251953, 0.027367591857910156, 0.02895498275756836, 0.030542373657226562, 0.032129764556884766, 0.03371715545654297, 0.03530454635620117, 0.036891937255859375, 0.03847932815551758, 0.04006671905517578, 0.041654109954833984, 0.04324150085449219, 0.04482889175415039, 0.046416282653808594, 0.0480036735534668, 0.049591064453125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 5.0, 7.0, 7.0, 17.0, 17.0, 26.0, 22.0, 33.0, 51.0, 63.0, 93.0, 158.0, 238.0, 376.0, 599.0, 1177.0, 3036.0, 11928.0, 78351.0, 591133.0, 314209.0, 35799.0, 6744.0, 2109.0, 872.0, 535.0, 298.0, 215.0, 124.0, 92.0, 49.0, 42.0, 33.0, 24.0, 19.0, 9.0, 9.0, 3.0, 8.0, 5.0, 5.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.383544921875, -0.37023162841796875, -0.3569183349609375, -0.34360504150390625, -0.330291748046875, -0.31697845458984375, -0.3036651611328125, -0.29035186767578125, -0.27703857421875, -0.26372528076171875, -0.2504119873046875, -0.23709869384765625, -0.223785400390625, -0.21047210693359375, -0.1971588134765625, -0.18384552001953125, -0.1705322265625, -0.15721893310546875, -0.1439056396484375, -0.13059234619140625, -0.117279052734375, -0.10396575927734375, -0.0906524658203125, -0.07733917236328125, -0.06402587890625, -0.05071258544921875, -0.0373992919921875, -0.02408599853515625, -0.010772705078125, 0.00254058837890625, 0.0158538818359375, 0.02916717529296875, 0.04248046875, 0.05579376220703125, 0.0691070556640625, 0.08242034912109375, 0.095733642578125, 0.10904693603515625, 0.1223602294921875, 0.13567352294921875, 0.14898681640625, 0.16230010986328125, 0.1756134033203125, 0.18892669677734375, 0.202239990234375, 0.21555328369140625, 0.2288665771484375, 0.24217987060546875, 0.2554931640625, 0.26880645751953125, 0.2821197509765625, 0.29543304443359375, 0.308746337890625, 0.32205963134765625, 0.3353729248046875, 0.34868621826171875, 0.36199951171875, 0.37531280517578125, 0.3886260986328125, 0.40193939208984375, 0.415252685546875, 0.42856597900390625, 0.4418792724609375, 0.45519256591796875, 0.468505859375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 1.0, 8.0, 11.0, 9.0, 12.0, 11.0, 28.0, 27.0, 28.0, 23.0, 29.0, 41.0, 42.0, 40.0, 41.0, 50.0, 49.0, 66.0, 53.0, 39.0, 35.0, 48.0, 47.0, 37.0, 32.0, 42.0, 25.0, 29.0, 21.0, 16.0, 14.0, 6.0, 10.0, 10.0, 7.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.339599609375, -0.32884979248046875, -0.3180999755859375, -0.30735015869140625, -0.296600341796875, -0.28585052490234375, -0.2751007080078125, -0.26435089111328125, -0.25360107421875, -0.24285125732421875, -0.2321014404296875, -0.22135162353515625, -0.210601806640625, -0.19985198974609375, -0.1891021728515625, -0.17835235595703125, -0.1676025390625, -0.15685272216796875, -0.1461029052734375, -0.13535308837890625, -0.124603271484375, -0.11385345458984375, -0.1031036376953125, -0.09235382080078125, -0.08160400390625, -0.07085418701171875, -0.0601043701171875, -0.04935455322265625, -0.038604736328125, -0.02785491943359375, -0.0171051025390625, -0.00635528564453125, 0.00439453125, 0.01514434814453125, 0.0258941650390625, 0.03664398193359375, 0.047393798828125, 0.05814361572265625, 0.0688934326171875, 0.07964324951171875, 0.09039306640625, 0.10114288330078125, 0.1118927001953125, 0.12264251708984375, 0.133392333984375, 0.14414215087890625, 0.1548919677734375, 0.16564178466796875, 0.1763916015625, 0.18714141845703125, 0.1978912353515625, 0.20864105224609375, 0.219390869140625, 0.23014068603515625, 0.2408905029296875, 0.25164031982421875, 0.26239013671875, 0.27313995361328125, 0.2838897705078125, 0.29463958740234375, 0.305389404296875, 0.31613922119140625, 0.3268890380859375, 0.33763885498046875, 0.348388671875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 14.0, 13.0, 19.0, 30.0, 51.0, 88.0, 127.0, 299.0, 762.0, 2808.0, 18151.0, 499875.0, 503819.0, 18265.0, 2815.0, 805.0, 286.0, 142.0, 72.0, 38.0, 27.0, 25.0, 14.0, 4.0, 4.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.54443359375, -0.5314712524414062, -0.5185089111328125, -0.5055465698242188, -0.492584228515625, -0.47962188720703125, -0.4666595458984375, -0.45369720458984375, -0.44073486328125, -0.42777252197265625, -0.4148101806640625, -0.40184783935546875, -0.388885498046875, -0.37592315673828125, -0.3629608154296875, -0.34999847412109375, -0.3370361328125, -0.32407379150390625, -0.3111114501953125, -0.29814910888671875, -0.285186767578125, -0.27222442626953125, -0.2592620849609375, -0.24629974365234375, -0.23333740234375, -0.22037506103515625, -0.2074127197265625, -0.19445037841796875, -0.181488037109375, -0.16852569580078125, -0.1555633544921875, -0.14260101318359375, -0.129638671875, -0.11667633056640625, -0.1037139892578125, -0.09075164794921875, -0.077789306640625, -0.06482696533203125, -0.0518646240234375, -0.03890228271484375, -0.02593994140625, -0.01297760009765625, -1.52587890625e-05, 0.01294708251953125, 0.025909423828125, 0.03887176513671875, 0.0518341064453125, 0.06479644775390625, 0.0777587890625, 0.09072113037109375, 0.1036834716796875, 0.11664581298828125, 0.129608154296875, 0.14257049560546875, 0.1555328369140625, 0.16849517822265625, 0.18145751953125, 0.19441986083984375, 0.2073822021484375, 0.22034454345703125, 0.233306884765625, 0.24626922607421875, 0.2592315673828125, 0.27219390869140625, 0.28515625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 8.0, 8.0, 14.0, 17.0, 23.0, 38.0, 40.0, 47.0, 59.0, 66.0, 75.0, 91.0, 84.0, 82.0, 71.0, 51.0, 50.0, 39.0, 36.0, 23.0, 25.0, 17.0, 13.0, 6.0, 5.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00010460615158081055, -0.00010221637785434723, -9.982660412788391e-05, -9.74368304014206e-05, -9.504705667495728e-05, -9.265728294849396e-05, -9.026750922203064e-05, -8.787773549556732e-05, -8.5487961769104e-05, -8.309818804264069e-05, -8.070841431617737e-05, -7.831864058971405e-05, -7.592886686325073e-05, -7.353909313678741e-05, -7.11493194103241e-05, -6.875954568386078e-05, -6.636977195739746e-05, -6.397999823093414e-05, -6.159022450447083e-05, -5.920045077800751e-05, -5.681067705154419e-05, -5.442090332508087e-05, -5.2031129598617554e-05, -4.9641355872154236e-05, -4.725158214569092e-05, -4.48618084192276e-05, -4.247203469276428e-05, -4.0082260966300964e-05, -3.7692487239837646e-05, -3.530271351337433e-05, -3.291293978691101e-05, -3.052316606044769e-05, -2.8133392333984375e-05, -2.5743618607521057e-05, -2.335384488105774e-05, -2.096407115459442e-05, -1.8574297428131104e-05, -1.6184523701667786e-05, -1.3794749975204468e-05, -1.140497624874115e-05, -9.015202522277832e-06, -6.625428795814514e-06, -4.235655069351196e-06, -1.8458813428878784e-06, 5.438923835754395e-07, 2.9336661100387573e-06, 5.323439836502075e-06, 7.713213562965393e-06, 1.0102987289428711e-05, 1.2492761015892029e-05, 1.4882534742355347e-05, 1.7272308468818665e-05, 1.9662082195281982e-05, 2.20518559217453e-05, 2.4441629648208618e-05, 2.6831403374671936e-05, 2.9221177101135254e-05, 3.161095082759857e-05, 3.400072455406189e-05, 3.639049828052521e-05, 3.8780272006988525e-05, 4.117004573345184e-05, 4.355981945991516e-05, 4.594959318637848e-05, 4.83393669128418e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 6.0, 8.0, 6.0, 14.0, 22.0, 30.0, 47.0, 78.0, 109.0, 204.0, 405.0, 957.0, 2346.0, 7318.0, 38546.0, 560956.0, 398654.0, 28938.0, 6211.0, 1990.0, 824.0, 373.0, 220.0, 111.0, 58.0, 42.0, 27.0, 17.0, 13.0, 5.0, 5.0, 7.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27490234375, -0.2653999328613281, -0.25589752197265625, -0.24639511108398438, -0.2368927001953125, -0.22739028930664062, -0.21788787841796875, -0.20838546752929688, -0.198883056640625, -0.18938064575195312, -0.17987823486328125, -0.17037582397460938, -0.1608734130859375, -0.15137100219726562, -0.14186859130859375, -0.13236618041992188, -0.12286376953125, -0.11336135864257812, -0.10385894775390625, -0.09435653686523438, -0.0848541259765625, -0.07535171508789062, -0.06584930419921875, -0.056346893310546875, -0.046844482421875, -0.037342071533203125, -0.02783966064453125, -0.018337249755859375, -0.0088348388671875, 0.000667572021484375, 0.01016998291015625, 0.019672393798828125, 0.0291748046875, 0.038677215576171875, 0.04817962646484375, 0.057682037353515625, 0.0671844482421875, 0.07668685913085938, 0.08618927001953125, 0.09569168090820312, 0.105194091796875, 0.11469650268554688, 0.12419891357421875, 0.13370132446289062, 0.1432037353515625, 0.15270614624023438, 0.16220855712890625, 0.17171096801757812, 0.18121337890625, 0.19071578979492188, 0.20021820068359375, 0.20972061157226562, 0.2192230224609375, 0.22872543334960938, 0.23822784423828125, 0.24773025512695312, 0.257232666015625, 0.2667350769042969, 0.27623748779296875, 0.2857398986816406, 0.2952423095703125, 0.3047447204589844, 0.31424713134765625, 0.3237495422363281, 0.333251953125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 4.0, 3.0, 6.0, 6.0, 5.0, 11.0, 15.0, 26.0, 35.0, 31.0, 53.0, 53.0, 71.0, 78.0, 96.0, 102.0, 85.0, 58.0, 66.0, 52.0, 29.0, 30.0, 19.0, 19.0, 9.0, 6.0, 5.0, 4.0, 5.0, 3.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.154052734375, -0.148712158203125, -0.14337158203125, -0.138031005859375, -0.1326904296875, -0.127349853515625, -0.12200927734375, -0.116668701171875, -0.111328125, -0.105987548828125, -0.10064697265625, -0.095306396484375, -0.0899658203125, -0.084625244140625, -0.07928466796875, -0.073944091796875, -0.068603515625, -0.063262939453125, -0.05792236328125, -0.052581787109375, -0.0472412109375, -0.041900634765625, -0.03656005859375, -0.031219482421875, -0.02587890625, -0.020538330078125, -0.01519775390625, -0.009857177734375, -0.0045166015625, 0.000823974609375, 0.00616455078125, 0.011505126953125, 0.016845703125, 0.022186279296875, 0.02752685546875, 0.032867431640625, 0.0382080078125, 0.043548583984375, 0.04888916015625, 0.054229736328125, 0.0595703125, 0.064910888671875, 0.07025146484375, 0.075592041015625, 0.0809326171875, 0.086273193359375, 0.09161376953125, 0.096954345703125, 0.102294921875, 0.107635498046875, 0.11297607421875, 0.118316650390625, 0.1236572265625, 0.128997802734375, 0.13433837890625, 0.139678955078125, 0.14501953125, 0.150360107421875, 0.15570068359375, 0.161041259765625, 0.1663818359375, 0.171722412109375, 0.17706298828125, 0.182403564453125, 0.187744140625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 25.0, 94.0, 198.0, 304.0, 236.0, 85.0, 39.0, 8.0, 5.0, 1.0, 0.0, 3.0, 2.0], "bins": [-9.819957733154297, -9.640528678894043, -9.461099624633789, -9.281670570373535, -9.102241516113281, -8.922812461853027, -8.743383407592773, -8.563955307006836, -8.384526252746582, -8.205097198486328, -8.025668144226074, -7.84623908996582, -7.666810512542725, -7.487381458282471, -7.307952404022217, -7.128523349761963, -6.949093818664551, -6.769664764404297, -6.590235710144043, -6.410806655883789, -6.231378078460693, -6.0519490242004395, -5.8725199699401855, -5.693090915679932, -5.513662338256836, -5.334233283996582, -5.154804229736328, -4.975375175476074, -4.7959465980529785, -4.616517543792725, -4.437088489532471, -4.257659435272217, -4.078230381011963, -3.898801326751709, -3.719372510910034, -3.5399434566497803, -3.3605144023895264, -3.1810855865478516, -3.0016565322875977, -2.8222274780273438, -2.64279842376709, -2.463369369506836, -2.283940553665161, -2.1045114994049072, -1.9250824451446533, -1.745653510093689, -1.5662245750427246, -1.3867955207824707, -1.207366704940796, -1.0279377698898315, -0.8485087156295776, -0.6690797805786133, -0.48965078592300415, -0.310221791267395, -0.13079285621643066, 0.04863619804382324, 0.2280651330947876, 0.40749412775039673, 0.5869231224060059, 0.7663520574569702, 0.9457810521125793, 1.1252100467681885, 1.3046389818191528, 1.4840680360794067, 1.663496971130371]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 9.0, 10.0, 14.0, 12.0, 8.0, 13.0, 21.0, 16.0, 22.0, 30.0, 34.0, 24.0, 28.0, 29.0, 41.0, 39.0, 56.0, 43.0, 53.0, 45.0, 39.0, 43.0, 51.0, 34.0, 33.0, 41.0, 34.0, 38.0, 30.0, 20.0, 15.0, 13.0, 12.0, 7.0, 7.0, 10.0, 6.0, 6.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6344897747039795, -1.5825459957122803, -1.530602216720581, -1.4786584377288818, -1.4267146587371826, -1.3747708797454834, -1.3228269815444946, -1.2708832025527954, -1.2189394235610962, -1.166995644569397, -1.1150518655776978, -1.0631080865859985, -1.0111641883850098, -0.9592204689979553, -0.9072766304016113, -0.8553328514099121, -0.8033890724182129, -0.7514452934265137, -0.6995015144348145, -0.6475576758384705, -0.5956138968467712, -0.543670117855072, -0.4917263090610504, -0.4397825002670288, -0.3878387212753296, -0.33589494228363037, -0.28395113348960876, -0.23200733959674835, -0.18006354570388794, -0.12811976671218872, -0.07617595791816711, -0.024232149124145508, 0.02771151065826416, 0.07965530455112457, 0.13159909844398499, 0.1835428923368454, 0.2354866862297058, 0.28743046522140503, 0.33937427401542664, 0.39131808280944824, 0.44326186180114746, 0.4952056407928467, 0.5471494197845459, 0.5990932583808899, 0.6510370373725891, 0.7029808163642883, 0.7549246549606323, 0.8068684339523315, 0.8588122129440308, 0.91075599193573, 0.9626997709274292, 1.0146435499191284, 1.0665874481201172, 1.1185312271118164, 1.1704750061035156, 1.2224187850952148, 1.274362564086914, 1.3263063430786133, 1.3782501220703125, 1.4301939010620117, 1.482137680053711, 1.5340814590454102, 1.586025357246399, 1.6379691362380981, 1.6899129152297974]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 5.0, 2.0, 10.0, 8.0, 7.0, 12.0, 35.0, 23.0, 59.0, 70.0, 91.0, 131.0, 182.0, 263.0, 341.0, 574.0, 844.0, 1394.0, 2487.0, 5183.0, 14126.0, 85795.0, 4011490.0, 50093.0, 10967.0, 4217.0, 2177.0, 1255.0, 761.0, 505.0, 333.0, 219.0, 166.0, 112.0, 90.0, 58.0, 48.0, 37.0, 35.0, 15.0, 27.0, 7.0, 7.0, 8.0, 8.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29638671875, -0.2872352600097656, -0.27808380126953125, -0.2689323425292969, -0.2597808837890625, -0.2506294250488281, -0.24147796630859375, -0.23232650756835938, -0.223175048828125, -0.21402359008789062, -0.20487213134765625, -0.19572067260742188, -0.1865692138671875, -0.17741775512695312, -0.16826629638671875, -0.15911483764648438, -0.14996337890625, -0.14081192016601562, -0.13166046142578125, -0.12250900268554688, -0.1133575439453125, -0.10420608520507812, -0.09505462646484375, -0.08590316772460938, -0.076751708984375, -0.06760025024414062, -0.05844879150390625, -0.049297332763671875, -0.0401458740234375, -0.030994415283203125, -0.02184295654296875, -0.012691497802734375, -0.0035400390625, 0.005611419677734375, 0.01476287841796875, 0.023914337158203125, 0.0330657958984375, 0.042217254638671875, 0.05136871337890625, 0.060520172119140625, 0.069671630859375, 0.07882308959960938, 0.08797454833984375, 0.09712600708007812, 0.1062774658203125, 0.11542892456054688, 0.12458038330078125, 0.13373184204101562, 0.14288330078125, 0.15203475952148438, 0.16118621826171875, 0.17033767700195312, 0.1794891357421875, 0.18864059448242188, 0.19779205322265625, 0.20694351196289062, 0.216094970703125, 0.22524642944335938, 0.23439788818359375, 0.24354934692382812, 0.2527008056640625, 0.2618522644042969, 0.27100372314453125, 0.2801551818847656, 0.289306640625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 6.0, 11.0, 12.0, 11.0, 27.0, 27.0, 29.0, 39.0, 51.0, 56.0, 65.0, 69.0, 76.0, 82.0, 72.0, 56.0, 68.0, 57.0, 35.0, 38.0, 25.0, 27.0, 14.0, 15.0, 11.0, 7.0, 8.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07501220703125, -0.07204246520996094, -0.06907272338867188, -0.06610298156738281, -0.06313323974609375, -0.06016349792480469, -0.057193756103515625, -0.05422401428222656, -0.0512542724609375, -0.04828453063964844, -0.045314788818359375, -0.04234504699707031, -0.03937530517578125, -0.03640556335449219, -0.033435821533203125, -0.030466079711914062, -0.027496337890625, -0.024526596069335938, -0.021556854248046875, -0.018587112426757812, -0.01561737060546875, -0.012647628784179688, -0.009677886962890625, -0.0067081451416015625, -0.0037384033203125, -0.0007686614990234375, 0.002201080322265625, 0.0051708221435546875, 0.00814056396484375, 0.011110305786132812, 0.014080047607421875, 0.017049789428710938, 0.02001953125, 0.022989273071289062, 0.025959014892578125, 0.028928756713867188, 0.03189849853515625, 0.03486824035644531, 0.037837982177734375, 0.04080772399902344, 0.0437774658203125, 0.04674720764160156, 0.049716949462890625, 0.05268669128417969, 0.05565643310546875, 0.05862617492675781, 0.061595916748046875, 0.06456565856933594, 0.067535400390625, 0.07050514221191406, 0.07347488403320312, 0.07644462585449219, 0.07941436767578125, 0.08238410949707031, 0.08535385131835938, 0.08832359313964844, 0.0912933349609375, 0.09426307678222656, 0.09723281860351562, 0.10020256042480469, 0.10317230224609375, 0.10614204406738281, 0.10911178588867188, 0.11208152770996094, 0.11505126953125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 7.0, 8.0, 17.0, 16.0, 37.0, 55.0, 69.0, 81.0, 132.0, 225.0, 482.0, 1191.0, 5659.0, 3658408.0, 520271.0, 5464.0, 1092.0, 393.0, 229.0, 132.0, 100.0, 61.0, 41.0, 27.0, 21.0, 18.0, 22.0, 4.0, 10.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.322265625, -1.2821807861328125, -1.242095947265625, -1.2020111083984375, -1.16192626953125, -1.1218414306640625, -1.081756591796875, -1.0416717529296875, -1.0015869140625, -0.9615020751953125, -0.921417236328125, -0.8813323974609375, -0.84124755859375, -0.8011627197265625, -0.761077880859375, -0.7209930419921875, -0.680908203125, -0.6408233642578125, -0.600738525390625, -0.5606536865234375, -0.52056884765625, -0.4804840087890625, -0.440399169921875, -0.4003143310546875, -0.3602294921875, -0.3201446533203125, -0.280059814453125, -0.2399749755859375, -0.19989013671875, -0.1598052978515625, -0.119720458984375, -0.0796356201171875, -0.03955078125, 0.0005340576171875, 0.040618896484375, 0.0807037353515625, 0.12078857421875, 0.1608734130859375, 0.200958251953125, 0.2410430908203125, 0.2811279296875, 0.3212127685546875, 0.361297607421875, 0.4013824462890625, 0.44146728515625, 0.4815521240234375, 0.521636962890625, 0.5617218017578125, 0.601806640625, 0.6418914794921875, 0.681976318359375, 0.7220611572265625, 0.76214599609375, 0.8022308349609375, 0.842315673828125, 0.8824005126953125, 0.9224853515625, 0.9625701904296875, 1.002655029296875, 1.0427398681640625, 1.08282470703125, 1.1229095458984375, 1.162994384765625, 1.2030792236328125, 1.2431640625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 5.0, 20.0, 41.0, 237.0, 3658.0, 76.0, 29.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.233154296875, -0.22516250610351562, -0.21717071533203125, -0.20917892456054688, -0.2011871337890625, -0.19319534301757812, -0.18520355224609375, -0.17721176147460938, -0.169219970703125, -0.16122817993164062, -0.15323638916015625, -0.14524459838867188, -0.1372528076171875, -0.12926101684570312, -0.12126922607421875, -0.11327743530273438, -0.10528564453125, -0.09729385375976562, -0.08930206298828125, -0.08131027221679688, -0.0733184814453125, -0.06532669067382812, -0.05733489990234375, -0.049343109130859375, -0.041351318359375, -0.033359527587890625, -0.02536773681640625, -0.017375946044921875, -0.0093841552734375, -0.001392364501953125, 0.00659942626953125, 0.014591217041015625, 0.0225830078125, 0.030574798583984375, 0.03856658935546875, 0.046558380126953125, 0.0545501708984375, 0.06254196166992188, 0.07053375244140625, 0.07852554321289062, 0.086517333984375, 0.09450912475585938, 0.10250091552734375, 0.11049270629882812, 0.1184844970703125, 0.12647628784179688, 0.13446807861328125, 0.14245986938476562, 0.15045166015625, 0.15844345092773438, 0.16643524169921875, 0.17442703247070312, 0.1824188232421875, 0.19041061401367188, 0.19840240478515625, 0.20639419555664062, 0.214385986328125, 0.22237777709960938, 0.23036956787109375, 0.23836135864257812, 0.2463531494140625, 0.2543449401855469, 0.26233673095703125, 0.2703285217285156, 0.2783203125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 17.0, 10.0, 33.0, 45.0, 72.0, 104.0, 141.0, 157.0, 148.0, 103.0, 63.0, 45.0, 26.0, 12.0, 11.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2764352560043335, -0.26142966747283936, -0.24642407894134521, -0.23141850531101227, -0.21641291677951813, -0.201407328248024, -0.18640175461769104, -0.1713961660861969, -0.15639057755470276, -0.14138498902320862, -0.12637940049171448, -0.11137382686138153, -0.09636823832988739, -0.08136264979839325, -0.0663570687174797, -0.05135148763656616, -0.03634589910507202, -0.02134031429886818, -0.006334729492664337, 0.008670855313539505, 0.023676440119743347, 0.03868202865123749, 0.05368760973215103, 0.06869319081306458, 0.08369877934455872, 0.09870436787605286, 0.1137099489569664, 0.12871553003787994, 0.14372111856937408, 0.15872670710086823, 0.17373228073120117, 0.1887378692626953, 0.20374345779418945, 0.2187490463256836, 0.23375463485717773, 0.24876020848751068, 0.263765811920166, 0.27877140045166016, 0.2937769591808319, 0.30878254771232605, 0.3237881362438202, 0.33879372477531433, 0.35379931330680847, 0.3688049018383026, 0.38381046056747437, 0.3988160490989685, 0.41382163763046265, 0.4288272261619568, 0.4438328146934509, 0.45883840322494507, 0.4738439917564392, 0.48884958028793335, 0.5038551688194275, 0.5188607573509216, 0.5338663458824158, 0.5488718748092651, 0.5638774633407593, 0.5788830518722534, 0.5938886404037476, 0.6088942289352417, 0.6238998174667358, 0.63890540599823, 0.6539109945297241, 0.6689165830612183, 0.6839221715927124]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 3.0, 7.0, 10.0, 9.0, 16.0, 16.0, 19.0, 12.0, 13.0, 31.0, 31.0, 38.0, 31.0, 43.0, 38.0, 34.0, 46.0, 57.0, 49.0, 43.0, 53.0, 49.0, 42.0, 39.0, 39.0, 38.0, 22.0, 22.0, 30.0, 20.0, 17.0, 14.0, 11.0, 13.0, 12.0, 9.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.23510068655014038, -0.22808532416820526, -0.22106997668743134, -0.21405461430549622, -0.2070392519235611, -0.20002388954162598, -0.19300854206085205, -0.18599317967891693, -0.1789778172969818, -0.1719624549150467, -0.16494710743427277, -0.15793174505233765, -0.15091638267040253, -0.1439010202884674, -0.13688567280769348, -0.12987031042575836, -0.12285496294498444, -0.11583960801362991, -0.1088242456316948, -0.10180889070034027, -0.09479352831840515, -0.08777817338705063, -0.0807628184556961, -0.07374745607376099, -0.06673210114240646, -0.05971674248576164, -0.05270138382911682, -0.0456860288977623, -0.03867067024111748, -0.031655311584472656, -0.024639956653118134, -0.017624597996473312, -0.010609239339828491, -0.0035938816145062447, 0.003421476110816002, 0.010436832904815674, 0.017452191561460495, 0.024467550218105316, 0.03148290514945984, 0.03849826380610466, 0.04551362246274948, 0.0525289811193943, 0.059544339776039124, 0.06655969470739365, 0.07357504963874817, 0.08059041202068329, 0.08760576695203781, 0.09462112188339233, 0.10163648426532745, 0.10865183919668198, 0.1156672015786171, 0.12268255650997162, 0.12969791889190674, 0.13671326637268066, 0.14372862875461578, 0.1507439911365509, 0.15775933861732483, 0.16477470099925995, 0.17179004848003387, 0.178805410861969, 0.1858207732439041, 0.19283613562583923, 0.19985148310661316, 0.20686684548854828, 0.2138822078704834]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 3.0, 10.0, 14.0, 18.0, 36.0, 40.0, 84.0, 151.0, 270.0, 466.0, 923.0, 1872.0, 3942.0, 8810.0, 21948.0, 58105.0, 160947.0, 339843.0, 274669.0, 109174.0, 39879.0, 15327.0, 6338.0, 2831.0, 1307.0, 655.0, 389.0, 195.0, 116.0, 75.0, 38.0, 26.0, 17.0, 8.0, 7.0, 6.0, 6.0, 3.0, 2.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1707763671875, -0.16463470458984375, -0.1584930419921875, -0.15235137939453125, -0.146209716796875, -0.14006805419921875, -0.1339263916015625, -0.12778472900390625, -0.12164306640625, -0.11550140380859375, -0.1093597412109375, -0.10321807861328125, -0.097076416015625, -0.09093475341796875, -0.0847930908203125, -0.07865142822265625, -0.072509765625, -0.06636810302734375, -0.0602264404296875, -0.05408477783203125, -0.047943115234375, -0.04180145263671875, -0.0356597900390625, -0.02951812744140625, -0.02337646484375, -0.01723480224609375, -0.0110931396484375, -0.00495147705078125, 0.001190185546875, 0.00733184814453125, 0.0134735107421875, 0.01961517333984375, 0.0257568359375, 0.03189849853515625, 0.0380401611328125, 0.04418182373046875, 0.050323486328125, 0.05646514892578125, 0.0626068115234375, 0.06874847412109375, 0.07489013671875, 0.08103179931640625, 0.0871734619140625, 0.09331512451171875, 0.099456787109375, 0.10559844970703125, 0.1117401123046875, 0.11788177490234375, 0.1240234375, 0.13016510009765625, 0.1363067626953125, 0.14244842529296875, 0.148590087890625, 0.15473175048828125, 0.1608734130859375, 0.16701507568359375, 0.17315673828125, 0.17929840087890625, 0.1854400634765625, 0.19158172607421875, 0.197723388671875, 0.20386505126953125, 0.2100067138671875, 0.21614837646484375, 0.2222900390625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 7.0, 9.0, 7.0, 17.0, 16.0, 18.0, 21.0, 30.0, 37.0, 52.0, 57.0, 46.0, 41.0, 56.0, 48.0, 71.0, 65.0, 56.0, 57.0, 49.0, 45.0, 25.0, 33.0, 26.0, 28.0, 19.0, 20.0, 11.0, 4.0, 7.0, 5.0, 5.0, 7.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0731201171875, -0.07024288177490234, -0.06736564636230469, -0.06448841094970703, -0.061611175537109375, -0.05873394012451172, -0.05585670471191406, -0.052979469299316406, -0.05010223388671875, -0.047224998474121094, -0.04434776306152344, -0.04147052764892578, -0.038593292236328125, -0.03571605682373047, -0.03283882141113281, -0.029961585998535156, -0.0270843505859375, -0.024207115173339844, -0.021329879760742188, -0.01845264434814453, -0.015575408935546875, -0.012698173522949219, -0.009820938110351562, -0.006943702697753906, -0.00406646728515625, -0.0011892318725585938, 0.0016880035400390625, 0.004565238952636719, 0.007442474365234375, 0.010319709777832031, 0.013196945190429688, 0.016074180603027344, 0.018951416015625, 0.021828651428222656, 0.024705886840820312, 0.02758312225341797, 0.030460357666015625, 0.03333759307861328, 0.03621482849121094, 0.039092063903808594, 0.04196929931640625, 0.044846534729003906, 0.04772377014160156, 0.05060100555419922, 0.053478240966796875, 0.05635547637939453, 0.05923271179199219, 0.062109947204589844, 0.0649871826171875, 0.06786441802978516, 0.07074165344238281, 0.07361888885498047, 0.07649612426757812, 0.07937335968017578, 0.08225059509277344, 0.0851278305053711, 0.08800506591796875, 0.0908823013305664, 0.09375953674316406, 0.09663677215576172, 0.09951400756835938, 0.10239124298095703, 0.10526847839355469, 0.10814571380615234, 0.11102294921875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 7.0, 8.0, 13.0, 19.0, 28.0, 47.0, 53.0, 73.0, 103.0, 149.0, 230.0, 323.0, 552.0, 995.0, 1876.0, 4399.0, 15306.0, 82925.0, 547758.0, 330516.0, 46266.0, 10027.0, 3204.0, 1391.0, 787.0, 485.0, 318.0, 230.0, 127.0, 85.0, 67.0, 66.0, 31.0, 28.0, 24.0, 10.0, 7.0, 7.0, 4.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.39794921875, -0.38652801513671875, -0.3751068115234375, -0.36368560791015625, -0.352264404296875, -0.34084320068359375, -0.3294219970703125, -0.31800079345703125, -0.30657958984375, -0.29515838623046875, -0.2837371826171875, -0.27231597900390625, -0.260894775390625, -0.24947357177734375, -0.2380523681640625, -0.22663116455078125, -0.2152099609375, -0.20378875732421875, -0.1923675537109375, -0.18094635009765625, -0.169525146484375, -0.15810394287109375, -0.1466827392578125, -0.13526153564453125, -0.12384033203125, -0.11241912841796875, -0.1009979248046875, -0.08957672119140625, -0.078155517578125, -0.06673431396484375, -0.0553131103515625, -0.04389190673828125, -0.032470703125, -0.02104949951171875, -0.0096282958984375, 0.00179290771484375, 0.013214111328125, 0.02463531494140625, 0.0360565185546875, 0.04747772216796875, 0.05889892578125, 0.07032012939453125, 0.0817413330078125, 0.09316253662109375, 0.104583740234375, 0.11600494384765625, 0.1274261474609375, 0.13884735107421875, 0.1502685546875, 0.16168975830078125, 0.1731109619140625, 0.18453216552734375, 0.195953369140625, 0.20737457275390625, 0.2187957763671875, 0.23021697998046875, 0.24163818359375, 0.25305938720703125, 0.2644805908203125, 0.27590179443359375, 0.287322998046875, 0.29874420166015625, 0.3101654052734375, 0.32158660888671875, 0.3330078125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 1.0, 5.0, 6.0, 5.0, 6.0, 4.0, 6.0, 14.0, 20.0, 14.0, 12.0, 15.0, 24.0, 37.0, 28.0, 43.0, 36.0, 37.0, 56.0, 36.0, 46.0, 53.0, 42.0, 38.0, 35.0, 44.0, 32.0, 39.0, 47.0, 29.0, 36.0, 32.0, 27.0, 12.0, 17.0, 14.0, 10.0, 15.0, 11.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.385498046875, -0.3729896545410156, -0.36048126220703125, -0.3479728698730469, -0.3354644775390625, -0.3229560852050781, -0.31044769287109375, -0.2979393005371094, -0.285430908203125, -0.2729225158691406, -0.26041412353515625, -0.24790573120117188, -0.2353973388671875, -0.22288894653320312, -0.21038055419921875, -0.19787216186523438, -0.18536376953125, -0.17285537719726562, -0.16034698486328125, -0.14783859252929688, -0.1353302001953125, -0.12282180786132812, -0.11031341552734375, -0.09780502319335938, -0.085296630859375, -0.07278823852539062, -0.06027984619140625, -0.047771453857421875, -0.0352630615234375, -0.022754669189453125, -0.01024627685546875, 0.002262115478515625, 0.0147705078125, 0.027278900146484375, 0.03978729248046875, 0.052295684814453125, 0.0648040771484375, 0.07731246948242188, 0.08982086181640625, 0.10232925415039062, 0.114837646484375, 0.12734603881835938, 0.13985443115234375, 0.15236282348632812, 0.1648712158203125, 0.17737960815429688, 0.18988800048828125, 0.20239639282226562, 0.21490478515625, 0.22741317749023438, 0.23992156982421875, 0.2524299621582031, 0.2649383544921875, 0.2774467468261719, 0.28995513916015625, 0.3024635314941406, 0.314971923828125, 0.3274803161621094, 0.33998870849609375, 0.3524971008300781, 0.3650054931640625, 0.3775138854980469, 0.39002227783203125, 0.4025306701660156, 0.4150390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 8.0, 5.0, 10.0, 9.0, 9.0, 30.0, 55.0, 41.0, 117.0, 179.0, 349.0, 801.0, 1879.0, 6298.0, 30701.0, 294831.0, 625264.0, 71672.0, 11140.0, 2930.0, 1106.0, 506.0, 267.0, 157.0, 69.0, 46.0, 31.0, 10.0, 16.0, 6.0, 8.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1925048828125, -0.18652725219726562, -0.18054962158203125, -0.17457199096679688, -0.1685943603515625, -0.16261672973632812, -0.15663909912109375, -0.15066146850585938, -0.144683837890625, -0.13870620727539062, -0.13272857666015625, -0.12675094604492188, -0.1207733154296875, -0.11479568481445312, -0.10881805419921875, -0.10284042358398438, -0.09686279296875, -0.09088516235351562, -0.08490753173828125, -0.07892990112304688, -0.0729522705078125, -0.06697463989257812, -0.06099700927734375, -0.055019378662109375, -0.049041748046875, -0.043064117431640625, -0.03708648681640625, -0.031108856201171875, -0.0251312255859375, -0.019153594970703125, -0.01317596435546875, -0.007198333740234375, -0.001220703125, 0.004756927490234375, 0.01073455810546875, 0.016712188720703125, 0.0226898193359375, 0.028667449951171875, 0.03464508056640625, 0.040622711181640625, 0.046600341796875, 0.052577972412109375, 0.05855560302734375, 0.06453323364257812, 0.0705108642578125, 0.07648849487304688, 0.08246612548828125, 0.08844375610351562, 0.09442138671875, 0.10039901733398438, 0.10637664794921875, 0.11235427856445312, 0.1183319091796875, 0.12430953979492188, 0.13028717041015625, 0.13626480102539062, 0.142242431640625, 0.14822006225585938, 0.15419769287109375, 0.16017532348632812, 0.1661529541015625, 0.17213058471679688, 0.17810821533203125, 0.18408584594726562, 0.1900634765625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 6.0, 4.0, 6.0, 15.0, 14.0, 11.0, 21.0, 27.0, 24.0, 44.0, 50.0, 65.0, 87.0, 86.0, 93.0, 77.0, 80.0, 64.0, 51.0, 28.0, 50.0, 25.0, 21.0, 9.0, 18.0, 8.0, 8.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.963180541992188e-05, -7.7015720307827e-05, -7.439963519573212e-05, -7.178355008363724e-05, -6.916746497154236e-05, -6.655137985944748e-05, -6.39352947473526e-05, -6.131920963525772e-05, -5.870312452316284e-05, -5.608703941106796e-05, -5.3470954298973083e-05, -5.0854869186878204e-05, -4.8238784074783325e-05, -4.5622698962688446e-05, -4.300661385059357e-05, -4.039052873849869e-05, -3.777444362640381e-05, -3.515835851430893e-05, -3.254227340221405e-05, -2.992618829011917e-05, -2.7310103178024292e-05, -2.4694018065929413e-05, -2.2077932953834534e-05, -1.9461847841739655e-05, -1.6845762729644775e-05, -1.4229677617549896e-05, -1.1613592505455017e-05, -8.997507393360138e-06, -6.381422281265259e-06, -3.7653371691703796e-06, -1.1492520570755005e-06, 1.4668330550193787e-06, 4.082918167114258e-06, 6.699003279209137e-06, 9.315088391304016e-06, 1.1931173503398895e-05, 1.4547258615493774e-05, 1.7163343727588654e-05, 1.9779428839683533e-05, 2.2395513951778412e-05, 2.501159906387329e-05, 2.762768417596817e-05, 3.024376928806305e-05, 3.285985440015793e-05, 3.547593951225281e-05, 3.809202462434769e-05, 4.0708109736442566e-05, 4.3324194848537445e-05, 4.5940279960632324e-05, 4.85563650727272e-05, 5.117245018482208e-05, 5.378853529691696e-05, 5.640462040901184e-05, 5.902070552110672e-05, 6.16367906332016e-05, 6.425287574529648e-05, 6.686896085739136e-05, 6.948504596948624e-05, 7.210113108158112e-05, 7.4717216193676e-05, 7.733330130577087e-05, 7.994938641786575e-05, 8.256547152996063e-05, 8.518155664205551e-05, 8.779764175415039e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 7.0, 9.0, 13.0, 12.0, 17.0, 27.0, 31.0, 45.0, 70.0, 119.0, 213.0, 386.0, 732.0, 1622.0, 4280.0, 15315.0, 102866.0, 648904.0, 234788.0, 28199.0, 6454.0, 2255.0, 978.0, 480.0, 276.0, 147.0, 93.0, 51.0, 52.0, 21.0, 17.0, 21.0, 14.0, 16.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1903076171875, -0.18482017517089844, -0.17933273315429688, -0.1738452911376953, -0.16835784912109375, -0.1628704071044922, -0.15738296508789062, -0.15189552307128906, -0.1464080810546875, -0.14092063903808594, -0.13543319702148438, -0.1299457550048828, -0.12445831298828125, -0.11897087097167969, -0.11348342895507812, -0.10799598693847656, -0.102508544921875, -0.09702110290527344, -0.09153366088867188, -0.08604621887207031, -0.08055877685546875, -0.07507133483886719, -0.06958389282226562, -0.06409645080566406, -0.0586090087890625, -0.05312156677246094, -0.047634124755859375, -0.04214668273925781, -0.03665924072265625, -0.031171798706054688, -0.025684356689453125, -0.020196914672851562, -0.01470947265625, -0.009222030639648438, -0.003734588623046875, 0.0017528533935546875, 0.00724029541015625, 0.012727737426757812, 0.018215179443359375, 0.023702621459960938, 0.0291900634765625, 0.03467750549316406, 0.040164947509765625, 0.04565238952636719, 0.05113983154296875, 0.05662727355957031, 0.062114715576171875, 0.06760215759277344, 0.073089599609375, 0.07857704162597656, 0.08406448364257812, 0.08955192565917969, 0.09503936767578125, 0.10052680969238281, 0.10601425170898438, 0.11150169372558594, 0.1169891357421875, 0.12247657775878906, 0.12796401977539062, 0.1334514617919922, 0.13893890380859375, 0.1444263458251953, 0.14991378784179688, 0.15540122985839844, 0.160888671875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 6.0, 9.0, 4.0, 7.0, 14.0, 25.0, 41.0, 52.0, 66.0, 84.0, 100.0, 113.0, 95.0, 82.0, 86.0, 82.0, 45.0, 29.0, 16.0, 14.0, 9.0, 5.0, 6.0, 7.0, 6.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18310546875, -0.17737388610839844, -0.17164230346679688, -0.1659107208251953, -0.16017913818359375, -0.1544475555419922, -0.14871597290039062, -0.14298439025878906, -0.1372528076171875, -0.13152122497558594, -0.12578964233398438, -0.12005805969238281, -0.11432647705078125, -0.10859489440917969, -0.10286331176757812, -0.09713172912597656, -0.091400146484375, -0.08566856384277344, -0.07993698120117188, -0.07420539855957031, -0.06847381591796875, -0.06274223327636719, -0.057010650634765625, -0.05127906799316406, -0.0455474853515625, -0.03981590270996094, -0.034084320068359375, -0.028352737426757812, -0.02262115478515625, -0.016889572143554688, -0.011157989501953125, -0.0054264068603515625, 0.00030517578125, 0.0060367584228515625, 0.011768341064453125, 0.017499923706054688, 0.02323150634765625, 0.028963088989257812, 0.034694671630859375, 0.04042625427246094, 0.0461578369140625, 0.05188941955566406, 0.057621002197265625, 0.06335258483886719, 0.06908416748046875, 0.07481575012207031, 0.08054733276367188, 0.08627891540527344, 0.092010498046875, 0.09774208068847656, 0.10347366333007812, 0.10920524597167969, 0.11493682861328125, 0.12066841125488281, 0.12639999389648438, 0.13213157653808594, 0.1378631591796875, 0.14359474182128906, 0.14932632446289062, 0.1550579071044922, 0.16078948974609375, 0.1665210723876953, 0.17225265502929688, 0.17798423767089844, 0.1837158203125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 12.0, 16.0, 20.0, 46.0, 63.0, 103.0, 134.0, 160.0, 136.0, 112.0, 85.0, 40.0, 34.0, 19.0, 9.0, 7.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.426270008087158, -2.3378474712371826, -2.249425172805786, -2.1610026359558105, -2.072580099105835, -1.9841578006744385, -1.895735263824463, -1.8073128461837769, -1.7188904285430908, -1.6304680109024048, -1.5420454740524292, -1.4536230564117432, -1.3652006387710571, -1.276778221130371, -1.1883556842803955, -1.0999332666397095, -1.0115107297897339, -0.9230882525444031, -0.834665834903717, -0.7462433576583862, -0.6578209400177002, -0.5693984627723694, -0.4809759855270386, -0.39255356788635254, -0.30413109064102173, -0.2157086431980133, -0.1272861808538437, -0.03886371850967407, 0.04955872893333435, 0.13798117637634277, 0.22640365362167358, 0.3148260712623596, 0.40324854850769043, 0.49167099595069885, 0.5800934433937073, 0.6685159206390381, 0.7569383382797241, 0.8453608155250549, 0.9337832927703857, 1.0222057104110718, 1.1106281280517578, 1.1990505456924438, 1.2874730825424194, 1.3758955001831055, 1.4643179178237915, 1.5527403354644775, 1.6411628723144531, 1.7295852899551392, 1.8180078268051147, 1.9064302444458008, 1.9948527812957764, 2.083275318145752, 2.1716976165771484, 2.260120153427124, 2.3485426902770996, 2.436964988708496, 2.5253875255584717, 2.6138100624084473, 2.7022323608398438, 2.7906548976898193, 2.879077434539795, 2.9674997329711914, 3.055922269821167, 3.1443448066711426, 3.232767105102539]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 8.0, 11.0, 6.0, 7.0, 10.0, 15.0, 12.0, 16.0, 24.0, 15.0, 26.0, 32.0, 29.0, 35.0, 33.0, 41.0, 37.0, 45.0, 34.0, 46.0, 49.0, 43.0, 39.0, 42.0, 40.0, 37.0, 39.0, 36.0, 20.0, 31.0, 29.0, 13.0, 12.0, 14.0, 20.0, 12.0, 5.0, 6.0, 9.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2.09592866897583, -2.039032459259033, -1.9821360111236572, -1.9252396821975708, -1.8683433532714844, -1.811447024345398, -1.7545506954193115, -1.697654366493225, -1.6407580375671387, -1.5838617086410522, -1.5269653797149658, -1.4700690507888794, -1.413172721862793, -1.3562763929367065, -1.2993800640106201, -1.2424837350845337, -1.1855874061584473, -1.1286910772323608, -1.0717947483062744, -1.014898419380188, -0.9580020904541016, -0.9011057615280151, -0.8442094326019287, -0.7873131036758423, -0.7304167747497559, -0.6735204458236694, -0.616624116897583, -0.5597277879714966, -0.5028314590454102, -0.44593513011932373, -0.3890388011932373, -0.3321424722671509, -0.275246262550354, -0.21834993362426758, -0.16145360469818115, -0.10455727577209473, -0.0476609468460083, 0.009235382080078125, 0.06613171100616455, 0.12302803993225098, 0.1799243688583374, 0.23682069778442383, 0.29371702671051025, 0.3506133556365967, 0.4075096845626831, 0.46440601348876953, 0.521302342414856, 0.5781986713409424, 0.6350950002670288, 0.6919913291931152, 0.7488876581192017, 0.8057839870452881, 0.8626803159713745, 0.9195766448974609, 0.9764729738235474, 1.0333693027496338, 1.0902656316757202, 1.1471619606018066, 1.204058289527893, 1.2609546184539795, 1.317850947380066, 1.3747472763061523, 1.4316436052322388, 1.4885399341583252, 1.5454362630844116]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 6.0, 7.0, 3.0, 9.0, 8.0, 6.0, 6.0, 8.0, 11.0, 18.0, 30.0, 26.0, 28.0, 57.0, 82.0, 99.0, 149.0, 237.0, 407.0, 577.0, 995.0, 1745.0, 3421.0, 7680.0, 21867.0, 171046.0, 3922996.0, 41231.0, 11226.0, 4707.0, 2221.0, 1248.0, 748.0, 412.0, 301.0, 184.0, 134.0, 90.0, 54.0, 45.0, 46.0, 24.0, 17.0, 17.0, 21.0, 12.0, 9.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.280517578125, -0.2718086242675781, -0.26309967041015625, -0.2543907165527344, -0.2456817626953125, -0.23697280883789062, -0.22826385498046875, -0.21955490112304688, -0.210845947265625, -0.20213699340820312, -0.19342803955078125, -0.18471908569335938, -0.1760101318359375, -0.16730117797851562, -0.15859222412109375, -0.14988327026367188, -0.14117431640625, -0.13246536254882812, -0.12375640869140625, -0.11504745483398438, -0.1063385009765625, -0.09762954711914062, -0.08892059326171875, -0.08021163940429688, -0.071502685546875, -0.06279373168945312, -0.05408477783203125, -0.045375823974609375, -0.0366668701171875, -0.027957916259765625, -0.01924896240234375, -0.010540008544921875, -0.0018310546875, 0.006877899169921875, 0.01558685302734375, 0.024295806884765625, 0.0330047607421875, 0.041713714599609375, 0.05042266845703125, 0.059131622314453125, 0.067840576171875, 0.07654953002929688, 0.08525848388671875, 0.09396743774414062, 0.1026763916015625, 0.11138534545898438, 0.12009429931640625, 0.12880325317382812, 0.13751220703125, 0.14622116088867188, 0.15493011474609375, 0.16363906860351562, 0.1723480224609375, 0.18105697631835938, 0.18976593017578125, 0.19847488403320312, 0.207183837890625, 0.21589279174804688, 0.22460174560546875, 0.23331069946289062, 0.2420196533203125, 0.2507286071777344, 0.25943756103515625, 0.2681465148925781, 0.27685546875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 10.0, 11.0, 9.0, 18.0, 24.0, 26.0, 42.0, 44.0, 40.0, 46.0, 35.0, 54.0, 48.0, 45.0, 66.0, 45.0, 60.0, 52.0, 48.0, 50.0, 38.0, 39.0, 26.0, 24.0, 19.0, 18.0, 6.0, 11.0, 13.0, 9.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08465576171875, -0.08185863494873047, -0.07906150817871094, -0.0762643814086914, -0.07346725463867188, -0.07067012786865234, -0.06787300109863281, -0.06507587432861328, -0.06227874755859375, -0.05948162078857422, -0.05668449401855469, -0.053887367248535156, -0.051090240478515625, -0.048293113708496094, -0.04549598693847656, -0.04269886016845703, -0.0399017333984375, -0.03710460662841797, -0.03430747985839844, -0.031510353088378906, -0.028713226318359375, -0.025916099548339844, -0.023118972778320312, -0.02032184600830078, -0.01752471923828125, -0.014727592468261719, -0.011930465698242188, -0.009133338928222656, -0.006336212158203125, -0.0035390853881835938, -0.0007419586181640625, 0.0020551681518554688, 0.004852294921875, 0.007649421691894531, 0.010446548461914062, 0.013243675231933594, 0.016040802001953125, 0.018837928771972656, 0.021635055541992188, 0.02443218231201172, 0.02722930908203125, 0.03002643585205078, 0.03282356262207031, 0.035620689392089844, 0.038417816162109375, 0.041214942932128906, 0.04401206970214844, 0.04680919647216797, 0.0496063232421875, 0.05240345001220703, 0.05520057678222656, 0.057997703552246094, 0.060794830322265625, 0.06359195709228516, 0.06638908386230469, 0.06918621063232422, 0.07198333740234375, 0.07478046417236328, 0.07757759094238281, 0.08037471771240234, 0.08317184448242188, 0.0859689712524414, 0.08876609802246094, 0.09156322479248047, 0.0943603515625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 9.0, 13.0, 9.0, 17.0, 11.0, 22.0, 29.0, 51.0, 66.0, 100.0, 141.0, 183.0, 306.0, 544.0, 889.0, 1731.0, 3225.0, 7229.0, 18783.0, 76370.0, 3873687.0, 164115.0, 27943.0, 9549.0, 4170.0, 2088.0, 1170.0, 671.0, 390.0, 253.0, 163.0, 108.0, 77.0, 44.0, 29.0, 21.0, 16.0, 15.0, 13.0, 4.0, 6.0, 9.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.27783203125, -0.2690582275390625, -0.260284423828125, -0.2515106201171875, -0.24273681640625, -0.2339630126953125, -0.225189208984375, -0.2164154052734375, -0.2076416015625, -0.1988677978515625, -0.190093994140625, -0.1813201904296875, -0.17254638671875, -0.1637725830078125, -0.154998779296875, -0.1462249755859375, -0.137451171875, -0.1286773681640625, -0.119903564453125, -0.1111297607421875, -0.10235595703125, -0.0935821533203125, -0.084808349609375, -0.0760345458984375, -0.0672607421875, -0.0584869384765625, -0.049713134765625, -0.0409393310546875, -0.03216552734375, -0.0233917236328125, -0.014617919921875, -0.0058441162109375, 0.0029296875, 0.0117034912109375, 0.020477294921875, 0.0292510986328125, 0.03802490234375, 0.0467987060546875, 0.055572509765625, 0.0643463134765625, 0.0731201171875, 0.0818939208984375, 0.090667724609375, 0.0994415283203125, 0.10821533203125, 0.1169891357421875, 0.125762939453125, 0.1345367431640625, 0.143310546875, 0.1520843505859375, 0.160858154296875, 0.1696319580078125, 0.17840576171875, 0.1871795654296875, 0.195953369140625, 0.2047271728515625, 0.2135009765625, 0.2222747802734375, 0.231048583984375, 0.2398223876953125, 0.24859619140625, 0.2573699951171875, 0.266143798828125, 0.2749176025390625, 0.28369140625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 1.0, 3.0, 4.0, 10.0, 8.0, 12.0, 9.0, 12.0, 26.0, 52.0, 101.0, 411.0, 3115.0, 153.0, 57.0, 40.0, 15.0, 16.0, 12.0, 8.0, 4.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09197998046875, -0.08929157257080078, -0.08660316467285156, -0.08391475677490234, -0.08122634887695312, -0.0785379409790039, -0.07584953308105469, -0.07316112518310547, -0.07047271728515625, -0.06778430938720703, -0.06509590148925781, -0.062407493591308594, -0.059719085693359375, -0.057030677795410156, -0.05434226989746094, -0.05165386199951172, -0.0489654541015625, -0.04627704620361328, -0.04358863830566406, -0.040900230407714844, -0.038211822509765625, -0.035523414611816406, -0.03283500671386719, -0.03014659881591797, -0.02745819091796875, -0.02476978302001953, -0.022081375122070312, -0.019392967224121094, -0.016704559326171875, -0.014016151428222656, -0.011327743530273438, -0.008639335632324219, -0.005950927734375, -0.0032625198364257812, -0.0005741119384765625, 0.0021142959594726562, 0.004802703857421875, 0.007491111755371094, 0.010179519653320312, 0.012867927551269531, 0.01555633544921875, 0.01824474334716797, 0.020933151245117188, 0.023621559143066406, 0.026309967041015625, 0.028998374938964844, 0.03168678283691406, 0.03437519073486328, 0.0370635986328125, 0.03975200653076172, 0.04244041442871094, 0.045128822326660156, 0.047817230224609375, 0.050505638122558594, 0.05319404602050781, 0.05588245391845703, 0.05857086181640625, 0.06125926971435547, 0.06394767761230469, 0.0666360855102539, 0.06932449340820312, 0.07201290130615234, 0.07470130920410156, 0.07738971710205078, 0.080078125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 9.0, 7.0, 11.0, 19.0, 19.0, 41.0, 43.0, 70.0, 88.0, 104.0, 88.0, 117.0, 95.0, 89.0, 61.0, 51.0, 25.0, 24.0, 16.0, 12.0, 3.0, 5.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2323429137468338, -0.22346237301826477, -0.21458184719085693, -0.2057013064622879, -0.19682076573371887, -0.18794023990631104, -0.179059699177742, -0.17017915844917297, -0.16129863262176514, -0.1524180918931961, -0.14353756606578827, -0.13465702533721924, -0.1257764995098114, -0.11689595878124237, -0.10801541805267334, -0.0991348847746849, -0.09025435149669647, -0.08137381821870804, -0.0724932849407196, -0.06361274421215057, -0.05473221093416214, -0.045851677656173706, -0.036971140652894974, -0.02809060364961624, -0.019210070371627808, -0.010329535230994225, -0.0014490000903606415, 0.007431535050272942, 0.016312070190906525, 0.02519260346889496, 0.03407314047217369, 0.04295367747545242, 0.05183419585227966, 0.0607147291302681, 0.06959526240825653, 0.07847580313682556, 0.087356336414814, 0.09623686969280243, 0.10511741042137146, 0.1139979436993599, 0.12287847697734833, 0.13175901770591736, 0.1406395435333252, 0.14952008426189423, 0.15840062499046326, 0.1672811508178711, 0.17616169154644012, 0.18504223227500916, 0.193922758102417, 0.20280329883098602, 0.21168382465839386, 0.2205643653869629, 0.22944489121437073, 0.23832543194293976, 0.2472059726715088, 0.2560864984989166, 0.26496702432632446, 0.2738475501537323, 0.2827281057834625, 0.29160863161087036, 0.3004891574382782, 0.30936968326568604, 0.31825023889541626, 0.3271307647228241, 0.3360113203525543]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 8.0, 6.0, 7.0, 9.0, 15.0, 9.0, 24.0, 24.0, 19.0, 25.0, 33.0, 32.0, 33.0, 34.0, 41.0, 47.0, 45.0, 42.0, 49.0, 47.0, 44.0, 50.0, 35.0, 35.0, 33.0, 32.0, 33.0, 35.0, 17.0, 18.0, 19.0, 16.0, 18.0, 11.0, 12.0, 11.0, 11.0, 1.0, 6.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.14557647705078125, -0.1409279853105545, -0.13627947866916656, -0.13163098692893982, -0.12698249518871307, -0.12233399599790573, -0.11768549680709839, -0.11303700506687164, -0.1083885058760643, -0.10374000668525696, -0.09909151494503021, -0.09444301575422287, -0.08979451656341553, -0.08514602482318878, -0.08049752563238144, -0.0758490264415741, -0.07120053470134735, -0.06655203551054001, -0.06190354377031326, -0.05725504457950592, -0.052606549113988876, -0.04795805364847183, -0.04330955445766449, -0.038661058992147446, -0.0340125635266304, -0.029364068061113358, -0.024715570732951164, -0.02006707340478897, -0.015418577939271927, -0.010770082473754883, -0.0061215851455926895, -0.0014730878174304962, 0.003175407648086548, 0.007823904044926167, 0.012472400441765785, 0.01712089776992798, 0.021769393235445023, 0.026417888700962067, 0.03106638602912426, 0.03571488335728645, 0.0403633788228035, 0.04501187428832054, 0.049660369753837585, 0.05430886894464493, 0.05895736441016197, 0.06360585987567902, 0.06825435906648636, 0.0729028582572937, 0.07755134999752045, 0.08219984918832779, 0.08684834092855453, 0.09149684011936188, 0.09614533185958862, 0.10079383105039597, 0.10544233024120331, 0.11009082198143005, 0.1147393211722374, 0.11938782036304474, 0.12403631210327148, 0.12868480384349823, 0.13333331048488617, 0.13798180222511292, 0.14263029396533966, 0.1472788006067276, 0.15192729234695435]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 10.0, 12.0, 17.0, 20.0, 37.0, 45.0, 73.0, 173.0, 324.0, 699.0, 1730.0, 4334.0, 12297.0, 39245.0, 136782.0, 372370.0, 324671.0, 108466.0, 31119.0, 9955.0, 3513.0, 1390.0, 602.0, 297.0, 155.0, 97.0, 44.0, 25.0, 15.0, 14.0, 11.0, 6.0, 4.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2242431640625, -0.21742820739746094, -0.21061325073242188, -0.2037982940673828, -0.19698333740234375, -0.1901683807373047, -0.18335342407226562, -0.17653846740722656, -0.1697235107421875, -0.16290855407714844, -0.15609359741210938, -0.1492786407470703, -0.14246368408203125, -0.1356487274169922, -0.12883377075195312, -0.12201881408691406, -0.115203857421875, -0.10838890075683594, -0.10157394409179688, -0.09475898742675781, -0.08794403076171875, -0.08112907409667969, -0.07431411743164062, -0.06749916076660156, -0.0606842041015625, -0.05386924743652344, -0.047054290771484375, -0.04023933410644531, -0.03342437744140625, -0.026609420776367188, -0.019794464111328125, -0.012979507446289062, -0.00616455078125, 0.0006504058837890625, 0.007465362548828125, 0.014280319213867188, 0.02109527587890625, 0.027910232543945312, 0.034725189208984375, 0.04154014587402344, 0.0483551025390625, 0.05517005920410156, 0.061985015869140625, 0.06879997253417969, 0.07561492919921875, 0.08242988586425781, 0.08924484252929688, 0.09605979919433594, 0.102874755859375, 0.10968971252441406, 0.11650466918945312, 0.12331962585449219, 0.13013458251953125, 0.1369495391845703, 0.14376449584960938, 0.15057945251464844, 0.1573944091796875, 0.16420936584472656, 0.17102432250976562, 0.1778392791748047, 0.18465423583984375, 0.1914691925048828, 0.19828414916992188, 0.20509910583496094, 0.2119140625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 0.0, 3.0, 5.0, 9.0, 4.0, 15.0, 12.0, 16.0, 26.0, 42.0, 35.0, 35.0, 48.0, 60.0, 56.0, 54.0, 58.0, 75.0, 79.0, 57.0, 48.0, 44.0, 39.0, 39.0, 29.0, 20.0, 21.0, 31.0, 8.0, 10.0, 7.0, 7.0, 0.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10498046875, -0.10171318054199219, -0.09844589233398438, -0.09517860412597656, -0.09191131591796875, -0.08864402770996094, -0.08537673950195312, -0.08210945129394531, -0.0788421630859375, -0.07557487487792969, -0.07230758666992188, -0.06904029846191406, -0.06577301025390625, -0.06250572204589844, -0.059238433837890625, -0.05597114562988281, -0.052703857421875, -0.04943656921386719, -0.046169281005859375, -0.04290199279785156, -0.03963470458984375, -0.03636741638183594, -0.033100128173828125, -0.029832839965820312, -0.0265655517578125, -0.023298263549804688, -0.020030975341796875, -0.016763687133789062, -0.01349639892578125, -0.010229110717773438, -0.006961822509765625, -0.0036945343017578125, -0.00042724609375, 0.0028400421142578125, 0.006107330322265625, 0.009374618530273438, 0.01264190673828125, 0.015909194946289062, 0.019176483154296875, 0.022443771362304688, 0.0257110595703125, 0.028978347778320312, 0.032245635986328125, 0.03551292419433594, 0.03878021240234375, 0.04204750061035156, 0.045314788818359375, 0.04858207702636719, 0.051849365234375, 0.05511665344238281, 0.058383941650390625, 0.06165122985839844, 0.06491851806640625, 0.06818580627441406, 0.07145309448242188, 0.07472038269042969, 0.0779876708984375, 0.08125495910644531, 0.08452224731445312, 0.08778953552246094, 0.09105682373046875, 0.09432411193847656, 0.09759140014648438, 0.10085868835449219, 0.1041259765625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 6.0, 10.0, 11.0, 15.0, 14.0, 25.0, 37.0, 53.0, 81.0, 101.0, 150.0, 207.0, 382.0, 571.0, 1005.0, 2069.0, 5466.0, 23520.0, 205141.0, 675304.0, 111104.0, 15331.0, 3889.0, 1677.0, 883.0, 513.0, 268.0, 220.0, 172.0, 111.0, 57.0, 45.0, 26.0, 21.0, 23.0, 14.0, 7.0, 8.0, 5.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.341064453125, -0.33052825927734375, -0.3199920654296875, -0.30945587158203125, -0.298919677734375, -0.28838348388671875, -0.2778472900390625, -0.26731109619140625, -0.25677490234375, -0.24623870849609375, -0.2357025146484375, -0.22516632080078125, -0.214630126953125, -0.20409393310546875, -0.1935577392578125, -0.18302154541015625, -0.1724853515625, -0.16194915771484375, -0.1514129638671875, -0.14087677001953125, -0.130340576171875, -0.11980438232421875, -0.1092681884765625, -0.09873199462890625, -0.08819580078125, -0.07765960693359375, -0.0671234130859375, -0.05658721923828125, -0.046051025390625, -0.03551483154296875, -0.0249786376953125, -0.01444244384765625, -0.00390625, 0.00662994384765625, 0.0171661376953125, 0.02770233154296875, 0.038238525390625, 0.04877471923828125, 0.0593109130859375, 0.06984710693359375, 0.08038330078125, 0.09091949462890625, 0.1014556884765625, 0.11199188232421875, 0.122528076171875, 0.13306427001953125, 0.1436004638671875, 0.15413665771484375, 0.1646728515625, 0.17520904541015625, 0.1857452392578125, 0.19628143310546875, 0.206817626953125, 0.21735382080078125, 0.2278900146484375, 0.23842620849609375, 0.24896240234375, 0.25949859619140625, 0.2700347900390625, 0.28057098388671875, 0.291107177734375, 0.30164337158203125, 0.3121795654296875, 0.32271575927734375, 0.333251953125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 6.0, 6.0, 7.0, 7.0, 13.0, 14.0, 10.0, 14.0, 13.0, 25.0, 24.0, 26.0, 29.0, 34.0, 42.0, 42.0, 43.0, 33.0, 53.0, 58.0, 47.0, 48.0, 36.0, 46.0, 30.0, 34.0, 51.0, 42.0, 25.0, 29.0, 19.0, 16.0, 20.0, 14.0, 12.0, 6.0, 7.0, 4.0, 7.0, 8.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4091796875, -0.3976097106933594, -0.38603973388671875, -0.3744697570800781, -0.3628997802734375, -0.3513298034667969, -0.33975982666015625, -0.3281898498535156, -0.316619873046875, -0.3050498962402344, -0.29347991943359375, -0.2819099426269531, -0.2703399658203125, -0.2587699890136719, -0.24720001220703125, -0.23563003540039062, -0.22406005859375, -0.21249008178710938, -0.20092010498046875, -0.18935012817382812, -0.1777801513671875, -0.16621017456054688, -0.15464019775390625, -0.14307022094726562, -0.131500244140625, -0.11993026733398438, -0.10836029052734375, -0.09679031372070312, -0.0852203369140625, -0.07365036010742188, -0.06208038330078125, -0.050510406494140625, -0.0389404296875, -0.027370452880859375, -0.01580047607421875, -0.004230499267578125, 0.0073394775390625, 0.018909454345703125, 0.03047943115234375, 0.042049407958984375, 0.053619384765625, 0.06518936157226562, 0.07675933837890625, 0.08832931518554688, 0.0998992919921875, 0.11146926879882812, 0.12303924560546875, 0.13460922241210938, 0.14617919921875, 0.15774917602539062, 0.16931915283203125, 0.18088912963867188, 0.1924591064453125, 0.20402908325195312, 0.21559906005859375, 0.22716903686523438, 0.238739013671875, 0.2503089904785156, 0.26187896728515625, 0.2734489440917969, 0.2850189208984375, 0.2965888977050781, 0.30815887451171875, 0.3197288513183594, 0.331298828125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 4.0, 8.0, 4.0, 10.0, 13.0, 14.0, 22.0, 29.0, 54.0, 66.0, 127.0, 219.0, 377.0, 695.0, 1652.0, 4552.0, 19441.0, 170961.0, 708703.0, 119778.0, 15041.0, 3798.0, 1461.0, 652.0, 319.0, 202.0, 119.0, 69.0, 57.0, 33.0, 22.0, 13.0, 13.0, 8.0, 5.0, 4.0, 4.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1885986328125, -0.1832752227783203, -0.17795181274414062, -0.17262840270996094, -0.16730499267578125, -0.16198158264160156, -0.15665817260742188, -0.1513347625732422, -0.1460113525390625, -0.1406879425048828, -0.13536453247070312, -0.13004112243652344, -0.12471771240234375, -0.11939430236816406, -0.11407089233398438, -0.10874748229980469, -0.103424072265625, -0.09810066223144531, -0.09277725219726562, -0.08745384216308594, -0.08213043212890625, -0.07680702209472656, -0.07148361206054688, -0.06616020202636719, -0.0608367919921875, -0.05551338195800781, -0.050189971923828125, -0.04486656188964844, -0.03954315185546875, -0.03421974182128906, -0.028896331787109375, -0.023572921752929688, -0.01824951171875, -0.012926101684570312, -0.007602691650390625, -0.0022792816162109375, 0.00304412841796875, 0.008367538452148438, 0.013690948486328125, 0.019014358520507812, 0.0243377685546875, 0.029661178588867188, 0.034984588623046875, 0.04030799865722656, 0.04563140869140625, 0.05095481872558594, 0.056278228759765625, 0.06160163879394531, 0.066925048828125, 0.07224845886230469, 0.07757186889648438, 0.08289527893066406, 0.08821868896484375, 0.09354209899902344, 0.09886550903320312, 0.10418891906738281, 0.1095123291015625, 0.11483573913574219, 0.12015914916992188, 0.12548255920410156, 0.13080596923828125, 0.13612937927246094, 0.14145278930664062, 0.1467761993408203, 0.152099609375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 12.0, 15.0, 19.0, 22.0, 32.0, 54.0, 70.0, 74.0, 76.0, 96.0, 100.0, 102.0, 89.0, 68.0, 53.0, 31.0, 27.0, 20.0, 17.0, 6.0, 10.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.502866744995117e-05, -6.263144314289093e-05, -6.023421883583069e-05, -5.783699452877045e-05, -5.5439770221710205e-05, -5.304254591464996e-05, -5.064532160758972e-05, -4.824809730052948e-05, -4.585087299346924e-05, -4.3453648686408997e-05, -4.1056424379348755e-05, -3.865920007228851e-05, -3.626197576522827e-05, -3.386475145816803e-05, -3.146752715110779e-05, -2.9070302844047546e-05, -2.6673078536987305e-05, -2.4275854229927063e-05, -2.187862992286682e-05, -1.948140561580658e-05, -1.7084181308746338e-05, -1.4686957001686096e-05, -1.2289732694625854e-05, -9.892508387565613e-06, -7.495284080505371e-06, -5.098059773445129e-06, -2.7008354663848877e-06, -3.03611159324646e-07, 2.0936131477355957e-06, 4.490837454795837e-06, 6.888061761856079e-06, 9.28528606891632e-06, 1.1682510375976562e-05, 1.4079734683036804e-05, 1.6476958990097046e-05, 1.8874183297157288e-05, 2.127140760421753e-05, 2.366863191127777e-05, 2.6065856218338013e-05, 2.8463080525398254e-05, 3.0860304832458496e-05, 3.325752913951874e-05, 3.565475344657898e-05, 3.805197775363922e-05, 4.044920206069946e-05, 4.2846426367759705e-05, 4.5243650674819946e-05, 4.764087498188019e-05, 5.003809928894043e-05, 5.243532359600067e-05, 5.483254790306091e-05, 5.7229772210121155e-05, 5.9626996517181396e-05, 6.202422082424164e-05, 6.442144513130188e-05, 6.681866943836212e-05, 6.921589374542236e-05, 7.16131180524826e-05, 7.401034235954285e-05, 7.640756666660309e-05, 7.880479097366333e-05, 8.120201528072357e-05, 8.359923958778381e-05, 8.599646389484406e-05, 8.83936882019043e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 7.0, 9.0, 6.0, 13.0, 12.0, 19.0, 28.0, 39.0, 71.0, 116.0, 189.0, 388.0, 809.0, 1871.0, 4813.0, 21423.0, 221104.0, 690238.0, 89631.0, 11719.0, 3353.0, 1298.0, 627.0, 308.0, 179.0, 104.0, 55.0, 39.0, 25.0, 17.0, 16.0, 8.0, 7.0, 6.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1558837890625, -0.15056800842285156, -0.14525222778320312, -0.1399364471435547, -0.13462066650390625, -0.1293048858642578, -0.12398910522460938, -0.11867332458496094, -0.1133575439453125, -0.10804176330566406, -0.10272598266601562, -0.09741020202636719, -0.09209442138671875, -0.08677864074707031, -0.08146286010742188, -0.07614707946777344, -0.070831298828125, -0.06551551818847656, -0.060199737548828125, -0.05488395690917969, -0.04956817626953125, -0.04425239562988281, -0.038936614990234375, -0.03362083435058594, -0.0283050537109375, -0.022989273071289062, -0.017673492431640625, -0.012357711791992188, -0.00704193115234375, -0.0017261505126953125, 0.003589630126953125, 0.008905410766601562, 0.01422119140625, 0.019536972045898438, 0.024852752685546875, 0.030168533325195312, 0.03548431396484375, 0.04080009460449219, 0.046115875244140625, 0.05143165588378906, 0.0567474365234375, 0.06206321716308594, 0.06737899780273438, 0.07269477844238281, 0.07801055908203125, 0.08332633972167969, 0.08864212036132812, 0.09395790100097656, 0.099273681640625, 0.10458946228027344, 0.10990524291992188, 0.11522102355957031, 0.12053680419921875, 0.1258525848388672, 0.13116836547851562, 0.13648414611816406, 0.1417999267578125, 0.14711570739746094, 0.15243148803710938, 0.1577472686767578, 0.16306304931640625, 0.1683788299560547, 0.17369461059570312, 0.17901039123535156, 0.184326171875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 9.0, 9.0, 12.0, 19.0, 25.0, 26.0, 51.0, 50.0, 78.0, 96.0, 90.0, 111.0, 103.0, 72.0, 73.0, 63.0, 40.0, 23.0, 22.0, 10.0, 9.0, 6.0, 1.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.14794921875, -0.1432323455810547, -0.13851547241210938, -0.13379859924316406, -0.12908172607421875, -0.12436485290527344, -0.11964797973632812, -0.11493110656738281, -0.1102142333984375, -0.10549736022949219, -0.10078048706054688, -0.09606361389160156, -0.09134674072265625, -0.08662986755371094, -0.08191299438476562, -0.07719612121582031, -0.072479248046875, -0.06776237487792969, -0.06304550170898438, -0.05832862854003906, -0.05361175537109375, -0.04889488220214844, -0.044178009033203125, -0.03946113586425781, -0.0347442626953125, -0.030027389526367188, -0.025310516357421875, -0.020593643188476562, -0.01587677001953125, -0.011159896850585938, -0.006443023681640625, -0.0017261505126953125, 0.00299072265625, 0.0077075958251953125, 0.012424468994140625, 0.017141342163085938, 0.02185821533203125, 0.026575088500976562, 0.031291961669921875, 0.03600883483886719, 0.0407257080078125, 0.04544258117675781, 0.050159454345703125, 0.05487632751464844, 0.05959320068359375, 0.06431007385253906, 0.06902694702148438, 0.07374382019042969, 0.078460693359375, 0.08317756652832031, 0.08789443969726562, 0.09261131286621094, 0.09732818603515625, 0.10204505920410156, 0.10676193237304688, 0.11147880554199219, 0.1161956787109375, 0.12091255187988281, 0.12562942504882812, 0.13034629821777344, 0.13506317138671875, 0.13978004455566406, 0.14449691772460938, 0.1492137908935547, 0.1539306640625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 5.0, 8.0, 30.0, 50.0, 108.0, 181.0, 197.0, 191.0, 132.0, 61.0, 26.0, 10.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.165902137756348, -5.057231903076172, -4.948562145233154, -4.8398919105529785, -4.731222152709961, -4.622551918029785, -4.513881683349609, -4.405211925506592, -4.296541690826416, -4.18787145614624, -4.079201698303223, -3.970531463623047, -3.86186146736145, -3.7531914710998535, -3.644521474838257, -3.53585147857666, -3.4271814823150635, -3.318511486053467, -3.20984148979187, -3.1011714935302734, -2.9925012588500977, -2.883831262588501, -2.7751612663269043, -2.6664912700653076, -2.557821273803711, -2.4491512775421143, -2.3404812812805176, -2.231811046600342, -2.123141050338745, -2.0144710540771484, -1.9058010578155518, -1.797131061553955, -1.6884608268737793, -1.5797908306121826, -1.4711207151412964, -1.3624507188796997, -1.2537806034088135, -1.1451106071472168, -1.0364406108856201, -0.9277705550193787, -0.8191004991531372, -0.7104304432868958, -0.6017603874206543, -0.4930903911590576, -0.38442033529281616, -0.2757502794265747, -0.16708028316497803, -0.05841022729873657, 0.05025982856750488, 0.15892986953258514, 0.2675999104976654, 0.3762699365615845, 0.4849399924278259, 0.5936100482940674, 0.7022800445556641, 0.8109501004219055, 0.919620156288147, 1.0282901525497437, 1.1369602680206299, 1.2456302642822266, 1.3543002605438232, 1.4629703760147095, 1.5716403722763062, 1.6803104877471924, 1.788980484008789]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 8.0, 4.0, 9.0, 6.0, 8.0, 23.0, 18.0, 16.0, 24.0, 19.0, 27.0, 31.0, 41.0, 47.0, 41.0, 43.0, 47.0, 40.0, 53.0, 53.0, 56.0, 49.0, 45.0, 37.0, 36.0, 46.0, 23.0, 20.0, 23.0, 23.0, 20.0, 14.0, 12.0, 7.0, 12.0, 7.0, 2.0, 6.0, 1.0, 3.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8363511562347412, -1.783287525177002, -1.7302238941192627, -1.6771602630615234, -1.6240966320037842, -1.571033000946045, -1.5179694890975952, -1.464905858039856, -1.4118422269821167, -1.3587785959243774, -1.3057149648666382, -1.252651333808899, -1.1995878219604492, -1.14652419090271, -1.0934605598449707, -1.0403969287872314, -0.9873332977294922, -0.9342696666717529, -0.8812060356140137, -0.8281424641609192, -0.7750788331031799, -0.7220152020454407, -0.6689516305923462, -0.6158879995346069, -0.5628243684768677, -0.5097607374191284, -0.45669713616371155, -0.4036335349082947, -0.3505699038505554, -0.29750627279281616, -0.2444426715373993, -0.19137907028198242, -0.13831555843353271, -0.08525194227695465, -0.03218832612037659, 0.020875290036201477, 0.07393890619277954, 0.1270025372505188, 0.18006613850593567, 0.23312973976135254, 0.2861933708190918, 0.33925700187683105, 0.3923206031322479, 0.4453842043876648, 0.49844783544540405, 0.5515114665031433, 0.6045750379562378, 0.657638669013977, 0.7107023000717163, 0.7637659311294556, 0.8168295621871948, 0.8698931336402893, 0.9229567646980286, 0.9760203957557678, 1.0290839672088623, 1.0821475982666016, 1.1352112293243408, 1.18827486038208, 1.2413384914398193, 1.2944021224975586, 1.3474657535552979, 1.400529384613037, 1.4535928964614868, 1.506656527519226, 1.5597201585769653]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 4.0, 17.0, 19.0, 11.0, 28.0, 37.0, 46.0, 65.0, 101.0, 126.0, 202.0, 289.0, 384.0, 644.0, 1035.0, 1840.0, 4080.0, 13111.0, 154518.0, 3988309.0, 18822.0, 5056.0, 2223.0, 1173.0, 670.0, 436.0, 287.0, 228.0, 146.0, 105.0, 86.0, 49.0, 43.0, 25.0, 21.0, 11.0, 11.0, 8.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.384033203125, -0.3716888427734375, -0.359344482421875, -0.3470001220703125, -0.33465576171875, -0.3223114013671875, -0.309967041015625, -0.2976226806640625, -0.2852783203125, -0.2729339599609375, -0.260589599609375, -0.2482452392578125, -0.23590087890625, -0.2235565185546875, -0.211212158203125, -0.1988677978515625, -0.1865234375, -0.1741790771484375, -0.161834716796875, -0.1494903564453125, -0.13714599609375, -0.1248016357421875, -0.112457275390625, -0.1001129150390625, -0.0877685546875, -0.0754241943359375, -0.063079833984375, -0.0507354736328125, -0.03839111328125, -0.0260467529296875, -0.013702392578125, -0.0013580322265625, 0.010986328125, 0.0233306884765625, 0.035675048828125, 0.0480194091796875, 0.06036376953125, 0.0727081298828125, 0.085052490234375, 0.0973968505859375, 0.1097412109375, 0.1220855712890625, 0.134429931640625, 0.1467742919921875, 0.15911865234375, 0.1714630126953125, 0.183807373046875, 0.1961517333984375, 0.20849609375, 0.2208404541015625, 0.233184814453125, 0.2455291748046875, 0.25787353515625, 0.2702178955078125, 0.282562255859375, 0.2949066162109375, 0.3072509765625, 0.3195953369140625, 0.331939697265625, 0.3442840576171875, 0.35662841796875, 0.3689727783203125, 0.381317138671875, 0.3936614990234375, 0.406005859375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 7.0, 8.0, 11.0, 24.0, 16.0, 17.0, 29.0, 36.0, 45.0, 53.0, 58.0, 46.0, 57.0, 63.0, 52.0, 65.0, 66.0, 51.0, 68.0, 39.0, 36.0, 41.0, 29.0, 25.0, 12.0, 15.0, 11.0, 3.0, 1.0, 4.0, 4.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1016845703125, -0.0985565185546875, -0.095428466796875, -0.0923004150390625, -0.08917236328125, -0.0860443115234375, -0.082916259765625, -0.0797882080078125, -0.07666015625, -0.0735321044921875, -0.070404052734375, -0.0672760009765625, -0.06414794921875, -0.0610198974609375, -0.057891845703125, -0.0547637939453125, -0.0516357421875, -0.0485076904296875, -0.045379638671875, -0.0422515869140625, -0.03912353515625, -0.0359954833984375, -0.032867431640625, -0.0297393798828125, -0.026611328125, -0.0234832763671875, -0.020355224609375, -0.0172271728515625, -0.01409912109375, -0.0109710693359375, -0.007843017578125, -0.0047149658203125, -0.0015869140625, 0.0015411376953125, 0.004669189453125, 0.0077972412109375, 0.01092529296875, 0.0140533447265625, 0.017181396484375, 0.0203094482421875, 0.0234375, 0.0265655517578125, 0.029693603515625, 0.0328216552734375, 0.03594970703125, 0.0390777587890625, 0.042205810546875, 0.0453338623046875, 0.0484619140625, 0.0515899658203125, 0.054718017578125, 0.0578460693359375, 0.06097412109375, 0.0641021728515625, 0.067230224609375, 0.0703582763671875, 0.073486328125, 0.0766143798828125, 0.079742431640625, 0.0828704833984375, 0.08599853515625, 0.0891265869140625, 0.092254638671875, 0.0953826904296875, 0.0985107421875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 5.0, 9.0, 9.0, 10.0, 17.0, 20.0, 15.0, 28.0, 38.0, 40.0, 46.0, 68.0, 118.0, 129.0, 144.0, 218.0, 363.0, 690.0, 1434.0, 3860.0, 16417.0, 3855322.0, 295062.0, 13539.0, 3531.0, 1327.0, 585.0, 365.0, 215.0, 135.0, 106.0, 98.0, 71.0, 49.0, 47.0, 28.0, 33.0, 21.0, 22.0, 9.0, 11.0, 4.0, 4.0, 4.0, 7.0, 5.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0], "bins": [-0.5791015625, -0.5615234375, -0.5439453125, -0.5263671875, -0.5087890625, -0.4912109375, -0.4736328125, -0.4560546875, -0.4384765625, -0.4208984375, -0.4033203125, -0.3857421875, -0.3681640625, -0.3505859375, -0.3330078125, -0.3154296875, -0.2978515625, -0.2802734375, -0.2626953125, -0.2451171875, -0.2275390625, -0.2099609375, -0.1923828125, -0.1748046875, -0.1572265625, -0.1396484375, -0.1220703125, -0.1044921875, -0.0869140625, -0.0693359375, -0.0517578125, -0.0341796875, -0.0166015625, 0.0009765625, 0.0185546875, 0.0361328125, 0.0537109375, 0.0712890625, 0.0888671875, 0.1064453125, 0.1240234375, 0.1416015625, 0.1591796875, 0.1767578125, 0.1943359375, 0.2119140625, 0.2294921875, 0.2470703125, 0.2646484375, 0.2822265625, 0.2998046875, 0.3173828125, 0.3349609375, 0.3525390625, 0.3701171875, 0.3876953125, 0.4052734375, 0.4228515625, 0.4404296875, 0.4580078125, 0.4755859375, 0.4931640625, 0.5107421875, 0.5283203125, 0.5458984375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 17.0, 18.0, 62.0, 3543.0, 335.0, 50.0, 19.0, 12.0, 7.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17626953125, -0.17073440551757812, -0.16519927978515625, -0.15966415405273438, -0.1541290283203125, -0.14859390258789062, -0.14305877685546875, -0.13752365112304688, -0.131988525390625, -0.12645339965820312, -0.12091827392578125, -0.11538314819335938, -0.1098480224609375, -0.10431289672851562, -0.09877777099609375, -0.09324264526367188, -0.08770751953125, -0.08217239379882812, -0.07663726806640625, -0.07110214233398438, -0.0655670166015625, -0.060031890869140625, -0.05449676513671875, -0.048961639404296875, -0.043426513671875, -0.037891387939453125, -0.03235626220703125, -0.026821136474609375, -0.0212860107421875, -0.015750885009765625, -0.01021575927734375, -0.004680633544921875, 0.0008544921875, 0.006389617919921875, 0.01192474365234375, 0.017459869384765625, 0.0229949951171875, 0.028530120849609375, 0.03406524658203125, 0.039600372314453125, 0.045135498046875, 0.050670623779296875, 0.05620574951171875, 0.061740875244140625, 0.0672760009765625, 0.07281112670898438, 0.07834625244140625, 0.08388137817382812, 0.08941650390625, 0.09495162963867188, 0.10048675537109375, 0.10602188110351562, 0.1115570068359375, 0.11709213256835938, 0.12262725830078125, 0.12816238403320312, 0.133697509765625, 0.13923263549804688, 0.14476776123046875, 0.15030288696289062, 0.1558380126953125, 0.16137313842773438, 0.16690826416015625, 0.17244338989257812, 0.177978515625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 12.0, 13.0, 14.0, 26.0, 36.0, 60.0, 102.0, 106.0, 147.0, 152.0, 117.0, 87.0, 57.0, 28.0, 12.0, 10.0, 4.0, 8.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3946044445037842, -0.3813950717449188, -0.36818569898605347, -0.3549763262271881, -0.34176695346832275, -0.3285575807094574, -0.31534820795059204, -0.3021388351917267, -0.28892946243286133, -0.27572008967399597, -0.2625107169151306, -0.24930134415626526, -0.2360919713973999, -0.22288259863853455, -0.2096732258796692, -0.19646385312080383, -0.18325448036193848, -0.17004510760307312, -0.15683573484420776, -0.1436263620853424, -0.13041698932647705, -0.1172076165676117, -0.10399824380874634, -0.09078887104988098, -0.07757949829101562, -0.06437012553215027, -0.05116075277328491, -0.037951380014419556, -0.0247420072555542, -0.011532634496688843, 0.0016767382621765137, 0.01488611102104187, 0.028095483779907227, 0.04130485653877258, 0.05451422929763794, 0.0677236020565033, 0.08093297481536865, 0.09414234757423401, 0.10735172033309937, 0.12056109309196472, 0.13377046585083008, 0.14697983860969543, 0.1601892113685608, 0.17339858412742615, 0.1866079568862915, 0.19981732964515686, 0.21302670240402222, 0.22623607516288757, 0.23944544792175293, 0.2526548206806183, 0.26586419343948364, 0.279073566198349, 0.29228293895721436, 0.3054923117160797, 0.31870168447494507, 0.3319110572338104, 0.3451204299926758, 0.35832980275154114, 0.3715391755104065, 0.38474854826927185, 0.3979579210281372, 0.41116729378700256, 0.4243766665458679, 0.4375860393047333, 0.45079541206359863]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 9.0, 9.0, 8.0, 8.0, 10.0, 9.0, 21.0, 19.0, 22.0, 24.0, 26.0, 22.0, 31.0, 46.0, 38.0, 42.0, 31.0, 45.0, 36.0, 50.0, 43.0, 40.0, 43.0, 34.0, 47.0, 32.0, 30.0, 34.0, 18.0, 22.0, 24.0, 21.0, 11.0, 8.0, 22.0, 9.0, 17.0, 9.0, 4.0, 7.0, 3.0, 5.0, 2.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1824837327003479, -0.1767328530550003, -0.1709819883108139, -0.1652311086654663, -0.1594802290201187, -0.15372934937477112, -0.14797848463058472, -0.14222760498523712, -0.13647672533988953, -0.13072584569454193, -0.12497497349977493, -0.11922410130500793, -0.11347322165966034, -0.10772234946489334, -0.10197147727012634, -0.09622059762477875, -0.09046973288059235, -0.08471886068582535, -0.07896798104047775, -0.07321710884571075, -0.06746622920036316, -0.06171535700559616, -0.05596448481082916, -0.050213608890771866, -0.04446273297071457, -0.03871185705065727, -0.032960981130599976, -0.027210108935832977, -0.02145923301577568, -0.015708357095718384, -0.009957484900951385, -0.004206608980894089, 0.001544266939163208, 0.00729514192789793, 0.013046016916632652, 0.0187968909740448, 0.024547766894102097, 0.030298642814159393, 0.03604951500892639, 0.04180039092898369, 0.047551266849040985, 0.05330214276909828, 0.05905301868915558, 0.06480389088392258, 0.07055476307868958, 0.07630564272403717, 0.08205651491880417, 0.08780738711357117, 0.09355826675891876, 0.09930913895368576, 0.10506001859903336, 0.11081089079380035, 0.11656177043914795, 0.12231264263391495, 0.12806351482868195, 0.13381439447402954, 0.13956525921821594, 0.14531613886356354, 0.15106700360774994, 0.15681788325309753, 0.16256876289844513, 0.16831964254379272, 0.17407050728797913, 0.17982138693332672, 0.18557226657867432]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 7.0, 7.0, 14.0, 25.0, 24.0, 29.0, 73.0, 110.0, 132.0, 189.0, 251.0, 459.0, 698.0, 968.0, 1586.0, 2520.0, 4209.0, 7127.0, 12994.0, 24228.0, 48509.0, 98425.0, 193527.0, 270957.0, 186598.0, 94829.0, 45966.0, 23528.0, 12326.0, 7157.0, 4180.0, 2456.0, 1528.0, 1024.0, 601.0, 431.0, 271.0, 189.0, 142.0, 93.0, 62.0, 32.0, 16.0, 20.0, 18.0, 13.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.1278076171875, -0.12398910522460938, -0.12017059326171875, -0.11635208129882812, -0.1125335693359375, -0.10871505737304688, -0.10489654541015625, -0.10107803344726562, -0.097259521484375, -0.09344100952148438, -0.08962249755859375, -0.08580398559570312, -0.0819854736328125, -0.07816696166992188, -0.07434844970703125, -0.07052993774414062, -0.06671142578125, -0.06289291381835938, -0.05907440185546875, -0.055255889892578125, -0.0514373779296875, -0.047618865966796875, -0.04380035400390625, -0.039981842041015625, -0.036163330078125, -0.032344818115234375, -0.02852630615234375, -0.024707794189453125, -0.0208892822265625, -0.017070770263671875, -0.01325225830078125, -0.009433746337890625, -0.005615234375, -0.001796722412109375, 0.00202178955078125, 0.005840301513671875, 0.0096588134765625, 0.013477325439453125, 0.01729583740234375, 0.021114349365234375, 0.024932861328125, 0.028751373291015625, 0.03256988525390625, 0.036388397216796875, 0.0402069091796875, 0.044025421142578125, 0.04784393310546875, 0.051662445068359375, 0.05548095703125, 0.059299468994140625, 0.06311798095703125, 0.06693649291992188, 0.0707550048828125, 0.07457351684570312, 0.07839202880859375, 0.08221054077148438, 0.086029052734375, 0.08984756469726562, 0.09366607666015625, 0.09748458862304688, 0.1013031005859375, 0.10512161254882812, 0.10894012451171875, 0.11275863647460938, 0.1165771484375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 5.0, 6.0, 11.0, 17.0, 17.0, 22.0, 20.0, 25.0, 43.0, 44.0, 43.0, 41.0, 64.0, 53.0, 55.0, 68.0, 64.0, 60.0, 63.0, 39.0, 47.0, 50.0, 30.0, 21.0, 19.0, 18.0, 13.0, 16.0, 6.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10687255859375, -0.10356807708740234, -0.10026359558105469, -0.09695911407470703, -0.09365463256835938, -0.09035015106201172, -0.08704566955566406, -0.0837411880493164, -0.08043670654296875, -0.0771322250366211, -0.07382774353027344, -0.07052326202392578, -0.06721878051757812, -0.06391429901123047, -0.06060981750488281, -0.057305335998535156, -0.0540008544921875, -0.050696372985839844, -0.04739189147949219, -0.04408740997314453, -0.040782928466796875, -0.03747844696044922, -0.03417396545410156, -0.030869483947753906, -0.02756500244140625, -0.024260520935058594, -0.020956039428710938, -0.01765155792236328, -0.014347076416015625, -0.011042594909667969, -0.0077381134033203125, -0.004433631896972656, -0.001129150390625, 0.0021753311157226562, 0.0054798126220703125, 0.008784294128417969, 0.012088775634765625, 0.015393257141113281, 0.018697738647460938, 0.022002220153808594, 0.02530670166015625, 0.028611183166503906, 0.03191566467285156, 0.03522014617919922, 0.038524627685546875, 0.04182910919189453, 0.04513359069824219, 0.048438072204589844, 0.0517425537109375, 0.055047035217285156, 0.05835151672363281, 0.06165599822998047, 0.06496047973632812, 0.06826496124267578, 0.07156944274902344, 0.0748739242553711, 0.07817840576171875, 0.0814828872680664, 0.08478736877441406, 0.08809185028076172, 0.09139633178710938, 0.09470081329345703, 0.09800529479980469, 0.10130977630615234, 0.1046142578125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 7.0, 10.0, 3.0, 13.0, 19.0, 19.0, 23.0, 33.0, 36.0, 71.0, 88.0, 106.0, 131.0, 224.0, 306.0, 476.0, 751.0, 1377.0, 3245.0, 11958.0, 86766.0, 711866.0, 200903.0, 21058.0, 4689.0, 1701.0, 921.0, 537.0, 370.0, 243.0, 162.0, 116.0, 87.0, 53.0, 55.0, 36.0, 24.0, 22.0, 10.0, 15.0, 12.0, 8.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30859375, -0.29853057861328125, -0.2884674072265625, -0.27840423583984375, -0.268341064453125, -0.25827789306640625, -0.2482147216796875, -0.23815155029296875, -0.22808837890625, -0.21802520751953125, -0.2079620361328125, -0.19789886474609375, -0.187835693359375, -0.17777252197265625, -0.1677093505859375, -0.15764617919921875, -0.1475830078125, -0.13751983642578125, -0.1274566650390625, -0.11739349365234375, -0.107330322265625, -0.09726715087890625, -0.0872039794921875, -0.07714080810546875, -0.06707763671875, -0.05701446533203125, -0.0469512939453125, -0.03688812255859375, -0.026824951171875, -0.01676177978515625, -0.0066986083984375, 0.00336456298828125, 0.013427734375, 0.02349090576171875, 0.0335540771484375, 0.04361724853515625, 0.053680419921875, 0.06374359130859375, 0.0738067626953125, 0.08386993408203125, 0.09393310546875, 0.10399627685546875, 0.1140594482421875, 0.12412261962890625, 0.134185791015625, 0.14424896240234375, 0.1543121337890625, 0.16437530517578125, 0.1744384765625, 0.18450164794921875, 0.1945648193359375, 0.20462799072265625, 0.214691162109375, 0.22475433349609375, 0.2348175048828125, 0.24488067626953125, 0.25494384765625, 0.26500701904296875, 0.2750701904296875, 0.28513336181640625, 0.295196533203125, 0.30525970458984375, 0.3153228759765625, 0.32538604736328125, 0.33544921875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 7.0, 6.0, 5.0, 7.0, 4.0, 14.0, 9.0, 14.0, 6.0, 21.0, 24.0, 24.0, 21.0, 28.0, 35.0, 21.0, 40.0, 34.0, 52.0, 37.0, 41.0, 35.0, 46.0, 40.0, 30.0, 38.0, 37.0, 43.0, 32.0, 34.0, 26.0, 25.0, 27.0, 20.0, 26.0, 19.0, 16.0, 13.0, 14.0, 7.0, 6.0, 4.0, 2.0, 6.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.316650390625, -0.3068962097167969, -0.29714202880859375, -0.2873878479003906, -0.2776336669921875, -0.2678794860839844, -0.25812530517578125, -0.24837112426757812, -0.238616943359375, -0.22886276245117188, -0.21910858154296875, -0.20935440063476562, -0.1996002197265625, -0.18984603881835938, -0.18009185791015625, -0.17033767700195312, -0.16058349609375, -0.15082931518554688, -0.14107513427734375, -0.13132095336914062, -0.1215667724609375, -0.11181259155273438, -0.10205841064453125, -0.09230422973632812, -0.082550048828125, -0.07279586791992188, -0.06304168701171875, -0.053287506103515625, -0.0435333251953125, -0.033779144287109375, -0.02402496337890625, -0.014270782470703125, -0.0045166015625, 0.005237579345703125, 0.01499176025390625, 0.024745941162109375, 0.0345001220703125, 0.044254302978515625, 0.05400848388671875, 0.06376266479492188, 0.073516845703125, 0.08327102661132812, 0.09302520751953125, 0.10277938842773438, 0.1125335693359375, 0.12228775024414062, 0.13204193115234375, 0.14179611206054688, 0.15155029296875, 0.16130447387695312, 0.17105865478515625, 0.18081283569335938, 0.1905670166015625, 0.20032119750976562, 0.21007537841796875, 0.21982955932617188, 0.229583740234375, 0.23933792114257812, 0.24909210205078125, 0.2588462829589844, 0.2686004638671875, 0.2783546447753906, 0.28810882568359375, 0.2978630065917969, 0.3076171875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 2.0, 4.0, 6.0, 4.0, 11.0, 11.0, 18.0, 28.0, 50.0, 64.0, 89.0, 126.0, 237.0, 448.0, 918.0, 2360.0, 9903.0, 112263.0, 795056.0, 112545.0, 10006.0, 2347.0, 939.0, 423.0, 252.0, 151.0, 85.0, 67.0, 38.0, 28.0, 25.0, 13.0, 5.0, 11.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1826171875, -0.17699813842773438, -0.17137908935546875, -0.16576004028320312, -0.1601409912109375, -0.15452194213867188, -0.14890289306640625, -0.14328384399414062, -0.137664794921875, -0.13204574584960938, -0.12642669677734375, -0.12080764770507812, -0.1151885986328125, -0.10956954956054688, -0.10395050048828125, -0.09833145141601562, -0.09271240234375, -0.08709335327148438, -0.08147430419921875, -0.07585525512695312, -0.0702362060546875, -0.06461715698242188, -0.05899810791015625, -0.053379058837890625, -0.047760009765625, -0.042140960693359375, -0.03652191162109375, -0.030902862548828125, -0.0252838134765625, -0.019664764404296875, -0.01404571533203125, -0.008426666259765625, -0.0028076171875, 0.002811431884765625, 0.00843048095703125, 0.014049530029296875, 0.0196685791015625, 0.025287628173828125, 0.03090667724609375, 0.036525726318359375, 0.042144775390625, 0.047763824462890625, 0.05338287353515625, 0.059001922607421875, 0.0646209716796875, 0.07024002075195312, 0.07585906982421875, 0.08147811889648438, 0.08709716796875, 0.09271621704101562, 0.09833526611328125, 0.10395431518554688, 0.1095733642578125, 0.11519241333007812, 0.12081146240234375, 0.12643051147460938, 0.132049560546875, 0.13766860961914062, 0.14328765869140625, 0.14890670776367188, 0.1545257568359375, 0.16014480590820312, 0.16576385498046875, 0.17138290405273438, 0.177001953125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 8.0, 11.0, 9.0, 16.0, 9.0, 25.0, 18.0, 32.0, 37.0, 40.0, 76.0, 75.0, 58.0, 65.0, 73.0, 69.0, 70.0, 61.0, 49.0, 44.0, 29.0, 17.0, 17.0, 11.0, 5.0, 7.0, 7.0, 14.0, 6.0, 7.0, 1.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.143880844116211e-05, -4.9768947064876556e-05, -4.8099085688591003e-05, -4.642922431230545e-05, -4.47593629360199e-05, -4.3089501559734344e-05, -4.141964018344879e-05, -3.974977880716324e-05, -3.8079917430877686e-05, -3.641005605459213e-05, -3.474019467830658e-05, -3.3070333302021027e-05, -3.1400471925735474e-05, -2.973061054944992e-05, -2.8060749173164368e-05, -2.6390887796878815e-05, -2.4721026420593262e-05, -2.305116504430771e-05, -2.1381303668022156e-05, -1.9711442291736603e-05, -1.804158091545105e-05, -1.6371719539165497e-05, -1.4701858162879944e-05, -1.3031996786594391e-05, -1.1362135410308838e-05, -9.692274034023285e-06, -8.022412657737732e-06, -6.352551281452179e-06, -4.682689905166626e-06, -3.012828528881073e-06, -1.34296715259552e-06, 3.2689422369003296e-07, 1.996755599975586e-06, 3.666616976261139e-06, 5.336478352546692e-06, 7.006339728832245e-06, 8.676201105117798e-06, 1.034606248140335e-05, 1.2015923857688904e-05, 1.3685785233974457e-05, 1.535564661026001e-05, 1.7025507986545563e-05, 1.8695369362831116e-05, 2.036523073911667e-05, 2.203509211540222e-05, 2.3704953491687775e-05, 2.5374814867973328e-05, 2.704467624425888e-05, 2.8714537620544434e-05, 3.0384398996829987e-05, 3.205426037311554e-05, 3.372412174940109e-05, 3.5393983125686646e-05, 3.70638445019722e-05, 3.873370587825775e-05, 4.0403567254543304e-05, 4.207342863082886e-05, 4.374329000711441e-05, 4.541315138339996e-05, 4.7083012759685516e-05, 4.875287413597107e-05, 5.042273551225662e-05, 5.2092596888542175e-05, 5.376245826482773e-05, 5.543231964111328e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 3.0, 8.0, 13.0, 18.0, 17.0, 37.0, 45.0, 81.0, 157.0, 258.0, 535.0, 1013.0, 2572.0, 9416.0, 74085.0, 724089.0, 210847.0, 18355.0, 4121.0, 1449.0, 621.0, 343.0, 171.0, 129.0, 68.0, 39.0, 23.0, 11.0, 6.0, 2.0, 5.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.2293701171875, -0.22386837005615234, -0.2183666229248047, -0.21286487579345703, -0.20736312866210938, -0.20186138153076172, -0.19635963439941406, -0.1908578872680664, -0.18535614013671875, -0.1798543930053711, -0.17435264587402344, -0.16885089874267578, -0.16334915161132812, -0.15784740447998047, -0.1523456573486328, -0.14684391021728516, -0.1413421630859375, -0.13584041595458984, -0.1303386688232422, -0.12483692169189453, -0.11933517456054688, -0.11383342742919922, -0.10833168029785156, -0.1028299331665039, -0.09732818603515625, -0.0918264389038086, -0.08632469177246094, -0.08082294464111328, -0.07532119750976562, -0.06981945037841797, -0.06431770324707031, -0.058815956115722656, -0.053314208984375, -0.047812461853027344, -0.04231071472167969, -0.03680896759033203, -0.031307220458984375, -0.02580547332763672, -0.020303726196289062, -0.014801979064941406, -0.00930023193359375, -0.0037984848022460938, 0.0017032623291015625, 0.007205009460449219, 0.012706756591796875, 0.01820850372314453, 0.023710250854492188, 0.029211997985839844, 0.0347137451171875, 0.040215492248535156, 0.04571723937988281, 0.05121898651123047, 0.056720733642578125, 0.06222248077392578, 0.06772422790527344, 0.0732259750366211, 0.07872772216796875, 0.0842294692993164, 0.08973121643066406, 0.09523296356201172, 0.10073471069335938, 0.10623645782470703, 0.11173820495605469, 0.11723995208740234, 0.12274169921875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 10.0, 5.0, 7.0, 11.0, 13.0, 20.0, 34.0, 42.0, 48.0, 69.0, 100.0, 103.0, 109.0, 96.0, 80.0, 68.0, 47.0, 44.0, 33.0, 18.0, 15.0, 9.0, 8.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.19873046875, -0.19403457641601562, -0.18933868408203125, -0.18464279174804688, -0.1799468994140625, -0.17525100708007812, -0.17055511474609375, -0.16585922241210938, -0.161163330078125, -0.15646743774414062, -0.15177154541015625, -0.14707565307617188, -0.1423797607421875, -0.13768386840820312, -0.13298797607421875, -0.12829208374023438, -0.12359619140625, -0.11890029907226562, -0.11420440673828125, -0.10950851440429688, -0.1048126220703125, -0.10011672973632812, -0.09542083740234375, -0.09072494506835938, -0.086029052734375, -0.08133316040039062, -0.07663726806640625, -0.07194137573242188, -0.0672454833984375, -0.06254959106445312, -0.05785369873046875, -0.053157806396484375, -0.0484619140625, -0.043766021728515625, -0.03907012939453125, -0.034374237060546875, -0.0296783447265625, -0.024982452392578125, -0.02028656005859375, -0.015590667724609375, -0.010894775390625, -0.006198883056640625, -0.00150299072265625, 0.003192901611328125, 0.0078887939453125, 0.012584686279296875, 0.01728057861328125, 0.021976470947265625, 0.02667236328125, 0.031368255615234375, 0.03606414794921875, 0.040760040283203125, 0.0454559326171875, 0.050151824951171875, 0.05484771728515625, 0.059543609619140625, 0.064239501953125, 0.06893539428710938, 0.07363128662109375, 0.07832717895507812, 0.0830230712890625, 0.08771896362304688, 0.09241485595703125, 0.09711074829101562, 0.101806640625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 10.0, 10.0, 54.0, 172.0, 254.0, 255.0, 174.0, 55.0, 12.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.75568962097168, -4.62678337097168, -4.49787712097168, -4.368971347808838, -4.240065097808838, -4.111158847808838, -3.982252836227417, -3.853346824645996, -3.724440574645996, -3.595534324645996, -3.466628313064575, -3.3377223014831543, -3.2088160514831543, -3.0799098014831543, -2.9510037899017334, -2.8220977783203125, -2.6931915283203125, -2.5642852783203125, -2.4353792667388916, -2.3064732551574707, -2.1775670051574707, -2.0486607551574707, -1.9197547435760498, -1.7908486127853394, -1.661942481994629, -1.5330363512039185, -1.404130220413208, -1.2752240896224976, -1.146317958831787, -1.0174118280410767, -0.8885056972503662, -0.7595995664596558, -0.6306934356689453, -0.5017873048782349, -0.3728811740875244, -0.24397504329681396, -0.11506891250610352, 0.013837218284606934, 0.14274334907531738, 0.27164947986602783, 0.4005556106567383, 0.5294617414474487, 0.6583678722381592, 0.7872740030288696, 0.9161801338195801, 1.0450862646102905, 1.173992395401001, 1.3028985261917114, 1.4318046569824219, 1.5607107877731323, 1.6896169185638428, 1.8185230493545532, 1.9474291801452637, 2.0763354301452637, 2.2052414417266846, 2.3341474533081055, 2.4630537033081055, 2.5919599533081055, 2.7208659648895264, 2.8497719764709473, 2.9786782264709473, 3.1075844764709473, 3.236490488052368, 3.365396499633789, 3.494302749633789]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 6.0, 2.0, 6.0, 6.0, 10.0, 6.0, 6.0, 11.0, 12.0, 10.0, 12.0, 22.0, 22.0, 23.0, 33.0, 31.0, 39.0, 30.0, 41.0, 42.0, 36.0, 50.0, 57.0, 56.0, 38.0, 42.0, 44.0, 44.0, 37.0, 41.0, 31.0, 32.0, 22.0, 21.0, 11.0, 16.0, 11.0, 10.0, 10.0, 3.0, 7.0, 3.0, 6.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.6720733642578125, -1.6205507516860962, -1.5690281391143799, -1.517505407333374, -1.4659827947616577, -1.4144601821899414, -1.3629374504089355, -1.3114148378372192, -1.259892225265503, -1.2083696126937866, -1.1568470001220703, -1.1053242683410645, -1.0538016557693481, -1.0022790431976318, -0.9507563710212708, -0.8992336988449097, -0.8477110862731934, -0.796188473701477, -0.744665801525116, -0.6931431293487549, -0.6416205167770386, -0.5900979042053223, -0.5385752320289612, -0.4870525896549225, -0.4355299472808838, -0.3840073049068451, -0.3324846625328064, -0.2809620201587677, -0.229439377784729, -0.1779167354106903, -0.1263940930366516, -0.07487145066261292, -0.02334892749786377, 0.028173714876174927, 0.07969635725021362, 0.13121899962425232, 0.18274164199829102, 0.2342642843723297, 0.2857869267463684, 0.3373095691204071, 0.3888322114944458, 0.4403548538684845, 0.4918774962425232, 0.5434001684188843, 0.5949227809906006, 0.6464453935623169, 0.697968065738678, 0.7494907379150391, 0.8010133504867554, 0.8525359630584717, 0.9040586352348328, 0.9555813074111938, 1.0071039199829102, 1.0586265325546265, 1.1101491451263428, 1.1616718769073486, 1.213194489479065, 1.2647171020507812, 1.316239833831787, 1.3677624464035034, 1.4192850589752197, 1.470807671546936, 1.5223302841186523, 1.5738530158996582, 1.6253756284713745]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 9.0, 6.0, 11.0, 21.0, 30.0, 48.0, 59.0, 100.0, 121.0, 204.0, 298.0, 508.0, 873.0, 1554.0, 3152.0, 7601.0, 21446.0, 113341.0, 3930628.0, 82936.0, 18202.0, 6651.0, 2937.0, 1349.0, 810.0, 476.0, 292.0, 194.0, 145.0, 84.0, 57.0, 35.0, 28.0, 21.0, 17.0, 10.0, 7.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.2470703125, -0.23945236206054688, -0.23183441162109375, -0.22421646118164062, -0.2165985107421875, -0.20898056030273438, -0.20136260986328125, -0.19374465942382812, -0.186126708984375, -0.17850875854492188, -0.17089080810546875, -0.16327285766601562, -0.1556549072265625, -0.14803695678710938, -0.14041900634765625, -0.13280105590820312, -0.12518310546875, -0.11756515502929688, -0.10994720458984375, -0.10232925415039062, -0.0947113037109375, -0.08709335327148438, -0.07947540283203125, -0.07185745239257812, -0.064239501953125, -0.056621551513671875, -0.04900360107421875, -0.041385650634765625, -0.0337677001953125, -0.026149749755859375, -0.01853179931640625, -0.010913848876953125, -0.0032958984375, 0.004322052001953125, 0.01194000244140625, 0.019557952880859375, 0.0271759033203125, 0.034793853759765625, 0.04241180419921875, 0.050029754638671875, 0.057647705078125, 0.06526565551757812, 0.07288360595703125, 0.08050155639648438, 0.0881195068359375, 0.09573745727539062, 0.10335540771484375, 0.11097335815429688, 0.11859130859375, 0.12620925903320312, 0.13382720947265625, 0.14144515991210938, 0.1490631103515625, 0.15668106079101562, 0.16429901123046875, 0.17191696166992188, 0.179534912109375, 0.18715286254882812, 0.19477081298828125, 0.20238876342773438, 0.2100067138671875, 0.21762466430664062, 0.22524261474609375, 0.23286056518554688, 0.240478515625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 12.0, 11.0, 16.0, 26.0, 33.0, 43.0, 38.0, 45.0, 77.0, 60.0, 72.0, 101.0, 87.0, 76.0, 66.0, 49.0, 54.0, 39.0, 26.0, 20.0, 20.0, 13.0, 11.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11700439453125, -0.11278057098388672, -0.10855674743652344, -0.10433292388916016, -0.10010910034179688, -0.0958852767944336, -0.09166145324707031, -0.08743762969970703, -0.08321380615234375, -0.07898998260498047, -0.07476615905761719, -0.0705423355102539, -0.06631851196289062, -0.062094688415527344, -0.05787086486816406, -0.05364704132080078, -0.0494232177734375, -0.04519939422607422, -0.04097557067871094, -0.036751747131347656, -0.032527923583984375, -0.028304100036621094, -0.024080276489257812, -0.01985645294189453, -0.01563262939453125, -0.011408805847167969, -0.0071849822998046875, -0.0029611587524414062, 0.001262664794921875, 0.005486488342285156, 0.009710311889648438, 0.013934135437011719, 0.018157958984375, 0.02238178253173828, 0.026605606079101562, 0.030829429626464844, 0.035053253173828125, 0.039277076721191406, 0.04350090026855469, 0.04772472381591797, 0.05194854736328125, 0.05617237091064453, 0.06039619445800781, 0.0646200180053711, 0.06884384155273438, 0.07306766510009766, 0.07729148864746094, 0.08151531219482422, 0.0857391357421875, 0.08996295928955078, 0.09418678283691406, 0.09841060638427734, 0.10263442993164062, 0.1068582534790039, 0.11108207702636719, 0.11530590057373047, 0.11952972412109375, 0.12375354766845703, 0.1279773712158203, 0.1322011947631836, 0.13642501831054688, 0.14064884185791016, 0.14487266540527344, 0.14909648895263672, 0.1533203125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 3.0, 5.0, 5.0, 8.0, 12.0, 10.0, 19.0, 32.0, 54.0, 69.0, 99.0, 191.0, 389.0, 815.0, 2070.0, 6190.0, 28363.0, 3180482.0, 939863.0, 26162.0, 5828.0, 1954.0, 751.0, 369.0, 184.0, 112.0, 81.0, 56.0, 36.0, 21.0, 9.0, 7.0, 8.0, 7.0, 8.0, 2.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.387451171875, -0.3745269775390625, -0.361602783203125, -0.3486785888671875, -0.33575439453125, -0.3228302001953125, -0.309906005859375, -0.2969818115234375, -0.2840576171875, -0.2711334228515625, -0.258209228515625, -0.2452850341796875, -0.23236083984375, -0.2194366455078125, -0.206512451171875, -0.1935882568359375, -0.1806640625, -0.1677398681640625, -0.154815673828125, -0.1418914794921875, -0.12896728515625, -0.1160430908203125, -0.103118896484375, -0.0901947021484375, -0.0772705078125, -0.0643463134765625, -0.051422119140625, -0.0384979248046875, -0.02557373046875, -0.0126495361328125, 0.000274658203125, 0.0131988525390625, 0.026123046875, 0.0390472412109375, 0.051971435546875, 0.0648956298828125, 0.07781982421875, 0.0907440185546875, 0.103668212890625, 0.1165924072265625, 0.1295166015625, 0.1424407958984375, 0.155364990234375, 0.1682891845703125, 0.18121337890625, 0.1941375732421875, 0.207061767578125, 0.2199859619140625, 0.23291015625, 0.2458343505859375, 0.258758544921875, 0.2716827392578125, 0.28460693359375, 0.2975311279296875, 0.310455322265625, 0.3233795166015625, 0.3363037109375, 0.3492279052734375, 0.362152099609375, 0.3750762939453125, 0.38800048828125, 0.4009246826171875, 0.413848876953125, 0.4267730712890625, 0.439697265625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 11.0, 11.0, 36.0, 47.0, 96.0, 340.0, 3104.0, 230.0, 86.0, 38.0, 23.0, 14.0, 7.0, 10.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13720703125, -0.13134384155273438, -0.12548065185546875, -0.11961746215820312, -0.1137542724609375, -0.10789108276367188, -0.10202789306640625, -0.09616470336914062, -0.090301513671875, -0.08443832397460938, -0.07857513427734375, -0.07271194458007812, -0.0668487548828125, -0.060985565185546875, -0.05512237548828125, -0.049259185791015625, -0.04339599609375, -0.037532806396484375, -0.03166961669921875, -0.025806427001953125, -0.0199432373046875, -0.014080047607421875, -0.00821685791015625, -0.002353668212890625, 0.003509521484375, 0.009372711181640625, 0.01523590087890625, 0.021099090576171875, 0.0269622802734375, 0.032825469970703125, 0.03868865966796875, 0.044551849365234375, 0.0504150390625, 0.056278228759765625, 0.06214141845703125, 0.06800460815429688, 0.0738677978515625, 0.07973098754882812, 0.08559417724609375, 0.09145736694335938, 0.097320556640625, 0.10318374633789062, 0.10904693603515625, 0.11491012573242188, 0.1207733154296875, 0.12663650512695312, 0.13249969482421875, 0.13836288452148438, 0.14422607421875, 0.15008926391601562, 0.15595245361328125, 0.16181564331054688, 0.1676788330078125, 0.17354202270507812, 0.17940521240234375, 0.18526840209960938, 0.191131591796875, 0.19699478149414062, 0.20285797119140625, 0.20872116088867188, 0.2145843505859375, 0.22044754028320312, 0.22631072998046875, 0.23217391967773438, 0.238037109375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 5.0, 8.0, 15.0, 27.0, 29.0, 56.0, 87.0, 111.0, 128.0, 118.0, 108.0, 106.0, 73.0, 50.0, 23.0, 20.0, 11.0, 9.0, 0.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50335693359375, -0.4859715402126312, -0.46858614683151245, -0.4512007236480713, -0.4338153302669525, -0.41642993688583374, -0.3990445137023926, -0.3816591203212738, -0.36427372694015503, -0.34688833355903625, -0.3295029401779175, -0.3121175169944763, -0.29473212361335754, -0.27734673023223877, -0.2599613070487976, -0.24257591366767883, -0.22519052028656006, -0.20780512690544128, -0.19041971862316132, -0.17303431034088135, -0.15564891695976257, -0.1382635235786438, -0.12087811529636383, -0.10349271446466446, -0.08610731363296509, -0.06872191280126572, -0.051336511969566345, -0.033951111137866974, -0.016565710306167603, 0.0008196905255317688, 0.01820509135723114, 0.03559049218893051, 0.05297589302062988, 0.07036129385232925, 0.08774669468402863, 0.105132095515728, 0.12251749634742737, 0.13990288972854614, 0.1572882980108261, 0.17467370629310608, 0.19205909967422485, 0.20944449305534363, 0.2268299013376236, 0.24421530961990356, 0.26160070300102234, 0.2789860963821411, 0.2963715195655823, 0.31375691294670105, 0.3311423063278198, 0.3485276997089386, 0.3659130930900574, 0.38329851627349854, 0.4006839096546173, 0.4180693030357361, 0.43545472621917725, 0.452840119600296, 0.4702255129814148, 0.48761090636253357, 0.5049962997436523, 0.5223817229270935, 0.5397671461105347, 0.557152509689331, 0.5745379328727722, 0.5919232964515686, 0.6093087196350098]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 7.0, 6.0, 9.0, 17.0, 11.0, 13.0, 23.0, 19.0, 26.0, 21.0, 26.0, 25.0, 35.0, 23.0, 38.0, 46.0, 45.0, 51.0, 54.0, 47.0, 38.0, 33.0, 35.0, 46.0, 51.0, 24.0, 34.0, 27.0, 33.0, 25.0, 17.0, 22.0, 9.0, 12.0, 12.0, 6.0, 4.0, 2.0, 4.0, 8.0, 2.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.3324315547943115, -0.3221175968647003, -0.3118036091327667, -0.3014896512031555, -0.2911756634712219, -0.2808617055416107, -0.2705477476119995, -0.2602337598800659, -0.2499198019504547, -0.2396058291196823, -0.2292918562889099, -0.2189778983592987, -0.2086639255285263, -0.1983499526977539, -0.1880359947681427, -0.1777220219373703, -0.1674080491065979, -0.1570940762758255, -0.1467801034450531, -0.1364661455154419, -0.1261521726846695, -0.1158381998538971, -0.10552423447370529, -0.09521026909351349, -0.08489629626274109, -0.07458232343196869, -0.06426835805177689, -0.053954388946294785, -0.04364041984081268, -0.03332645073533058, -0.02301248162984848, -0.012698516249656677, -0.0023845434188842773, 0.007929425686597824, 0.018243394792079926, 0.028557363897562027, 0.03887133300304413, 0.04918530210852623, 0.05949927121400833, 0.06981323659420013, 0.08012720942497253, 0.09044118225574493, 0.10075514763593674, 0.11106911301612854, 0.12138308584690094, 0.13169705867767334, 0.14201101660728455, 0.15232498943805695, 0.16263896226882935, 0.17295293509960175, 0.18326690793037415, 0.19358086585998535, 0.20389483869075775, 0.21420881152153015, 0.22452276945114136, 0.23483674228191376, 0.24515071511268616, 0.25546467304229736, 0.26577866077423096, 0.27609261870384216, 0.28640657663345337, 0.29672056436538696, 0.30703452229499817, 0.3173484802246094, 0.32766246795654297]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 9.0, 3.0, 10.0, 12.0, 23.0, 46.0, 79.0, 157.0, 326.0, 625.0, 1426.0, 3095.0, 7590.0, 18833.0, 50797.0, 143126.0, 394424.0, 276435.0, 94565.0, 34399.0, 13123.0, 5187.0, 2244.0, 1022.0, 529.0, 226.0, 124.0, 48.0, 29.0, 15.0, 15.0, 10.0, 4.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.263671875, -0.25720977783203125, -0.2507476806640625, -0.24428558349609375, -0.237823486328125, -0.23136138916015625, -0.2248992919921875, -0.21843719482421875, -0.21197509765625, -0.20551300048828125, -0.1990509033203125, -0.19258880615234375, -0.186126708984375, -0.17966461181640625, -0.1732025146484375, -0.16674041748046875, -0.1602783203125, -0.15381622314453125, -0.1473541259765625, -0.14089202880859375, -0.134429931640625, -0.12796783447265625, -0.1215057373046875, -0.11504364013671875, -0.10858154296875, -0.10211944580078125, -0.0956573486328125, -0.08919525146484375, -0.082733154296875, -0.07627105712890625, -0.0698089599609375, -0.06334686279296875, -0.056884765625, -0.05042266845703125, -0.0439605712890625, -0.03749847412109375, -0.031036376953125, -0.02457427978515625, -0.0181121826171875, -0.01165008544921875, -0.00518798828125, 0.00127410888671875, 0.0077362060546875, 0.01419830322265625, 0.020660400390625, 0.02712249755859375, 0.0335845947265625, 0.04004669189453125, 0.0465087890625, 0.05297088623046875, 0.0594329833984375, 0.06589508056640625, 0.072357177734375, 0.07881927490234375, 0.0852813720703125, 0.09174346923828125, 0.09820556640625, 0.10466766357421875, 0.1111297607421875, 0.11759185791015625, 0.124053955078125, 0.13051605224609375, 0.1369781494140625, 0.14344024658203125, 0.14990234375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 11.0, 14.0, 19.0, 18.0, 26.0, 34.0, 39.0, 53.0, 50.0, 64.0, 72.0, 83.0, 71.0, 61.0, 80.0, 60.0, 54.0, 45.0, 35.0, 27.0, 24.0, 19.0, 10.0, 15.0, 9.0, 3.0, 5.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1280517578125, -0.12396621704101562, -0.11988067626953125, -0.11579513549804688, -0.1117095947265625, -0.10762405395507812, -0.10353851318359375, -0.09945297241210938, -0.095367431640625, -0.09128189086914062, -0.08719635009765625, -0.08311080932617188, -0.0790252685546875, -0.07493972778320312, -0.07085418701171875, -0.06676864624023438, -0.06268310546875, -0.058597564697265625, -0.05451202392578125, -0.050426483154296875, -0.0463409423828125, -0.042255401611328125, -0.03816986083984375, -0.034084320068359375, -0.029998779296875, -0.025913238525390625, -0.02182769775390625, -0.017742156982421875, -0.0136566162109375, -0.009571075439453125, -0.00548553466796875, -0.001399993896484375, 0.002685546875, 0.006771087646484375, 0.01085662841796875, 0.014942169189453125, 0.0190277099609375, 0.023113250732421875, 0.02719879150390625, 0.031284332275390625, 0.035369873046875, 0.039455413818359375, 0.04354095458984375, 0.047626495361328125, 0.0517120361328125, 0.055797576904296875, 0.05988311767578125, 0.06396865844726562, 0.06805419921875, 0.07213973999023438, 0.07622528076171875, 0.08031082153320312, 0.0843963623046875, 0.08848190307617188, 0.09256744384765625, 0.09665298461914062, 0.100738525390625, 0.10482406616210938, 0.10890960693359375, 0.11299514770507812, 0.1170806884765625, 0.12116622924804688, 0.12525177001953125, 0.12933731079101562, 0.1334228515625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 3.0, 10.0, 9.0, 19.0, 11.0, 16.0, 37.0, 57.0, 62.0, 105.0, 137.0, 211.0, 305.0, 480.0, 859.0, 1539.0, 3911.0, 18709.0, 204055.0, 728413.0, 74223.0, 9607.0, 2685.0, 1181.0, 643.0, 412.0, 277.0, 167.0, 118.0, 101.0, 59.0, 43.0, 27.0, 24.0, 14.0, 9.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.427978515625, -0.41550445556640625, -0.4030303955078125, -0.39055633544921875, -0.378082275390625, -0.36560821533203125, -0.3531341552734375, -0.34066009521484375, -0.32818603515625, -0.31571197509765625, -0.3032379150390625, -0.29076385498046875, -0.278289794921875, -0.26581573486328125, -0.2533416748046875, -0.24086761474609375, -0.2283935546875, -0.21591949462890625, -0.2034454345703125, -0.19097137451171875, -0.178497314453125, -0.16602325439453125, -0.1535491943359375, -0.14107513427734375, -0.12860107421875, -0.11612701416015625, -0.1036529541015625, -0.09117889404296875, -0.078704833984375, -0.06623077392578125, -0.0537567138671875, -0.04128265380859375, -0.02880859375, -0.01633453369140625, -0.0038604736328125, 0.00861358642578125, 0.021087646484375, 0.03356170654296875, 0.0460357666015625, 0.05850982666015625, 0.07098388671875, 0.08345794677734375, 0.0959320068359375, 0.10840606689453125, 0.120880126953125, 0.13335418701171875, 0.1458282470703125, 0.15830230712890625, 0.1707763671875, 0.18325042724609375, 0.1957244873046875, 0.20819854736328125, 0.220672607421875, 0.23314666748046875, 0.2456207275390625, 0.25809478759765625, 0.27056884765625, 0.28304290771484375, 0.2955169677734375, 0.30799102783203125, 0.320465087890625, 0.33293914794921875, 0.3454132080078125, 0.35788726806640625, 0.370361328125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 2.0, 9.0, 10.0, 15.0, 7.0, 13.0, 22.0, 21.0, 16.0, 24.0, 32.0, 24.0, 33.0, 35.0, 28.0, 29.0, 50.0, 48.0, 48.0, 39.0, 39.0, 39.0, 39.0, 49.0, 42.0, 31.0, 40.0, 29.0, 30.0, 32.0, 18.0, 22.0, 17.0, 16.0, 18.0, 11.0, 8.0, 5.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35888671875, -0.347564697265625, -0.33624267578125, -0.324920654296875, -0.3135986328125, -0.302276611328125, -0.29095458984375, -0.279632568359375, -0.268310546875, -0.256988525390625, -0.24566650390625, -0.234344482421875, -0.2230224609375, -0.211700439453125, -0.20037841796875, -0.189056396484375, -0.177734375, -0.166412353515625, -0.15509033203125, -0.143768310546875, -0.1324462890625, -0.121124267578125, -0.10980224609375, -0.098480224609375, -0.087158203125, -0.075836181640625, -0.06451416015625, -0.053192138671875, -0.0418701171875, -0.030548095703125, -0.01922607421875, -0.007904052734375, 0.00341796875, 0.014739990234375, 0.02606201171875, 0.037384033203125, 0.0487060546875, 0.060028076171875, 0.07135009765625, 0.082672119140625, 0.093994140625, 0.105316162109375, 0.11663818359375, 0.127960205078125, 0.1392822265625, 0.150604248046875, 0.16192626953125, 0.173248291015625, 0.1845703125, 0.195892333984375, 0.20721435546875, 0.218536376953125, 0.2298583984375, 0.241180419921875, 0.25250244140625, 0.263824462890625, 0.275146484375, 0.286468505859375, 0.29779052734375, 0.309112548828125, 0.3204345703125, 0.331756591796875, 0.34307861328125, 0.354400634765625, 0.36572265625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 5.0, 9.0, 15.0, 18.0, 29.0, 34.0, 52.0, 108.0, 235.0, 635.0, 2560.0, 25808.0, 916543.0, 96042.0, 4869.0, 937.0, 329.0, 118.0, 76.0, 46.0, 25.0, 17.0, 14.0, 8.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3466796875, -0.3363838195800781, -0.32608795166015625, -0.3157920837402344, -0.3054962158203125, -0.2952003479003906, -0.28490447998046875, -0.2746086120605469, -0.264312744140625, -0.2540168762207031, -0.24372100830078125, -0.23342514038085938, -0.2231292724609375, -0.21283340454101562, -0.20253753662109375, -0.19224166870117188, -0.18194580078125, -0.17164993286132812, -0.16135406494140625, -0.15105819702148438, -0.1407623291015625, -0.13046646118164062, -0.12017059326171875, -0.10987472534179688, -0.099578857421875, -0.08928298950195312, -0.07898712158203125, -0.06869125366210938, -0.0583953857421875, -0.048099517822265625, -0.03780364990234375, -0.027507781982421875, -0.0172119140625, -0.006916046142578125, 0.00337982177734375, 0.013675689697265625, 0.0239715576171875, 0.034267425537109375, 0.04456329345703125, 0.054859161376953125, 0.065155029296875, 0.07545089721679688, 0.08574676513671875, 0.09604263305664062, 0.1063385009765625, 0.11663436889648438, 0.12693023681640625, 0.13722610473632812, 0.14752197265625, 0.15781784057617188, 0.16811370849609375, 0.17840957641601562, 0.1887054443359375, 0.19900131225585938, 0.20929718017578125, 0.21959304809570312, 0.229888916015625, 0.24018478393554688, 0.25048065185546875, 0.2607765197753906, 0.2710723876953125, 0.2813682556152344, 0.29166412353515625, 0.3019599914550781, 0.312255859375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 11.0, 6.0, 11.0, 11.0, 10.0, 30.0, 32.0, 45.0, 70.0, 80.0, 98.0, 148.0, 117.0, 81.0, 49.0, 61.0, 43.0, 37.0, 19.0, 11.0, 11.0, 6.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.771087646484375e-05, -6.49699941277504e-05, -6.222911179065704e-05, -5.948822945356369e-05, -5.674734711647034e-05, -5.4006464779376984e-05, -5.126558244228363e-05, -4.852470010519028e-05, -4.5783817768096924e-05, -4.304293543100357e-05, -4.030205309391022e-05, -3.7561170756816864e-05, -3.482028841972351e-05, -3.207940608263016e-05, -2.9338523745536804e-05, -2.659764140844345e-05, -2.3856759071350098e-05, -2.1115876734256744e-05, -1.837499439716339e-05, -1.5634112060070038e-05, -1.2893229722976685e-05, -1.0152347385883331e-05, -7.411465048789978e-06, -4.670582711696625e-06, -1.9297003746032715e-06, 8.111819624900818e-07, 3.552064299583435e-06, 6.292946636676788e-06, 9.033828973770142e-06, 1.1774711310863495e-05, 1.4515593647956848e-05, 1.72564759850502e-05, 1.9997358322143555e-05, 2.2738240659236908e-05, 2.547912299633026e-05, 2.8220005333423615e-05, 3.096088767051697e-05, 3.370177000761032e-05, 3.6442652344703674e-05, 3.918353468179703e-05, 4.192441701889038e-05, 4.4665299355983734e-05, 4.740618169307709e-05, 5.014706403017044e-05, 5.2887946367263794e-05, 5.562882870435715e-05, 5.83697110414505e-05, 6.111059337854385e-05, 6.385147571563721e-05, 6.659235805273056e-05, 6.933324038982391e-05, 7.207412272691727e-05, 7.481500506401062e-05, 7.755588740110397e-05, 8.029676973819733e-05, 8.303765207529068e-05, 8.577853441238403e-05, 8.851941674947739e-05, 9.126029908657074e-05, 9.400118142366409e-05, 9.674206376075745e-05, 9.94829460978508e-05, 0.00010222382843494415, 0.0001049647107720375, 0.00010770559310913086]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 3.0, 12.0, 21.0, 20.0, 24.0, 34.0, 70.0, 120.0, 204.0, 481.0, 1207.0, 3602.0, 22854.0, 941406.0, 70124.0, 5499.0, 1584.0, 607.0, 250.0, 153.0, 101.0, 62.0, 36.0, 18.0, 15.0, 12.0, 6.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.352783203125, -0.3408851623535156, -0.32898712158203125, -0.3170890808105469, -0.3051910400390625, -0.2932929992675781, -0.28139495849609375, -0.2694969177246094, -0.257598876953125, -0.24570083618164062, -0.23380279541015625, -0.22190475463867188, -0.2100067138671875, -0.19810867309570312, -0.18621063232421875, -0.17431259155273438, -0.16241455078125, -0.15051651000976562, -0.13861846923828125, -0.12672042846679688, -0.1148223876953125, -0.10292434692382812, -0.09102630615234375, -0.07912826538085938, -0.067230224609375, -0.055332183837890625, -0.04343414306640625, -0.031536102294921875, -0.0196380615234375, -0.007740020751953125, 0.00415802001953125, 0.016056060791015625, 0.0279541015625, 0.039852142333984375, 0.05175018310546875, 0.06364822387695312, 0.0755462646484375, 0.08744430541992188, 0.09934234619140625, 0.11124038696289062, 0.123138427734375, 0.13503646850585938, 0.14693450927734375, 0.15883255004882812, 0.1707305908203125, 0.18262863159179688, 0.19452667236328125, 0.20642471313476562, 0.21832275390625, 0.23022079467773438, 0.24211883544921875, 0.2540168762207031, 0.2659149169921875, 0.2778129577636719, 0.28971099853515625, 0.3016090393066406, 0.313507080078125, 0.3254051208496094, 0.33730316162109375, 0.3492012023925781, 0.3610992431640625, 0.3729972839355469, 0.38489532470703125, 0.3967933654785156, 0.40869140625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 7.0, 17.0, 26.0, 21.0, 53.0, 65.0, 110.0, 155.0, 134.0, 135.0, 77.0, 53.0, 35.0, 32.0, 24.0, 11.0, 9.0, 2.0, 3.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.232421875, -0.22618865966796875, -0.2199554443359375, -0.21372222900390625, -0.207489013671875, -0.20125579833984375, -0.1950225830078125, -0.18878936767578125, -0.18255615234375, -0.17632293701171875, -0.1700897216796875, -0.16385650634765625, -0.157623291015625, -0.15139007568359375, -0.1451568603515625, -0.13892364501953125, -0.1326904296875, -0.12645721435546875, -0.1202239990234375, -0.11399078369140625, -0.107757568359375, -0.10152435302734375, -0.0952911376953125, -0.08905792236328125, -0.08282470703125, -0.07659149169921875, -0.0703582763671875, -0.06412506103515625, -0.057891845703125, -0.05165863037109375, -0.0454254150390625, -0.03919219970703125, -0.032958984375, -0.02672576904296875, -0.0204925537109375, -0.01425933837890625, -0.008026123046875, -0.00179290771484375, 0.0044403076171875, 0.01067352294921875, 0.01690673828125, 0.02313995361328125, 0.0293731689453125, 0.03560638427734375, 0.041839599609375, 0.04807281494140625, 0.0543060302734375, 0.06053924560546875, 0.0667724609375, 0.07300567626953125, 0.0792388916015625, 0.08547210693359375, 0.091705322265625, 0.09793853759765625, 0.1041717529296875, 0.11040496826171875, 0.11663818359375, 0.12287139892578125, 0.1291046142578125, 0.13533782958984375, 0.141571044921875, 0.14780426025390625, 0.1540374755859375, 0.16027069091796875, 0.16650390625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 16.0, 55.0, 129.0, 248.0, 291.0, 156.0, 55.0, 28.0, 9.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.76110315322876, -4.603743553161621, -4.446383953094482, -4.289024353027344, -4.131664276123047, -3.9743049144744873, -3.8169450759887695, -3.659585475921631, -3.502225875854492, -3.3448662757873535, -3.187506675720215, -3.030146837234497, -2.8727872371673584, -2.7154276371002197, -2.558067798614502, -2.4007081985473633, -2.2433485984802246, -2.085988998413086, -1.9286292791366577, -1.7712695598602295, -1.6139099597930908, -1.4565503597259521, -1.299190640449524, -1.1418309211730957, -0.984471321105957, -0.8271116614341736, -0.6697520017623901, -0.5123923420906067, -0.35503268241882324, -0.1976730227470398, -0.04031336307525635, 0.11704635620117188, 0.27440643310546875, 0.4317660927772522, 0.5891257524490356, 0.7464854121208191, 0.9038450717926025, 1.0612046718597412, 1.2185643911361694, 1.3759241104125977, 1.5332837104797363, 1.690643310546875, 1.8480030298233032, 2.0053627490997314, 2.16272234916687, 2.320081949234009, 2.4774417877197266, 2.6348013877868652, 2.792160987854004, 2.9495205879211426, 3.1068801879882812, 3.264240026473999, 3.4215996265411377, 3.5789592266082764, 3.736319065093994, 3.893678665161133, 4.0510382652282715, 4.20839786529541, 4.365757465362549, 4.5231170654296875, 4.680477142333984, 4.837836742401123, 4.995196342468262, 5.1525559425354, 5.309915542602539]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 7.0, 8.0, 10.0, 20.0, 29.0, 29.0, 34.0, 42.0, 49.0, 53.0, 78.0, 74.0, 73.0, 77.0, 71.0, 68.0, 53.0, 54.0, 40.0, 29.0, 36.0, 16.0, 16.0, 15.0, 6.0, 8.0, 5.0, 1.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.288053035736084, -3.205904245376587, -3.12375545501709, -3.041606903076172, -2.959458112716675, -2.8773093223571777, -2.7951605319976807, -2.7130117416381836, -2.6308631896972656, -2.5487143993377686, -2.4665656089782715, -2.3844170570373535, -2.3022682666778564, -2.2201194763183594, -2.1379706859588623, -2.0558218955993652, -1.9736732244491577, -1.8915244340896606, -1.8093757629394531, -1.727226972579956, -1.6450783014297485, -1.5629295110702515, -1.480780839920044, -1.3986320495605469, -1.3164832592010498, -1.2343344688415527, -1.1521857976913452, -1.0700370073318481, -0.9878883361816406, -0.9057395458221436, -0.8235908150672913, -0.741442084312439, -0.659293532371521, -0.5771448016166687, -0.4949960708618164, -0.4128473103046417, -0.33069857954978943, -0.24854984879493713, -0.16640108823776245, -0.08425235748291016, -0.0021036267280578613, 0.08004511147737503, 0.16219384968280792, 0.2443425953388214, 0.3264913260936737, 0.408640056848526, 0.4907888174057007, 0.572937548160553, 0.6550862789154053, 0.7372350096702576, 0.8193837404251099, 0.9015325307846069, 0.9836812019348145, 1.0658299922943115, 1.1479787826538086, 1.2301274538040161, 1.3122761249542236, 1.3944249153137207, 1.4765735864639282, 1.5587223768234253, 1.6408710479736328, 1.7230198383331299, 1.805168628692627, 1.8873172998428345, 1.9694660902023315]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 6.0, 9.0, 12.0, 21.0, 24.0, 30.0, 62.0, 78.0, 156.0, 245.0, 487.0, 973.0, 2496.0, 6884.0, 25389.0, 185405.0, 3384620.0, 525793.0, 45478.0, 10579.0, 3216.0, 1193.0, 544.0, 249.0, 122.0, 81.0, 51.0, 30.0, 19.0, 4.0, 15.0, 6.0, 6.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.3515625, -0.3431243896484375, -0.334686279296875, -0.3262481689453125, -0.31781005859375, -0.3093719482421875, -0.300933837890625, -0.2924957275390625, -0.2840576171875, -0.2756195068359375, -0.267181396484375, -0.2587432861328125, -0.25030517578125, -0.2418670654296875, -0.233428955078125, -0.2249908447265625, -0.216552734375, -0.2081146240234375, -0.199676513671875, -0.1912384033203125, -0.18280029296875, -0.1743621826171875, -0.165924072265625, -0.1574859619140625, -0.1490478515625, -0.1406097412109375, -0.132171630859375, -0.1237335205078125, -0.11529541015625, -0.1068572998046875, -0.098419189453125, -0.0899810791015625, -0.08154296875, -0.0731048583984375, -0.064666748046875, -0.0562286376953125, -0.04779052734375, -0.0393524169921875, -0.030914306640625, -0.0224761962890625, -0.0140380859375, -0.0055999755859375, 0.002838134765625, 0.0112762451171875, 0.01971435546875, 0.0281524658203125, 0.036590576171875, 0.0450286865234375, 0.053466796875, 0.0619049072265625, 0.070343017578125, 0.0787811279296875, 0.08721923828125, 0.0956573486328125, 0.104095458984375, 0.1125335693359375, 0.1209716796875, 0.1294097900390625, 0.137847900390625, 0.1462860107421875, 0.15472412109375, 0.1631622314453125, 0.171600341796875, 0.1800384521484375, 0.1884765625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 8.0, 8.0, 10.0, 17.0, 22.0, 17.0, 19.0, 38.0, 46.0, 43.0, 51.0, 60.0, 68.0, 65.0, 79.0, 62.0, 79.0, 65.0, 51.0, 42.0, 35.0, 25.0, 28.0, 19.0, 10.0, 15.0, 7.0, 7.0, 4.0, 1.0, 1.0, 4.0, 1.0, 4.0], "bins": [-0.162109375, -0.15844154357910156, -0.15477371215820312, -0.1511058807373047, -0.14743804931640625, -0.1437702178955078, -0.14010238647460938, -0.13643455505371094, -0.1327667236328125, -0.12909889221191406, -0.12543106079101562, -0.12176322937011719, -0.11809539794921875, -0.11442756652832031, -0.11075973510742188, -0.10709190368652344, -0.103424072265625, -0.09975624084472656, -0.09608840942382812, -0.09242057800292969, -0.08875274658203125, -0.08508491516113281, -0.08141708374023438, -0.07774925231933594, -0.0740814208984375, -0.07041358947753906, -0.06674575805664062, -0.06307792663574219, -0.05941009521484375, -0.05574226379394531, -0.052074432373046875, -0.04840660095214844, -0.04473876953125, -0.04107093811035156, -0.037403106689453125, -0.03373527526855469, -0.03006744384765625, -0.026399612426757812, -0.022731781005859375, -0.019063949584960938, -0.0153961181640625, -0.011728286743164062, -0.008060455322265625, -0.0043926239013671875, -0.00072479248046875, 0.0029430389404296875, 0.006610870361328125, 0.010278701782226562, 0.013946533203125, 0.017614364624023438, 0.021282196044921875, 0.024950027465820312, 0.02861785888671875, 0.03228569030761719, 0.035953521728515625, 0.03962135314941406, 0.0432891845703125, 0.04695701599121094, 0.050624847412109375, 0.05429267883300781, 0.05796051025390625, 0.06162834167480469, 0.06529617309570312, 0.06896400451660156, 0.0726318359375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 7.0, 8.0, 22.0, 31.0, 56.0, 122.0, 254.0, 708.0, 2532.0, 23748.0, 3616216.0, 537595.0, 10454.0, 1635.0, 491.0, 191.0, 93.0, 47.0, 20.0, 15.0, 11.0, 11.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6298828125, -0.609466552734375, -0.58905029296875, -0.568634033203125, -0.5482177734375, -0.527801513671875, -0.50738525390625, -0.486968994140625, -0.466552734375, -0.446136474609375, -0.42572021484375, -0.405303955078125, -0.3848876953125, -0.364471435546875, -0.34405517578125, -0.323638916015625, -0.30322265625, -0.282806396484375, -0.26239013671875, -0.241973876953125, -0.2215576171875, -0.201141357421875, -0.18072509765625, -0.160308837890625, -0.139892578125, -0.119476318359375, -0.09906005859375, -0.078643798828125, -0.0582275390625, -0.037811279296875, -0.01739501953125, 0.003021240234375, 0.0234375, 0.043853759765625, 0.06427001953125, 0.084686279296875, 0.1051025390625, 0.125518798828125, 0.14593505859375, 0.166351318359375, 0.186767578125, 0.207183837890625, 0.22760009765625, 0.248016357421875, 0.2684326171875, 0.288848876953125, 0.30926513671875, 0.329681396484375, 0.35009765625, 0.370513916015625, 0.39093017578125, 0.411346435546875, 0.4317626953125, 0.452178955078125, 0.47259521484375, 0.493011474609375, 0.513427734375, 0.533843994140625, 0.55426025390625, 0.574676513671875, 0.5950927734375, 0.615509033203125, 0.63592529296875, 0.656341552734375, 0.6767578125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 7.0, 10.0, 10.0, 10.0, 13.0, 29.0, 64.0, 87.0, 185.0, 456.0, 1229.0, 1124.0, 405.0, 197.0, 108.0, 49.0, 27.0, 21.0, 14.0, 11.0, 7.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43115234375, -0.4180755615234375, -0.404998779296875, -0.3919219970703125, -0.37884521484375, -0.3657684326171875, -0.352691650390625, -0.3396148681640625, -0.3265380859375, -0.3134613037109375, -0.300384521484375, -0.2873077392578125, -0.27423095703125, -0.2611541748046875, -0.248077392578125, -0.2350006103515625, -0.221923828125, -0.2088470458984375, -0.195770263671875, -0.1826934814453125, -0.16961669921875, -0.1565399169921875, -0.143463134765625, -0.1303863525390625, -0.1173095703125, -0.1042327880859375, -0.091156005859375, -0.0780792236328125, -0.06500244140625, -0.0519256591796875, -0.038848876953125, -0.0257720947265625, -0.0126953125, 0.0003814697265625, 0.013458251953125, 0.0265350341796875, 0.03961181640625, 0.0526885986328125, 0.065765380859375, 0.0788421630859375, 0.0919189453125, 0.1049957275390625, 0.118072509765625, 0.1311492919921875, 0.14422607421875, 0.1573028564453125, 0.170379638671875, 0.1834564208984375, 0.196533203125, 0.2096099853515625, 0.222686767578125, 0.2357635498046875, 0.24884033203125, 0.2619171142578125, 0.274993896484375, 0.2880706787109375, 0.3011474609375, 0.3142242431640625, 0.327301025390625, 0.3403778076171875, 0.35345458984375, 0.3665313720703125, 0.379608154296875, 0.3926849365234375, 0.40576171875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 8.0, 8.0, 8.0, 15.0, 40.0, 83.0, 185.0, 225.0, 202.0, 118.0, 54.0, 24.0, 10.0, 10.0, 3.0, 3.0, 6.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4501988887786865, -3.3506782054901123, -3.251157522201538, -3.151636838912964, -3.0521161556243896, -2.9525954723358154, -2.853074789047241, -2.753554105758667, -2.6540334224700928, -2.5545127391815186, -2.4549920558929443, -2.35547137260437, -2.255950689315796, -2.1564300060272217, -2.0569093227386475, -1.9573886394500732, -1.857867956161499, -1.7583472728729248, -1.6588265895843506, -1.5593059062957764, -1.4597852230072021, -1.360264539718628, -1.2607438564300537, -1.1612231731414795, -1.0617024898529053, -0.962181806564331, -0.8626611232757568, -0.7631404399871826, -0.6636197566986084, -0.5640990734100342, -0.46457839012145996, -0.36505770683288574, -0.2655370235443115, -0.1660163402557373, -0.06649565696716309, 0.03302502632141113, 0.13254570960998535, 0.23206639289855957, 0.3315870761871338, 0.431107759475708, 0.5306284427642822, 0.6301491260528564, 0.7296698093414307, 0.8291904926300049, 0.9287111759185791, 1.0282318592071533, 1.1277525424957275, 1.2272732257843018, 1.326793909072876, 1.4263145923614502, 1.5258352756500244, 1.6253559589385986, 1.7248766422271729, 1.824397325515747, 1.9239180088043213, 2.0234386920928955, 2.1229593753814697, 2.222480058670044, 2.322000741958618, 2.4215214252471924, 2.5210421085357666, 2.620562791824341, 2.720083475112915, 2.8196041584014893, 2.9191248416900635]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 9.0, 10.0, 7.0, 7.0, 9.0, 15.0, 17.0, 36.0, 32.0, 34.0, 31.0, 41.0, 57.0, 56.0, 63.0, 67.0, 71.0, 61.0, 61.0, 55.0, 49.0, 36.0, 32.0, 29.0, 33.0, 28.0, 13.0, 13.0, 10.0, 7.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9883368015289307, -1.9346591234207153, -1.8809813261032104, -1.8273036479949951, -1.7736259698867798, -1.719948172569275, -1.6662704944610596, -1.6125926971435547, -1.5589150190353394, -1.505237340927124, -1.4515595436096191, -1.3978818655014038, -1.3442041873931885, -1.2905263900756836, -1.2368487119674683, -1.183171033859253, -1.129493236541748, -1.0758155584335327, -1.0221377611160278, -0.9684600830078125, -0.9147823452949524, -0.8611046075820923, -0.807426929473877, -0.7537491917610168, -0.7000715732574463, -0.6463938355445862, -0.5927161574363708, -0.5390384197235107, -0.48536068201065063, -0.4316829741001129, -0.3780052661895752, -0.3243275284767151, -0.270649790763855, -0.21697206795215607, -0.16329434514045715, -0.10961663722991943, -0.05593891441822052, -0.0022611916065216064, 0.05141651630401611, 0.10509425401687622, 0.15877196192741394, 0.21244968473911285, 0.26612740755081177, 0.3198051154613495, 0.3734828233718872, 0.4271605610847473, 0.48083826899528503, 0.5345159769058228, 0.5881937146186829, 0.641871452331543, 0.6955491304397583, 0.7492268681526184, 0.8029046058654785, 0.8565822839736938, 0.910260021686554, 0.9639377593994141, 1.0176154375076294, 1.0712931156158447, 1.1249709129333496, 1.178648591041565, 1.2323262691497803, 1.2860040664672852, 1.3396817445755005, 1.3933594226837158, 1.4470372200012207]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 9.0, 6.0, 12.0, 27.0, 30.0, 54.0, 70.0, 114.0, 178.0, 338.0, 580.0, 989.0, 1851.0, 3574.0, 7085.0, 15543.0, 36808.0, 101928.0, 397620.0, 334409.0, 87309.0, 32631.0, 13888.0, 6356.0, 3198.0, 1658.0, 968.0, 514.0, 318.0, 192.0, 122.0, 59.0, 37.0, 19.0, 15.0, 10.0, 8.0, 9.0, 8.0, 3.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.227783203125, -0.22041893005371094, -0.21305465698242188, -0.2056903839111328, -0.19832611083984375, -0.1909618377685547, -0.18359756469726562, -0.17623329162597656, -0.1688690185546875, -0.16150474548339844, -0.15414047241210938, -0.1467761993408203, -0.13941192626953125, -0.1320476531982422, -0.12468338012695312, -0.11731910705566406, -0.109954833984375, -0.10259056091308594, -0.09522628784179688, -0.08786201477050781, -0.08049774169921875, -0.07313346862792969, -0.06576919555664062, -0.05840492248535156, -0.0510406494140625, -0.04367637634277344, -0.036312103271484375, -0.028947830200195312, -0.02158355712890625, -0.014219284057617188, -0.006855010986328125, 0.0005092620849609375, 0.00787353515625, 0.015237808227539062, 0.022602081298828125, 0.029966354370117188, 0.03733062744140625, 0.04469490051269531, 0.052059173583984375, 0.05942344665527344, 0.0667877197265625, 0.07415199279785156, 0.08151626586914062, 0.08888053894042969, 0.09624481201171875, 0.10360908508300781, 0.11097335815429688, 0.11833763122558594, 0.125701904296875, 0.13306617736816406, 0.14043045043945312, 0.1477947235107422, 0.15515899658203125, 0.1625232696533203, 0.16988754272460938, 0.17725181579589844, 0.1846160888671875, 0.19198036193847656, 0.19934463500976562, 0.2067089080810547, 0.21407318115234375, 0.2214374542236328, 0.22880172729492188, 0.23616600036621094, 0.2435302734375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 8.0, 5.0, 7.0, 5.0, 11.0, 18.0, 17.0, 23.0, 26.0, 43.0, 37.0, 40.0, 47.0, 37.0, 51.0, 65.0, 65.0, 62.0, 71.0, 67.0, 49.0, 48.0, 47.0, 28.0, 27.0, 22.0, 19.0, 17.0, 16.0, 9.0, 5.0, 6.0, 3.0, 5.0, 0.0, 1.0, 0.0, 3.0, 3.0], "bins": [-0.1446533203125, -0.1411733627319336, -0.1376934051513672, -0.13421344757080078, -0.13073348999023438, -0.12725353240966797, -0.12377357482910156, -0.12029361724853516, -0.11681365966796875, -0.11333370208740234, -0.10985374450683594, -0.10637378692626953, -0.10289382934570312, -0.09941387176513672, -0.09593391418457031, -0.0924539566040039, -0.0889739990234375, -0.0854940414428711, -0.08201408386230469, -0.07853412628173828, -0.07505416870117188, -0.07157421112060547, -0.06809425354003906, -0.06461429595947266, -0.06113433837890625, -0.057654380798339844, -0.05417442321777344, -0.05069446563720703, -0.047214508056640625, -0.04373455047607422, -0.04025459289550781, -0.036774635314941406, -0.033294677734375, -0.029814720153808594, -0.026334762573242188, -0.02285480499267578, -0.019374847412109375, -0.01589488983154297, -0.012414932250976562, -0.008934974670410156, -0.00545501708984375, -0.0019750595092773438, 0.0015048980712890625, 0.004984855651855469, 0.008464813232421875, 0.011944770812988281, 0.015424728393554688, 0.018904685974121094, 0.0223846435546875, 0.025864601135253906, 0.029344558715820312, 0.03282451629638672, 0.036304473876953125, 0.03978443145751953, 0.04326438903808594, 0.046744346618652344, 0.05022430419921875, 0.053704261779785156, 0.05718421936035156, 0.06066417694091797, 0.06414413452148438, 0.06762409210205078, 0.07110404968261719, 0.0745840072631836, 0.07806396484375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 6.0, 4.0, 9.0, 10.0, 16.0, 27.0, 23.0, 42.0, 53.0, 78.0, 122.0, 192.0, 265.0, 481.0, 988.0, 2365.0, 8311.0, 63952.0, 867022.0, 89190.0, 10160.0, 2722.0, 1050.0, 522.0, 307.0, 182.0, 113.0, 113.0, 62.0, 39.0, 22.0, 32.0, 21.0, 16.0, 9.0, 13.0, 0.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.75439453125, -0.7325668334960938, -0.7107391357421875, -0.6889114379882812, -0.667083740234375, -0.6452560424804688, -0.6234283447265625, -0.6016006469726562, -0.57977294921875, -0.5579452514648438, -0.5361175537109375, -0.5142898559570312, -0.492462158203125, -0.47063446044921875, -0.4488067626953125, -0.42697906494140625, -0.4051513671875, -0.38332366943359375, -0.3614959716796875, -0.33966827392578125, -0.317840576171875, -0.29601287841796875, -0.2741851806640625, -0.25235748291015625, -0.23052978515625, -0.20870208740234375, -0.1868743896484375, -0.16504669189453125, -0.143218994140625, -0.12139129638671875, -0.0995635986328125, -0.07773590087890625, -0.055908203125, -0.03408050537109375, -0.0122528076171875, 0.00957489013671875, 0.031402587890625, 0.05323028564453125, 0.0750579833984375, 0.09688568115234375, 0.11871337890625, 0.14054107666015625, 0.1623687744140625, 0.18419647216796875, 0.206024169921875, 0.22785186767578125, 0.2496795654296875, 0.27150726318359375, 0.2933349609375, 0.31516265869140625, 0.3369903564453125, 0.35881805419921875, 0.380645751953125, 0.40247344970703125, 0.4243011474609375, 0.44612884521484375, 0.46795654296875, 0.48978424072265625, 0.5116119384765625, 0.5334396362304688, 0.555267333984375, 0.5770950317382812, 0.5989227294921875, 0.6207504272460938, 0.642578125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 3.0, 6.0, 7.0, 12.0, 9.0, 7.0, 19.0, 21.0, 21.0, 20.0, 33.0, 39.0, 37.0, 46.0, 60.0, 52.0, 66.0, 59.0, 46.0, 54.0, 51.0, 54.0, 42.0, 41.0, 39.0, 16.0, 26.0, 20.0, 11.0, 16.0, 8.0, 12.0, 7.0, 8.0, 2.0, 7.0, 4.0, 5.0, 0.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.486083984375, -0.4698143005371094, -0.45354461669921875, -0.4372749328613281, -0.4210052490234375, -0.4047355651855469, -0.38846588134765625, -0.3721961975097656, -0.355926513671875, -0.3396568298339844, -0.32338714599609375, -0.3071174621582031, -0.2908477783203125, -0.2745780944824219, -0.25830841064453125, -0.24203872680664062, -0.22576904296875, -0.20949935913085938, -0.19322967529296875, -0.17695999145507812, -0.1606903076171875, -0.14442062377929688, -0.12815093994140625, -0.11188125610351562, -0.095611572265625, -0.07934188842773438, -0.06307220458984375, -0.046802520751953125, -0.0305328369140625, -0.014263153076171875, 0.00200653076171875, 0.018276214599609375, 0.0345458984375, 0.050815582275390625, 0.06708526611328125, 0.08335494995117188, 0.0996246337890625, 0.11589431762695312, 0.13216400146484375, 0.14843368530273438, 0.164703369140625, 0.18097305297851562, 0.19724273681640625, 0.21351242065429688, 0.2297821044921875, 0.24605178833007812, 0.26232147216796875, 0.2785911560058594, 0.29486083984375, 0.3111305236816406, 0.32740020751953125, 0.3436698913574219, 0.3599395751953125, 0.3762092590332031, 0.39247894287109375, 0.4087486267089844, 0.425018310546875, 0.4412879943847656, 0.45755767822265625, 0.4738273620605469, 0.4900970458984375, 0.5063667297363281, 0.5226364135742188, 0.5389060974121094, 0.55517578125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 5.0, 3.0, 7.0, 8.0, 3.0, 6.0, 15.0, 22.0, 37.0, 70.0, 109.0, 212.0, 482.0, 1287.0, 5543.0, 50610.0, 911467.0, 69415.0, 6762.0, 1494.0, 514.0, 213.0, 117.0, 62.0, 36.0, 17.0, 9.0, 12.0, 6.0, 4.0, 4.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.350830078125, -0.338958740234375, -0.32708740234375, -0.315216064453125, -0.3033447265625, -0.291473388671875, -0.27960205078125, -0.267730712890625, -0.255859375, -0.243988037109375, -0.23211669921875, -0.220245361328125, -0.2083740234375, -0.196502685546875, -0.18463134765625, -0.172760009765625, -0.160888671875, -0.149017333984375, -0.13714599609375, -0.125274658203125, -0.1134033203125, -0.101531982421875, -0.08966064453125, -0.077789306640625, -0.06591796875, -0.054046630859375, -0.04217529296875, -0.030303955078125, -0.0184326171875, -0.006561279296875, 0.00531005859375, 0.017181396484375, 0.029052734375, 0.040924072265625, 0.05279541015625, 0.064666748046875, 0.0765380859375, 0.088409423828125, 0.10028076171875, 0.112152099609375, 0.1240234375, 0.135894775390625, 0.14776611328125, 0.159637451171875, 0.1715087890625, 0.183380126953125, 0.19525146484375, 0.207122802734375, 0.218994140625, 0.230865478515625, 0.24273681640625, 0.254608154296875, 0.2664794921875, 0.278350830078125, 0.29022216796875, 0.302093505859375, 0.31396484375, 0.325836181640625, 0.33770751953125, 0.349578857421875, 0.3614501953125, 0.373321533203125, 0.38519287109375, 0.397064208984375, 0.408935546875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 5.0, 7.0, 10.0, 10.0, 16.0, 18.0, 22.0, 34.0, 42.0, 55.0, 77.0, 101.0, 114.0, 128.0, 87.0, 60.0, 42.0, 32.0, 31.0, 24.0, 12.0, 8.0, 12.0, 8.0, 4.0, 6.0, 6.0, 4.0, 3.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.334087371826172e-05, -9.079650044441223e-05, -8.825212717056274e-05, -8.570775389671326e-05, -8.316338062286377e-05, -8.061900734901428e-05, -7.80746340751648e-05, -7.553026080131531e-05, -7.298588752746582e-05, -7.044151425361633e-05, -6.789714097976685e-05, -6.535276770591736e-05, -6.280839443206787e-05, -6.0264021158218384e-05, -5.7719647884368896e-05, -5.517527461051941e-05, -5.263090133666992e-05, -5.0086528062820435e-05, -4.754215478897095e-05, -4.499778151512146e-05, -4.245340824127197e-05, -3.9909034967422485e-05, -3.7364661693573e-05, -3.482028841972351e-05, -3.2275915145874023e-05, -2.9731541872024536e-05, -2.718716859817505e-05, -2.464279532432556e-05, -2.2098422050476074e-05, -1.9554048776626587e-05, -1.70096755027771e-05, -1.4465302228927612e-05, -1.1920928955078125e-05, -9.376555681228638e-06, -6.83218240737915e-06, -4.287809133529663e-06, -1.7434358596801758e-06, 8.009374141693115e-07, 3.345310688018799e-06, 5.889683961868286e-06, 8.434057235717773e-06, 1.097843050956726e-05, 1.3522803783416748e-05, 1.6067177057266235e-05, 1.8611550331115723e-05, 2.115592360496521e-05, 2.3700296878814697e-05, 2.6244670152664185e-05, 2.8789043426513672e-05, 3.133341670036316e-05, 3.3877789974212646e-05, 3.6422163248062134e-05, 3.896653652191162e-05, 4.151090979576111e-05, 4.4055283069610596e-05, 4.659965634346008e-05, 4.914402961730957e-05, 5.168840289115906e-05, 5.4232776165008545e-05, 5.677714943885803e-05, 5.932152271270752e-05, 6.186589598655701e-05, 6.44102692604065e-05, 6.695464253425598e-05, 6.949901580810547e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 3.0, 5.0, 1.0, 6.0, 7.0, 9.0, 16.0, 18.0, 22.0, 33.0, 44.0, 77.0, 99.0, 173.0, 250.0, 514.0, 1147.0, 3562.0, 14949.0, 262739.0, 734162.0, 23158.0, 4579.0, 1487.0, 675.0, 305.0, 166.0, 104.0, 69.0, 46.0, 34.0, 16.0, 21.0, 12.0, 9.0, 10.0, 7.0, 4.0, 4.0, 4.0, 1.0, 0.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.305419921875, -0.2945556640625, -0.28369140625, -0.2728271484375, -0.261962890625, -0.2510986328125, -0.240234375, -0.2293701171875, -0.218505859375, -0.2076416015625, -0.19677734375, -0.1859130859375, -0.175048828125, -0.1641845703125, -0.1533203125, -0.1424560546875, -0.131591796875, -0.1207275390625, -0.10986328125, -0.0989990234375, -0.088134765625, -0.0772705078125, -0.06640625, -0.0555419921875, -0.044677734375, -0.0338134765625, -0.02294921875, -0.0120849609375, -0.001220703125, 0.0096435546875, 0.0205078125, 0.0313720703125, 0.042236328125, 0.0531005859375, 0.06396484375, 0.0748291015625, 0.085693359375, 0.0965576171875, 0.107421875, 0.1182861328125, 0.129150390625, 0.1400146484375, 0.15087890625, 0.1617431640625, 0.172607421875, 0.1834716796875, 0.1943359375, 0.2052001953125, 0.216064453125, 0.2269287109375, 0.23779296875, 0.2486572265625, 0.259521484375, 0.2703857421875, 0.28125, 0.2921142578125, 0.302978515625, 0.3138427734375, 0.32470703125, 0.3355712890625, 0.346435546875, 0.3572998046875, 0.3681640625, 0.3790283203125, 0.389892578125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 1.0, 3.0, 8.0, 7.0, 9.0, 12.0, 12.0, 18.0, 31.0, 57.0, 74.0, 111.0, 152.0, 170.0, 114.0, 64.0, 43.0, 38.0, 13.0, 11.0, 20.0, 9.0, 2.0, 10.0, 1.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2027587890625, -0.1943035125732422, -0.18584823608398438, -0.17739295959472656, -0.16893768310546875, -0.16048240661621094, -0.15202713012695312, -0.1435718536376953, -0.1351165771484375, -0.1266613006591797, -0.11820602416992188, -0.10975074768066406, -0.10129547119140625, -0.09284019470214844, -0.08438491821289062, -0.07592964172363281, -0.067474365234375, -0.05901908874511719, -0.050563812255859375, -0.04210853576660156, -0.03365325927734375, -0.025197982788085938, -0.016742706298828125, -0.008287429809570312, 0.0001678466796875, 0.008623123168945312, 0.017078399658203125, 0.025533676147460938, 0.03398895263671875, 0.04244422912597656, 0.050899505615234375, 0.05935478210449219, 0.06781005859375, 0.07626533508300781, 0.08472061157226562, 0.09317588806152344, 0.10163116455078125, 0.11008644104003906, 0.11854171752929688, 0.1269969940185547, 0.1354522705078125, 0.1439075469970703, 0.15236282348632812, 0.16081809997558594, 0.16927337646484375, 0.17772865295410156, 0.18618392944335938, 0.1946392059326172, 0.203094482421875, 0.2115497589111328, 0.22000503540039062, 0.22846031188964844, 0.23691558837890625, 0.24537086486816406, 0.2538261413574219, 0.2622814178466797, 0.2707366943359375, 0.2791919708251953, 0.2876472473144531, 0.29610252380371094, 0.30455780029296875, 0.31301307678222656, 0.3214683532714844, 0.3299236297607422, 0.33837890625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 13.0, 32.0, 59.0, 125.0, 202.0, 244.0, 147.0, 94.0, 45.0, 12.0, 7.0, 7.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.706342697143555, -4.560476779937744, -4.414610385894775, -4.268744468688965, -4.122878074645996, -3.9770121574401855, -3.831146001815796, -3.6852798461914062, -3.5394136905670166, -3.393547534942627, -3.2476813793182373, -3.1018152236938477, -2.955949306488037, -2.8100829124450684, -2.664216995239258, -2.518350839614868, -2.3724846839904785, -2.226618528366089, -2.080752372741699, -1.9348863363265991, -1.7890201807022095, -1.6431540250778198, -1.4972879886627197, -1.35142183303833, -1.2055556774139404, -1.0596895217895508, -0.9138234257698059, -0.767957329750061, -0.6220911741256714, -0.47622501850128174, -0.33035892248153687, -0.184492826461792, -0.038626670837402344, 0.10723945498466492, 0.2531055808067322, 0.39897170662879944, 0.5448378324508667, 0.6907039880752563, 0.8365700840950012, 0.9824361801147461, 1.1283023357391357, 1.2741684913635254, 1.420034646987915, 1.5659006834030151, 1.7117668390274048, 1.8576329946517944, 2.0034990310668945, 2.149365186691284, 2.295231342315674, 2.4410974979400635, 2.586963653564453, 2.7328298091888428, 2.8786959648132324, 3.024561882019043, 3.1704280376434326, 3.3162941932678223, 3.462160348892212, 3.6080265045166016, 3.753892660140991, 3.899758815765381, 4.045624732971191, 4.19149112701416, 4.337357044219971, 4.483222961425781, 4.62908935546875]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 7.0, 7.0, 5.0, 4.0, 7.0, 8.0, 11.0, 14.0, 13.0, 17.0, 21.0, 20.0, 24.0, 32.0, 31.0, 34.0, 38.0, 48.0, 52.0, 49.0, 35.0, 52.0, 47.0, 44.0, 48.0, 45.0, 28.0, 33.0, 26.0, 36.0, 27.0, 26.0, 21.0, 14.0, 19.0, 13.0, 15.0, 6.0, 3.0, 9.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6672248840332031, -1.6136741638183594, -1.5601234436035156, -1.5065727233886719, -1.4530220031738281, -1.3994712829589844, -1.3459205627441406, -1.2923698425292969, -1.2388191223144531, -1.1852684020996094, -1.1317176818847656, -1.0781669616699219, -1.0246162414550781, -0.9710655212402344, -0.9175148606300354, -0.8639641404151917, -0.8104134798049927, -0.7568627595901489, -0.7033120393753052, -0.6497613191604614, -0.5962105989456177, -0.5426598787307739, -0.48910921812057495, -0.4355584979057312, -0.38200777769088745, -0.3284570574760437, -0.27490633726119995, -0.2213556468486786, -0.16780492663383484, -0.11425420641899109, -0.06070351600646973, -0.0071527957916259766, 0.04639780521392822, 0.09994851797819138, 0.15349923074245453, 0.20704993605613708, 0.26060065627098083, 0.3141513764858246, 0.36770206689834595, 0.4212527871131897, 0.47480350732803345, 0.5283542275428772, 0.581904947757721, 0.6354556083679199, 0.6890063285827637, 0.7425570487976074, 0.7961077690124512, 0.8496584892272949, 0.9032092094421387, 0.9567599296569824, 1.0103106498718262, 1.06386137008667, 1.1174120903015137, 1.1709628105163574, 1.2245135307312012, 1.278064250946045, 1.3316149711608887, 1.3851656913757324, 1.4387164115905762, 1.49226713180542, 1.5458178520202637, 1.5993685722351074, 1.6529192924499512, 1.706470012664795, 1.7600206136703491]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 4.0, 10.0, 12.0, 17.0, 16.0, 22.0, 33.0, 49.0, 69.0, 115.0, 194.0, 457.0, 1161.0, 4445.0, 33887.0, 3319803.0, 809586.0, 19641.0, 3189.0, 866.0, 303.0, 147.0, 91.0, 50.0, 28.0, 24.0, 21.0, 12.0, 2.0, 10.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.489013671875, -0.474578857421875, -0.46014404296875, -0.445709228515625, -0.4312744140625, -0.416839599609375, -0.40240478515625, -0.387969970703125, -0.37353515625, -0.359100341796875, -0.34466552734375, -0.330230712890625, -0.3157958984375, -0.301361083984375, -0.28692626953125, -0.272491455078125, -0.258056640625, -0.243621826171875, -0.22918701171875, -0.214752197265625, -0.2003173828125, -0.185882568359375, -0.17144775390625, -0.157012939453125, -0.142578125, -0.128143310546875, -0.11370849609375, -0.099273681640625, -0.0848388671875, -0.070404052734375, -0.05596923828125, -0.041534423828125, -0.027099609375, -0.012664794921875, 0.00177001953125, 0.016204833984375, 0.0306396484375, 0.045074462890625, 0.05950927734375, 0.073944091796875, 0.08837890625, 0.102813720703125, 0.11724853515625, 0.131683349609375, 0.1461181640625, 0.160552978515625, 0.17498779296875, 0.189422607421875, 0.203857421875, 0.218292236328125, 0.23272705078125, 0.247161865234375, 0.2615966796875, 0.276031494140625, 0.29046630859375, 0.304901123046875, 0.3193359375, 0.333770751953125, 0.34820556640625, 0.362640380859375, 0.3770751953125, 0.391510009765625, 0.40594482421875, 0.420379638671875, 0.434814453125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 6.0, 5.0, 12.0, 20.0, 26.0, 26.0, 32.0, 50.0, 50.0, 63.0, 72.0, 95.0, 89.0, 76.0, 83.0, 74.0, 58.0, 56.0, 31.0, 30.0, 15.0, 12.0, 5.0, 9.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.18896484375, -0.18426895141601562, -0.17957305908203125, -0.17487716674804688, -0.1701812744140625, -0.16548538208007812, -0.16078948974609375, -0.15609359741210938, -0.151397705078125, -0.14670181274414062, -0.14200592041015625, -0.13731002807617188, -0.1326141357421875, -0.12791824340820312, -0.12322235107421875, -0.11852645874023438, -0.11383056640625, -0.10913467407226562, -0.10443878173828125, -0.09974288940429688, -0.0950469970703125, -0.09035110473632812, -0.08565521240234375, -0.08095932006835938, -0.076263427734375, -0.07156753540039062, -0.06687164306640625, -0.062175750732421875, -0.0574798583984375, -0.052783966064453125, -0.04808807373046875, -0.043392181396484375, -0.0386962890625, -0.034000396728515625, -0.02930450439453125, -0.024608612060546875, -0.0199127197265625, -0.015216827392578125, -0.01052093505859375, -0.005825042724609375, -0.001129150390625, 0.003566741943359375, 0.00826263427734375, 0.012958526611328125, 0.0176544189453125, 0.022350311279296875, 0.02704620361328125, 0.031742095947265625, 0.03643798828125, 0.041133880615234375, 0.04582977294921875, 0.050525665283203125, 0.0552215576171875, 0.059917449951171875, 0.06461334228515625, 0.06930923461914062, 0.074005126953125, 0.07870101928710938, 0.08339691162109375, 0.08809280395507812, 0.0927886962890625, 0.09748458862304688, 0.10218048095703125, 0.10687637329101562, 0.111572265625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 4.0, 13.0, 10.0, 10.0, 20.0, 29.0, 51.0, 112.0, 246.0, 659.0, 2251.0, 10031.0, 94493.0, 3811725.0, 252411.0, 17442.0, 3155.0, 917.0, 299.0, 163.0, 91.0, 56.0, 31.0, 14.0, 19.0, 14.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41357421875, -0.39678955078125, -0.3800048828125, -0.36322021484375, -0.346435546875, -0.32965087890625, -0.3128662109375, -0.29608154296875, -0.279296875, -0.26251220703125, -0.2457275390625, -0.22894287109375, -0.212158203125, -0.19537353515625, -0.1785888671875, -0.16180419921875, -0.14501953125, -0.12823486328125, -0.1114501953125, -0.09466552734375, -0.077880859375, -0.06109619140625, -0.0443115234375, -0.02752685546875, -0.0107421875, 0.00604248046875, 0.0228271484375, 0.03961181640625, 0.056396484375, 0.07318115234375, 0.0899658203125, 0.10675048828125, 0.12353515625, 0.14031982421875, 0.1571044921875, 0.17388916015625, 0.190673828125, 0.20745849609375, 0.2242431640625, 0.24102783203125, 0.2578125, 0.27459716796875, 0.2913818359375, 0.30816650390625, 0.324951171875, 0.34173583984375, 0.3585205078125, 0.37530517578125, 0.39208984375, 0.40887451171875, 0.4256591796875, 0.44244384765625, 0.459228515625, 0.47601318359375, 0.4927978515625, 0.50958251953125, 0.5263671875, 0.54315185546875, 0.5599365234375, 0.57672119140625, 0.593505859375, 0.61029052734375, 0.6270751953125, 0.64385986328125, 0.66064453125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 3.0, 4.0, 2.0, 5.0, 20.0, 30.0, 47.0, 72.0, 137.0, 266.0, 722.0, 1398.0, 758.0, 278.0, 142.0, 58.0, 40.0, 30.0, 20.0, 11.0, 11.0, 4.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27294921875, -0.25962066650390625, -0.2462921142578125, -0.23296356201171875, -0.219635009765625, -0.20630645751953125, -0.1929779052734375, -0.17964935302734375, -0.16632080078125, -0.15299224853515625, -0.1396636962890625, -0.12633514404296875, -0.113006591796875, -0.09967803955078125, -0.0863494873046875, -0.07302093505859375, -0.0596923828125, -0.04636383056640625, -0.0330352783203125, -0.01970672607421875, -0.006378173828125, 0.00695037841796875, 0.0202789306640625, 0.03360748291015625, 0.04693603515625, 0.06026458740234375, 0.0735931396484375, 0.08692169189453125, 0.100250244140625, 0.11357879638671875, 0.1269073486328125, 0.14023590087890625, 0.153564453125, 0.16689300537109375, 0.1802215576171875, 0.19355010986328125, 0.206878662109375, 0.22020721435546875, 0.2335357666015625, 0.24686431884765625, 0.26019287109375, 0.27352142333984375, 0.2868499755859375, 0.30017852783203125, 0.313507080078125, 0.32683563232421875, 0.3401641845703125, 0.35349273681640625, 0.3668212890625, 0.38014984130859375, 0.3934783935546875, 0.40680694580078125, 0.420135498046875, 0.43346405029296875, 0.4467926025390625, 0.46012115478515625, 0.47344970703125, 0.48677825927734375, 0.5001068115234375, 0.5134353637695312, 0.526763916015625, 0.5400924682617188, 0.5534210205078125, 0.5667495727539062, 0.580078125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 12.0, 20.0, 44.0, 81.0, 211.0, 242.0, 203.0, 101.0, 36.0, 20.0, 10.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7889578342437744, -2.683520793914795, -2.5780837535858154, -2.472646713256836, -2.3672094345092773, -2.261772394180298, -2.1563353538513184, -2.050898313522339, -1.9454611539840698, -1.8400241136550903, -1.7345869541168213, -1.6291499137878418, -1.5237128734588623, -1.4182757139205933, -1.3128386735916138, -1.2074015140533447, -1.1019644737243652, -0.996527373790741, -0.8910902738571167, -0.7856532335281372, -0.6802161335945129, -0.5747790336608887, -0.4693419933319092, -0.3639048933982849, -0.25846779346466064, -0.15303070843219757, -0.0475936233997345, 0.05784344673156738, 0.16328054666519165, 0.2687176465988159, 0.3741546869277954, 0.4795917868614197, 0.585029125213623, 0.6904662251472473, 0.7959033250808716, 0.9013403654098511, 1.0067775249481201, 1.1122145652770996, 1.217651605606079, 1.3230886459350586, 1.4285258054733276, 1.5339628458023071, 1.6394000053405762, 1.7448370456695557, 1.8502740859985352, 1.9557112455368042, 2.061148166656494, 2.1665854454040527, 2.2720224857330322, 2.3774595260620117, 2.482896566390991, 2.5883336067199707, 2.6937708854675293, 2.799207925796509, 2.9046449661254883, 3.0100820064544678, 3.1155190467834473, 3.2209560871124268, 3.3263931274414062, 3.431830406188965, 3.5372674465179443, 3.642704486846924, 3.7481415271759033, 3.853578567504883, 3.9590158462524414]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 8.0, 9.0, 6.0, 15.0, 20.0, 23.0, 19.0, 32.0, 33.0, 36.0, 42.0, 61.0, 54.0, 69.0, 60.0, 65.0, 46.0, 60.0, 55.0, 34.0, 50.0, 31.0, 42.0, 30.0, 22.0, 17.0, 13.0, 11.0, 14.0, 4.0, 10.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.397870659828186, -1.3496992588043213, -1.301527976989746, -1.2533565759658813, -1.2051851749420166, -1.1570138931274414, -1.1088424921035767, -1.060671091079712, -1.0124998092651367, -0.9643284678459167, -0.9161571264266968, -0.867985725402832, -0.8198143839836121, -0.7716430425643921, -0.7234716415405273, -0.6753003001213074, -0.6271289587020874, -0.5789576172828674, -0.5307862758636475, -0.4826148748397827, -0.43444353342056274, -0.3862721920013428, -0.3381008207798004, -0.28992944955825806, -0.24175810813903809, -0.19358675181865692, -0.14541539549827576, -0.09724403917789459, -0.04907268285751343, -0.0009013265371322632, 0.0472700297832489, 0.09544140100479126, 0.14361262321472168, 0.19178397953510284, 0.239955335855484, 0.28812670707702637, 0.33629804849624634, 0.3844693899154663, 0.43264076113700867, 0.480812132358551, 0.528983473777771, 0.577154815196991, 0.6253261566162109, 0.6734975576400757, 0.7216688990592957, 0.7698402404785156, 0.8180116415023804, 0.8661829829216003, 0.9143543243408203, 0.9625256657600403, 1.0106970071792603, 1.058868408203125, 1.1070396900177002, 1.155211091041565, 1.2033824920654297, 1.2515537738800049, 1.2997251749038696, 1.3478965759277344, 1.3960678577423096, 1.4442392587661743, 1.492410659790039, 1.5405819416046143, 1.588753342628479, 1.6369247436523438, 1.685096025466919]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 7.0, 3.0, 4.0, 10.0, 16.0, 26.0, 50.0, 68.0, 189.0, 445.0, 1338.0, 5944.0, 38976.0, 683795.0, 290247.0, 22022.0, 3852.0, 928.0, 335.0, 137.0, 84.0, 41.0, 20.0, 8.0, 4.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56201171875, -0.5431900024414062, -0.5243682861328125, -0.5055465698242188, -0.486724853515625, -0.46790313720703125, -0.4490814208984375, -0.43025970458984375, -0.41143798828125, -0.39261627197265625, -0.3737945556640625, -0.35497283935546875, -0.336151123046875, -0.31732940673828125, -0.2985076904296875, -0.27968597412109375, -0.2608642578125, -0.24204254150390625, -0.2232208251953125, -0.20439910888671875, -0.185577392578125, -0.16675567626953125, -0.1479339599609375, -0.12911224365234375, -0.11029052734375, -0.09146881103515625, -0.0726470947265625, -0.05382537841796875, -0.035003662109375, -0.01618194580078125, 0.0026397705078125, 0.02146148681640625, 0.040283203125, 0.05910491943359375, 0.0779266357421875, 0.09674835205078125, 0.115570068359375, 0.13439178466796875, 0.1532135009765625, 0.17203521728515625, 0.19085693359375, 0.20967864990234375, 0.2285003662109375, 0.24732208251953125, 0.266143798828125, 0.28496551513671875, 0.3037872314453125, 0.32260894775390625, 0.3414306640625, 0.36025238037109375, 0.3790740966796875, 0.39789581298828125, 0.416717529296875, 0.43553924560546875, 0.4543609619140625, 0.47318267822265625, 0.49200439453125, 0.5108261108398438, 0.5296478271484375, 0.5484695434570312, 0.567291259765625, 0.5861129760742188, 0.6049346923828125, 0.6237564086914062, 0.642578125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 13.0, 15.0, 13.0, 13.0, 31.0, 38.0, 38.0, 57.0, 45.0, 64.0, 56.0, 96.0, 99.0, 82.0, 73.0, 57.0, 61.0, 41.0, 36.0, 30.0, 19.0, 10.0, 10.0, 5.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.2420654296875, -0.23701190948486328, -0.23195838928222656, -0.22690486907958984, -0.22185134887695312, -0.2167978286743164, -0.2117443084716797, -0.20669078826904297, -0.20163726806640625, -0.19658374786376953, -0.1915302276611328, -0.1864767074584961, -0.18142318725585938, -0.17636966705322266, -0.17131614685058594, -0.16626262664794922, -0.1612091064453125, -0.15615558624267578, -0.15110206604003906, -0.14604854583740234, -0.14099502563476562, -0.1359415054321289, -0.1308879852294922, -0.12583446502685547, -0.12078094482421875, -0.11572742462158203, -0.11067390441894531, -0.1056203842163086, -0.10056686401367188, -0.09551334381103516, -0.09045982360839844, -0.08540630340576172, -0.080352783203125, -0.07529926300048828, -0.07024574279785156, -0.06519222259521484, -0.060138702392578125, -0.055085182189941406, -0.05003166198730469, -0.04497814178466797, -0.03992462158203125, -0.03487110137939453, -0.029817581176757812, -0.024764060974121094, -0.019710540771484375, -0.014657020568847656, -0.009603500366210938, -0.004549980163574219, 0.0005035400390625, 0.005557060241699219, 0.010610580444335938, 0.015664100646972656, 0.020717620849609375, 0.025771141052246094, 0.030824661254882812, 0.03587818145751953, 0.04093170166015625, 0.04598522186279297, 0.05103874206542969, 0.056092262268066406, 0.061145782470703125, 0.06619930267333984, 0.07125282287597656, 0.07630634307861328, 0.08135986328125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 9.0, 15.0, 24.0, 13.0, 25.0, 39.0, 59.0, 101.0, 159.0, 308.0, 553.0, 1271.0, 3667.0, 15097.0, 147380.0, 820578.0, 47169.0, 7856.0, 2274.0, 901.0, 429.0, 247.0, 120.0, 96.0, 55.0, 33.0, 17.0, 21.0, 8.0, 4.0, 8.0, 3.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6357421875, -0.6154251098632812, -0.5951080322265625, -0.5747909545898438, -0.554473876953125, -0.5341567993164062, -0.5138397216796875, -0.49352264404296875, -0.47320556640625, -0.45288848876953125, -0.4325714111328125, -0.41225433349609375, -0.391937255859375, -0.37162017822265625, -0.3513031005859375, -0.33098602294921875, -0.3106689453125, -0.29035186767578125, -0.2700347900390625, -0.24971771240234375, -0.229400634765625, -0.20908355712890625, -0.1887664794921875, -0.16844940185546875, -0.14813232421875, -0.12781524658203125, -0.1074981689453125, -0.08718109130859375, -0.066864013671875, -0.04654693603515625, -0.0262298583984375, -0.00591278076171875, 0.014404296875, 0.03472137451171875, 0.0550384521484375, 0.07535552978515625, 0.095672607421875, 0.11598968505859375, 0.1363067626953125, 0.15662384033203125, 0.17694091796875, 0.19725799560546875, 0.2175750732421875, 0.23789215087890625, 0.258209228515625, 0.27852630615234375, 0.2988433837890625, 0.31916046142578125, 0.3394775390625, 0.35979461669921875, 0.3801116943359375, 0.40042877197265625, 0.420745849609375, 0.44106292724609375, 0.4613800048828125, 0.48169708251953125, 0.50201416015625, 0.5223312377929688, 0.5426483154296875, 0.5629653930664062, 0.583282470703125, 0.6035995483398438, 0.6239166259765625, 0.6442337036132812, 0.66455078125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 2.0, 5.0, 5.0, 7.0, 8.0, 14.0, 12.0, 23.0, 20.0, 28.0, 23.0, 45.0, 33.0, 59.0, 55.0, 57.0, 59.0, 64.0, 63.0, 65.0, 62.0, 52.0, 48.0, 35.0, 29.0, 31.0, 14.0, 18.0, 15.0, 15.0, 6.0, 8.0, 7.0, 2.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.466552734375, -0.4490242004394531, -0.43149566650390625, -0.4139671325683594, -0.3964385986328125, -0.3789100646972656, -0.36138153076171875, -0.3438529968261719, -0.326324462890625, -0.3087959289550781, -0.29126739501953125, -0.2737388610839844, -0.2562103271484375, -0.23868179321289062, -0.22115325927734375, -0.20362472534179688, -0.18609619140625, -0.16856765747070312, -0.15103912353515625, -0.13351058959960938, -0.1159820556640625, -0.09845352172851562, -0.08092498779296875, -0.06339645385742188, -0.045867919921875, -0.028339385986328125, -0.01081085205078125, 0.006717681884765625, 0.0242462158203125, 0.041774749755859375, 0.05930328369140625, 0.07683181762695312, 0.0943603515625, 0.11188888549804688, 0.12941741943359375, 0.14694595336914062, 0.1644744873046875, 0.18200302124023438, 0.19953155517578125, 0.21706008911132812, 0.234588623046875, 0.2521171569824219, 0.26964569091796875, 0.2871742248535156, 0.3047027587890625, 0.3222312927246094, 0.33975982666015625, 0.3572883605957031, 0.37481689453125, 0.3923454284667969, 0.40987396240234375, 0.4274024963378906, 0.4449310302734375, 0.4624595642089844, 0.47998809814453125, 0.4975166320800781, 0.515045166015625, 0.5325736999511719, 0.5501022338867188, 0.5676307678222656, 0.5851593017578125, 0.6026878356933594, 0.6202163696289062, 0.6377449035644531, 0.6552734375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 2.0, 5.0, 6.0, 12.0, 13.0, 18.0, 20.0, 46.0, 57.0, 112.0, 190.0, 484.0, 1429.0, 7016.0, 140946.0, 875849.0, 18396.0, 2542.0, 713.0, 313.0, 139.0, 81.0, 43.0, 25.0, 27.0, 19.0, 11.0, 12.0, 3.0, 6.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.490478515625, -0.475250244140625, -0.46002197265625, -0.444793701171875, -0.4295654296875, -0.414337158203125, -0.39910888671875, -0.383880615234375, -0.36865234375, -0.353424072265625, -0.33819580078125, -0.322967529296875, -0.3077392578125, -0.292510986328125, -0.27728271484375, -0.262054443359375, -0.246826171875, -0.231597900390625, -0.21636962890625, -0.201141357421875, -0.1859130859375, -0.170684814453125, -0.15545654296875, -0.140228271484375, -0.125, -0.109771728515625, -0.09454345703125, -0.079315185546875, -0.0640869140625, -0.048858642578125, -0.03363037109375, -0.018402099609375, -0.003173828125, 0.012054443359375, 0.02728271484375, 0.042510986328125, 0.0577392578125, 0.072967529296875, 0.08819580078125, 0.103424072265625, 0.11865234375, 0.133880615234375, 0.14910888671875, 0.164337158203125, 0.1795654296875, 0.194793701171875, 0.21002197265625, 0.225250244140625, 0.240478515625, 0.255706787109375, 0.27093505859375, 0.286163330078125, 0.3013916015625, 0.316619873046875, 0.33184814453125, 0.347076416015625, 0.3623046875, 0.377532958984375, 0.39276123046875, 0.407989501953125, 0.4232177734375, 0.438446044921875, 0.45367431640625, 0.468902587890625, 0.484130859375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 7.0, 6.0, 7.0, 10.0, 7.0, 23.0, 18.0, 27.0, 30.0, 54.0, 59.0, 85.0, 117.0, 107.0, 112.0, 78.0, 73.0, 57.0, 26.0, 32.0, 20.0, 11.0, 8.0, 10.0, 5.0, 8.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00010055303573608398, -9.813159704208374e-05, -9.57101583480835e-05, -9.328871965408325e-05, -9.086728096008301e-05, -8.844584226608276e-05, -8.602440357208252e-05, -8.360296487808228e-05, -8.118152618408203e-05, -7.876008749008179e-05, -7.633864879608154e-05, -7.39172101020813e-05, -7.149577140808105e-05, -6.907433271408081e-05, -6.665289402008057e-05, -6.423145532608032e-05, -6.181001663208008e-05, -5.9388577938079834e-05, -5.696713924407959e-05, -5.4545700550079346e-05, -5.21242618560791e-05, -4.970282316207886e-05, -4.728138446807861e-05, -4.485994577407837e-05, -4.2438507080078125e-05, -4.001706838607788e-05, -3.759562969207764e-05, -3.517419099807739e-05, -3.275275230407715e-05, -3.0331313610076904e-05, -2.790987491607666e-05, -2.5488436222076416e-05, -2.3066997528076172e-05, -2.0645558834075928e-05, -1.8224120140075684e-05, -1.580268144607544e-05, -1.3381242752075195e-05, -1.0959804058074951e-05, -8.538365364074707e-06, -6.116926670074463e-06, -3.6954879760742188e-06, -1.2740492820739746e-06, 1.1473894119262695e-06, 3.5688281059265137e-06, 5.990266799926758e-06, 8.411705493927002e-06, 1.0833144187927246e-05, 1.325458288192749e-05, 1.5676021575927734e-05, 1.809746026992798e-05, 2.0518898963928223e-05, 2.2940337657928467e-05, 2.536177635192871e-05, 2.7783215045928955e-05, 3.02046537399292e-05, 3.262609243392944e-05, 3.504753112792969e-05, 3.746896982192993e-05, 3.9890408515930176e-05, 4.231184720993042e-05, 4.4733285903930664e-05, 4.715472459793091e-05, 4.957616329193115e-05, 5.1997601985931396e-05, 5.441904067993164e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 9.0, 8.0, 12.0, 26.0, 24.0, 44.0, 60.0, 93.0, 173.0, 335.0, 657.0, 1795.0, 5687.0, 29843.0, 608149.0, 369954.0, 23832.0, 4991.0, 1578.0, 629.0, 294.0, 143.0, 86.0, 38.0, 27.0, 17.0, 15.0, 14.0, 7.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.298095703125, -0.2890472412109375, -0.279998779296875, -0.2709503173828125, -0.26190185546875, -0.2528533935546875, -0.243804931640625, -0.2347564697265625, -0.2257080078125, -0.2166595458984375, -0.207611083984375, -0.1985626220703125, -0.18951416015625, -0.1804656982421875, -0.171417236328125, -0.1623687744140625, -0.1533203125, -0.1442718505859375, -0.135223388671875, -0.1261749267578125, -0.11712646484375, -0.1080780029296875, -0.099029541015625, -0.0899810791015625, -0.0809326171875, -0.0718841552734375, -0.062835693359375, -0.0537872314453125, -0.04473876953125, -0.0356903076171875, -0.026641845703125, -0.0175933837890625, -0.008544921875, 0.0005035400390625, 0.009552001953125, 0.0186004638671875, 0.02764892578125, 0.0366973876953125, 0.045745849609375, 0.0547943115234375, 0.0638427734375, 0.0728912353515625, 0.081939697265625, 0.0909881591796875, 0.10003662109375, 0.1090850830078125, 0.118133544921875, 0.1271820068359375, 0.13623046875, 0.1452789306640625, 0.154327392578125, 0.1633758544921875, 0.17242431640625, 0.1814727783203125, 0.190521240234375, 0.1995697021484375, 0.2086181640625, 0.2176666259765625, 0.226715087890625, 0.2357635498046875, 0.24481201171875, 0.2538604736328125, 0.262908935546875, 0.2719573974609375, 0.281005859375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 6.0, 2.0, 6.0, 3.0, 6.0, 17.0, 23.0, 37.0, 55.0, 68.0, 91.0, 138.0, 161.0, 113.0, 90.0, 57.0, 37.0, 25.0, 11.0, 19.0, 11.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.28125, -0.2735271453857422, -0.2658042907714844, -0.25808143615722656, -0.25035858154296875, -0.24263572692871094, -0.23491287231445312, -0.2271900177001953, -0.2194671630859375, -0.2117443084716797, -0.20402145385742188, -0.19629859924316406, -0.18857574462890625, -0.18085289001464844, -0.17313003540039062, -0.1654071807861328, -0.157684326171875, -0.1499614715576172, -0.14223861694335938, -0.13451576232910156, -0.12679290771484375, -0.11907005310058594, -0.11134719848632812, -0.10362434387207031, -0.0959014892578125, -0.08817863464355469, -0.08045578002929688, -0.07273292541503906, -0.06501007080078125, -0.05728721618652344, -0.049564361572265625, -0.04184150695800781, -0.03411865234375, -0.026395797729492188, -0.018672943115234375, -0.010950088500976562, -0.00322723388671875, 0.0044956207275390625, 0.012218475341796875, 0.019941329956054688, 0.0276641845703125, 0.03538703918457031, 0.043109893798828125, 0.05083274841308594, 0.05855560302734375, 0.06627845764160156, 0.07400131225585938, 0.08172416687011719, 0.089447021484375, 0.09716987609863281, 0.10489273071289062, 0.11261558532714844, 0.12033843994140625, 0.12806129455566406, 0.13578414916992188, 0.1435070037841797, 0.1512298583984375, 0.1589527130126953, 0.16667556762695312, 0.17439842224121094, 0.18212127685546875, 0.18984413146972656, 0.19756698608398438, 0.2052898406982422, 0.2130126953125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 9.0, 24.0, 48.0, 151.0, 287.0, 240.0, 136.0, 51.0, 16.0, 12.0, 9.0, 1.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.172328472137451, -5.010281085968018, -4.848234176635742, -4.686186790466309, -4.524139404296875, -4.362092018127441, -4.200045108795166, -4.037997722625732, -3.875950574874878, -3.7139034271240234, -3.55185604095459, -3.3898088932037354, -3.227761745452881, -3.0657143592834473, -2.9036672115325928, -2.7416200637817383, -2.5795726776123047, -2.41752552986145, -2.2554781436920166, -2.093430995941162, -1.931383728981018, -1.769336462020874, -1.6072893142700195, -1.4452420473098755, -1.2831947803497314, -1.1211475133895874, -0.9591003060340881, -0.7970530986785889, -0.6350058317184448, -0.4729585647583008, -0.3109113574028015, -0.14886415004730225, 0.013182640075683594, 0.17522987723350525, 0.3372771143913269, 0.49932435154914856, 0.6613715887069702, 0.8234188556671143, 0.9854660630226135, 1.1475132703781128, 1.3095605373382568, 1.4716078042984009, 1.633655071258545, 1.7957022190093994, 1.9577494859695435, 2.1197967529296875, 2.281843900680542, 2.4438910484313965, 2.60593843460083, 2.7679855823516846, 2.930032968521118, 3.0920801162719727, 3.2541275024414062, 3.4161746501922607, 3.5782217979431152, 3.740269184112549, 3.9023163318634033, 4.064363479614258, 4.226410865783691, 4.388458251953125, 4.5505051612854, 4.712552547454834, 4.874599933624268, 5.036646842956543, 5.198694229125977]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 2.0, 5.0, 9.0, 9.0, 12.0, 20.0, 8.0, 13.0, 18.0, 18.0, 23.0, 29.0, 26.0, 25.0, 21.0, 35.0, 36.0, 34.0, 53.0, 42.0, 53.0, 55.0, 46.0, 46.0, 41.0, 26.0, 38.0, 42.0, 25.0, 33.0, 13.0, 24.0, 17.0, 21.0, 14.0, 12.0, 14.0, 10.0, 6.0, 2.0, 6.0, 6.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.5909292697906494, -1.5423047542572021, -1.4936801195144653, -1.445055603981018, -1.3964309692382812, -1.347806453704834, -1.2991818189620972, -1.25055730342865, -1.201932668685913, -1.1533081531524658, -1.104683518409729, -1.0560590028762817, -1.007434368133545, -0.9588097929954529, -0.9101852178573608, -0.8615607023239136, -0.8129361271858215, -0.7643115520477295, -0.7156869769096375, -0.6670624017715454, -0.6184378266334534, -0.5698132514953613, -0.5211887359619141, -0.47256413102149963, -0.4239395558834076, -0.37531498074531555, -0.3266904056072235, -0.27806586027145386, -0.22944127023220062, -0.18081669509410858, -0.13219213485717773, -0.0835675597190857, -0.03494298458099365, 0.01368158683180809, 0.06230615824460983, 0.11093072593212128, 0.15955530107021332, 0.20817987620830536, 0.2568044364452362, 0.30542901158332825, 0.3540535867214203, 0.40267816185951233, 0.45130273699760437, 0.499927282333374, 0.5485518574714661, 0.5971764326095581, 0.6458010077476501, 0.6944255828857422, 0.7430501580238342, 0.7916747331619263, 0.8402993083000183, 0.8889238834381104, 0.9375484585762024, 0.9861730337142944, 1.0347975492477417, 1.0834221839904785, 1.1320466995239258, 1.180671215057373, 1.2292958498001099, 1.2779203653335571, 1.326545000076294, 1.3751695156097412, 1.423794150352478, 1.4724186658859253, 1.521043300628662]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 7.0, 1.0, 2.0, 3.0, 12.0, 11.0, 11.0, 25.0, 21.0, 56.0, 71.0, 146.0, 250.0, 524.0, 1215.0, 3315.0, 11125.0, 53526.0, 662907.0, 3181732.0, 237213.0, 30792.0, 7338.0, 2371.0, 879.0, 358.0, 193.0, 80.0, 44.0, 21.0, 13.0, 6.0, 4.0, 2.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.392333984375, -0.3828411102294922, -0.3733482360839844, -0.36385536193847656, -0.35436248779296875, -0.34486961364746094, -0.3353767395019531, -0.3258838653564453, -0.3163909912109375, -0.3068981170654297, -0.2974052429199219, -0.28791236877441406, -0.27841949462890625, -0.26892662048339844, -0.2594337463378906, -0.2499408721923828, -0.240447998046875, -0.2309551239013672, -0.22146224975585938, -0.21196937561035156, -0.20247650146484375, -0.19298362731933594, -0.18349075317382812, -0.1739978790283203, -0.1645050048828125, -0.1550121307373047, -0.14551925659179688, -0.13602638244628906, -0.12653350830078125, -0.11704063415527344, -0.10754776000976562, -0.09805488586425781, -0.08856201171875, -0.07906913757324219, -0.06957626342773438, -0.06008338928222656, -0.05059051513671875, -0.04109764099121094, -0.031604766845703125, -0.022111892700195312, -0.0126190185546875, -0.0031261444091796875, 0.006366729736328125, 0.015859603881835938, 0.02535247802734375, 0.03484535217285156, 0.044338226318359375, 0.05383110046386719, 0.063323974609375, 0.07281684875488281, 0.08230972290039062, 0.09180259704589844, 0.10129547119140625, 0.11078834533691406, 0.12028121948242188, 0.1297740936279297, 0.1392669677734375, 0.1487598419189453, 0.15825271606445312, 0.16774559020996094, 0.17723846435546875, 0.18673133850097656, 0.19622421264648438, 0.2057170867919922, 0.2152099609375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 8.0, 5.0, 12.0, 9.0, 18.0, 17.0, 10.0, 24.0, 31.0, 33.0, 55.0, 42.0, 44.0, 55.0, 49.0, 60.0, 51.0, 54.0, 46.0, 51.0, 50.0, 35.0, 41.0, 41.0, 31.0, 28.0, 27.0, 15.0, 11.0, 9.0, 11.0, 7.0, 6.0, 6.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.12548828125, -0.12221431732177734, -0.11894035339355469, -0.11566638946533203, -0.11239242553710938, -0.10911846160888672, -0.10584449768066406, -0.1025705337524414, -0.09929656982421875, -0.0960226058959961, -0.09274864196777344, -0.08947467803955078, -0.08620071411132812, -0.08292675018310547, -0.07965278625488281, -0.07637882232666016, -0.0731048583984375, -0.06983089447021484, -0.06655693054199219, -0.06328296661376953, -0.060009002685546875, -0.05673503875732422, -0.05346107482910156, -0.050187110900878906, -0.04691314697265625, -0.043639183044433594, -0.04036521911621094, -0.03709125518798828, -0.033817291259765625, -0.03054332733154297, -0.027269363403320312, -0.023995399475097656, -0.020721435546875, -0.017447471618652344, -0.014173507690429688, -0.010899543762207031, -0.007625579833984375, -0.004351615905761719, -0.0010776519775390625, 0.0021963119506835938, 0.00547027587890625, 0.008744239807128906, 0.012018203735351562, 0.015292167663574219, 0.018566131591796875, 0.02184009552001953, 0.025114059448242188, 0.028388023376464844, 0.0316619873046875, 0.034935951232910156, 0.03820991516113281, 0.04148387908935547, 0.044757843017578125, 0.04803180694580078, 0.05130577087402344, 0.054579734802246094, 0.05785369873046875, 0.061127662658691406, 0.06440162658691406, 0.06767559051513672, 0.07094955444335938, 0.07422351837158203, 0.07749748229980469, 0.08077144622802734, 0.08404541015625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 6.0, 2.0, 6.0, 7.0, 10.0, 23.0, 34.0, 36.0, 58.0, 107.0, 232.0, 599.0, 1925.0, 7515.0, 60736.0, 3198758.0, 888896.0, 29157.0, 4190.0, 1154.0, 395.0, 212.0, 98.0, 50.0, 21.0, 17.0, 12.0, 6.0, 4.0, 4.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6494140625, -0.6302337646484375, -0.611053466796875, -0.5918731689453125, -0.57269287109375, -0.5535125732421875, -0.534332275390625, -0.5151519775390625, -0.4959716796875, -0.4767913818359375, -0.457611083984375, -0.4384307861328125, -0.41925048828125, -0.4000701904296875, -0.380889892578125, -0.3617095947265625, -0.342529296875, -0.3233489990234375, -0.304168701171875, -0.2849884033203125, -0.26580810546875, -0.2466278076171875, -0.227447509765625, -0.2082672119140625, -0.1890869140625, -0.1699066162109375, -0.150726318359375, -0.1315460205078125, -0.11236572265625, -0.0931854248046875, -0.074005126953125, -0.0548248291015625, -0.03564453125, -0.0164642333984375, 0.002716064453125, 0.0218963623046875, 0.04107666015625, 0.0602569580078125, 0.079437255859375, 0.0986175537109375, 0.1177978515625, 0.1369781494140625, 0.156158447265625, 0.1753387451171875, 0.19451904296875, 0.2136993408203125, 0.232879638671875, 0.2520599365234375, 0.271240234375, 0.2904205322265625, 0.309600830078125, 0.3287811279296875, 0.34796142578125, 0.3671417236328125, 0.386322021484375, 0.4055023193359375, 0.4246826171875, 0.4438629150390625, 0.463043212890625, 0.4822235107421875, 0.50140380859375, 0.5205841064453125, 0.539764404296875, 0.5589447021484375, 0.578125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0, 4.0, 13.0, 10.0, 14.0, 21.0, 20.0, 34.0, 44.0, 72.0, 136.0, 227.0, 414.0, 740.0, 945.0, 565.0, 328.0, 175.0, 113.0, 66.0, 36.0, 29.0, 24.0, 10.0, 11.0, 5.0, 4.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5107421875, -0.4962615966796875, -0.481781005859375, -0.4673004150390625, -0.45281982421875, -0.4383392333984375, -0.423858642578125, -0.4093780517578125, -0.3948974609375, -0.3804168701171875, -0.365936279296875, -0.3514556884765625, -0.33697509765625, -0.3224945068359375, -0.308013916015625, -0.2935333251953125, -0.279052734375, -0.2645721435546875, -0.250091552734375, -0.2356109619140625, -0.22113037109375, -0.2066497802734375, -0.192169189453125, -0.1776885986328125, -0.1632080078125, -0.1487274169921875, -0.134246826171875, -0.1197662353515625, -0.10528564453125, -0.0908050537109375, -0.076324462890625, -0.0618438720703125, -0.04736328125, -0.0328826904296875, -0.018402099609375, -0.0039215087890625, 0.01055908203125, 0.0250396728515625, 0.039520263671875, 0.0540008544921875, 0.0684814453125, 0.0829620361328125, 0.097442626953125, 0.1119232177734375, 0.12640380859375, 0.1408843994140625, 0.155364990234375, 0.1698455810546875, 0.184326171875, 0.1988067626953125, 0.213287353515625, 0.2277679443359375, 0.24224853515625, 0.2567291259765625, 0.271209716796875, 0.2856903076171875, 0.3001708984375, 0.3146514892578125, 0.329132080078125, 0.3436126708984375, 0.35809326171875, 0.3725738525390625, 0.387054443359375, 0.4015350341796875, 0.416015625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 7.0, 13.0, 37.0, 107.0, 232.0, 289.0, 176.0, 70.0, 30.0, 10.0, 10.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.058704376220703, -7.8810529708862305, -7.703401565551758, -7.525750160217285, -7.348099231719971, -7.170447826385498, -6.992796421051025, -6.815145015716553, -6.63749361038208, -6.459842205047607, -6.282190799713135, -6.10453987121582, -5.926888465881348, -5.749237060546875, -5.571585655212402, -5.39393424987793, -5.216282844543457, -5.038631439208984, -4.860980033874512, -4.683328628540039, -4.505677700042725, -4.328026294708252, -4.150374889373779, -3.9727234840393066, -3.795072555541992, -3.6174211502075195, -3.439769983291626, -3.2621185779571533, -3.0844671726226807, -2.906816005706787, -2.7291646003723145, -2.551513195037842, -2.37386155128479, -2.1962101459503174, -2.018558979034424, -1.8409075736999512, -1.6632561683654785, -1.4856048822402954, -1.3079535961151123, -1.1303021907806396, -0.9526509046554565, -0.7749995589256287, -0.5973482131958008, -0.4196969270706177, -0.2420455813407898, -0.06439423561096191, 0.11325705051422119, 0.29090845584869385, 0.46855974197387695, 0.6462110877037048, 0.8238624334335327, 1.0015137195587158, 1.1791651248931885, 1.3568164110183716, 1.5344676971435547, 1.7121191024780273, 1.8897703886032104, 2.0674216747283936, 2.245073080062866, 2.4227242469787598, 2.6003756523132324, 2.778027057647705, 2.9556784629821777, 3.1333298683166504, 3.310981035232544]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 8.0, 5.0, 6.0, 7.0, 10.0, 12.0, 24.0, 20.0, 24.0, 30.0, 35.0, 45.0, 33.0, 46.0, 56.0, 46.0, 60.0, 53.0, 45.0, 48.0, 48.0, 46.0, 46.0, 27.0, 35.0, 35.0, 23.0, 24.0, 22.0, 15.0, 11.0, 8.0, 7.0, 7.0, 8.0, 8.0, 8.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5826128721237183, -1.526394009590149, -1.4701752662658691, -1.4139564037322998, -1.3577375411987305, -1.3015186786651611, -1.2452998161315918, -1.189081072807312, -1.1328622102737427, -1.0766433477401733, -1.0204246044158936, -0.9642057418823242, -0.9079868793487549, -0.8517680168151855, -0.795549213886261, -0.7393304109573364, -0.6831115484237671, -0.6268926858901978, -0.5706738829612732, -0.5144550800323486, -0.4582362174987793, -0.40201738476753235, -0.3457985520362854, -0.28957971930503845, -0.2333608865737915, -0.17714205384254456, -0.12092322111129761, -0.06470438838005066, -0.008485555648803711, 0.04773327708244324, 0.10395210981369019, 0.16017094254493713, 0.21638989448547363, 0.2726087272167206, 0.32882755994796753, 0.3850463926792145, 0.4412652254104614, 0.4974840581417084, 0.5537028908729553, 0.6099216938018799, 0.6661405563354492, 0.7223594188690186, 0.7785782217979431, 0.8347970247268677, 0.891015887260437, 0.9472347497940063, 1.0034534931182861, 1.0596723556518555, 1.1158912181854248, 1.1721100807189941, 1.2283289432525635, 1.2845476865768433, 1.3407665491104126, 1.396985411643982, 1.4532041549682617, 1.509423017501831, 1.5656418800354004, 1.6218607425689697, 1.678079605102539, 1.7342983484268188, 1.7905172109603882, 1.8467360734939575, 1.9029548168182373, 1.9591736793518066, 2.015392541885376]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 1.0, 5.0, 6.0, 9.0, 22.0, 24.0, 42.0, 60.0, 89.0, 149.0, 276.0, 527.0, 1095.0, 2432.0, 6101.0, 18156.0, 62252.0, 275952.0, 524386.0, 110204.0, 30323.0, 9815.0, 3525.0, 1483.0, 716.0, 382.0, 201.0, 105.0, 65.0, 46.0, 31.0, 14.0, 23.0, 13.0, 5.0, 3.0, 5.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.410888671875, -0.3985176086425781, -0.38614654541015625, -0.3737754821777344, -0.3614044189453125, -0.3490333557128906, -0.33666229248046875, -0.3242912292480469, -0.311920166015625, -0.2995491027832031, -0.28717803955078125, -0.2748069763183594, -0.2624359130859375, -0.2500648498535156, -0.23769378662109375, -0.22532272338867188, -0.21295166015625, -0.20058059692382812, -0.18820953369140625, -0.17583847045898438, -0.1634674072265625, -0.15109634399414062, -0.13872528076171875, -0.12635421752929688, -0.113983154296875, -0.10161209106445312, -0.08924102783203125, -0.07686996459960938, -0.0644989013671875, -0.052127838134765625, -0.03975677490234375, -0.027385711669921875, -0.0150146484375, -0.002643585205078125, 0.00972747802734375, 0.022098541259765625, 0.0344696044921875, 0.046840667724609375, 0.05921173095703125, 0.07158279418945312, 0.083953857421875, 0.09632492065429688, 0.10869598388671875, 0.12106704711914062, 0.1334381103515625, 0.14580917358398438, 0.15818023681640625, 0.17055130004882812, 0.18292236328125, 0.19529342651367188, 0.20766448974609375, 0.22003555297851562, 0.2324066162109375, 0.24477767944335938, 0.25714874267578125, 0.2695198059082031, 0.281890869140625, 0.2942619323730469, 0.30663299560546875, 0.3190040588378906, 0.3313751220703125, 0.3437461853027344, 0.35611724853515625, 0.3684883117675781, 0.380859375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 6.0, 5.0, 13.0, 16.0, 25.0, 29.0, 24.0, 43.0, 45.0, 61.0, 66.0, 61.0, 65.0, 78.0, 72.0, 71.0, 66.0, 64.0, 40.0, 43.0, 30.0, 24.0, 15.0, 11.0, 15.0, 9.0, 4.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.220458984375, -0.21550464630126953, -0.21055030822753906, -0.2055959701538086, -0.20064163208007812, -0.19568729400634766, -0.1907329559326172, -0.18577861785888672, -0.18082427978515625, -0.17586994171142578, -0.1709156036376953, -0.16596126556396484, -0.16100692749023438, -0.1560525894165039, -0.15109825134277344, -0.14614391326904297, -0.1411895751953125, -0.13623523712158203, -0.13128089904785156, -0.1263265609741211, -0.12137222290039062, -0.11641788482666016, -0.11146354675292969, -0.10650920867919922, -0.10155487060546875, -0.09660053253173828, -0.09164619445800781, -0.08669185638427734, -0.08173751831054688, -0.0767831802368164, -0.07182884216308594, -0.06687450408935547, -0.061920166015625, -0.05696582794189453, -0.05201148986816406, -0.047057151794433594, -0.042102813720703125, -0.037148475646972656, -0.03219413757324219, -0.02723979949951172, -0.02228546142578125, -0.01733112335205078, -0.012376785278320312, -0.007422447204589844, -0.002468109130859375, 0.0024862289428710938, 0.0074405670166015625, 0.012394905090332031, 0.0173492431640625, 0.02230358123779297, 0.027257919311523438, 0.032212257385253906, 0.037166595458984375, 0.042120933532714844, 0.04707527160644531, 0.05202960968017578, 0.05698394775390625, 0.06193828582763672, 0.06689262390136719, 0.07184696197509766, 0.07680130004882812, 0.0817556381225586, 0.08670997619628906, 0.09166431427001953, 0.09661865234375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 5.0, 6.0, 9.0, 16.0, 13.0, 25.0, 32.0, 48.0, 67.0, 118.0, 161.0, 242.0, 507.0, 808.0, 1895.0, 4916.0, 20416.0, 257622.0, 716152.0, 34111.0, 6485.0, 2352.0, 1053.0, 571.0, 298.0, 216.0, 126.0, 74.0, 48.0, 40.0, 30.0, 27.0, 19.0, 8.0, 8.0, 9.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.79541015625, -0.7681045532226562, -0.7407989501953125, -0.7134933471679688, -0.686187744140625, -0.6588821411132812, -0.6315765380859375, -0.6042709350585938, -0.57696533203125, -0.5496597290039062, -0.5223541259765625, -0.49504852294921875, -0.467742919921875, -0.44043731689453125, -0.4131317138671875, -0.38582611083984375, -0.3585205078125, -0.33121490478515625, -0.3039093017578125, -0.27660369873046875, -0.249298095703125, -0.22199249267578125, -0.1946868896484375, -0.16738128662109375, -0.14007568359375, -0.11277008056640625, -0.0854644775390625, -0.05815887451171875, -0.030853271484375, -0.00354766845703125, 0.0237579345703125, 0.05106353759765625, 0.078369140625, 0.10567474365234375, 0.1329803466796875, 0.16028594970703125, 0.187591552734375, 0.21489715576171875, 0.2422027587890625, 0.26950836181640625, 0.29681396484375, 0.32411956787109375, 0.3514251708984375, 0.37873077392578125, 0.406036376953125, 0.43334197998046875, 0.4606475830078125, 0.48795318603515625, 0.5152587890625, 0.5425643920898438, 0.5698699951171875, 0.5971755981445312, 0.624481201171875, 0.6517868041992188, 0.6790924072265625, 0.7063980102539062, 0.73370361328125, 0.7610092163085938, 0.7883148193359375, 0.8156204223632812, 0.842926025390625, 0.8702316284179688, 0.8975372314453125, 0.9248428344726562, 0.9521484375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 6.0, 2.0, 0.0, 1.0, 5.0, 5.0, 12.0, 12.0, 13.0, 13.0, 16.0, 24.0, 24.0, 41.0, 45.0, 54.0, 49.0, 52.0, 59.0, 51.0, 64.0, 61.0, 52.0, 59.0, 52.0, 33.0, 42.0, 24.0, 22.0, 23.0, 24.0, 15.0, 14.0, 10.0, 10.0, 8.0, 4.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59521484375, -0.5738677978515625, -0.552520751953125, -0.5311737060546875, -0.50982666015625, -0.4884796142578125, -0.467132568359375, -0.4457855224609375, -0.4244384765625, -0.4030914306640625, -0.381744384765625, -0.3603973388671875, -0.33905029296875, -0.3177032470703125, -0.296356201171875, -0.2750091552734375, -0.253662109375, -0.2323150634765625, -0.210968017578125, -0.1896209716796875, -0.16827392578125, -0.1469268798828125, -0.125579833984375, -0.1042327880859375, -0.0828857421875, -0.0615386962890625, -0.040191650390625, -0.0188446044921875, 0.00250244140625, 0.0238494873046875, 0.045196533203125, 0.0665435791015625, 0.087890625, 0.1092376708984375, 0.130584716796875, 0.1519317626953125, 0.17327880859375, 0.1946258544921875, 0.215972900390625, 0.2373199462890625, 0.2586669921875, 0.2800140380859375, 0.301361083984375, 0.3227081298828125, 0.34405517578125, 0.3654022216796875, 0.386749267578125, 0.4080963134765625, 0.429443359375, 0.4507904052734375, 0.472137451171875, 0.4934844970703125, 0.51483154296875, 0.5361785888671875, 0.557525634765625, 0.5788726806640625, 0.6002197265625, 0.6215667724609375, 0.642913818359375, 0.6642608642578125, 0.68560791015625, 0.7069549560546875, 0.728302001953125, 0.7496490478515625, 0.77099609375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 7.0, 9.0, 6.0, 9.0, 13.0, 27.0, 26.0, 52.0, 93.0, 165.0, 362.0, 761.0, 2161.0, 8187.0, 56754.0, 822912.0, 137607.0, 14139.0, 3206.0, 1117.0, 416.0, 224.0, 105.0, 80.0, 30.0, 22.0, 14.0, 18.0, 5.0, 5.0, 9.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.33935546875, -0.3286399841308594, -0.31792449951171875, -0.3072090148925781, -0.2964935302734375, -0.2857780456542969, -0.27506256103515625, -0.2643470764160156, -0.253631591796875, -0.24291610717773438, -0.23220062255859375, -0.22148513793945312, -0.2107696533203125, -0.20005416870117188, -0.18933868408203125, -0.17862319946289062, -0.16790771484375, -0.15719223022460938, -0.14647674560546875, -0.13576126098632812, -0.1250457763671875, -0.11433029174804688, -0.10361480712890625, -0.09289932250976562, -0.082183837890625, -0.07146835327148438, -0.06075286865234375, -0.050037384033203125, -0.0393218994140625, -0.028606414794921875, -0.01789093017578125, -0.007175445556640625, 0.0035400390625, 0.014255523681640625, 0.02497100830078125, 0.035686492919921875, 0.0464019775390625, 0.057117462158203125, 0.06783294677734375, 0.07854843139648438, 0.089263916015625, 0.09997940063476562, 0.11069488525390625, 0.12141036987304688, 0.1321258544921875, 0.14284133911132812, 0.15355682373046875, 0.16427230834960938, 0.17498779296875, 0.18570327758789062, 0.19641876220703125, 0.20713424682617188, 0.2178497314453125, 0.22856521606445312, 0.23928070068359375, 0.24999618530273438, 0.260711669921875, 0.2714271545410156, 0.28214263916015625, 0.2928581237792969, 0.3035736083984375, 0.3142890930175781, 0.32500457763671875, 0.3357200622558594, 0.346435546875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 7.0, 7.0, 8.0, 4.0, 14.0, 15.0, 11.0, 18.0, 13.0, 26.0, 37.0, 31.0, 55.0, 69.0, 78.0, 83.0, 86.0, 71.0, 52.0, 50.0, 49.0, 41.0, 16.0, 22.0, 15.0, 22.0, 13.0, 15.0, 7.0, 13.0, 5.0, 3.0, 8.0, 4.0, 4.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.918741226196289e-05, -5.7208351790905e-05, -5.522929131984711e-05, -5.3250230848789215e-05, -5.127117037773132e-05, -4.929210990667343e-05, -4.731304943561554e-05, -4.533398896455765e-05, -4.3354928493499756e-05, -4.1375868022441864e-05, -3.939680755138397e-05, -3.741774708032608e-05, -3.543868660926819e-05, -3.34596261382103e-05, -3.1480565667152405e-05, -2.9501505196094513e-05, -2.752244472503662e-05, -2.554338425397873e-05, -2.3564323782920837e-05, -2.1585263311862946e-05, -1.9606202840805054e-05, -1.7627142369747162e-05, -1.564808189868927e-05, -1.3669021427631378e-05, -1.1689960956573486e-05, -9.710900485515594e-06, -7.731840014457703e-06, -5.752779543399811e-06, -3.773719072341919e-06, -1.794658601284027e-06, 1.8440186977386475e-07, 2.1634623408317566e-06, 4.1425228118896484e-06, 6.12158328294754e-06, 8.100643754005432e-06, 1.0079704225063324e-05, 1.2058764696121216e-05, 1.4037825167179108e-05, 1.6016885638237e-05, 1.799594610929489e-05, 1.9975006580352783e-05, 2.1954067051410675e-05, 2.3933127522468567e-05, 2.591218799352646e-05, 2.789124846458435e-05, 2.9870308935642242e-05, 3.1849369406700134e-05, 3.3828429877758026e-05, 3.580749034881592e-05, 3.778655081987381e-05, 3.97656112909317e-05, 4.1744671761989594e-05, 4.3723732233047485e-05, 4.570279270410538e-05, 4.768185317516327e-05, 4.966091364622116e-05, 5.163997411727905e-05, 5.3619034588336945e-05, 5.5598095059394836e-05, 5.757715553045273e-05, 5.955621600151062e-05, 6.153527647256851e-05, 6.35143369436264e-05, 6.54933974146843e-05, 6.747245788574219e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 4.0, 3.0, 6.0, 12.0, 11.0, 15.0, 20.0, 21.0, 30.0, 46.0, 70.0, 64.0, 113.0, 199.0, 290.0, 476.0, 923.0, 1918.0, 4949.0, 17082.0, 119538.0, 802694.0, 78714.0, 13373.0, 4128.0, 1720.0, 842.0, 461.0, 279.0, 172.0, 104.0, 80.0, 45.0, 43.0, 29.0, 23.0, 15.0, 19.0, 7.0, 7.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.297119140625, -0.2882270812988281, -0.27933502197265625, -0.2704429626464844, -0.2615509033203125, -0.2526588439941406, -0.24376678466796875, -0.23487472534179688, -0.225982666015625, -0.21709060668945312, -0.20819854736328125, -0.19930648803710938, -0.1904144287109375, -0.18152236938476562, -0.17263031005859375, -0.16373825073242188, -0.15484619140625, -0.14595413208007812, -0.13706207275390625, -0.12817001342773438, -0.1192779541015625, -0.11038589477539062, -0.10149383544921875, -0.09260177612304688, -0.083709716796875, -0.07481765747070312, -0.06592559814453125, -0.057033538818359375, -0.0481414794921875, -0.039249420166015625, -0.03035736083984375, -0.021465301513671875, -0.0125732421875, -0.003681182861328125, 0.00521087646484375, 0.014102935791015625, 0.0229949951171875, 0.031887054443359375, 0.04077911376953125, 0.049671173095703125, 0.058563232421875, 0.06745529174804688, 0.07634735107421875, 0.08523941040039062, 0.0941314697265625, 0.10302352905273438, 0.11191558837890625, 0.12080764770507812, 0.12969970703125, 0.13859176635742188, 0.14748382568359375, 0.15637588500976562, 0.1652679443359375, 0.17416000366210938, 0.18305206298828125, 0.19194412231445312, 0.200836181640625, 0.20972824096679688, 0.21862030029296875, 0.22751235961914062, 0.2364044189453125, 0.24529647827148438, 0.25418853759765625, 0.2630805969238281, 0.27197265625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 0.0, 3.0, 5.0, 3.0, 5.0, 6.0, 9.0, 12.0, 6.0, 24.0, 15.0, 32.0, 34.0, 36.0, 61.0, 88.0, 110.0, 132.0, 103.0, 78.0, 63.0, 32.0, 35.0, 18.0, 22.0, 13.0, 14.0, 8.0, 9.0, 8.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.31298828125, -0.30504417419433594, -0.2971000671386719, -0.2891559600830078, -0.28121185302734375, -0.2732677459716797, -0.2653236389160156, -0.25737953186035156, -0.2494354248046875, -0.24149131774902344, -0.23354721069335938, -0.2256031036376953, -0.21765899658203125, -0.2097148895263672, -0.20177078247070312, -0.19382667541503906, -0.185882568359375, -0.17793846130371094, -0.16999435424804688, -0.1620502471923828, -0.15410614013671875, -0.1461620330810547, -0.13821792602539062, -0.13027381896972656, -0.1223297119140625, -0.11438560485839844, -0.10644149780273438, -0.09849739074707031, -0.09055328369140625, -0.08260917663574219, -0.07466506958007812, -0.06672096252441406, -0.05877685546875, -0.05083274841308594, -0.042888641357421875, -0.03494453430175781, -0.02700042724609375, -0.019056320190429688, -0.011112213134765625, -0.0031681060791015625, 0.0047760009765625, 0.012720108032226562, 0.020664215087890625, 0.028608322143554688, 0.03655242919921875, 0.04449653625488281, 0.052440643310546875, 0.06038475036621094, 0.068328857421875, 0.07627296447753906, 0.08421707153320312, 0.09216117858886719, 0.10010528564453125, 0.10804939270019531, 0.11599349975585938, 0.12393760681152344, 0.1318817138671875, 0.13982582092285156, 0.14776992797851562, 0.1557140350341797, 0.16365814208984375, 0.1716022491455078, 0.17954635620117188, 0.18749046325683594, 0.1954345703125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 5.0, 7.0, 10.0, 20.0, 40.0, 94.0, 118.0, 265.0, 219.0, 113.0, 51.0, 22.0, 12.0, 9.0, 8.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.828040599822998, -7.657020092010498, -7.485999584197998, -7.31497859954834, -7.14395809173584, -6.97293758392334, -6.80191707611084, -6.63089656829834, -6.459875583648682, -6.288855075836182, -6.117834568023682, -5.946813583374023, -5.775793075561523, -5.604772567749023, -5.433752059936523, -5.262731552124023, -5.091711044311523, -4.920690536499023, -4.749670028686523, -4.578649044036865, -4.407628536224365, -4.236608028411865, -4.065587520599365, -3.894566774368286, -3.723546028137207, -3.552525520324707, -3.381504774093628, -3.210484266281128, -3.039463520050049, -2.868443012237549, -2.697422504425049, -2.5264017581939697, -2.3553812503814697, -2.1843607425689697, -2.0133399963378906, -1.8423194885253906, -1.6712987422943115, -1.5002782344818115, -1.329257607460022, -1.1582369804382324, -0.9872163534164429, -0.8161957263946533, -0.6451750993728638, -0.474154531955719, -0.30313390493392944, -0.1321132779121399, 0.03890728950500488, 0.20992791652679443, 0.380948543548584, 0.5519691705703735, 0.7229897975921631, 0.8940103650093079, 1.0650310516357422, 1.2360515594482422, 1.4070721864700317, 1.5780928134918213, 1.7491134405136108, 1.9201340675354004, 2.0911545753479004, 2.2621753215789795, 2.4331958293914795, 2.6042165756225586, 2.7752370834350586, 2.9462575912475586, 3.1172783374786377]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 10.0, 9.0, 11.0, 4.0, 17.0, 20.0, 18.0, 22.0, 30.0, 14.0, 29.0, 27.0, 39.0, 49.0, 38.0, 55.0, 56.0, 63.0, 63.0, 47.0, 39.0, 31.0, 43.0, 38.0, 35.0, 30.0, 21.0, 10.0, 22.0, 19.0, 14.0, 17.0, 12.0, 8.0, 6.0, 9.0, 6.0, 8.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9805541038513184, -1.9171664714813232, -1.8537788391113281, -1.790391206741333, -1.727003574371338, -1.6636159420013428, -1.6002283096313477, -1.5368406772613525, -1.4734530448913574, -1.4100654125213623, -1.3466777801513672, -1.283290147781372, -1.219902515411377, -1.1565148830413818, -1.0931272506713867, -1.0297396183013916, -0.9663518667221069, -0.9029642343521118, -0.8395766019821167, -0.7761889696121216, -0.7128013372421265, -0.6494137048721313, -0.5860260128974915, -0.5226383805274963, -0.4592507481575012, -0.3958631157875061, -0.332475483417511, -0.2690878212451935, -0.20570018887519836, -0.14231255650520325, -0.07892489433288574, -0.015537261962890625, 0.04785037040710449, 0.1112380102276802, 0.17462565004825592, 0.23801329731941223, 0.30140092968940735, 0.36478856205940247, 0.42817622423171997, 0.4915638566017151, 0.5549514889717102, 0.6183391213417053, 0.6817267537117004, 0.7451144456863403, 0.8085020780563354, 0.8718897104263306, 0.9352773427963257, 0.9986649751663208, 1.062052607536316, 1.125440239906311, 1.1888278722763062, 1.2522155046463013, 1.3156031370162964, 1.3789907693862915, 1.4423785209655762, 1.5057661533355713, 1.5691537857055664, 1.6325414180755615, 1.6959290504455566, 1.7593166828155518, 1.8227043151855469, 1.886091947555542, 1.949479579925537, 2.0128672122955322, 2.0762548446655273]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 15.0, 10.0, 19.0, 36.0, 42.0, 75.0, 120.0, 198.0, 392.0, 959.0, 2637.0, 9493.0, 60729.0, 1850641.0, 2187278.0, 66735.0, 10159.0, 2824.0, 953.0, 413.0, 227.0, 128.0, 55.0, 43.0, 31.0, 27.0, 11.0, 10.0, 9.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.4873046875, -0.47542572021484375, -0.4635467529296875, -0.45166778564453125, -0.439788818359375, -0.42790985107421875, -0.4160308837890625, -0.40415191650390625, -0.39227294921875, -0.38039398193359375, -0.3685150146484375, -0.35663604736328125, -0.344757080078125, -0.33287811279296875, -0.3209991455078125, -0.30912017822265625, -0.2972412109375, -0.28536224365234375, -0.2734832763671875, -0.26160430908203125, -0.249725341796875, -0.23784637451171875, -0.2259674072265625, -0.21408843994140625, -0.20220947265625, -0.19033050537109375, -0.1784515380859375, -0.16657257080078125, -0.154693603515625, -0.14281463623046875, -0.1309356689453125, -0.11905670166015625, -0.107177734375, -0.09529876708984375, -0.0834197998046875, -0.07154083251953125, -0.059661865234375, -0.04778289794921875, -0.0359039306640625, -0.02402496337890625, -0.01214599609375, -0.00026702880859375, 0.0116119384765625, 0.02349090576171875, 0.035369873046875, 0.04724884033203125, 0.0591278076171875, 0.07100677490234375, 0.0828857421875, 0.09476470947265625, 0.1066436767578125, 0.11852264404296875, 0.130401611328125, 0.14228057861328125, 0.1541595458984375, 0.16603851318359375, 0.17791748046875, 0.18979644775390625, 0.2016754150390625, 0.21355438232421875, 0.225433349609375, 0.23731231689453125, 0.2491912841796875, 0.26107025146484375, 0.27294921875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 9.0, 12.0, 17.0, 30.0, 52.0, 77.0, 97.0, 112.0, 109.0, 116.0, 117.0, 87.0, 58.0, 45.0, 24.0, 28.0, 8.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1944580078125, -0.18630409240722656, -0.17815017700195312, -0.1699962615966797, -0.16184234619140625, -0.1536884307861328, -0.14553451538085938, -0.13738059997558594, -0.1292266845703125, -0.12107276916503906, -0.11291885375976562, -0.10476493835449219, -0.09661102294921875, -0.08845710754394531, -0.08030319213867188, -0.07214927673339844, -0.063995361328125, -0.05584144592285156, -0.047687530517578125, -0.03953361511230469, -0.03137969970703125, -0.023225784301757812, -0.015071868896484375, -0.0069179534912109375, 0.0012359619140625, 0.009389877319335938, 0.017543792724609375, 0.025697708129882812, 0.03385162353515625, 0.04200553894042969, 0.050159454345703125, 0.05831336975097656, 0.06646728515625, 0.07462120056152344, 0.08277511596679688, 0.09092903137207031, 0.09908294677734375, 0.10723686218261719, 0.11539077758789062, 0.12354469299316406, 0.1316986083984375, 0.13985252380371094, 0.14800643920898438, 0.1561603546142578, 0.16431427001953125, 0.1724681854248047, 0.18062210083007812, 0.18877601623535156, 0.196929931640625, 0.20508384704589844, 0.21323776245117188, 0.2213916778564453, 0.22954559326171875, 0.2376995086669922, 0.24585342407226562, 0.25400733947753906, 0.2621612548828125, 0.27031517028808594, 0.2784690856933594, 0.2866230010986328, 0.29477691650390625, 0.3029308319091797, 0.3110847473144531, 0.31923866271972656, 0.327392578125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 8.0, 19.0, 29.0, 46.0, 87.0, 194.0, 438.0, 1286.0, 4665.0, 29877.0, 559283.0, 3473291.0, 107445.0, 12673.0, 2973.0, 1062.0, 425.0, 232.0, 106.0, 55.0, 34.0, 19.0, 10.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.482666015625, -0.4642829895019531, -0.44589996337890625, -0.4275169372558594, -0.4091339111328125, -0.3907508850097656, -0.37236785888671875, -0.3539848327636719, -0.335601806640625, -0.3172187805175781, -0.29883575439453125, -0.2804527282714844, -0.2620697021484375, -0.24368667602539062, -0.22530364990234375, -0.20692062377929688, -0.18853759765625, -0.17015457153320312, -0.15177154541015625, -0.13338851928710938, -0.1150054931640625, -0.09662246704101562, -0.07823944091796875, -0.059856414794921875, -0.041473388671875, -0.023090362548828125, -0.00470733642578125, 0.013675689697265625, 0.0320587158203125, 0.050441741943359375, 0.06882476806640625, 0.08720779418945312, 0.1055908203125, 0.12397384643554688, 0.14235687255859375, 0.16073989868164062, 0.1791229248046875, 0.19750595092773438, 0.21588897705078125, 0.23427200317382812, 0.252655029296875, 0.2710380554199219, 0.28942108154296875, 0.3078041076660156, 0.3261871337890625, 0.3445701599121094, 0.36295318603515625, 0.3813362121582031, 0.39971923828125, 0.4181022644042969, 0.43648529052734375, 0.4548683166503906, 0.4732513427734375, 0.4916343688964844, 0.5100173950195312, 0.5284004211425781, 0.546783447265625, 0.5651664733886719, 0.5835494995117188, 0.6019325256347656, 0.6203155517578125, 0.6386985778808594, 0.6570816040039062, 0.6754646301269531, 0.69384765625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 7.0, 8.0, 11.0, 24.0, 27.0, 38.0, 70.0, 97.0, 167.0, 278.0, 527.0, 805.0, 792.0, 506.0, 265.0, 141.0, 83.0, 65.0, 47.0, 33.0, 16.0, 21.0, 16.0, 10.0, 10.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.302734375, -0.288330078125, -0.27392578125, -0.259521484375, -0.2451171875, -0.230712890625, -0.21630859375, -0.201904296875, -0.1875, -0.173095703125, -0.15869140625, -0.144287109375, -0.1298828125, -0.115478515625, -0.10107421875, -0.086669921875, -0.072265625, -0.057861328125, -0.04345703125, -0.029052734375, -0.0146484375, -0.000244140625, 0.01416015625, 0.028564453125, 0.04296875, 0.057373046875, 0.07177734375, 0.086181640625, 0.1005859375, 0.114990234375, 0.12939453125, 0.143798828125, 0.158203125, 0.172607421875, 0.18701171875, 0.201416015625, 0.2158203125, 0.230224609375, 0.24462890625, 0.259033203125, 0.2734375, 0.287841796875, 0.30224609375, 0.316650390625, 0.3310546875, 0.345458984375, 0.35986328125, 0.374267578125, 0.388671875, 0.403076171875, 0.41748046875, 0.431884765625, 0.4462890625, 0.460693359375, 0.47509765625, 0.489501953125, 0.50390625, 0.518310546875, 0.53271484375, 0.547119140625, 0.5615234375, 0.575927734375, 0.59033203125, 0.604736328125, 0.619140625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 11.0, 34.0, 91.0, 202.0, 301.0, 219.0, 92.0, 27.0, 14.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.331094741821289, -3.1280770301818848, -2.9250595569610596, -2.7220420837402344, -2.51902437210083, -2.316006660461426, -2.1129891872406006, -1.9099715948104858, -1.706954002380371, -1.5039364099502563, -1.3009188175201416, -1.0979012250900269, -0.8948836326599121, -0.6918660402297974, -0.4888484477996826, -0.28583085536956787, -0.08281326293945312, 0.12020432949066162, 0.32322192192077637, 0.5262395143508911, 0.7292571067810059, 0.9322746992111206, 1.1352922916412354, 1.33830988407135, 1.5413274765014648, 1.7443450689315796, 1.9473626613616943, 2.1503801345825195, 2.353397846221924, 2.556415557861328, 2.7594330310821533, 2.9624505043029785, 3.165468215942383, 3.368485927581787, 3.5715034008026123, 3.7745208740234375, 3.977538585662842, 4.180556297302246, 4.383573532104492, 4.5865912437438965, 4.789608955383301, 4.992626667022705, 5.195644378662109, 5.3986616134643555, 5.60167932510376, 5.804697036743164, 6.00771427154541, 6.2107319831848145, 6.413749694824219, 6.616767406463623, 6.819785118103027, 7.022802352905273, 7.225820064544678, 7.428837776184082, 7.631855010986328, 7.834872722625732, 8.037890434265137, 8.240907669067383, 8.443925857543945, 8.646943092346191, 8.849960327148438, 9.052978515625, 9.255995750427246, 9.459013938903809, 9.662031173706055]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 6.0, 5.0, 9.0, 9.0, 9.0, 16.0, 16.0, 26.0, 22.0, 29.0, 36.0, 36.0, 41.0, 43.0, 50.0, 40.0, 54.0, 49.0, 58.0, 50.0, 33.0, 51.0, 57.0, 39.0, 38.0, 38.0, 26.0, 24.0, 24.0, 14.0, 16.0, 9.0, 12.0, 10.0, 2.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.272352457046509, -2.2094199657440186, -2.1464877128601074, -2.083555221557617, -2.020622730255127, -1.9576903581619263, -1.8947579860687256, -1.8318254947662354, -1.7688931226730347, -1.705960750579834, -1.6430282592773438, -1.580095887184143, -1.5171635150909424, -1.4542310237884521, -1.3912986516952515, -1.3283662796020508, -1.2654337882995605, -1.2025014162063599, -1.1395689249038696, -1.076636552810669, -1.0137040615081787, -0.950771689414978, -0.8878393173217773, -0.8249068856239319, -0.7619744539260864, -0.699042022228241, -0.6361095905303955, -0.5731772184371948, -0.5102447867393494, -0.4473123550415039, -0.38437995314598083, -0.32144755125045776, -0.25851523876190186, -0.1955828219652176, -0.13265040516853333, -0.06971798837184906, -0.006785571575164795, 0.056146860122680664, 0.11907926201820374, 0.1820116639137268, 0.24494409561157227, 0.3078765273094177, 0.3708089292049408, 0.43374133110046387, 0.4966737627983093, 0.5596061944961548, 0.6225385665893555, 0.6854709982872009, 0.7484034299850464, 0.8113358616828918, 0.8742682933807373, 0.937200665473938, 1.0001330375671387, 1.063065528869629, 1.1259979009628296, 1.1889302730560303, 1.2518627643585205, 1.3147951364517212, 1.3777276277542114, 1.440659999847412, 1.5035924911499023, 1.566524863243103, 1.6294572353363037, 1.692389726638794, 1.7553220987319946]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 2.0, 5.0, 8.0, 9.0, 11.0, 27.0, 51.0, 78.0, 138.0, 316.0, 685.0, 1773.0, 5309.0, 20615.0, 131407.0, 732026.0, 127937.0, 20033.0, 5058.0, 1669.0, 683.0, 350.0, 169.0, 82.0, 37.0, 26.0, 11.0, 4.0, 6.0, 9.0, 2.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.62451171875, -0.6082878112792969, -0.5920639038085938, -0.5758399963378906, -0.5596160888671875, -0.5433921813964844, -0.5271682739257812, -0.5109443664550781, -0.494720458984375, -0.4784965515136719, -0.46227264404296875, -0.4460487365722656, -0.4298248291015625, -0.4136009216308594, -0.39737701416015625, -0.3811531066894531, -0.36492919921875, -0.3487052917480469, -0.33248138427734375, -0.3162574768066406, -0.3000335693359375, -0.2838096618652344, -0.26758575439453125, -0.2513618469238281, -0.235137939453125, -0.21891403198242188, -0.20269012451171875, -0.18646621704101562, -0.1702423095703125, -0.15401840209960938, -0.13779449462890625, -0.12157058715820312, -0.1053466796875, -0.08912277221679688, -0.07289886474609375, -0.056674957275390625, -0.0404510498046875, -0.024227142333984375, -0.00800323486328125, 0.008220672607421875, 0.024444580078125, 0.040668487548828125, 0.05689239501953125, 0.07311630249023438, 0.0893402099609375, 0.10556411743164062, 0.12178802490234375, 0.13801193237304688, 0.15423583984375, 0.17045974731445312, 0.18668365478515625, 0.20290756225585938, 0.2191314697265625, 0.23535537719726562, 0.25157928466796875, 0.2678031921386719, 0.284027099609375, 0.3002510070800781, 0.31647491455078125, 0.3326988220214844, 0.3489227294921875, 0.3651466369628906, 0.38137054443359375, 0.3975944519042969, 0.413818359375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 10.0, 12.0, 13.0, 19.0, 28.0, 31.0, 40.0, 42.0, 73.0, 67.0, 77.0, 67.0, 62.0, 73.0, 73.0, 66.0, 52.0, 46.0, 43.0, 21.0, 32.0, 25.0, 14.0, 10.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2353515625, -0.22939109802246094, -0.22343063354492188, -0.2174701690673828, -0.21150970458984375, -0.2055492401123047, -0.19958877563476562, -0.19362831115722656, -0.1876678466796875, -0.18170738220214844, -0.17574691772460938, -0.1697864532470703, -0.16382598876953125, -0.1578655242919922, -0.15190505981445312, -0.14594459533691406, -0.139984130859375, -0.13402366638183594, -0.12806320190429688, -0.12210273742675781, -0.11614227294921875, -0.11018180847167969, -0.10422134399414062, -0.09826087951660156, -0.0923004150390625, -0.08633995056152344, -0.08037948608398438, -0.07441902160644531, -0.06845855712890625, -0.06249809265136719, -0.056537628173828125, -0.05057716369628906, -0.04461669921875, -0.03865623474121094, -0.032695770263671875, -0.026735305786132812, -0.02077484130859375, -0.014814376831054688, -0.008853912353515625, -0.0028934478759765625, 0.0030670166015625, 0.009027481079101562, 0.014987945556640625, 0.020948410034179688, 0.02690887451171875, 0.03286933898925781, 0.038829803466796875, 0.04479026794433594, 0.050750732421875, 0.05671119689941406, 0.06267166137695312, 0.06863212585449219, 0.07459259033203125, 0.08055305480957031, 0.08651351928710938, 0.09247398376464844, 0.0984344482421875, 0.10439491271972656, 0.11035537719726562, 0.11631584167480469, 0.12227630615234375, 0.1282367706298828, 0.13419723510742188, 0.14015769958496094, 0.1461181640625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 5.0, 0.0, 3.0, 5.0, 5.0, 3.0, 2.0, 2.0, 5.0, 5.0, 4.0, 15.0, 18.0, 18.0, 32.0, 27.0, 37.0, 52.0, 64.0, 116.0, 189.0, 255.0, 379.0, 672.0, 1565.0, 3732.0, 13771.0, 87790.0, 808146.0, 108704.0, 15170.0, 4129.0, 1670.0, 731.0, 400.0, 253.0, 178.0, 113.0, 84.0, 50.0, 44.0, 28.0, 28.0, 9.0, 11.0, 11.0, 11.0, 8.0, 3.0, 3.0, 2.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5927734375, -0.5727081298828125, -0.552642822265625, -0.5325775146484375, -0.51251220703125, -0.4924468994140625, -0.472381591796875, -0.4523162841796875, -0.4322509765625, -0.4121856689453125, -0.392120361328125, -0.3720550537109375, -0.35198974609375, -0.3319244384765625, -0.311859130859375, -0.2917938232421875, -0.271728515625, -0.2516632080078125, -0.231597900390625, -0.2115325927734375, -0.19146728515625, -0.1714019775390625, -0.151336669921875, -0.1312713623046875, -0.1112060546875, -0.0911407470703125, -0.071075439453125, -0.0510101318359375, -0.03094482421875, -0.0108795166015625, 0.009185791015625, 0.0292510986328125, 0.04931640625, 0.0693817138671875, 0.089447021484375, 0.1095123291015625, 0.12957763671875, 0.1496429443359375, 0.169708251953125, 0.1897735595703125, 0.2098388671875, 0.2299041748046875, 0.249969482421875, 0.2700347900390625, 0.29010009765625, 0.3101654052734375, 0.330230712890625, 0.3502960205078125, 0.370361328125, 0.3904266357421875, 0.410491943359375, 0.4305572509765625, 0.45062255859375, 0.4706878662109375, 0.490753173828125, 0.5108184814453125, 0.5308837890625, 0.5509490966796875, 0.571014404296875, 0.5910797119140625, 0.61114501953125, 0.6312103271484375, 0.651275634765625, 0.6713409423828125, 0.69140625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 2.0, 11.0, 5.0, 18.0, 12.0, 13.0, 25.0, 33.0, 35.0, 43.0, 48.0, 39.0, 43.0, 42.0, 68.0, 63.0, 73.0, 58.0, 61.0, 55.0, 50.0, 37.0, 33.0, 32.0, 22.0, 16.0, 16.0, 9.0, 15.0, 3.0, 6.0, 3.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69482421875, -0.6731796264648438, -0.6515350341796875, -0.6298904418945312, -0.608245849609375, -0.5866012573242188, -0.5649566650390625, -0.5433120727539062, -0.52166748046875, -0.5000228881835938, -0.4783782958984375, -0.45673370361328125, -0.435089111328125, -0.41344451904296875, -0.3917999267578125, -0.37015533447265625, -0.3485107421875, -0.32686614990234375, -0.3052215576171875, -0.28357696533203125, -0.261932373046875, -0.24028778076171875, -0.2186431884765625, -0.19699859619140625, -0.17535400390625, -0.15370941162109375, -0.1320648193359375, -0.11042022705078125, -0.088775634765625, -0.06713104248046875, -0.0454864501953125, -0.02384185791015625, -0.002197265625, 0.01944732666015625, 0.0410919189453125, 0.06273651123046875, 0.084381103515625, 0.10602569580078125, 0.1276702880859375, 0.14931488037109375, 0.17095947265625, 0.19260406494140625, 0.2142486572265625, 0.23589324951171875, 0.257537841796875, 0.27918243408203125, 0.3008270263671875, 0.32247161865234375, 0.3441162109375, 0.36576080322265625, 0.3874053955078125, 0.40904998779296875, 0.430694580078125, 0.45233917236328125, 0.4739837646484375, 0.49562835693359375, 0.51727294921875, 0.5389175415039062, 0.5605621337890625, 0.5822067260742188, 0.603851318359375, 0.6254959106445312, 0.6471405029296875, 0.6687850952148438, 0.6904296875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 7.0, 10.0, 15.0, 21.0, 31.0, 49.0, 71.0, 109.0, 193.0, 390.0, 1061.0, 4083.0, 25770.0, 720859.0, 274718.0, 16427.0, 3082.0, 877.0, 321.0, 147.0, 92.0, 63.0, 42.0, 32.0, 18.0, 14.0, 14.0, 7.0, 10.0, 3.0, 3.0, 4.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.331787109375, -0.32030487060546875, -0.3088226318359375, -0.29734039306640625, -0.285858154296875, -0.27437591552734375, -0.2628936767578125, -0.25141143798828125, -0.23992919921875, -0.22844696044921875, -0.2169647216796875, -0.20548248291015625, -0.194000244140625, -0.18251800537109375, -0.1710357666015625, -0.15955352783203125, -0.1480712890625, -0.13658905029296875, -0.1251068115234375, -0.11362457275390625, -0.102142333984375, -0.09066009521484375, -0.0791778564453125, -0.06769561767578125, -0.05621337890625, -0.04473114013671875, -0.0332489013671875, -0.02176666259765625, -0.010284423828125, 0.00119781494140625, 0.0126800537109375, 0.02416229248046875, 0.03564453125, 0.04712677001953125, 0.0586090087890625, 0.07009124755859375, 0.081573486328125, 0.09305572509765625, 0.1045379638671875, 0.11602020263671875, 0.12750244140625, 0.13898468017578125, 0.1504669189453125, 0.16194915771484375, 0.173431396484375, 0.18491363525390625, 0.1963958740234375, 0.20787811279296875, 0.2193603515625, 0.23084259033203125, 0.2423248291015625, 0.25380706787109375, 0.265289306640625, 0.27677154541015625, 0.2882537841796875, 0.29973602294921875, 0.31121826171875, 0.32270050048828125, 0.3341827392578125, 0.34566497802734375, 0.357147216796875, 0.36862945556640625, 0.3801116943359375, 0.39159393310546875, 0.403076171875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 8.0, 1.0, 11.0, 13.0, 18.0, 41.0, 53.0, 83.0, 126.0, 184.0, 157.0, 125.0, 61.0, 36.0, 30.0, 16.0, 7.0, 10.0, 7.0, 3.0, 5.0, 1.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001461505889892578, -0.00014247652143239975, -0.0001388024538755417, -0.00013512838631868362, -0.00013145431876182556, -0.0001277802512049675, -0.00012410618364810944, -0.00012043211609125137, -0.00011675804853439331, -0.00011308398097753525, -0.00010940991342067719, -0.00010573584586381912, -0.00010206177830696106, -9.8387710750103e-05, -9.471364319324493e-05, -9.103957563638687e-05, -8.736550807952881e-05, -8.369144052267075e-05, -8.001737296581268e-05, -7.634330540895462e-05, -7.266923785209656e-05, -6.89951702952385e-05, -6.532110273838043e-05, -6.164703518152237e-05, -5.797296762466431e-05, -5.4298900067806244e-05, -5.062483251094818e-05, -4.695076495409012e-05, -4.3276697397232056e-05, -3.960262984037399e-05, -3.592856228351593e-05, -3.225449472665787e-05, -2.8580427169799805e-05, -2.4906359612941742e-05, -2.123229205608368e-05, -1.7558224499225616e-05, -1.3884156942367554e-05, -1.0210089385509491e-05, -6.536021828651428e-06, -2.8619542717933655e-06, 8.121132850646973e-07, 4.48618084192276e-06, 8.160248398780823e-06, 1.1834315955638885e-05, 1.5508383512496948e-05, 1.918245106935501e-05, 2.2856518626213074e-05, 2.6530586183071136e-05, 3.02046537399292e-05, 3.387872129678726e-05, 3.7552788853645325e-05, 4.122685641050339e-05, 4.490092396736145e-05, 4.857499152421951e-05, 5.2249059081077576e-05, 5.592312663793564e-05, 5.95971941947937e-05, 6.327126175165176e-05, 6.694532930850983e-05, 7.061939686536789e-05, 7.429346442222595e-05, 7.796753197908401e-05, 8.164159953594208e-05, 8.531566709280014e-05, 8.89897346496582e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 1.0, 3.0, 6.0, 6.0, 10.0, 12.0, 14.0, 22.0, 40.0, 48.0, 63.0, 93.0, 172.0, 294.0, 636.0, 1376.0, 3566.0, 11951.0, 92515.0, 841805.0, 78749.0, 11142.0, 3340.0, 1291.0, 569.0, 294.0, 185.0, 103.0, 76.0, 50.0, 31.0, 16.0, 18.0, 12.0, 10.0, 10.0, 6.0, 2.0, 5.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.330322265625, -0.32073974609375, -0.3111572265625, -0.30157470703125, -0.2919921875, -0.28240966796875, -0.2728271484375, -0.26324462890625, -0.253662109375, -0.24407958984375, -0.2344970703125, -0.22491455078125, -0.21533203125, -0.20574951171875, -0.1961669921875, -0.18658447265625, -0.177001953125, -0.16741943359375, -0.1578369140625, -0.14825439453125, -0.138671875, -0.12908935546875, -0.1195068359375, -0.10992431640625, -0.100341796875, -0.09075927734375, -0.0811767578125, -0.07159423828125, -0.06201171875, -0.05242919921875, -0.0428466796875, -0.03326416015625, -0.023681640625, -0.01409912109375, -0.0045166015625, 0.00506591796875, 0.0146484375, 0.02423095703125, 0.0338134765625, 0.04339599609375, 0.052978515625, 0.06256103515625, 0.0721435546875, 0.08172607421875, 0.09130859375, 0.10089111328125, 0.1104736328125, 0.12005615234375, 0.129638671875, 0.13922119140625, 0.1488037109375, 0.15838623046875, 0.16796875, 0.17755126953125, 0.1871337890625, 0.19671630859375, 0.206298828125, 0.21588134765625, 0.2254638671875, 0.23504638671875, 0.24462890625, 0.25421142578125, 0.2637939453125, 0.27337646484375, 0.282958984375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 11.0, 7.0, 8.0, 9.0, 21.0, 25.0, 34.0, 63.0, 100.0, 140.0, 163.0, 136.0, 93.0, 62.0, 30.0, 24.0, 21.0, 5.0, 16.0, 8.0, 5.0, 2.0, 3.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26025390625, -0.2516288757324219, -0.24300384521484375, -0.23437881469726562, -0.2257537841796875, -0.21712875366210938, -0.20850372314453125, -0.19987869262695312, -0.191253662109375, -0.18262863159179688, -0.17400360107421875, -0.16537857055664062, -0.1567535400390625, -0.14812850952148438, -0.13950347900390625, -0.13087844848632812, -0.12225341796875, -0.11362838745117188, -0.10500335693359375, -0.09637832641601562, -0.0877532958984375, -0.07912826538085938, -0.07050323486328125, -0.061878204345703125, -0.053253173828125, -0.044628143310546875, -0.03600311279296875, -0.027378082275390625, -0.0187530517578125, -0.010128021240234375, -0.00150299072265625, 0.007122039794921875, 0.0157470703125, 0.024372100830078125, 0.03299713134765625, 0.041622161865234375, 0.0502471923828125, 0.058872222900390625, 0.06749725341796875, 0.07612228393554688, 0.084747314453125, 0.09337234497070312, 0.10199737548828125, 0.11062240600585938, 0.1192474365234375, 0.12787246704101562, 0.13649749755859375, 0.14512252807617188, 0.15374755859375, 0.16237258911132812, 0.17099761962890625, 0.17962265014648438, 0.1882476806640625, 0.19687271118164062, 0.20549774169921875, 0.21412277221679688, 0.222747802734375, 0.23137283325195312, 0.23999786376953125, 0.24862289428710938, 0.2572479248046875, 0.2658729553222656, 0.27449798583984375, 0.2831230163574219, 0.291748046875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 13.0, 37.0, 327.0, 487.0, 97.0, 17.0, 11.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.933162689208984, -15.588034629821777, -15.24290657043457, -14.897777557373047, -14.55264949798584, -14.207521438598633, -13.862393379211426, -13.517265319824219, -13.172136306762695, -12.827008247375488, -12.481880187988281, -12.136751174926758, -11.79162311553955, -11.446495056152344, -11.101366996765137, -10.75623893737793, -10.411109924316406, -10.0659818649292, -9.720853805541992, -9.375724792480469, -9.030596733093262, -8.685468673706055, -8.340340614318848, -7.995212078094482, -7.650084495544434, -7.304956436157227, -6.959827899932861, -6.614699840545654, -6.269571304321289, -5.924443244934082, -5.579315185546875, -5.23418664932251, -4.8890581130981445, -4.5439300537109375, -4.198801517486572, -3.8536734580993652, -3.508544921875, -3.163416862487793, -2.818288564682007, -2.4731602668762207, -2.1280319690704346, -1.7829036712646484, -1.4377753734588623, -1.0926471948623657, -0.7475188970565796, -0.40239059925079346, -0.057262420654296875, 0.28786587715148926, 0.6329941749572754, 0.9781224727630615, 1.3232507705688477, 1.6683789491653442, 2.01350736618042, 2.358635425567627, 2.703763723373413, 3.048892021179199, 3.3940203189849854, 3.7391486167907715, 4.0842766761779785, 4.429405212402344, 4.774533271789551, 5.119661808013916, 5.464789867401123, 5.809918403625488, 6.155046463012695]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 3.0, 5.0, 4.0, 6.0, 6.0, 6.0, 4.0, 11.0, 10.0, 11.0, 10.0, 16.0, 28.0, 23.0, 22.0, 25.0, 28.0, 28.0, 37.0, 44.0, 48.0, 65.0, 63.0, 51.0, 60.0, 47.0, 45.0, 27.0, 29.0, 26.0, 23.0, 25.0, 22.0, 24.0, 24.0, 19.0, 12.0, 10.0, 11.0, 9.0, 3.0, 7.0, 3.0, 6.0, 2.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-2.0123491287231445, -1.9493887424468994, -1.8864283561706543, -1.8234679698944092, -1.760507583618164, -1.697547197341919, -1.6345866918563843, -1.5716263055801392, -1.508665919303894, -1.445705533027649, -1.3827451467514038, -1.3197847604751587, -1.256824254989624, -1.193863868713379, -1.1309034824371338, -1.0679430961608887, -1.0049827098846436, -0.9420223236083984, -0.8790619373321533, -0.8161014914512634, -0.7531411051750183, -0.6901807188987732, -0.6272202730178833, -0.5642598867416382, -0.5012995004653931, -0.43833911418914795, -0.37537869811058044, -0.31241828203201294, -0.24945789575576782, -0.1864975094795227, -0.1235370934009552, -0.060576677322387695, 0.0023834705352783203, 0.06534387171268463, 0.12830427289009094, 0.19126467406749725, 0.25422507524490356, 0.3171854615211487, 0.3801458775997162, 0.4431062936782837, 0.5060666799545288, 0.5690270662307739, 0.631987452507019, 0.6949478983879089, 0.757908284664154, 0.8208686709403992, 0.8838291168212891, 0.9467895030975342, 1.0097498893737793, 1.0727102756500244, 1.1356706619262695, 1.1986310482025146, 1.2615914344787598, 1.3245518207550049, 1.3875123262405396, 1.4504727125167847, 1.5134330987930298, 1.576393485069275, 1.63935387134552, 1.7023142576217651, 1.7652747631072998, 1.828235149383545, 1.89119553565979, 1.9541559219360352, 2.0171163082122803]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 9.0, 5.0, 5.0, 19.0, 24.0, 24.0, 41.0, 76.0, 142.0, 349.0, 1166.0, 4982.0, 54092.0, 3953099.0, 168894.0, 8495.0, 1853.0, 547.0, 231.0, 101.0, 42.0, 34.0, 15.0, 7.0, 2.0, 5.0, 4.0, 2.0, 0.0, 4.0], "bins": [-1.0537109375, -1.0315895080566406, -1.0094680786132812, -0.9873466491699219, -0.9652252197265625, -0.9431037902832031, -0.9209823608398438, -0.8988609313964844, -0.876739501953125, -0.8546180725097656, -0.8324966430664062, -0.8103752136230469, -0.7882537841796875, -0.7661323547363281, -0.7440109252929688, -0.7218894958496094, -0.69976806640625, -0.6776466369628906, -0.6555252075195312, -0.6334037780761719, -0.6112823486328125, -0.5891609191894531, -0.5670394897460938, -0.5449180603027344, -0.522796630859375, -0.5006752014160156, -0.47855377197265625, -0.4564323425292969, -0.4343109130859375, -0.4121894836425781, -0.39006805419921875, -0.3679466247558594, -0.3458251953125, -0.3237037658691406, -0.30158233642578125, -0.2794609069824219, -0.2573394775390625, -0.23521804809570312, -0.21309661865234375, -0.19097518920898438, -0.168853759765625, -0.14673233032226562, -0.12461090087890625, -0.10248947143554688, -0.0803680419921875, -0.058246612548828125, -0.03612518310546875, -0.014003753662109375, 0.00811767578125, 0.030239105224609375, 0.05236053466796875, 0.07448196411132812, 0.0966033935546875, 0.11872482299804688, 0.14084625244140625, 0.16296768188476562, 0.185089111328125, 0.20721054077148438, 0.22933197021484375, 0.2514533996582031, 0.2735748291015625, 0.2956962585449219, 0.31781768798828125, 0.3399391174316406, 0.362060546875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 7.0, 9.0, 11.0, 10.0, 12.0, 15.0, 23.0, 32.0, 42.0, 47.0, 51.0, 67.0, 66.0, 65.0, 64.0, 71.0, 66.0, 54.0, 49.0, 57.0, 33.0, 38.0, 27.0, 22.0, 21.0, 17.0, 8.0, 9.0, 5.0, 6.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2076416015625, -0.20241928100585938, -0.19719696044921875, -0.19197463989257812, -0.1867523193359375, -0.18152999877929688, -0.17630767822265625, -0.17108535766601562, -0.165863037109375, -0.16064071655273438, -0.15541839599609375, -0.15019607543945312, -0.1449737548828125, -0.13975143432617188, -0.13452911376953125, -0.12930679321289062, -0.12408447265625, -0.11886215209960938, -0.11363983154296875, -0.10841751098632812, -0.1031951904296875, -0.09797286987304688, -0.09275054931640625, -0.08752822875976562, -0.082305908203125, -0.07708358764648438, -0.07186126708984375, -0.06663894653320312, -0.0614166259765625, -0.056194305419921875, -0.05097198486328125, -0.045749664306640625, -0.04052734375, -0.035305023193359375, -0.03008270263671875, -0.024860382080078125, -0.0196380615234375, -0.014415740966796875, -0.00919342041015625, -0.003971099853515625, 0.001251220703125, 0.006473541259765625, 0.01169586181640625, 0.016918182373046875, 0.0221405029296875, 0.027362823486328125, 0.03258514404296875, 0.037807464599609375, 0.04302978515625, 0.048252105712890625, 0.05347442626953125, 0.058696746826171875, 0.0639190673828125, 0.06914138793945312, 0.07436370849609375, 0.07958602905273438, 0.084808349609375, 0.09003067016601562, 0.09525299072265625, 0.10047531127929688, 0.1056976318359375, 0.11091995239257812, 0.11614227294921875, 0.12136459350585938, 0.1265869140625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 12.0, 9.0, 22.0, 32.0, 59.0, 109.0, 248.0, 641.0, 1883.0, 8508.0, 168904.0, 3956268.0, 50663.0, 4812.0, 1208.0, 470.0, 197.0, 116.0, 50.0, 21.0, 20.0, 12.0, 7.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.97607421875, -0.9449386596679688, -0.9138031005859375, -0.8826675415039062, -0.851531982421875, -0.8203964233398438, -0.7892608642578125, -0.7581253051757812, -0.72698974609375, -0.6958541870117188, -0.6647186279296875, -0.6335830688476562, -0.602447509765625, -0.5713119506835938, -0.5401763916015625, -0.5090408325195312, -0.4779052734375, -0.44676971435546875, -0.4156341552734375, -0.38449859619140625, -0.353363037109375, -0.32222747802734375, -0.2910919189453125, -0.25995635986328125, -0.22882080078125, -0.19768524169921875, -0.1665496826171875, -0.13541412353515625, -0.104278564453125, -0.07314300537109375, -0.0420074462890625, -0.01087188720703125, 0.020263671875, 0.05139923095703125, 0.0825347900390625, 0.11367034912109375, 0.144805908203125, 0.17594146728515625, 0.2070770263671875, 0.23821258544921875, 0.26934814453125, 0.30048370361328125, 0.3316192626953125, 0.36275482177734375, 0.393890380859375, 0.42502593994140625, 0.4561614990234375, 0.48729705810546875, 0.5184326171875, 0.5495681762695312, 0.5807037353515625, 0.6118392944335938, 0.642974853515625, 0.6741104125976562, 0.7052459716796875, 0.7363815307617188, 0.76751708984375, 0.7986526489257812, 0.8297882080078125, 0.8609237670898438, 0.892059326171875, 0.9231948852539062, 0.9543304443359375, 0.9854660034179688, 1.0166015625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 6.0, 6.0, 11.0, 8.0, 25.0, 44.0, 79.0, 151.0, 329.0, 905.0, 1413.0, 637.0, 227.0, 101.0, 47.0, 32.0, 21.0, 10.0, 10.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69140625, -0.6693191528320312, -0.6472320556640625, -0.6251449584960938, -0.603057861328125, -0.5809707641601562, -0.5588836669921875, -0.5367965698242188, -0.51470947265625, -0.49262237548828125, -0.4705352783203125, -0.44844818115234375, -0.426361083984375, -0.40427398681640625, -0.3821868896484375, -0.36009979248046875, -0.3380126953125, -0.31592559814453125, -0.2938385009765625, -0.27175140380859375, -0.249664306640625, -0.22757720947265625, -0.2054901123046875, -0.18340301513671875, -0.16131591796875, -0.13922882080078125, -0.1171417236328125, -0.09505462646484375, -0.072967529296875, -0.05088043212890625, -0.0287933349609375, -0.00670623779296875, 0.015380859375, 0.03746795654296875, 0.0595550537109375, 0.08164215087890625, 0.103729248046875, 0.12581634521484375, 0.1479034423828125, 0.16999053955078125, 0.19207763671875, 0.21416473388671875, 0.2362518310546875, 0.25833892822265625, 0.280426025390625, 0.30251312255859375, 0.3246002197265625, 0.34668731689453125, 0.3687744140625, 0.39086151123046875, 0.4129486083984375, 0.43503570556640625, 0.457122802734375, 0.47920989990234375, 0.5012969970703125, 0.5233840942382812, 0.54547119140625, 0.5675582885742188, 0.5896453857421875, 0.6117324829101562, 0.633819580078125, 0.6559066772460938, 0.6779937744140625, 0.7000808715820312, 0.72216796875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 6.0, 7.0, 12.0, 19.0, 32.0, 54.0, 128.0, 195.0, 208.0, 167.0, 87.0, 48.0, 17.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.769728899002075, -3.631511688232422, -3.4932944774627686, -3.3550772666931152, -3.216860055923462, -3.0786428451538086, -2.940425395965576, -2.802208423614502, -2.6639909744262695, -2.525773763656616, -2.387556552886963, -2.2493393421173096, -2.1111221313476562, -1.972904920578003, -1.83468759059906, -1.6964703798294067, -1.558253288269043, -1.4200360774993896, -1.2818188667297363, -1.143601655960083, -1.0053844451904297, -0.8671671748161316, -0.7289499044418335, -0.5907326936721802, -0.45251548290252686, -0.31429827213287354, -0.17608103156089783, -0.03786379098892212, 0.1003534197807312, 0.23857063055038452, 0.3767879009246826, 0.5150051116943359, 0.6532225608825684, 0.7914397716522217, 0.929656982421875, 1.0678741931915283, 1.2060914039611816, 1.344308614730835, 1.4825259447097778, 1.6207431554794312, 1.7589603662490845, 1.8971775770187378, 2.0353949069976807, 2.173612117767334, 2.3118293285369873, 2.4500465393066406, 2.588263750076294, 2.7264809608459473, 2.8646981716156006, 3.002915382385254, 3.1411325931549072, 3.2793498039245605, 3.417567014694214, 3.555784225463867, 3.6940016746520996, 3.832218647003174, 3.9704360961914062, 4.108653545379639, 4.246870517730713, 4.385087966918945, 4.5233049392700195, 4.661522388458252, 4.799739360809326, 4.937956809997559, 5.076173782348633]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 9.0, 12.0, 24.0, 33.0, 44.0, 45.0, 69.0, 72.0, 74.0, 90.0, 112.0, 81.0, 80.0, 79.0, 53.0, 49.0, 26.0, 16.0, 15.0, 5.0, 11.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5023036003112793, -2.3944942951202393, -2.286684989929199, -2.178875684738159, -2.071066379547119, -1.963257074356079, -1.8554476499557495, -1.7476383447647095, -1.6398290395736694, -1.5320197343826294, -1.4242104291915894, -1.3164010047912598, -1.2085916996002197, -1.1007823944091797, -0.9929730892181396, -0.8851637840270996, -0.7773544788360596, -0.6695451736450195, -0.5617358684539795, -0.4539265036582947, -0.34611719846725464, -0.2383078932762146, -0.13049852848052979, -0.022689223289489746, 0.08512008190155029, 0.19292940199375153, 0.30073872208595276, 0.4085480570793152, 0.5163573622703552, 0.6241666674613953, 0.7319760322570801, 0.8397853374481201, 0.9475946426391602, 1.0554039478302002, 1.1632132530212402, 1.2710225582122803, 1.3788318634033203, 1.4866411685943604, 1.59445059299469, 1.70225989818573, 1.81006920337677, 1.91787850856781, 2.0256879329681396, 2.1334972381591797, 2.2413065433502197, 2.3491158485412598, 2.4569251537323, 2.56473445892334, 2.67254376411438, 2.78035306930542, 2.88816237449646, 2.9959716796875, 3.10378098487854, 3.21159029006958, 3.319399833679199, 3.42720890045166, 3.5350184440612793, 3.6428277492523193, 3.7506370544433594, 3.8584463596343994, 3.9662556648254395, 4.074065208435059, 4.1818742752075195, 4.289683818817139, 4.3974928855896]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 10.0, 11.0, 15.0, 28.0, 49.0, 80.0, 125.0, 274.0, 625.0, 1731.0, 6567.0, 46305.0, 642784.0, 321211.0, 22392.0, 4175.0, 1206.0, 459.0, 230.0, 101.0, 65.0, 26.0, 23.0, 10.0, 13.0, 5.0, 6.0, 2.0, 6.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.52001953125, -0.5046539306640625, -0.489288330078125, -0.4739227294921875, -0.45855712890625, -0.4431915283203125, -0.427825927734375, -0.4124603271484375, -0.3970947265625, -0.3817291259765625, -0.366363525390625, -0.3509979248046875, -0.33563232421875, -0.3202667236328125, -0.304901123046875, -0.2895355224609375, -0.274169921875, -0.2588043212890625, -0.243438720703125, -0.2280731201171875, -0.21270751953125, -0.1973419189453125, -0.181976318359375, -0.1666107177734375, -0.1512451171875, -0.1358795166015625, -0.120513916015625, -0.1051483154296875, -0.08978271484375, -0.0744171142578125, -0.059051513671875, -0.0436859130859375, -0.0283203125, -0.0129547119140625, 0.002410888671875, 0.0177764892578125, 0.03314208984375, 0.0485076904296875, 0.063873291015625, 0.0792388916015625, 0.0946044921875, 0.1099700927734375, 0.125335693359375, 0.1407012939453125, 0.15606689453125, 0.1714324951171875, 0.186798095703125, 0.2021636962890625, 0.217529296875, 0.2328948974609375, 0.248260498046875, 0.2636260986328125, 0.27899169921875, 0.2943572998046875, 0.309722900390625, 0.3250885009765625, 0.3404541015625, 0.3558197021484375, 0.371185302734375, 0.3865509033203125, 0.40191650390625, 0.4172821044921875, 0.432647705078125, 0.4480133056640625, 0.46337890625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 3.0, 7.0, 15.0, 14.0, 7.0, 19.0, 26.0, 34.0, 41.0, 42.0, 65.0, 71.0, 53.0, 75.0, 51.0, 68.0, 63.0, 73.0, 47.0, 53.0, 34.0, 26.0, 28.0, 21.0, 21.0, 10.0, 12.0, 9.0, 5.0, 7.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.250244140625, -0.24436187744140625, -0.2384796142578125, -0.23259735107421875, -0.226715087890625, -0.22083282470703125, -0.2149505615234375, -0.20906829833984375, -0.20318603515625, -0.19730377197265625, -0.1914215087890625, -0.18553924560546875, -0.179656982421875, -0.17377471923828125, -0.1678924560546875, -0.16201019287109375, -0.1561279296875, -0.15024566650390625, -0.1443634033203125, -0.13848114013671875, -0.132598876953125, -0.12671661376953125, -0.1208343505859375, -0.11495208740234375, -0.10906982421875, -0.10318756103515625, -0.0973052978515625, -0.09142303466796875, -0.085540771484375, -0.07965850830078125, -0.0737762451171875, -0.06789398193359375, -0.06201171875, -0.05612945556640625, -0.0502471923828125, -0.04436492919921875, -0.038482666015625, -0.03260040283203125, -0.0267181396484375, -0.02083587646484375, -0.01495361328125, -0.00907135009765625, -0.0031890869140625, 0.00269317626953125, 0.008575439453125, 0.01445770263671875, 0.0203399658203125, 0.02622222900390625, 0.0321044921875, 0.03798675537109375, 0.0438690185546875, 0.04975128173828125, 0.055633544921875, 0.06151580810546875, 0.0673980712890625, 0.07328033447265625, 0.07916259765625, 0.08504486083984375, 0.0909271240234375, 0.09680938720703125, 0.102691650390625, 0.10857391357421875, 0.1144561767578125, 0.12033843994140625, 0.126220703125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 7.0, 7.0, 12.0, 11.0, 10.0, 19.0, 26.0, 40.0, 57.0, 93.0, 139.0, 234.0, 411.0, 745.0, 1500.0, 3714.0, 9921.0, 36167.0, 200436.0, 649176.0, 110535.0, 22863.0, 6940.0, 2729.0, 1221.0, 618.0, 328.0, 200.0, 125.0, 74.0, 64.0, 44.0, 26.0, 15.0, 19.0, 7.0, 2.0, 4.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.3232421875, -0.31292724609375, -0.3026123046875, -0.29229736328125, -0.281982421875, -0.27166748046875, -0.2613525390625, -0.25103759765625, -0.24072265625, -0.23040771484375, -0.2200927734375, -0.20977783203125, -0.199462890625, -0.18914794921875, -0.1788330078125, -0.16851806640625, -0.158203125, -0.14788818359375, -0.1375732421875, -0.12725830078125, -0.116943359375, -0.10662841796875, -0.0963134765625, -0.08599853515625, -0.07568359375, -0.06536865234375, -0.0550537109375, -0.04473876953125, -0.034423828125, -0.02410888671875, -0.0137939453125, -0.00347900390625, 0.0068359375, 0.01715087890625, 0.0274658203125, 0.03778076171875, 0.048095703125, 0.05841064453125, 0.0687255859375, 0.07904052734375, 0.08935546875, 0.09967041015625, 0.1099853515625, 0.12030029296875, 0.130615234375, 0.14093017578125, 0.1512451171875, 0.16156005859375, 0.171875, 0.18218994140625, 0.1925048828125, 0.20281982421875, 0.213134765625, 0.22344970703125, 0.2337646484375, 0.24407958984375, 0.25439453125, 0.26470947265625, 0.2750244140625, 0.28533935546875, 0.295654296875, 0.30596923828125, 0.3162841796875, 0.32659912109375, 0.3369140625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 5.0, 14.0, 4.0, 5.0, 9.0, 9.0, 12.0, 18.0, 22.0, 16.0, 26.0, 26.0, 38.0, 45.0, 40.0, 44.0, 38.0, 37.0, 43.0, 37.0, 53.0, 43.0, 40.0, 55.0, 35.0, 37.0, 38.0, 31.0, 26.0, 24.0, 19.0, 23.0, 10.0, 21.0, 11.0, 10.0, 8.0, 5.0, 4.0, 6.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.49755859375, -0.48174285888671875, -0.4659271240234375, -0.45011138916015625, -0.434295654296875, -0.41847991943359375, -0.4026641845703125, -0.38684844970703125, -0.37103271484375, -0.35521697998046875, -0.3394012451171875, -0.32358551025390625, -0.307769775390625, -0.29195404052734375, -0.2761383056640625, -0.26032257080078125, -0.2445068359375, -0.22869110107421875, -0.2128753662109375, -0.19705963134765625, -0.181243896484375, -0.16542816162109375, -0.1496124267578125, -0.13379669189453125, -0.11798095703125, -0.10216522216796875, -0.0863494873046875, -0.07053375244140625, -0.054718017578125, -0.03890228271484375, -0.0230865478515625, -0.00727081298828125, 0.008544921875, 0.02436065673828125, 0.0401763916015625, 0.05599212646484375, 0.071807861328125, 0.08762359619140625, 0.1034393310546875, 0.11925506591796875, 0.13507080078125, 0.15088653564453125, 0.1667022705078125, 0.18251800537109375, 0.198333740234375, 0.21414947509765625, 0.2299652099609375, 0.24578094482421875, 0.2615966796875, 0.27741241455078125, 0.2932281494140625, 0.30904388427734375, 0.324859619140625, 0.34067535400390625, 0.3564910888671875, 0.37230682373046875, 0.38812255859375, 0.40393829345703125, 0.4197540283203125, 0.43556976318359375, 0.451385498046875, 0.46720123291015625, 0.4830169677734375, 0.49883270263671875, 0.5146484375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 8.0, 9.0, 9.0, 13.0, 25.0, 53.0, 75.0, 125.0, 281.0, 533.0, 1181.0, 3147.0, 9568.0, 35579.0, 190394.0, 668195.0, 106655.0, 22180.0, 6433.0, 2266.0, 900.0, 449.0, 182.0, 111.0, 62.0, 37.0, 25.0, 11.0, 19.0, 9.0, 8.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.133544921875, -0.12914276123046875, -0.1247406005859375, -0.12033843994140625, -0.115936279296875, -0.11153411865234375, -0.1071319580078125, -0.10272979736328125, -0.09832763671875, -0.09392547607421875, -0.0895233154296875, -0.08512115478515625, -0.080718994140625, -0.07631683349609375, -0.0719146728515625, -0.06751251220703125, -0.0631103515625, -0.05870819091796875, -0.0543060302734375, -0.04990386962890625, -0.045501708984375, -0.04109954833984375, -0.0366973876953125, -0.03229522705078125, -0.02789306640625, -0.02349090576171875, -0.0190887451171875, -0.01468658447265625, -0.010284423828125, -0.00588226318359375, -0.0014801025390625, 0.00292205810546875, 0.00732421875, 0.01172637939453125, 0.0161285400390625, 0.02053070068359375, 0.024932861328125, 0.02933502197265625, 0.0337371826171875, 0.03813934326171875, 0.04254150390625, 0.04694366455078125, 0.0513458251953125, 0.05574798583984375, 0.060150146484375, 0.06455230712890625, 0.0689544677734375, 0.07335662841796875, 0.0777587890625, 0.08216094970703125, 0.0865631103515625, 0.09096527099609375, 0.095367431640625, 0.09976959228515625, 0.1041717529296875, 0.10857391357421875, 0.11297607421875, 0.11737823486328125, 0.1217803955078125, 0.12618255615234375, 0.130584716796875, 0.13498687744140625, 0.1393890380859375, 0.14379119873046875, 0.148193359375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 6.0, 4.0, 6.0, 11.0, 22.0, 24.0, 21.0, 37.0, 28.0, 57.0, 45.0, 47.0, 65.0, 72.0, 66.0, 65.0, 72.0, 61.0, 57.0, 52.0, 45.0, 26.0, 23.0, 20.0, 11.0, 14.0, 8.0, 6.0, 6.0, 9.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.075599670410156e-05, -2.9577873647212982e-05, -2.8399750590324402e-05, -2.722162753343582e-05, -2.604350447654724e-05, -2.486538141965866e-05, -2.368725836277008e-05, -2.25091353058815e-05, -2.133101224899292e-05, -2.015288919210434e-05, -1.897476613521576e-05, -1.779664307832718e-05, -1.66185200214386e-05, -1.544039696455002e-05, -1.4262273907661438e-05, -1.3084150850772858e-05, -1.1906027793884277e-05, -1.0727904736995697e-05, -9.549781680107117e-06, -8.371658623218536e-06, -7.193535566329956e-06, -6.015412509441376e-06, -4.837289452552795e-06, -3.659166395664215e-06, -2.4810433387756348e-06, -1.3029202818870544e-06, -1.2479722499847412e-07, 1.0533258318901062e-06, 2.2314488887786865e-06, 3.409571945667267e-06, 4.587695002555847e-06, 5.7658180594444275e-06, 6.943941116333008e-06, 8.122064173221588e-06, 9.300187230110168e-06, 1.0478310286998749e-05, 1.1656433343887329e-05, 1.283455640077591e-05, 1.401267945766449e-05, 1.519080251455307e-05, 1.636892557144165e-05, 1.754704862833023e-05, 1.872517168521881e-05, 1.990329474210739e-05, 2.108141779899597e-05, 2.2259540855884552e-05, 2.3437663912773132e-05, 2.4615786969661713e-05, 2.5793910026550293e-05, 2.6972033083438873e-05, 2.8150156140327454e-05, 2.9328279197216034e-05, 3.0506402254104614e-05, 3.1684525310993195e-05, 3.2862648367881775e-05, 3.4040771424770355e-05, 3.5218894481658936e-05, 3.6397017538547516e-05, 3.7575140595436096e-05, 3.8753263652324677e-05, 3.993138670921326e-05, 4.110950976610184e-05, 4.228763282299042e-05, 4.3465755879879e-05, 4.464387893676758e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 9.0, 15.0, 22.0, 23.0, 35.0, 51.0, 101.0, 201.0, 295.0, 566.0, 1132.0, 2802.0, 8553.0, 35899.0, 228415.0, 661480.0, 84222.0, 16610.0, 4654.0, 1680.0, 826.0, 372.0, 232.0, 127.0, 82.0, 46.0, 33.0, 22.0, 16.0, 13.0, 4.0, 2.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15625, -0.15124893188476562, -0.14624786376953125, -0.14124679565429688, -0.1362457275390625, -0.13124465942382812, -0.12624359130859375, -0.12124252319335938, -0.116241455078125, -0.11124038696289062, -0.10623931884765625, -0.10123825073242188, -0.0962371826171875, -0.09123611450195312, -0.08623504638671875, -0.08123397827148438, -0.07623291015625, -0.07123184204101562, -0.06623077392578125, -0.061229705810546875, -0.0562286376953125, -0.051227569580078125, -0.04622650146484375, -0.041225433349609375, -0.036224365234375, -0.031223297119140625, -0.02622222900390625, -0.021221160888671875, -0.0162200927734375, -0.011219024658203125, -0.00621795654296875, -0.001216888427734375, 0.0037841796875, 0.008785247802734375, 0.01378631591796875, 0.018787384033203125, 0.0237884521484375, 0.028789520263671875, 0.03379058837890625, 0.038791656494140625, 0.043792724609375, 0.048793792724609375, 0.05379486083984375, 0.058795928955078125, 0.0637969970703125, 0.06879806518554688, 0.07379913330078125, 0.07880020141601562, 0.08380126953125, 0.08880233764648438, 0.09380340576171875, 0.09880447387695312, 0.1038055419921875, 0.10880661010742188, 0.11380767822265625, 0.11880874633789062, 0.123809814453125, 0.12881088256835938, 0.13381195068359375, 0.13881301879882812, 0.1438140869140625, 0.14881515502929688, 0.15381622314453125, 0.15881729125976562, 0.163818359375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 8.0, 15.0, 18.0, 23.0, 20.0, 34.0, 43.0, 46.0, 89.0, 84.0, 98.0, 116.0, 97.0, 100.0, 52.0, 40.0, 25.0, 22.0, 23.0, 8.0, 9.0, 6.0, 5.0, 7.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12127685546875, -0.1164693832397461, -0.11166191101074219, -0.10685443878173828, -0.10204696655273438, -0.09723949432373047, -0.09243202209472656, -0.08762454986572266, -0.08281707763671875, -0.07800960540771484, -0.07320213317871094, -0.06839466094970703, -0.06358718872070312, -0.05877971649169922, -0.05397224426269531, -0.049164772033691406, -0.0443572998046875, -0.039549827575683594, -0.03474235534667969, -0.02993488311767578, -0.025127410888671875, -0.02031993865966797, -0.015512466430664062, -0.010704994201660156, -0.00589752197265625, -0.0010900497436523438, 0.0037174224853515625, 0.008524894714355469, 0.013332366943359375, 0.01813983917236328, 0.022947311401367188, 0.027754783630371094, 0.032562255859375, 0.037369728088378906, 0.04217720031738281, 0.04698467254638672, 0.051792144775390625, 0.05659961700439453, 0.06140708923339844, 0.06621456146240234, 0.07102203369140625, 0.07582950592041016, 0.08063697814941406, 0.08544445037841797, 0.09025192260742188, 0.09505939483642578, 0.09986686706542969, 0.1046743392944336, 0.1094818115234375, 0.1142892837524414, 0.11909675598144531, 0.12390422821044922, 0.12871170043945312, 0.13351917266845703, 0.13832664489746094, 0.14313411712646484, 0.14794158935546875, 0.15274906158447266, 0.15755653381347656, 0.16236400604248047, 0.16717147827148438, 0.17197895050048828, 0.1767864227294922, 0.1815938949584961, 0.1864013671875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 16.0, 42.0, 119.0, 277.0, 305.0, 143.0, 59.0, 19.0, 9.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.487732887268066, -5.339611530303955, -5.191490173339844, -5.043368816375732, -4.895247459411621, -4.747125625610352, -4.599004745483398, -4.450882911682129, -4.302761554718018, -4.154640197753906, -4.006518840789795, -3.8583974838256836, -3.710275888442993, -3.562154531478882, -3.4140331745147705, -3.26591157913208, -3.117790460586548, -2.9696691036224365, -2.821547746658325, -2.6734261512756348, -2.5253047943115234, -2.377183437347412, -2.229062080383301, -2.0809407234191895, -1.9328192472457886, -1.7846978902816772, -1.6365764141082764, -1.488455057144165, -1.3403337001800537, -1.1922122240066528, -1.0440908670425415, -0.8959693908691406, -0.7478482723236084, -0.5997268557548523, -0.4516054689884186, -0.30348408222198486, -0.15536266565322876, -0.007241249084472656, 0.14088010787963867, 0.28900158405303955, 0.4371229410171509, 0.585244357585907, 0.7333657741546631, 0.8814871311187744, 1.0296084880828857, 1.1777299642562866, 1.325851321220398, 1.4739727973937988, 1.6220941543579102, 1.7702155113220215, 1.9183369874954224, 2.066458225250244, 2.2145798206329346, 2.362701177597046, 2.5108225345611572, 2.6589441299438477, 2.807065486907959, 2.9551868438720703, 3.1033082008361816, 3.251429557800293, 3.3995511531829834, 3.5476725101470947, 3.695793867111206, 3.8439154624938965, 3.9920365810394287]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 4.0, 10.0, 3.0, 6.0, 15.0, 16.0, 15.0, 20.0, 22.0, 20.0, 41.0, 35.0, 39.0, 50.0, 46.0, 58.0, 74.0, 96.0, 67.0, 58.0, 45.0, 33.0, 32.0, 34.0, 25.0, 24.0, 20.0, 20.0, 13.0, 11.0, 8.0, 10.0, 7.0, 6.0, 3.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.0541341304779053, -1.9814300537109375, -1.9087260961532593, -1.836022138595581, -1.7633180618286133, -1.6906139850616455, -1.6179100275039673, -1.545206069946289, -1.4725019931793213, -1.3997979164123535, -1.3270939588546753, -1.254390001296997, -1.1816859245300293, -1.1089818477630615, -1.0362778902053833, -0.9635738730430603, -0.8908698558807373, -0.8181658387184143, -0.7454618215560913, -0.6727578043937683, -0.6000537872314453, -0.5273497700691223, -0.4546457529067993, -0.3819417357444763, -0.3092377185821533, -0.23653370141983032, -0.16382968425750732, -0.09112566709518433, -0.018421649932861328, 0.05428236722946167, 0.12698638439178467, 0.19969040155410767, 0.27239465713500977, 0.34509867429733276, 0.41780269145965576, 0.49050670862197876, 0.5632107257843018, 0.6359147429466248, 0.7086187601089478, 0.7813227772712708, 0.8540267944335938, 0.9267308115959167, 0.9994348287582397, 1.072138786315918, 1.1448428630828857, 1.2175469398498535, 1.2902508974075317, 1.36295485496521, 1.4356589317321777, 1.5083630084991455, 1.5810669660568237, 1.653770923614502, 1.7264750003814697, 1.7991790771484375, 1.8718830347061157, 1.944586992263794, 2.0172910690307617, 2.0899951457977295, 2.1626992225646973, 2.235403060913086, 2.3081071376800537, 2.3808112144470215, 2.45351505279541, 2.526219129562378, 2.5989232063293457]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 7.0, 14.0, 17.0, 41.0, 75.0, 142.0, 298.0, 845.0, 9282.0, 4069879.0, 110480.0, 2348.0, 479.0, 174.0, 93.0, 47.0, 31.0, 13.0, 9.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.66796875, -1.6322784423828125, -1.596588134765625, -1.5608978271484375, -1.52520751953125, -1.4895172119140625, -1.453826904296875, -1.4181365966796875, -1.3824462890625, -1.3467559814453125, -1.311065673828125, -1.2753753662109375, -1.23968505859375, -1.2039947509765625, -1.168304443359375, -1.1326141357421875, -1.096923828125, -1.0612335205078125, -1.025543212890625, -0.9898529052734375, -0.95416259765625, -0.9184722900390625, -0.882781982421875, -0.8470916748046875, -0.8114013671875, -0.7757110595703125, -0.740020751953125, -0.7043304443359375, -0.66864013671875, -0.6329498291015625, -0.597259521484375, -0.5615692138671875, -0.52587890625, -0.4901885986328125, -0.454498291015625, -0.4188079833984375, -0.38311767578125, -0.3474273681640625, -0.311737060546875, -0.2760467529296875, -0.2403564453125, -0.2046661376953125, -0.168975830078125, -0.1332855224609375, -0.09759521484375, -0.0619049072265625, -0.026214599609375, 0.0094757080078125, 0.045166015625, 0.0808563232421875, 0.116546630859375, 0.1522369384765625, 0.18792724609375, 0.2236175537109375, 0.259307861328125, 0.2949981689453125, 0.3306884765625, 0.3663787841796875, 0.402069091796875, 0.4377593994140625, 0.47344970703125, 0.5091400146484375, 0.544830322265625, 0.5805206298828125, 0.6162109375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 7.0, 6.0, 13.0, 10.0, 16.0, 22.0, 25.0, 31.0, 31.0, 36.0, 48.0, 68.0, 60.0, 58.0, 64.0, 59.0, 67.0, 57.0, 41.0, 48.0, 37.0, 37.0, 30.0, 24.0, 24.0, 17.0, 17.0, 18.0, 9.0, 6.0, 4.0, 1.0, 2.0, 5.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.190185546875, -0.18519973754882812, -0.18021392822265625, -0.17522811889648438, -0.1702423095703125, -0.16525650024414062, -0.16027069091796875, -0.15528488159179688, -0.150299072265625, -0.14531326293945312, -0.14032745361328125, -0.13534164428710938, -0.1303558349609375, -0.12537002563476562, -0.12038421630859375, -0.11539840698242188, -0.11041259765625, -0.10542678833007812, -0.10044097900390625, -0.09545516967773438, -0.0904693603515625, -0.08548355102539062, -0.08049774169921875, -0.07551193237304688, -0.070526123046875, -0.06554031372070312, -0.06055450439453125, -0.055568695068359375, -0.0505828857421875, -0.045597076416015625, -0.04061126708984375, -0.035625457763671875, -0.0306396484375, -0.025653839111328125, -0.02066802978515625, -0.015682220458984375, -0.0106964111328125, -0.005710601806640625, -0.00072479248046875, 0.004261016845703125, 0.009246826171875, 0.014232635498046875, 0.01921844482421875, 0.024204254150390625, 0.0291900634765625, 0.034175872802734375, 0.03916168212890625, 0.044147491455078125, 0.04913330078125, 0.054119110107421875, 0.05910491943359375, 0.06409072875976562, 0.0690765380859375, 0.07406234741210938, 0.07904815673828125, 0.08403396606445312, 0.089019775390625, 0.09400558471679688, 0.09899139404296875, 0.10397720336914062, 0.1089630126953125, 0.11394882202148438, 0.11893463134765625, 0.12392044067382812, 0.12890625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 5.0, 4.0, 3.0, 7.0, 4.0, 17.0, 8.0, 27.0, 37.0, 81.0, 151.0, 473.0, 1499.0, 7927.0, 109590.0, 3974864.0, 90250.0, 7211.0, 1328.0, 427.0, 164.0, 71.0, 48.0, 24.0, 16.0, 16.0, 10.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9541015625, -0.9286422729492188, -0.9031829833984375, -0.8777236938476562, -0.852264404296875, -0.8268051147460938, -0.8013458251953125, -0.7758865356445312, -0.75042724609375, -0.7249679565429688, -0.6995086669921875, -0.6740493774414062, -0.648590087890625, -0.6231307983398438, -0.5976715087890625, -0.5722122192382812, -0.5467529296875, -0.5212936401367188, -0.4958343505859375, -0.47037506103515625, -0.444915771484375, -0.41945648193359375, -0.3939971923828125, -0.36853790283203125, -0.34307861328125, -0.31761932373046875, -0.2921600341796875, -0.26670074462890625, -0.241241455078125, -0.21578216552734375, -0.1903228759765625, -0.16486358642578125, -0.139404296875, -0.11394500732421875, -0.0884857177734375, -0.06302642822265625, -0.037567138671875, -0.01210784912109375, 0.0133514404296875, 0.03881072998046875, 0.06427001953125, 0.08972930908203125, 0.1151885986328125, 0.14064788818359375, 0.166107177734375, 0.19156646728515625, 0.2170257568359375, 0.24248504638671875, 0.2679443359375, 0.29340362548828125, 0.3188629150390625, 0.34432220458984375, 0.369781494140625, 0.39524078369140625, 0.4207000732421875, 0.44615936279296875, 0.47161865234375, 0.49707794189453125, 0.5225372314453125, 0.5479965209960938, 0.573455810546875, 0.5989151000976562, 0.6243743896484375, 0.6498336791992188, 0.67529296875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 7.0, 5.0, 10.0, 6.0, 12.0, 21.0, 31.0, 33.0, 61.0, 102.0, 163.0, 335.0, 779.0, 1109.0, 749.0, 281.0, 134.0, 80.0, 36.0, 35.0, 29.0, 14.0, 4.0, 12.0, 9.0, 4.0, 5.0, 5.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.401611328125, -0.3863868713378906, -0.37116241455078125, -0.3559379577636719, -0.3407135009765625, -0.3254890441894531, -0.31026458740234375, -0.2950401306152344, -0.279815673828125, -0.2645912170410156, -0.24936676025390625, -0.23414230346679688, -0.2189178466796875, -0.20369338989257812, -0.18846893310546875, -0.17324447631835938, -0.15802001953125, -0.14279556274414062, -0.12757110595703125, -0.11234664916992188, -0.0971221923828125, -0.08189773559570312, -0.06667327880859375, -0.051448822021484375, -0.036224365234375, -0.020999908447265625, -0.00577545166015625, 0.009449005126953125, 0.0246734619140625, 0.039897918701171875, 0.05512237548828125, 0.07034683227539062, 0.0855712890625, 0.10079574584960938, 0.11602020263671875, 0.13124465942382812, 0.1464691162109375, 0.16169357299804688, 0.17691802978515625, 0.19214248657226562, 0.207366943359375, 0.22259140014648438, 0.23781585693359375, 0.2530403137207031, 0.2682647705078125, 0.2834892272949219, 0.29871368408203125, 0.3139381408691406, 0.32916259765625, 0.3443870544433594, 0.35961151123046875, 0.3748359680175781, 0.3900604248046875, 0.4052848815917969, 0.42050933837890625, 0.4357337951660156, 0.450958251953125, 0.4661827087402344, 0.48140716552734375, 0.4966316223144531, 0.5118560791015625, 0.5270805358886719, 0.5423049926757812, 0.5575294494628906, 0.57275390625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 9.0, 7.0, 11.0, 25.0, 35.0, 68.0, 88.0, 101.0, 155.0, 148.0, 100.0, 111.0, 48.0, 32.0, 16.0, 12.0, 6.0, 8.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.008906126022339, -2.9259893894195557, -2.8430726528167725, -2.7601561546325684, -2.677239418029785, -2.594322681427002, -2.5114059448242188, -2.4284892082214355, -2.3455727100372314, -2.2626559734344482, -2.179739236831665, -2.096822738647461, -2.0139060020446777, -1.9309892654418945, -1.8480725288391113, -1.7651559114456177, -1.6822391748428345, -1.5993224382400513, -1.5164058208465576, -1.4334890842437744, -1.3505724668502808, -1.2676557302474976, -1.184739112854004, -1.1018223762512207, -1.0189056396484375, -0.9359889626502991, -0.8530722856521606, -0.7701555490493774, -0.6872389316558838, -0.6043221950531006, -0.5214055180549622, -0.43848884105682373, -0.3555722236633301, -0.27265554666519165, -0.18973885476589203, -0.10682216286659241, -0.02390548586845398, 0.05901119112968445, 0.14192789793014526, 0.2248445749282837, 0.3077612519264221, 0.39067792892456055, 0.473594605922699, 0.5565112829208374, 0.6394280195236206, 0.7223446369171143, 0.8052613735198975, 0.8881780505180359, 0.9710947275161743, 1.0540114641189575, 1.1369280815124512, 1.2198448181152344, 1.302761435508728, 1.3856781721115112, 1.4685947895050049, 1.551511526107788, 1.6344282627105713, 1.7173449993133545, 1.8002616167068481, 1.8831783533096313, 1.966094970703125, 2.049011707305908, 2.1319284439086914, 2.2148451805114746, 2.2977616786956787]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 3.0, 5.0, 4.0, 9.0, 10.0, 11.0, 18.0, 21.0, 32.0, 17.0, 42.0, 39.0, 38.0, 50.0, 47.0, 48.0, 61.0, 57.0, 60.0, 54.0, 40.0, 51.0, 50.0, 39.0, 37.0, 24.0, 24.0, 16.0, 15.0, 15.0, 16.0, 12.0, 11.0, 6.0, 5.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6852667331695557, -1.6285483837127686, -1.571829915046692, -1.5151115655899048, -1.4583932161331177, -1.401674747467041, -1.344956398010254, -1.2882380485534668, -1.2315196990966797, -1.1748013496398926, -1.118082880973816, -1.0613645315170288, -1.0046461820602417, -0.9479277729988098, -0.8912093639373779, -0.8344910144805908, -0.7777725458145142, -0.7210541367530823, -0.6643357872962952, -0.6076173782348633, -0.5508990287780762, -0.4941806197166443, -0.4374622106552124, -0.3807438313961029, -0.3240254521369934, -0.2673070728778839, -0.21058867871761322, -0.15387028455734253, -0.09715190529823303, -0.040433526039123535, 0.01628488302230835, 0.07300326228141785, 0.1297215223312378, 0.1864399015903473, 0.24315829575061798, 0.29987668991088867, 0.35659506916999817, 0.41331344842910767, 0.47003185749053955, 0.5267502069473267, 0.5834686160087585, 0.6401870250701904, 0.6969053745269775, 0.7536237835884094, 0.8103421926498413, 0.8670605421066284, 0.9237789511680603, 0.9804973602294922, 1.0372157096862793, 1.0939340591430664, 1.150652527809143, 1.2073708772659302, 1.2640892267227173, 1.320807695388794, 1.377526044845581, 1.4342443943023682, 1.4909627437591553, 1.5476810932159424, 1.604399561882019, 1.6611179113388062, 1.7178362607955933, 1.77455472946167, 1.831273078918457, 1.8879914283752441, 1.9447098970413208]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 7.0, 5.0, 11.0, 14.0, 21.0, 35.0, 76.0, 133.0, 224.0, 531.0, 1316.0, 4324.0, 21549.0, 315324.0, 652753.0, 42519.0, 6598.0, 1816.0, 633.0, 290.0, 139.0, 83.0, 50.0, 31.0, 17.0, 13.0, 7.0, 4.0, 6.0, 4.0, 8.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.53125, -0.5156936645507812, -0.5001373291015625, -0.48458099365234375, -0.469024658203125, -0.45346832275390625, -0.4379119873046875, -0.42235565185546875, -0.40679931640625, -0.39124298095703125, -0.3756866455078125, -0.36013031005859375, -0.344573974609375, -0.32901763916015625, -0.3134613037109375, -0.29790496826171875, -0.2823486328125, -0.26679229736328125, -0.2512359619140625, -0.23567962646484375, -0.220123291015625, -0.20456695556640625, -0.1890106201171875, -0.17345428466796875, -0.15789794921875, -0.14234161376953125, -0.1267852783203125, -0.11122894287109375, -0.095672607421875, -0.08011627197265625, -0.0645599365234375, -0.04900360107421875, -0.033447265625, -0.01789093017578125, -0.0023345947265625, 0.01322174072265625, 0.028778076171875, 0.04433441162109375, 0.0598907470703125, 0.07544708251953125, 0.09100341796875, 0.10655975341796875, 0.1221160888671875, 0.13767242431640625, 0.153228759765625, 0.16878509521484375, 0.1843414306640625, 0.19989776611328125, 0.2154541015625, 0.23101043701171875, 0.2465667724609375, 0.26212310791015625, 0.277679443359375, 0.29323577880859375, 0.3087921142578125, 0.32434844970703125, 0.33990478515625, 0.35546112060546875, 0.3710174560546875, 0.38657379150390625, 0.402130126953125, 0.41768646240234375, 0.4332427978515625, 0.44879913330078125, 0.46435546875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 5.0, 3.0, 13.0, 12.0, 18.0, 18.0, 22.0, 31.0, 37.0, 34.0, 42.0, 36.0, 45.0, 45.0, 73.0, 47.0, 54.0, 53.0, 58.0, 42.0, 46.0, 43.0, 25.0, 41.0, 34.0, 32.0, 11.0, 20.0, 13.0, 15.0, 5.0, 5.0, 4.0, 5.0, 6.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.183349609375, -0.1782855987548828, -0.17322158813476562, -0.16815757751464844, -0.16309356689453125, -0.15802955627441406, -0.15296554565429688, -0.1479015350341797, -0.1428375244140625, -0.1377735137939453, -0.13270950317382812, -0.12764549255371094, -0.12258148193359375, -0.11751747131347656, -0.11245346069335938, -0.10738945007324219, -0.102325439453125, -0.09726142883300781, -0.09219741821289062, -0.08713340759277344, -0.08206939697265625, -0.07700538635253906, -0.07194137573242188, -0.06687736511230469, -0.0618133544921875, -0.05674934387207031, -0.051685333251953125, -0.04662132263183594, -0.04155731201171875, -0.03649330139160156, -0.031429290771484375, -0.026365280151367188, -0.02130126953125, -0.016237258911132812, -0.011173248291015625, -0.0061092376708984375, -0.00104522705078125, 0.0040187835693359375, 0.009082794189453125, 0.014146804809570312, 0.0192108154296875, 0.024274826049804688, 0.029338836669921875, 0.03440284729003906, 0.03946685791015625, 0.04453086853027344, 0.049594879150390625, 0.05465888977050781, 0.059722900390625, 0.06478691101074219, 0.06985092163085938, 0.07491493225097656, 0.07997894287109375, 0.08504295349121094, 0.09010696411132812, 0.09517097473144531, 0.1002349853515625, 0.10529899597167969, 0.11036300659179688, 0.11542701721191406, 0.12049102783203125, 0.12555503845214844, 0.13061904907226562, 0.1356830596923828, 0.1407470703125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 14.0, 14.0, 10.0, 22.0, 34.0, 66.0, 80.0, 151.0, 317.0, 636.0, 1737.0, 5617.0, 32652.0, 692174.0, 286468.0, 21605.0, 4326.0, 1439.0, 582.0, 250.0, 128.0, 72.0, 45.0, 40.0, 22.0, 22.0, 6.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47998046875, -0.46337127685546875, -0.4467620849609375, -0.43015289306640625, -0.413543701171875, -0.39693450927734375, -0.3803253173828125, -0.36371612548828125, -0.34710693359375, -0.33049774169921875, -0.3138885498046875, -0.29727935791015625, -0.280670166015625, -0.26406097412109375, -0.2474517822265625, -0.23084259033203125, -0.2142333984375, -0.19762420654296875, -0.1810150146484375, -0.16440582275390625, -0.147796630859375, -0.13118743896484375, -0.1145782470703125, -0.09796905517578125, -0.08135986328125, -0.06475067138671875, -0.0481414794921875, -0.03153228759765625, -0.014923095703125, 0.00168609619140625, 0.0182952880859375, 0.03490447998046875, 0.051513671875, 0.06812286376953125, 0.0847320556640625, 0.10134124755859375, 0.117950439453125, 0.13455963134765625, 0.1511688232421875, 0.16777801513671875, 0.18438720703125, 0.20099639892578125, 0.2176055908203125, 0.23421478271484375, 0.250823974609375, 0.26743316650390625, 0.2840423583984375, 0.30065155029296875, 0.3172607421875, 0.33386993408203125, 0.3504791259765625, 0.36708831787109375, 0.383697509765625, 0.40030670166015625, 0.4169158935546875, 0.43352508544921875, 0.45013427734375, 0.46674346923828125, 0.4833526611328125, 0.49996185302734375, 0.516571044921875, 0.5331802368164062, 0.5497894287109375, 0.5663986206054688, 0.5830078125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 9.0, 7.0, 7.0, 10.0, 14.0, 12.0, 22.0, 28.0, 20.0, 44.0, 32.0, 41.0, 44.0, 47.0, 80.0, 61.0, 80.0, 62.0, 65.0, 59.0, 47.0, 53.0, 37.0, 26.0, 24.0, 13.0, 12.0, 12.0, 9.0, 5.0, 5.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.72607421875, -0.7041702270507812, -0.6822662353515625, -0.6603622436523438, -0.638458251953125, -0.6165542602539062, -0.5946502685546875, -0.5727462768554688, -0.55084228515625, -0.5289382934570312, -0.5070343017578125, -0.48513031005859375, -0.463226318359375, -0.44132232666015625, -0.4194183349609375, -0.39751434326171875, -0.3756103515625, -0.35370635986328125, -0.3318023681640625, -0.30989837646484375, -0.287994384765625, -0.26609039306640625, -0.2441864013671875, -0.22228240966796875, -0.20037841796875, -0.17847442626953125, -0.1565704345703125, -0.13466644287109375, -0.112762451171875, -0.09085845947265625, -0.0689544677734375, -0.04705047607421875, -0.025146484375, -0.00324249267578125, 0.0186614990234375, 0.04056549072265625, 0.062469482421875, 0.08437347412109375, 0.1062774658203125, 0.12818145751953125, 0.15008544921875, 0.17198944091796875, 0.1938934326171875, 0.21579742431640625, 0.237701416015625, 0.25960540771484375, 0.2815093994140625, 0.30341339111328125, 0.3253173828125, 0.34722137451171875, 0.3691253662109375, 0.39102935791015625, 0.412933349609375, 0.43483734130859375, 0.4567413330078125, 0.47864532470703125, 0.50054931640625, 0.5224533081054688, 0.5443572998046875, 0.5662612915039062, 0.588165283203125, 0.6100692749023438, 0.6319732666015625, 0.6538772583007812, 0.67578125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 8.0, 2.0, 1.0, 17.0, 24.0, 28.0, 36.0, 44.0, 65.0, 98.0, 181.0, 292.0, 443.0, 641.0, 1260.0, 2124.0, 3952.0, 7663.0, 17025.0, 44336.0, 149388.0, 618629.0, 130958.0, 39757.0, 15673.0, 7282.0, 3617.0, 2037.0, 1082.0, 656.0, 415.0, 259.0, 151.0, 107.0, 85.0, 63.0, 38.0, 26.0, 19.0, 16.0, 11.0, 6.0, 9.0, 9.0, 2.0, 6.0, 1.0, 2.0, 2.0, 3.0, 2.0], "bins": [-0.097412109375, -0.09458446502685547, -0.09175682067871094, -0.0889291763305664, -0.08610153198242188, -0.08327388763427734, -0.08044624328613281, -0.07761859893798828, -0.07479095458984375, -0.07196331024169922, -0.06913566589355469, -0.06630802154541016, -0.06348037719726562, -0.060652732849121094, -0.05782508850097656, -0.05499744415283203, -0.0521697998046875, -0.04934215545654297, -0.04651451110839844, -0.043686866760253906, -0.040859222412109375, -0.038031578063964844, -0.03520393371582031, -0.03237628936767578, -0.02954864501953125, -0.02672100067138672, -0.023893356323242188, -0.021065711975097656, -0.018238067626953125, -0.015410423278808594, -0.012582778930664062, -0.009755134582519531, -0.006927490234375, -0.004099845886230469, -0.0012722015380859375, 0.0015554428100585938, 0.004383087158203125, 0.007210731506347656, 0.010038375854492188, 0.012866020202636719, 0.01569366455078125, 0.01852130889892578, 0.021348953247070312, 0.024176597595214844, 0.027004241943359375, 0.029831886291503906, 0.03265953063964844, 0.03548717498779297, 0.0383148193359375, 0.04114246368408203, 0.04397010803222656, 0.046797752380371094, 0.049625396728515625, 0.052453041076660156, 0.05528068542480469, 0.05810832977294922, 0.06093597412109375, 0.06376361846923828, 0.06659126281738281, 0.06941890716552734, 0.07224655151367188, 0.0750741958618164, 0.07790184020996094, 0.08072948455810547, 0.08355712890625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 8.0, 9.0, 3.0, 4.0, 15.0, 9.0, 12.0, 36.0, 35.0, 32.0, 53.0, 66.0, 61.0, 82.0, 88.0, 83.0, 68.0, 66.0, 59.0, 48.0, 36.0, 23.0, 18.0, 21.0, 13.0, 13.0, 9.0, 5.0, 4.0, 4.0, 2.0, 7.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9577484130859375e-05, -3.8324855268001556e-05, -3.707222640514374e-05, -3.581959754228592e-05, -3.45669686794281e-05, -3.331433981657028e-05, -3.206171095371246e-05, -3.0809082090854645e-05, -2.9556453227996826e-05, -2.8303824365139008e-05, -2.705119550228119e-05, -2.579856663942337e-05, -2.4545937776565552e-05, -2.3293308913707733e-05, -2.2040680050849915e-05, -2.0788051187992096e-05, -1.9535422325134277e-05, -1.828279346227646e-05, -1.703016459941864e-05, -1.577753573656082e-05, -1.4524906873703003e-05, -1.3272278010845184e-05, -1.2019649147987366e-05, -1.0767020285129547e-05, -9.514391422271729e-06, -8.26176255941391e-06, -7.009133696556091e-06, -5.756504833698273e-06, -4.503875970840454e-06, -3.2512471079826355e-06, -1.998618245124817e-06, -7.459893822669983e-07, 5.066394805908203e-07, 1.759268343448639e-06, 3.0118972063064575e-06, 4.264526069164276e-06, 5.517154932022095e-06, 6.769783794879913e-06, 8.022412657737732e-06, 9.27504152059555e-06, 1.0527670383453369e-05, 1.1780299246311188e-05, 1.3032928109169006e-05, 1.4285556972026825e-05, 1.5538185834884644e-05, 1.6790814697742462e-05, 1.804344356060028e-05, 1.92960724234581e-05, 2.0548701286315918e-05, 2.1801330149173737e-05, 2.3053959012031555e-05, 2.4306587874889374e-05, 2.5559216737747192e-05, 2.681184560060501e-05, 2.806447446346283e-05, 2.9317103326320648e-05, 3.056973218917847e-05, 3.1822361052036285e-05, 3.3074989914894104e-05, 3.432761877775192e-05, 3.558024764060974e-05, 3.683287650346756e-05, 3.808550536632538e-05, 3.93381342291832e-05, 4.0590763092041016e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 6.0, 5.0, 11.0, 7.0, 13.0, 15.0, 23.0, 42.0, 50.0, 107.0, 129.0, 225.0, 413.0, 791.0, 1900.0, 5326.0, 18537.0, 95191.0, 758093.0, 133265.0, 23788.0, 6302.0, 2244.0, 979.0, 443.0, 245.0, 140.0, 79.0, 57.0, 36.0, 31.0, 25.0, 16.0, 6.0, 4.0, 4.0, 3.0, 4.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.138671875, -0.1334552764892578, -0.12823867797851562, -0.12302207946777344, -0.11780548095703125, -0.11258888244628906, -0.10737228393554688, -0.10215568542480469, -0.0969390869140625, -0.09172248840332031, -0.08650588989257812, -0.08128929138183594, -0.07607269287109375, -0.07085609436035156, -0.06563949584960938, -0.06042289733886719, -0.055206298828125, -0.04998970031738281, -0.044773101806640625, -0.03955650329589844, -0.03433990478515625, -0.029123306274414062, -0.023906707763671875, -0.018690109252929688, -0.0134735107421875, -0.008256912231445312, -0.003040313720703125, 0.0021762847900390625, 0.00739288330078125, 0.012609481811523438, 0.017826080322265625, 0.023042678833007812, 0.02825927734375, 0.03347587585449219, 0.038692474365234375, 0.04390907287597656, 0.04912567138671875, 0.05434226989746094, 0.059558868408203125, 0.06477546691894531, 0.0699920654296875, 0.07520866394042969, 0.08042526245117188, 0.08564186096191406, 0.09085845947265625, 0.09607505798339844, 0.10129165649414062, 0.10650825500488281, 0.111724853515625, 0.11694145202636719, 0.12215805053710938, 0.12737464904785156, 0.13259124755859375, 0.13780784606933594, 0.14302444458007812, 0.1482410430908203, 0.1534576416015625, 0.1586742401123047, 0.16389083862304688, 0.16910743713378906, 0.17432403564453125, 0.17954063415527344, 0.18475723266601562, 0.1899738311767578, 0.1951904296875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 7.0, 4.0, 4.0, 1.0, 10.0, 9.0, 14.0, 15.0, 23.0, 36.0, 57.0, 58.0, 105.0, 136.0, 141.0, 117.0, 78.0, 52.0, 40.0, 25.0, 20.0, 12.0, 8.0, 5.0, 8.0, 8.0, 4.0, 3.0, 5.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16943359375, -0.16381263732910156, -0.15819168090820312, -0.1525707244873047, -0.14694976806640625, -0.1413288116455078, -0.13570785522460938, -0.13008689880371094, -0.1244659423828125, -0.11884498596191406, -0.11322402954101562, -0.10760307312011719, -0.10198211669921875, -0.09636116027832031, -0.09074020385742188, -0.08511924743652344, -0.079498291015625, -0.07387733459472656, -0.06825637817382812, -0.06263542175292969, -0.05701446533203125, -0.05139350891113281, -0.045772552490234375, -0.04015159606933594, -0.0345306396484375, -0.028909683227539062, -0.023288726806640625, -0.017667770385742188, -0.01204681396484375, -0.0064258575439453125, -0.000804901123046875, 0.0048160552978515625, 0.01043701171875, 0.016057968139648438, 0.021678924560546875, 0.027299880981445312, 0.03292083740234375, 0.03854179382324219, 0.044162750244140625, 0.04978370666503906, 0.0554046630859375, 0.06102561950683594, 0.06664657592773438, 0.07226753234863281, 0.07788848876953125, 0.08350944519042969, 0.08913040161132812, 0.09475135803222656, 0.100372314453125, 0.10599327087402344, 0.11161422729492188, 0.11723518371582031, 0.12285614013671875, 0.1284770965576172, 0.13409805297851562, 0.13971900939941406, 0.1453399658203125, 0.15096092224121094, 0.15658187866210938, 0.1622028350830078, 0.16782379150390625, 0.1734447479248047, 0.17906570434570312, 0.18468666076660156, 0.1903076171875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 6.0, 10.0, 17.0, 38.0, 85.0, 193.0, 364.0, 160.0, 72.0, 30.0, 8.0, 7.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.349461555480957, -5.211082458496094, -5.072703838348389, -4.934324741363525, -4.79594612121582, -4.657567024230957, -4.519187927246094, -4.380809307098389, -4.242430210113525, -4.104051113128662, -3.965672492980957, -3.8272933959960938, -3.6889145374298096, -3.5505356788635254, -3.412156581878662, -3.273777723312378, -3.1353988647460938, -2.9970200061798096, -2.8586411476135254, -2.720262050628662, -2.581883192062378, -2.4435043334960938, -2.3051252365112305, -2.1667463779449463, -2.028367519378662, -1.889988660812378, -1.7516096830368042, -1.6132307052612305, -1.4748518466949463, -1.336472988128662, -1.1980940103530884, -1.0597150325775146, -0.9213364124298096, -0.7829574942588806, -0.6445785760879517, -0.5061996579170227, -0.36782073974609375, -0.2294418215751648, -0.09106290340423584, 0.047316014766693115, 0.18569493293762207, 0.324073851108551, 0.46245276927948, 0.6008316874504089, 0.7392106056213379, 0.8775895237922668, 1.0159684419631958, 1.1543474197387695, 1.2927262783050537, 1.431105136871338, 1.5694841146469116, 1.7078630924224854, 1.8462419509887695, 1.9846208095550537, 2.122999668121338, 2.261378765106201, 2.3997576236724854, 2.5381364822387695, 2.676515579223633, 2.814894437789917, 2.953273296356201, 3.0916521549224854, 3.2300310134887695, 3.368410110473633, 3.506788969039917]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 11.0, 13.0, 8.0, 16.0, 11.0, 20.0, 27.0, 24.0, 19.0, 24.0, 34.0, 29.0, 50.0, 61.0, 78.0, 79.0, 90.0, 55.0, 39.0, 42.0, 38.0, 34.0, 25.0, 29.0, 23.0, 15.0, 20.0, 10.0, 21.0, 14.0, 5.0, 8.0, 8.0, 5.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0966553688049316, -2.030437469482422, -1.9642198085784912, -1.898002028465271, -1.8317842483520508, -1.7655664682388306, -1.6993486881256104, -1.6331309080123901, -1.56691312789917, -1.5006953477859497, -1.4344775676727295, -1.3682597875595093, -1.302042007446289, -1.2358242273330688, -1.1696064472198486, -1.1033886671066284, -1.0371708869934082, -0.970953106880188, -0.9047353267669678, -0.8385175466537476, -0.7722997665405273, -0.7060819864273071, -0.6398642063140869, -0.5736464262008667, -0.5074286460876465, -0.44121086597442627, -0.37499308586120605, -0.30877530574798584, -0.24255752563476562, -0.1763397455215454, -0.1101219654083252, -0.04390418529510498, 0.022313594818115234, 0.08853137493133545, 0.15474915504455566, 0.22096693515777588, 0.2871847152709961, 0.3534024953842163, 0.4196202754974365, 0.48583805561065674, 0.552055835723877, 0.6182736158370972, 0.6844913959503174, 0.7507091760635376, 0.8169269561767578, 0.883144736289978, 0.9493625164031982, 1.0155802965164185, 1.0817980766296387, 1.1480158567428589, 1.214233636856079, 1.2804514169692993, 1.3466691970825195, 1.4128869771957397, 1.47910475730896, 1.5453225374221802, 1.6115403175354004, 1.6777580976486206, 1.7439758777618408, 1.810193657875061, 1.8764114379882812, 1.9426292181015015, 2.0088469982147217, 2.0750646591186523, 2.141282558441162]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 9.0, 5.0, 11.0, 19.0, 23.0, 45.0, 62.0, 213.0, 479.0, 1518.0, 7902.0, 136377.0, 3944172.0, 93801.0, 7283.0, 1603.0, 404.0, 173.0, 71.0, 37.0, 23.0, 13.0, 3.0, 8.0, 9.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0], "bins": [-0.921875, -0.9011383056640625, -0.880401611328125, -0.8596649169921875, -0.83892822265625, -0.8181915283203125, -0.797454833984375, -0.7767181396484375, -0.7559814453125, -0.7352447509765625, -0.714508056640625, -0.6937713623046875, -0.67303466796875, -0.6522979736328125, -0.631561279296875, -0.6108245849609375, -0.590087890625, -0.5693511962890625, -0.548614501953125, -0.5278778076171875, -0.50714111328125, -0.4864044189453125, -0.465667724609375, -0.4449310302734375, -0.4241943359375, -0.4034576416015625, -0.382720947265625, -0.3619842529296875, -0.34124755859375, -0.3205108642578125, -0.299774169921875, -0.2790374755859375, -0.25830078125, -0.2375640869140625, -0.216827392578125, -0.1960906982421875, -0.17535400390625, -0.1546173095703125, -0.133880615234375, -0.1131439208984375, -0.0924072265625, -0.0716705322265625, -0.050933837890625, -0.0301971435546875, -0.00946044921875, 0.0112762451171875, 0.032012939453125, 0.0527496337890625, 0.073486328125, 0.0942230224609375, 0.114959716796875, 0.1356964111328125, 0.15643310546875, 0.1771697998046875, 0.197906494140625, 0.2186431884765625, 0.2393798828125, 0.2601165771484375, 0.280853271484375, 0.3015899658203125, 0.32232666015625, 0.3430633544921875, 0.363800048828125, 0.3845367431640625, 0.4052734375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 4.0, 9.0, 11.0, 11.0, 12.0, 18.0, 8.0, 18.0, 25.0, 32.0, 37.0, 46.0, 48.0, 48.0, 45.0, 53.0, 48.0, 57.0, 55.0, 45.0, 62.0, 41.0, 39.0, 36.0, 40.0, 40.0, 21.0, 21.0, 18.0, 11.0, 13.0, 11.0, 7.0, 8.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1820068359375, -0.1770172119140625, -0.172027587890625, -0.1670379638671875, -0.16204833984375, -0.1570587158203125, -0.152069091796875, -0.1470794677734375, -0.14208984375, -0.1371002197265625, -0.132110595703125, -0.1271209716796875, -0.12213134765625, -0.1171417236328125, -0.112152099609375, -0.1071624755859375, -0.1021728515625, -0.0971832275390625, -0.092193603515625, -0.0872039794921875, -0.08221435546875, -0.0772247314453125, -0.072235107421875, -0.0672454833984375, -0.062255859375, -0.0572662353515625, -0.052276611328125, -0.0472869873046875, -0.04229736328125, -0.0373077392578125, -0.032318115234375, -0.0273284912109375, -0.0223388671875, -0.0173492431640625, -0.012359619140625, -0.0073699951171875, -0.00238037109375, 0.0026092529296875, 0.007598876953125, 0.0125885009765625, 0.017578125, 0.0225677490234375, 0.027557373046875, 0.0325469970703125, 0.03753662109375, 0.0425262451171875, 0.047515869140625, 0.0525054931640625, 0.0574951171875, 0.0624847412109375, 0.067474365234375, 0.0724639892578125, 0.07745361328125, 0.0824432373046875, 0.087432861328125, 0.0924224853515625, 0.097412109375, 0.1024017333984375, 0.107391357421875, 0.1123809814453125, 0.11737060546875, 0.1223602294921875, 0.127349853515625, 0.1323394775390625, 0.1373291015625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 1.0, 7.0, 8.0, 8.0, 11.0, 14.0, 28.0, 33.0, 49.0, 99.0, 223.0, 493.0, 1383.0, 4418.0, 19791.0, 206775.0, 3755449.0, 180731.0, 18127.0, 4280.0, 1320.0, 483.0, 209.0, 96.0, 74.0, 50.0, 28.0, 15.0, 13.0, 14.0, 12.0, 4.0, 5.0, 8.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.6103515625, -0.5936203002929688, -0.5768890380859375, -0.5601577758789062, -0.543426513671875, -0.5266952514648438, -0.5099639892578125, -0.49323272705078125, -0.47650146484375, -0.45977020263671875, -0.4430389404296875, -0.42630767822265625, -0.409576416015625, -0.39284515380859375, -0.3761138916015625, -0.35938262939453125, -0.3426513671875, -0.32592010498046875, -0.3091888427734375, -0.29245758056640625, -0.275726318359375, -0.25899505615234375, -0.2422637939453125, -0.22553253173828125, -0.20880126953125, -0.19207000732421875, -0.1753387451171875, -0.15860748291015625, -0.141876220703125, -0.12514495849609375, -0.1084136962890625, -0.09168243408203125, -0.074951171875, -0.05821990966796875, -0.0414886474609375, -0.02475738525390625, -0.008026123046875, 0.00870513916015625, 0.0254364013671875, 0.04216766357421875, 0.05889892578125, 0.07563018798828125, 0.0923614501953125, 0.10909271240234375, 0.125823974609375, 0.14255523681640625, 0.1592864990234375, 0.17601776123046875, 0.1927490234375, 0.20948028564453125, 0.2262115478515625, 0.24294281005859375, 0.259674072265625, 0.27640533447265625, 0.2931365966796875, 0.30986785888671875, 0.32659912109375, 0.34333038330078125, 0.3600616455078125, 0.37679290771484375, 0.393524169921875, 0.41025543212890625, 0.4269866943359375, 0.44371795654296875, 0.46044921875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 7.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 7.0, 14.0, 8.0, 16.0, 23.0, 27.0, 39.0, 61.0, 73.0, 98.0, 204.0, 298.0, 515.0, 738.0, 673.0, 451.0, 290.0, 159.0, 106.0, 72.0, 44.0, 34.0, 29.0, 21.0, 9.0, 9.0, 4.0, 4.0, 7.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.279296875, -0.2688941955566406, -0.25849151611328125, -0.24808883666992188, -0.2376861572265625, -0.22728347778320312, -0.21688079833984375, -0.20647811889648438, -0.196075439453125, -0.18567276000976562, -0.17527008056640625, -0.16486740112304688, -0.1544647216796875, -0.14406204223632812, -0.13365936279296875, -0.12325668334960938, -0.11285400390625, -0.10245132446289062, -0.09204864501953125, -0.08164596557617188, -0.0712432861328125, -0.060840606689453125, -0.05043792724609375, -0.040035247802734375, -0.029632568359375, -0.019229888916015625, -0.00882720947265625, 0.001575469970703125, 0.0119781494140625, 0.022380828857421875, 0.03278350830078125, 0.043186187744140625, 0.0535888671875, 0.06399154663085938, 0.07439422607421875, 0.08479690551757812, 0.0951995849609375, 0.10560226440429688, 0.11600494384765625, 0.12640762329101562, 0.136810302734375, 0.14721298217773438, 0.15761566162109375, 0.16801834106445312, 0.1784210205078125, 0.18882369995117188, 0.19922637939453125, 0.20962905883789062, 0.22003173828125, 0.23043441772460938, 0.24083709716796875, 0.2512397766113281, 0.2616424560546875, 0.2720451354980469, 0.28244781494140625, 0.2928504943847656, 0.303253173828125, 0.3136558532714844, 0.32405853271484375, 0.3344612121582031, 0.3448638916015625, 0.3552665710449219, 0.36566925048828125, 0.3760719299316406, 0.386474609375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 12.0, 22.0, 50.0, 118.0, 201.0, 277.0, 181.0, 78.0, 29.0, 11.0, 12.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2776670455932617, -3.1167852878570557, -2.9559032917022705, -2.7950215339660645, -2.6341397762298584, -2.4732580184936523, -2.312376022338867, -2.151494264602661, -1.9906123876571655, -1.82973051071167, -1.6688487529754639, -1.5079668760299683, -1.3470849990844727, -1.1862032413482666, -1.025321364402771, -0.8644396066665649, -0.7035577297210693, -0.5426759123802185, -0.3817940652370453, -0.22091221809387207, -0.06003040075302124, 0.10085141658782959, 0.2617332935333252, 0.42261505126953125, 0.5834969282150269, 0.7443787455558777, 0.9052605628967285, 1.0661424398422241, 1.2270243167877197, 1.3879060745239258, 1.5487879514694214, 1.7096697092056274, 1.870551586151123, 2.031433343887329, 2.1923153400421143, 2.3531970977783203, 2.5140788555145264, 2.6749606132507324, 2.8358426094055176, 2.9967243671417236, 3.1576061248779297, 3.3184878826141357, 3.479369878768921, 3.640251636505127, 3.801133394241333, 3.962015151977539, 4.122897148132324, 4.283779144287109, 4.4446611404418945, 4.60554313659668, 4.766424655914307, 4.927306652069092, 5.088188648223877, 5.249070167541504, 5.409952163696289, 5.570834159851074, 5.731715679168701, 5.892597675323486, 6.053479194641113, 6.214361190795898, 6.375243186950684, 6.5361247062683105, 6.697006702423096, 6.857888221740723, 7.018770217895508]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 7.0, 8.0, 6.0, 11.0, 11.0, 26.0, 21.0, 27.0, 41.0, 53.0, 38.0, 40.0, 65.0, 67.0, 65.0, 87.0, 67.0, 56.0, 46.0, 48.0, 31.0, 44.0, 28.0, 23.0, 19.0, 17.0, 15.0, 13.0, 5.0, 4.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.068406581878662, -2.000345230102539, -1.9322841167449951, -1.8642228841781616, -1.7961616516113281, -1.728100299835205, -1.6600390672683716, -1.591977834701538, -1.5239166021347046, -1.455855369567871, -1.3877941370010376, -1.319732904434204, -1.251671552658081, -1.183610439300537, -1.115549087524414, -1.0474878549575806, -0.9794266223907471, -0.9113653898239136, -0.8433041572570801, -0.7752428650856018, -0.7071816325187683, -0.6391203999519348, -0.5710591077804565, -0.502997875213623, -0.43493664264678955, -0.36687541007995605, -0.29881414771080017, -0.23075290024280548, -0.1626916527748108, -0.0946304202079773, -0.02656915783882141, 0.04149210453033447, 0.10955333709716797, 0.17761458456516266, 0.24567583203315735, 0.31373709440231323, 0.38179832696914673, 0.4498595595359802, 0.5179208517074585, 0.585982084274292, 0.6540433168411255, 0.722104549407959, 0.7901657819747925, 0.8582270741462708, 0.9262883067131042, 0.9943495392799377, 1.062410831451416, 1.1304720640182495, 1.198533296585083, 1.2665945291519165, 1.33465576171875, 1.4027169942855835, 1.470778226852417, 1.53883957862854, 1.6069008111953735, 1.674962043762207, 1.7430232763290405, 1.811084508895874, 1.8791457414627075, 1.947206974029541, 2.015268325805664, 2.083329439163208, 2.151390790939331, 2.219451904296875, 2.287513256072998]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 9.0, 16.0, 14.0, 29.0, 25.0, 56.0, 79.0, 133.0, 164.0, 280.0, 504.0, 896.0, 1819.0, 4208.0, 10501.0, 31366.0, 116795.0, 483676.0, 297584.0, 66905.0, 20148.0, 7196.0, 2978.0, 1387.0, 680.0, 404.0, 242.0, 141.0, 95.0, 70.0, 43.0, 36.0, 21.0, 17.0, 6.0, 4.0, 7.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2425537109375, -0.2341327667236328, -0.22571182250976562, -0.21729087829589844, -0.20886993408203125, -0.20044898986816406, -0.19202804565429688, -0.1836071014404297, -0.1751861572265625, -0.1667652130126953, -0.15834426879882812, -0.14992332458496094, -0.14150238037109375, -0.13308143615722656, -0.12466049194335938, -0.11623954772949219, -0.107818603515625, -0.09939765930175781, -0.09097671508789062, -0.08255577087402344, -0.07413482666015625, -0.06571388244628906, -0.057292938232421875, -0.04887199401855469, -0.0404510498046875, -0.03203010559082031, -0.023609161376953125, -0.015188217163085938, -0.00676727294921875, 0.0016536712646484375, 0.010074615478515625, 0.018495559692382812, 0.02691650390625, 0.03533744812011719, 0.043758392333984375, 0.05217933654785156, 0.06060028076171875, 0.06902122497558594, 0.07744216918945312, 0.08586311340332031, 0.0942840576171875, 0.10270500183105469, 0.11112594604492188, 0.11954689025878906, 0.12796783447265625, 0.13638877868652344, 0.14480972290039062, 0.1532306671142578, 0.161651611328125, 0.1700725555419922, 0.17849349975585938, 0.18691444396972656, 0.19533538818359375, 0.20375633239746094, 0.21217727661132812, 0.2205982208251953, 0.2290191650390625, 0.2374401092529297, 0.24586105346679688, 0.25428199768066406, 0.26270294189453125, 0.27112388610839844, 0.2795448303222656, 0.2879657745361328, 0.29638671875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 6.0, 14.0, 14.0, 14.0, 27.0, 36.0, 33.0, 42.0, 53.0, 54.0, 59.0, 70.0, 79.0, 65.0, 55.0, 63.0, 51.0, 40.0, 36.0, 56.0, 34.0, 19.0, 27.0, 17.0, 9.0, 13.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1351318359375, -0.1284351348876953, -0.12173843383789062, -0.11504173278808594, -0.10834503173828125, -0.10164833068847656, -0.09495162963867188, -0.08825492858886719, -0.0815582275390625, -0.07486152648925781, -0.06816482543945312, -0.06146812438964844, -0.05477142333984375, -0.04807472229003906, -0.041378021240234375, -0.03468132019042969, -0.027984619140625, -0.021287918090820312, -0.014591217041015625, -0.007894515991210938, -0.00119781494140625, 0.0054988861083984375, 0.012195587158203125, 0.018892288208007812, 0.0255889892578125, 0.03228569030761719, 0.038982391357421875, 0.04567909240722656, 0.05237579345703125, 0.05907249450683594, 0.06576919555664062, 0.07246589660644531, 0.07916259765625, 0.08585929870605469, 0.09255599975585938, 0.09925270080566406, 0.10594940185546875, 0.11264610290527344, 0.11934280395507812, 0.1260395050048828, 0.1327362060546875, 0.1394329071044922, 0.14612960815429688, 0.15282630920410156, 0.15952301025390625, 0.16621971130371094, 0.17291641235351562, 0.1796131134033203, 0.186309814453125, 0.1930065155029297, 0.19970321655273438, 0.20639991760253906, 0.21309661865234375, 0.21979331970214844, 0.22649002075195312, 0.2331867218017578, 0.2398834228515625, 0.2465801239013672, 0.2532768249511719, 0.25997352600097656, 0.26667022705078125, 0.27336692810058594, 0.2800636291503906, 0.2867603302001953, 0.29345703125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 10.0, 18.0, 24.0, 33.0, 56.0, 77.0, 122.0, 251.0, 482.0, 1176.0, 4167.0, 23935.0, 748545.0, 249386.0, 15286.0, 3045.0, 967.0, 434.0, 208.0, 120.0, 82.0, 39.0, 27.0, 17.0, 7.0, 7.0, 5.0, 2.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0], "bins": [-0.88916015625, -0.8684310913085938, -0.8477020263671875, -0.8269729614257812, -0.806243896484375, -0.7855148315429688, -0.7647857666015625, -0.7440567016601562, -0.72332763671875, -0.7025985717773438, -0.6818695068359375, -0.6611404418945312, -0.640411376953125, -0.6196823120117188, -0.5989532470703125, -0.5782241821289062, -0.5574951171875, -0.5367660522460938, -0.5160369873046875, -0.49530792236328125, -0.474578857421875, -0.45384979248046875, -0.4331207275390625, -0.41239166259765625, -0.39166259765625, -0.37093353271484375, -0.3502044677734375, -0.32947540283203125, -0.308746337890625, -0.28801727294921875, -0.2672882080078125, -0.24655914306640625, -0.225830078125, -0.20510101318359375, -0.1843719482421875, -0.16364288330078125, -0.142913818359375, -0.12218475341796875, -0.1014556884765625, -0.08072662353515625, -0.05999755859375, -0.03926849365234375, -0.0185394287109375, 0.00218963623046875, 0.022918701171875, 0.04364776611328125, 0.0643768310546875, 0.08510589599609375, 0.1058349609375, 0.12656402587890625, 0.1472930908203125, 0.16802215576171875, 0.188751220703125, 0.20948028564453125, 0.2302093505859375, 0.25093841552734375, 0.27166748046875, 0.29239654541015625, 0.3131256103515625, 0.33385467529296875, 0.354583740234375, 0.37531280517578125, 0.3960418701171875, 0.41677093505859375, 0.4375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 9.0, 6.0, 7.0, 10.0, 11.0, 8.0, 17.0, 22.0, 31.0, 38.0, 59.0, 57.0, 67.0, 90.0, 88.0, 86.0, 79.0, 58.0, 53.0, 56.0, 38.0, 26.0, 22.0, 19.0, 13.0, 8.0, 3.0, 7.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-1.1796875, -1.150115966796875, -1.12054443359375, -1.090972900390625, -1.0614013671875, -1.031829833984375, -1.00225830078125, -0.972686767578125, -0.943115234375, -0.913543701171875, -0.88397216796875, -0.854400634765625, -0.8248291015625, -0.795257568359375, -0.76568603515625, -0.736114501953125, -0.70654296875, -0.676971435546875, -0.64739990234375, -0.617828369140625, -0.5882568359375, -0.558685302734375, -0.52911376953125, -0.499542236328125, -0.469970703125, -0.440399169921875, -0.41082763671875, -0.381256103515625, -0.3516845703125, -0.322113037109375, -0.29254150390625, -0.262969970703125, -0.2333984375, -0.203826904296875, -0.17425537109375, -0.144683837890625, -0.1151123046875, -0.085540771484375, -0.05596923828125, -0.026397705078125, 0.003173828125, 0.032745361328125, 0.06231689453125, 0.091888427734375, 0.1214599609375, 0.151031494140625, 0.18060302734375, 0.210174560546875, 0.23974609375, 0.269317626953125, 0.29888916015625, 0.328460693359375, 0.3580322265625, 0.387603759765625, 0.41717529296875, 0.446746826171875, 0.476318359375, 0.505889892578125, 0.53546142578125, 0.565032958984375, 0.5946044921875, 0.624176025390625, 0.65374755859375, 0.683319091796875, 0.712890625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 3.0, 10.0, 17.0, 26.0, 58.0, 275.0, 2373.0, 415102.0, 627903.0, 2364.0, 277.0, 73.0, 34.0, 10.0, 7.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5927734375, -0.5753402709960938, -0.5579071044921875, -0.5404739379882812, -0.523040771484375, -0.5056076049804688, -0.4881744384765625, -0.47074127197265625, -0.45330810546875, -0.43587493896484375, -0.4184417724609375, -0.40100860595703125, -0.383575439453125, -0.36614227294921875, -0.3487091064453125, -0.33127593994140625, -0.3138427734375, -0.29640960693359375, -0.2789764404296875, -0.26154327392578125, -0.244110107421875, -0.22667694091796875, -0.2092437744140625, -0.19181060791015625, -0.17437744140625, -0.15694427490234375, -0.1395111083984375, -0.12207794189453125, -0.104644775390625, -0.08721160888671875, -0.0697784423828125, -0.05234527587890625, -0.034912109375, -0.01747894287109375, -4.57763671875e-05, 0.01738739013671875, 0.034820556640625, 0.05225372314453125, 0.0696868896484375, 0.08712005615234375, 0.10455322265625, 0.12198638916015625, 0.1394195556640625, 0.15685272216796875, 0.174285888671875, 0.19171905517578125, 0.2091522216796875, 0.22658538818359375, 0.2440185546875, 0.26145172119140625, 0.2788848876953125, 0.29631805419921875, 0.313751220703125, 0.33118438720703125, 0.3486175537109375, 0.36605072021484375, 0.38348388671875, 0.40091705322265625, 0.4183502197265625, 0.43578338623046875, 0.453216552734375, 0.47064971923828125, 0.4880828857421875, 0.5055160522460938, 0.52294921875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 6.0, 2.0, 7.0, 5.0, 11.0, 17.0, 5.0, 16.0, 16.0, 31.0, 35.0, 46.0, 63.0, 94.0, 103.0, 109.0, 105.0, 92.0, 52.0, 50.0, 40.0, 16.0, 17.0, 20.0, 13.0, 9.0, 6.0, 6.0, 4.0, 2.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.941225051879883e-05, -4.772935062646866e-05, -4.604645073413849e-05, -4.436355084180832e-05, -4.268065094947815e-05, -4.099775105714798e-05, -3.931485116481781e-05, -3.763195127248764e-05, -3.594905138015747e-05, -3.42661514878273e-05, -3.258325159549713e-05, -3.090035170316696e-05, -2.9217451810836792e-05, -2.7534551918506622e-05, -2.5851652026176453e-05, -2.4168752133846283e-05, -2.2485852241516113e-05, -2.0802952349185944e-05, -1.9120052456855774e-05, -1.7437152564525604e-05, -1.5754252672195435e-05, -1.4071352779865265e-05, -1.2388452887535095e-05, -1.0705552995204926e-05, -9.022653102874756e-06, -7.339753210544586e-06, -5.6568533182144165e-06, -3.973953425884247e-06, -2.291053533554077e-06, -6.081536412239075e-07, 1.0747462511062622e-06, 2.757646143436432e-06, 4.4405460357666016e-06, 6.123445928096771e-06, 7.806345820426941e-06, 9.48924571275711e-06, 1.117214560508728e-05, 1.285504549741745e-05, 1.453794538974762e-05, 1.622084528207779e-05, 1.790374517440796e-05, 1.958664506673813e-05, 2.12695449590683e-05, 2.2952444851398468e-05, 2.4635344743728638e-05, 2.6318244636058807e-05, 2.8001144528388977e-05, 2.9684044420719147e-05, 3.1366944313049316e-05, 3.3049844205379486e-05, 3.4732744097709656e-05, 3.6415643990039825e-05, 3.8098543882369995e-05, 3.9781443774700165e-05, 4.1464343667030334e-05, 4.3147243559360504e-05, 4.4830143451690674e-05, 4.6513043344020844e-05, 4.819594323635101e-05, 4.987884312868118e-05, 5.156174302101135e-05, 5.324464291334152e-05, 5.492754280567169e-05, 5.661044269800186e-05, 5.829334259033203e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 6.0, 6.0, 4.0, 7.0, 9.0, 16.0, 18.0, 20.0, 28.0, 48.0, 62.0, 97.0, 153.0, 279.0, 494.0, 1066.0, 2439.0, 7236.0, 28870.0, 219070.0, 719945.0, 51560.0, 10816.0, 3440.0, 1377.0, 617.0, 373.0, 182.0, 98.0, 60.0, 33.0, 20.0, 23.0, 19.0, 16.0, 11.0, 6.0, 17.0, 3.0, 4.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.164794921875, -0.15982627868652344, -0.15485763549804688, -0.1498889923095703, -0.14492034912109375, -0.1399517059326172, -0.13498306274414062, -0.13001441955566406, -0.1250457763671875, -0.12007713317871094, -0.11510848999023438, -0.11013984680175781, -0.10517120361328125, -0.10020256042480469, -0.09523391723632812, -0.09026527404785156, -0.085296630859375, -0.08032798767089844, -0.07535934448242188, -0.07039070129394531, -0.06542205810546875, -0.06045341491699219, -0.055484771728515625, -0.05051612854003906, -0.0455474853515625, -0.04057884216308594, -0.035610198974609375, -0.030641555786132812, -0.02567291259765625, -0.020704269409179688, -0.015735626220703125, -0.010766983032226562, -0.00579833984375, -0.0008296966552734375, 0.004138946533203125, 0.009107589721679688, 0.01407623291015625, 0.019044876098632812, 0.024013519287109375, 0.028982162475585938, 0.0339508056640625, 0.03891944885253906, 0.043888092041015625, 0.04885673522949219, 0.05382537841796875, 0.05879402160644531, 0.06376266479492188, 0.06873130798339844, 0.073699951171875, 0.07866859436035156, 0.08363723754882812, 0.08860588073730469, 0.09357452392578125, 0.09854316711425781, 0.10351181030273438, 0.10848045349121094, 0.1134490966796875, 0.11841773986816406, 0.12338638305664062, 0.1283550262451172, 0.13332366943359375, 0.1382923126220703, 0.14326095581054688, 0.14822959899902344, 0.1531982421875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 10.0, 10.0, 12.0, 20.0, 26.0, 27.0, 50.0, 67.0, 108.0, 124.0, 119.0, 126.0, 94.0, 65.0, 48.0, 16.0, 14.0, 19.0, 9.0, 6.0, 5.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1802978515625, -0.1741485595703125, -0.167999267578125, -0.1618499755859375, -0.15570068359375, -0.1495513916015625, -0.143402099609375, -0.1372528076171875, -0.131103515625, -0.1249542236328125, -0.118804931640625, -0.1126556396484375, -0.10650634765625, -0.1003570556640625, -0.094207763671875, -0.0880584716796875, -0.0819091796875, -0.0757598876953125, -0.069610595703125, -0.0634613037109375, -0.05731201171875, -0.0511627197265625, -0.045013427734375, -0.0388641357421875, -0.03271484375, -0.0265655517578125, -0.020416259765625, -0.0142669677734375, -0.00811767578125, -0.0019683837890625, 0.004180908203125, 0.0103302001953125, 0.0164794921875, 0.0226287841796875, 0.028778076171875, 0.0349273681640625, 0.04107666015625, 0.0472259521484375, 0.053375244140625, 0.0595245361328125, 0.065673828125, 0.0718231201171875, 0.077972412109375, 0.0841217041015625, 0.09027099609375, 0.0964202880859375, 0.102569580078125, 0.1087188720703125, 0.1148681640625, 0.1210174560546875, 0.127166748046875, 0.1333160400390625, 0.13946533203125, 0.1456146240234375, 0.151763916015625, 0.1579132080078125, 0.1640625, 0.1702117919921875, 0.176361083984375, 0.1825103759765625, 0.18865966796875, 0.1948089599609375, 0.200958251953125, 0.2071075439453125, 0.2132568359375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 9.0, 74.0, 799.0, 118.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.703781127929688, -29.13824462890625, -28.57270622253418, -28.007169723510742, -27.441633224487305, -26.876094818115234, -26.310558319091797, -25.74502182006836, -25.179485321044922, -24.613948822021484, -24.048410415649414, -23.482873916625977, -22.91733741760254, -22.35179901123047, -21.78626251220703, -21.220726013183594, -20.655187606811523, -20.089651107788086, -19.524112701416016, -18.958576202392578, -18.39303970336914, -17.827503204345703, -17.261964797973633, -16.696428298950195, -16.130889892578125, -15.565352439880371, -14.999815940856934, -14.43427848815918, -13.868741989135742, -13.303204536437988, -12.737667083740234, -12.172130584716797, -11.60659408569336, -11.041056632995605, -10.475520133972168, -9.909982681274414, -9.344446182250977, -8.778908729553223, -8.213371276855469, -7.647834300994873, -7.082297325134277, -6.516760349273682, -5.951223373413086, -5.385685920715332, -4.820148944854736, -4.254611968994141, -3.689074754714966, -3.123537540435791, -2.5580005645751953, -1.99246346950531, -1.4269263744354248, -0.8613892793655396, -0.2958521842956543, 0.2696847915649414, 0.8352220058441162, 1.400759220123291, 1.9662961959838867, 2.5318331718444824, 3.0973703861236572, 3.662907600402832, 4.228444576263428, 4.793981552124023, 5.359519004821777, 5.925055980682373, 6.490592956542969]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 11.0, 12.0, 16.0, 23.0, 40.0, 41.0, 54.0, 74.0, 105.0, 194.0, 127.0, 65.0, 60.0, 43.0, 41.0, 36.0, 23.0, 14.0, 7.0, 5.0, 3.0, 6.0, 5.0, 4.0], "bins": [-7.6267619132995605, -7.473153114318848, -7.319544792175293, -7.16593599319458, -7.012327194213867, -6.858718395233154, -6.7051100730896, -6.551501274108887, -6.397892475128174, -6.244283676147461, -6.090675354003906, -5.937066555023193, -5.7834577560424805, -5.629848957061768, -5.476240634918213, -5.3226318359375, -5.169023513793945, -5.015414714813232, -4.861806392669678, -4.708197593688965, -4.554588794708252, -4.400979995727539, -4.247371673583984, -4.0937628746032715, -3.9401540756225586, -3.786545515060425, -3.632936716079712, -3.479328155517578, -3.3257193565368652, -3.1721107959747314, -3.0185022354125977, -2.8648934364318848, -2.7112843990325928, -2.557675838470459, -2.404067039489746, -2.2504584789276123, -2.0968496799468994, -1.9432411193847656, -1.7896324396133423, -1.636023759841919, -1.4824150800704956, -1.3288064002990723, -1.175197720527649, -1.0215890407562256, -0.867980420589447, -0.7143717408180237, -0.5607631206512451, -0.4071544408798218, -0.25354576110839844, -0.09993709623813629, 0.053671568632125854, 0.2072802186012268, 0.36088889837265015, 0.5144975781440735, 0.668106198310852, 0.8217148780822754, 0.9753235578536987, 1.128932237625122, 1.2825409173965454, 1.4361495971679688, 1.5897581577301025, 1.7433669567108154, 1.8969755172729492, 2.050584316253662, 2.204192876815796]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 5.0, 6.0, 8.0, 20.0, 25.0, 50.0, 109.0, 260.0, 939.0, 6688.0, 494677.0, 3666748.0, 21429.0, 2633.0, 456.0, 127.0, 58.0, 20.0, 9.0, 8.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.142578125, -2.0990219116210938, -2.0554656982421875, -2.0119094848632812, -1.968353271484375, -1.9247970581054688, -1.8812408447265625, -1.8376846313476562, -1.79412841796875, -1.7505722045898438, -1.7070159912109375, -1.6634597778320312, -1.619903564453125, -1.5763473510742188, -1.5327911376953125, -1.4892349243164062, -1.4456787109375, -1.4021224975585938, -1.3585662841796875, -1.3150100708007812, -1.271453857421875, -1.2278976440429688, -1.1843414306640625, -1.1407852172851562, -1.09722900390625, -1.0536727905273438, -1.0101165771484375, -0.9665603637695312, -0.923004150390625, -0.8794479370117188, -0.8358917236328125, -0.7923355102539062, -0.748779296875, -0.7052230834960938, -0.6616668701171875, -0.6181106567382812, -0.574554443359375, -0.5309982299804688, -0.4874420166015625, -0.44388580322265625, -0.40032958984375, -0.35677337646484375, -0.3132171630859375, -0.26966094970703125, -0.226104736328125, -0.18254852294921875, -0.1389923095703125, -0.09543609619140625, -0.0518798828125, -0.00832366943359375, 0.0352325439453125, 0.07878875732421875, 0.122344970703125, 0.16590118408203125, 0.2094573974609375, 0.25301361083984375, 0.29656982421875, 0.34012603759765625, 0.3836822509765625, 0.42723846435546875, 0.470794677734375, 0.5143508911132812, 0.5579071044921875, 0.6014633178710938, 0.64501953125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 8.0, 11.0, 29.0, 48.0, 56.0, 68.0, 117.0, 111.0, 118.0, 133.0, 93.0, 73.0, 59.0, 41.0, 21.0, 15.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.61328125, -0.6011180877685547, -0.5889549255371094, -0.5767917633056641, -0.5646286010742188, -0.5524654388427734, -0.5403022766113281, -0.5281391143798828, -0.5159759521484375, -0.5038127899169922, -0.4916496276855469, -0.47948646545410156, -0.46732330322265625, -0.45516014099121094, -0.4429969787597656, -0.4308338165283203, -0.418670654296875, -0.4065074920654297, -0.3943443298339844, -0.38218116760253906, -0.37001800537109375, -0.35785484313964844, -0.3456916809082031, -0.3335285186767578, -0.3213653564453125, -0.3092021942138672, -0.2970390319824219, -0.28487586975097656, -0.27271270751953125, -0.26054954528808594, -0.24838638305664062, -0.2362232208251953, -0.22406005859375, -0.2118968963623047, -0.19973373413085938, -0.18757057189941406, -0.17540740966796875, -0.16324424743652344, -0.15108108520507812, -0.1389179229736328, -0.1267547607421875, -0.11459159851074219, -0.10242843627929688, -0.09026527404785156, -0.07810211181640625, -0.06593894958496094, -0.053775787353515625, -0.04161262512207031, -0.029449462890625, -0.017286300659179688, -0.005123138427734375, 0.0070400238037109375, 0.01920318603515625, 0.03136634826660156, 0.043529510498046875, 0.05569267272949219, 0.0678558349609375, 0.08001899719238281, 0.09218215942382812, 0.10434532165527344, 0.11650848388671875, 0.12867164611816406, 0.14083480834960938, 0.1529979705810547, 0.1651611328125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 10.0, 8.0, 14.0, 18.0, 32.0, 58.0, 77.0, 146.0, 271.0, 616.0, 1827.0, 8998.0, 444939.0, 3713408.0, 19295.0, 2777.0, 920.0, 351.0, 211.0, 104.0, 55.0, 46.0, 31.0, 16.0, 11.0, 8.0, 9.0, 8.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3330078125, -1.28729248046875, -1.2415771484375, -1.19586181640625, -1.150146484375, -1.10443115234375, -1.0587158203125, -1.01300048828125, -0.96728515625, -0.92156982421875, -0.8758544921875, -0.83013916015625, -0.784423828125, -0.73870849609375, -0.6929931640625, -0.64727783203125, -0.6015625, -0.55584716796875, -0.5101318359375, -0.46441650390625, -0.418701171875, -0.37298583984375, -0.3272705078125, -0.28155517578125, -0.23583984375, -0.19012451171875, -0.1444091796875, -0.09869384765625, -0.052978515625, -0.00726318359375, 0.0384521484375, 0.08416748046875, 0.1298828125, 0.17559814453125, 0.2213134765625, 0.26702880859375, 0.312744140625, 0.35845947265625, 0.4041748046875, 0.44989013671875, 0.49560546875, 0.54132080078125, 0.5870361328125, 0.63275146484375, 0.678466796875, 0.72418212890625, 0.7698974609375, 0.81561279296875, 0.861328125, 0.90704345703125, 0.9527587890625, 0.99847412109375, 1.044189453125, 1.08990478515625, 1.1356201171875, 1.18133544921875, 1.22705078125, 1.27276611328125, 1.3184814453125, 1.36419677734375, 1.409912109375, 1.45562744140625, 1.5013427734375, 1.54705810546875, 1.5927734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 12.0, 9.0, 19.0, 19.0, 38.0, 56.0, 53.0, 88.0, 129.0, 201.0, 315.0, 439.0, 605.0, 660.0, 469.0, 298.0, 221.0, 140.0, 81.0, 75.0, 26.0, 26.0, 18.0, 13.0, 13.0, 11.0, 6.0, 2.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.476806640625, -0.4585380554199219, -0.44026947021484375, -0.4220008850097656, -0.4037322998046875, -0.3854637145996094, -0.36719512939453125, -0.3489265441894531, -0.330657958984375, -0.3123893737792969, -0.29412078857421875, -0.2758522033691406, -0.2575836181640625, -0.23931503295898438, -0.22104644775390625, -0.20277786254882812, -0.18450927734375, -0.16624069213867188, -0.14797210693359375, -0.12970352172851562, -0.1114349365234375, -0.09316635131835938, -0.07489776611328125, -0.056629180908203125, -0.038360595703125, -0.020092010498046875, -0.00182342529296875, 0.016445159912109375, 0.0347137451171875, 0.052982330322265625, 0.07125091552734375, 0.08951950073242188, 0.1077880859375, 0.12605667114257812, 0.14432525634765625, 0.16259384155273438, 0.1808624267578125, 0.19913101196289062, 0.21739959716796875, 0.23566818237304688, 0.253936767578125, 0.2722053527832031, 0.29047393798828125, 0.3087425231933594, 0.3270111083984375, 0.3452796936035156, 0.36354827880859375, 0.3818168640136719, 0.40008544921875, 0.4183540344238281, 0.43662261962890625, 0.4548912048339844, 0.4731597900390625, 0.4914283752441406, 0.5096969604492188, 0.5279655456542969, 0.546234130859375, 0.5645027160644531, 0.5827713012695312, 0.6010398864746094, 0.6193084716796875, 0.6375770568847656, 0.6558456420898438, 0.6741142272949219, 0.6923828125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 11.0, 20.0, 38.0, 111.0, 264.0, 293.0, 157.0, 55.0, 32.0, 12.0, 7.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.400297164916992, -11.046185493469238, -10.692072868347168, -10.337961196899414, -9.983848571777344, -9.62973690032959, -9.275625228881836, -8.921512603759766, -8.567399978637695, -8.213288307189941, -7.859175682067871, -7.505064010620117, -7.150951385498047, -6.796839714050293, -6.442727565765381, -6.088615417480469, -5.734503746032715, -5.380391597747803, -5.026279449462891, -4.672167778015137, -4.318055152893066, -3.9639432430267334, -3.6098313331604004, -3.2557191848754883, -2.901607036590576, -2.547494888305664, -2.193382740020752, -1.839270830154419, -1.4851586818695068, -1.1310465335845947, -0.7769346237182617, -0.4228224754333496, -0.0687103271484375, 0.28540176153182983, 0.6395138502120972, 0.9936258792877197, 1.3477380275726318, 1.701850175857544, 2.055962085723877, 2.410074234008789, 2.764186382293701, 3.1182985305786133, 3.4724106788635254, 3.8265225887298584, 4.180634498596191, 4.534747123718262, 4.888858795166016, 5.242970943450928, 5.59708309173584, 5.951195240020752, 6.305307388305664, 6.659419059753418, 7.013531684875488, 7.367643356323242, 7.721755504608154, 8.075867652893066, 8.42997932434082, 8.784090995788574, 9.138203620910645, 9.492315292358398, 9.846427917480469, 10.200539588928223, 10.554651260375977, 10.908763885498047, 11.262876510620117]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 13.0, 9.0, 14.0, 21.0, 17.0, 15.0, 32.0, 25.0, 43.0, 45.0, 50.0, 67.0, 67.0, 71.0, 74.0, 56.0, 72.0, 52.0, 49.0, 46.0, 29.0, 33.0, 28.0, 23.0, 8.0, 12.0, 7.0, 7.0, 6.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.021679401397705, -2.910008668899536, -2.798337936401367, -2.686666965484619, -2.57499623298645, -2.4633255004882812, -2.351654529571533, -2.2399837970733643, -2.1283130645751953, -2.0166423320770264, -1.9049714803695679, -1.7933006286621094, -1.6816298961639404, -1.5699591636657715, -1.458288311958313, -1.3466174602508545, -1.2349467277526855, -1.1232759952545166, -1.011605143547058, -0.8999343514442444, -0.7882635593414307, -0.6765927672386169, -0.5649219751358032, -0.4532511830329895, -0.3415803909301758, -0.22990959882736206, -0.11823880672454834, -0.006568014621734619, 0.1051027774810791, 0.21677356958389282, 0.32844436168670654, 0.44011515378952026, 0.551785945892334, 0.6634567379951477, 0.7751275300979614, 0.8867983222007751, 0.9984691143035889, 1.1101398468017578, 1.2218106985092163, 1.3334815502166748, 1.4451522827148438, 1.5568230152130127, 1.6684938669204712, 1.7801647186279297, 1.8918354511260986, 2.0035061836242676, 2.1151771545410156, 2.2268478870391846, 2.3385186195373535, 2.4501893520355225, 2.5618600845336914, 2.6735310554504395, 2.7852017879486084, 2.8968725204467773, 3.0085434913635254, 3.1202142238616943, 3.2318849563598633, 3.3435556888580322, 3.455226421356201, 3.566897392272949, 3.678568124771118, 3.790238857269287, 3.901909828186035, 4.013580322265625, 4.125251293182373]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 6.0, 13.0, 11.0, 20.0, 29.0, 44.0, 86.0, 119.0, 238.0, 529.0, 1028.0, 2448.0, 7207.0, 27355.0, 158023.0, 701037.0, 118428.0, 21785.0, 6034.0, 2174.0, 913.0, 456.0, 243.0, 111.0, 75.0, 49.0, 34.0, 23.0, 14.0, 8.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.363525390625, -0.3515777587890625, -0.339630126953125, -0.3276824951171875, -0.31573486328125, -0.3037872314453125, -0.291839599609375, -0.2798919677734375, -0.2679443359375, -0.2559967041015625, -0.244049072265625, -0.2321014404296875, -0.22015380859375, -0.2082061767578125, -0.196258544921875, -0.1843109130859375, -0.17236328125, -0.1604156494140625, -0.148468017578125, -0.1365203857421875, -0.12457275390625, -0.1126251220703125, -0.100677490234375, -0.0887298583984375, -0.0767822265625, -0.0648345947265625, -0.052886962890625, -0.0409393310546875, -0.02899169921875, -0.0170440673828125, -0.005096435546875, 0.0068511962890625, 0.018798828125, 0.0307464599609375, 0.042694091796875, 0.0546417236328125, 0.06658935546875, 0.0785369873046875, 0.090484619140625, 0.1024322509765625, 0.1143798828125, 0.1263275146484375, 0.138275146484375, 0.1502227783203125, 0.16217041015625, 0.1741180419921875, 0.186065673828125, 0.1980133056640625, 0.2099609375, 0.2219085693359375, 0.233856201171875, 0.2458038330078125, 0.25775146484375, 0.2696990966796875, 0.281646728515625, 0.2935943603515625, 0.3055419921875, 0.3174896240234375, 0.329437255859375, 0.3413848876953125, 0.35333251953125, 0.3652801513671875, 0.377227783203125, 0.3891754150390625, 0.401123046875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 4.0, 3.0, 0.0, 4.0, 6.0, 5.0, 6.0, 13.0, 13.0, 27.0, 32.0, 32.0, 35.0, 47.0, 65.0, 46.0, 65.0, 69.0, 63.0, 81.0, 62.0, 64.0, 36.0, 49.0, 39.0, 28.0, 32.0, 19.0, 16.0, 16.0, 10.0, 11.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1988525390625, -0.1895732879638672, -0.18029403686523438, -0.17101478576660156, -0.16173553466796875, -0.15245628356933594, -0.14317703247070312, -0.1338977813720703, -0.1246185302734375, -0.11533927917480469, -0.10606002807617188, -0.09678077697753906, -0.08750152587890625, -0.07822227478027344, -0.06894302368164062, -0.05966377258300781, -0.050384521484375, -0.04110527038574219, -0.031826019287109375, -0.022546768188476562, -0.01326751708984375, -0.0039882659912109375, 0.005290985107421875, 0.014570236206054688, 0.0238494873046875, 0.03312873840332031, 0.042407989501953125, 0.05168724060058594, 0.06096649169921875, 0.07024574279785156, 0.07952499389648438, 0.08880424499511719, 0.09808349609375, 0.10736274719238281, 0.11664199829101562, 0.12592124938964844, 0.13520050048828125, 0.14447975158691406, 0.15375900268554688, 0.1630382537841797, 0.1723175048828125, 0.1815967559814453, 0.19087600708007812, 0.20015525817871094, 0.20943450927734375, 0.21871376037597656, 0.22799301147460938, 0.2372722625732422, 0.246551513671875, 0.2558307647705078, 0.2651100158691406, 0.27438926696777344, 0.28366851806640625, 0.29294776916503906, 0.3022270202636719, 0.3115062713623047, 0.3207855224609375, 0.3300647735595703, 0.3393440246582031, 0.34862327575683594, 0.35790252685546875, 0.36718177795410156, 0.3764610290527344, 0.3857402801513672, 0.39501953125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 6.0, 8.0, 12.0, 19.0, 15.0, 28.0, 69.0, 161.0, 323.0, 919.0, 4320.0, 56664.0, 957795.0, 24241.0, 2661.0, 733.0, 284.0, 116.0, 80.0, 33.0, 28.0, 12.0, 13.0, 8.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6630859375, -0.63970947265625, -0.6163330078125, -0.59295654296875, -0.569580078125, -0.54620361328125, -0.5228271484375, -0.49945068359375, -0.47607421875, -0.45269775390625, -0.4293212890625, -0.40594482421875, -0.382568359375, -0.35919189453125, -0.3358154296875, -0.31243896484375, -0.2890625, -0.26568603515625, -0.2423095703125, -0.21893310546875, -0.195556640625, -0.17218017578125, -0.1488037109375, -0.12542724609375, -0.10205078125, -0.07867431640625, -0.0552978515625, -0.03192138671875, -0.008544921875, 0.01483154296875, 0.0382080078125, 0.06158447265625, 0.0849609375, 0.10833740234375, 0.1317138671875, 0.15509033203125, 0.178466796875, 0.20184326171875, 0.2252197265625, 0.24859619140625, 0.27197265625, 0.29534912109375, 0.3187255859375, 0.34210205078125, 0.365478515625, 0.38885498046875, 0.4122314453125, 0.43560791015625, 0.458984375, 0.48236083984375, 0.5057373046875, 0.52911376953125, 0.552490234375, 0.57586669921875, 0.5992431640625, 0.62261962890625, 0.64599609375, 0.66937255859375, 0.6927490234375, 0.71612548828125, 0.739501953125, 0.76287841796875, 0.7862548828125, 0.80963134765625, 0.8330078125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 6.0, 5.0, 2.0, 4.0, 10.0, 19.0, 11.0, 13.0, 9.0, 28.0, 23.0, 35.0, 40.0, 42.0, 62.0, 60.0, 72.0, 74.0, 80.0, 56.0, 64.0, 46.0, 29.0, 34.0, 25.0, 19.0, 17.0, 16.0, 21.0, 19.0, 3.0, 12.0, 10.0, 4.0, 5.0, 8.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.9228515625, -0.893707275390625, -0.86456298828125, -0.835418701171875, -0.8062744140625, -0.777130126953125, -0.74798583984375, -0.718841552734375, -0.689697265625, -0.660552978515625, -0.63140869140625, -0.602264404296875, -0.5731201171875, -0.543975830078125, -0.51483154296875, -0.485687255859375, -0.45654296875, -0.427398681640625, -0.39825439453125, -0.369110107421875, -0.3399658203125, -0.310821533203125, -0.28167724609375, -0.252532958984375, -0.223388671875, -0.194244384765625, -0.16510009765625, -0.135955810546875, -0.1068115234375, -0.077667236328125, -0.04852294921875, -0.019378662109375, 0.009765625, 0.038909912109375, 0.06805419921875, 0.097198486328125, 0.1263427734375, 0.155487060546875, 0.18463134765625, 0.213775634765625, 0.242919921875, 0.272064208984375, 0.30120849609375, 0.330352783203125, 0.3594970703125, 0.388641357421875, 0.41778564453125, 0.446929931640625, 0.47607421875, 0.505218505859375, 0.53436279296875, 0.563507080078125, 0.5926513671875, 0.621795654296875, 0.65093994140625, 0.680084228515625, 0.709228515625, 0.738372802734375, 0.76751708984375, 0.796661376953125, 0.8258056640625, 0.854949951171875, 0.88409423828125, 0.913238525390625, 0.9423828125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 15.0, 39.0, 57.0, 87.0, 216.0, 420.0, 1015.0, 3544.0, 18101.0, 402606.0, 598483.0, 18597.0, 3491.0, 1013.0, 391.0, 222.0, 97.0, 61.0, 31.0, 17.0, 12.0, 8.0, 6.0, 2.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11602783203125, -0.11202716827392578, -0.10802650451660156, -0.10402584075927734, -0.10002517700195312, -0.0960245132446289, -0.09202384948730469, -0.08802318572998047, -0.08402252197265625, -0.08002185821533203, -0.07602119445800781, -0.0720205307006836, -0.06801986694335938, -0.06401920318603516, -0.06001853942871094, -0.05601787567138672, -0.0520172119140625, -0.04801654815673828, -0.04401588439941406, -0.040015220642089844, -0.036014556884765625, -0.032013893127441406, -0.028013229370117188, -0.02401256561279297, -0.02001190185546875, -0.01601123809814453, -0.012010574340820312, -0.008009910583496094, -0.004009246826171875, -8.58306884765625e-06, 0.0039920806884765625, 0.007992744445800781, 0.011993408203125, 0.01599407196044922, 0.019994735717773438, 0.023995399475097656, 0.027996063232421875, 0.031996726989746094, 0.03599739074707031, 0.03999805450439453, 0.04399871826171875, 0.04799938201904297, 0.05200004577636719, 0.056000709533691406, 0.060001373291015625, 0.06400203704833984, 0.06800270080566406, 0.07200336456298828, 0.0760040283203125, 0.08000469207763672, 0.08400535583496094, 0.08800601959228516, 0.09200668334960938, 0.0960073471069336, 0.10000801086425781, 0.10400867462158203, 0.10800933837890625, 0.11201000213623047, 0.11601066589355469, 0.1200113296508789, 0.12401199340820312, 0.12801265716552734, 0.13201332092285156, 0.13601398468017578, 0.1400146484375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 6.0, 4.0, 3.0, 5.0, 7.0, 10.0, 8.0, 5.0, 10.0, 8.0, 17.0, 19.0, 25.0, 40.0, 47.0, 74.0, 81.0, 105.0, 146.0, 91.0, 69.0, 66.0, 37.0, 25.0, 22.0, 12.0, 9.0, 11.0, 6.0, 8.0, 5.0, 4.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.547834396362305e-05, -4.409998655319214e-05, -4.272162914276123e-05, -4.134327173233032e-05, -3.9964914321899414e-05, -3.8586556911468506e-05, -3.72081995010376e-05, -3.582984209060669e-05, -3.445148468017578e-05, -3.307312726974487e-05, -3.1694769859313965e-05, -3.0316412448883057e-05, -2.893805503845215e-05, -2.755969762802124e-05, -2.6181340217590332e-05, -2.4802982807159424e-05, -2.3424625396728516e-05, -2.2046267986297607e-05, -2.06679105758667e-05, -1.928955316543579e-05, -1.7911195755004883e-05, -1.6532838344573975e-05, -1.5154480934143066e-05, -1.3776123523712158e-05, -1.239776611328125e-05, -1.1019408702850342e-05, -9.641051292419434e-06, -8.262693881988525e-06, -6.884336471557617e-06, -5.505979061126709e-06, -4.127621650695801e-06, -2.7492642402648926e-06, -1.3709068298339844e-06, 7.450580596923828e-09, 1.385807991027832e-06, 2.7641654014587402e-06, 4.1425228118896484e-06, 5.520880222320557e-06, 6.899237632751465e-06, 8.277595043182373e-06, 9.655952453613281e-06, 1.103430986404419e-05, 1.2412667274475098e-05, 1.3791024684906006e-05, 1.5169382095336914e-05, 1.6547739505767822e-05, 1.792609691619873e-05, 1.930445432662964e-05, 2.0682811737060547e-05, 2.2061169147491455e-05, 2.3439526557922363e-05, 2.481788396835327e-05, 2.619624137878418e-05, 2.7574598789215088e-05, 2.8952956199645996e-05, 3.0331313610076904e-05, 3.170967102050781e-05, 3.308802843093872e-05, 3.446638584136963e-05, 3.584474325180054e-05, 3.7223100662231445e-05, 3.8601458072662354e-05, 3.997981548309326e-05, 4.135817289352417e-05, 4.273653030395508e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 4.0, 6.0, 11.0, 9.0, 19.0, 24.0, 40.0, 64.0, 119.0, 216.0, 509.0, 1246.0, 3718.0, 14754.0, 99150.0, 868042.0, 47298.0, 9065.0, 2571.0, 875.0, 384.0, 178.0, 101.0, 57.0, 25.0, 26.0, 12.0, 13.0, 11.0, 6.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.146728515625, -0.14279842376708984, -0.1388683319091797, -0.13493824005126953, -0.13100814819335938, -0.12707805633544922, -0.12314796447753906, -0.1192178726196289, -0.11528778076171875, -0.1113576889038086, -0.10742759704589844, -0.10349750518798828, -0.09956741333007812, -0.09563732147216797, -0.09170722961425781, -0.08777713775634766, -0.0838470458984375, -0.07991695404052734, -0.07598686218261719, -0.07205677032470703, -0.06812667846679688, -0.06419658660888672, -0.06026649475097656, -0.056336402893066406, -0.05240631103515625, -0.048476219177246094, -0.04454612731933594, -0.04061603546142578, -0.036685943603515625, -0.03275585174560547, -0.028825759887695312, -0.024895668029785156, -0.020965576171875, -0.017035484313964844, -0.013105392456054688, -0.009175300598144531, -0.005245208740234375, -0.0013151168823242188, 0.0026149749755859375, 0.006545066833496094, 0.01047515869140625, 0.014405250549316406, 0.018335342407226562, 0.02226543426513672, 0.026195526123046875, 0.03012561798095703, 0.03405570983886719, 0.037985801696777344, 0.0419158935546875, 0.045845985412597656, 0.04977607727050781, 0.05370616912841797, 0.057636260986328125, 0.06156635284423828, 0.06549644470214844, 0.0694265365600586, 0.07335662841796875, 0.0772867202758789, 0.08121681213378906, 0.08514690399169922, 0.08907699584960938, 0.09300708770751953, 0.09693717956542969, 0.10086727142333984, 0.10479736328125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 10.0, 3.0, 10.0, 6.0, 18.0, 17.0, 17.0, 25.0, 44.0, 34.0, 67.0, 75.0, 83.0, 108.0, 103.0, 79.0, 63.0, 59.0, 38.0, 35.0, 24.0, 18.0, 15.0, 12.0, 11.0, 9.0, 3.0, 2.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07501220703125, -0.07200431823730469, -0.06899642944335938, -0.06598854064941406, -0.06298065185546875, -0.05997276306152344, -0.056964874267578125, -0.05395698547363281, -0.0509490966796875, -0.04794120788574219, -0.044933319091796875, -0.04192543029785156, -0.03891754150390625, -0.03590965270996094, -0.032901763916015625, -0.029893875122070312, -0.026885986328125, -0.023878097534179688, -0.020870208740234375, -0.017862319946289062, -0.01485443115234375, -0.011846542358398438, -0.008838653564453125, -0.0058307647705078125, -0.0028228759765625, 0.0001850128173828125, 0.003192901611328125, 0.0062007904052734375, 0.00920867919921875, 0.012216567993164062, 0.015224456787109375, 0.018232345581054688, 0.021240234375, 0.024248123168945312, 0.027256011962890625, 0.030263900756835938, 0.03327178955078125, 0.03627967834472656, 0.039287567138671875, 0.04229545593261719, 0.0453033447265625, 0.04831123352050781, 0.051319122314453125, 0.05432701110839844, 0.05733489990234375, 0.06034278869628906, 0.06335067749023438, 0.06635856628417969, 0.069366455078125, 0.07237434387207031, 0.07538223266601562, 0.07839012145996094, 0.08139801025390625, 0.08440589904785156, 0.08741378784179688, 0.09042167663574219, 0.0934295654296875, 0.09643745422363281, 0.09944534301757812, 0.10245323181152344, 0.10546112060546875, 0.10846900939941406, 0.11147689819335938, 0.11448478698730469, 0.11749267578125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 9.0, 1.0, 4.0, 5.0, 17.0, 26.0, 48.0, 156.0, 447.0, 141.0, 68.0, 38.0, 23.0, 14.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1545372009277344, -2.014742612838745, -1.8749477863311768, -1.7351531982421875, -1.5953584909439087, -1.4555637836456299, -1.3157691955566406, -1.1759744882583618, -1.036179780960083, -0.8963850736618042, -0.7565904259681702, -0.6167957782745361, -0.4770010709762573, -0.3372063636779785, -0.19741171598434448, -0.05761706829071045, 0.08217763900756836, 0.22197231650352478, 0.3617669939994812, 0.5015616416931152, 0.641356348991394, 0.7811510562896729, 0.9209457039833069, 1.060740351676941, 1.2005350589752197, 1.3403297662734985, 1.4801244735717773, 1.6199190616607666, 1.7597137689590454, 1.8995084762573242, 2.0393030643463135, 2.1790976524353027, 2.3188929557800293, 2.4586875438690186, 2.598482370376587, 2.738276958465576, 2.8780717849731445, 3.017866373062134, 3.157660961151123, 3.2974557876586914, 3.4372503757476807, 3.57704496383667, 3.7168397903442383, 3.8566343784332275, 3.996428966522217, 4.136223793029785, 4.2760186195373535, 4.415812969207764, 4.555607795715332, 4.6954026222229, 4.8351969718933105, 4.974991798400879, 5.114786624908447, 5.254581451416016, 5.394375801086426, 5.534170627593994, 5.6739654541015625, 5.813760280609131, 5.953554630279541, 6.093349456787109, 6.233144283294678, 6.372939109802246, 6.512733459472656, 6.652528285980225, 6.792322635650635]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 5.0, 6.0, 5.0, 3.0, 4.0, 9.0, 10.0, 5.0, 8.0, 17.0, 15.0, 27.0, 14.0, 30.0, 39.0, 31.0, 71.0, 109.0, 161.0, 107.0, 74.0, 41.0, 22.0, 27.0, 15.0, 17.0, 21.0, 14.0, 15.0, 13.0, 15.0, 8.0, 8.0, 9.0, 7.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.4799249172210693, -2.4034242630004883, -2.3269236087799072, -2.250422954559326, -2.173922300338745, -2.097421646118164, -2.020920991897583, -1.944420337677002, -1.867919683456421, -1.7914190292358398, -1.7149183750152588, -1.6384177207946777, -1.5619170665740967, -1.4854164123535156, -1.4089157581329346, -1.3324151039123535, -1.2559144496917725, -1.1794137954711914, -1.1029131412506104, -1.0264124870300293, -0.9499118328094482, -0.8734111785888672, -0.7969105243682861, -0.7204098701477051, -0.643909215927124, -0.567408561706543, -0.4909079074859619, -0.41440725326538086, -0.3379065990447998, -0.26140594482421875, -0.1849052906036377, -0.10840463638305664, -0.031903743743896484, 0.04459691047668457, 0.12109756469726562, 0.19759821891784668, 0.27409887313842773, 0.3505995273590088, 0.42710018157958984, 0.5036008358001709, 0.580101490020752, 0.656602144241333, 0.7331027984619141, 0.8096034526824951, 0.8861041069030762, 0.9626047611236572, 1.0391054153442383, 1.1156060695648193, 1.1921067237854004, 1.2686073780059814, 1.3451080322265625, 1.4216086864471436, 1.4981093406677246, 1.5746099948883057, 1.6511106491088867, 1.7276113033294678, 1.8041119575500488, 1.8806126117706299, 1.957113265991211, 2.033613920211792, 2.110114574432373, 2.186615228652954, 2.263115882873535, 2.339616537094116, 2.4161171913146973]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 6.0, 8.0, 15.0, 22.0, 24.0, 30.0, 42.0, 58.0, 50.0, 103.0, 274.0, 90.0, 78.0, 52.0, 40.0, 27.0, 23.0, 21.0, 21.0, 8.0, 9.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.5947265625, -0.5821952819824219, -0.5696640014648438, -0.5571327209472656, -0.5446014404296875, -0.5320701599121094, -0.5195388793945312, -0.5070075988769531, -0.494476318359375, -0.4819450378417969, -0.46941375732421875, -0.4568824768066406, -0.4443511962890625, -0.4318199157714844, -0.41928863525390625, -0.4067573547363281, -0.39422607421875, -0.3816947937011719, -0.36916351318359375, -0.3566322326660156, -0.3441009521484375, -0.3315696716308594, -0.31903839111328125, -0.3065071105957031, -0.293975830078125, -0.2814445495605469, -0.26891326904296875, -0.2563819885253906, -0.2438507080078125, -0.23131942749023438, -0.21878814697265625, -0.20625686645507812, -0.1937255859375, -0.18119430541992188, -0.16866302490234375, -0.15613174438476562, -0.1436004638671875, -0.13106918334960938, -0.11853790283203125, -0.10600662231445312, -0.093475341796875, -0.08094406127929688, -0.06841278076171875, -0.055881500244140625, -0.0433502197265625, -0.030818939208984375, -0.01828765869140625, -0.005756378173828125, 0.00677490234375, 0.019306182861328125, 0.03183746337890625, 0.044368743896484375, 0.0569000244140625, 0.06943130493164062, 0.08196258544921875, 0.09449386596679688, 0.107025146484375, 0.11955642700195312, 0.13208770751953125, 0.14461898803710938, 0.1571502685546875, 0.16968154907226562, 0.18221282958984375, 0.19474411010742188, 0.207275390625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 4.0, 5.0, 1.0, 3.0, 10.0, 4.0, 17.0, 17.0, 14.0, 23.0, 31.0, 35.0, 51.0, 72.0, 175.0, 363.0, 1301.0, 7462.0, 8329077.0, 45295.0, 3318.0, 723.0, 247.0, 90.0, 74.0, 41.0, 39.0, 18.0, 20.0, 14.0, 8.0, 5.0, 2.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 10.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0], "bins": [-2.142411947250366, -2.072843074798584, -2.003274440765381, -1.9337055683135986, -1.864136815071106, -1.7945680618286133, -1.724999189376831, -1.6554304361343384, -1.5858616828918457, -1.516292929649353, -1.4467240571975708, -1.3771553039550781, -1.3075865507125854, -1.2380177974700928, -1.1684489250183105, -1.0988801717758179, -1.0293112993240356, -0.9597424864768982, -0.8901737332344055, -0.8206049203872681, -0.7510361671447754, -0.6814673542976379, -0.6118985414505005, -0.5423297882080078, -0.47276097536087036, -0.4031921923160553, -0.33362340927124023, -0.2640545964241028, -0.19448581337928772, -0.12491703033447266, -0.055348217487335205, 0.014220565557479858, 0.08378934860229492, 0.15335813164710999, 0.22292692959308624, 0.2924957275390625, 0.36206451058387756, 0.4316332936286926, 0.5012021064758301, 0.5707708597183228, 0.6403396725654602, 0.7099084854125977, 0.7794772386550903, 0.8490460515022278, 0.9186148643493652, 0.9881836175918579, 1.0577523708343506, 1.1273212432861328, 1.1968899965286255, 1.2664587497711182, 1.3360276222229004, 1.405596375465393, 1.4751651287078857, 1.544734001159668, 1.6143027544021606, 1.6838715076446533, 1.7534403800964355, 1.8230091333389282, 1.8925780057907104, 1.9621467590332031, 2.0317156314849854, 2.1012842655181885, 2.1708531379699707, 2.240422010421753, 2.309990644454956]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 6.0, 4.0, 5.0, 4.0, 3.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 5.0, 4.0, 4.0, 5.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8204708099365234, -2.755647897720337, -2.6908252239227295, -2.626002311706543, -2.5611793994903564, -2.496356725692749, -2.4315338134765625, -2.366710901260376, -2.3018882274627686, -2.237065315246582, -2.1722426414489746, -2.107419729232788, -2.0425968170166016, -1.9777741432189941, -1.9129512310028076, -1.8481284379959106, -1.7833055257797241, -1.7184827327728271, -1.6536598205566406, -1.5888370275497437, -1.5240142345428467, -1.4591913223266602, -1.3943685293197632, -1.3295457363128662, -1.2647228240966797, -1.1999000310897827, -1.1350771188735962, -1.0702543258666992, -1.0054315328598022, -0.9406086802482605, -0.8757858276367188, -0.8109630346298218, -0.7461402416229248, -0.6813173890113831, -0.6164945960044861, -0.5516717433929443, -0.486848920583725, -0.4220260977745056, -0.35720324516296387, -0.2923804223537445, -0.22755759954452515, -0.1627347767353058, -0.09791193902492523, -0.03308910131454468, 0.03173372149467468, 0.09655654430389404, 0.1613793969154358, 0.22620221972465515, 0.2910250425338745, 0.35584786534309387, 0.42067068815231323, 0.485493540763855, 0.550316333770752, 0.6151391863822937, 0.6799620389938354, 0.7447848320007324, 0.8096076846122742, 0.8744305372238159, 0.9392533302307129, 1.0040762424468994, 1.0688990354537964, 1.1337218284606934, 1.1985447406768799, 1.2633675336837769, 1.3281903266906738]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 7.0, 2.0, 3.0, 3.0, 3.0, 14.0, 7.0, 9.0, 8.0, 11.0, 11.0, 11.0, 19.0, 19.0, 27.0, 22.0, 34.0, 29.0, 47.0, 43.0, 48.0, 49.0, 33.0, 41.0, 46.0, 46.0, 41.0, 51.0, 43.0, 43.0, 44.0, 31.0, 25.0, 27.0, 26.0, 12.0, 5.0, 14.0, 16.0, 8.0, 5.0, 4.0, 4.0, 5.0, 3.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.17333984375, -0.16819381713867188, -0.16304779052734375, -0.15790176391601562, -0.1527557373046875, -0.14760971069335938, -0.14246368408203125, -0.13731765747070312, -0.132171630859375, -0.12702560424804688, -0.12187957763671875, -0.11673355102539062, -0.1115875244140625, -0.10644149780273438, -0.10129547119140625, -0.09614944458007812, -0.09100341796875, -0.08585739135742188, -0.08071136474609375, -0.07556533813476562, -0.0704193115234375, -0.06527328491210938, -0.06012725830078125, -0.054981231689453125, -0.049835205078125, -0.044689178466796875, -0.03954315185546875, -0.034397125244140625, -0.0292510986328125, -0.024105072021484375, -0.01895904541015625, -0.013813018798828125, -0.0086669921875, -0.003520965576171875, 0.00162506103515625, 0.006771087646484375, 0.0119171142578125, 0.017063140869140625, 0.02220916748046875, 0.027355194091796875, 0.032501220703125, 0.037647247314453125, 0.04279327392578125, 0.047939300537109375, 0.0530853271484375, 0.058231353759765625, 0.06337738037109375, 0.06852340698242188, 0.07366943359375, 0.07881546020507812, 0.08396148681640625, 0.08910751342773438, 0.0942535400390625, 0.09939956665039062, 0.10454559326171875, 0.10969161987304688, 0.114837646484375, 0.11998367309570312, 0.12512969970703125, 0.13027572631835938, 0.1354217529296875, 0.14056777954101562, 0.14571380615234375, 0.15085983276367188, 0.156005859375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 7.0, 6.0, 23.0, 23.0, 27.0, 40.0, 59.0, 133.0, 182.0, 322.0, 604.0, 1205.0, 2531.0, 6373.0, 18427.0, 59167.0, 177892.0, 171597.0, 56310.0, 17681.0, 6335.0, 2636.0, 1189.0, 560.0, 324.0, 211.0, 126.0, 87.0, 57.0, 33.0, 27.0, 17.0, 16.0, 13.0, 9.0, 5.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0966796875, -1.0509490966796875, -1.005218505859375, -0.9594879150390625, -0.91375732421875, -0.8680267333984375, -0.822296142578125, -0.7765655517578125, -0.7308349609375, -0.6851043701171875, -0.639373779296875, -0.5936431884765625, -0.54791259765625, -0.5021820068359375, -0.456451416015625, -0.4107208251953125, -0.364990234375, -0.3192596435546875, -0.273529052734375, -0.2277984619140625, -0.18206787109375, -0.1363372802734375, -0.090606689453125, -0.0448760986328125, 0.0008544921875, 0.0465850830078125, 0.092315673828125, 0.1380462646484375, 0.18377685546875, 0.2295074462890625, 0.275238037109375, 0.3209686279296875, 0.36669921875, 0.4124298095703125, 0.458160400390625, 0.5038909912109375, 0.54962158203125, 0.5953521728515625, 0.641082763671875, 0.6868133544921875, 0.7325439453125, 0.7782745361328125, 0.824005126953125, 0.8697357177734375, 0.91546630859375, 0.9611968994140625, 1.006927490234375, 1.0526580810546875, 1.098388671875, 1.1441192626953125, 1.189849853515625, 1.2355804443359375, 1.28131103515625, 1.3270416259765625, 1.372772216796875, 1.4185028076171875, 1.4642333984375, 1.5099639892578125, 1.555694580078125, 1.6014251708984375, 1.64715576171875, 1.6928863525390625, 1.738616943359375, 1.7843475341796875, 1.830078125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 6.0, 5.0, 3.0, 7.0, 15.0, 24.0, 28.0, 54.0, 62.0, 70.0, 81.0, 88.0, 122.0, 90.0, 84.0, 58.0, 42.0, 54.0, 26.0, 34.0, 11.0, 10.0, 11.0, 8.0, 4.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.356689453125, -0.3457183837890625, -0.334747314453125, -0.3237762451171875, -0.31280517578125, -0.3018341064453125, -0.290863037109375, -0.2798919677734375, -0.2689208984375, -0.2579498291015625, -0.246978759765625, -0.2360076904296875, -0.22503662109375, -0.2140655517578125, -0.203094482421875, -0.1921234130859375, -0.18115234375, -0.1701812744140625, -0.159210205078125, -0.1482391357421875, -0.13726806640625, -0.1262969970703125, -0.115325927734375, -0.1043548583984375, -0.0933837890625, -0.0824127197265625, -0.071441650390625, -0.0604705810546875, -0.04949951171875, -0.0385284423828125, -0.027557373046875, -0.0165863037109375, -0.005615234375, 0.0053558349609375, 0.016326904296875, 0.0272979736328125, 0.03826904296875, 0.0492401123046875, 0.060211181640625, 0.0711822509765625, 0.0821533203125, 0.0931243896484375, 0.104095458984375, 0.1150665283203125, 0.12603759765625, 0.1370086669921875, 0.147979736328125, 0.1589508056640625, 0.169921875, 0.1808929443359375, 0.191864013671875, 0.2028350830078125, 0.21380615234375, 0.2247772216796875, 0.235748291015625, 0.2467193603515625, 0.2576904296875, 0.2686614990234375, 0.279632568359375, 0.2906036376953125, 0.30157470703125, 0.3125457763671875, 0.323516845703125, 0.3344879150390625, 0.345458984375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 2.0, 12.0, 11.0, 29.0, 52.0, 90.0, 96.0, 82.0, 38.0, 23.0, 6.0, 6.0, 2.0, 6.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.4527597427368164, -2.388012170791626, -2.3232648372650146, -2.258517265319824, -2.193769693374634, -2.1290221214294434, -2.064274787902832, -1.9995272159576416, -1.9347796440124512, -1.8700321912765503, -1.8052846193313599, -1.740537166595459, -1.6757895946502686, -1.6110421419143677, -1.5462946891784668, -1.4815471172332764, -1.4167996644973755, -1.3520522117614746, -1.2873046398162842, -1.2225571870803833, -1.1578096151351929, -1.093062162399292, -1.0283145904541016, -0.9635671377182007, -0.898819625377655, -0.8340721130371094, -0.7693246006965637, -0.7045770883560181, -0.6398296356201172, -0.5750820636749268, -0.5103346109390259, -0.4455870985984802, -0.380839467048645, -0.31609195470809937, -0.2513444423675537, -0.18659695982933044, -0.12184944748878479, -0.057101935148239136, 0.007645547389984131, 0.07239305973052979, 0.13714057207107544, 0.2018880844116211, 0.26663559675216675, 0.33138307929039, 0.39613059163093567, 0.4608781039714813, 0.5256255865097046, 0.5903730988502502, 0.6551206111907959, 0.7198681235313416, 0.7846156358718872, 0.8493630886077881, 0.9141106605529785, 0.9788581132888794, 1.0436055660247803, 1.1083531379699707, 1.1731007099151611, 1.237848162651062, 1.3025957345962524, 1.3673431873321533, 1.4320907592773438, 1.4968382120132446, 1.5615856647491455, 1.626333236694336, 1.6910806894302368]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 4.0, 3.0, 3.0, 3.0, 8.0, 8.0, 13.0, 12.0, 21.0, 34.0, 56.0, 60.0, 66.0, 63.0, 47.0, 20.0, 15.0, 7.0, 11.0, 8.0, 6.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9985530376434326, -1.9410454034805298, -1.8835376501083374, -1.8260300159454346, -1.7685223817825317, -1.7110146284103394, -1.6535069942474365, -1.5959992408752441, -1.5384916067123413, -1.4809839725494385, -1.423476219177246, -1.3659685850143433, -1.3084609508514404, -1.250953197479248, -1.1934455633163452, -1.1359379291534424, -1.07843017578125, -1.0209225416183472, -0.9634148478507996, -0.905907154083252, -0.8483994603157043, -0.7908917665481567, -0.7333841323852539, -0.6758764386177063, -0.6183688640594482, -0.5608611702919006, -0.5033535361289978, -0.4458458423614502, -0.3883381485939026, -0.33083048462867737, -0.27332282066345215, -0.21581512689590454, -0.15830743312835693, -0.10079975426197052, -0.0432920828461647, 0.014215588569641113, 0.07172326743602753, 0.12923094630241394, 0.18673861026763916, 0.24424630403518677, 0.301753968000412, 0.3592616319656372, 0.4167693257331848, 0.47427698969841003, 0.5317846536636353, 0.5892923474311829, 0.6468000411987305, 0.7043076753616333, 0.7618153691291809, 0.8193230628967285, 0.8768306970596313, 0.934338390827179, 0.9918460845947266, 1.0493537187576294, 1.1068613529205322, 1.1643691062927246, 1.2218767404556274, 1.2793843746185303, 1.3368921279907227, 1.3943997621536255, 1.4519073963165283, 1.5094151496887207, 1.5669227838516235, 1.6244304180145264, 1.6819381713867188]}, "eval/loss": 0.35429710149765015, "eval/wer": 0.10019833399444665, "eval/runtime": 408.7192, "eval/samples_per_second": 6.464, "eval/steps_per_second": 0.406, "train/train_runtime": 25891.0003, "train/train_samples_per_second": 11.022, "train/train_steps_per_second": 0.043, "train/total_flos": 0.0, "train/train_loss": 2.1241667401347613}