diff --git "a/wandb/run-20220504_142129-1tmxz74i/files/wandb-summary.json" "b/wandb/run-20220504_142129-1tmxz74i/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220504_142129-1tmxz74i/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 3.1046, "train/learning_rate": 0.0003245579270532452, "train/epoch": 0.15, "train/global_step": 500, "_runtime": 3650, "_timestamp": 1651677739, "_step": 500, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 615.0, 387.0, 9.0, 2.0, 2.0], "bins": [-95.63389587402344, -94.03797149658203, -92.44204711914062, -90.84611511230469, -89.25019073486328, -87.65426635742188, -86.05834197998047, -84.46241760253906, -82.86648559570312, -81.27056121826172, -79.67463684082031, -78.07870483398438, -76.48278045654297, -74.88685607910156, -73.29093170166016, -71.69500732421875, -70.09908294677734, -68.50315856933594, -66.90723419189453, -65.3113021850586, -63.71537780761719, -62.11945343017578, -60.523529052734375, -58.9276008605957, -57.33167266845703, -55.735748291015625, -54.13982009887695, -52.54389572143555, -50.947967529296875, -49.35204315185547, -47.75611877441406, -46.16019058227539, -44.56426239013672, -42.96833801269531, -41.37240982055664, -39.776485443115234, -38.18055725097656, -36.584632873535156, -34.98870849609375, -33.39278030395508, -31.796855926513672, -30.200929641723633, -28.605003356933594, -27.009078979492188, -25.41315269470215, -23.81722640991211, -22.22130012512207, -20.62537384033203, -19.029449462890625, -17.433523178100586, -15.837597846984863, -14.241671562194824, -12.645746231079102, -11.049819946289062, -9.453893661499023, -7.857968330383301, -6.2620415687561035, -4.666115760803223, -3.0701897144317627, -1.4742636680603027, 0.12166213989257812, 1.717587947845459, 3.313514232635498, 4.909439563751221, 6.50536584854126]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 5.0, 4.0, 12.0, 21.0, 34.0, 45.0, 69.0, 79.0, 128.0, 117.0, 120.0, 95.0, 86.0, 80.0, 37.0, 28.0, 13.0, 16.0, 5.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.35371208190918, -10.862190246582031, -10.370668411254883, -9.879145622253418, -9.38762378692627, -8.896101951599121, -8.404580116271973, -7.913057804107666, -7.421535491943359, -6.930013656616211, -6.438491344451904, -5.946969509124756, -5.455447196960449, -4.963925361633301, -4.472403526306152, -3.9808812141418457, -3.4893593788146973, -2.9978373050689697, -2.506315231323242, -2.0147933959960938, -1.5232712030410767, -1.0317492485046387, -0.5402271747589111, -0.048705101013183594, 0.44281697273254395, 0.9343390464782715, 1.425861120223999, 1.917383074760437, 2.408905029296875, 2.9004271030426025, 3.39194917678833, 3.8834712505340576, 4.374993324279785, 4.866515159606934, 5.35803747177124, 5.849559307098389, 6.341081619262695, 6.832603454589844, 7.324125289916992, 7.815647602081299, 8.307169914245605, 8.798691749572754, 9.290213584899902, 9.781736373901367, 10.273258209228516, 10.764780044555664, 11.256301879882812, 11.747823715209961, 12.23934555053711, 12.730867385864258, 13.222389221191406, 13.713912010192871, 14.20543384552002, 14.696955680847168, 15.188477516174316, 15.680000305175781, 16.17152214050293, 16.663043975830078, 17.154565811157227, 17.646087646484375, 18.137609481811523, 18.629131317138672, 19.120655059814453, 19.6121768951416, 20.10369873046875]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 6.0, 8.0, 11.0, 16.0, 21.0, 41.0, 151.0, 882.0, 1330.0, 2879.0, 8210.0, 88129.0, 3848129.0, 231952.0, 10328.0, 1331.0, 354.0, 183.0, 85.0, 66.0, 33.0, 30.0, 22.0, 16.0, 12.0, 11.0, 11.0, 9.0, 3.0, 2.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.7265625, -12.1373291015625, -11.548095703125, -10.9588623046875, -10.36962890625, -9.7803955078125, -9.191162109375, -8.6019287109375, -8.0126953125, -7.4234619140625, -6.834228515625, -6.2449951171875, -5.65576171875, -5.0665283203125, -4.477294921875, -3.8880615234375, -3.298828125, -2.7095947265625, -2.120361328125, -1.5311279296875, -0.94189453125, -0.3526611328125, 0.236572265625, 0.8258056640625, 1.4150390625, 2.0042724609375, 2.593505859375, 3.1827392578125, 3.77197265625, 4.3612060546875, 4.950439453125, 5.5396728515625, 6.12890625, 6.7181396484375, 7.307373046875, 7.8966064453125, 8.48583984375, 9.0750732421875, 9.664306640625, 10.2535400390625, 10.8427734375, 11.4320068359375, 12.021240234375, 12.6104736328125, 13.19970703125, 13.7889404296875, 14.378173828125, 14.9674072265625, 15.556640625, 16.1458740234375, 16.735107421875, 17.3243408203125, 17.91357421875, 18.5028076171875, 19.092041015625, 19.6812744140625, 20.2705078125, 20.8597412109375, 21.448974609375, 22.0382080078125, 22.62744140625, 23.2166748046875, 23.805908203125, 24.3951416015625, 24.984375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 8.0, 5.0, 11.0, 22.0, 41.0, 67.0, 70.0, 100.0, 120.0, 136.0, 113.0, 113.0, 70.0, 46.0, 35.0, 7.0, 12.0, 14.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.546875, -8.12841796875, -7.7099609375, -7.29150390625, -6.873046875, -6.45458984375, -6.0361328125, -5.61767578125, -5.19921875, -4.78076171875, -4.3623046875, -3.94384765625, -3.525390625, -3.10693359375, -2.6884765625, -2.27001953125, -1.8515625, -1.43310546875, -1.0146484375, -0.59619140625, -0.177734375, 0.24072265625, 0.6591796875, 1.07763671875, 1.49609375, 1.91455078125, 2.3330078125, 2.75146484375, 3.169921875, 3.58837890625, 4.0068359375, 4.42529296875, 4.84375, 5.26220703125, 5.6806640625, 6.09912109375, 6.517578125, 6.93603515625, 7.3544921875, 7.77294921875, 8.19140625, 8.60986328125, 9.0283203125, 9.44677734375, 9.865234375, 10.28369140625, 10.7021484375, 11.12060546875, 11.5390625, 11.95751953125, 12.3759765625, 12.79443359375, 13.212890625, 13.63134765625, 14.0498046875, 14.46826171875, 14.88671875, 15.30517578125, 15.7236328125, 16.14208984375, 16.560546875, 16.97900390625, 17.3974609375, 17.81591796875, 18.234375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 8.0, 12.0, 12.0, 17.0, 35.0, 77.0, 385.0, 4191235.0, 2224.0, 173.0, 40.0, 22.0, 16.0, 11.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-264.75, -254.47265625, -244.1953125, -233.91796875, -223.640625, -213.36328125, -203.0859375, -192.80859375, -182.53125, -172.25390625, -161.9765625, -151.69921875, -141.421875, -131.14453125, -120.8671875, -110.58984375, -100.3125, -90.03515625, -79.7578125, -69.48046875, -59.203125, -48.92578125, -38.6484375, -28.37109375, -18.09375, -7.81640625, 2.4609375, 12.73828125, 23.015625, 33.29296875, 43.5703125, 53.84765625, 64.125, 74.40234375, 84.6796875, 94.95703125, 105.234375, 115.51171875, 125.7890625, 136.06640625, 146.34375, 156.62109375, 166.8984375, 177.17578125, 187.453125, 197.73046875, 208.0078125, 218.28515625, 228.5625, 238.83984375, 249.1171875, 259.39453125, 269.671875, 279.94921875, 290.2265625, 300.50390625, 310.78125, 321.05859375, 331.3359375, 341.61328125, 351.890625, 362.16796875, 372.4453125, 382.72265625, 393.0]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 8.0, 5.0, 14.0, 8.0, 17.0, 39.0, 101.0, 526.0, 2473.0, 696.0, 102.0, 32.0, 17.0, 16.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.27734375, -5.0782470703125, -4.879150390625, -4.6800537109375, -4.48095703125, -4.2818603515625, -4.082763671875, -3.8836669921875, -3.6845703125, -3.4854736328125, -3.286376953125, -3.0872802734375, -2.88818359375, -2.6890869140625, -2.489990234375, -2.2908935546875, -2.091796875, -1.8927001953125, -1.693603515625, -1.4945068359375, -1.29541015625, -1.0963134765625, -0.897216796875, -0.6981201171875, -0.4990234375, -0.2999267578125, -0.100830078125, 0.0982666015625, 0.29736328125, 0.4964599609375, 0.695556640625, 0.8946533203125, 1.09375, 1.2928466796875, 1.491943359375, 1.6910400390625, 1.89013671875, 2.0892333984375, 2.288330078125, 2.4874267578125, 2.6865234375, 2.8856201171875, 3.084716796875, 3.2838134765625, 3.48291015625, 3.6820068359375, 3.881103515625, 4.0802001953125, 4.279296875, 4.4783935546875, 4.677490234375, 4.8765869140625, 5.07568359375, 5.2747802734375, 5.473876953125, 5.6729736328125, 5.8720703125, 6.0711669921875, 6.270263671875, 6.4693603515625, 6.66845703125, 6.8675537109375, 7.066650390625, 7.2657470703125, 7.46484375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 10.0, 19.0, 60.0, 118.0, 292.0, 303.0, 129.0, 49.0, 18.0, 8.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.277957916259766, -31.55997657775879, -30.841995239257812, -30.124013900756836, -29.40603256225586, -28.688051223754883, -27.970069885253906, -27.25208854675293, -26.534107208251953, -25.816125869750977, -25.09814453125, -24.380163192749023, -23.662181854248047, -22.94420051574707, -22.226219177246094, -21.508237838745117, -20.79025650024414, -20.072275161743164, -19.354293823242188, -18.63631248474121, -17.918331146240234, -17.200349807739258, -16.48236846923828, -15.764387130737305, -15.046407699584961, -14.328426361083984, -13.610445022583008, -12.892463684082031, -12.174482345581055, -11.456501007080078, -10.738519668579102, -10.020538330078125, -9.302556991577148, -8.584575653076172, -7.866594314575195, -7.148612976074219, -6.430631637573242, -5.712650299072266, -4.994669437408447, -4.276688098907471, -3.558706760406494, -2.8407254219055176, -2.122744083404541, -1.4047629833221436, -0.686781644821167, 0.03119969367980957, 0.749180793762207, 1.4671621322631836, 2.18514347076416, 2.9031248092651367, 3.6211061477661133, 4.33908748626709, 5.057068824768066, 5.775050163269043, 6.493031024932861, 7.211012363433838, 7.9289937019348145, 8.646974563598633, 9.36495590209961, 10.082937240600586, 10.800918579101562, 11.518899917602539, 12.236881256103516, 12.954862594604492, 13.672843933105469]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 7.0, 8.0, 10.0, 6.0, 13.0, 19.0, 15.0, 35.0, 48.0, 39.0, 52.0, 62.0, 66.0, 78.0, 92.0, 73.0, 66.0, 61.0, 58.0, 51.0, 46.0, 24.0, 18.0, 14.0, 15.0, 10.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.424617767333984, -7.091316223144531, -6.758014678955078, -6.424712657928467, -6.091411113739014, -5.7581095695495605, -5.424807548522949, -5.091506004333496, -4.758204460144043, -4.42490291595459, -4.091601371765137, -3.7582993507385254, -3.4249978065490723, -3.091696262359619, -2.758394479751587, -2.4250926971435547, -2.0917911529541016, -1.7584894895553589, -1.4251878261566162, -1.0918861627578735, -0.7585844993591309, -0.4252828359603882, -0.09198117256164551, 0.24132061004638672, 0.5746221542358398, 0.9079238176345825, 1.2412254810333252, 1.5745271444320679, 1.9078288078308105, 2.2411303520202637, 2.574432134628296, 2.907733917236328, 3.2410354614257812, 3.5743370056152344, 3.9076387882232666, 4.240940570831299, 4.574242115020752, 4.907543659210205, 5.240845680236816, 5.5741472244262695, 5.907448768615723, 6.240750312805176, 6.574051856994629, 6.90735387802124, 7.240655422210693, 7.5739569664001465, 7.907258987426758, 8.240560531616211, 8.573862075805664, 8.907163619995117, 9.24046516418457, 9.573766708374023, 9.907068252563477, 10.240370750427246, 10.5736722946167, 10.906973838806152, 11.240275382995605, 11.573576927185059, 11.906878471374512, 12.240180015563965, 12.573482513427734, 12.906784057617188, 13.24008560180664, 13.573387145996094, 13.906688690185547]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 9.0, 15.0, 21.0, 33.0, 41.0, 64.0, 114.0, 170.0, 298.0, 533.0, 1138.0, 2585.0, 7998.0, 38633.0, 389553.0, 538765.0, 53048.0, 9680.0, 3125.0, 1304.0, 560.0, 310.0, 206.0, 114.0, 75.0, 41.0, 30.0, 17.0, 16.0, 12.0, 9.0, 11.0, 1.0, 7.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.759765625, -2.673736572265625, -2.58770751953125, -2.501678466796875, -2.4156494140625, -2.329620361328125, -2.24359130859375, -2.157562255859375, -2.071533203125, -1.985504150390625, -1.89947509765625, -1.813446044921875, -1.7274169921875, -1.641387939453125, -1.55535888671875, -1.469329833984375, -1.38330078125, -1.297271728515625, -1.21124267578125, -1.125213623046875, -1.0391845703125, -0.953155517578125, -0.86712646484375, -0.781097412109375, -0.695068359375, -0.609039306640625, -0.52301025390625, -0.436981201171875, -0.3509521484375, -0.264923095703125, -0.17889404296875, -0.092864990234375, -0.0068359375, 0.079193115234375, 0.16522216796875, 0.251251220703125, 0.3372802734375, 0.423309326171875, 0.50933837890625, 0.595367431640625, 0.681396484375, 0.767425537109375, 0.85345458984375, 0.939483642578125, 1.0255126953125, 1.111541748046875, 1.19757080078125, 1.283599853515625, 1.36962890625, 1.455657958984375, 1.54168701171875, 1.627716064453125, 1.7137451171875, 1.799774169921875, 1.88580322265625, 1.971832275390625, 2.057861328125, 2.143890380859375, 2.22991943359375, 2.315948486328125, 2.4019775390625, 2.488006591796875, 2.57403564453125, 2.660064697265625, 2.74609375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 3.0, 7.0, 10.0, 10.0, 14.0, 17.0, 29.0, 44.0, 49.0, 69.0, 88.0, 89.0, 99.0, 118.0, 69.0, 79.0, 62.0, 45.0, 31.0, 24.0, 15.0, 10.0, 4.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.3203125, -7.02099609375, -6.7216796875, -6.42236328125, -6.123046875, -5.82373046875, -5.5244140625, -5.22509765625, -4.92578125, -4.62646484375, -4.3271484375, -4.02783203125, -3.728515625, -3.42919921875, -3.1298828125, -2.83056640625, -2.53125, -2.23193359375, -1.9326171875, -1.63330078125, -1.333984375, -1.03466796875, -0.7353515625, -0.43603515625, -0.13671875, 0.16259765625, 0.4619140625, 0.76123046875, 1.060546875, 1.35986328125, 1.6591796875, 1.95849609375, 2.2578125, 2.55712890625, 2.8564453125, 3.15576171875, 3.455078125, 3.75439453125, 4.0537109375, 4.35302734375, 4.65234375, 4.95166015625, 5.2509765625, 5.55029296875, 5.849609375, 6.14892578125, 6.4482421875, 6.74755859375, 7.046875, 7.34619140625, 7.6455078125, 7.94482421875, 8.244140625, 8.54345703125, 8.8427734375, 9.14208984375, 9.44140625, 9.74072265625, 10.0400390625, 10.33935546875, 10.638671875, 10.93798828125, 11.2373046875, 11.53662109375, 11.8359375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 9.0, 9.0, 11.0, 19.0, 26.0, 36.0, 77.0, 106.0, 161.0, 219.0, 378.0, 644.0, 1131.0, 2016.0, 3547.0, 6537.0, 12479.0, 24225.0, 50290.0, 106882.0, 218784.0, 280905.0, 176125.0, 82551.0, 39237.0, 19319.0, 10170.0, 5431.0, 3026.0, 1700.0, 949.0, 598.0, 342.0, 189.0, 133.0, 103.0, 66.0, 40.0, 29.0, 21.0, 16.0, 10.0, 6.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.55517578125, -0.5390052795410156, -0.5228347778320312, -0.5066642761230469, -0.4904937744140625, -0.4743232727050781, -0.45815277099609375, -0.4419822692871094, -0.425811767578125, -0.4096412658691406, -0.39347076416015625, -0.3773002624511719, -0.3611297607421875, -0.3449592590332031, -0.32878875732421875, -0.3126182556152344, -0.29644775390625, -0.2802772521972656, -0.26410675048828125, -0.24793624877929688, -0.2317657470703125, -0.21559524536132812, -0.19942474365234375, -0.18325424194335938, -0.167083740234375, -0.15091323852539062, -0.13474273681640625, -0.11857223510742188, -0.1024017333984375, -0.08623123168945312, -0.07006072998046875, -0.053890228271484375, -0.0377197265625, -0.021549224853515625, -0.00537872314453125, 0.010791778564453125, 0.0269622802734375, 0.043132781982421875, 0.05930328369140625, 0.07547378540039062, 0.091644287109375, 0.10781478881835938, 0.12398529052734375, 0.14015579223632812, 0.1563262939453125, 0.17249679565429688, 0.18866729736328125, 0.20483779907226562, 0.22100830078125, 0.23717880249023438, 0.25334930419921875, 0.2695198059082031, 0.2856903076171875, 0.3018608093261719, 0.31803131103515625, 0.3342018127441406, 0.350372314453125, 0.3665428161621094, 0.38271331787109375, 0.3988838195800781, 0.4150543212890625, 0.4312248229980469, 0.44739532470703125, 0.4635658264160156, 0.479736328125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 9.0, 5.0, 4.0, 14.0, 12.0, 9.0, 16.0, 32.0, 15.0, 23.0, 34.0, 28.0, 30.0, 26.0, 38.0, 37.0, 45.0, 48.0, 52.0, 48.0, 44.0, 45.0, 40.0, 42.0, 46.0, 34.0, 33.0, 28.0, 27.0, 24.0, 19.0, 18.0, 18.0, 9.0, 9.0, 5.0, 14.0, 6.0, 3.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1484375, -8.87158203125, -8.5947265625, -8.31787109375, -8.041015625, -7.76416015625, -7.4873046875, -7.21044921875, -6.93359375, -6.65673828125, -6.3798828125, -6.10302734375, -5.826171875, -5.54931640625, -5.2724609375, -4.99560546875, -4.71875, -4.44189453125, -4.1650390625, -3.88818359375, -3.611328125, -3.33447265625, -3.0576171875, -2.78076171875, -2.50390625, -2.22705078125, -1.9501953125, -1.67333984375, -1.396484375, -1.11962890625, -0.8427734375, -0.56591796875, -0.2890625, -0.01220703125, 0.2646484375, 0.54150390625, 0.818359375, 1.09521484375, 1.3720703125, 1.64892578125, 1.92578125, 2.20263671875, 2.4794921875, 2.75634765625, 3.033203125, 3.31005859375, 3.5869140625, 3.86376953125, 4.140625, 4.41748046875, 4.6943359375, 4.97119140625, 5.248046875, 5.52490234375, 5.8017578125, 6.07861328125, 6.35546875, 6.63232421875, 6.9091796875, 7.18603515625, 7.462890625, 7.73974609375, 8.0166015625, 8.29345703125, 8.5703125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 9.0, 8.0, 9.0, 17.0, 26.0, 31.0, 48.0, 63.0, 142.0, 177.0, 278.0, 454.0, 789.0, 1320.0, 2511.0, 5126.0, 11668.0, 30079.0, 89644.0, 311579.0, 407279.0, 121546.0, 38744.0, 14306.0, 6043.0, 2858.0, 1558.0, 829.0, 488.0, 323.0, 217.0, 126.0, 88.0, 57.0, 38.0, 21.0, 17.0, 15.0, 11.0, 6.0, 4.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0792236328125, -0.07690238952636719, -0.07458114624023438, -0.07225990295410156, -0.06993865966796875, -0.06761741638183594, -0.06529617309570312, -0.06297492980957031, -0.0606536865234375, -0.05833244323730469, -0.056011199951171875, -0.05368995666503906, -0.05136871337890625, -0.04904747009277344, -0.046726226806640625, -0.04440498352050781, -0.042083740234375, -0.03976249694824219, -0.037441253662109375, -0.03512001037597656, -0.03279876708984375, -0.030477523803710938, -0.028156280517578125, -0.025835037231445312, -0.0235137939453125, -0.021192550659179688, -0.018871307373046875, -0.016550064086914062, -0.01422882080078125, -0.011907577514648438, -0.009586334228515625, -0.0072650909423828125, -0.00494384765625, -0.0026226043701171875, -0.000301361083984375, 0.0020198822021484375, 0.00434112548828125, 0.0066623687744140625, 0.008983612060546875, 0.011304855346679688, 0.0136260986328125, 0.015947341918945312, 0.018268585205078125, 0.020589828491210938, 0.02291107177734375, 0.025232315063476562, 0.027553558349609375, 0.029874801635742188, 0.032196044921875, 0.03451728820800781, 0.036838531494140625, 0.03915977478027344, 0.04148101806640625, 0.04380226135253906, 0.046123504638671875, 0.04844474792480469, 0.0507659912109375, 0.05308723449707031, 0.055408477783203125, 0.05772972106933594, 0.06005096435546875, 0.06237220764160156, 0.06469345092773438, 0.06701469421386719, 0.0693359375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 7.0, 9.0, 17.0, 20.0, 36.0, 69.0, 96.0, 145.0, 154.0, 174.0, 95.0, 64.0, 44.0, 25.0, 20.0, 13.0, 4.0, 8.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002903938293457031, -0.0002828836441040039, -0.0002753734588623047, -0.00026786327362060547, -0.00026035308837890625, -0.00025284290313720703, -0.0002453327178955078, -0.0002378225326538086, -0.00023031234741210938, -0.00022280216217041016, -0.00021529197692871094, -0.00020778179168701172, -0.0002002716064453125, -0.00019276142120361328, -0.00018525123596191406, -0.00017774105072021484, -0.00017023086547851562, -0.0001627206802368164, -0.0001552104949951172, -0.00014770030975341797, -0.00014019012451171875, -0.00013267993927001953, -0.0001251697540283203, -0.0001176595687866211, -0.00011014938354492188, -0.00010263919830322266, -9.512901306152344e-05, -8.761882781982422e-05, -8.0108642578125e-05, -7.259845733642578e-05, -6.508827209472656e-05, -5.7578086853027344e-05, -5.0067901611328125e-05, -4.2557716369628906e-05, -3.504753112792969e-05, -2.753734588623047e-05, -2.002716064453125e-05, -1.2516975402832031e-05, -5.0067901611328125e-06, 2.5033950805664062e-06, 1.0013580322265625e-05, 1.7523765563964844e-05, 2.5033950805664062e-05, 3.254413604736328e-05, 4.00543212890625e-05, 4.756450653076172e-05, 5.507469177246094e-05, 6.258487701416016e-05, 7.009506225585938e-05, 7.76052474975586e-05, 8.511543273925781e-05, 9.262561798095703e-05, 0.00010013580322265625, 0.00010764598846435547, 0.00011515617370605469, 0.0001226663589477539, 0.00013017654418945312, 0.00013768672943115234, 0.00014519691467285156, 0.00015270709991455078, 0.00016021728515625, 0.00016772747039794922, 0.00017523765563964844, 0.00018274784088134766, 0.00019025802612304688]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 5.0, 7.0, 13.0, 12.0, 18.0, 24.0, 36.0, 42.0, 76.0, 102.0, 232.0, 1062.0, 45704.0, 990945.0, 9252.0, 526.0, 154.0, 87.0, 80.0, 40.0, 23.0, 23.0, 26.0, 11.0, 17.0, 11.0, 5.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.52587890625, -0.5117950439453125, -0.497711181640625, -0.4836273193359375, -0.46954345703125, -0.4554595947265625, -0.441375732421875, -0.4272918701171875, -0.4132080078125, -0.3991241455078125, -0.385040283203125, -0.3709564208984375, -0.35687255859375, -0.3427886962890625, -0.328704833984375, -0.3146209716796875, -0.300537109375, -0.2864532470703125, -0.272369384765625, -0.2582855224609375, -0.24420166015625, -0.2301177978515625, -0.216033935546875, -0.2019500732421875, -0.1878662109375, -0.1737823486328125, -0.159698486328125, -0.1456146240234375, -0.13153076171875, -0.1174468994140625, -0.103363037109375, -0.0892791748046875, -0.0751953125, -0.0611114501953125, -0.047027587890625, -0.0329437255859375, -0.01885986328125, -0.0047760009765625, 0.009307861328125, 0.0233917236328125, 0.0374755859375, 0.0515594482421875, 0.065643310546875, 0.0797271728515625, 0.09381103515625, 0.1078948974609375, 0.121978759765625, 0.1360626220703125, 0.150146484375, 0.1642303466796875, 0.178314208984375, 0.1923980712890625, 0.20648193359375, 0.2205657958984375, 0.234649658203125, 0.2487335205078125, 0.2628173828125, 0.2769012451171875, 0.290985107421875, 0.3050689697265625, 0.31915283203125, 0.3332366943359375, 0.347320556640625, 0.3614044189453125, 0.37548828125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 2.0, 5.0, 0.0, 3.0, 7.0, 8.0, 7.0, 6.0, 19.0, 14.0, 18.0, 21.0, 26.0, 33.0, 41.0, 58.0, 73.0, 59.0, 84.0, 87.0, 70.0, 60.0, 56.0, 50.0, 41.0, 30.0, 25.0, 17.0, 18.0, 17.0, 16.0, 9.0, 9.0, 7.0, 3.0, 1.0, 5.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.03179931640625, -0.03094649314880371, -0.030093669891357422, -0.029240846633911133, -0.028388023376464844, -0.027535200119018555, -0.026682376861572266, -0.025829553604125977, -0.024976730346679688, -0.0241239070892334, -0.02327108383178711, -0.02241826057434082, -0.02156543731689453, -0.020712614059448242, -0.019859790802001953, -0.019006967544555664, -0.018154144287109375, -0.017301321029663086, -0.016448497772216797, -0.015595674514770508, -0.014742851257324219, -0.01389002799987793, -0.01303720474243164, -0.012184381484985352, -0.011331558227539062, -0.010478734970092773, -0.009625911712646484, -0.008773088455200195, -0.007920265197753906, -0.007067441940307617, -0.006214618682861328, -0.005361795425415039, -0.00450897216796875, -0.003656148910522461, -0.002803325653076172, -0.0019505023956298828, -0.0010976791381835938, -0.0002448558807373047, 0.0006079673767089844, 0.0014607906341552734, 0.0023136138916015625, 0.0031664371490478516, 0.004019260406494141, 0.00487208366394043, 0.005724906921386719, 0.006577730178833008, 0.007430553436279297, 0.008283376693725586, 0.009136199951171875, 0.009989023208618164, 0.010841846466064453, 0.011694669723510742, 0.012547492980957031, 0.01340031623840332, 0.01425313949584961, 0.015105962753295898, 0.015958786010742188, 0.016811609268188477, 0.017664432525634766, 0.018517255783081055, 0.019370079040527344, 0.020222902297973633, 0.021075725555419922, 0.02192854881286621, 0.0227813720703125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 23.0, 125.0, 477.0, 314.0, 49.0, 16.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.40188980102539, -30.41054344177246, -29.41919708251953, -28.42784881591797, -27.43650245666504, -26.44515609741211, -25.45380973815918, -24.46246337890625, -23.47111701965332, -22.47977066040039, -21.48842430114746, -20.49707794189453, -19.50572967529297, -18.51438331604004, -17.52303695678711, -16.53169059753418, -15.540343284606934, -14.548996925354004, -13.557649612426758, -12.566303253173828, -11.574956893920898, -10.583610534667969, -9.592263221740723, -8.600916862487793, -7.609570026397705, -6.618223190307617, -5.6268768310546875, -4.6355299949646, -3.644183397293091, -2.652836799621582, -1.6614899635314941, -0.6701436042785645, 0.32120323181152344, 1.3125498294830322, 2.303896427154541, 3.295243263244629, 4.286589622497559, 5.2779364585876465, 6.269283294677734, 7.260629653930664, 8.251976013183594, 9.243322372436523, 10.23466968536377, 11.2260160446167, 12.217362403869629, 13.208709716796875, 14.200056076049805, 15.191402435302734, 16.182750701904297, 17.174097061157227, 18.165443420410156, 19.15679168701172, 20.14813804626465, 21.139484405517578, 22.130830764770508, 23.122177124023438, 24.113523483276367, 25.104869842529297, 26.096216201782227, 27.087562561035156, 28.07891082763672, 29.07025718688965, 30.061603546142578, 31.052949905395508, 32.04429626464844]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 5.0, 7.0, 11.0, 7.0, 12.0, 14.0, 21.0, 34.0, 51.0, 46.0, 57.0, 75.0, 83.0, 94.0, 92.0, 79.0, 69.0, 68.0, 48.0, 41.0, 25.0, 21.0, 11.0, 8.0, 11.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.851236343383789, -6.583756923675537, -6.316277027130127, -6.048797607421875, -5.781318187713623, -5.513838768005371, -5.246358871459961, -4.978879451751709, -4.711400032043457, -4.443920612335205, -4.176440715789795, -3.908961296081543, -3.641481876373291, -3.37400221824646, -3.106522560119629, -2.839043140411377, -2.571563243865967, -2.3040835857391357, -2.036604166030884, -1.7691245079040527, -1.5016449689865112, -1.2341654300689697, -0.9666857719421387, -0.6992062330245972, -0.43172669410705566, -0.16424712538719177, 0.10323244333267212, 0.3707120418548584, 0.6381915807723999, 0.9056711196899414, 1.1731507778167725, 1.440630316734314, 1.7081098556518555, 1.975589394569397, 2.2430689334869385, 2.5105485916137695, 2.7780280113220215, 3.0455076694488525, 3.3129873275756836, 3.5804667472839355, 3.8479464054107666, 4.115426063537598, 4.38290548324585, 4.650384902954102, 4.917864799499512, 5.185344219207764, 5.452823638916016, 5.720303535461426, 5.987782955169678, 6.25526237487793, 6.52274227142334, 6.790221691131592, 7.057701110839844, 7.325181007385254, 7.592660427093506, 7.860139846801758, 8.127619743347168, 8.395099639892578, 8.662578582763672, 8.930058479309082, 9.197538375854492, 9.465017318725586, 9.732497215270996, 9.999977111816406, 10.2674560546875]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 10.0, 10.0, 6.0, 20.0, 21.0, 45.0, 48.0, 96.0, 181.0, 367.0, 662.0, 1709.0, 5002.0, 26458.0, 503288.0, 477248.0, 25332.0, 4912.0, 1677.0, 646.0, 318.0, 188.0, 102.0, 61.0, 39.0, 29.0, 19.0, 13.0, 9.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.0234375, -14.5386962890625, -14.053955078125, -13.5692138671875, -13.08447265625, -12.5997314453125, -12.114990234375, -11.6302490234375, -11.1455078125, -10.6607666015625, -10.176025390625, -9.6912841796875, -9.20654296875, -8.7218017578125, -8.237060546875, -7.7523193359375, -7.267578125, -6.7828369140625, -6.298095703125, -5.8133544921875, -5.32861328125, -4.8438720703125, -4.359130859375, -3.8743896484375, -3.3896484375, -2.9049072265625, -2.420166015625, -1.9354248046875, -1.45068359375, -0.9659423828125, -0.481201171875, 0.0035400390625, 0.48828125, 0.9730224609375, 1.457763671875, 1.9425048828125, 2.42724609375, 2.9119873046875, 3.396728515625, 3.8814697265625, 4.3662109375, 4.8509521484375, 5.335693359375, 5.8204345703125, 6.30517578125, 6.7899169921875, 7.274658203125, 7.7593994140625, 8.244140625, 8.7288818359375, 9.213623046875, 9.6983642578125, 10.18310546875, 10.6678466796875, 11.152587890625, 11.6373291015625, 12.1220703125, 12.6068115234375, 13.091552734375, 13.5762939453125, 14.06103515625, 14.5457763671875, 15.030517578125, 15.5152587890625, 16.0]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 6.0, 5.0, 11.0, 20.0, 33.0, 53.0, 69.0, 79.0, 115.0, 116.0, 114.0, 115.0, 78.0, 59.0, 53.0, 36.0, 19.0, 14.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-152.125, -147.501953125, -142.87890625, -138.255859375, -133.6328125, -129.009765625, -124.38671875, -119.763671875, -115.140625, -110.517578125, -105.89453125, -101.271484375, -96.6484375, -92.025390625, -87.40234375, -82.779296875, -78.15625, -73.533203125, -68.91015625, -64.287109375, -59.6640625, -55.041015625, -50.41796875, -45.794921875, -41.171875, -36.548828125, -31.92578125, -27.302734375, -22.6796875, -18.056640625, -13.43359375, -8.810546875, -4.1875, 0.435546875, 5.05859375, 9.681640625, 14.3046875, 18.927734375, 23.55078125, 28.173828125, 32.796875, 37.419921875, 42.04296875, 46.666015625, 51.2890625, 55.912109375, 60.53515625, 65.158203125, 69.78125, 74.404296875, 79.02734375, 83.650390625, 88.2734375, 92.896484375, 97.51953125, 102.142578125, 106.765625, 111.388671875, 116.01171875, 120.634765625, 125.2578125, 129.880859375, 134.50390625, 139.126953125, 143.75]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 8.0, 3.0, 9.0, 5.0, 9.0, 20.0, 26.0, 36.0, 50.0, 95.0, 174.0, 346.0, 1363.0, 1015498.0, 29629.0, 696.0, 243.0, 139.0, 81.0, 46.0, 25.0, 19.0, 12.0, 10.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-80.0, -77.76708984375, -75.5341796875, -73.30126953125, -71.068359375, -68.83544921875, -66.6025390625, -64.36962890625, -62.13671875, -59.90380859375, -57.6708984375, -55.43798828125, -53.205078125, -50.97216796875, -48.7392578125, -46.50634765625, -44.2734375, -42.04052734375, -39.8076171875, -37.57470703125, -35.341796875, -33.10888671875, -30.8759765625, -28.64306640625, -26.41015625, -24.17724609375, -21.9443359375, -19.71142578125, -17.478515625, -15.24560546875, -13.0126953125, -10.77978515625, -8.546875, -6.31396484375, -4.0810546875, -1.84814453125, 0.384765625, 2.61767578125, 4.8505859375, 7.08349609375, 9.31640625, 11.54931640625, 13.7822265625, 16.01513671875, 18.248046875, 20.48095703125, 22.7138671875, 24.94677734375, 27.1796875, 29.41259765625, 31.6455078125, 33.87841796875, 36.111328125, 38.34423828125, 40.5771484375, 42.81005859375, 45.04296875, 47.27587890625, 49.5087890625, 51.74169921875, 53.974609375, 56.20751953125, 58.4404296875, 60.67333984375, 62.90625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 5.0, 9.0, 12.0, 20.0, 33.0, 45.0, 67.0, 95.0, 103.0, 139.0, 96.0, 99.0, 72.0, 65.0, 45.0, 31.0, 16.0, 7.0, 16.0, 8.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-135.375, -131.5048828125, -127.634765625, -123.7646484375, -119.89453125, -116.0244140625, -112.154296875, -108.2841796875, -104.4140625, -100.5439453125, -96.673828125, -92.8037109375, -88.93359375, -85.0634765625, -81.193359375, -77.3232421875, -73.453125, -69.5830078125, -65.712890625, -61.8427734375, -57.97265625, -54.1025390625, -50.232421875, -46.3623046875, -42.4921875, -38.6220703125, -34.751953125, -30.8818359375, -27.01171875, -23.1416015625, -19.271484375, -15.4013671875, -11.53125, -7.6611328125, -3.791015625, 0.0791015625, 3.94921875, 7.8193359375, 11.689453125, 15.5595703125, 19.4296875, 23.2998046875, 27.169921875, 31.0400390625, 34.91015625, 38.7802734375, 42.650390625, 46.5205078125, 50.390625, 54.2607421875, 58.130859375, 62.0009765625, 65.87109375, 69.7412109375, 73.611328125, 77.4814453125, 81.3515625, 85.2216796875, 89.091796875, 92.9619140625, 96.83203125, 100.7021484375, 104.572265625, 108.4423828125, 112.3125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 3.0, 8.0, 6.0, 9.0, 20.0, 19.0, 53.0, 83.0, 345.0, 2125.0, 53496.0, 985967.0, 5493.0, 630.0, 143.0, 51.0, 31.0, 12.0, 8.0, 12.0, 5.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96484375, -0.9249420166015625, -0.885040283203125, -0.8451385498046875, -0.80523681640625, -0.7653350830078125, -0.725433349609375, -0.6855316162109375, -0.6456298828125, -0.6057281494140625, -0.565826416015625, -0.5259246826171875, -0.48602294921875, -0.4461212158203125, -0.406219482421875, -0.3663177490234375, -0.326416015625, -0.2865142822265625, -0.246612548828125, -0.2067108154296875, -0.16680908203125, -0.1269073486328125, -0.087005615234375, -0.0471038818359375, -0.0072021484375, 0.0326995849609375, 0.072601318359375, 0.1125030517578125, 0.15240478515625, 0.1923065185546875, 0.232208251953125, 0.2721099853515625, 0.31201171875, 0.3519134521484375, 0.391815185546875, 0.4317169189453125, 0.47161865234375, 0.5115203857421875, 0.551422119140625, 0.5913238525390625, 0.6312255859375, 0.6711273193359375, 0.711029052734375, 0.7509307861328125, 0.79083251953125, 0.8307342529296875, 0.870635986328125, 0.9105377197265625, 0.950439453125, 0.9903411865234375, 1.030242919921875, 1.0701446533203125, 1.11004638671875, 1.1499481201171875, 1.189849853515625, 1.2297515869140625, 1.2696533203125, 1.3095550537109375, 1.349456787109375, 1.3893585205078125, 1.42926025390625, 1.4691619873046875, 1.509063720703125, 1.5489654541015625, 1.5888671875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 13.0, 14.0, 21.0, 55.0, 123.0, 383.0, 221.0, 85.0, 45.0, 14.0, 8.0, 5.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022304058074951172, -0.0002168063074350357, -0.0002105720341205597, -0.00020433776080608368, -0.00019810348749160767, -0.00019186921417713165, -0.00018563494086265564, -0.00017940066754817963, -0.0001731663942337036, -0.0001669321209192276, -0.0001606978476047516, -0.00015446357429027557, -0.00014822930097579956, -0.00014199502766132355, -0.00013576075434684753, -0.00012952648103237152, -0.0001232922077178955, -0.0001170579344034195, -0.00011082366108894348, -0.00010458938777446747, -9.835511445999146e-05, -9.212084114551544e-05, -8.588656783103943e-05, -7.965229451656342e-05, -7.34180212020874e-05, -6.718374788761139e-05, -6.0949474573135376e-05, -5.471520125865936e-05, -4.848092794418335e-05, -4.2246654629707336e-05, -3.601238131523132e-05, -2.977810800075531e-05, -2.3543834686279297e-05, -1.7309561371803284e-05, -1.107528805732727e-05, -4.841014742851257e-06, 1.3932585716247559e-06, 7.627531886100769e-06, 1.3861805200576782e-05, 2.0096078515052795e-05, 2.633035182952881e-05, 3.256462514400482e-05, 3.8798898458480835e-05, 4.503317177295685e-05, 5.126744508743286e-05, 5.7501718401908875e-05, 6.373599171638489e-05, 6.99702650308609e-05, 7.620453834533691e-05, 8.243881165981293e-05, 8.867308497428894e-05, 9.490735828876495e-05, 0.00010114163160324097, 0.00010737590491771698, 0.00011361017823219299, 0.000119844451546669, 0.00012607872486114502, 0.00013231299817562103, 0.00013854727149009705, 0.00014478154480457306, 0.00015101581811904907, 0.00015725009143352509, 0.0001634843647480011, 0.0001697186380624771, 0.00017595291137695312]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 6.0, 4.0, 10.0, 18.0, 18.0, 29.0, 54.0, 148.0, 656.0, 3850.0, 174062.0, 864098.0, 4542.0, 709.0, 175.0, 52.0, 35.0, 19.0, 13.0, 12.0, 4.0, 6.0, 5.0, 2.0, 4.0, 0.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.251953125, -1.2128753662109375, -1.173797607421875, -1.1347198486328125, -1.09564208984375, -1.0565643310546875, -1.017486572265625, -0.9784088134765625, -0.9393310546875, -0.9002532958984375, -0.861175537109375, -0.8220977783203125, -0.78302001953125, -0.7439422607421875, -0.704864501953125, -0.6657867431640625, -0.626708984375, -0.5876312255859375, -0.548553466796875, -0.5094757080078125, -0.47039794921875, -0.4313201904296875, -0.392242431640625, -0.3531646728515625, -0.3140869140625, -0.2750091552734375, -0.235931396484375, -0.1968536376953125, -0.15777587890625, -0.1186981201171875, -0.079620361328125, -0.0405426025390625, -0.00146484375, 0.0376129150390625, 0.076690673828125, 0.1157684326171875, 0.15484619140625, 0.1939239501953125, 0.233001708984375, 0.2720794677734375, 0.3111572265625, 0.3502349853515625, 0.389312744140625, 0.4283905029296875, 0.46746826171875, 0.5065460205078125, 0.545623779296875, 0.5847015380859375, 0.623779296875, 0.6628570556640625, 0.701934814453125, 0.7410125732421875, 0.78009033203125, 0.8191680908203125, 0.858245849609375, 0.8973236083984375, 0.9364013671875, 0.9754791259765625, 1.014556884765625, 1.0536346435546875, 1.09271240234375, 1.1317901611328125, 1.170867919921875, 1.2099456787109375, 1.2490234375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 5.0, 8.0, 9.0, 14.0, 10.0, 34.0, 40.0, 99.0, 295.0, 252.0, 87.0, 45.0, 24.0, 13.0, 10.0, 8.0, 11.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1512451171875, -0.14651107788085938, -0.14177703857421875, -0.13704299926757812, -0.1323089599609375, -0.12757492065429688, -0.12284088134765625, -0.11810684204101562, -0.113372802734375, -0.10863876342773438, -0.10390472412109375, -0.09917068481445312, -0.0944366455078125, -0.08970260620117188, -0.08496856689453125, -0.08023452758789062, -0.07550048828125, -0.07076644897460938, -0.06603240966796875, -0.061298370361328125, -0.0565643310546875, -0.051830291748046875, -0.04709625244140625, -0.042362213134765625, -0.037628173828125, -0.032894134521484375, -0.02816009521484375, -0.023426055908203125, -0.0186920166015625, -0.013957977294921875, -0.00922393798828125, -0.004489898681640625, 0.000244140625, 0.004978179931640625, 0.00971221923828125, 0.014446258544921875, 0.0191802978515625, 0.023914337158203125, 0.02864837646484375, 0.033382415771484375, 0.038116455078125, 0.042850494384765625, 0.04758453369140625, 0.052318572998046875, 0.0570526123046875, 0.061786651611328125, 0.06652069091796875, 0.07125473022460938, 0.07598876953125, 0.08072280883789062, 0.08545684814453125, 0.09019088745117188, 0.0949249267578125, 0.09965896606445312, 0.10439300537109375, 0.10912704467773438, 0.113861083984375, 0.11859512329101562, 0.12332916259765625, 0.12806320190429688, 0.1327972412109375, 0.13753128051757812, 0.14226531982421875, 0.14699935913085938, 0.1517333984375]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 1018.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.542007446289062, -6.938444137573242, 8.665119171142578, 24.26868438720703, 39.87224578857422, 55.475807189941406, 71.07937622070312, 86.68293762207031, 102.2864990234375, 117.89006042480469, 133.49362182617188, 149.09719848632812, 164.70074462890625, 180.3043212890625, 195.9078826904297, 211.51144409179688, 227.11500549316406, 242.71856689453125, 258.3221435546875, 273.9256896972656, 289.5292663574219, 305.1328125, 320.73638916015625, 336.3399658203125, 351.9435119628906, 367.5470886230469, 383.150634765625, 398.75421142578125, 414.3577575683594, 429.9613342285156, 445.56488037109375, 461.16845703125, 476.77203369140625, 492.3756103515625, 507.9791564941406, 523.5827026367188, 539.186279296875, 554.7898559570312, 570.3934326171875, 585.9969482421875, 601.6005249023438, 617.2041015625, 632.8076782226562, 648.4111938476562, 664.0147705078125, 679.6183471679688, 695.221923828125, 710.825439453125, 726.4290771484375, 742.0326538085938, 757.63623046875, 773.23974609375, 788.8433227539062, 804.4468994140625, 820.0504760742188, 835.654052734375, 851.257568359375, 866.8611450195312, 882.4647216796875, 898.0682373046875, 913.6718139648438, 929.275390625, 944.8789672851562, 960.4825439453125, 976.0860595703125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 14.0, 17.0, 18.0, 32.0, 40.0, 37.0, 45.0, 64.0, 76.0, 49.0, 70.0, 60.0, 72.0, 58.0, 53.0, 53.0, 44.0, 52.0, 43.0, 25.0, 26.0, 23.0, 10.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-136.90679931640625, -133.37371826171875, -129.84063720703125, -126.30755615234375, -122.77447509765625, -119.24139404296875, -115.70831298828125, -112.17523193359375, -108.64215087890625, -105.10906982421875, -101.57598876953125, -98.04290771484375, -94.50982666015625, -90.97674560546875, -87.44366455078125, -83.91058349609375, -80.37750244140625, -76.84442138671875, -73.31134033203125, -69.77825927734375, -66.24517822265625, -62.71209716796875, -59.17901611328125, -55.64593505859375, -52.11285400390625, -48.57977294921875, -45.04669189453125, -41.51361083984375, -37.98052978515625, -34.44744873046875, -30.91436767578125, -27.38128662109375, -23.84821319580078, -20.31513214111328, -16.78205108642578, -13.248970031738281, -9.715888977050781, -6.182807922363281, -2.6497268676757812, 0.8833541870117188, 4.416435241699219, 7.949516296386719, 11.482597351074219, 15.015678405761719, 18.54875946044922, 22.08184051513672, 25.61492156982422, 29.14800262451172, 32.68108367919922, 36.21416473388672, 39.74724578857422, 43.28032684326172, 46.81340789794922, 50.34648895263672, 53.87957000732422, 57.41265106201172, 60.94573211669922, 64.47881317138672, 68.01189422607422, 71.54497528076172, 75.07805633544922, 78.61113739013672, 82.14421844482422, 85.67729949951172, 89.21038055419922]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 7.0, 11.0, 15.0, 22.0, 39.0, 60.0, 76.0, 164.0, 300.0, 765.0, 3855065.0, 336529.0, 579.0, 269.0, 161.0, 74.0, 47.0, 33.0, 23.0, 17.0, 12.0, 5.0, 8.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-59.5625, -58.0703125, -56.578125, -55.0859375, -53.59375, -52.1015625, -50.609375, -49.1171875, -47.625, -46.1328125, -44.640625, -43.1484375, -41.65625, -40.1640625, -38.671875, -37.1796875, -35.6875, -34.1953125, -32.703125, -31.2109375, -29.71875, -28.2265625, -26.734375, -25.2421875, -23.75, -22.2578125, -20.765625, -19.2734375, -17.78125, -16.2890625, -14.796875, -13.3046875, -11.8125, -10.3203125, -8.828125, -7.3359375, -5.84375, -4.3515625, -2.859375, -1.3671875, 0.125, 1.6171875, 3.109375, 4.6015625, 6.09375, 7.5859375, 9.078125, 10.5703125, 12.0625, 13.5546875, 15.046875, 16.5390625, 18.03125, 19.5234375, 21.015625, 22.5078125, 24.0, 25.4921875, 26.984375, 28.4765625, 29.96875, 31.4609375, 32.953125, 34.4453125, 35.9375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 7.0, 5.0, 7.0, 15.0, 22.0, 23.0, 31.0, 38.0, 39.0, 64.0, 65.0, 68.0, 70.0, 81.0, 78.0, 80.0, 56.0, 63.0, 50.0, 40.0, 22.0, 18.0, 22.0, 13.0, 3.0, 9.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6171875, -7.39447021484375, -7.1717529296875, -6.94903564453125, -6.726318359375, -6.50360107421875, -6.2808837890625, -6.05816650390625, -5.83544921875, -5.61273193359375, -5.3900146484375, -5.16729736328125, -4.944580078125, -4.72186279296875, -4.4991455078125, -4.27642822265625, -4.0537109375, -3.83099365234375, -3.6082763671875, -3.38555908203125, -3.162841796875, -2.94012451171875, -2.7174072265625, -2.49468994140625, -2.27197265625, -2.04925537109375, -1.8265380859375, -1.60382080078125, -1.381103515625, -1.15838623046875, -0.9356689453125, -0.71295166015625, -0.490234375, -0.26751708984375, -0.0447998046875, 0.17791748046875, 0.400634765625, 0.62335205078125, 0.8460693359375, 1.06878662109375, 1.29150390625, 1.51422119140625, 1.7369384765625, 1.95965576171875, 2.182373046875, 2.40509033203125, 2.6278076171875, 2.85052490234375, 3.0732421875, 3.29595947265625, 3.5186767578125, 3.74139404296875, 3.964111328125, 4.18682861328125, 4.4095458984375, 4.63226318359375, 4.85498046875, 5.07769775390625, 5.3004150390625, 5.52313232421875, 5.745849609375, 5.96856689453125, 6.1912841796875, 6.41400146484375, 6.63671875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 8.0, 23.0, 111.0, 4193824.0, 218.0, 41.0, 25.0, 6.0, 4.0, 8.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-476.75, -463.37890625, -450.0078125, -436.63671875, -423.265625, -409.89453125, -396.5234375, -383.15234375, -369.78125, -356.41015625, -343.0390625, -329.66796875, -316.296875, -302.92578125, -289.5546875, -276.18359375, -262.8125, -249.44140625, -236.0703125, -222.69921875, -209.328125, -195.95703125, -182.5859375, -169.21484375, -155.84375, -142.47265625, -129.1015625, -115.73046875, -102.359375, -88.98828125, -75.6171875, -62.24609375, -48.875, -35.50390625, -22.1328125, -8.76171875, 4.609375, 17.98046875, 31.3515625, 44.72265625, 58.09375, 71.46484375, 84.8359375, 98.20703125, 111.578125, 124.94921875, 138.3203125, 151.69140625, 165.0625, 178.43359375, 191.8046875, 205.17578125, 218.546875, 231.91796875, 245.2890625, 258.66015625, 272.03125, 285.40234375, 298.7734375, 312.14453125, 325.515625, 338.88671875, 352.2578125, 365.62890625, 379.0]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 12.0, 7.0, 13.0, 37.0, 45.0, 121.0, 442.0, 1243.0, 1417.0, 420.0, 149.0, 81.0, 28.0, 24.0, 13.0, 9.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.80078125, -2.718536376953125, -2.63629150390625, -2.554046630859375, -2.4718017578125, -2.389556884765625, -2.30731201171875, -2.225067138671875, -2.142822265625, -2.060577392578125, -1.97833251953125, -1.896087646484375, -1.8138427734375, -1.731597900390625, -1.64935302734375, -1.567108154296875, -1.48486328125, -1.402618408203125, -1.32037353515625, -1.238128662109375, -1.1558837890625, -1.073638916015625, -0.99139404296875, -0.909149169921875, -0.826904296875, -0.744659423828125, -0.66241455078125, -0.580169677734375, -0.4979248046875, -0.415679931640625, -0.33343505859375, -0.251190185546875, -0.1689453125, -0.086700439453125, -0.00445556640625, 0.077789306640625, 0.1600341796875, 0.242279052734375, 0.32452392578125, 0.406768798828125, 0.489013671875, 0.571258544921875, 0.65350341796875, 0.735748291015625, 0.8179931640625, 0.900238037109375, 0.98248291015625, 1.064727783203125, 1.14697265625, 1.229217529296875, 1.31146240234375, 1.393707275390625, 1.4759521484375, 1.558197021484375, 1.64044189453125, 1.722686767578125, 1.804931640625, 1.887176513671875, 1.96942138671875, 2.051666259765625, 2.1339111328125, 2.216156005859375, 2.29840087890625, 2.380645751953125, 2.462890625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 8.0, 14.0, 17.0, 32.0, 26.0, 67.0, 85.0, 108.0, 143.0, 178.0, 112.0, 85.0, 53.0, 29.0, 18.0, 11.0, 6.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.210118293762207, -7.972774982452393, -7.735432147979736, -7.498088836669922, -7.260745525360107, -7.023402214050293, -6.786059379577637, -6.548716068267822, -6.311372756958008, -6.074029445648193, -5.836686611175537, -5.599343299865723, -5.361999988555908, -5.124656677246094, -4.8873138427734375, -4.649970531463623, -4.412627696990967, -4.175284385681152, -3.937941312789917, -3.7005982398986816, -3.463254928588867, -3.225911855697632, -2.9885687828063965, -2.751225471496582, -2.5138823986053467, -2.2765393257141113, -2.039196014404297, -1.8018529415130615, -1.5645097494125366, -1.3271665573120117, -1.0898234844207764, -0.8524802923202515, -0.6151366233825684, -0.37779346108436584, -0.14045029878616333, 0.0968928337097168, 0.3342360258102417, 0.5715792179107666, 0.808922290802002, 1.0462654829025269, 1.2836086750030518, 1.5209518671035767, 1.7582950592041016, 1.995638132095337, 2.2329812049865723, 2.4703245162963867, 2.707667589187622, 2.9450106620788574, 3.182353973388672, 3.4196970462799072, 3.6570403575897217, 3.894383430480957, 4.1317267417907715, 4.369070053100586, 4.606412887573242, 4.843756198883057, 5.081099510192871, 5.3184428215026855, 5.555785655975342, 5.793128967285156, 6.030472278594971, 6.267815589904785, 6.505158424377441, 6.742501735687256, 6.979844570159912]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 6.0, 10.0, 10.0, 16.0, 15.0, 30.0, 25.0, 33.0, 49.0, 64.0, 63.0, 62.0, 82.0, 82.0, 72.0, 72.0, 58.0, 52.0, 54.0, 33.0, 24.0, 27.0, 19.0, 17.0, 9.0, 11.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6487226486206055, -7.417795658111572, -7.186868667602539, -6.955941677093506, -6.725014686584473, -6.4940876960754395, -6.263160705566406, -6.032233715057373, -5.80130672454834, -5.570379734039307, -5.339452743530273, -5.10852575302124, -4.877598762512207, -4.646671772003174, -4.415744781494141, -4.184817790985107, -3.953890562057495, -3.722963571548462, -3.4920365810394287, -3.2611095905303955, -3.0301826000213623, -2.79925537109375, -2.568328380584717, -2.3374013900756836, -2.1064743995666504, -1.8755474090576172, -1.644620418548584, -1.4136934280395508, -1.1827664375305176, -0.9518393278121948, -0.7209123373031616, -0.4899853467941284, -0.25905847549438477, -0.02813147008419037, 0.20279553532600403, 0.4337225556373596, 0.6646495461463928, 0.8955765962600708, 1.126503586769104, 1.3574305772781372, 1.5883575677871704, 1.8192845582962036, 2.0502116680145264, 2.2811386585235596, 2.5120656490325928, 2.742992639541626, 2.973919630050659, 3.2048466205596924, 3.4357736110687256, 3.666700601577759, 3.897627592086792, 4.128554821014404, 4.3594818115234375, 4.590408802032471, 4.821335792541504, 5.052262783050537, 5.28318977355957, 5.5141167640686035, 5.745043754577637, 5.97597074508667, 6.206897735595703, 6.437824726104736, 6.6687517166137695, 6.899678707122803, 7.130605697631836]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 5.0, 5.0, 4.0, 11.0, 16.0, 30.0, 34.0, 59.0, 106.0, 223.0, 406.0, 758.0, 1664.0, 4062.0, 19006.0, 256390.0, 707388.0, 46867.0, 6998.0, 2228.0, 1101.0, 547.0, 282.0, 146.0, 72.0, 46.0, 24.0, 16.0, 10.0, 10.0, 10.0, 7.0, 2.0, 5.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.021484375, -1.960601806640625, -1.89971923828125, -1.838836669921875, -1.7779541015625, -1.717071533203125, -1.65618896484375, -1.595306396484375, -1.534423828125, -1.473541259765625, -1.41265869140625, -1.351776123046875, -1.2908935546875, -1.230010986328125, -1.16912841796875, -1.108245849609375, -1.04736328125, -0.986480712890625, -0.92559814453125, -0.864715576171875, -0.8038330078125, -0.742950439453125, -0.68206787109375, -0.621185302734375, -0.560302734375, -0.499420166015625, -0.43853759765625, -0.377655029296875, -0.3167724609375, -0.255889892578125, -0.19500732421875, -0.134124755859375, -0.0732421875, -0.012359619140625, 0.04852294921875, 0.109405517578125, 0.1702880859375, 0.231170654296875, 0.29205322265625, 0.352935791015625, 0.413818359375, 0.474700927734375, 0.53558349609375, 0.596466064453125, 0.6573486328125, 0.718231201171875, 0.77911376953125, 0.839996337890625, 0.90087890625, 0.961761474609375, 1.02264404296875, 1.083526611328125, 1.1444091796875, 1.205291748046875, 1.26617431640625, 1.327056884765625, 1.387939453125, 1.448822021484375, 1.50970458984375, 1.570587158203125, 1.6314697265625, 1.692352294921875, 1.75323486328125, 1.814117431640625, 1.875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 1.0, 7.0, 8.0, 8.0, 22.0, 33.0, 23.0, 31.0, 51.0, 64.0, 73.0, 100.0, 85.0, 98.0, 91.0, 66.0, 60.0, 45.0, 43.0, 32.0, 22.0, 20.0, 7.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.9140625, -6.748779296875, -6.58349609375, -6.418212890625, -6.2529296875, -6.087646484375, -5.92236328125, -5.757080078125, -5.591796875, -5.426513671875, -5.26123046875, -5.095947265625, -4.9306640625, -4.765380859375, -4.60009765625, -4.434814453125, -4.26953125, -4.104248046875, -3.93896484375, -3.773681640625, -3.6083984375, -3.443115234375, -3.27783203125, -3.112548828125, -2.947265625, -2.781982421875, -2.61669921875, -2.451416015625, -2.2861328125, -2.120849609375, -1.95556640625, -1.790283203125, -1.625, -1.459716796875, -1.29443359375, -1.129150390625, -0.9638671875, -0.798583984375, -0.63330078125, -0.468017578125, -0.302734375, -0.137451171875, 0.02783203125, 0.193115234375, 0.3583984375, 0.523681640625, 0.68896484375, 0.854248046875, 1.01953125, 1.184814453125, 1.35009765625, 1.515380859375, 1.6806640625, 1.845947265625, 2.01123046875, 2.176513671875, 2.341796875, 2.507080078125, 2.67236328125, 2.837646484375, 3.0029296875, 3.168212890625, 3.33349609375, 3.498779296875, 3.6640625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 7.0, 6.0, 9.0, 16.0, 29.0, 22.0, 53.0, 96.0, 149.0, 279.0, 456.0, 946.0, 1634.0, 3292.0, 6898.0, 14624.0, 32315.0, 75332.0, 175218.0, 306777.0, 236400.0, 107902.0, 46451.0, 20374.0, 9617.0, 4534.0, 2318.0, 1211.0, 635.0, 397.0, 206.0, 121.0, 80.0, 44.0, 34.0, 30.0, 15.0, 10.0, 7.0, 5.0, 3.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.353759765625, -0.3432655334472656, -0.33277130126953125, -0.3222770690917969, -0.3117828369140625, -0.3012886047363281, -0.29079437255859375, -0.2803001403808594, -0.269805908203125, -0.2593116760253906, -0.24881744384765625, -0.23832321166992188, -0.2278289794921875, -0.21733474731445312, -0.20684051513671875, -0.19634628295898438, -0.18585205078125, -0.17535781860351562, -0.16486358642578125, -0.15436935424804688, -0.1438751220703125, -0.13338088989257812, -0.12288665771484375, -0.11239242553710938, -0.101898193359375, -0.09140396118164062, -0.08090972900390625, -0.07041549682617188, -0.0599212646484375, -0.049427032470703125, -0.03893280029296875, -0.028438568115234375, -0.0179443359375, -0.007450103759765625, 0.00304412841796875, 0.013538360595703125, 0.0240325927734375, 0.034526824951171875, 0.04502105712890625, 0.055515289306640625, 0.066009521484375, 0.07650375366210938, 0.08699798583984375, 0.09749221801757812, 0.1079864501953125, 0.11848068237304688, 0.12897491455078125, 0.13946914672851562, 0.14996337890625, 0.16045761108398438, 0.17095184326171875, 0.18144607543945312, 0.1919403076171875, 0.20243453979492188, 0.21292877197265625, 0.22342300415039062, 0.233917236328125, 0.24441146850585938, 0.25490570068359375, 0.2653999328613281, 0.2758941650390625, 0.2863883972167969, 0.29688262939453125, 0.3073768615722656, 0.31787109375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 6.0, 9.0, 7.0, 10.0, 14.0, 14.0, 15.0, 19.0, 25.0, 30.0, 22.0, 40.0, 36.0, 37.0, 35.0, 38.0, 42.0, 45.0, 48.0, 36.0, 53.0, 47.0, 44.0, 36.0, 38.0, 27.0, 32.0, 25.0, 21.0, 27.0, 12.0, 18.0, 17.0, 16.0, 16.0, 7.0, 4.0, 8.0, 1.0, 8.0, 4.0, 3.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.859375, -4.711669921875, -4.56396484375, -4.416259765625, -4.2685546875, -4.120849609375, -3.97314453125, -3.825439453125, -3.677734375, -3.530029296875, -3.38232421875, -3.234619140625, -3.0869140625, -2.939208984375, -2.79150390625, -2.643798828125, -2.49609375, -2.348388671875, -2.20068359375, -2.052978515625, -1.9052734375, -1.757568359375, -1.60986328125, -1.462158203125, -1.314453125, -1.166748046875, -1.01904296875, -0.871337890625, -0.7236328125, -0.575927734375, -0.42822265625, -0.280517578125, -0.1328125, 0.014892578125, 0.16259765625, 0.310302734375, 0.4580078125, 0.605712890625, 0.75341796875, 0.901123046875, 1.048828125, 1.196533203125, 1.34423828125, 1.491943359375, 1.6396484375, 1.787353515625, 1.93505859375, 2.082763671875, 2.23046875, 2.378173828125, 2.52587890625, 2.673583984375, 2.8212890625, 2.968994140625, 3.11669921875, 3.264404296875, 3.412109375, 3.559814453125, 3.70751953125, 3.855224609375, 4.0029296875, 4.150634765625, 4.29833984375, 4.446044921875, 4.59375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 9.0, 5.0, 9.0, 4.0, 14.0, 17.0, 19.0, 35.0, 54.0, 64.0, 145.0, 189.0, 273.0, 426.0, 578.0, 990.0, 1572.0, 2488.0, 4299.0, 7572.0, 14525.0, 31247.0, 79090.0, 247441.0, 410558.0, 147958.0, 51739.0, 21915.0, 10560.0, 5714.0, 3419.0, 2021.0, 1194.0, 823.0, 551.0, 336.0, 221.0, 144.0, 113.0, 66.0, 51.0, 32.0, 25.0, 18.0, 16.0, 4.0, 5.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.039642333984375, -0.03833341598510742, -0.037024497985839844, -0.035715579986572266, -0.03440666198730469, -0.03309774398803711, -0.03178882598876953, -0.030479907989501953, -0.029170989990234375, -0.027862071990966797, -0.02655315399169922, -0.02524423599243164, -0.023935317993164062, -0.022626399993896484, -0.021317481994628906, -0.020008563995361328, -0.01869964599609375, -0.017390727996826172, -0.016081809997558594, -0.014772891998291016, -0.013463973999023438, -0.01215505599975586, -0.010846138000488281, -0.009537220001220703, -0.008228302001953125, -0.006919384002685547, -0.005610466003417969, -0.004301548004150391, -0.0029926300048828125, -0.0016837120056152344, -0.00037479400634765625, 0.0009341239929199219, 0.0022430419921875, 0.003551959991455078, 0.004860877990722656, 0.006169795989990234, 0.0074787139892578125, 0.00878763198852539, 0.010096549987792969, 0.011405467987060547, 0.012714385986328125, 0.014023303985595703, 0.015332221984863281, 0.01664113998413086, 0.017950057983398438, 0.019258975982666016, 0.020567893981933594, 0.021876811981201172, 0.02318572998046875, 0.024494647979736328, 0.025803565979003906, 0.027112483978271484, 0.028421401977539062, 0.02973031997680664, 0.03103923797607422, 0.0323481559753418, 0.033657073974609375, 0.03496599197387695, 0.03627490997314453, 0.03758382797241211, 0.03889274597167969, 0.040201663970947266, 0.041510581970214844, 0.04281949996948242, 0.04412841796875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 4.0, 2.0, 3.0, 10.0, 14.0, 17.0, 34.0, 29.0, 42.0, 78.0, 87.0, 122.0, 151.0, 91.0, 91.0, 75.0, 57.0, 26.0, 26.0, 18.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00012731552124023438, -0.0001232437789440155, -0.00011917203664779663, -0.00011510029435157776, -0.00011102855205535889, -0.00010695680975914001, -0.00010288506746292114, -9.881332516670227e-05, -9.47415828704834e-05, -9.066984057426453e-05, -8.659809827804565e-05, -8.252635598182678e-05, -7.845461368560791e-05, -7.438287138938904e-05, -7.031112909317017e-05, -6.62393867969513e-05, -6.216764450073242e-05, -5.809590220451355e-05, -5.402415990829468e-05, -4.9952417612075806e-05, -4.5880675315856934e-05, -4.180893301963806e-05, -3.773719072341919e-05, -3.366544842720032e-05, -2.9593706130981445e-05, -2.5521963834762573e-05, -2.14502215385437e-05, -1.737847924232483e-05, -1.3306736946105957e-05, -9.234994649887085e-06, -5.163252353668213e-06, -1.0915100574493408e-06, 2.9802322387695312e-06, 7.051974534988403e-06, 1.1123716831207275e-05, 1.5195459127426147e-05, 1.926720142364502e-05, 2.333894371986389e-05, 2.7410686016082764e-05, 3.1482428312301636e-05, 3.555417060852051e-05, 3.962591290473938e-05, 4.369765520095825e-05, 4.7769397497177124e-05, 5.1841139793395996e-05, 5.591288208961487e-05, 5.998462438583374e-05, 6.405636668205261e-05, 6.812810897827148e-05, 7.219985127449036e-05, 7.627159357070923e-05, 8.03433358669281e-05, 8.441507816314697e-05, 8.848682045936584e-05, 9.255856275558472e-05, 9.663030505180359e-05, 0.00010070204734802246, 0.00010477378964424133, 0.0001088455319404602, 0.00011291727423667908, 0.00011698901653289795, 0.00012106075882911682, 0.0001251325011253357, 0.00012920424342155457, 0.00013327598571777344]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 6.0, 2.0, 7.0, 9.0, 6.0, 9.0, 14.0, 13.0, 28.0, 18.0, 34.0, 55.0, 76.0, 130.0, 281.0, 2840.0, 889406.0, 153775.0, 1276.0, 213.0, 108.0, 67.0, 44.0, 39.0, 23.0, 20.0, 13.0, 10.0, 3.0, 6.0, 5.0, 5.0, 1.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.283935546875, -0.2747383117675781, -0.26554107666015625, -0.2563438415527344, -0.2471466064453125, -0.23794937133789062, -0.22875213623046875, -0.21955490112304688, -0.210357666015625, -0.20116043090820312, -0.19196319580078125, -0.18276596069335938, -0.1735687255859375, -0.16437149047851562, -0.15517425537109375, -0.14597702026367188, -0.13677978515625, -0.12758255004882812, -0.11838531494140625, -0.10918807983398438, -0.0999908447265625, -0.09079360961914062, -0.08159637451171875, -0.07239913940429688, -0.063201904296875, -0.054004669189453125, -0.04480743408203125, -0.035610198974609375, -0.0264129638671875, -0.017215728759765625, -0.00801849365234375, 0.001178741455078125, 0.0103759765625, 0.019573211669921875, 0.02877044677734375, 0.037967681884765625, 0.0471649169921875, 0.056362152099609375, 0.06555938720703125, 0.07475662231445312, 0.083953857421875, 0.09315109252929688, 0.10234832763671875, 0.11154556274414062, 0.1207427978515625, 0.12994003295898438, 0.13913726806640625, 0.14833450317382812, 0.15753173828125, 0.16672897338867188, 0.17592620849609375, 0.18512344360351562, 0.1943206787109375, 0.20351791381835938, 0.21271514892578125, 0.22191238403320312, 0.231109619140625, 0.24030685424804688, 0.24950408935546875, 0.2587013244628906, 0.2678985595703125, 0.2770957946777344, 0.28629302978515625, 0.2954902648925781, 0.3046875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 9.0, 3.0, 13.0, 14.0, 12.0, 24.0, 29.0, 40.0, 39.0, 60.0, 90.0, 72.0, 66.0, 67.0, 70.0, 64.0, 62.0, 58.0, 53.0, 37.0, 27.0, 23.0, 20.0, 6.0, 12.0, 9.0, 6.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0167236328125, -0.016206026077270508, -0.015688419342041016, -0.015170812606811523, -0.014653205871582031, -0.014135599136352539, -0.013617992401123047, -0.013100385665893555, -0.012582778930664062, -0.01206517219543457, -0.011547565460205078, -0.011029958724975586, -0.010512351989746094, -0.009994745254516602, -0.00947713851928711, -0.008959531784057617, -0.008441925048828125, -0.007924318313598633, -0.007406711578369141, -0.0068891048431396484, -0.006371498107910156, -0.005853891372680664, -0.005336284637451172, -0.00481867790222168, -0.0043010711669921875, -0.0037834644317626953, -0.003265857696533203, -0.002748250961303711, -0.0022306442260742188, -0.0017130374908447266, -0.0011954307556152344, -0.0006778240203857422, -0.00016021728515625, 0.0003573894500732422, 0.0008749961853027344, 0.0013926029205322266, 0.0019102096557617188, 0.002427816390991211, 0.002945423126220703, 0.0034630298614501953, 0.0039806365966796875, 0.00449824333190918, 0.005015850067138672, 0.005533456802368164, 0.006051063537597656, 0.0065686702728271484, 0.007086277008056641, 0.007603883743286133, 0.008121490478515625, 0.008639097213745117, 0.00915670394897461, 0.009674310684204102, 0.010191917419433594, 0.010709524154663086, 0.011227130889892578, 0.01174473762512207, 0.012262344360351562, 0.012779951095581055, 0.013297557830810547, 0.013815164566040039, 0.014332771301269531, 0.014850378036499023, 0.015367984771728516, 0.015885591506958008, 0.0164031982421875]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 10.0, 16.0, 25.0, 57.0, 84.0, 160.0, 221.0, 196.0, 115.0, 58.0, 24.0, 18.0, 5.0, 8.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.7264084815979, -7.520515441894531, -7.314622402191162, -7.108729362487793, -6.902836799621582, -6.696943759918213, -6.491050720214844, -6.285157680511475, -6.0792646408081055, -5.873371601104736, -5.667478561401367, -5.461585998535156, -5.255692958831787, -5.049799919128418, -4.843906879425049, -4.63801383972168, -4.432121276855469, -4.2262282371521, -4.0203351974487305, -3.8144423961639404, -3.6085493564605713, -3.4026565551757812, -3.196763515472412, -2.990870475769043, -2.784977436065674, -2.5790843963623047, -2.3731915950775146, -2.1672985553741455, -1.9614055156707764, -1.7555125951766968, -1.5496196746826172, -1.343726634979248, -1.137833595275879, -0.9319406151771545, -0.7260476350784302, -0.5201547145843506, -0.3142617344856262, -0.10836875438690186, 0.09752416610717773, 0.3034172058105469, 0.5093101263046265, 0.7152031064033508, 0.9210960865020752, 1.1269890069961548, 1.3328819274902344, 1.5387749671936035, 1.744667887687683, 1.9505609273910522, 2.156453847885132, 2.362346887588501, 2.568239688873291, 2.77413272857666, 2.9800257682800293, 3.1859188079833984, 3.3918116092681885, 3.5977046489715576, 3.8035974502563477, 4.009490489959717, 4.215383529663086, 4.421276092529297, 4.627169132232666, 4.833062171936035, 5.038955211639404, 5.244848251342773, 5.450741291046143]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 8.0, 6.0, 8.0, 17.0, 19.0, 35.0, 31.0, 46.0, 69.0, 77.0, 75.0, 90.0, 108.0, 84.0, 73.0, 59.0, 48.0, 42.0, 29.0, 26.0, 17.0, 9.0, 13.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.077665328979492, -5.917468547821045, -5.757272243499756, -5.597075462341309, -5.4368791580200195, -5.276682376861572, -5.116485595703125, -4.956289291381836, -4.796092510223389, -4.635895729064941, -4.475699424743652, -4.315502643585205, -4.155305862426758, -3.9951095581054688, -3.8349127769470215, -3.6747162342071533, -3.514519691467285, -3.354323148727417, -3.194126605987549, -3.0339298248291016, -2.8737332820892334, -2.7135367393493652, -2.553339958190918, -2.39314341545105, -2.2329468727111816, -2.0727503299713135, -1.9125536680221558, -1.752357006072998, -1.5921604633331299, -1.4319639205932617, -1.271767258644104, -1.1115705966949463, -0.9513735771179199, -0.791176974773407, -0.630980372428894, -0.4707837700843811, -0.31058716773986816, -0.15039056539535522, 0.009806036949157715, 0.17000269889831543, 0.3301992416381836, 0.49039584398269653, 0.6505924463272095, 0.8107890486717224, 0.9709856510162354, 1.1311821937561035, 1.2913788557052612, 1.451575517654419, 1.611772060394287, 1.7719686031341553, 1.932165265083313, 2.0923619270324707, 2.252558469772339, 2.412755012512207, 2.5729517936706543, 2.7331483364105225, 2.8933448791503906, 3.053541421890259, 3.213737964630127, 3.373934745788574, 3.5341312885284424, 3.6943278312683105, 3.854524612426758, 4.014720916748047, 4.174917697906494]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 12.0, 12.0, 10.0, 19.0, 23.0, 25.0, 33.0, 68.0, 90.0, 127.0, 211.0, 344.0, 576.0, 993.0, 1850.0, 3644.0, 7722.0, 20555.0, 75359.0, 508032.0, 342781.0, 55837.0, 16590.0, 6473.0, 3193.0, 1648.0, 882.0, 513.0, 338.0, 194.0, 132.0, 64.0, 53.0, 44.0, 31.0, 18.0, 23.0, 11.0, 7.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.962890625, -3.842437744140625, -3.72198486328125, -3.601531982421875, -3.4810791015625, -3.360626220703125, -3.24017333984375, -3.119720458984375, -2.999267578125, -2.878814697265625, -2.75836181640625, -2.637908935546875, -2.5174560546875, -2.397003173828125, -2.27655029296875, -2.156097412109375, -2.03564453125, -1.915191650390625, -1.79473876953125, -1.674285888671875, -1.5538330078125, -1.433380126953125, -1.31292724609375, -1.192474365234375, -1.072021484375, -0.951568603515625, -0.83111572265625, -0.710662841796875, -0.5902099609375, -0.469757080078125, -0.34930419921875, -0.228851318359375, -0.1083984375, 0.012054443359375, 0.13250732421875, 0.252960205078125, 0.3734130859375, 0.493865966796875, 0.61431884765625, 0.734771728515625, 0.855224609375, 0.975677490234375, 1.09613037109375, 1.216583251953125, 1.3370361328125, 1.457489013671875, 1.57794189453125, 1.698394775390625, 1.81884765625, 1.939300537109375, 2.05975341796875, 2.180206298828125, 2.3006591796875, 2.421112060546875, 2.54156494140625, 2.662017822265625, 2.782470703125, 2.902923583984375, 3.02337646484375, 3.143829345703125, 3.2642822265625, 3.384735107421875, 3.50518798828125, 3.625640869140625, 3.74609375]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 2.0, 7.0, 9.0, 8.0, 21.0, 30.0, 28.0, 30.0, 37.0, 54.0, 48.0, 50.0, 59.0, 82.0, 67.0, 68.0, 67.0, 67.0, 61.0, 40.0, 46.0, 30.0, 26.0, 19.0, 16.0, 10.0, 3.0, 8.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.78125, -23.068115234375, -22.35498046875, -21.641845703125, -20.9287109375, -20.215576171875, -19.50244140625, -18.789306640625, -18.076171875, -17.363037109375, -16.64990234375, -15.936767578125, -15.2236328125, -14.510498046875, -13.79736328125, -13.084228515625, -12.37109375, -11.657958984375, -10.94482421875, -10.231689453125, -9.5185546875, -8.805419921875, -8.09228515625, -7.379150390625, -6.666015625, -5.952880859375, -5.23974609375, -4.526611328125, -3.8134765625, -3.100341796875, -2.38720703125, -1.674072265625, -0.9609375, -0.247802734375, 0.46533203125, 1.178466796875, 1.8916015625, 2.604736328125, 3.31787109375, 4.031005859375, 4.744140625, 5.457275390625, 6.17041015625, 6.883544921875, 7.5966796875, 8.309814453125, 9.02294921875, 9.736083984375, 10.44921875, 11.162353515625, 11.87548828125, 12.588623046875, 13.3017578125, 14.014892578125, 14.72802734375, 15.441162109375, 16.154296875, 16.867431640625, 17.58056640625, 18.293701171875, 19.0068359375, 19.719970703125, 20.43310546875, 21.146240234375, 21.859375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 2.0, 11.0, 15.0, 8.0, 22.0, 23.0, 32.0, 56.0, 76.0, 109.0, 680.0, 1046933.0, 224.0, 107.0, 87.0, 59.0, 25.0, 22.0, 15.0, 9.0, 9.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-110.125, -106.4951171875, -102.865234375, -99.2353515625, -95.60546875, -91.9755859375, -88.345703125, -84.7158203125, -81.0859375, -77.4560546875, -73.826171875, -70.1962890625, -66.56640625, -62.9365234375, -59.306640625, -55.6767578125, -52.046875, -48.4169921875, -44.787109375, -41.1572265625, -37.52734375, -33.8974609375, -30.267578125, -26.6376953125, -23.0078125, -19.3779296875, -15.748046875, -12.1181640625, -8.48828125, -4.8583984375, -1.228515625, 2.4013671875, 6.03125, 9.6611328125, 13.291015625, 16.9208984375, 20.55078125, 24.1806640625, 27.810546875, 31.4404296875, 35.0703125, 38.7001953125, 42.330078125, 45.9599609375, 49.58984375, 53.2197265625, 56.849609375, 60.4794921875, 64.109375, 67.7392578125, 71.369140625, 74.9990234375, 78.62890625, 82.2587890625, 85.888671875, 89.5185546875, 93.1484375, 96.7783203125, 100.408203125, 104.0380859375, 107.66796875, 111.2978515625, 114.927734375, 118.5576171875, 122.1875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 2.0, 11.0, 15.0, 8.0, 22.0, 24.0, 31.0, 56.0, 77.0, 84.0, 97.0, 114.0, 115.0, 91.0, 85.0, 58.0, 27.0, 22.0, 15.0, 9.0, 9.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-39.8125, -38.5, -37.1875, -35.875, -34.5625, -33.25, -31.9375, -30.625, -29.3125, -28.0, -26.6875, -25.375, -24.0625, -22.75, -21.4375, -20.125, -18.8125, -17.5, -16.1875, -14.875, -13.5625, -12.25, -10.9375, -9.625, -8.3125, -7.0, -5.6875, -4.375, -3.0625, -1.75, -0.4375, 0.875, 2.1875, 3.5, 4.8125, 6.125, 7.4375, 8.75, 10.0625, 11.375, 12.6875, 14.0, 15.3125, 16.625, 17.9375, 19.25, 20.5625, 21.875, 23.1875, 24.5, 25.8125, 27.125, 28.4375, 29.75, 31.0625, 32.375, 33.6875, 35.0, 36.3125, 37.625, 38.9375, 40.25, 41.5625, 42.875, 44.1875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 8.0, 9.0, 11.0, 10.0, 40.0, 48.0, 52.0, 90.0, 183.0, 282.0, 624.0, 1522.0, 3976.0, 18175.0, 965301.0, 48315.0, 6002.0, 1990.0, 874.0, 413.0, 223.0, 135.0, 92.0, 58.0, 34.0, 23.0, 14.0, 13.0, 7.0, 4.0, 6.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.701171875, -0.6767196655273438, -0.6522674560546875, -0.6278152465820312, -0.603363037109375, -0.5789108276367188, -0.5544586181640625, -0.5300064086914062, -0.50555419921875, -0.48110198974609375, -0.4566497802734375, -0.43219757080078125, -0.407745361328125, -0.38329315185546875, -0.3588409423828125, -0.33438873291015625, -0.3099365234375, -0.28548431396484375, -0.2610321044921875, -0.23657989501953125, -0.212127685546875, -0.18767547607421875, -0.1632232666015625, -0.13877105712890625, -0.11431884765625, -0.08986663818359375, -0.0654144287109375, -0.04096221923828125, -0.016510009765625, 0.00794219970703125, 0.0323944091796875, 0.05684661865234375, 0.081298828125, 0.10575103759765625, 0.1302032470703125, 0.15465545654296875, 0.179107666015625, 0.20355987548828125, 0.2280120849609375, 0.25246429443359375, 0.27691650390625, 0.30136871337890625, 0.3258209228515625, 0.35027313232421875, 0.374725341796875, 0.39917755126953125, 0.4236297607421875, 0.44808197021484375, 0.4725341796875, 0.49698638916015625, 0.5214385986328125, 0.5458908081054688, 0.570343017578125, 0.5947952270507812, 0.6192474365234375, 0.6436996459960938, 0.66815185546875, 0.6926040649414062, 0.7170562744140625, 0.7415084838867188, 0.765960693359375, 0.7904129028320312, 0.8148651123046875, 0.8393173217773438, 0.86376953125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 8.0, 6.0, 2.0, 7.0, 3.0, 4.0, 9.0, 21.0, 52.0, 280.0, 469.0, 68.0, 24.0, 13.0, 14.0, 11.0, 4.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0005064010620117188, -0.0004954207688570023, -0.00048444047570228577, -0.0004734601825475693, -0.0004624798893928528, -0.0004514995962381363, -0.0004405193030834198, -0.0004295390099287033, -0.0004185587167739868, -0.0004075784236192703, -0.00039659813046455383, -0.00038561783730983734, -0.00037463754415512085, -0.00036365725100040436, -0.00035267695784568787, -0.0003416966646909714, -0.0003307163715362549, -0.0003197360783815384, -0.0003087557852268219, -0.0002977754920721054, -0.0002867951989173889, -0.0002758149057626724, -0.00026483461260795593, -0.00025385431945323944, -0.00024287402629852295, -0.00023189373314380646, -0.00022091343998908997, -0.00020993314683437347, -0.00019895285367965698, -0.0001879725605249405, -0.000176992267370224, -0.0001660119742155075, -0.00015503168106079102, -0.00014405138790607452, -0.00013307109475135803, -0.00012209080159664154, -0.00011111050844192505, -0.00010013021528720856, -8.914992213249207e-05, -7.816962897777557e-05, -6.718933582305908e-05, -5.620904266834259e-05, -4.52287495136261e-05, -3.424845635890961e-05, -2.3268163204193115e-05, -1.2287870049476624e-05, -1.3075768947601318e-06, 9.67271625995636e-06, 2.065300941467285e-05, 3.163330256938934e-05, 4.2613595724105835e-05, 5.359388887882233e-05, 6.457418203353882e-05, 7.555447518825531e-05, 8.65347683429718e-05, 9.75150614976883e-05, 0.00010849535465240479, 0.00011947564780712128, 0.00013045594096183777, 0.00014143623411655426, 0.00015241652727127075, 0.00016339682042598724, 0.00017437711358070374, 0.00018535740673542023, 0.00019633769989013672]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 1.0, 5.0, 4.0, 8.0, 17.0, 23.0, 32.0, 69.0, 175.0, 276.0, 632.0, 1550.0, 4439.0, 25706.0, 979165.0, 28703.0, 4817.0, 1645.0, 648.0, 295.0, 138.0, 95.0, 38.0, 20.0, 18.0, 3.0, 10.0, 7.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-1.009765625, -0.983551025390625, -0.95733642578125, -0.931121826171875, -0.9049072265625, -0.878692626953125, -0.85247802734375, -0.826263427734375, -0.800048828125, -0.773834228515625, -0.74761962890625, -0.721405029296875, -0.6951904296875, -0.668975830078125, -0.64276123046875, -0.616546630859375, -0.59033203125, -0.564117431640625, -0.53790283203125, -0.511688232421875, -0.4854736328125, -0.459259033203125, -0.43304443359375, -0.406829833984375, -0.380615234375, -0.354400634765625, -0.32818603515625, -0.301971435546875, -0.2757568359375, -0.249542236328125, -0.22332763671875, -0.197113037109375, -0.1708984375, -0.144683837890625, -0.11846923828125, -0.092254638671875, -0.0660400390625, -0.039825439453125, -0.01361083984375, 0.012603759765625, 0.038818359375, 0.065032958984375, 0.09124755859375, 0.117462158203125, 0.1436767578125, 0.169891357421875, 0.19610595703125, 0.222320556640625, 0.24853515625, 0.274749755859375, 0.30096435546875, 0.327178955078125, 0.3533935546875, 0.379608154296875, 0.40582275390625, 0.432037353515625, 0.458251953125, 0.484466552734375, 0.51068115234375, 0.536895751953125, 0.5631103515625, 0.589324951171875, 0.61553955078125, 0.641754150390625, 0.66796875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 8.0, 8.0, 21.0, 25.0, 40.0, 100.0, 335.0, 268.0, 78.0, 35.0, 20.0, 17.0, 7.0, 10.0, 8.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.2412109375, -0.2348499298095703, -0.22848892211914062, -0.22212791442871094, -0.21576690673828125, -0.20940589904785156, -0.20304489135742188, -0.1966838836669922, -0.1903228759765625, -0.1839618682861328, -0.17760086059570312, -0.17123985290527344, -0.16487884521484375, -0.15851783752441406, -0.15215682983398438, -0.1457958221435547, -0.139434814453125, -0.1330738067626953, -0.12671279907226562, -0.12035179138183594, -0.11399078369140625, -0.10762977600097656, -0.10126876831054688, -0.09490776062011719, -0.0885467529296875, -0.08218574523925781, -0.07582473754882812, -0.06946372985839844, -0.06310272216796875, -0.05674171447753906, -0.050380706787109375, -0.04401969909667969, -0.03765869140625, -0.03129768371582031, -0.024936676025390625, -0.018575668334960938, -0.01221466064453125, -0.0058536529541015625, 0.000507354736328125, 0.0068683624267578125, 0.0132293701171875, 0.019590377807617188, 0.025951385498046875, 0.03231239318847656, 0.03867340087890625, 0.04503440856933594, 0.051395416259765625, 0.05775642395019531, 0.064117431640625, 0.07047843933105469, 0.07683944702148438, 0.08320045471191406, 0.08956146240234375, 0.09592247009277344, 0.10228347778320312, 0.10864448547363281, 0.1150054931640625, 0.12136650085449219, 0.12772750854492188, 0.13408851623535156, 0.14044952392578125, 0.14681053161621094, 0.15317153930664062, 0.1595325469970703, 0.1658935546875]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 34.0, 292.0, 590.0, 85.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.87194538116455, -13.546290397644043, -12.220634460449219, -10.894979476928711, -9.569324493408203, -8.243669509887695, -6.918014049530029, -5.592358589172363, -4.2667036056518555, -2.9410483837127686, -1.6153931617736816, -0.2897379398345947, 1.0359172821044922, 2.361572265625, 3.687227725982666, 5.012883186340332, 6.33853816986084, 7.664193153381348, 8.989849090576172, 10.31550407409668, 11.641159057617188, 12.966814041137695, 14.292469024658203, 15.618124961853027, 16.94377899169922, 18.269433975219727, 19.595088958740234, 20.920743942260742, 22.24639892578125, 23.57205581665039, 24.8977108001709, 26.223365783691406, 27.54901885986328, 28.87467384338379, 30.200328826904297, 31.525983810424805, 32.85163879394531, 34.17729568481445, 35.50294876098633, 36.82860565185547, 38.154258728027344, 39.479915618896484, 40.80556869506836, 42.1312255859375, 43.456878662109375, 44.782535552978516, 46.10818862915039, 47.43384552001953, 48.75950241088867, 50.08515930175781, 51.41081237792969, 52.73646926879883, 54.0621223449707, 55.387779235839844, 56.71343231201172, 58.03908920288086, 59.36474609375, 60.69040298461914, 62.016056060791016, 63.341712951660156, 64.66736602783203, 65.9930191040039, 67.31867980957031, 68.64433288574219, 69.96998596191406]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 0.0, 2.0, 5.0, 2.0, 2.0, 7.0, 5.0, 6.0, 11.0, 14.0, 14.0, 24.0, 18.0, 25.0, 24.0, 17.0, 36.0, 27.0, 56.0, 30.0, 48.0, 50.0, 37.0, 33.0, 50.0, 38.0, 41.0, 54.0, 46.0, 23.0, 34.0, 41.0, 27.0, 25.0, 18.0, 17.0, 17.0, 18.0, 19.0, 15.0, 8.0, 7.0, 2.0, 4.0, 7.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.436553955078125, -18.712158203125, -17.987762451171875, -17.263364791870117, -16.538969039916992, -15.814573287963867, -15.090176582336426, -14.365779876708984, -13.64138412475586, -12.916988372802734, -12.192591667175293, -11.468194961547852, -10.743799209594727, -10.019403457641602, -9.29500675201416, -8.570610046386719, -7.846214294433594, -7.1218180656433105, -6.397421836853027, -5.673025608062744, -4.948629379272461, -4.224233150482178, -3.4998369216918945, -2.7754406929016113, -2.051044464111328, -1.326648235321045, -0.6022520065307617, 0.12214422225952148, 0.8465404510498047, 1.570936679840088, 2.295332908630371, 3.0197291374206543, 3.7441272735595703, 4.4685235023498535, 5.192919731140137, 5.91731595993042, 6.641712188720703, 7.366108417510986, 8.09050464630127, 8.814901351928711, 9.539297103881836, 10.263692855834961, 10.988089561462402, 11.712486267089844, 12.436882019042969, 13.161277770996094, 13.885674476623535, 14.610071182250977, 15.334466934204102, 16.058862686157227, 16.783260345458984, 17.50765609741211, 18.232051849365234, 18.95644760131836, 19.680843353271484, 20.405241012573242, 21.129636764526367, 21.854032516479492, 22.57843017578125, 23.302825927734375, 24.0272216796875, 24.751617431640625, 25.47601318359375, 26.200410842895508, 26.924806594848633]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 10.0, 22.0, 50.0, 48.0, 74.0, 103.0, 354.0, 108745.0, 4083550.0, 980.0, 107.0, 81.0, 59.0, 35.0, 23.0, 14.0, 11.0, 8.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.6875, -18.46875, -17.25, -16.03125, -14.8125, -13.59375, -12.375, -11.15625, -9.9375, -8.71875, -7.5, -6.28125, -5.0625, -3.84375, -2.625, -1.40625, -0.1875, 1.03125, 2.25, 3.46875, 4.6875, 5.90625, 7.125, 8.34375, 9.5625, 10.78125, 12.0, 13.21875, 14.4375, 15.65625, 16.875, 18.09375, 19.3125, 20.53125, 21.75, 22.96875, 24.1875, 25.40625, 26.625, 27.84375, 29.0625, 30.28125, 31.5, 32.71875, 33.9375, 35.15625, 36.375, 37.59375, 38.8125, 40.03125, 41.25, 42.46875, 43.6875, 44.90625, 46.125, 47.34375, 48.5625, 49.78125, 51.0, 52.21875, 53.4375, 54.65625, 55.875, 57.09375, 58.3125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 9.0, 3.0, 9.0, 9.0, 23.0, 29.0, 43.0, 63.0, 73.0, 95.0, 119.0, 110.0, 113.0, 102.0, 73.0, 53.0, 30.0, 18.0, 14.0, 14.0, 2.0, 0.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.59375, -7.40924072265625, -7.2247314453125, -7.04022216796875, -6.855712890625, -6.67120361328125, -6.4866943359375, -6.30218505859375, -6.11767578125, -5.93316650390625, -5.7486572265625, -5.56414794921875, -5.379638671875, -5.19512939453125, -5.0106201171875, -4.82611083984375, -4.6416015625, -4.45709228515625, -4.2725830078125, -4.08807373046875, -3.903564453125, -3.71905517578125, -3.5345458984375, -3.35003662109375, -3.16552734375, -2.98101806640625, -2.7965087890625, -2.61199951171875, -2.427490234375, -2.24298095703125, -2.0584716796875, -1.87396240234375, -1.689453125, -1.50494384765625, -1.3204345703125, -1.13592529296875, -0.951416015625, -0.76690673828125, -0.5823974609375, -0.39788818359375, -0.21337890625, -0.02886962890625, 0.1556396484375, 0.34014892578125, 0.524658203125, 0.70916748046875, 0.8936767578125, 1.07818603515625, 1.2626953125, 1.44720458984375, 1.6317138671875, 1.81622314453125, 2.000732421875, 2.18524169921875, 2.3697509765625, 2.55426025390625, 2.73876953125, 2.92327880859375, 3.1077880859375, 3.29229736328125, 3.476806640625, 3.66131591796875, 3.8458251953125, 4.03033447265625, 4.21484375]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 3.0, 3.0, 3.0, 6.0, 6.0, 15.0, 38.0, 85.0, 238.0, 620.0, 4190872.0, 1746.0, 395.0, 126.0, 70.0, 22.0, 12.0, 6.0, 3.0, 6.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.9375, -114.4404296875, -110.943359375, -107.4462890625, -103.94921875, -100.4521484375, -96.955078125, -93.4580078125, -89.9609375, -86.4638671875, -82.966796875, -79.4697265625, -75.97265625, -72.4755859375, -68.978515625, -65.4814453125, -61.984375, -58.4873046875, -54.990234375, -51.4931640625, -47.99609375, -44.4990234375, -41.001953125, -37.5048828125, -34.0078125, -30.5107421875, -27.013671875, -23.5166015625, -20.01953125, -16.5224609375, -13.025390625, -9.5283203125, -6.03125, -2.5341796875, 0.962890625, 4.4599609375, 7.95703125, 11.4541015625, 14.951171875, 18.4482421875, 21.9453125, 25.4423828125, 28.939453125, 32.4365234375, 35.93359375, 39.4306640625, 42.927734375, 46.4248046875, 49.921875, 53.4189453125, 56.916015625, 60.4130859375, 63.91015625, 67.4072265625, 70.904296875, 74.4013671875, 77.8984375, 81.3955078125, 84.892578125, 88.3896484375, 91.88671875, 95.3837890625, 98.880859375, 102.3779296875, 105.875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 9.0, 2.0, 9.0, 9.0, 16.0, 24.0, 27.0, 49.0, 74.0, 142.0, 298.0, 670.0, 1088.0, 799.0, 395.0, 209.0, 97.0, 50.0, 30.0, 26.0, 20.0, 13.0, 8.0, 2.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.62109375, -2.5649261474609375, -2.508758544921875, -2.4525909423828125, -2.39642333984375, -2.3402557373046875, -2.284088134765625, -2.2279205322265625, -2.1717529296875, -2.1155853271484375, -2.059417724609375, -2.0032501220703125, -1.94708251953125, -1.8909149169921875, -1.834747314453125, -1.7785797119140625, -1.722412109375, -1.6662445068359375, -1.610076904296875, -1.5539093017578125, -1.49774169921875, -1.4415740966796875, -1.385406494140625, -1.3292388916015625, -1.2730712890625, -1.2169036865234375, -1.160736083984375, -1.1045684814453125, -1.04840087890625, -0.9922332763671875, -0.936065673828125, -0.8798980712890625, -0.82373046875, -0.7675628662109375, -0.711395263671875, -0.6552276611328125, -0.59906005859375, -0.5428924560546875, -0.486724853515625, -0.4305572509765625, -0.3743896484375, -0.3182220458984375, -0.262054443359375, -0.2058868408203125, -0.14971923828125, -0.0935516357421875, -0.037384033203125, 0.0187835693359375, 0.074951171875, 0.1311187744140625, 0.187286376953125, 0.2434539794921875, 0.29962158203125, 0.3557891845703125, 0.411956787109375, 0.4681243896484375, 0.5242919921875, 0.5804595947265625, 0.636627197265625, 0.6927947998046875, 0.74896240234375, 0.8051300048828125, 0.861297607421875, 0.9174652099609375, 0.9736328125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 9.0, 13.0, 15.0, 25.0, 27.0, 65.0, 66.0, 112.0, 121.0, 133.0, 120.0, 87.0, 69.0, 48.0, 23.0, 22.0, 11.0, 5.0, 12.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.342113971710205, -3.1774590015411377, -3.0128040313720703, -2.848149061203003, -2.6834940910339355, -2.518838882446289, -2.3541839122772217, -2.1895289421081543, -2.024873971939087, -1.8602190017700195, -1.6955640316009521, -1.5309089422225952, -1.3662539720535278, -1.2015990018844604, -1.0369439125061035, -0.8722889423370361, -0.7076339721679688, -0.5429790019989014, -0.3783239722251892, -0.21366897225379944, -0.04901397228240967, 0.11564099788665771, 0.2802960276603699, 0.44495105743408203, 0.6096060276031494, 0.7742609977722168, 0.938916027545929, 1.1035710573196411, 1.2682260274887085, 1.4328809976577759, 1.5975360870361328, 1.7621910572052002, 1.9268465042114258, 2.091501474380493, 2.2561564445495605, 2.420811414718628, 2.5854663848876953, 2.750121593475342, 2.914776563644409, 3.0794315338134766, 3.244086503982544, 3.4087414741516113, 3.5733964443206787, 3.738051414489746, 3.9027066230773926, 4.067361354827881, 4.232016563415527, 4.396671295166016, 4.561326503753662, 4.725981712341309, 4.890636444091797, 5.055291652679443, 5.219946384429932, 5.384601593017578, 5.549256324768066, 5.713911533355713, 5.878566741943359, 6.043221950531006, 6.207876682281494, 6.372531890869141, 6.537186622619629, 6.701841831207275, 6.866496562957764, 7.03115177154541, 7.195806503295898]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 3.0, 10.0, 10.0, 21.0, 22.0, 33.0, 33.0, 43.0, 58.0, 64.0, 61.0, 80.0, 87.0, 79.0, 84.0, 65.0, 59.0, 56.0, 45.0, 31.0, 17.0, 16.0, 7.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.086147308349609, -5.932651519775391, -5.779155731201172, -5.625659942626953, -5.472164154052734, -5.318668365478516, -5.165172576904297, -5.011676788330078, -4.858180999755859, -4.704685211181641, -4.551189422607422, -4.397693634033203, -4.244197845458984, -4.090702056884766, -3.937206268310547, -3.783710479736328, -3.6302146911621094, -3.4767189025878906, -3.323223114013672, -3.169727325439453, -3.0162315368652344, -2.8627357482910156, -2.709239959716797, -2.555744171142578, -2.4022483825683594, -2.2487525939941406, -2.095256805419922, -1.9417610168457031, -1.7882652282714844, -1.6347694396972656, -1.4812736511230469, -1.3277778625488281, -1.1742815971374512, -1.0207858085632324, -0.8672900199890137, -0.7137942314147949, -0.5602984428405762, -0.4068026542663574, -0.25330686569213867, -0.09981107711791992, 0.05368471145629883, 0.20718050003051758, 0.36067628860473633, 0.5141720771789551, 0.6676678657531738, 0.8211636543273926, 0.9746594429016113, 1.12815523147583, 1.2816510200500488, 1.4351468086242676, 1.5886425971984863, 1.742138385772705, 1.8956341743469238, 2.0491299629211426, 2.2026257514953613, 2.35612154006958, 2.509617328643799, 2.6631131172180176, 2.8166089057922363, 2.970104694366455, 3.123600482940674, 3.2770962715148926, 3.4305920600891113, 3.58408784866333, 3.737583637237549]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 0.0, 8.0, 7.0, 6.0, 17.0, 13.0, 29.0, 41.0, 63.0, 101.0, 183.0, 369.0, 819.0, 1772.0, 4718.0, 19568.0, 475746.0, 516048.0, 20598.0, 4981.0, 1799.0, 799.0, 362.0, 201.0, 99.0, 66.0, 43.0, 30.0, 23.0, 14.0, 11.0, 6.0, 6.0, 6.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.150390625, -1.1078033447265625, -1.065216064453125, -1.0226287841796875, -0.98004150390625, -0.9374542236328125, -0.894866943359375, -0.8522796630859375, -0.8096923828125, -0.7671051025390625, -0.724517822265625, -0.6819305419921875, -0.63934326171875, -0.5967559814453125, -0.554168701171875, -0.5115814208984375, -0.468994140625, -0.4264068603515625, -0.383819580078125, -0.3412322998046875, -0.29864501953125, -0.2560577392578125, -0.213470458984375, -0.1708831787109375, -0.1282958984375, -0.0857086181640625, -0.043121337890625, -0.0005340576171875, 0.04205322265625, 0.0846405029296875, 0.127227783203125, 0.1698150634765625, 0.21240234375, 0.2549896240234375, 0.297576904296875, 0.3401641845703125, 0.38275146484375, 0.4253387451171875, 0.467926025390625, 0.5105133056640625, 0.5531005859375, 0.5956878662109375, 0.638275146484375, 0.6808624267578125, 0.72344970703125, 0.7660369873046875, 0.808624267578125, 0.8512115478515625, 0.893798828125, 0.9363861083984375, 0.978973388671875, 1.0215606689453125, 1.06414794921875, 1.1067352294921875, 1.149322509765625, 1.1919097900390625, 1.2344970703125, 1.2770843505859375, 1.319671630859375, 1.3622589111328125, 1.40484619140625, 1.4474334716796875, 1.490020751953125, 1.5326080322265625, 1.5751953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 7.0, 13.0, 18.0, 23.0, 19.0, 24.0, 49.0, 58.0, 71.0, 78.0, 81.0, 88.0, 82.0, 78.0, 75.0, 66.0, 47.0, 42.0, 28.0, 17.0, 10.0, 7.0, 6.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.755859375, -3.6556396484375, -3.555419921875, -3.4552001953125, -3.35498046875, -3.2547607421875, -3.154541015625, -3.0543212890625, -2.9541015625, -2.8538818359375, -2.753662109375, -2.6534423828125, -2.55322265625, -2.4530029296875, -2.352783203125, -2.2525634765625, -2.15234375, -2.0521240234375, -1.951904296875, -1.8516845703125, -1.75146484375, -1.6512451171875, -1.551025390625, -1.4508056640625, -1.3505859375, -1.2503662109375, -1.150146484375, -1.0499267578125, -0.94970703125, -0.8494873046875, -0.749267578125, -0.6490478515625, -0.548828125, -0.4486083984375, -0.348388671875, -0.2481689453125, -0.14794921875, -0.0477294921875, 0.052490234375, 0.1527099609375, 0.2529296875, 0.3531494140625, 0.453369140625, 0.5535888671875, 0.65380859375, 0.7540283203125, 0.854248046875, 0.9544677734375, 1.0546875, 1.1549072265625, 1.255126953125, 1.3553466796875, 1.45556640625, 1.5557861328125, 1.656005859375, 1.7562255859375, 1.8564453125, 1.9566650390625, 2.056884765625, 2.1571044921875, 2.25732421875, 2.3575439453125, 2.457763671875, 2.5579833984375, 2.658203125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 6.0, 11.0, 15.0, 18.0, 19.0, 29.0, 41.0, 67.0, 59.0, 98.0, 155.0, 234.0, 396.0, 621.0, 958.0, 1656.0, 2753.0, 4664.0, 7949.0, 14300.0, 25717.0, 47961.0, 90292.0, 167785.0, 247333.0, 196584.0, 109764.0, 57967.0, 30988.0, 16966.0, 9549.0, 5499.0, 3149.0, 1860.0, 1116.0, 685.0, 444.0, 284.0, 183.0, 107.0, 86.0, 54.0, 40.0, 21.0, 20.0, 16.0, 12.0, 10.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0], "bins": [-0.170654296875, -0.16558265686035156, -0.16051101684570312, -0.1554393768310547, -0.15036773681640625, -0.1452960968017578, -0.14022445678710938, -0.13515281677246094, -0.1300811767578125, -0.12500953674316406, -0.11993789672851562, -0.11486625671386719, -0.10979461669921875, -0.10472297668457031, -0.09965133666992188, -0.09457969665527344, -0.089508056640625, -0.08443641662597656, -0.07936477661132812, -0.07429313659667969, -0.06922149658203125, -0.06414985656738281, -0.059078216552734375, -0.05400657653808594, -0.0489349365234375, -0.04386329650878906, -0.038791656494140625, -0.03372001647949219, -0.02864837646484375, -0.023576736450195312, -0.018505096435546875, -0.013433456420898438, -0.00836181640625, -0.0032901763916015625, 0.001781463623046875, 0.0068531036376953125, 0.01192474365234375, 0.016996383666992188, 0.022068023681640625, 0.027139663696289062, 0.0322113037109375, 0.03728294372558594, 0.042354583740234375, 0.04742622375488281, 0.05249786376953125, 0.05756950378417969, 0.06264114379882812, 0.06771278381347656, 0.072784423828125, 0.07785606384277344, 0.08292770385742188, 0.08799934387207031, 0.09307098388671875, 0.09814262390136719, 0.10321426391601562, 0.10828590393066406, 0.1133575439453125, 0.11842918395996094, 0.12350082397460938, 0.1285724639892578, 0.13364410400390625, 0.1387157440185547, 0.14378738403320312, 0.14885902404785156, 0.1539306640625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 9.0, 5.0, 5.0, 11.0, 7.0, 8.0, 8.0, 10.0, 12.0, 15.0, 20.0, 18.0, 30.0, 34.0, 28.0, 36.0, 27.0, 44.0, 32.0, 36.0, 33.0, 36.0, 36.0, 36.0, 33.0, 46.0, 28.0, 40.0, 35.0, 35.0, 30.0, 23.0, 24.0, 33.0, 21.0, 27.0, 10.0, 14.0, 7.0, 12.0, 13.0, 8.0, 8.0, 5.0, 7.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0], "bins": [-2.85546875, -2.768890380859375, -2.68231201171875, -2.595733642578125, -2.5091552734375, -2.422576904296875, -2.33599853515625, -2.249420166015625, -2.162841796875, -2.076263427734375, -1.98968505859375, -1.903106689453125, -1.8165283203125, -1.729949951171875, -1.64337158203125, -1.556793212890625, -1.47021484375, -1.383636474609375, -1.29705810546875, -1.210479736328125, -1.1239013671875, -1.037322998046875, -0.95074462890625, -0.864166259765625, -0.777587890625, -0.691009521484375, -0.60443115234375, -0.517852783203125, -0.4312744140625, -0.344696044921875, -0.25811767578125, -0.171539306640625, -0.0849609375, 0.001617431640625, 0.08819580078125, 0.174774169921875, 0.2613525390625, 0.347930908203125, 0.43450927734375, 0.521087646484375, 0.607666015625, 0.694244384765625, 0.78082275390625, 0.867401123046875, 0.9539794921875, 1.040557861328125, 1.12713623046875, 1.213714599609375, 1.30029296875, 1.386871337890625, 1.47344970703125, 1.560028076171875, 1.6466064453125, 1.733184814453125, 1.81976318359375, 1.906341552734375, 1.992919921875, 2.079498291015625, 2.16607666015625, 2.252655029296875, 2.3392333984375, 2.425811767578125, 2.51239013671875, 2.598968505859375, 2.685546875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 3.0, 7.0, 11.0, 10.0, 17.0, 25.0, 48.0, 61.0, 81.0, 125.0, 196.0, 267.0, 450.0, 726.0, 1314.0, 2377.0, 4349.0, 9065.0, 20184.0, 53669.0, 172870.0, 449635.0, 220778.0, 65867.0, 24332.0, 10413.0, 5128.0, 2695.0, 1508.0, 871.0, 486.0, 349.0, 194.0, 155.0, 75.0, 71.0, 43.0, 30.0, 27.0, 10.0, 12.0, 8.0, 3.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.0369873046875, -0.03594827651977539, -0.03490924835205078, -0.03387022018432617, -0.03283119201660156, -0.03179216384887695, -0.030753135681152344, -0.029714107513427734, -0.028675079345703125, -0.027636051177978516, -0.026597023010253906, -0.025557994842529297, -0.024518966674804688, -0.023479938507080078, -0.02244091033935547, -0.02140188217163086, -0.02036285400390625, -0.01932382583618164, -0.01828479766845703, -0.017245769500732422, -0.016206741333007812, -0.015167713165283203, -0.014128684997558594, -0.013089656829833984, -0.012050628662109375, -0.011011600494384766, -0.009972572326660156, -0.008933544158935547, -0.007894515991210938, -0.006855487823486328, -0.005816459655761719, -0.004777431488037109, -0.0037384033203125, -0.0026993751525878906, -0.0016603469848632812, -0.0006213188171386719, 0.0004177093505859375, 0.0014567375183105469, 0.0024957656860351562, 0.0035347938537597656, 0.004573822021484375, 0.005612850189208984, 0.006651878356933594, 0.007690906524658203, 0.008729934692382812, 0.009768962860107422, 0.010807991027832031, 0.01184701919555664, 0.01288604736328125, 0.01392507553100586, 0.014964103698730469, 0.016003131866455078, 0.017042160034179688, 0.018081188201904297, 0.019120216369628906, 0.020159244537353516, 0.021198272705078125, 0.022237300872802734, 0.023276329040527344, 0.024315357208251953, 0.025354385375976562, 0.026393413543701172, 0.02743244171142578, 0.02847146987915039, 0.029510498046875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 10.0, 7.0, 12.0, 17.0, 28.0, 41.0, 87.0, 102.0, 136.0, 151.0, 130.0, 80.0, 70.0, 43.0, 30.0, 23.0, 10.0, 7.0, 4.0, 2.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.07046890258789e-05, -7.725320756435394e-05, -7.380172610282898e-05, -7.035024464130402e-05, -6.689876317977905e-05, -6.344728171825409e-05, -5.9995800256729126e-05, -5.654431879520416e-05, -5.30928373336792e-05, -4.9641355872154236e-05, -4.618987441062927e-05, -4.273839294910431e-05, -3.9286911487579346e-05, -3.583543002605438e-05, -3.238394856452942e-05, -2.8932467103004456e-05, -2.5480985641479492e-05, -2.202950417995453e-05, -1.8578022718429565e-05, -1.5126541256904602e-05, -1.1675059795379639e-05, -8.223578333854675e-06, -4.772096872329712e-06, -1.3206154108047485e-06, 2.130866050720215e-06, 5.582347512245178e-06, 9.033828973770142e-06, 1.2485310435295105e-05, 1.593679189682007e-05, 1.9388273358345032e-05, 2.2839754819869995e-05, 2.629123628139496e-05, 2.9742717742919922e-05, 3.3194199204444885e-05, 3.664568066596985e-05, 4.009716212749481e-05, 4.3548643589019775e-05, 4.700012505054474e-05, 5.04516065120697e-05, 5.3903087973594666e-05, 5.735456943511963e-05, 6.080605089664459e-05, 6.425753235816956e-05, 6.770901381969452e-05, 7.116049528121948e-05, 7.461197674274445e-05, 7.806345820426941e-05, 8.151493966579437e-05, 8.496642112731934e-05, 8.84179025888443e-05, 9.186938405036926e-05, 9.532086551189423e-05, 9.877234697341919e-05, 0.00010222382843494415, 0.00010567530989646912, 0.00010912679135799408, 0.00011257827281951904, 0.000116029754281044, 0.00011948123574256897, 0.00012293271720409393, 0.0001263841986656189, 0.00012983568012714386, 0.00013328716158866882, 0.0001367386430501938, 0.00014019012451171875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 5.0, 7.0, 3.0, 3.0, 12.0, 14.0, 9.0, 14.0, 35.0, 54.0, 78.0, 136.0, 258.0, 624.0, 1845.0, 9238.0, 116835.0, 862685.0, 48946.0, 5524.0, 1281.0, 416.0, 225.0, 103.0, 76.0, 44.0, 32.0, 18.0, 13.0, 9.0, 4.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0938720703125, -0.09097099304199219, -0.08806991577148438, -0.08516883850097656, -0.08226776123046875, -0.07936668395996094, -0.07646560668945312, -0.07356452941894531, -0.0706634521484375, -0.06776237487792969, -0.06486129760742188, -0.06196022033691406, -0.05905914306640625, -0.05615806579589844, -0.053256988525390625, -0.05035591125488281, -0.047454833984375, -0.04455375671386719, -0.041652679443359375, -0.03875160217285156, -0.03585052490234375, -0.03294944763183594, -0.030048370361328125, -0.027147293090820312, -0.0242462158203125, -0.021345138549804688, -0.018444061279296875, -0.015542984008789062, -0.01264190673828125, -0.009740829467773438, -0.006839752197265625, -0.0039386749267578125, -0.00103759765625, 0.0018634796142578125, 0.004764556884765625, 0.0076656341552734375, 0.01056671142578125, 0.013467788696289062, 0.016368865966796875, 0.019269943237304688, 0.0221710205078125, 0.025072097778320312, 0.027973175048828125, 0.030874252319335938, 0.03377532958984375, 0.03667640686035156, 0.039577484130859375, 0.04247856140136719, 0.045379638671875, 0.04828071594238281, 0.051181793212890625, 0.05408287048339844, 0.05698394775390625, 0.05988502502441406, 0.06278610229492188, 0.06568717956542969, 0.0685882568359375, 0.07148933410644531, 0.07439041137695312, 0.07729148864746094, 0.08019256591796875, 0.08309364318847656, 0.08599472045898438, 0.08889579772949219, 0.091796875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 2.0, 7.0, 2.0, 7.0, 8.0, 5.0, 8.0, 19.0, 25.0, 21.0, 25.0, 39.0, 51.0, 63.0, 69.0, 85.0, 102.0, 106.0, 76.0, 73.0, 47.0, 33.0, 23.0, 21.0, 23.0, 17.0, 17.0, 12.0, 6.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013427734375, -0.013028144836425781, -0.012628555297851562, -0.012228965759277344, -0.011829376220703125, -0.011429786682128906, -0.011030197143554688, -0.010630607604980469, -0.01023101806640625, -0.009831428527832031, -0.009431838989257812, -0.009032249450683594, -0.008632659912109375, -0.008233070373535156, -0.007833480834960938, -0.007433891296386719, -0.0070343017578125, -0.006634712219238281, -0.0062351226806640625, -0.005835533142089844, -0.005435943603515625, -0.005036354064941406, -0.0046367645263671875, -0.004237174987792969, -0.00383758544921875, -0.0034379959106445312, -0.0030384063720703125, -0.0026388168334960938, -0.002239227294921875, -0.0018396377563476562, -0.0014400482177734375, -0.0010404586791992188, -0.000640869140625, -0.00024127960205078125, 0.0001583099365234375, 0.0005578994750976562, 0.000957489013671875, 0.0013570785522460938, 0.0017566680908203125, 0.0021562576293945312, 0.00255584716796875, 0.0029554367065429688, 0.0033550262451171875, 0.0037546157836914062, 0.004154205322265625, 0.004553794860839844, 0.0049533843994140625, 0.005352973937988281, 0.0057525634765625, 0.006152153015136719, 0.0065517425537109375, 0.006951332092285156, 0.007350921630859375, 0.007750511169433594, 0.008150100708007812, 0.008549690246582031, 0.00894927978515625, 0.009348869323730469, 0.009748458862304688, 0.010148048400878906, 0.010547637939453125, 0.010947227478027344, 0.011346817016601562, 0.011746406555175781, 0.01214599609375]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 6.0, 6.0, 10.0, 14.0, 33.0, 40.0, 72.0, 85.0, 141.0, 135.0, 140.0, 98.0, 76.0, 54.0, 28.0, 23.0, 7.0, 8.0, 7.0, 6.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0206398963928223, -1.9182775020599365, -1.8159152269363403, -1.7135528326034546, -1.6111905574798584, -1.5088281631469727, -1.406465768814087, -1.3041034936904907, -1.2017412185668945, -1.0993788242340088, -0.9970165491104126, -0.8946541547775269, -0.7922918796539307, -0.6899294853210449, -0.587567150592804, -0.485204815864563, -0.38284242153167725, -0.2804800868034363, -0.17811773717403412, -0.07575538754463196, 0.02660694718360901, 0.12896931171417236, 0.23133164644241333, 0.3336939811706543, 0.43605631589889526, 0.5384186506271362, 0.6407809853553772, 0.7431433200836182, 0.8455057144165039, 0.9478680491447449, 1.0502303838729858, 1.152592658996582, 1.2549550533294678, 1.3573174476623535, 1.4596797227859497, 1.5620421171188354, 1.6644043922424316, 1.7667667865753174, 1.8691291809082031, 1.9714914560317993, 2.0738537311553955, 2.1762161254882812, 2.278578519821167, 2.3809406757354736, 2.4833030700683594, 2.585665464401245, 2.688027858734131, 2.7903900146484375, 2.8927526473999023, 2.995115041732788, 3.097477436065674, 3.1998395919799805, 3.302201986312866, 3.404564380645752, 3.5069267749786377, 3.6092891693115234, 3.71165132522583, 3.814013719558716, 3.9163761138916016, 4.018738269805908, 4.121100902557373, 4.22346305847168, 4.325825214385986, 4.428187847137451, 4.530550003051758]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 7.0, 11.0, 9.0, 22.0, 28.0, 35.0, 44.0, 63.0, 78.0, 75.0, 98.0, 108.0, 94.0, 92.0, 65.0, 66.0, 46.0, 18.0, 19.0, 6.0, 10.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.344552993774414, -4.235991477966309, -4.127430438995361, -4.018868923187256, -3.9103078842163086, -3.801746368408203, -3.6931850910186768, -3.5846238136291504, -3.476062536239624, -3.3675012588500977, -3.2589399814605713, -3.150378704071045, -3.0418171882629395, -2.933256149291992, -2.8246946334838867, -2.7161333560943604, -2.607572078704834, -2.4990108013153076, -2.3904495239257812, -2.281888246536255, -2.1733269691467285, -2.064765453338623, -1.9562041759490967, -1.8476428985595703, -1.739081621170044, -1.6305203437805176, -1.5219590663909912, -1.4133976697921753, -1.304836392402649, -1.1962751150131226, -1.0877137184143066, -0.9791524410247803, -0.8705909252166748, -0.7620296478271484, -0.6534683108329773, -0.5449069738388062, -0.4363456964492798, -0.3277844190597534, -0.21922308206558228, -0.11066174507141113, -0.0021004676818847656, 0.10646083950996399, 0.21502214670181274, 0.3235834538936615, 0.43214476108551025, 0.5407060384750366, 0.6492673754692078, 0.7578287124633789, 0.8663899898529053, 0.9749512672424316, 1.083512544631958, 1.192073941230774, 1.3006352186203003, 1.4091964960098267, 1.5177578926086426, 1.626319169998169, 1.7348804473876953, 1.8434417247772217, 1.952003002166748, 2.0605642795562744, 2.169125556945801, 2.2776870727539062, 2.3862483501434326, 2.494809627532959, 2.6033709049224854]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 3.0, 10.0, 12.0, 16.0, 18.0, 28.0, 49.0, 70.0, 105.0, 171.0, 309.0, 515.0, 929.0, 1733.0, 3491.0, 7960.0, 24157.0, 131106.0, 723822.0, 116753.0, 22491.0, 7543.0, 3319.0, 1710.0, 896.0, 499.0, 317.0, 202.0, 104.0, 64.0, 46.0, 28.0, 24.0, 17.0, 13.0, 7.0, 3.0, 4.0, 3.0, 0.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.63671875, -1.5863189697265625, -1.535919189453125, -1.4855194091796875, -1.43511962890625, -1.3847198486328125, -1.334320068359375, -1.2839202880859375, -1.2335205078125, -1.1831207275390625, -1.132720947265625, -1.0823211669921875, -1.03192138671875, -0.9815216064453125, -0.931121826171875, -0.8807220458984375, -0.830322265625, -0.7799224853515625, -0.729522705078125, -0.6791229248046875, -0.62872314453125, -0.5783233642578125, -0.527923583984375, -0.4775238037109375, -0.4271240234375, -0.3767242431640625, -0.326324462890625, -0.2759246826171875, -0.22552490234375, -0.1751251220703125, -0.124725341796875, -0.0743255615234375, -0.02392578125, 0.0264739990234375, 0.076873779296875, 0.1272735595703125, 0.17767333984375, 0.2280731201171875, 0.278472900390625, 0.3288726806640625, 0.3792724609375, 0.4296722412109375, 0.480072021484375, 0.5304718017578125, 0.58087158203125, 0.6312713623046875, 0.681671142578125, 0.7320709228515625, 0.782470703125, 0.8328704833984375, 0.883270263671875, 0.9336700439453125, 0.98406982421875, 1.0344696044921875, 1.084869384765625, 1.1352691650390625, 1.1856689453125, 1.2360687255859375, 1.286468505859375, 1.3368682861328125, 1.38726806640625, 1.4376678466796875, 1.488067626953125, 1.5384674072265625, 1.5888671875]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 12.0, 11.0, 18.0, 27.0, 42.0, 54.0, 61.0, 72.0, 89.0, 85.0, 96.0, 102.0, 94.0, 78.0, 49.0, 43.0, 22.0, 14.0, 5.0, 8.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0], "bins": [-15.3359375, -15.01556396484375, -14.6951904296875, -14.37481689453125, -14.054443359375, -13.73406982421875, -13.4136962890625, -13.09332275390625, -12.77294921875, -12.45257568359375, -12.1322021484375, -11.81182861328125, -11.491455078125, -11.17108154296875, -10.8507080078125, -10.53033447265625, -10.2099609375, -9.88958740234375, -9.5692138671875, -9.24884033203125, -8.928466796875, -8.60809326171875, -8.2877197265625, -7.96734619140625, -7.64697265625, -7.32659912109375, -7.0062255859375, -6.68585205078125, -6.365478515625, -6.04510498046875, -5.7247314453125, -5.40435791015625, -5.083984375, -4.76361083984375, -4.4432373046875, -4.12286376953125, -3.802490234375, -3.48211669921875, -3.1617431640625, -2.84136962890625, -2.52099609375, -2.20062255859375, -1.8802490234375, -1.55987548828125, -1.239501953125, -0.91912841796875, -0.5987548828125, -0.27838134765625, 0.0419921875, 0.36236572265625, 0.6827392578125, 1.00311279296875, 1.323486328125, 1.64385986328125, 1.9642333984375, 2.28460693359375, 2.60498046875, 2.92535400390625, 3.2457275390625, 3.56610107421875, 3.886474609375, 4.20684814453125, 4.5272216796875, 4.84759521484375, 5.16796875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 5.0, 8.0, 8.0, 4.0, 20.0, 8.0, 7.0, 14.0, 13.0, 20.0, 23.0, 19.0, 30.0, 34.0, 37.0, 20.0, 35.0, 51.0, 56.0, 110.0, 104475.0, 943053.0, 106.0, 47.0, 39.0, 43.0, 25.0, 32.0, 39.0, 18.0, 35.0, 16.0, 10.0, 10.0, 14.0, 13.0, 12.0, 11.0, 6.0, 9.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0], "bins": [-25.65625, -24.879638671875, -24.10302734375, -23.326416015625, -22.5498046875, -21.773193359375, -20.99658203125, -20.219970703125, -19.443359375, -18.666748046875, -17.89013671875, -17.113525390625, -16.3369140625, -15.560302734375, -14.78369140625, -14.007080078125, -13.23046875, -12.453857421875, -11.67724609375, -10.900634765625, -10.1240234375, -9.347412109375, -8.57080078125, -7.794189453125, -7.017578125, -6.240966796875, -5.46435546875, -4.687744140625, -3.9111328125, -3.134521484375, -2.35791015625, -1.581298828125, -0.8046875, -0.028076171875, 0.74853515625, 1.525146484375, 2.3017578125, 3.078369140625, 3.85498046875, 4.631591796875, 5.408203125, 6.184814453125, 6.96142578125, 7.738037109375, 8.5146484375, 9.291259765625, 10.06787109375, 10.844482421875, 11.62109375, 12.397705078125, 13.17431640625, 13.950927734375, 14.7275390625, 15.504150390625, 16.28076171875, 17.057373046875, 17.833984375, 18.610595703125, 19.38720703125, 20.163818359375, 20.9404296875, 21.717041015625, 22.49365234375, 23.270263671875, 24.046875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 7.0, 8.0, 19.0, 8.0, 10.0, 13.0, 16.0, 25.0, 20.0, 10.0, 43.0, 30.0, 39.0, 33.0, 29.0, 58.0, 57.0, 47.0, 45.0, 46.0, 46.0, 49.0, 40.0, 31.0, 34.0, 34.0, 27.0, 27.0, 22.0, 15.0, 14.0, 12.0, 11.0, 12.0, 12.0, 7.0, 9.0, 8.0, 3.0, 2.0, 5.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.8359375, -5.6566162109375, -5.477294921875, -5.2979736328125, -5.11865234375, -4.9393310546875, -4.760009765625, -4.5806884765625, -4.4013671875, -4.2220458984375, -4.042724609375, -3.8634033203125, -3.68408203125, -3.5047607421875, -3.325439453125, -3.1461181640625, -2.966796875, -2.7874755859375, -2.608154296875, -2.4288330078125, -2.24951171875, -2.0701904296875, -1.890869140625, -1.7115478515625, -1.5322265625, -1.3529052734375, -1.173583984375, -0.9942626953125, -0.81494140625, -0.6356201171875, -0.456298828125, -0.2769775390625, -0.09765625, 0.0816650390625, 0.260986328125, 0.4403076171875, 0.61962890625, 0.7989501953125, 0.978271484375, 1.1575927734375, 1.3369140625, 1.5162353515625, 1.695556640625, 1.8748779296875, 2.05419921875, 2.2335205078125, 2.412841796875, 2.5921630859375, 2.771484375, 2.9508056640625, 3.130126953125, 3.3094482421875, 3.48876953125, 3.6680908203125, 3.847412109375, 4.0267333984375, 4.2060546875, 4.3853759765625, 4.564697265625, 4.7440185546875, 4.92333984375, 5.1026611328125, 5.281982421875, 5.4613037109375, 5.640625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 11.0, 8.0, 25.0, 27.0, 54.0, 90.0, 173.0, 336.0, 689.0, 1849.0, 5297.0, 19574.0, 120650.0, 845742.0, 39612.0, 9494.0, 2925.0, 1036.0, 422.0, 203.0, 109.0, 61.0, 41.0, 25.0, 22.0, 13.0, 9.0, 7.0, 3.0, 3.0, 9.0, 6.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.65283203125, -0.6343002319335938, -0.6157684326171875, -0.5972366333007812, -0.578704833984375, -0.5601730346679688, -0.5416412353515625, -0.5231094360351562, -0.50457763671875, -0.48604583740234375, -0.4675140380859375, -0.44898223876953125, -0.430450439453125, -0.41191864013671875, -0.3933868408203125, -0.37485504150390625, -0.3563232421875, -0.33779144287109375, -0.3192596435546875, -0.30072784423828125, -0.282196044921875, -0.26366424560546875, -0.2451324462890625, -0.22660064697265625, -0.20806884765625, -0.18953704833984375, -0.1710052490234375, -0.15247344970703125, -0.133941650390625, -0.11540985107421875, -0.0968780517578125, -0.07834625244140625, -0.059814453125, -0.04128265380859375, -0.0227508544921875, -0.00421905517578125, 0.014312744140625, 0.03284454345703125, 0.0513763427734375, 0.06990814208984375, 0.08843994140625, 0.10697174072265625, 0.1255035400390625, 0.14403533935546875, 0.162567138671875, 0.18109893798828125, 0.1996307373046875, 0.21816253662109375, 0.2366943359375, 0.25522613525390625, 0.2737579345703125, 0.29228973388671875, 0.310821533203125, 0.32935333251953125, 0.3478851318359375, 0.36641693115234375, 0.38494873046875, 0.40348052978515625, 0.4220123291015625, 0.44054412841796875, 0.459075927734375, 0.47760772705078125, 0.4961395263671875, 0.5146713256835938, 0.533203125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 6.0, 7.0, 2.0, 8.0, 11.0, 13.0, 25.0, 38.0, 57.0, 119.0, 368.0, 177.0, 54.0, 26.0, 16.0, 13.0, 11.0, 9.0, 7.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00010007619857788086, -9.766966104507446e-05, -9.526312351226807e-05, -9.285658597946167e-05, -9.045004844665527e-05, -8.804351091384888e-05, -8.563697338104248e-05, -8.323043584823608e-05, -8.082389831542969e-05, -7.841736078262329e-05, -7.60108232498169e-05, -7.36042857170105e-05, -7.11977481842041e-05, -6.87912106513977e-05, -6.638467311859131e-05, -6.397813558578491e-05, -6.157159805297852e-05, -5.916506052017212e-05, -5.675852298736572e-05, -5.4351985454559326e-05, -5.194544792175293e-05, -4.953891038894653e-05, -4.713237285614014e-05, -4.472583532333374e-05, -4.2319297790527344e-05, -3.991276025772095e-05, -3.750622272491455e-05, -3.5099685192108154e-05, -3.269314765930176e-05, -3.028661012649536e-05, -2.7880072593688965e-05, -2.547353506088257e-05, -2.3066997528076172e-05, -2.0660459995269775e-05, -1.825392246246338e-05, -1.5847384929656982e-05, -1.3440847396850586e-05, -1.103430986404419e-05, -8.627772331237793e-06, -6.2212347984313965e-06, -3.814697265625e-06, -1.4081597328186035e-06, 9.98377799987793e-07, 3.4049153327941895e-06, 5.811452865600586e-06, 8.217990398406982e-06, 1.0624527931213379e-05, 1.3031065464019775e-05, 1.5437602996826172e-05, 1.784414052963257e-05, 2.0250678062438965e-05, 2.265721559524536e-05, 2.5063753128051758e-05, 2.7470290660858154e-05, 2.987682819366455e-05, 3.228336572647095e-05, 3.4689903259277344e-05, 3.709644079208374e-05, 3.950297832489014e-05, 4.190951585769653e-05, 4.431605339050293e-05, 4.6722590923309326e-05, 4.912912845611572e-05, 5.153566598892212e-05, 5.3942203521728516e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 5.0, 6.0, 7.0, 16.0, 14.0, 25.0, 43.0, 52.0, 85.0, 149.0, 186.0, 365.0, 599.0, 1230.0, 2573.0, 5922.0, 17260.0, 71573.0, 830488.0, 85785.0, 19738.0, 6601.0, 2787.0, 1357.0, 668.0, 386.0, 239.0, 131.0, 92.0, 76.0, 29.0, 25.0, 17.0, 11.0, 9.0, 5.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.465087890625, -0.450347900390625, -0.43560791015625, -0.420867919921875, -0.4061279296875, -0.391387939453125, -0.37664794921875, -0.361907958984375, -0.34716796875, -0.332427978515625, -0.31768798828125, -0.302947998046875, -0.2882080078125, -0.273468017578125, -0.25872802734375, -0.243988037109375, -0.229248046875, -0.214508056640625, -0.19976806640625, -0.185028076171875, -0.1702880859375, -0.155548095703125, -0.14080810546875, -0.126068115234375, -0.111328125, -0.096588134765625, -0.08184814453125, -0.067108154296875, -0.0523681640625, -0.037628173828125, -0.02288818359375, -0.008148193359375, 0.006591796875, 0.021331787109375, 0.03607177734375, 0.050811767578125, 0.0655517578125, 0.080291748046875, 0.09503173828125, 0.109771728515625, 0.12451171875, 0.139251708984375, 0.15399169921875, 0.168731689453125, 0.1834716796875, 0.198211669921875, 0.21295166015625, 0.227691650390625, 0.242431640625, 0.257171630859375, 0.27191162109375, 0.286651611328125, 0.3013916015625, 0.316131591796875, 0.33087158203125, 0.345611572265625, 0.3603515625, 0.375091552734375, 0.38983154296875, 0.404571533203125, 0.4193115234375, 0.434051513671875, 0.44879150390625, 0.463531494140625, 0.478271484375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 6.0, 4.0, 2.0, 10.0, 5.0, 11.0, 14.0, 17.0, 14.0, 30.0, 34.0, 51.0, 95.0, 381.0, 125.0, 39.0, 25.0, 30.0, 24.0, 13.0, 9.0, 10.0, 8.0, 7.0, 4.0, 5.0, 2.0, 4.0, 1.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.164306640625, -0.15955352783203125, -0.1548004150390625, -0.15004730224609375, -0.145294189453125, -0.14054107666015625, -0.1357879638671875, -0.13103485107421875, -0.12628173828125, -0.12152862548828125, -0.1167755126953125, -0.11202239990234375, -0.107269287109375, -0.10251617431640625, -0.0977630615234375, -0.09300994873046875, -0.0882568359375, -0.08350372314453125, -0.0787506103515625, -0.07399749755859375, -0.069244384765625, -0.06449127197265625, -0.0597381591796875, -0.05498504638671875, -0.05023193359375, -0.04547882080078125, -0.0407257080078125, -0.03597259521484375, -0.031219482421875, -0.02646636962890625, -0.0217132568359375, -0.01696014404296875, -0.01220703125, -0.00745391845703125, -0.0027008056640625, 0.00205230712890625, 0.006805419921875, 0.01155853271484375, 0.0163116455078125, 0.02106475830078125, 0.02581787109375, 0.03057098388671875, 0.0353240966796875, 0.04007720947265625, 0.044830322265625, 0.04958343505859375, 0.0543365478515625, 0.05908966064453125, 0.0638427734375, 0.06859588623046875, 0.0733489990234375, 0.07810211181640625, 0.082855224609375, 0.08760833740234375, 0.0923614501953125, 0.09711456298828125, 0.10186767578125, 0.10662078857421875, 0.1113739013671875, 0.11612701416015625, 0.120880126953125, 0.12563323974609375, 0.1303863525390625, 0.13513946533203125, 0.139892578125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 6.0, 10.0, 15.0, 32.0, 31.0, 76.0, 74.0, 127.0, 138.0, 157.0, 110.0, 85.0, 45.0, 30.0, 24.0, 9.0, 8.0, 4.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6269640922546387, -3.4230399131774902, -3.219115734100342, -3.0151915550231934, -2.811267375946045, -2.6073431968688965, -2.403418779373169, -2.1994946002960205, -1.995570421218872, -1.7916462421417236, -1.5877220630645752, -1.3837977647781372, -1.1798735857009888, -0.9759494066238403, -0.7720251083374023, -0.5681009292602539, -0.36417675018310547, -0.16025254130363464, 0.04367166757583618, 0.2475959062576294, 0.45152008533477783, 0.6554442644119263, 0.8593685626983643, 1.0632927417755127, 1.2672169208526611, 1.4711410999298096, 1.675065279006958, 1.878989577293396, 2.082913875579834, 2.2868380546569824, 2.490762233734131, 2.6946864128112793, 2.898611068725586, 3.1025352478027344, 3.306459426879883, 3.5103836059570312, 3.7143077850341797, 3.918231964111328, 4.122156143188477, 4.326080322265625, 4.530004501342773, 4.733928680419922, 4.93785285949707, 5.141777038574219, 5.345701217651367, 5.549625396728516, 5.753549575805664, 5.9574737548828125, 6.161398410797119, 6.365322589874268, 6.569246768951416, 6.7731709480285645, 6.977095127105713, 7.181019306182861, 7.384943962097168, 7.588868141174316, 7.792792320251465, 7.996716499328613, 8.200640678405762, 8.40456485748291, 8.608489036560059, 8.812413215637207, 9.016337394714355, 9.220261573791504, 9.424185752868652]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 6.0, 2.0, 6.0, 12.0, 13.0, 11.0, 12.0, 14.0, 21.0, 27.0, 28.0, 38.0, 31.0, 38.0, 34.0, 50.0, 45.0, 45.0, 49.0, 51.0, 38.0, 52.0, 35.0, 42.0, 53.0, 37.0, 38.0, 26.0, 20.0, 26.0, 15.0, 23.0, 12.0, 13.0, 13.0, 11.0, 5.0, 4.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-9.5520601272583, -9.278101921081543, -9.004143714904785, -8.730185508728027, -8.45622730255127, -8.182269096374512, -7.908311367034912, -7.634353160858154, -7.3603949546813965, -7.086436748504639, -6.812478542327881, -6.538520336151123, -6.264562606811523, -5.990604400634766, -5.716646194458008, -5.44268798828125, -5.168729782104492, -4.894771575927734, -4.620813369750977, -4.346855163574219, -4.072896957397461, -3.7989389896392822, -3.5249810218811035, -3.2510228157043457, -2.977064609527588, -2.70310640335083, -2.4291481971740723, -2.1551902294158936, -1.8812320232391357, -1.607273817062378, -1.3333157300949097, -1.0593576431274414, -0.7853999137878418, -0.5114417672157288, -0.23748362064361572, 0.036474525928497314, 0.31043267250061035, 0.5843908786773682, 0.8583489656448364, 1.1323070526123047, 1.4062652587890625, 1.6802234649658203, 1.9541815519332886, 2.228139638900757, 2.5020978450775146, 2.7760560512542725, 3.050014019012451, 3.323972225189209, 3.597930431365967, 3.8718886375427246, 4.145846843719482, 4.41980504989624, 4.69376277923584, 4.967720985412598, 5.2416791915893555, 5.515637397766113, 5.789595603942871, 6.063553810119629, 6.337512016296387, 6.6114702224731445, 6.885428428649902, 7.15938663482666, 7.43334436416626, 7.707302570343018, 7.981260776519775]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 4.0, 8.0, 7.0, 8.0, 12.0, 26.0, 34.0, 52.0, 104.0, 144.0, 247.0, 496.0, 1125.0, 3082.0, 12059.0, 110948.0, 3344952.0, 672180.0, 36260.0, 8034.0, 2798.0, 989.0, 345.0, 136.0, 82.0, 56.0, 40.0, 13.0, 13.0, 7.0, 9.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2734375, -7.075439453125, -6.87744140625, -6.679443359375, -6.4814453125, -6.283447265625, -6.08544921875, -5.887451171875, -5.689453125, -5.491455078125, -5.29345703125, -5.095458984375, -4.8974609375, -4.699462890625, -4.50146484375, -4.303466796875, -4.10546875, -3.907470703125, -3.70947265625, -3.511474609375, -3.3134765625, -3.115478515625, -2.91748046875, -2.719482421875, -2.521484375, -2.323486328125, -2.12548828125, -1.927490234375, -1.7294921875, -1.531494140625, -1.33349609375, -1.135498046875, -0.9375, -0.739501953125, -0.54150390625, -0.343505859375, -0.1455078125, 0.052490234375, 0.25048828125, 0.448486328125, 0.646484375, 0.844482421875, 1.04248046875, 1.240478515625, 1.4384765625, 1.636474609375, 1.83447265625, 2.032470703125, 2.23046875, 2.428466796875, 2.62646484375, 2.824462890625, 3.0224609375, 3.220458984375, 3.41845703125, 3.616455078125, 3.814453125, 4.012451171875, 4.21044921875, 4.408447265625, 4.6064453125, 4.804443359375, 5.00244140625, 5.200439453125, 5.3984375]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 7.0, 4.0, 5.0, 12.0, 17.0, 29.0, 47.0, 68.0, 81.0, 99.0, 124.0, 117.0, 106.0, 95.0, 64.0, 44.0, 38.0, 21.0, 15.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.4140625, -6.271392822265625, -6.12872314453125, -5.986053466796875, -5.8433837890625, -5.700714111328125, -5.55804443359375, -5.415374755859375, -5.272705078125, -5.130035400390625, -4.98736572265625, -4.844696044921875, -4.7020263671875, -4.559356689453125, -4.41668701171875, -4.274017333984375, -4.13134765625, -3.988677978515625, -3.84600830078125, -3.703338623046875, -3.5606689453125, -3.417999267578125, -3.27532958984375, -3.132659912109375, -2.989990234375, -2.847320556640625, -2.70465087890625, -2.561981201171875, -2.4193115234375, -2.276641845703125, -2.13397216796875, -1.991302490234375, -1.8486328125, -1.705963134765625, -1.56329345703125, -1.420623779296875, -1.2779541015625, -1.135284423828125, -0.99261474609375, -0.849945068359375, -0.707275390625, -0.564605712890625, -0.42193603515625, -0.279266357421875, -0.1365966796875, 0.006072998046875, 0.14874267578125, 0.291412353515625, 0.43408203125, 0.576751708984375, 0.71942138671875, 0.862091064453125, 1.0047607421875, 1.147430419921875, 1.29010009765625, 1.432769775390625, 1.575439453125, 1.718109130859375, 1.86077880859375, 2.003448486328125, 2.1461181640625, 2.288787841796875, 2.43145751953125, 2.574127197265625, 2.716796875]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 8.0, 7.0, 13.0, 25.0, 33.0, 61.0, 137.0, 363.0, 1495.0, 15007.0, 3753017.0, 415592.0, 7005.0, 977.0, 272.0, 130.0, 39.0, 42.0, 17.0, 7.0, 7.0, 6.0, 7.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.34375, -8.0211181640625, -7.698486328125, -7.3758544921875, -7.05322265625, -6.7305908203125, -6.407958984375, -6.0853271484375, -5.7626953125, -5.4400634765625, -5.117431640625, -4.7947998046875, -4.47216796875, -4.1495361328125, -3.826904296875, -3.5042724609375, -3.181640625, -2.8590087890625, -2.536376953125, -2.2137451171875, -1.89111328125, -1.5684814453125, -1.245849609375, -0.9232177734375, -0.6005859375, -0.2779541015625, 0.044677734375, 0.3673095703125, 0.68994140625, 1.0125732421875, 1.335205078125, 1.6578369140625, 1.98046875, 2.3031005859375, 2.625732421875, 2.9483642578125, 3.27099609375, 3.5936279296875, 3.916259765625, 4.2388916015625, 4.5615234375, 4.8841552734375, 5.206787109375, 5.5294189453125, 5.85205078125, 6.1746826171875, 6.497314453125, 6.8199462890625, 7.142578125, 7.4652099609375, 7.787841796875, 8.1104736328125, 8.43310546875, 8.7557373046875, 9.078369140625, 9.4010009765625, 9.7236328125, 10.0462646484375, 10.368896484375, 10.6915283203125, 11.01416015625, 11.3367919921875, 11.659423828125, 11.9820556640625, 12.3046875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 12.0, 4.0, 20.0, 17.0, 46.0, 50.0, 102.0, 185.0, 517.0, 1157.0, 1083.0, 436.0, 204.0, 86.0, 55.0, 29.0, 21.0, 22.0, 11.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.150390625, -2.0951995849609375, -2.040008544921875, -1.9848175048828125, -1.92962646484375, -1.8744354248046875, -1.819244384765625, -1.7640533447265625, -1.7088623046875, -1.6536712646484375, -1.598480224609375, -1.5432891845703125, -1.48809814453125, -1.4329071044921875, -1.377716064453125, -1.3225250244140625, -1.267333984375, -1.2121429443359375, -1.156951904296875, -1.1017608642578125, -1.04656982421875, -0.9913787841796875, -0.936187744140625, -0.8809967041015625, -0.8258056640625, -0.7706146240234375, -0.715423583984375, -0.6602325439453125, -0.60504150390625, -0.5498504638671875, -0.494659423828125, -0.4394683837890625, -0.38427734375, -0.3290863037109375, -0.273895263671875, -0.2187042236328125, -0.16351318359375, -0.1083221435546875, -0.053131103515625, 0.0020599365234375, 0.0572509765625, 0.1124420166015625, 0.167633056640625, 0.2228240966796875, 0.27801513671875, 0.3332061767578125, 0.388397216796875, 0.4435882568359375, 0.498779296875, 0.5539703369140625, 0.609161376953125, 0.6643524169921875, 0.71954345703125, 0.7747344970703125, 0.829925537109375, 0.8851165771484375, 0.9403076171875, 0.9954986572265625, 1.050689697265625, 1.1058807373046875, 1.16107177734375, 1.2162628173828125, 1.271453857421875, 1.3266448974609375, 1.3818359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 12.0, 10.0, 12.0, 13.0, 29.0, 52.0, 77.0, 121.0, 140.0, 152.0, 127.0, 93.0, 57.0, 31.0, 26.0, 12.0, 11.0, 7.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0614495277404785, -4.900074005126953, -4.738698959350586, -4.577323913574219, -4.415948390960693, -4.254572868347168, -4.093197822570801, -3.9318225383758545, -3.770447254180908, -3.609071969985962, -3.4476966857910156, -3.2863214015960693, -3.124946117401123, -2.9635708332061768, -2.8021955490112305, -2.640820264816284, -2.479444980621338, -2.3180696964263916, -2.1566944122314453, -1.995319128036499, -1.8339438438415527, -1.6725685596466064, -1.5111932754516602, -1.3498179912567139, -1.1884427070617676, -1.0270674228668213, -0.865692138671875, -0.7043168544769287, -0.5429415702819824, -0.38156628608703613, -0.22019100189208984, -0.058815717697143555, 0.10255908966064453, 0.2639343738555908, 0.4253096580505371, 0.5866849422454834, 0.7480602264404297, 0.909435510635376, 1.0708107948303223, 1.2321860790252686, 1.3935613632202148, 1.5549366474151611, 1.7163119316101074, 1.8776872158050537, 2.0390625, 2.2004377841949463, 2.3618130683898926, 2.523188352584839, 2.684563636779785, 2.8459389209747314, 3.0073142051696777, 3.168689489364624, 3.3300647735595703, 3.4914400577545166, 3.652815341949463, 3.814190626144409, 3.9755659103393555, 4.136940956115723, 4.298316478729248, 4.459692001342773, 4.621067047119141, 4.782442092895508, 4.943817615509033, 5.105193138122559, 5.266568183898926]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 6.0, 6.0, 7.0, 8.0, 16.0, 28.0, 26.0, 42.0, 40.0, 53.0, 75.0, 67.0, 97.0, 91.0, 82.0, 71.0, 63.0, 66.0, 40.0, 34.0, 25.0, 16.0, 9.0, 18.0, 4.0, 8.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.354079723358154, -4.232902526855469, -4.111725330352783, -3.9905481338500977, -3.869370698928833, -3.7481935024261475, -3.627016305923462, -3.5058391094207764, -3.3846616744995117, -3.263484477996826, -3.1423072814941406, -3.021130084991455, -2.8999526500701904, -2.778775453567505, -2.6575982570648193, -2.536421060562134, -2.4152438640594482, -2.2940666675567627, -2.172889471054077, -2.0517120361328125, -1.930534839630127, -1.8093576431274414, -1.6881804466247559, -1.5670032501220703, -1.4458259344100952, -1.3246487379074097, -1.2034714221954346, -1.082294225692749, -0.9611169695854187, -0.8399397134780884, -0.7187625169754028, -0.5975852608680725, -0.4764077663421631, -0.35523051023483276, -0.23405328392982483, -0.1128760576248169, 0.008301198482513428, 0.12947845458984375, 0.2506556510925293, 0.3718329071998596, 0.49301016330718994, 0.6141874194145203, 0.7353646755218506, 0.8565418720245361, 0.9777191281318665, 1.0988963842391968, 1.2200735807418823, 1.3412508964538574, 1.462428092956543, 1.5836052894592285, 1.7047826051712036, 1.8259598016738892, 1.9471371173858643, 2.06831431388855, 2.1894915103912354, 2.310668706893921, 2.4318461418151855, 2.553023338317871, 2.6742005348205566, 2.795377731323242, 2.916555166244507, 3.0377323627471924, 3.158909559249878, 3.2800867557525635, 3.401263952255249]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 7.0, 8.0, 13.0, 14.0, 20.0, 21.0, 32.0, 64.0, 120.0, 252.0, 494.0, 1272.0, 4426.0, 39303.0, 906256.0, 86923.0, 6422.0, 1652.0, 640.0, 298.0, 127.0, 68.0, 41.0, 26.0, 21.0, 10.0, 8.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.216796875, -1.181640625, -1.146484375, -1.111328125, -1.076171875, -1.041015625, -1.005859375, -0.970703125, -0.935546875, -0.900390625, -0.865234375, -0.830078125, -0.794921875, -0.759765625, -0.724609375, -0.689453125, -0.654296875, -0.619140625, -0.583984375, -0.548828125, -0.513671875, -0.478515625, -0.443359375, -0.408203125, -0.373046875, -0.337890625, -0.302734375, -0.267578125, -0.232421875, -0.197265625, -0.162109375, -0.126953125, -0.091796875, -0.056640625, -0.021484375, 0.013671875, 0.048828125, 0.083984375, 0.119140625, 0.154296875, 0.189453125, 0.224609375, 0.259765625, 0.294921875, 0.330078125, 0.365234375, 0.400390625, 0.435546875, 0.470703125, 0.505859375, 0.541015625, 0.576171875, 0.611328125, 0.646484375, 0.681640625, 0.716796875, 0.751953125, 0.787109375, 0.822265625, 0.857421875, 0.892578125, 0.927734375, 0.962890625, 0.998046875, 1.033203125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 3.0, 8.0, 6.0, 10.0, 11.0, 37.0, 46.0, 45.0, 79.0, 92.0, 103.0, 104.0, 105.0, 93.0, 83.0, 54.0, 37.0, 26.0, 18.0, 15.0, 5.0, 10.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.13671875, -3.048065185546875, -2.95941162109375, -2.870758056640625, -2.7821044921875, -2.693450927734375, -2.60479736328125, -2.516143798828125, -2.427490234375, -2.338836669921875, -2.25018310546875, -2.161529541015625, -2.0728759765625, -1.984222412109375, -1.89556884765625, -1.806915283203125, -1.71826171875, -1.629608154296875, -1.54095458984375, -1.452301025390625, -1.3636474609375, -1.274993896484375, -1.18634033203125, -1.097686767578125, -1.009033203125, -0.920379638671875, -0.83172607421875, -0.743072509765625, -0.6544189453125, -0.565765380859375, -0.47711181640625, -0.388458251953125, -0.2998046875, -0.211151123046875, -0.12249755859375, -0.033843994140625, 0.0548095703125, 0.143463134765625, 0.23211669921875, 0.320770263671875, 0.409423828125, 0.498077392578125, 0.58673095703125, 0.675384521484375, 0.7640380859375, 0.852691650390625, 0.94134521484375, 1.029998779296875, 1.11865234375, 1.207305908203125, 1.29595947265625, 1.384613037109375, 1.4732666015625, 1.561920166015625, 1.65057373046875, 1.739227294921875, 1.827880859375, 1.916534423828125, 2.00518798828125, 2.093841552734375, 2.1824951171875, 2.271148681640625, 2.35980224609375, 2.448455810546875, 2.537109375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 4.0, 8.0, 3.0, 14.0, 15.0, 29.0, 41.0, 71.0, 82.0, 119.0, 193.0, 315.0, 523.0, 905.0, 1527.0, 2806.0, 5403.0, 10084.0, 20093.0, 40904.0, 84489.0, 176864.0, 286449.0, 212274.0, 104347.0, 49753.0, 24756.0, 12391.0, 6444.0, 3366.0, 1815.0, 963.0, 575.0, 345.0, 231.0, 113.0, 88.0, 58.0, 31.0, 28.0, 13.0, 9.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1519775390625, -0.14783000946044922, -0.14368247985839844, -0.13953495025634766, -0.13538742065429688, -0.1312398910522461, -0.1270923614501953, -0.12294483184814453, -0.11879730224609375, -0.11464977264404297, -0.11050224304199219, -0.1063547134399414, -0.10220718383789062, -0.09805965423583984, -0.09391212463378906, -0.08976459503173828, -0.0856170654296875, -0.08146953582763672, -0.07732200622558594, -0.07317447662353516, -0.06902694702148438, -0.0648794174194336, -0.06073188781738281, -0.05658435821533203, -0.05243682861328125, -0.04828929901123047, -0.04414176940917969, -0.039994239807128906, -0.035846710205078125, -0.031699180603027344, -0.027551651000976562, -0.02340412139892578, -0.019256591796875, -0.015109062194824219, -0.010961532592773438, -0.006814002990722656, -0.002666473388671875, 0.0014810562133789062, 0.0056285858154296875, 0.009776115417480469, 0.01392364501953125, 0.01807117462158203, 0.022218704223632812, 0.026366233825683594, 0.030513763427734375, 0.034661293029785156, 0.03880882263183594, 0.04295635223388672, 0.0471038818359375, 0.05125141143798828, 0.05539894104003906, 0.059546470642089844, 0.06369400024414062, 0.0678415298461914, 0.07198905944824219, 0.07613658905029297, 0.08028411865234375, 0.08443164825439453, 0.08857917785644531, 0.0927267074584961, 0.09687423706054688, 0.10102176666259766, 0.10516929626464844, 0.10931682586669922, 0.11346435546875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 6.0, 3.0, 12.0, 7.0, 9.0, 12.0, 14.0, 18.0, 20.0, 20.0, 31.0, 27.0, 31.0, 41.0, 57.0, 56.0, 56.0, 59.0, 53.0, 58.0, 49.0, 49.0, 39.0, 57.0, 34.0, 30.0, 31.0, 26.0, 28.0, 23.0, 11.0, 12.0, 7.0, 9.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.232421875, -3.143707275390625, -3.05499267578125, -2.966278076171875, -2.8775634765625, -2.788848876953125, -2.70013427734375, -2.611419677734375, -2.522705078125, -2.433990478515625, -2.34527587890625, -2.256561279296875, -2.1678466796875, -2.079132080078125, -1.99041748046875, -1.901702880859375, -1.81298828125, -1.724273681640625, -1.63555908203125, -1.546844482421875, -1.4581298828125, -1.369415283203125, -1.28070068359375, -1.191986083984375, -1.103271484375, -1.014556884765625, -0.92584228515625, -0.837127685546875, -0.7484130859375, -0.659698486328125, -0.57098388671875, -0.482269287109375, -0.3935546875, -0.304840087890625, -0.21612548828125, -0.127410888671875, -0.0386962890625, 0.050018310546875, 0.13873291015625, 0.227447509765625, 0.316162109375, 0.404876708984375, 0.49359130859375, 0.582305908203125, 0.6710205078125, 0.759735107421875, 0.84844970703125, 0.937164306640625, 1.02587890625, 1.114593505859375, 1.20330810546875, 1.292022705078125, 1.3807373046875, 1.469451904296875, 1.55816650390625, 1.646881103515625, 1.735595703125, 1.824310302734375, 1.91302490234375, 2.001739501953125, 2.0904541015625, 2.179168701171875, 2.26788330078125, 2.356597900390625, 2.4453125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 10.0, 2.0, 9.0, 14.0, 22.0, 37.0, 47.0, 76.0, 127.0, 197.0, 342.0, 635.0, 1223.0, 2749.0, 7263.0, 25923.0, 150769.0, 684681.0, 138051.0, 24011.0, 7052.0, 2596.0, 1229.0, 599.0, 349.0, 213.0, 112.0, 58.0, 52.0, 27.0, 25.0, 16.0, 9.0, 11.0, 6.0, 3.0, 8.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047882080078125, -0.04636096954345703, -0.04483985900878906, -0.043318748474121094, -0.041797637939453125, -0.040276527404785156, -0.03875541687011719, -0.03723430633544922, -0.03571319580078125, -0.03419208526611328, -0.03267097473144531, -0.031149864196777344, -0.029628753662109375, -0.028107643127441406, -0.026586532592773438, -0.02506542205810547, -0.0235443115234375, -0.02202320098876953, -0.020502090454101562, -0.018980979919433594, -0.017459869384765625, -0.015938758850097656, -0.014417648315429688, -0.012896537780761719, -0.01137542724609375, -0.009854316711425781, -0.008333206176757812, -0.006812095642089844, -0.005290985107421875, -0.0037698745727539062, -0.0022487640380859375, -0.0007276535034179688, 0.00079345703125, 0.0023145675659179688, 0.0038356781005859375, 0.005356788635253906, 0.006877899169921875, 0.008399009704589844, 0.009920120239257812, 0.011441230773925781, 0.01296234130859375, 0.014483451843261719, 0.016004562377929688, 0.017525672912597656, 0.019046783447265625, 0.020567893981933594, 0.022089004516601562, 0.02361011505126953, 0.0251312255859375, 0.02665233612060547, 0.028173446655273438, 0.029694557189941406, 0.031215667724609375, 0.032736778259277344, 0.03425788879394531, 0.03577899932861328, 0.03730010986328125, 0.03882122039794922, 0.04034233093261719, 0.041863441467285156, 0.043384552001953125, 0.044905662536621094, 0.04642677307128906, 0.04794788360595703, 0.049468994140625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 10.0, 7.0, 11.0, 14.0, 35.0, 37.0, 50.0, 58.0, 67.0, 98.0, 110.0, 106.0, 87.0, 80.0, 54.0, 38.0, 27.0, 28.0, 10.0, 23.0, 21.0, 6.0, 10.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.175041198730469e-05, -6.00302591919899e-05, -5.831010639667511e-05, -5.658995360136032e-05, -5.486980080604553e-05, -5.3149648010730743e-05, -5.1429495215415955e-05, -4.9709342420101166e-05, -4.798918962478638e-05, -4.626903682947159e-05, -4.45488840341568e-05, -4.282873123884201e-05, -4.110857844352722e-05, -3.938842564821243e-05, -3.7668272852897644e-05, -3.5948120057582855e-05, -3.4227967262268066e-05, -3.250781446695328e-05, -3.078766167163849e-05, -2.90675088763237e-05, -2.734735608100891e-05, -2.5627203285694122e-05, -2.3907050490379333e-05, -2.2186897695064545e-05, -2.0466744899749756e-05, -1.8746592104434967e-05, -1.7026439309120178e-05, -1.530628651380539e-05, -1.35861337184906e-05, -1.1865980923175812e-05, -1.0145828127861023e-05, -8.425675332546234e-06, -6.705522537231445e-06, -4.9853697419166565e-06, -3.2652169466018677e-06, -1.5450641512870789e-06, 1.7508864402770996e-07, 1.8952414393424988e-06, 3.6153942346572876e-06, 5.335547029972076e-06, 7.055699825286865e-06, 8.775852620601654e-06, 1.0496005415916443e-05, 1.2216158211231232e-05, 1.393631100654602e-05, 1.565646380186081e-05, 1.7376616597175598e-05, 1.9096769392490387e-05, 2.0816922187805176e-05, 2.2537074983119965e-05, 2.4257227778434753e-05, 2.5977380573749542e-05, 2.769753336906433e-05, 2.941768616437912e-05, 3.113783895969391e-05, 3.28579917550087e-05, 3.4578144550323486e-05, 3.6298297345638275e-05, 3.8018450140953064e-05, 3.973860293626785e-05, 4.145875573158264e-05, 4.317890852689743e-05, 4.489906132221222e-05, 4.661921411752701e-05, 4.83393669128418e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 3.0, 8.0, 6.0, 9.0, 6.0, 17.0, 18.0, 43.0, 49.0, 83.0, 143.0, 348.0, 836.0, 2535.0, 8317.0, 40530.0, 586547.0, 368459.0, 30316.0, 6737.0, 2091.0, 754.0, 319.0, 140.0, 75.0, 47.0, 28.0, 13.0, 16.0, 14.0, 8.0, 9.0, 2.0, 7.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06396484375, -0.061753273010253906, -0.05954170227050781, -0.05733013153076172, -0.055118560791015625, -0.05290699005126953, -0.05069541931152344, -0.048483848571777344, -0.04627227783203125, -0.044060707092285156, -0.04184913635253906, -0.03963756561279297, -0.037425994873046875, -0.03521442413330078, -0.03300285339355469, -0.030791282653808594, -0.0285797119140625, -0.026368141174316406, -0.024156570434570312, -0.02194499969482422, -0.019733428955078125, -0.01752185821533203, -0.015310287475585938, -0.013098716735839844, -0.01088714599609375, -0.008675575256347656, -0.0064640045166015625, -0.004252433776855469, -0.002040863037109375, 0.00017070770263671875, 0.0023822784423828125, 0.004593849182128906, 0.006805419921875, 0.009016990661621094, 0.011228561401367188, 0.013440132141113281, 0.015651702880859375, 0.01786327362060547, 0.020074844360351562, 0.022286415100097656, 0.02449798583984375, 0.026709556579589844, 0.028921127319335938, 0.03113269805908203, 0.033344268798828125, 0.03555583953857422, 0.03776741027832031, 0.039978981018066406, 0.0421905517578125, 0.044402122497558594, 0.04661369323730469, 0.04882526397705078, 0.051036834716796875, 0.05324840545654297, 0.05545997619628906, 0.057671546936035156, 0.05988311767578125, 0.062094688415527344, 0.06430625915527344, 0.06651782989501953, 0.06872940063476562, 0.07094097137451172, 0.07315254211425781, 0.0753641128540039, 0.07757568359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 7.0, 5.0, 10.0, 6.0, 14.0, 15.0, 18.0, 37.0, 65.0, 81.0, 123.0, 146.0, 141.0, 98.0, 66.0, 40.0, 31.0, 18.0, 19.0, 11.0, 8.0, 9.0, 3.0, 2.0, 2.0, 1.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01641845703125, -0.015947580337524414, -0.015476703643798828, -0.015005826950073242, -0.014534950256347656, -0.01406407356262207, -0.013593196868896484, -0.013122320175170898, -0.012651443481445312, -0.012180566787719727, -0.01170969009399414, -0.011238813400268555, -0.010767936706542969, -0.010297060012817383, -0.009826183319091797, -0.009355306625366211, -0.008884429931640625, -0.008413553237915039, -0.007942676544189453, -0.007471799850463867, -0.007000923156738281, -0.006530046463012695, -0.006059169769287109, -0.0055882930755615234, -0.0051174163818359375, -0.0046465396881103516, -0.004175662994384766, -0.0037047863006591797, -0.0032339096069335938, -0.002763032913208008, -0.002292156219482422, -0.001821279525756836, -0.00135040283203125, -0.0008795261383056641, -0.0004086494445800781, 6.222724914550781e-05, 0.0005331039428710938, 0.0010039806365966797, 0.0014748573303222656, 0.0019457340240478516, 0.0024166107177734375, 0.0028874874114990234, 0.0033583641052246094, 0.0038292407989501953, 0.004300117492675781, 0.004770994186401367, 0.005241870880126953, 0.005712747573852539, 0.006183624267578125, 0.006654500961303711, 0.007125377655029297, 0.007596254348754883, 0.008067131042480469, 0.008538007736206055, 0.00900888442993164, 0.009479761123657227, 0.009950637817382812, 0.010421514511108398, 0.010892391204833984, 0.01136326789855957, 0.011834144592285156, 0.012305021286010742, 0.012775897979736328, 0.013246774673461914, 0.0137176513671875]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 9.0, 16.0, 7.0, 14.0, 22.0, 36.0, 68.0, 102.0, 114.0, 147.0, 146.0, 114.0, 73.0, 32.0, 35.0, 14.0, 12.0, 8.0, 9.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9591652154922485, -1.8732901811599731, -1.7874151468276978, -1.7015401124954224, -1.615665078163147, -1.5297900438308716, -1.4439151287078857, -1.3580400943756104, -1.272165060043335, -1.1862900257110596, -1.1004149913787842, -1.0145399570465088, -0.9286649227142334, -0.842789888381958, -0.7569149136543274, -0.671039879322052, -0.5851647853851318, -0.49928975105285645, -0.41341471672058105, -0.32753971219062805, -0.24166467785835266, -0.15578964352607727, -0.06991463899612427, 0.015960395336151123, 0.10183542966842651, 0.1877104640007019, 0.2735854983329773, 0.3594605028629303, 0.4453355371952057, 0.5312105417251587, 0.6170855760574341, 0.7029606103897095, 0.7888355255126953, 0.8747105598449707, 0.9605855941772461, 1.0464606285095215, 1.1323356628417969, 1.2182106971740723, 1.3040857315063477, 1.389960765838623, 1.4758358001708984, 1.5617108345031738, 1.6475858688354492, 1.7334609031677246, 1.8193359375, 1.9052109718322754, 1.9910860061645508, 2.076961040496826, 2.1628360748291016, 2.248711109161377, 2.3345861434936523, 2.4204611778259277, 2.506336212158203, 2.5922112464904785, 2.678086280822754, 2.7639613151550293, 2.8498361110687256, 2.935711145401001, 3.0215861797332764, 3.1074612140655518, 3.193336248397827, 3.2792112827301025, 3.365086317062378, 3.4509613513946533, 3.5368363857269287]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 5.0, 4.0, 5.0, 9.0, 6.0, 14.0, 22.0, 29.0, 47.0, 52.0, 69.0, 83.0, 101.0, 107.0, 98.0, 76.0, 91.0, 57.0, 43.0, 24.0, 20.0, 15.0, 13.0, 6.0, 5.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7695186138153076, -2.689101219177246, -2.6086840629577637, -2.5282669067382812, -2.4478495121002197, -2.367432117462158, -2.287014961242676, -2.2065978050231934, -2.126180410385132, -2.0457630157470703, -1.965345859527588, -1.884928584098816, -1.804511308670044, -1.724094033241272, -1.6436767578125, -1.563259482383728, -1.482842206954956, -1.402424931526184, -1.322007656097412, -1.2415903806686401, -1.1611731052398682, -1.0807558298110962, -1.0003385543823242, -0.9199212789535522, -0.8395040035247803, -0.7590867280960083, -0.6786694526672363, -0.5982521772384644, -0.5178349018096924, -0.4374176263809204, -0.35700035095214844, -0.27658307552337646, -0.1961655616760254, -0.11574828624725342, -0.035331010818481445, 0.04508626461029053, 0.1255035400390625, 0.20592081546783447, 0.28633809089660645, 0.3667553663253784, 0.4471726417541504, 0.5275899171829224, 0.6080071926116943, 0.6884244680404663, 0.7688417434692383, 0.8492590188980103, 0.9296762943267822, 1.0100935697555542, 1.0905108451843262, 1.1709281206130981, 1.2513453960418701, 1.331762671470642, 1.412179946899414, 1.492597222328186, 1.573014497756958, 1.65343177318573, 1.733849048614502, 1.814266324043274, 1.894683599472046, 1.9751008749008179, 2.05551815032959, 2.1359353065490723, 2.216352701187134, 2.2967700958251953, 2.3771872520446777]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 8.0, 8.0, 7.0, 13.0, 18.0, 28.0, 39.0, 44.0, 86.0, 162.0, 229.0, 380.0, 836.0, 1866.0, 4264.0, 11001.0, 40893.0, 421402.0, 501071.0, 45643.0, 12014.0, 4599.0, 1937.0, 894.0, 450.0, 251.0, 162.0, 85.0, 47.0, 36.0, 20.0, 24.0, 8.0, 9.0, 5.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.919921875, -1.8635101318359375, -1.807098388671875, -1.7506866455078125, -1.69427490234375, -1.6378631591796875, -1.581451416015625, -1.5250396728515625, -1.4686279296875, -1.4122161865234375, -1.355804443359375, -1.2993927001953125, -1.24298095703125, -1.1865692138671875, -1.130157470703125, -1.0737457275390625, -1.017333984375, -0.9609222412109375, -0.904510498046875, -0.8480987548828125, -0.79168701171875, -0.7352752685546875, -0.678863525390625, -0.6224517822265625, -0.5660400390625, -0.5096282958984375, -0.453216552734375, -0.3968048095703125, -0.34039306640625, -0.2839813232421875, -0.227569580078125, -0.1711578369140625, -0.11474609375, -0.0583343505859375, -0.001922607421875, 0.0544891357421875, 0.11090087890625, 0.1673126220703125, 0.223724365234375, 0.2801361083984375, 0.3365478515625, 0.3929595947265625, 0.449371337890625, 0.5057830810546875, 0.56219482421875, 0.6186065673828125, 0.675018310546875, 0.7314300537109375, 0.787841796875, 0.8442535400390625, 0.900665283203125, 0.9570770263671875, 1.01348876953125, 1.0699005126953125, 1.126312255859375, 1.1827239990234375, 1.2391357421875, 1.2955474853515625, 1.351959228515625, 1.4083709716796875, 1.46478271484375, 1.5211944580078125, 1.577606201171875, 1.6340179443359375, 1.6904296875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 6.0, 8.0, 12.0, 18.0, 25.0, 31.0, 36.0, 66.0, 65.0, 82.0, 100.0, 87.0, 100.0, 80.0, 63.0, 59.0, 59.0, 26.0, 19.0, 22.0, 11.0, 7.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.56640625, -5.40911865234375, -5.2518310546875, -5.09454345703125, -4.937255859375, -4.77996826171875, -4.6226806640625, -4.46539306640625, -4.30810546875, -4.15081787109375, -3.9935302734375, -3.83624267578125, -3.678955078125, -3.52166748046875, -3.3643798828125, -3.20709228515625, -3.0498046875, -2.89251708984375, -2.7352294921875, -2.57794189453125, -2.420654296875, -2.26336669921875, -2.1060791015625, -1.94879150390625, -1.79150390625, -1.63421630859375, -1.4769287109375, -1.31964111328125, -1.162353515625, -1.00506591796875, -0.8477783203125, -0.69049072265625, -0.533203125, -0.37591552734375, -0.2186279296875, -0.06134033203125, 0.095947265625, 0.25323486328125, 0.4105224609375, 0.56781005859375, 0.72509765625, 0.88238525390625, 1.0396728515625, 1.19696044921875, 1.354248046875, 1.51153564453125, 1.6688232421875, 1.82611083984375, 1.9833984375, 2.14068603515625, 2.2979736328125, 2.45526123046875, 2.612548828125, 2.76983642578125, 2.9271240234375, 3.08441162109375, 3.24169921875, 3.39898681640625, 3.5562744140625, 3.71356201171875, 3.870849609375, 4.02813720703125, 4.1854248046875, 4.34271240234375, 4.5]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 1.0, 4.0, 8.0, 5.0, 11.0, 10.0, 8.0, 13.0, 13.0, 18.0, 16.0, 26.0, 27.0, 30.0, 40.0, 49.0, 49.0, 64.0, 107.0, 503.0, 21982.0, 1021319.0, 3593.0, 234.0, 72.0, 70.0, 47.0, 35.0, 38.0, 23.0, 25.0, 25.0, 11.0, 12.0, 12.0, 8.0, 9.0, 7.0, 9.0, 10.0, 3.0, 5.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5, -7.2037353515625, -6.907470703125, -6.6112060546875, -6.31494140625, -6.0186767578125, -5.722412109375, -5.4261474609375, -5.1298828125, -4.8336181640625, -4.537353515625, -4.2410888671875, -3.94482421875, -3.6485595703125, -3.352294921875, -3.0560302734375, -2.759765625, -2.4635009765625, -2.167236328125, -1.8709716796875, -1.57470703125, -1.2784423828125, -0.982177734375, -0.6859130859375, -0.3896484375, -0.0933837890625, 0.202880859375, 0.4991455078125, 0.79541015625, 1.0916748046875, 1.387939453125, 1.6842041015625, 1.98046875, 2.2767333984375, 2.572998046875, 2.8692626953125, 3.16552734375, 3.4617919921875, 3.758056640625, 4.0543212890625, 4.3505859375, 4.6468505859375, 4.943115234375, 5.2393798828125, 5.53564453125, 5.8319091796875, 6.128173828125, 6.4244384765625, 6.720703125, 7.0169677734375, 7.313232421875, 7.6094970703125, 7.90576171875, 8.2020263671875, 8.498291015625, 8.7945556640625, 9.0908203125, 9.3870849609375, 9.683349609375, 9.9796142578125, 10.27587890625, 10.5721435546875, 10.868408203125, 11.1646728515625, 11.4609375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 1.0, 6.0, 7.0, 6.0, 10.0, 11.0, 10.0, 15.0, 11.0, 17.0, 19.0, 23.0, 34.0, 33.0, 31.0, 39.0, 35.0, 45.0, 48.0, 58.0, 49.0, 50.0, 39.0, 39.0, 40.0, 53.0, 36.0, 32.0, 28.0, 27.0, 31.0, 22.0, 14.0, 14.0, 13.0, 11.0, 8.0, 8.0, 8.0, 8.0, 5.0, 4.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.19140625, -2.104888916015625, -2.01837158203125, -1.931854248046875, -1.8453369140625, -1.758819580078125, -1.67230224609375, -1.585784912109375, -1.499267578125, -1.412750244140625, -1.32623291015625, -1.239715576171875, -1.1531982421875, -1.066680908203125, -0.98016357421875, -0.893646240234375, -0.80712890625, -0.720611572265625, -0.63409423828125, -0.547576904296875, -0.4610595703125, -0.374542236328125, -0.28802490234375, -0.201507568359375, -0.114990234375, -0.028472900390625, 0.05804443359375, 0.144561767578125, 0.2310791015625, 0.317596435546875, 0.40411376953125, 0.490631103515625, 0.5771484375, 0.663665771484375, 0.75018310546875, 0.836700439453125, 0.9232177734375, 1.009735107421875, 1.09625244140625, 1.182769775390625, 1.269287109375, 1.355804443359375, 1.44232177734375, 1.528839111328125, 1.6153564453125, 1.701873779296875, 1.78839111328125, 1.874908447265625, 1.96142578125, 2.047943115234375, 2.13446044921875, 2.220977783203125, 2.3074951171875, 2.394012451171875, 2.48052978515625, 2.567047119140625, 2.653564453125, 2.740081787109375, 2.82659912109375, 2.913116455078125, 2.9996337890625, 3.086151123046875, 3.17266845703125, 3.259185791015625, 3.345703125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 7.0, 7.0, 12.0, 11.0, 20.0, 25.0, 44.0, 64.0, 126.0, 268.0, 721.0, 2152.0, 10379.0, 115418.0, 878205.0, 33832.0, 5056.0, 1293.0, 456.0, 190.0, 101.0, 53.0, 32.0, 23.0, 16.0, 10.0, 10.0, 9.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58642578125, -0.5649337768554688, -0.5434417724609375, -0.5219497680664062, -0.500457763671875, -0.47896575927734375, -0.4574737548828125, -0.43598175048828125, -0.41448974609375, -0.39299774169921875, -0.3715057373046875, -0.35001373291015625, -0.328521728515625, -0.30702972412109375, -0.2855377197265625, -0.26404571533203125, -0.2425537109375, -0.22106170654296875, -0.1995697021484375, -0.17807769775390625, -0.156585693359375, -0.13509368896484375, -0.1136016845703125, -0.09210968017578125, -0.07061767578125, -0.04912567138671875, -0.0276336669921875, -0.00614166259765625, 0.015350341796875, 0.03684234619140625, 0.0583343505859375, 0.07982635498046875, 0.101318359375, 0.12281036376953125, 0.1443023681640625, 0.16579437255859375, 0.187286376953125, 0.20877838134765625, 0.2302703857421875, 0.25176239013671875, 0.27325439453125, 0.29474639892578125, 0.3162384033203125, 0.33773040771484375, 0.359222412109375, 0.38071441650390625, 0.4022064208984375, 0.42369842529296875, 0.4451904296875, 0.46668243408203125, 0.4881744384765625, 0.5096664428710938, 0.531158447265625, 0.5526504516601562, 0.5741424560546875, 0.5956344604492188, 0.61712646484375, 0.6386184692382812, 0.6601104736328125, 0.6816024780273438, 0.703094482421875, 0.7245864868164062, 0.7460784912109375, 0.7675704956054688, 0.7890625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 6.0, 12.0, 19.0, 17.0, 30.0, 55.0, 111.0, 192.0, 261.0, 106.0, 67.0, 38.0, 28.0, 12.0, 4.0, 15.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.940696716308594e-05, -8.64444300532341e-05, -8.348189294338226e-05, -8.051935583353043e-05, -7.755681872367859e-05, -7.459428161382675e-05, -7.163174450397491e-05, -6.866920739412308e-05, -6.570667028427124e-05, -6.27441331744194e-05, -5.9781596064567566e-05, -5.681905895471573e-05, -5.385652184486389e-05, -5.0893984735012054e-05, -4.793144762516022e-05, -4.496891051530838e-05, -4.200637340545654e-05, -3.9043836295604706e-05, -3.608129918575287e-05, -3.311876207590103e-05, -3.0156224966049194e-05, -2.7193687856197357e-05, -2.423115074634552e-05, -2.1268613636493683e-05, -1.8306076526641846e-05, -1.534353941679001e-05, -1.2381002306938171e-05, -9.418465197086334e-06, -6.455928087234497e-06, -3.49339097738266e-06, -5.308538675308228e-07, 2.4316832423210144e-06, 5.3942203521728516e-06, 8.356757462024689e-06, 1.1319294571876526e-05, 1.4281831681728363e-05, 1.72443687915802e-05, 2.0206905901432037e-05, 2.3169443011283875e-05, 2.613198012113571e-05, 2.909451723098755e-05, 3.2057054340839386e-05, 3.501959145069122e-05, 3.798212856054306e-05, 4.09446656703949e-05, 4.3907202780246735e-05, 4.686973989009857e-05, 4.983227699995041e-05, 5.2794814109802246e-05, 5.575735121965408e-05, 5.871988832950592e-05, 6.168242543935776e-05, 6.46449625492096e-05, 6.760749965906143e-05, 7.057003676891327e-05, 7.35325738787651e-05, 7.649511098861694e-05, 7.945764809846878e-05, 8.242018520832062e-05, 8.538272231817245e-05, 8.834525942802429e-05, 9.130779653787613e-05, 9.427033364772797e-05, 9.72328707575798e-05, 0.00010019540786743164]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 6.0, 3.0, 8.0, 15.0, 21.0, 44.0, 36.0, 76.0, 148.0, 238.0, 484.0, 1079.0, 2745.0, 8582.0, 34570.0, 404306.0, 544273.0, 37637.0, 9025.0, 2955.0, 1147.0, 531.0, 255.0, 121.0, 74.0, 55.0, 38.0, 22.0, 14.0, 10.0, 8.0, 10.0, 2.0, 4.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.5712890625, -0.5558586120605469, -0.5404281616210938, -0.5249977111816406, -0.5095672607421875, -0.4941368103027344, -0.47870635986328125, -0.4632759094238281, -0.447845458984375, -0.4324150085449219, -0.41698455810546875, -0.4015541076660156, -0.3861236572265625, -0.3706932067871094, -0.35526275634765625, -0.3398323059082031, -0.32440185546875, -0.3089714050292969, -0.29354095458984375, -0.2781105041503906, -0.2626800537109375, -0.24724960327148438, -0.23181915283203125, -0.21638870239257812, -0.200958251953125, -0.18552780151367188, -0.17009735107421875, -0.15466690063476562, -0.1392364501953125, -0.12380599975585938, -0.10837554931640625, -0.09294509887695312, -0.0775146484375, -0.062084197998046875, -0.04665374755859375, -0.031223297119140625, -0.0157928466796875, -0.000362396240234375, 0.01506805419921875, 0.030498504638671875, 0.045928955078125, 0.061359405517578125, 0.07678985595703125, 0.09222030639648438, 0.1076507568359375, 0.12308120727539062, 0.13851165771484375, 0.15394210815429688, 0.16937255859375, 0.18480300903320312, 0.20023345947265625, 0.21566390991210938, 0.2310943603515625, 0.24652481079101562, 0.26195526123046875, 0.2773857116699219, 0.292816162109375, 0.3082466125488281, 0.32367706298828125, 0.3391075134277344, 0.3545379638671875, 0.3699684143066406, 0.38539886474609375, 0.4008293151855469, 0.416259765625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 3.0, 6.0, 9.0, 4.0, 10.0, 15.0, 16.0, 24.0, 21.0, 40.0, 56.0, 122.0, 278.0, 131.0, 78.0, 49.0, 25.0, 21.0, 18.0, 23.0, 8.0, 8.0, 5.0, 7.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.164794921875, -0.15860366821289062, -0.15241241455078125, -0.14622116088867188, -0.1400299072265625, -0.13383865356445312, -0.12764739990234375, -0.12145614624023438, -0.115264892578125, -0.10907363891601562, -0.10288238525390625, -0.09669113159179688, -0.0904998779296875, -0.08430862426757812, -0.07811737060546875, -0.07192611694335938, -0.06573486328125, -0.059543609619140625, -0.05335235595703125, -0.047161102294921875, -0.0409698486328125, -0.034778594970703125, -0.02858734130859375, -0.022396087646484375, -0.016204833984375, -0.010013580322265625, -0.00382232666015625, 0.002368927001953125, 0.0085601806640625, 0.014751434326171875, 0.02094268798828125, 0.027133941650390625, 0.0333251953125, 0.039516448974609375, 0.04570770263671875, 0.051898956298828125, 0.0580902099609375, 0.06428146362304688, 0.07047271728515625, 0.07666397094726562, 0.082855224609375, 0.08904647827148438, 0.09523773193359375, 0.10142898559570312, 0.1076202392578125, 0.11381149291992188, 0.12000274658203125, 0.12619400024414062, 0.13238525390625, 0.13857650756835938, 0.14476776123046875, 0.15095901489257812, 0.1571502685546875, 0.16334152221679688, 0.16953277587890625, 0.17572402954101562, 0.181915283203125, 0.18810653686523438, 0.19429779052734375, 0.20048904418945312, 0.2066802978515625, 0.21287155151367188, 0.21906280517578125, 0.22525405883789062, 0.2314453125]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 1.0, 6.0, 10.0, 30.0, 58.0, 223.0, 406.0, 184.0, 57.0, 16.0, 13.0, 6.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.630336046218872, -3.1461570262908936, -2.661977767944336, -2.1777987480163574, -1.693619728088379, -1.2094407081604004, -0.7252614498138428, -0.24108242988586426, 0.24309659004211426, 0.7272756695747375, 1.2114547491073608, 1.695633888244629, 2.1798129081726074, 2.663991928100586, 3.1481711864471436, 3.632350206375122, 4.11652946472168, 4.600708484649658, 5.084887504577637, 5.569067001342773, 6.053245544433594, 6.5374250411987305, 7.021604061126709, 7.5057830810546875, 7.989961624145508, 8.474141120910645, 8.958319664001465, 9.442499160766602, 9.926677703857422, 10.410857200622559, 10.895036697387695, 11.379215240478516, 11.863393783569336, 12.347573280334473, 12.831751823425293, 13.31593132019043, 13.80010986328125, 14.284289360046387, 14.768468856811523, 15.252647399902344, 15.736825942993164, 16.221004486083984, 16.705184936523438, 17.189363479614258, 17.673542022705078, 18.1577205657959, 18.64190101623535, 19.126079559326172, 19.610260009765625, 20.094438552856445, 20.5786190032959, 21.06279754638672, 21.54697608947754, 22.03115463256836, 22.515335083007812, 22.999513626098633, 23.483692169189453, 23.967870712280273, 24.452051162719727, 24.936229705810547, 25.420408248901367, 25.904586791992188, 26.38876724243164, 26.87294578552246, 27.35712432861328]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 10.0, 10.0, 10.0, 11.0, 23.0, 20.0, 37.0, 48.0, 37.0, 41.0, 75.0, 61.0, 80.0, 67.0, 73.0, 59.0, 67.0, 66.0, 36.0, 37.0, 38.0, 25.0, 23.0, 18.0, 11.0, 11.0, 8.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.628027439117432, -7.3864827156066895, -7.144937515258789, -6.903392791748047, -6.6618475914001465, -6.420302867889404, -6.178757667541504, -5.937212944030762, -5.6956682205200195, -5.454123497009277, -5.212578296661377, -4.971033573150635, -4.729488372802734, -4.487943649291992, -4.24639892578125, -4.00485372543335, -3.763308525085449, -3.521763563156128, -3.2802186012268066, -3.0386738777160645, -2.797128677368164, -2.555583953857422, -2.3140389919281006, -2.0724940299987793, -1.830949068069458, -1.5894041061401367, -1.3478591442108154, -1.1063143014907837, -0.8647693395614624, -0.6232243776321411, -0.3816795349121094, -0.14013457298278809, 0.101409912109375, 0.3429548442363739, 0.5844997763633728, 0.8260446786880493, 1.0675896406173706, 1.309134602546692, 1.5506794452667236, 1.792224407196045, 2.033769369125366, 2.2753143310546875, 2.516859292984009, 2.75840425491333, 2.9999489784240723, 3.2414941787719727, 3.483038902282715, 3.724583864212036, 3.9661288261413574, 4.2076735496521, 4.44921875, 4.690763473510742, 4.932308673858643, 5.173853397369385, 5.415398597717285, 5.656943321228027, 5.8984880447387695, 6.140032768249512, 6.381577968597412, 6.623122692108154, 6.864667892456055, 7.106212615966797, 7.347757339477539, 7.5893025398254395, 7.83084774017334]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 8.0, 7.0, 4.0, 15.0, 14.0, 18.0, 19.0, 24.0, 18.0, 49.0, 62.0, 64.0, 100.0, 176.0, 317.0, 560.0, 1009.0, 2185.0, 5732.0, 18217.0, 98814.0, 1649760.0, 2228750.0, 147154.0, 26671.0, 8685.0, 3203.0, 1257.0, 606.0, 294.0, 157.0, 97.0, 65.0, 31.0, 30.0, 12.0, 21.0, 18.0, 14.0, 8.0, 7.0, 7.0, 5.0, 4.0, 6.0, 2.0, 2.0, 2.0, 0.0, 5.0, 0.0, 1.0, 3.0], "bins": [-3.935546875, -3.8165283203125, -3.697509765625, -3.5784912109375, -3.45947265625, -3.3404541015625, -3.221435546875, -3.1024169921875, -2.9833984375, -2.8643798828125, -2.745361328125, -2.6263427734375, -2.50732421875, -2.3883056640625, -2.269287109375, -2.1502685546875, -2.03125, -1.9122314453125, -1.793212890625, -1.6741943359375, -1.55517578125, -1.4361572265625, -1.317138671875, -1.1981201171875, -1.0791015625, -0.9600830078125, -0.841064453125, -0.7220458984375, -0.60302734375, -0.4840087890625, -0.364990234375, -0.2459716796875, -0.126953125, -0.0079345703125, 0.111083984375, 0.2301025390625, 0.34912109375, 0.4681396484375, 0.587158203125, 0.7061767578125, 0.8251953125, 0.9442138671875, 1.063232421875, 1.1822509765625, 1.30126953125, 1.4202880859375, 1.539306640625, 1.6583251953125, 1.77734375, 1.8963623046875, 2.015380859375, 2.1343994140625, 2.25341796875, 2.3724365234375, 2.491455078125, 2.6104736328125, 2.7294921875, 2.8485107421875, 2.967529296875, 3.0865478515625, 3.20556640625, 3.3245849609375, 3.443603515625, 3.5626220703125, 3.681640625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 9.0, 4.0, 6.0, 12.0, 18.0, 35.0, 45.0, 63.0, 76.0, 99.0, 110.0, 102.0, 115.0, 74.0, 67.0, 45.0, 45.0, 22.0, 17.0, 15.0, 6.0, 8.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1015625, -3.98809814453125, -3.8746337890625, -3.76116943359375, -3.647705078125, -3.53424072265625, -3.4207763671875, -3.30731201171875, -3.19384765625, -3.08038330078125, -2.9669189453125, -2.85345458984375, -2.739990234375, -2.62652587890625, -2.5130615234375, -2.39959716796875, -2.2861328125, -2.17266845703125, -2.0592041015625, -1.94573974609375, -1.832275390625, -1.71881103515625, -1.6053466796875, -1.49188232421875, -1.37841796875, -1.26495361328125, -1.1514892578125, -1.03802490234375, -0.924560546875, -0.81109619140625, -0.6976318359375, -0.58416748046875, -0.470703125, -0.35723876953125, -0.2437744140625, -0.13031005859375, -0.016845703125, 0.09661865234375, 0.2100830078125, 0.32354736328125, 0.43701171875, 0.55047607421875, 0.6639404296875, 0.77740478515625, 0.890869140625, 1.00433349609375, 1.1177978515625, 1.23126220703125, 1.3447265625, 1.45819091796875, 1.5716552734375, 1.68511962890625, 1.798583984375, 1.91204833984375, 2.0255126953125, 2.13897705078125, 2.25244140625, 2.36590576171875, 2.4793701171875, 2.59283447265625, 2.706298828125, 2.81976318359375, 2.9332275390625, 3.04669189453125, 3.16015625]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 5.0, 9.0, 14.0, 11.0, 24.0, 24.0, 38.0, 73.0, 123.0, 611.0, 114614.0, 4077067.0, 1266.0, 186.0, 66.0, 37.0, 33.0, 26.0, 11.0, 11.0, 7.0, 6.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.34375, -25.6875, -25.03125, -24.375, -23.71875, -23.0625, -22.40625, -21.75, -21.09375, -20.4375, -19.78125, -19.125, -18.46875, -17.8125, -17.15625, -16.5, -15.84375, -15.1875, -14.53125, -13.875, -13.21875, -12.5625, -11.90625, -11.25, -10.59375, -9.9375, -9.28125, -8.625, -7.96875, -7.3125, -6.65625, -6.0, -5.34375, -4.6875, -4.03125, -3.375, -2.71875, -2.0625, -1.40625, -0.75, -0.09375, 0.5625, 1.21875, 1.875, 2.53125, 3.1875, 3.84375, 4.5, 5.15625, 5.8125, 6.46875, 7.125, 7.78125, 8.4375, 9.09375, 9.75, 10.40625, 11.0625, 11.71875, 12.375, 13.03125, 13.6875, 14.34375, 15.0, 15.65625]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 10.0, 15.0, 6.0, 14.0, 30.0, 48.0, 49.0, 84.0, 142.0, 239.0, 471.0, 819.0, 807.0, 511.0, 251.0, 205.0, 107.0, 73.0, 55.0, 36.0, 22.0, 20.0, 10.0, 11.0, 6.0, 4.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.96142578125, -0.9315185546875, -0.901611328125, -0.8717041015625, -0.841796875, -0.8118896484375, -0.781982421875, -0.7520751953125, -0.72216796875, -0.6922607421875, -0.662353515625, -0.6324462890625, -0.6025390625, -0.5726318359375, -0.542724609375, -0.5128173828125, -0.48291015625, -0.4530029296875, -0.423095703125, -0.3931884765625, -0.36328125, -0.3333740234375, -0.303466796875, -0.2735595703125, -0.24365234375, -0.2137451171875, -0.183837890625, -0.1539306640625, -0.1240234375, -0.0941162109375, -0.064208984375, -0.0343017578125, -0.00439453125, 0.0255126953125, 0.055419921875, 0.0853271484375, 0.115234375, 0.1451416015625, 0.175048828125, 0.2049560546875, 0.23486328125, 0.2647705078125, 0.294677734375, 0.3245849609375, 0.3544921875, 0.3843994140625, 0.414306640625, 0.4442138671875, 0.47412109375, 0.5040283203125, 0.533935546875, 0.5638427734375, 0.59375, 0.6236572265625, 0.653564453125, 0.6834716796875, 0.71337890625, 0.7432861328125, 0.773193359375, 0.8031005859375, 0.8330078125, 0.8629150390625, 0.892822265625, 0.9227294921875, 0.95263671875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 13.0, 17.0, 33.0, 63.0, 118.0, 194.0, 195.0, 155.0, 98.0, 48.0, 28.0, 15.0, 8.0, 8.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.742671489715576, -6.561884880065918, -6.381097793579102, -6.200311183929443, -6.019524574279785, -5.838737487792969, -5.6579508781433105, -5.477164268493652, -5.296377182006836, -5.115590572357178, -4.934803485870361, -4.754016876220703, -4.573229789733887, -4.3924431800842285, -4.21165657043457, -4.030869483947754, -3.8500828742980957, -3.6692960262298584, -3.488509178161621, -3.307722568511963, -3.1269357204437256, -2.9461488723754883, -2.76536226272583, -2.5845754146575928, -2.4037885665893555, -2.223001718521118, -2.042214870452881, -1.8614282608032227, -1.6806414127349854, -1.499854564666748, -1.3190678358078003, -1.1382811069488525, -0.9574942588806152, -0.7767074704170227, -0.5959206819534302, -0.41513389348983765, -0.23434710502624512, -0.05356031656265259, 0.12722647190093994, 0.3080132007598877, 0.488800048828125, 0.6695868372917175, 0.8503736257553101, 1.0311603546142578, 1.2119472026824951, 1.3927340507507324, 1.5735207796096802, 1.754307508468628, 1.9350943565368652, 2.1158812046051025, 2.29666805267334, 2.477454662322998, 2.6582415103912354, 2.8390283584594727, 3.019814968109131, 3.200601816177368, 3.3813886642456055, 3.5621755123138428, 3.74296236038208, 3.9237489700317383, 4.104536056518555, 4.285322666168213, 4.466109275817871, 4.6468963623046875, 4.827682971954346]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 6.0, 6.0, 12.0, 17.0, 23.0, 35.0, 37.0, 42.0, 44.0, 49.0, 65.0, 62.0, 87.0, 88.0, 94.0, 63.0, 63.0, 41.0, 40.0, 29.0, 28.0, 15.0, 17.0, 9.0, 7.0, 4.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0383687019348145, -2.9433116912841797, -2.848254680633545, -2.753197431564331, -2.6581404209136963, -2.5630834102630615, -2.4680263996124268, -2.372969150543213, -2.277912139892578, -2.1828551292419434, -2.0877981185913086, -1.9927409887313843, -1.89768385887146, -1.8026268482208252, -1.7075698375701904, -1.6125127077102661, -1.5174556970596313, -1.4223986864089966, -1.3273415565490723, -1.2322845458984375, -1.1372274160385132, -1.0421704053878784, -0.9471133351325989, -0.8520562648773193, -0.7569991946220398, -0.6619421243667603, -0.5668850541114807, -0.47182801365852356, -0.376770943403244, -0.2817138731479645, -0.18665683269500732, -0.09159976243972778, 0.003457307815551758, 0.0985143706202507, 0.19357143342494965, 0.288628488779068, 0.38368555903434753, 0.4787426292896271, 0.5737996697425842, 0.6688567399978638, 0.7639138102531433, 0.8589708805084229, 0.9540279507637024, 1.049085021018982, 1.1441420316696167, 1.239199161529541, 1.3342561721801758, 1.4293131828308105, 1.5243703126907349, 1.6194273233413696, 1.714484453201294, 1.8095414638519287, 1.904598593711853, 1.9996556043624878, 2.094712734222412, 2.189769744873047, 2.2848267555236816, 2.3798837661743164, 2.474940776824951, 2.569998025894165, 2.6650550365448, 2.7601120471954346, 2.8551690578460693, 2.950226306915283, 3.045283317565918]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 7.0, 9.0, 2.0, 3.0, 11.0, 18.0, 27.0, 50.0, 46.0, 75.0, 146.0, 251.0, 499.0, 1134.0, 2642.0, 8455.0, 43247.0, 438206.0, 491604.0, 47891.0, 9059.0, 2819.0, 1110.0, 546.0, 308.0, 155.0, 88.0, 41.0, 35.0, 20.0, 19.0, 11.0, 8.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.472900390625, -0.4566078186035156, -0.44031524658203125, -0.4240226745605469, -0.4077301025390625, -0.3914375305175781, -0.37514495849609375, -0.3588523864746094, -0.342559814453125, -0.3262672424316406, -0.30997467041015625, -0.2936820983886719, -0.2773895263671875, -0.2610969543457031, -0.24480438232421875, -0.22851181030273438, -0.21221923828125, -0.19592666625976562, -0.17963409423828125, -0.16334152221679688, -0.1470489501953125, -0.13075637817382812, -0.11446380615234375, -0.09817123413085938, -0.081878662109375, -0.06558609008789062, -0.04929351806640625, -0.033000946044921875, -0.0167083740234375, -0.000415802001953125, 0.01587677001953125, 0.032169342041015625, 0.0484619140625, 0.06475448608398438, 0.08104705810546875, 0.09733963012695312, 0.1136322021484375, 0.12992477416992188, 0.14621734619140625, 0.16250991821289062, 0.178802490234375, 0.19509506225585938, 0.21138763427734375, 0.22768020629882812, 0.2439727783203125, 0.2602653503417969, 0.27655792236328125, 0.2928504943847656, 0.30914306640625, 0.3254356384277344, 0.34172821044921875, 0.3580207824707031, 0.3743133544921875, 0.3906059265136719, 0.40689849853515625, 0.4231910705566406, 0.439483642578125, 0.4557762145996094, 0.47206878662109375, 0.4883613586425781, 0.5046539306640625, 0.5209465026855469, 0.5372390747070312, 0.5535316467285156, 0.56982421875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 9.0, 3.0, 12.0, 11.0, 17.0, 28.0, 42.0, 39.0, 57.0, 63.0, 93.0, 102.0, 101.0, 101.0, 79.0, 57.0, 53.0, 40.0, 29.0, 20.0, 14.0, 9.0, 6.0, 1.0, 4.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8046875, -1.73541259765625, -1.6661376953125, -1.59686279296875, -1.527587890625, -1.45831298828125, -1.3890380859375, -1.31976318359375, -1.25048828125, -1.18121337890625, -1.1119384765625, -1.04266357421875, -0.973388671875, -0.90411376953125, -0.8348388671875, -0.76556396484375, -0.6962890625, -0.62701416015625, -0.5577392578125, -0.48846435546875, -0.419189453125, -0.34991455078125, -0.2806396484375, -0.21136474609375, -0.14208984375, -0.07281494140625, -0.0035400390625, 0.06573486328125, 0.135009765625, 0.20428466796875, 0.2735595703125, 0.34283447265625, 0.412109375, 0.48138427734375, 0.5506591796875, 0.61993408203125, 0.689208984375, 0.75848388671875, 0.8277587890625, 0.89703369140625, 0.96630859375, 1.03558349609375, 1.1048583984375, 1.17413330078125, 1.243408203125, 1.31268310546875, 1.3819580078125, 1.45123291015625, 1.5205078125, 1.58978271484375, 1.6590576171875, 1.72833251953125, 1.797607421875, 1.86688232421875, 1.9361572265625, 2.00543212890625, 2.07470703125, 2.14398193359375, 2.2132568359375, 2.28253173828125, 2.351806640625, 2.42108154296875, 2.4903564453125, 2.55963134765625, 2.62890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 5.0, 3.0, 9.0, 10.0, 13.0, 14.0, 20.0, 25.0, 40.0, 43.0, 80.0, 100.0, 162.0, 215.0, 380.0, 579.0, 915.0, 1465.0, 2504.0, 4094.0, 6999.0, 12239.0, 22045.0, 39891.0, 75141.0, 139624.0, 226120.0, 221295.0, 134184.0, 72391.0, 38119.0, 21142.0, 11910.0, 6709.0, 3896.0, 2340.0, 1432.0, 872.0, 487.0, 352.0, 216.0, 158.0, 90.0, 67.0, 44.0, 33.0, 26.0, 22.0, 13.0, 8.0, 5.0, 8.0, 5.0, 2.0, 2.0, 2.0, 3.0], "bins": [-0.108642578125, -0.10544395446777344, -0.10224533081054688, -0.09904670715332031, -0.09584808349609375, -0.09264945983886719, -0.08945083618164062, -0.08625221252441406, -0.0830535888671875, -0.07985496520996094, -0.07665634155273438, -0.07345771789550781, -0.07025909423828125, -0.06706047058105469, -0.06386184692382812, -0.06066322326660156, -0.057464599609375, -0.05426597595214844, -0.051067352294921875, -0.04786872863769531, -0.04467010498046875, -0.04147148132324219, -0.038272857666015625, -0.03507423400878906, -0.0318756103515625, -0.028676986694335938, -0.025478363037109375, -0.022279739379882812, -0.01908111572265625, -0.015882492065429688, -0.012683868408203125, -0.009485244750976562, -0.00628662109375, -0.0030879974365234375, 0.000110626220703125, 0.0033092498779296875, 0.00650787353515625, 0.009706497192382812, 0.012905120849609375, 0.016103744506835938, 0.0193023681640625, 0.022500991821289062, 0.025699615478515625, 0.028898239135742188, 0.03209686279296875, 0.03529548645019531, 0.038494110107421875, 0.04169273376464844, 0.044891357421875, 0.04808998107910156, 0.051288604736328125, 0.05448722839355469, 0.05768585205078125, 0.06088447570800781, 0.06408309936523438, 0.06728172302246094, 0.0704803466796875, 0.07367897033691406, 0.07687759399414062, 0.08007621765136719, 0.08327484130859375, 0.08647346496582031, 0.08967208862304688, 0.09287071228027344, 0.0960693359375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 2.0, 6.0, 7.0, 1.0, 10.0, 9.0, 6.0, 10.0, 13.0, 18.0, 18.0, 23.0, 22.0, 20.0, 26.0, 27.0, 36.0, 38.0, 43.0, 41.0, 36.0, 45.0, 41.0, 46.0, 40.0, 53.0, 41.0, 39.0, 35.0, 44.0, 32.0, 15.0, 15.0, 19.0, 23.0, 23.0, 17.0, 14.0, 9.0, 5.0, 11.0, 5.0, 5.0, 5.0, 1.0, 7.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.029296875, -1.965576171875, -1.90185546875, -1.838134765625, -1.7744140625, -1.710693359375, -1.64697265625, -1.583251953125, -1.51953125, -1.455810546875, -1.39208984375, -1.328369140625, -1.2646484375, -1.200927734375, -1.13720703125, -1.073486328125, -1.009765625, -0.946044921875, -0.88232421875, -0.818603515625, -0.7548828125, -0.691162109375, -0.62744140625, -0.563720703125, -0.5, -0.436279296875, -0.37255859375, -0.308837890625, -0.2451171875, -0.181396484375, -0.11767578125, -0.053955078125, 0.009765625, 0.073486328125, 0.13720703125, 0.200927734375, 0.2646484375, 0.328369140625, 0.39208984375, 0.455810546875, 0.51953125, 0.583251953125, 0.64697265625, 0.710693359375, 0.7744140625, 0.838134765625, 0.90185546875, 0.965576171875, 1.029296875, 1.093017578125, 1.15673828125, 1.220458984375, 1.2841796875, 1.347900390625, 1.41162109375, 1.475341796875, 1.5390625, 1.602783203125, 1.66650390625, 1.730224609375, 1.7939453125, 1.857666015625, 1.92138671875, 1.985107421875, 2.048828125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 10.0, 10.0, 21.0, 47.0, 63.0, 104.0, 194.0, 425.0, 1078.0, 3166.0, 12753.0, 100785.0, 842293.0, 72314.0, 10582.0, 2879.0, 972.0, 377.0, 180.0, 106.0, 58.0, 49.0, 23.0, 22.0, 13.0, 6.0, 5.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0755615234375, -0.07315826416015625, -0.0707550048828125, -0.06835174560546875, -0.065948486328125, -0.06354522705078125, -0.0611419677734375, -0.05873870849609375, -0.05633544921875, -0.05393218994140625, -0.0515289306640625, -0.04912567138671875, -0.046722412109375, -0.04431915283203125, -0.0419158935546875, -0.03951263427734375, -0.037109375, -0.03470611572265625, -0.0323028564453125, -0.02989959716796875, -0.027496337890625, -0.02509307861328125, -0.0226898193359375, -0.02028656005859375, -0.01788330078125, -0.01548004150390625, -0.0130767822265625, -0.01067352294921875, -0.008270263671875, -0.00586700439453125, -0.0034637451171875, -0.00106048583984375, 0.0013427734375, 0.00374603271484375, 0.0061492919921875, 0.00855255126953125, 0.010955810546875, 0.01335906982421875, 0.0157623291015625, 0.01816558837890625, 0.02056884765625, 0.02297210693359375, 0.0253753662109375, 0.02777862548828125, 0.030181884765625, 0.03258514404296875, 0.0349884033203125, 0.03739166259765625, 0.039794921875, 0.04219818115234375, 0.0446014404296875, 0.04700469970703125, 0.049407958984375, 0.05181121826171875, 0.0542144775390625, 0.05661773681640625, 0.05902099609375, 0.06142425537109375, 0.0638275146484375, 0.06623077392578125, 0.068634033203125, 0.07103729248046875, 0.0734405517578125, 0.07584381103515625, 0.0782470703125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 16.0, 30.0, 24.0, 40.0, 85.0, 105.0, 175.0, 179.0, 131.0, 91.0, 55.0, 22.0, 15.0, 14.0, 8.0, 7.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00013113021850585938, -0.00012834277004003525, -0.00012555532157421112, -0.000122767873108387, -0.00011998042464256287, -0.00011719297617673874, -0.00011440552771091461, -0.00011161807924509048, -0.00010883063077926636, -0.00010604318231344223, -0.0001032557338476181, -0.00010046828538179398, -9.768083691596985e-05, -9.489338845014572e-05, -9.21059399843216e-05, -8.931849151849747e-05, -8.653104305267334e-05, -8.374359458684921e-05, -8.095614612102509e-05, -7.816869765520096e-05, -7.538124918937683e-05, -7.25938007235527e-05, -6.980635225772858e-05, -6.701890379190445e-05, -6.423145532608032e-05, -6.14440068602562e-05, -5.865655839443207e-05, -5.586910992860794e-05, -5.3081661462783813e-05, -5.0294212996959686e-05, -4.750676453113556e-05, -4.471931606531143e-05, -4.1931867599487305e-05, -3.914441913366318e-05, -3.635697066783905e-05, -3.356952220201492e-05, -3.0782073736190796e-05, -2.799462527036667e-05, -2.520717680454254e-05, -2.2419728338718414e-05, -1.9632279872894287e-05, -1.684483140707016e-05, -1.4057382941246033e-05, -1.1269934475421906e-05, -8.482486009597778e-06, -5.695037543773651e-06, -2.907589077949524e-06, -1.2014061212539673e-07, 2.6673078536987305e-06, 5.454756319522858e-06, 8.242204785346985e-06, 1.1029653251171112e-05, 1.381710171699524e-05, 1.6604550182819366e-05, 1.9391998648643494e-05, 2.217944711446762e-05, 2.4966895580291748e-05, 2.7754344046115875e-05, 3.054179251194e-05, 3.332924097776413e-05, 3.611668944358826e-05, 3.8904137909412384e-05, 4.169158637523651e-05, 4.447903484106064e-05, 4.7266483306884766e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 9.0, 11.0, 14.0, 23.0, 41.0, 66.0, 128.0, 223.0, 485.0, 1044.0, 2582.0, 7314.0, 29684.0, 411001.0, 548481.0, 34178.0, 8196.0, 2824.0, 1136.0, 515.0, 258.0, 121.0, 74.0, 41.0, 23.0, 19.0, 6.0, 9.0, 6.0, 4.0, 4.0, 3.0, 6.0, 5.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06951904296875, -0.06734943389892578, -0.06517982482910156, -0.06301021575927734, -0.060840606689453125, -0.058670997619628906, -0.05650138854980469, -0.05433177947998047, -0.05216217041015625, -0.04999256134033203, -0.04782295227050781, -0.045653343200683594, -0.043483734130859375, -0.041314125061035156, -0.03914451599121094, -0.03697490692138672, -0.0348052978515625, -0.03263568878173828, -0.030466079711914062, -0.028296470642089844, -0.026126861572265625, -0.023957252502441406, -0.021787643432617188, -0.01961803436279297, -0.01744842529296875, -0.015278816223144531, -0.013109207153320312, -0.010939598083496094, -0.008769989013671875, -0.006600379943847656, -0.0044307708740234375, -0.0022611618041992188, -9.1552734375e-05, 0.0020780563354492188, 0.0042476654052734375, 0.006417274475097656, 0.008586883544921875, 0.010756492614746094, 0.012926101684570312, 0.015095710754394531, 0.01726531982421875, 0.01943492889404297, 0.021604537963867188, 0.023774147033691406, 0.025943756103515625, 0.028113365173339844, 0.030282974243164062, 0.03245258331298828, 0.0346221923828125, 0.03679180145263672, 0.03896141052246094, 0.041131019592285156, 0.043300628662109375, 0.045470237731933594, 0.04763984680175781, 0.04980945587158203, 0.05197906494140625, 0.05414867401123047, 0.05631828308105469, 0.058487892150878906, 0.060657501220703125, 0.06282711029052734, 0.06499671936035156, 0.06716632843017578, 0.0693359375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 5.0, 5.0, 4.0, 3.0, 3.0, 10.0, 8.0, 12.0, 15.0, 20.0, 18.0, 40.0, 52.0, 82.0, 140.0, 162.0, 158.0, 85.0, 42.0, 34.0, 18.0, 23.0, 10.0, 10.0, 7.0, 5.0, 3.0, 4.0, 2.0, 6.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01445770263671875, -0.013997554779052734, -0.013537406921386719, -0.013077259063720703, -0.012617111206054688, -0.012156963348388672, -0.011696815490722656, -0.01123666763305664, -0.010776519775390625, -0.01031637191772461, -0.009856224060058594, -0.009396076202392578, -0.008935928344726562, -0.008475780487060547, -0.008015632629394531, -0.007555484771728516, -0.0070953369140625, -0.006635189056396484, -0.006175041198730469, -0.005714893341064453, -0.0052547454833984375, -0.004794597625732422, -0.004334449768066406, -0.0038743019104003906, -0.003414154052734375, -0.0029540061950683594, -0.0024938583374023438, -0.002033710479736328, -0.0015735626220703125, -0.0011134147644042969, -0.0006532669067382812, -0.00019311904907226562, 0.00026702880859375, 0.0007271766662597656, 0.0011873245239257812, 0.0016474723815917969, 0.0021076202392578125, 0.002567768096923828, 0.0030279159545898438, 0.0034880638122558594, 0.003948211669921875, 0.004408359527587891, 0.004868507385253906, 0.005328655242919922, 0.0057888031005859375, 0.006248950958251953, 0.006709098815917969, 0.007169246673583984, 0.00762939453125, 0.008089542388916016, 0.008549690246582031, 0.009009838104248047, 0.009469985961914062, 0.009930133819580078, 0.010390281677246094, 0.01085042953491211, 0.011310577392578125, 0.01177072525024414, 0.012230873107910156, 0.012691020965576172, 0.013151168823242188, 0.013611316680908203, 0.014071464538574219, 0.014531612396240234, 0.01499176025390625]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 5.0, 14.0, 24.0, 46.0, 65.0, 126.0, 201.0, 186.0, 121.0, 90.0, 52.0, 25.0, 9.0, 9.0, 8.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.754124641418457, -2.6563334465026855, -2.558542013168335, -2.4607508182525635, -2.362959384918213, -2.2651681900024414, -2.16737699508667, -2.0695858001708984, -1.9717943668365479, -1.8740030527114868, -1.7762117385864258, -1.6784205436706543, -1.5806292295455933, -1.4828379154205322, -1.3850467205047607, -1.2872554063796997, -1.1894640922546387, -1.0916727781295776, -0.9938815236091614, -0.8960902690887451, -0.7982989549636841, -0.700507640838623, -0.6027163863182068, -0.5049251317977905, -0.4071338176727295, -0.30934253334999084, -0.2115512490272522, -0.11375996470451355, -0.015968680381774902, 0.08182260394096375, 0.1796138882637024, 0.27740514278411865, 0.3751962184906006, 0.47298750281333923, 0.5707787871360779, 0.6685700416564941, 0.7663613557815552, 0.8641526699066162, 0.9619439244270325, 1.0597351789474487, 1.1575264930725098, 1.2553178071975708, 1.3531091213226318, 1.4509003162384033, 1.5486916303634644, 1.6464829444885254, 1.7442741394042969, 1.842065453529358, 1.939856767654419, 2.0376479625701904, 2.135439395904541, 2.2332305908203125, 2.331021785736084, 2.4288132190704346, 2.526604413986206, 2.6243958473205566, 2.722187042236328, 2.8199782371520996, 2.91776967048645, 3.0155608654022217, 3.1133522987365723, 3.2111434936523438, 3.3089346885681152, 3.4067258834838867, 3.5045173168182373]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 5.0, 4.0, 7.0, 5.0, 14.0, 13.0, 34.0, 32.0, 56.0, 53.0, 62.0, 86.0, 98.0, 119.0, 112.0, 71.0, 61.0, 54.0, 34.0, 29.0, 13.0, 17.0, 8.0, 4.0, 8.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.197026252746582, -2.1263413429260254, -2.0556564331054688, -1.9849717617034912, -1.9142868518829346, -1.843601942062378, -1.7729171514511108, -1.7022323608398438, -1.631547451019287, -1.5608625411987305, -1.4901777505874634, -1.4194929599761963, -1.3488080501556396, -1.278123140335083, -1.207438349723816, -1.1367535591125488, -1.0660686492919922, -0.9953837990760803, -0.9246989488601685, -0.8540140986442566, -0.7833292484283447, -0.7126443982124329, -0.641959547996521, -0.5712746977806091, -0.5005898475646973, -0.4299049973487854, -0.35922014713287354, -0.28853529691696167, -0.2178504467010498, -0.14716559648513794, -0.07648074626922607, -0.005795896053314209, 0.06488871574401855, 0.13557356595993042, 0.20625841617584229, 0.27694326639175415, 0.347628116607666, 0.4183129668235779, 0.48899781703948975, 0.5596826672554016, 0.6303675174713135, 0.7010523676872253, 0.7717372179031372, 0.8424220681190491, 0.9131069183349609, 0.9837917685508728, 1.0544766187667847, 1.1251614093780518, 1.1958463191986084, 1.266531229019165, 1.3372160196304321, 1.4079008102416992, 1.4785857200622559, 1.5492706298828125, 1.6199554204940796, 1.6906402111053467, 1.7613251209259033, 1.83201003074646, 1.902694821357727, 1.9733796119689941, 2.044064521789551, 2.1147494316101074, 2.185434341430664, 2.2561190128326416, 2.3268039226531982]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 17.0, 12.0, 15.0, 19.0, 31.0, 37.0, 63.0, 89.0, 156.0, 241.0, 478.0, 924.0, 1959.0, 4837.0, 16139.0, 106079.0, 790143.0, 102696.0, 15820.0, 4789.0, 1900.0, 911.0, 478.0, 251.0, 177.0, 116.0, 58.0, 31.0, 28.0, 17.0, 19.0, 4.0, 8.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.4453125, -2.374420166015625, -2.30352783203125, -2.232635498046875, -2.1617431640625, -2.090850830078125, -2.01995849609375, -1.949066162109375, -1.878173828125, -1.807281494140625, -1.73638916015625, -1.665496826171875, -1.5946044921875, -1.523712158203125, -1.45281982421875, -1.381927490234375, -1.31103515625, -1.240142822265625, -1.16925048828125, -1.098358154296875, -1.0274658203125, -0.956573486328125, -0.88568115234375, -0.814788818359375, -0.743896484375, -0.673004150390625, -0.60211181640625, -0.531219482421875, -0.4603271484375, -0.389434814453125, -0.31854248046875, -0.247650146484375, -0.1767578125, -0.105865478515625, -0.03497314453125, 0.035919189453125, 0.1068115234375, 0.177703857421875, 0.24859619140625, 0.319488525390625, 0.390380859375, 0.461273193359375, 0.53216552734375, 0.603057861328125, 0.6739501953125, 0.744842529296875, 0.81573486328125, 0.886627197265625, 0.95751953125, 1.028411865234375, 1.09930419921875, 1.170196533203125, 1.2410888671875, 1.311981201171875, 1.38287353515625, 1.453765869140625, 1.524658203125, 1.595550537109375, 1.66644287109375, 1.737335205078125, 1.8082275390625, 1.879119873046875, 1.95001220703125, 2.020904541015625, 2.091796875]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 8.0, 3.0, 11.0, 15.0, 19.0, 25.0, 26.0, 39.0, 48.0, 64.0, 83.0, 92.0, 99.0, 86.0, 81.0, 73.0, 64.0, 42.0, 36.0, 22.0, 16.0, 15.0, 10.0, 6.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.36328125, -4.224853515625, -4.08642578125, -3.947998046875, -3.8095703125, -3.671142578125, -3.53271484375, -3.394287109375, -3.255859375, -3.117431640625, -2.97900390625, -2.840576171875, -2.7021484375, -2.563720703125, -2.42529296875, -2.286865234375, -2.1484375, -2.010009765625, -1.87158203125, -1.733154296875, -1.5947265625, -1.456298828125, -1.31787109375, -1.179443359375, -1.041015625, -0.902587890625, -0.76416015625, -0.625732421875, -0.4873046875, -0.348876953125, -0.21044921875, -0.072021484375, 0.06640625, 0.204833984375, 0.34326171875, 0.481689453125, 0.6201171875, 0.758544921875, 0.89697265625, 1.035400390625, 1.173828125, 1.312255859375, 1.45068359375, 1.589111328125, 1.7275390625, 1.865966796875, 2.00439453125, 2.142822265625, 2.28125, 2.419677734375, 2.55810546875, 2.696533203125, 2.8349609375, 2.973388671875, 3.11181640625, 3.250244140625, 3.388671875, 3.527099609375, 3.66552734375, 3.803955078125, 3.9423828125, 4.080810546875, 4.21923828125, 4.357666015625, 4.49609375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 9.0, 11.0, 4.0, 11.0, 12.0, 27.0, 18.0, 30.0, 41.0, 69.0, 110.0, 142.0, 300.0, 1196.0, 10207.0, 814185.0, 214962.0, 5683.0, 807.0, 254.0, 118.0, 73.0, 59.0, 59.0, 36.0, 29.0, 31.0, 12.0, 15.0, 11.0, 9.0, 7.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.7890625, -4.651763916015625, -4.51446533203125, -4.377166748046875, -4.2398681640625, -4.102569580078125, -3.96527099609375, -3.827972412109375, -3.690673828125, -3.553375244140625, -3.41607666015625, -3.278778076171875, -3.1414794921875, -3.004180908203125, -2.86688232421875, -2.729583740234375, -2.59228515625, -2.454986572265625, -2.31768798828125, -2.180389404296875, -2.0430908203125, -1.905792236328125, -1.76849365234375, -1.631195068359375, -1.493896484375, -1.356597900390625, -1.21929931640625, -1.082000732421875, -0.9447021484375, -0.807403564453125, -0.67010498046875, -0.532806396484375, -0.3955078125, -0.258209228515625, -0.12091064453125, 0.016387939453125, 0.1536865234375, 0.290985107421875, 0.42828369140625, 0.565582275390625, 0.702880859375, 0.840179443359375, 0.97747802734375, 1.114776611328125, 1.2520751953125, 1.389373779296875, 1.52667236328125, 1.663970947265625, 1.80126953125, 1.938568115234375, 2.07586669921875, 2.213165283203125, 2.3504638671875, 2.487762451171875, 2.62506103515625, 2.762359619140625, 2.899658203125, 3.036956787109375, 3.17425537109375, 3.311553955078125, 3.4488525390625, 3.586151123046875, 3.72344970703125, 3.860748291015625, 3.998046875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 14.0, 6.0, 7.0, 17.0, 20.0, 18.0, 16.0, 26.0, 39.0, 33.0, 45.0, 37.0, 50.0, 46.0, 65.0, 47.0, 65.0, 56.0, 58.0, 47.0, 44.0, 33.0, 40.0, 26.0, 30.0, 21.0, 23.0, 16.0, 13.0, 11.0, 6.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.458984375, -3.360443115234375, -3.26190185546875, -3.163360595703125, -3.0648193359375, -2.966278076171875, -2.86773681640625, -2.769195556640625, -2.670654296875, -2.572113037109375, -2.47357177734375, -2.375030517578125, -2.2764892578125, -2.177947998046875, -2.07940673828125, -1.980865478515625, -1.88232421875, -1.783782958984375, -1.68524169921875, -1.586700439453125, -1.4881591796875, -1.389617919921875, -1.29107666015625, -1.192535400390625, -1.093994140625, -0.995452880859375, -0.89691162109375, -0.798370361328125, -0.6998291015625, -0.601287841796875, -0.50274658203125, -0.404205322265625, -0.3056640625, -0.207122802734375, -0.10858154296875, -0.010040283203125, 0.0885009765625, 0.187042236328125, 0.28558349609375, 0.384124755859375, 0.482666015625, 0.581207275390625, 0.67974853515625, 0.778289794921875, 0.8768310546875, 0.975372314453125, 1.07391357421875, 1.172454833984375, 1.27099609375, 1.369537353515625, 1.46807861328125, 1.566619873046875, 1.6651611328125, 1.763702392578125, 1.86224365234375, 1.960784912109375, 2.059326171875, 2.157867431640625, 2.25640869140625, 2.354949951171875, 2.4534912109375, 2.552032470703125, 2.65057373046875, 2.749114990234375, 2.84765625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 5.0, 5.0, 13.0, 17.0, 32.0, 43.0, 57.0, 92.0, 150.0, 199.0, 378.0, 650.0, 1206.0, 2518.0, 7322.0, 41933.0, 865031.0, 110329.0, 11685.0, 3411.0, 1498.0, 786.0, 440.0, 265.0, 166.0, 93.0, 76.0, 42.0, 26.0, 28.0, 15.0, 9.0, 10.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.53759765625, -0.5194778442382812, -0.5013580322265625, -0.48323822021484375, -0.465118408203125, -0.44699859619140625, -0.4288787841796875, -0.41075897216796875, -0.39263916015625, -0.37451934814453125, -0.3563995361328125, -0.33827972412109375, -0.320159912109375, -0.30204010009765625, -0.2839202880859375, -0.26580047607421875, -0.2476806640625, -0.22956085205078125, -0.2114410400390625, -0.19332122802734375, -0.175201416015625, -0.15708160400390625, -0.1389617919921875, -0.12084197998046875, -0.10272216796875, -0.08460235595703125, -0.0664825439453125, -0.04836273193359375, -0.030242919921875, -0.01212310791015625, 0.0059967041015625, 0.02411651611328125, 0.042236328125, 0.06035614013671875, 0.0784759521484375, 0.09659576416015625, 0.114715576171875, 0.13283538818359375, 0.1509552001953125, 0.16907501220703125, 0.18719482421875, 0.20531463623046875, 0.2234344482421875, 0.24155426025390625, 0.259674072265625, 0.27779388427734375, 0.2959136962890625, 0.31403350830078125, 0.3321533203125, 0.35027313232421875, 0.3683929443359375, 0.38651275634765625, 0.404632568359375, 0.42275238037109375, 0.4408721923828125, 0.45899200439453125, 0.47711181640625, 0.49523162841796875, 0.5133514404296875, 0.5314712524414062, 0.549591064453125, 0.5677108764648438, 0.5858306884765625, 0.6039505004882812, 0.6220703125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 6.0, 19.0, 23.0, 51.0, 101.0, 195.0, 268.0, 162.0, 64.0, 45.0, 19.0, 12.0, 5.0, 5.0, 3.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00010716915130615234, -0.00010443944483995438, -0.00010170973837375641, -9.898003190755844e-05, -9.625032544136047e-05, -9.35206189751625e-05, -9.079091250896454e-05, -8.806120604276657e-05, -8.53314995765686e-05, -8.260179311037064e-05, -7.987208664417267e-05, -7.71423801779747e-05, -7.441267371177673e-05, -7.168296724557877e-05, -6.89532607793808e-05, -6.622355431318283e-05, -6.349384784698486e-05, -6.0764141380786896e-05, -5.803443491458893e-05, -5.530472844839096e-05, -5.257502198219299e-05, -4.9845315515995026e-05, -4.711560904979706e-05, -4.438590258359909e-05, -4.165619611740112e-05, -3.8926489651203156e-05, -3.619678318500519e-05, -3.346707671880722e-05, -3.073737025260925e-05, -2.8007663786411285e-05, -2.5277957320213318e-05, -2.254825085401535e-05, -1.9818544387817383e-05, -1.7088837921619415e-05, -1.4359131455421448e-05, -1.162942498922348e-05, -8.899718523025513e-06, -6.170012056827545e-06, -3.4403055906295776e-06, -7.105991244316101e-07, 2.0191073417663574e-06, 4.748813807964325e-06, 7.4785202741622925e-06, 1.020822674036026e-05, 1.2937933206558228e-05, 1.5667639672756195e-05, 1.8397346138954163e-05, 2.112705260515213e-05, 2.3856759071350098e-05, 2.6586465537548065e-05, 2.9316172003746033e-05, 3.2045878469944e-05, 3.477558493614197e-05, 3.7505291402339935e-05, 4.02349978685379e-05, 4.296470433473587e-05, 4.569441080093384e-05, 4.8424117267131805e-05, 5.115382373332977e-05, 5.388353019952774e-05, 5.661323666572571e-05, 5.9342943131923676e-05, 6.207264959812164e-05, 6.480235606431961e-05, 6.753206253051758e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 17.0, 12.0, 16.0, 29.0, 44.0, 65.0, 108.0, 160.0, 243.0, 389.0, 694.0, 1158.0, 2195.0, 5453.0, 25435.0, 650153.0, 334183.0, 19075.0, 4647.0, 1920.0, 961.0, 519.0, 359.0, 224.0, 167.0, 95.0, 66.0, 61.0, 29.0, 21.0, 15.0, 8.0, 10.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.603515625, -0.5846099853515625, -0.565704345703125, -0.5467987060546875, -0.52789306640625, -0.5089874267578125, -0.490081787109375, -0.4711761474609375, -0.4522705078125, -0.4333648681640625, -0.414459228515625, -0.3955535888671875, -0.37664794921875, -0.3577423095703125, -0.338836669921875, -0.3199310302734375, -0.301025390625, -0.2821197509765625, -0.263214111328125, -0.2443084716796875, -0.22540283203125, -0.2064971923828125, -0.187591552734375, -0.1686859130859375, -0.1497802734375, -0.1308746337890625, -0.111968994140625, -0.0930633544921875, -0.07415771484375, -0.0552520751953125, -0.036346435546875, -0.0174407958984375, 0.00146484375, 0.0203704833984375, 0.039276123046875, 0.0581817626953125, 0.07708740234375, 0.0959930419921875, 0.114898681640625, 0.1338043212890625, 0.1527099609375, 0.1716156005859375, 0.190521240234375, 0.2094268798828125, 0.22833251953125, 0.2472381591796875, 0.266143798828125, 0.2850494384765625, 0.303955078125, 0.3228607177734375, 0.341766357421875, 0.3606719970703125, 0.37957763671875, 0.3984832763671875, 0.417388916015625, 0.4362945556640625, 0.4552001953125, 0.4741058349609375, 0.493011474609375, 0.5119171142578125, 0.53082275390625, 0.5497283935546875, 0.568634033203125, 0.5875396728515625, 0.6064453125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 5.0, 21.0, 20.0, 55.0, 96.0, 193.0, 247.0, 155.0, 88.0, 43.0, 28.0, 12.0, 7.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.242919921875, -0.23492431640625, -0.2269287109375, -0.21893310546875, -0.2109375, -0.20294189453125, -0.1949462890625, -0.18695068359375, -0.178955078125, -0.17095947265625, -0.1629638671875, -0.15496826171875, -0.14697265625, -0.13897705078125, -0.1309814453125, -0.12298583984375, -0.114990234375, -0.10699462890625, -0.0989990234375, -0.09100341796875, -0.0830078125, -0.07501220703125, -0.0670166015625, -0.05902099609375, -0.051025390625, -0.04302978515625, -0.0350341796875, -0.02703857421875, -0.01904296875, -0.01104736328125, -0.0030517578125, 0.00494384765625, 0.012939453125, 0.02093505859375, 0.0289306640625, 0.03692626953125, 0.044921875, 0.05291748046875, 0.0609130859375, 0.06890869140625, 0.076904296875, 0.08489990234375, 0.0928955078125, 0.10089111328125, 0.10888671875, 0.11688232421875, 0.1248779296875, 0.13287353515625, 0.140869140625, 0.14886474609375, 0.1568603515625, 0.16485595703125, 0.1728515625, 0.18084716796875, 0.1888427734375, 0.19683837890625, 0.204833984375, 0.21282958984375, 0.2208251953125, 0.22882080078125, 0.23681640625, 0.24481201171875, 0.2528076171875, 0.26080322265625, 0.268798828125]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 4.0, 10.0, 13.0, 15.0, 14.0, 30.0, 60.0, 93.0, 157.0, 163.0, 134.0, 107.0, 77.0, 39.0, 29.0, 14.0, 15.0, 12.0, 3.0, 4.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.511663913726807, -4.349172592163086, -4.186681270599365, -4.0241899490356445, -3.8616983890533447, -3.699206829071045, -3.536715507507324, -3.3742241859436035, -3.211732864379883, -3.049241542816162, -2.8867499828338623, -2.7242586612701416, -2.561767339706421, -2.399275779724121, -2.2367844581604004, -2.0742931365966797, -1.9118015766143799, -1.7493101358413696, -1.586818814277649, -1.4243273735046387, -1.261836051940918, -1.0993446111679077, -0.9368531703948975, -0.7743618488311768, -0.6118704080581665, -0.449379026889801, -0.28688761591911316, -0.12439620494842529, 0.038095176219940186, 0.20058655738830566, 0.3630779981613159, 0.5255693197250366, 0.6880607604980469, 0.8505521416664124, 1.0130435228347778, 1.175534963607788, 1.3380262851715088, 1.500517725944519, 1.6630091667175293, 1.82550048828125, 1.9879919290542603, 2.1504833698272705, 2.312974691390991, 2.475466251373291, 2.6379575729370117, 2.8004488945007324, 2.962940216064453, 3.125431537628174, 3.2879230976104736, 3.4504144191741943, 3.612905979156494, 3.775397300720215, 3.9378886222839355, 4.100379943847656, 4.262871742248535, 4.425362586975098, 4.587854385375977, 4.750345706939697, 4.912837028503418, 5.075328826904297, 5.237820148468018, 5.400311470031738, 5.562802791595459, 5.72529411315918, 5.8877854347229]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 6.0, 13.0, 19.0, 16.0, 20.0, 28.0, 34.0, 51.0, 55.0, 50.0, 67.0, 80.0, 73.0, 66.0, 73.0, 69.0, 57.0, 52.0, 41.0, 36.0, 32.0, 13.0, 17.0, 13.0, 10.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.097884654998779, -6.857694625854492, -6.617504119873047, -6.377313613891602, -6.1371235847473145, -5.896933555603027, -5.656743049621582, -5.416552543640137, -5.17636251449585, -4.9361724853515625, -4.695981979370117, -4.455791473388672, -4.215601444244385, -3.9754111766815186, -3.7352209091186523, -3.495030641555786, -3.25484037399292, -3.0146501064300537, -2.7744598388671875, -2.5342695713043213, -2.294079303741455, -2.053889036178589, -1.8136987686157227, -1.5735085010528564, -1.3333182334899902, -1.093127965927124, -0.8529376983642578, -0.6127474308013916, -0.3725571632385254, -0.13236689567565918, 0.10782337188720703, 0.34801363945007324, 0.5882043838500977, 0.8283946514129639, 1.06858491897583, 1.3087751865386963, 1.5489654541015625, 1.7891557216644287, 2.029345989227295, 2.269536256790161, 2.5097265243530273, 2.7499167919158936, 2.9901070594787598, 3.230297327041626, 3.470487594604492, 3.7106778621673584, 3.9508681297302246, 4.191058158874512, 4.431248664855957, 4.671439170837402, 4.9116291999816895, 5.151819229125977, 5.392009735107422, 5.632200241088867, 5.872390270233154, 6.112580299377441, 6.352770805358887, 6.592961311340332, 6.833151340484619, 7.073341369628906, 7.313531875610352, 7.553722381591797, 7.793912410736084, 8.034102439880371, 8.274292945861816]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 2.0, 5.0, 15.0, 14.0, 33.0, 41.0, 63.0, 108.0, 154.0, 263.0, 483.0, 1008.0, 1883.0, 4721.0, 13646.0, 55294.0, 610077.0, 3078336.0, 358083.0, 49101.0, 12978.0, 4322.0, 1756.0, 824.0, 413.0, 293.0, 154.0, 92.0, 39.0, 32.0, 17.0, 14.0, 7.0, 1.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.68359375, -3.58770751953125, -3.4918212890625, -3.39593505859375, -3.300048828125, -3.20416259765625, -3.1082763671875, -3.01239013671875, -2.91650390625, -2.82061767578125, -2.7247314453125, -2.62884521484375, -2.532958984375, -2.43707275390625, -2.3411865234375, -2.24530029296875, -2.1494140625, -2.05352783203125, -1.9576416015625, -1.86175537109375, -1.765869140625, -1.66998291015625, -1.5740966796875, -1.47821044921875, -1.38232421875, -1.28643798828125, -1.1905517578125, -1.09466552734375, -0.998779296875, -0.90289306640625, -0.8070068359375, -0.71112060546875, -0.615234375, -0.51934814453125, -0.4234619140625, -0.32757568359375, -0.231689453125, -0.13580322265625, -0.0399169921875, 0.05596923828125, 0.15185546875, 0.24774169921875, 0.3436279296875, 0.43951416015625, 0.535400390625, 0.63128662109375, 0.7271728515625, 0.82305908203125, 0.9189453125, 1.01483154296875, 1.1107177734375, 1.20660400390625, 1.302490234375, 1.39837646484375, 1.4942626953125, 1.59014892578125, 1.68603515625, 1.78192138671875, 1.8778076171875, 1.97369384765625, 2.069580078125, 2.16546630859375, 2.2613525390625, 2.35723876953125, 2.453125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 7.0, 13.0, 18.0, 25.0, 38.0, 55.0, 65.0, 77.0, 97.0, 114.0, 103.0, 88.0, 79.0, 62.0, 43.0, 41.0, 16.0, 15.0, 12.0, 5.0, 5.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.990234375, -2.9012451171875, -2.812255859375, -2.7232666015625, -2.63427734375, -2.5452880859375, -2.456298828125, -2.3673095703125, -2.2783203125, -2.1893310546875, -2.100341796875, -2.0113525390625, -1.92236328125, -1.8333740234375, -1.744384765625, -1.6553955078125, -1.56640625, -1.4774169921875, -1.388427734375, -1.2994384765625, -1.21044921875, -1.1214599609375, -1.032470703125, -0.9434814453125, -0.8544921875, -0.7655029296875, -0.676513671875, -0.5875244140625, -0.49853515625, -0.4095458984375, -0.320556640625, -0.2315673828125, -0.142578125, -0.0535888671875, 0.035400390625, 0.1243896484375, 0.21337890625, 0.3023681640625, 0.391357421875, 0.4803466796875, 0.5693359375, 0.6583251953125, 0.747314453125, 0.8363037109375, 0.92529296875, 1.0142822265625, 1.103271484375, 1.1922607421875, 1.28125, 1.3702392578125, 1.459228515625, 1.5482177734375, 1.63720703125, 1.7261962890625, 1.815185546875, 1.9041748046875, 1.9931640625, 2.0821533203125, 2.171142578125, 2.2601318359375, 2.34912109375, 2.4381103515625, 2.527099609375, 2.6160888671875, 2.705078125]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 11.0, 10.0, 17.0, 34.0, 53.0, 120.0, 179.0, 470.0, 1602.0, 15218.0, 3797410.0, 370524.0, 6842.0, 1017.0, 364.0, 176.0, 83.0, 76.0, 28.0, 18.0, 14.0, 7.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.7109375, -9.47320556640625, -9.2354736328125, -8.99774169921875, -8.760009765625, -8.52227783203125, -8.2845458984375, -8.04681396484375, -7.80908203125, -7.57135009765625, -7.3336181640625, -7.09588623046875, -6.858154296875, -6.62042236328125, -6.3826904296875, -6.14495849609375, -5.9072265625, -5.66949462890625, -5.4317626953125, -5.19403076171875, -4.956298828125, -4.71856689453125, -4.4808349609375, -4.24310302734375, -4.00537109375, -3.76763916015625, -3.5299072265625, -3.29217529296875, -3.054443359375, -2.81671142578125, -2.5789794921875, -2.34124755859375, -2.103515625, -1.86578369140625, -1.6280517578125, -1.39031982421875, -1.152587890625, -0.91485595703125, -0.6771240234375, -0.43939208984375, -0.20166015625, 0.03607177734375, 0.2738037109375, 0.51153564453125, 0.749267578125, 0.98699951171875, 1.2247314453125, 1.46246337890625, 1.7001953125, 1.93792724609375, 2.1756591796875, 2.41339111328125, 2.651123046875, 2.88885498046875, 3.1265869140625, 3.36431884765625, 3.60205078125, 3.83978271484375, 4.0775146484375, 4.31524658203125, 4.552978515625, 4.79071044921875, 5.0284423828125, 5.26617431640625, 5.50390625]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 8.0, 6.0, 15.0, 14.0, 20.0, 27.0, 34.0, 63.0, 95.0, 200.0, 347.0, 736.0, 1029.0, 692.0, 339.0, 139.0, 97.0, 56.0, 40.0, 35.0, 26.0, 14.0, 8.0, 3.0, 12.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0205078125, -0.990875244140625, -0.96124267578125, -0.931610107421875, -0.9019775390625, -0.872344970703125, -0.84271240234375, -0.813079833984375, -0.783447265625, -0.753814697265625, -0.72418212890625, -0.694549560546875, -0.6649169921875, -0.635284423828125, -0.60565185546875, -0.576019287109375, -0.54638671875, -0.516754150390625, -0.48712158203125, -0.457489013671875, -0.4278564453125, -0.398223876953125, -0.36859130859375, -0.338958740234375, -0.309326171875, -0.279693603515625, -0.25006103515625, -0.220428466796875, -0.1907958984375, -0.161163330078125, -0.13153076171875, -0.101898193359375, -0.072265625, -0.042633056640625, -0.01300048828125, 0.016632080078125, 0.0462646484375, 0.075897216796875, 0.10552978515625, 0.135162353515625, 0.164794921875, 0.194427490234375, 0.22406005859375, 0.253692626953125, 0.2833251953125, 0.312957763671875, 0.34259033203125, 0.372222900390625, 0.40185546875, 0.431488037109375, 0.46112060546875, 0.490753173828125, 0.5203857421875, 0.550018310546875, 0.57965087890625, 0.609283447265625, 0.638916015625, 0.668548583984375, 0.69818115234375, 0.727813720703125, 0.7574462890625, 0.787078857421875, 0.81671142578125, 0.846343994140625, 0.8759765625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 12.0, 12.0, 17.0, 18.0, 48.0, 64.0, 104.0, 171.0, 173.0, 124.0, 108.0, 51.0, 35.0, 15.0, 15.0, 10.0, 12.0, 7.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.637568950653076, -5.504051208496094, -5.370533466339111, -5.237015724182129, -5.1034979820251465, -4.969980239868164, -4.83646297454834, -4.702945232391357, -4.569427490234375, -4.435909748077393, -4.30239200592041, -4.168874263763428, -4.035356521606445, -3.901839017868042, -3.7683212757110596, -3.634803533554077, -3.5012857913970947, -3.3677680492401123, -3.23425030708313, -3.1007328033447266, -2.967215061187744, -2.8336973190307617, -2.7001795768737793, -2.566661834716797, -2.4331440925598145, -2.299626350402832, -2.1661086082458496, -2.032590866088867, -1.8990733623504639, -1.7655556201934814, -1.632037878036499, -1.4985201358795166, -1.3650026321411133, -1.2314848899841309, -1.097967267036438, -0.9644495248794556, -0.8309318423271179, -0.6974141597747803, -0.5638964176177979, -0.4303787350654602, -0.29686105251312256, -0.16334335505962372, -0.029825657606124878, 0.10369205474853516, 0.2372097373008728, 0.37072741985321045, 0.5042451620101929, 0.6377628445625305, 0.7712805271148682, 0.9047982096672058, 1.0383158922195435, 1.1718336343765259, 1.3053512573242188, 1.4388689994812012, 1.5723867416381836, 1.705904483795166, 1.8394221067428589, 1.9729398488998413, 2.106457471847534, 2.2399752140045166, 2.373492956161499, 2.5070104598999023, 2.6405282020568848, 2.774045944213867, 2.9075636863708496]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 12.0, 13.0, 20.0, 16.0, 27.0, 42.0, 40.0, 56.0, 55.0, 83.0, 76.0, 91.0, 81.0, 73.0, 64.0, 54.0, 50.0, 27.0, 36.0, 22.0, 22.0, 10.0, 8.0, 6.0, 8.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0201945304870605, -2.9325990676879883, -2.845003843307495, -2.757408380508423, -2.6698131561279297, -2.5822176933288574, -2.494622230529785, -2.407027006149292, -2.3194315433502197, -2.2318360805511475, -2.1442408561706543, -2.056645393371582, -1.9690500497817993, -1.8814547061920166, -1.7938593626022339, -1.7062640190124512, -1.6186686754226685, -1.5310733318328857, -1.443477988243103, -1.3558826446533203, -1.268287181854248, -1.1806918382644653, -1.0930964946746826, -1.0055010318756104, -0.9179057478904724, -0.8303104043006897, -0.7427150011062622, -0.6551196575164795, -0.5675243139266968, -0.4799289107322693, -0.3923335671424866, -0.3047381639480591, -0.21714282035827637, -0.12954744696617126, -0.041952088475227356, 0.04564327001571655, 0.13323864340782166, 0.22083401679992676, 0.3084293603897095, 0.39602476358413696, 0.4836201071739197, 0.5712154507637024, 0.6588108539581299, 0.7464061975479126, 0.8340015411376953, 0.9215969443321228, 1.0091922283172607, 1.096787691116333, 1.1843830347061157, 1.2719783782958984, 1.3595737218856812, 1.4471690654754639, 1.5347645282745361, 1.6223598718643188, 1.7099552154541016, 1.7975506782531738, 1.885145902633667, 1.9727412462234497, 2.0603365898132324, 2.1479320526123047, 2.235527276992798, 2.32312273979187, 2.4107179641723633, 2.4983134269714355, 2.585908889770508]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 9.0, 5.0, 11.0, 10.0, 23.0, 32.0, 52.0, 48.0, 102.0, 141.0, 230.0, 346.0, 648.0, 1192.0, 2599.0, 6521.0, 21851.0, 99715.0, 541974.0, 299376.0, 52122.0, 13031.0, 4391.0, 1876.0, 906.0, 481.0, 295.0, 199.0, 108.0, 82.0, 46.0, 32.0, 27.0, 18.0, 15.0, 10.0, 9.0, 10.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.365478515625, -0.3543357849121094, -0.34319305419921875, -0.3320503234863281, -0.3209075927734375, -0.3097648620605469, -0.29862213134765625, -0.2874794006347656, -0.276336669921875, -0.2651939392089844, -0.25405120849609375, -0.24290847778320312, -0.2317657470703125, -0.22062301635742188, -0.20948028564453125, -0.19833755493164062, -0.18719482421875, -0.17605209350585938, -0.16490936279296875, -0.15376663208007812, -0.1426239013671875, -0.13148117065429688, -0.12033843994140625, -0.10919570922851562, -0.098052978515625, -0.08691024780273438, -0.07576751708984375, -0.06462478637695312, -0.0534820556640625, -0.042339324951171875, -0.03119659423828125, -0.020053863525390625, -0.0089111328125, 0.002231597900390625, 0.01337432861328125, 0.024517059326171875, 0.0356597900390625, 0.046802520751953125, 0.05794525146484375, 0.06908798217773438, 0.080230712890625, 0.09137344360351562, 0.10251617431640625, 0.11365890502929688, 0.1248016357421875, 0.13594436645507812, 0.14708709716796875, 0.15822982788085938, 0.16937255859375, 0.18051528930664062, 0.19165802001953125, 0.20280075073242188, 0.2139434814453125, 0.22508621215820312, 0.23622894287109375, 0.24737167358398438, 0.258514404296875, 0.2696571350097656, 0.28079986572265625, 0.2919425964355469, 0.3030853271484375, 0.3142280578613281, 0.32537078857421875, 0.3365135192871094, 0.34765625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 8.0, 17.0, 23.0, 13.0, 34.0, 57.0, 73.0, 75.0, 120.0, 106.0, 97.0, 124.0, 69.0, 53.0, 37.0, 28.0, 21.0, 17.0, 8.0, 10.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.427734375, -2.35345458984375, -2.2791748046875, -2.20489501953125, -2.130615234375, -2.05633544921875, -1.9820556640625, -1.90777587890625, -1.83349609375, -1.75921630859375, -1.6849365234375, -1.61065673828125, -1.536376953125, -1.46209716796875, -1.3878173828125, -1.31353759765625, -1.2392578125, -1.16497802734375, -1.0906982421875, -1.01641845703125, -0.942138671875, -0.86785888671875, -0.7935791015625, -0.71929931640625, -0.64501953125, -0.57073974609375, -0.4964599609375, -0.42218017578125, -0.347900390625, -0.27362060546875, -0.1993408203125, -0.12506103515625, -0.05078125, 0.02349853515625, 0.0977783203125, 0.17205810546875, 0.246337890625, 0.32061767578125, 0.3948974609375, 0.46917724609375, 0.54345703125, 0.61773681640625, 0.6920166015625, 0.76629638671875, 0.840576171875, 0.91485595703125, 0.9891357421875, 1.06341552734375, 1.1376953125, 1.21197509765625, 1.2862548828125, 1.36053466796875, 1.434814453125, 1.50909423828125, 1.5833740234375, 1.65765380859375, 1.73193359375, 1.80621337890625, 1.8804931640625, 1.95477294921875, 2.029052734375, 2.10333251953125, 2.1776123046875, 2.25189208984375, 2.326171875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 5.0, 11.0, 11.0, 20.0, 32.0, 51.0, 94.0, 114.0, 180.0, 257.0, 382.0, 623.0, 1042.0, 1730.0, 2760.0, 4750.0, 8179.0, 15077.0, 28214.0, 54743.0, 109096.0, 211581.0, 266903.0, 166589.0, 83042.0, 41706.0, 22022.0, 12024.0, 6806.0, 4025.0, 2350.0, 1479.0, 905.0, 579.0, 380.0, 241.0, 163.0, 92.0, 97.0, 57.0, 39.0, 31.0, 19.0, 14.0, 11.0, 4.0, 3.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.10980224609375, -0.10617923736572266, -0.10255622863769531, -0.09893321990966797, -0.09531021118164062, -0.09168720245361328, -0.08806419372558594, -0.0844411849975586, -0.08081817626953125, -0.0771951675415039, -0.07357215881347656, -0.06994915008544922, -0.06632614135742188, -0.06270313262939453, -0.05908012390136719, -0.055457115173339844, -0.0518341064453125, -0.048211097717285156, -0.04458808898925781, -0.04096508026123047, -0.037342071533203125, -0.03371906280517578, -0.030096054077148438, -0.026473045349121094, -0.02285003662109375, -0.019227027893066406, -0.015604019165039062, -0.011981010437011719, -0.008358001708984375, -0.004734992980957031, -0.0011119842529296875, 0.0025110244750976562, 0.006134033203125, 0.009757041931152344, 0.013380050659179688, 0.01700305938720703, 0.020626068115234375, 0.02424907684326172, 0.027872085571289062, 0.031495094299316406, 0.03511810302734375, 0.038741111755371094, 0.04236412048339844, 0.04598712921142578, 0.049610137939453125, 0.05323314666748047, 0.05685615539550781, 0.060479164123535156, 0.0641021728515625, 0.06772518157958984, 0.07134819030761719, 0.07497119903564453, 0.07859420776367188, 0.08221721649169922, 0.08584022521972656, 0.0894632339477539, 0.09308624267578125, 0.0967092514038086, 0.10033226013183594, 0.10395526885986328, 0.10757827758789062, 0.11120128631591797, 0.11482429504394531, 0.11844730377197266, 0.1220703125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 10.0, 3.0, 9.0, 6.0, 11.0, 12.0, 10.0, 27.0, 25.0, 22.0, 39.0, 18.0, 41.0, 35.0, 30.0, 37.0, 46.0, 28.0, 43.0, 36.0, 44.0, 51.0, 48.0, 46.0, 46.0, 37.0, 29.0, 28.0, 24.0, 15.0, 18.0, 22.0, 12.0, 10.0, 15.0, 13.0, 7.0, 8.0, 2.0, 4.0, 6.0, 8.0, 5.0, 3.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0], "bins": [-2.00390625, -1.936614990234375, -1.86932373046875, -1.802032470703125, -1.7347412109375, -1.667449951171875, -1.60015869140625, -1.532867431640625, -1.465576171875, -1.398284912109375, -1.33099365234375, -1.263702392578125, -1.1964111328125, -1.129119873046875, -1.06182861328125, -0.994537353515625, -0.92724609375, -0.859954833984375, -0.79266357421875, -0.725372314453125, -0.6580810546875, -0.590789794921875, -0.52349853515625, -0.456207275390625, -0.388916015625, -0.321624755859375, -0.25433349609375, -0.187042236328125, -0.1197509765625, -0.052459716796875, 0.01483154296875, 0.082122802734375, 0.1494140625, 0.216705322265625, 0.28399658203125, 0.351287841796875, 0.4185791015625, 0.485870361328125, 0.55316162109375, 0.620452880859375, 0.687744140625, 0.755035400390625, 0.82232666015625, 0.889617919921875, 0.9569091796875, 1.024200439453125, 1.09149169921875, 1.158782958984375, 1.22607421875, 1.293365478515625, 1.36065673828125, 1.427947998046875, 1.4952392578125, 1.562530517578125, 1.62982177734375, 1.697113037109375, 1.764404296875, 1.831695556640625, 1.89898681640625, 1.966278076171875, 2.0335693359375, 2.100860595703125, 2.16815185546875, 2.235443115234375, 2.302734375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 1.0, 5.0, 1.0, 2.0, 3.0, 8.0, 8.0, 13.0, 21.0, 30.0, 35.0, 62.0, 88.0, 158.0, 231.0, 299.0, 512.0, 887.0, 1592.0, 2902.0, 6089.0, 14245.0, 39820.0, 155853.0, 584801.0, 170472.0, 42228.0, 14914.0, 6346.0, 2965.0, 1606.0, 863.0, 530.0, 329.0, 211.0, 129.0, 92.0, 62.0, 54.0, 31.0, 20.0, 9.0, 14.0, 7.0, 5.0, 6.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0305328369140625, -0.029462575912475586, -0.028392314910888672, -0.027322053909301758, -0.026251792907714844, -0.02518153190612793, -0.024111270904541016, -0.0230410099029541, -0.021970748901367188, -0.020900487899780273, -0.01983022689819336, -0.018759965896606445, -0.01768970489501953, -0.016619443893432617, -0.015549182891845703, -0.014478921890258789, -0.013408660888671875, -0.012338399887084961, -0.011268138885498047, -0.010197877883911133, -0.009127616882324219, -0.008057355880737305, -0.006987094879150391, -0.0059168338775634766, -0.0048465728759765625, -0.0037763118743896484, -0.0027060508728027344, -0.0016357898712158203, -0.0005655288696289062, 0.0005047321319580078, 0.0015749931335449219, 0.002645254135131836, 0.00371551513671875, 0.004785776138305664, 0.005856037139892578, 0.006926298141479492, 0.007996559143066406, 0.00906682014465332, 0.010137081146240234, 0.011207342147827148, 0.012277603149414062, 0.013347864151000977, 0.01441812515258789, 0.015488386154174805, 0.01655864715576172, 0.017628908157348633, 0.018699169158935547, 0.01976943016052246, 0.020839691162109375, 0.02190995216369629, 0.022980213165283203, 0.024050474166870117, 0.02512073516845703, 0.026190996170043945, 0.02726125717163086, 0.028331518173217773, 0.029401779174804688, 0.0304720401763916, 0.031542301177978516, 0.03261256217956543, 0.033682823181152344, 0.03475308418273926, 0.03582334518432617, 0.036893606185913086, 0.0379638671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 3.0, 5.0, 11.0, 7.0, 12.0, 12.0, 17.0, 21.0, 21.0, 32.0, 42.0, 49.0, 73.0, 97.0, 114.0, 106.0, 96.0, 60.0, 54.0, 41.0, 30.0, 23.0, 19.0, 13.0, 7.0, 15.0, 9.0, 3.0, 1.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.125999450683594e-05, -4.959758371114731e-05, -4.793517291545868e-05, -4.627276211977005e-05, -4.461035132408142e-05, -4.294794052839279e-05, -4.128552973270416e-05, -3.9623118937015533e-05, -3.7960708141326904e-05, -3.6298297345638275e-05, -3.4635886549949646e-05, -3.297347575426102e-05, -3.131106495857239e-05, -2.964865416288376e-05, -2.798624336719513e-05, -2.63238325715065e-05, -2.466142177581787e-05, -2.2999010980129242e-05, -2.1336600184440613e-05, -1.9674189388751984e-05, -1.8011778593063354e-05, -1.6349367797374725e-05, -1.4686957001686096e-05, -1.3024546205997467e-05, -1.1362135410308838e-05, -9.699724614620209e-06, -8.03731381893158e-06, -6.3749030232429504e-06, -4.712492227554321e-06, -3.050081431865692e-06, -1.387670636177063e-06, 2.7474015951156616e-07, 1.9371509552001953e-06, 3.5995617508888245e-06, 5.261972546577454e-06, 6.924383342266083e-06, 8.586794137954712e-06, 1.0249204933643341e-05, 1.191161572933197e-05, 1.35740265250206e-05, 1.5236437320709229e-05, 1.6898848116397858e-05, 1.8561258912086487e-05, 2.0223669707775116e-05, 2.1886080503463745e-05, 2.3548491299152374e-05, 2.5210902094841003e-05, 2.6873312890529633e-05, 2.8535723686218262e-05, 3.019813448190689e-05, 3.186054527759552e-05, 3.352295607328415e-05, 3.518536686897278e-05, 3.684777766466141e-05, 3.851018846035004e-05, 4.0172599256038666e-05, 4.1835010051727295e-05, 4.3497420847415924e-05, 4.515983164310455e-05, 4.682224243879318e-05, 4.848465323448181e-05, 5.014706403017044e-05, 5.180947482585907e-05, 5.34718856215477e-05, 5.513429641723633e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 2.0, 7.0, 10.0, 11.0, 16.0, 23.0, 37.0, 76.0, 184.0, 553.0, 2167.0, 14458.0, 304614.0, 697621.0, 24327.0, 3186.0, 743.0, 263.0, 99.0, 65.0, 30.0, 19.0, 11.0, 12.0, 6.0, 3.0, 6.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09490966796875, -0.09204292297363281, -0.08917617797851562, -0.08630943298339844, -0.08344268798828125, -0.08057594299316406, -0.07770919799804688, -0.07484245300292969, -0.0719757080078125, -0.06910896301269531, -0.06624221801757812, -0.06337547302246094, -0.06050872802734375, -0.05764198303222656, -0.054775238037109375, -0.05190849304199219, -0.049041748046875, -0.04617500305175781, -0.043308258056640625, -0.04044151306152344, -0.03757476806640625, -0.03470802307128906, -0.031841278076171875, -0.028974533081054688, -0.0261077880859375, -0.023241043090820312, -0.020374298095703125, -0.017507553100585938, -0.01464080810546875, -0.011774063110351562, -0.008907318115234375, -0.0060405731201171875, -0.003173828125, -0.0003070831298828125, 0.002559661865234375, 0.0054264068603515625, 0.00829315185546875, 0.011159896850585938, 0.014026641845703125, 0.016893386840820312, 0.0197601318359375, 0.022626876831054688, 0.025493621826171875, 0.028360366821289062, 0.03122711181640625, 0.03409385681152344, 0.036960601806640625, 0.03982734680175781, 0.042694091796875, 0.04556083679199219, 0.048427581787109375, 0.05129432678222656, 0.05416107177734375, 0.05702781677246094, 0.059894561767578125, 0.06276130676269531, 0.0656280517578125, 0.06849479675292969, 0.07136154174804688, 0.07422828674316406, 0.07709503173828125, 0.07996177673339844, 0.08282852172851562, 0.08569526672363281, 0.08856201171875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 10.0, 13.0, 22.0, 22.0, 27.0, 36.0, 27.0, 62.0, 92.0, 117.0, 164.0, 121.0, 74.0, 51.0, 34.0, 22.0, 17.0, 14.0, 14.0, 8.0, 9.0, 6.0, 7.0, 4.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01161956787109375, -0.011195778846740723, -0.010771989822387695, -0.010348200798034668, -0.00992441177368164, -0.009500622749328613, -0.009076833724975586, -0.008653044700622559, -0.008229255676269531, -0.007805466651916504, -0.0073816776275634766, -0.006957888603210449, -0.006534099578857422, -0.0061103105545043945, -0.005686521530151367, -0.00526273250579834, -0.0048389434814453125, -0.004415154457092285, -0.003991365432739258, -0.0035675764083862305, -0.003143787384033203, -0.0027199983596801758, -0.0022962093353271484, -0.001872420310974121, -0.0014486312866210938, -0.0010248422622680664, -0.0006010532379150391, -0.00017726421356201172, 0.0002465248107910156, 0.000670313835144043, 0.0010941028594970703, 0.0015178918838500977, 0.001941680908203125, 0.0023654699325561523, 0.0027892589569091797, 0.003213047981262207, 0.0036368370056152344, 0.004060626029968262, 0.004484415054321289, 0.004908204078674316, 0.005331993103027344, 0.005755782127380371, 0.0061795711517333984, 0.006603360176086426, 0.007027149200439453, 0.0074509382247924805, 0.007874727249145508, 0.008298516273498535, 0.008722305297851562, 0.00914609432220459, 0.009569883346557617, 0.009993672370910645, 0.010417461395263672, 0.0108412504196167, 0.011265039443969727, 0.011688828468322754, 0.012112617492675781, 0.012536406517028809, 0.012960195541381836, 0.013383984565734863, 0.01380777359008789, 0.014231562614440918, 0.014655351638793945, 0.015079140663146973, 0.0155029296875]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 15.0, 15.0, 30.0, 46.0, 100.0, 197.0, 230.0, 179.0, 86.0, 43.0, 23.0, 11.0, 10.0, 8.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9247541427612305, -2.8138818740844727, -2.7030093669891357, -2.592136859893799, -2.481264591217041, -2.370392322540283, -2.2595198154449463, -2.1486473083496094, -2.0377750396728516, -1.9269026517868042, -1.8160302639007568, -1.7051578760147095, -1.594285488128662, -1.4834131002426147, -1.3725407123565674, -1.26166832447052, -1.1507959365844727, -1.0399235486984253, -0.9290511608123779, -0.8181787729263306, -0.7073063850402832, -0.5964339971542358, -0.4855616092681885, -0.3746892213821411, -0.26381683349609375, -0.1529444456100464, -0.04207205772399902, 0.06880033016204834, 0.1796727180480957, 0.29054510593414307, 0.40141749382019043, 0.5122898817062378, 0.6231622695922852, 0.7340346574783325, 0.8449070453643799, 0.9557794332504272, 1.0666518211364746, 1.177524209022522, 1.2883965969085693, 1.3992689847946167, 1.510141372680664, 1.6210137605667114, 1.7318861484527588, 1.8427585363388062, 1.9536309242248535, 2.0645031929016113, 2.1753756999969482, 2.286248207092285, 2.397120475769043, 2.507992744445801, 2.6188652515411377, 2.7297377586364746, 2.8406100273132324, 2.9514822959899902, 3.062354803085327, 3.173227310180664, 3.284099578857422, 3.3949718475341797, 3.5058443546295166, 3.6167168617248535, 3.7275891304016113, 3.838461399078369, 3.949333906173706, 4.060206413269043, 4.171078681945801]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 7.0, 14.0, 18.0, 18.0, 30.0, 50.0, 54.0, 75.0, 86.0, 111.0, 109.0, 78.0, 94.0, 74.0, 47.0, 37.0, 29.0, 25.0, 16.0, 9.0, 7.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2683541774749756, -2.200474500656128, -2.1325950622558594, -2.0647153854370117, -1.996835708618164, -1.928956151008606, -1.8610765933990479, -1.7931969165802002, -1.7253172397613525, -1.6574376821517944, -1.5895580053329468, -1.5216784477233887, -1.453798770904541, -1.385919213294983, -1.3180396556854248, -1.2501599788665771, -1.182280421257019, -1.114400863647461, -1.0465211868286133, -0.9786416292190552, -0.9107619524002075, -0.8428823947906494, -0.7750027775764465, -0.7071231603622437, -0.6392435431480408, -0.5713639259338379, -0.503484308719635, -0.4356047213077545, -0.36772510409355164, -0.29984548687934875, -0.23196589946746826, -0.16408628225326538, -0.0962066650390625, -0.028327055275440216, 0.03955255448818207, 0.10743215680122375, 0.17531177401542664, 0.24319139122962952, 0.31107097864151, 0.3789505958557129, 0.44683021306991577, 0.5147098302841187, 0.5825894474983215, 0.6504690647125244, 0.7183486223220825, 0.7862282991409302, 0.8541078567504883, 0.9219874739646912, 0.989867091178894, 1.0577466487884521, 1.1256263256072998, 1.193505883216858, 1.2613855600357056, 1.3292651176452637, 1.3971447944641113, 1.4650243520736694, 1.5329039096832275, 1.6007834672927856, 1.6686631441116333, 1.7365427017211914, 1.804422378540039, 1.8723019361495972, 1.9401814937591553, 2.008061170578003, 2.0759408473968506]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 8.0, 7.0, 6.0, 10.0, 14.0, 19.0, 37.0, 54.0, 115.0, 271.0, 894.0, 3994.0, 36760.0, 948236.0, 51522.0, 4983.0, 1055.0, 296.0, 97.0, 53.0, 31.0, 18.0, 21.0, 11.0, 5.0, 10.0, 7.0, 6.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.015625, -3.8994140625, -3.783203125, -3.6669921875, -3.55078125, -3.4345703125, -3.318359375, -3.2021484375, -3.0859375, -2.9697265625, -2.853515625, -2.7373046875, -2.62109375, -2.5048828125, -2.388671875, -2.2724609375, -2.15625, -2.0400390625, -1.923828125, -1.8076171875, -1.69140625, -1.5751953125, -1.458984375, -1.3427734375, -1.2265625, -1.1103515625, -0.994140625, -0.8779296875, -0.76171875, -0.6455078125, -0.529296875, -0.4130859375, -0.296875, -0.1806640625, -0.064453125, 0.0517578125, 0.16796875, 0.2841796875, 0.400390625, 0.5166015625, 0.6328125, 0.7490234375, 0.865234375, 0.9814453125, 1.09765625, 1.2138671875, 1.330078125, 1.4462890625, 1.5625, 1.6787109375, 1.794921875, 1.9111328125, 2.02734375, 2.1435546875, 2.259765625, 2.3759765625, 2.4921875, 2.6083984375, 2.724609375, 2.8408203125, 2.95703125, 3.0732421875, 3.189453125, 3.3056640625, 3.421875]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 8.0, 12.0, 9.0, 25.0, 41.0, 65.0, 88.0, 97.0, 136.0, 123.0, 108.0, 93.0, 64.0, 49.0, 27.0, 20.0, 18.0, 13.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.58984375, -7.409698486328125, -7.22955322265625, -7.049407958984375, -6.8692626953125, -6.689117431640625, -6.50897216796875, -6.328826904296875, -6.148681640625, -5.968536376953125, -5.78839111328125, -5.608245849609375, -5.4281005859375, -5.247955322265625, -5.06781005859375, -4.887664794921875, -4.70751953125, -4.527374267578125, -4.34722900390625, -4.167083740234375, -3.9869384765625, -3.806793212890625, -3.62664794921875, -3.446502685546875, -3.266357421875, -3.086212158203125, -2.90606689453125, -2.725921630859375, -2.5457763671875, -2.365631103515625, -2.18548583984375, -2.005340576171875, -1.8251953125, -1.645050048828125, -1.46490478515625, -1.284759521484375, -1.1046142578125, -0.924468994140625, -0.74432373046875, -0.564178466796875, -0.384033203125, -0.203887939453125, -0.02374267578125, 0.156402587890625, 0.3365478515625, 0.516693115234375, 0.69683837890625, 0.876983642578125, 1.05712890625, 1.237274169921875, 1.41741943359375, 1.597564697265625, 1.7777099609375, 1.957855224609375, 2.13800048828125, 2.318145751953125, 2.498291015625, 2.678436279296875, 2.85858154296875, 3.038726806640625, 3.2188720703125, 3.399017333984375, 3.57916259765625, 3.759307861328125, 3.939453125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 10.0, 3.0, 3.0, 9.0, 11.0, 22.0, 19.0, 22.0, 19.0, 40.0, 41.0, 83.0, 92.0, 169.0, 360.0, 1033.0, 4380.0, 38717.0, 934573.0, 61253.0, 5502.0, 1156.0, 410.0, 208.0, 113.0, 76.0, 49.0, 36.0, 33.0, 27.0, 18.0, 14.0, 12.0, 10.0, 8.0, 3.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.837890625, -2.75335693359375, -2.6688232421875, -2.58428955078125, -2.499755859375, -2.41522216796875, -2.3306884765625, -2.24615478515625, -2.16162109375, -2.07708740234375, -1.9925537109375, -1.90802001953125, -1.823486328125, -1.73895263671875, -1.6544189453125, -1.56988525390625, -1.4853515625, -1.40081787109375, -1.3162841796875, -1.23175048828125, -1.147216796875, -1.06268310546875, -0.9781494140625, -0.89361572265625, -0.80908203125, -0.72454833984375, -0.6400146484375, -0.55548095703125, -0.470947265625, -0.38641357421875, -0.3018798828125, -0.21734619140625, -0.1328125, -0.04827880859375, 0.0362548828125, 0.12078857421875, 0.205322265625, 0.28985595703125, 0.3743896484375, 0.45892333984375, 0.54345703125, 0.62799072265625, 0.7125244140625, 0.79705810546875, 0.881591796875, 0.96612548828125, 1.0506591796875, 1.13519287109375, 1.2197265625, 1.30426025390625, 1.3887939453125, 1.47332763671875, 1.557861328125, 1.64239501953125, 1.7269287109375, 1.81146240234375, 1.89599609375, 1.98052978515625, 2.0650634765625, 2.14959716796875, 2.234130859375, 2.31866455078125, 2.4031982421875, 2.48773193359375, 2.572265625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 6.0, 2.0, 3.0, 7.0, 10.0, 17.0, 15.0, 12.0, 15.0, 19.0, 25.0, 37.0, 41.0, 39.0, 51.0, 60.0, 61.0, 52.0, 66.0, 72.0, 44.0, 60.0, 43.0, 39.0, 45.0, 31.0, 29.0, 22.0, 15.0, 22.0, 17.0, 8.0, 5.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.92578125, -3.817138671875, -3.70849609375, -3.599853515625, -3.4912109375, -3.382568359375, -3.27392578125, -3.165283203125, -3.056640625, -2.947998046875, -2.83935546875, -2.730712890625, -2.6220703125, -2.513427734375, -2.40478515625, -2.296142578125, -2.1875, -2.078857421875, -1.97021484375, -1.861572265625, -1.7529296875, -1.644287109375, -1.53564453125, -1.427001953125, -1.318359375, -1.209716796875, -1.10107421875, -0.992431640625, -0.8837890625, -0.775146484375, -0.66650390625, -0.557861328125, -0.44921875, -0.340576171875, -0.23193359375, -0.123291015625, -0.0146484375, 0.093994140625, 0.20263671875, 0.311279296875, 0.419921875, 0.528564453125, 0.63720703125, 0.745849609375, 0.8544921875, 0.963134765625, 1.07177734375, 1.180419921875, 1.2890625, 1.397705078125, 1.50634765625, 1.614990234375, 1.7236328125, 1.832275390625, 1.94091796875, 2.049560546875, 2.158203125, 2.266845703125, 2.37548828125, 2.484130859375, 2.5927734375, 2.701416015625, 2.81005859375, 2.918701171875, 3.02734375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 6.0, 8.0, 12.0, 17.0, 18.0, 24.0, 38.0, 50.0, 89.0, 166.0, 270.0, 564.0, 993.0, 2138.0, 4607.0, 11438.0, 34653.0, 296507.0, 631562.0, 42006.0, 13283.0, 5186.0, 2330.0, 1155.0, 628.0, 323.0, 194.0, 91.0, 62.0, 37.0, 31.0, 18.0, 12.0, 8.0, 7.0, 7.0, 6.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.490234375, -0.474456787109375, -0.45867919921875, -0.442901611328125, -0.4271240234375, -0.411346435546875, -0.39556884765625, -0.379791259765625, -0.364013671875, -0.348236083984375, -0.33245849609375, -0.316680908203125, -0.3009033203125, -0.285125732421875, -0.26934814453125, -0.253570556640625, -0.23779296875, -0.222015380859375, -0.20623779296875, -0.190460205078125, -0.1746826171875, -0.158905029296875, -0.14312744140625, -0.127349853515625, -0.111572265625, -0.095794677734375, -0.08001708984375, -0.064239501953125, -0.0484619140625, -0.032684326171875, -0.01690673828125, -0.001129150390625, 0.0146484375, 0.030426025390625, 0.04620361328125, 0.061981201171875, 0.0777587890625, 0.093536376953125, 0.10931396484375, 0.125091552734375, 0.140869140625, 0.156646728515625, 0.17242431640625, 0.188201904296875, 0.2039794921875, 0.219757080078125, 0.23553466796875, 0.251312255859375, 0.26708984375, 0.282867431640625, 0.29864501953125, 0.314422607421875, 0.3302001953125, 0.345977783203125, 0.36175537109375, 0.377532958984375, 0.393310546875, 0.409088134765625, 0.42486572265625, 0.440643310546875, 0.4564208984375, 0.472198486328125, 0.48797607421875, 0.503753662109375, 0.51953125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 3.0, 6.0, 8.0, 6.0, 16.0, 14.0, 15.0, 27.0, 28.0, 60.0, 129.0, 212.0, 208.0, 82.0, 55.0, 33.0, 22.0, 13.0, 10.0, 4.0, 7.0, 7.0, 3.0, 7.0, 2.0, 4.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8041343688964844e-05, -4.5952387154102325e-05, -4.386343061923981e-05, -4.177447408437729e-05, -3.968551754951477e-05, -3.759656101465225e-05, -3.5507604479789734e-05, -3.3418647944927216e-05, -3.13296914100647e-05, -2.924073487520218e-05, -2.715177834033966e-05, -2.5062821805477142e-05, -2.2973865270614624e-05, -2.0884908735752106e-05, -1.8795952200889587e-05, -1.670699566602707e-05, -1.461803913116455e-05, -1.2529082596302032e-05, -1.0440126061439514e-05, -8.351169526576996e-06, -6.2622129917144775e-06, -4.173256456851959e-06, -2.084299921989441e-06, 4.6566128730773926e-09, 2.0936131477355957e-06, 4.182569682598114e-06, 6.271526217460632e-06, 8.36048275232315e-06, 1.0449439287185669e-05, 1.2538395822048187e-05, 1.4627352356910706e-05, 1.6716308891773224e-05, 1.8805265426635742e-05, 2.089422196149826e-05, 2.298317849636078e-05, 2.5072135031223297e-05, 2.7161091566085815e-05, 2.9250048100948334e-05, 3.133900463581085e-05, 3.342796117067337e-05, 3.551691770553589e-05, 3.760587424039841e-05, 3.9694830775260925e-05, 4.1783787310123444e-05, 4.387274384498596e-05, 4.596170037984848e-05, 4.8050656914711e-05, 5.013961344957352e-05, 5.2228569984436035e-05, 5.4317526519298553e-05, 5.640648305416107e-05, 5.849543958902359e-05, 6.058439612388611e-05, 6.267335265874863e-05, 6.476230919361115e-05, 6.685126572847366e-05, 6.894022226333618e-05, 7.10291787981987e-05, 7.311813533306122e-05, 7.520709186792374e-05, 7.729604840278625e-05, 7.938500493764877e-05, 8.147396147251129e-05, 8.356291800737381e-05, 8.565187454223633e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 6.0, 7.0, 10.0, 16.0, 13.0, 26.0, 48.0, 76.0, 138.0, 223.0, 487.0, 933.0, 2078.0, 5925.0, 18733.0, 93120.0, 830725.0, 71545.0, 15770.0, 4899.0, 2004.0, 857.0, 385.0, 210.0, 106.0, 73.0, 47.0, 33.0, 18.0, 11.0, 10.0, 6.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.603515625, -0.5836868286132812, -0.5638580322265625, -0.5440292358398438, -0.524200439453125, -0.5043716430664062, -0.4845428466796875, -0.46471405029296875, -0.44488525390625, -0.42505645751953125, -0.4052276611328125, -0.38539886474609375, -0.365570068359375, -0.34574127197265625, -0.3259124755859375, -0.30608367919921875, -0.2862548828125, -0.26642608642578125, -0.2465972900390625, -0.22676849365234375, -0.206939697265625, -0.18711090087890625, -0.1672821044921875, -0.14745330810546875, -0.12762451171875, -0.10779571533203125, -0.0879669189453125, -0.06813812255859375, -0.048309326171875, -0.02848052978515625, -0.0086517333984375, 0.01117706298828125, 0.031005859375, 0.05083465576171875, 0.0706634521484375, 0.09049224853515625, 0.110321044921875, 0.13014984130859375, 0.1499786376953125, 0.16980743408203125, 0.18963623046875, 0.20946502685546875, 0.2292938232421875, 0.24912261962890625, 0.268951416015625, 0.28878021240234375, 0.3086090087890625, 0.32843780517578125, 0.3482666015625, 0.36809539794921875, 0.3879241943359375, 0.40775299072265625, 0.427581787109375, 0.44741058349609375, 0.4672393798828125, 0.48706817626953125, 0.50689697265625, 0.5267257690429688, 0.5465545654296875, 0.5663833618164062, 0.586212158203125, 0.6060409545898438, 0.6258697509765625, 0.6456985473632812, 0.66552734375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 9.0, 4.0, 6.0, 7.0, 14.0, 14.0, 19.0, 33.0, 22.0, 38.0, 90.0, 353.0, 178.0, 55.0, 40.0, 29.0, 19.0, 16.0, 10.0, 11.0, 8.0, 3.0, 2.0, 5.0, 6.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30615234375, -0.2973365783691406, -0.28852081298828125, -0.2797050476074219, -0.2708892822265625, -0.2620735168457031, -0.25325775146484375, -0.24444198608398438, -0.235626220703125, -0.22681045532226562, -0.21799468994140625, -0.20917892456054688, -0.2003631591796875, -0.19154739379882812, -0.18273162841796875, -0.17391586303710938, -0.16510009765625, -0.15628433227539062, -0.14746856689453125, -0.13865280151367188, -0.1298370361328125, -0.12102127075195312, -0.11220550537109375, -0.10338973999023438, -0.094573974609375, -0.08575820922851562, -0.07694244384765625, -0.06812667846679688, -0.0593109130859375, -0.050495147705078125, -0.04167938232421875, -0.032863616943359375, -0.0240478515625, -0.015232086181640625, -0.00641632080078125, 0.002399444580078125, 0.0112152099609375, 0.020030975341796875, 0.02884674072265625, 0.037662506103515625, 0.046478271484375, 0.055294036865234375, 0.06410980224609375, 0.07292556762695312, 0.0817413330078125, 0.09055709838867188, 0.09937286376953125, 0.10818862915039062, 0.11700439453125, 0.12582015991210938, 0.13463592529296875, 0.14345169067382812, 0.1522674560546875, 0.16108322143554688, 0.16989898681640625, 0.17871475219726562, 0.187530517578125, 0.19634628295898438, 0.20516204833984375, 0.21397781372070312, 0.2227935791015625, 0.23160934448242188, 0.24042510986328125, 0.24924087524414062, 0.258056640625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 9.0, 42.0, 179.0, 456.0, 238.0, 55.0, 16.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.137155532836914, -9.645425796508789, -9.15369701385498, -8.661967277526855, -8.170238494873047, -7.678508758544922, -7.186779499053955, -6.695050239562988, -6.2033209800720215, -5.711591720581055, -5.219862461090088, -4.728133201599121, -4.236403465270996, -3.7446744441986084, -3.2529449462890625, -2.7612156867980957, -2.269486427307129, -1.777757167816162, -1.2860277891159058, -0.7942984104156494, -0.3025691509246826, 0.18916010856628418, 0.6808896064758301, 1.1726188659667969, 1.6643481254577637, 2.1560773849487305, 2.6478066444396973, 3.139536142349243, 3.63126540184021, 4.122994422912598, 4.614724159240723, 5.1064534187316895, 5.598182678222656, 6.089911937713623, 6.58164119720459, 7.073370933532715, 7.565099716186523, 8.056829452514648, 8.548559188842773, 9.040287971496582, 9.53201675415039, 10.023746490478516, 10.515475273132324, 11.00720500946045, 11.498933792114258, 11.990663528442383, 12.482393264770508, 12.974122047424316, 13.465851783752441, 13.957581520080566, 14.449310302734375, 14.9410400390625, 15.432768821716309, 15.924498558044434, 16.416227340698242, 16.907957077026367, 17.399686813354492, 17.891416549682617, 18.383146286010742, 18.874874114990234, 19.36660385131836, 19.858333587646484, 20.35006332397461, 20.841793060302734, 21.333520889282227]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 8.0, 6.0, 13.0, 12.0, 28.0, 20.0, 22.0, 26.0, 45.0, 39.0, 46.0, 51.0, 52.0, 62.0, 53.0, 60.0, 62.0, 62.0, 59.0, 47.0, 45.0, 44.0, 41.0, 25.0, 22.0, 12.0, 13.0, 12.0, 3.0, 6.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.681855201721191, -8.464140892028809, -8.246426582336426, -8.028712272644043, -7.81099796295166, -7.593283653259277, -7.3755693435668945, -7.157855033874512, -6.940140724182129, -6.722426414489746, -6.504712104797363, -6.2869977951049805, -6.069283485412598, -5.851569175720215, -5.633854866027832, -5.416140556335449, -5.198426246643066, -4.980711936950684, -4.762997627258301, -4.545283317565918, -4.327569007873535, -4.109854698181152, -3.8921403884887695, -3.6744260787963867, -3.456712245941162, -3.2389979362487793, -3.0212836265563965, -2.8035693168640137, -2.585855007171631, -2.368140697479248, -2.1504263877868652, -1.932712197303772, -1.7149977684020996, -1.4972834587097168, -1.279569149017334, -1.0618548393249512, -0.8441405892372131, -0.6264263391494751, -0.4087120294570923, -0.19099771976470947, 0.02671658992767334, 0.24443088471889496, 0.4621451795101166, 0.679859459400177, 0.8975737690925598, 1.1152880191802979, 1.3330023288726807, 1.5507166385650635, 1.7684309482574463, 1.986145257949829, 2.203859567642212, 2.4215738773345947, 2.6392881870269775, 2.8570022583007812, 3.074716567993164, 3.292430877685547, 3.5101451873779297, 3.7278594970703125, 3.9455738067626953, 4.163288116455078, 4.381002426147461, 4.598716735839844, 4.816431045532227, 5.034145355224609, 5.251859664916992]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 4.0, 5.0, 6.0, 10.0, 15.0, 12.0, 23.0, 29.0, 38.0, 58.0, 75.0, 113.0, 180.0, 259.0, 399.0, 725.0, 1143.0, 2092.0, 4272.0, 10528.0, 36317.0, 242963.0, 2403489.0, 1320690.0, 122558.0, 29136.0, 10508.0, 4292.0, 1813.0, 943.0, 537.0, 376.0, 235.0, 145.0, 89.0, 63.0, 56.0, 25.0, 16.0, 14.0, 11.0, 8.0, 7.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.37890625, -2.308624267578125, -2.23834228515625, -2.168060302734375, -2.0977783203125, -2.027496337890625, -1.95721435546875, -1.886932373046875, -1.816650390625, -1.746368408203125, -1.67608642578125, -1.605804443359375, -1.5355224609375, -1.465240478515625, -1.39495849609375, -1.324676513671875, -1.25439453125, -1.184112548828125, -1.11383056640625, -1.043548583984375, -0.9732666015625, -0.902984619140625, -0.83270263671875, -0.762420654296875, -0.692138671875, -0.621856689453125, -0.55157470703125, -0.481292724609375, -0.4110107421875, -0.340728759765625, -0.27044677734375, -0.200164794921875, -0.1298828125, -0.059600830078125, 0.01068115234375, 0.080963134765625, 0.1512451171875, 0.221527099609375, 0.29180908203125, 0.362091064453125, 0.432373046875, 0.502655029296875, 0.57293701171875, 0.643218994140625, 0.7135009765625, 0.783782958984375, 0.85406494140625, 0.924346923828125, 0.99462890625, 1.064910888671875, 1.13519287109375, 1.205474853515625, 1.2757568359375, 1.346038818359375, 1.41632080078125, 1.486602783203125, 1.556884765625, 1.627166748046875, 1.69744873046875, 1.767730712890625, 1.8380126953125, 1.908294677734375, 1.97857666015625, 2.048858642578125, 2.119140625]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 8.0, 8.0, 16.0, 10.0, 22.0, 38.0, 49.0, 53.0, 69.0, 70.0, 73.0, 99.0, 96.0, 64.0, 76.0, 54.0, 51.0, 27.0, 22.0, 22.0, 29.0, 12.0, 5.0, 8.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.59765625, -2.5268096923828125, -2.455963134765625, -2.3851165771484375, -2.31427001953125, -2.2434234619140625, -2.172576904296875, -2.1017303466796875, -2.0308837890625, -1.9600372314453125, -1.889190673828125, -1.8183441162109375, -1.74749755859375, -1.6766510009765625, -1.605804443359375, -1.5349578857421875, -1.464111328125, -1.3932647705078125, -1.322418212890625, -1.2515716552734375, -1.18072509765625, -1.1098785400390625, -1.039031982421875, -0.9681854248046875, -0.8973388671875, -0.8264923095703125, -0.755645751953125, -0.6847991943359375, -0.61395263671875, -0.5431060791015625, -0.472259521484375, -0.4014129638671875, -0.33056640625, -0.2597198486328125, -0.188873291015625, -0.1180267333984375, -0.04718017578125, 0.0236663818359375, 0.094512939453125, 0.1653594970703125, 0.2362060546875, 0.3070526123046875, 0.377899169921875, 0.4487457275390625, 0.51959228515625, 0.5904388427734375, 0.661285400390625, 0.7321319580078125, 0.802978515625, 0.8738250732421875, 0.944671630859375, 1.0155181884765625, 1.08636474609375, 1.1572113037109375, 1.228057861328125, 1.2989044189453125, 1.3697509765625, 1.4405975341796875, 1.511444091796875, 1.5822906494140625, 1.65313720703125, 1.7239837646484375, 1.794830322265625, 1.8656768798828125, 1.9365234375]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 3.0, 5.0, 2.0, 10.0, 9.0, 18.0, 18.0, 33.0, 52.0, 89.0, 136.0, 275.0, 581.0, 1501.0, 4784.0, 20878.0, 249126.0, 3799950.0, 98518.0, 13059.0, 3263.0, 1039.0, 423.0, 202.0, 120.0, 61.0, 44.0, 28.0, 13.0, 10.0, 12.0, 5.0, 6.0, 5.0, 2.0, 3.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.958984375, -3.85009765625, -3.7412109375, -3.63232421875, -3.5234375, -3.41455078125, -3.3056640625, -3.19677734375, -3.087890625, -2.97900390625, -2.8701171875, -2.76123046875, -2.65234375, -2.54345703125, -2.4345703125, -2.32568359375, -2.216796875, -2.10791015625, -1.9990234375, -1.89013671875, -1.78125, -1.67236328125, -1.5634765625, -1.45458984375, -1.345703125, -1.23681640625, -1.1279296875, -1.01904296875, -0.91015625, -0.80126953125, -0.6923828125, -0.58349609375, -0.474609375, -0.36572265625, -0.2568359375, -0.14794921875, -0.0390625, 0.06982421875, 0.1787109375, 0.28759765625, 0.396484375, 0.50537109375, 0.6142578125, 0.72314453125, 0.83203125, 0.94091796875, 1.0498046875, 1.15869140625, 1.267578125, 1.37646484375, 1.4853515625, 1.59423828125, 1.703125, 1.81201171875, 1.9208984375, 2.02978515625, 2.138671875, 2.24755859375, 2.3564453125, 2.46533203125, 2.57421875, 2.68310546875, 2.7919921875, 2.90087890625, 3.009765625]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 9.0, 8.0, 6.0, 11.0, 15.0, 22.0, 27.0, 42.0, 77.0, 100.0, 241.0, 602.0, 1034.0, 952.0, 430.0, 192.0, 107.0, 52.0, 53.0, 20.0, 15.0, 13.0, 12.0, 9.0, 6.0, 6.0, 3.0, 7.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.701171875, -0.672943115234375, -0.64471435546875, -0.616485595703125, -0.5882568359375, -0.560028076171875, -0.53179931640625, -0.503570556640625, -0.475341796875, -0.447113037109375, -0.41888427734375, -0.390655517578125, -0.3624267578125, -0.334197998046875, -0.30596923828125, -0.277740478515625, -0.24951171875, -0.221282958984375, -0.19305419921875, -0.164825439453125, -0.1365966796875, -0.108367919921875, -0.08013916015625, -0.051910400390625, -0.023681640625, 0.004547119140625, 0.03277587890625, 0.061004638671875, 0.0892333984375, 0.117462158203125, 0.14569091796875, 0.173919677734375, 0.2021484375, 0.230377197265625, 0.25860595703125, 0.286834716796875, 0.3150634765625, 0.343292236328125, 0.37152099609375, 0.399749755859375, 0.427978515625, 0.456207275390625, 0.48443603515625, 0.512664794921875, 0.5408935546875, 0.569122314453125, 0.59735107421875, 0.625579833984375, 0.65380859375, 0.682037353515625, 0.71026611328125, 0.738494873046875, 0.7667236328125, 0.794952392578125, 0.82318115234375, 0.851409912109375, 0.879638671875, 0.907867431640625, 0.93609619140625, 0.964324951171875, 0.9925537109375, 1.020782470703125, 1.04901123046875, 1.077239990234375, 1.10546875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 4.0, 7.0, 9.0, 12.0, 28.0, 35.0, 68.0, 91.0, 110.0, 141.0, 129.0, 115.0, 81.0, 44.0, 42.0, 23.0, 17.0, 15.0, 8.0, 9.0, 2.0, 1.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.388582706451416, -4.2811970710754395, -4.173811912536621, -4.0664262771606445, -3.959040880203247, -3.8516554832458496, -3.744269847869873, -3.6368844509124756, -3.529499053955078, -3.4221136569976807, -3.314728021621704, -3.2073426246643066, -3.099957227706909, -2.9925718307495117, -2.885186195373535, -2.7778007984161377, -2.670415163040161, -2.5630297660827637, -2.455644130706787, -2.3482587337493896, -2.240873336791992, -2.1334877014160156, -2.026102304458618, -1.9187169075012207, -1.8113313913345337, -1.7039458751678467, -1.5965604782104492, -1.4891749620437622, -1.3817894458770752, -1.2744040489196777, -1.1670185327529907, -1.0596330165863037, -0.9522476196289062, -0.844862163066864, -0.7374767065048218, -0.6300911903381348, -0.5227057337760925, -0.4153202772140503, -0.3079347610473633, -0.20054930448532104, -0.09316384792327881, 0.014221623539924622, 0.12160709500312805, 0.22899258136749268, 0.3363780379295349, 0.44376349449157715, 0.5511490106582642, 0.6585344672203064, 0.7659199237823486, 0.8733053803443909, 0.9806908369064331, 1.0880763530731201, 1.1954617500305176, 1.3028472661972046, 1.4102327823638916, 1.517618179321289, 1.625003695487976, 1.732389211654663, 1.8397746086120605, 1.9471601247787476, 2.0545456409454346, 2.161931037902832, 2.2693166732788086, 2.376702070236206, 2.4840874671936035]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 10.0, 11.0, 10.0, 14.0, 17.0, 18.0, 38.0, 39.0, 54.0, 76.0, 87.0, 88.0, 89.0, 87.0, 80.0, 66.0, 60.0, 33.0, 33.0, 27.0, 22.0, 8.0, 11.0, 7.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.731536626815796, -2.6452627182006836, -2.5589888095855713, -2.472714900970459, -2.3864407539367676, -2.3001668453216553, -2.213892936706543, -2.1276190280914307, -2.0413451194763184, -1.955071210861206, -1.8687971830368042, -1.782523274421692, -1.6962493658065796, -1.6099753379821777, -1.5237014293670654, -1.4374275207519531, -1.3511534929275513, -1.264879584312439, -1.178605556488037, -1.0923316478729248, -1.0060577392578125, -0.9197837710380554, -0.8335098028182983, -0.747235894203186, -0.660961925983429, -0.5746879577636719, -0.48841404914855957, -0.4021400809288025, -0.3158661425113678, -0.2295922040939331, -0.14331823587417603, -0.05704432725906372, 0.02922964096069336, 0.11550358682870865, 0.20177753269672394, 0.2880514860153198, 0.3743254244327545, 0.4605993628501892, 0.5468733310699463, 0.6331472396850586, 0.7194212079048157, 0.8056951761245728, 0.8919690847396851, 0.9782430529594421, 1.0645170211791992, 1.1507909297943115, 1.2370648384094238, 1.3233387470245361, 1.409612774848938, 1.4958866834640503, 1.5821607112884521, 1.6684346199035645, 1.7547085285186768, 1.840982437133789, 1.927256464958191, 2.0135302543640137, 2.099804401397705, 2.1860783100128174, 2.2723522186279297, 2.358626365661621, 2.4449002742767334, 2.5311741828918457, 2.617448091506958, 2.7037220001220703, 2.7899959087371826]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 7.0, 16.0, 25.0, 36.0, 48.0, 73.0, 115.0, 245.0, 387.0, 733.0, 1667.0, 3915.0, 12681.0, 58933.0, 445363.0, 445331.0, 58739.0, 12896.0, 4032.0, 1623.0, 718.0, 376.0, 221.0, 134.0, 85.0, 50.0, 32.0, 21.0, 11.0, 13.0, 5.0, 4.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.369384765625, -0.3585205078125, -0.34765625, -0.3367919921875, -0.325927734375, -0.3150634765625, -0.30419921875, -0.2933349609375, -0.282470703125, -0.2716064453125, -0.2607421875, -0.2498779296875, -0.239013671875, -0.2281494140625, -0.21728515625, -0.2064208984375, -0.195556640625, -0.1846923828125, -0.173828125, -0.1629638671875, -0.152099609375, -0.1412353515625, -0.13037109375, -0.1195068359375, -0.108642578125, -0.0977783203125, -0.0869140625, -0.0760498046875, -0.065185546875, -0.0543212890625, -0.04345703125, -0.0325927734375, -0.021728515625, -0.0108642578125, 0.0, 0.0108642578125, 0.021728515625, 0.0325927734375, 0.04345703125, 0.0543212890625, 0.065185546875, 0.0760498046875, 0.0869140625, 0.0977783203125, 0.108642578125, 0.1195068359375, 0.13037109375, 0.1412353515625, 0.152099609375, 0.1629638671875, 0.173828125, 0.1846923828125, 0.195556640625, 0.2064208984375, 0.21728515625, 0.2281494140625, 0.239013671875, 0.2498779296875, 0.2607421875, 0.2716064453125, 0.282470703125, 0.2933349609375, 0.30419921875, 0.3150634765625, 0.325927734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 5.0, 1.0, 7.0, 8.0, 15.0, 18.0, 14.0, 25.0, 38.0, 52.0, 69.0, 99.0, 108.0, 101.0, 94.0, 110.0, 64.0, 40.0, 45.0, 26.0, 21.0, 11.0, 11.0, 6.0, 8.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.701171875, -1.638946533203125, -1.57672119140625, -1.514495849609375, -1.4522705078125, -1.390045166015625, -1.32781982421875, -1.265594482421875, -1.203369140625, -1.141143798828125, -1.07891845703125, -1.016693115234375, -0.9544677734375, -0.892242431640625, -0.83001708984375, -0.767791748046875, -0.70556640625, -0.643341064453125, -0.58111572265625, -0.518890380859375, -0.4566650390625, -0.394439697265625, -0.33221435546875, -0.269989013671875, -0.207763671875, -0.145538330078125, -0.08331298828125, -0.021087646484375, 0.0411376953125, 0.103363037109375, 0.16558837890625, 0.227813720703125, 0.2900390625, 0.352264404296875, 0.41448974609375, 0.476715087890625, 0.5389404296875, 0.601165771484375, 0.66339111328125, 0.725616455078125, 0.787841796875, 0.850067138671875, 0.91229248046875, 0.974517822265625, 1.0367431640625, 1.098968505859375, 1.16119384765625, 1.223419189453125, 1.28564453125, 1.347869873046875, 1.41009521484375, 1.472320556640625, 1.5345458984375, 1.596771240234375, 1.65899658203125, 1.721221923828125, 1.783447265625, 1.845672607421875, 1.90789794921875, 1.970123291015625, 2.0323486328125, 2.094573974609375, 2.15679931640625, 2.219024658203125, 2.28125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 8.0, 4.0, 9.0, 5.0, 16.0, 18.0, 24.0, 43.0, 46.0, 87.0, 128.0, 262.0, 345.0, 571.0, 991.0, 1660.0, 2824.0, 5020.0, 9205.0, 17130.0, 32903.0, 66639.0, 137536.0, 255913.0, 250374.0, 133272.0, 64781.0, 31861.0, 16581.0, 8732.0, 4803.0, 2702.0, 1624.0, 909.0, 554.0, 338.0, 234.0, 143.0, 86.0, 53.0, 34.0, 28.0, 17.0, 15.0, 10.0, 5.0, 5.0, 3.0, 5.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0928955078125, -0.08979606628417969, -0.08669662475585938, -0.08359718322753906, -0.08049774169921875, -0.07739830017089844, -0.07429885864257812, -0.07119941711425781, -0.0680999755859375, -0.06500053405761719, -0.061901092529296875, -0.05880165100097656, -0.05570220947265625, -0.05260276794433594, -0.049503326416015625, -0.04640388488769531, -0.043304443359375, -0.04020500183105469, -0.037105560302734375, -0.03400611877441406, -0.03090667724609375, -0.027807235717773438, -0.024707794189453125, -0.021608352661132812, -0.0185089111328125, -0.015409469604492188, -0.012310028076171875, -0.009210586547851562, -0.00611114501953125, -0.0030117034912109375, 8.7738037109375e-05, 0.0031871795654296875, 0.00628662109375, 0.009386062622070312, 0.012485504150390625, 0.015584945678710938, 0.01868438720703125, 0.021783828735351562, 0.024883270263671875, 0.027982711791992188, 0.0310821533203125, 0.03418159484863281, 0.037281036376953125, 0.04038047790527344, 0.04347991943359375, 0.04657936096191406, 0.049678802490234375, 0.05277824401855469, 0.055877685546875, 0.05897712707519531, 0.062076568603515625, 0.06517601013183594, 0.06827545166015625, 0.07137489318847656, 0.07447433471679688, 0.07757377624511719, 0.0806732177734375, 0.08377265930175781, 0.08687210083007812, 0.08997154235839844, 0.09307098388671875, 0.09617042541503906, 0.09926986694335938, 0.10236930847167969, 0.10546875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 6.0, 4.0, 7.0, 7.0, 9.0, 7.0, 15.0, 13.0, 20.0, 23.0, 26.0, 17.0, 31.0, 38.0, 42.0, 36.0, 30.0, 43.0, 53.0, 42.0, 46.0, 40.0, 57.0, 46.0, 43.0, 50.0, 34.0, 33.0, 27.0, 31.0, 22.0, 21.0, 9.0, 16.0, 12.0, 4.0, 7.0, 12.0, 5.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.8466796875, -1.787261962890625, -1.72784423828125, -1.668426513671875, -1.6090087890625, -1.549591064453125, -1.49017333984375, -1.430755615234375, -1.371337890625, -1.311920166015625, -1.25250244140625, -1.193084716796875, -1.1336669921875, -1.074249267578125, -1.01483154296875, -0.955413818359375, -0.89599609375, -0.836578369140625, -0.77716064453125, -0.717742919921875, -0.6583251953125, -0.598907470703125, -0.53948974609375, -0.480072021484375, -0.420654296875, -0.361236572265625, -0.30181884765625, -0.242401123046875, -0.1829833984375, -0.123565673828125, -0.06414794921875, -0.004730224609375, 0.0546875, 0.114105224609375, 0.17352294921875, 0.232940673828125, 0.2923583984375, 0.351776123046875, 0.41119384765625, 0.470611572265625, 0.530029296875, 0.589447021484375, 0.64886474609375, 0.708282470703125, 0.7677001953125, 0.827117919921875, 0.88653564453125, 0.945953369140625, 1.00537109375, 1.064788818359375, 1.12420654296875, 1.183624267578125, 1.2430419921875, 1.302459716796875, 1.36187744140625, 1.421295166015625, 1.480712890625, 1.540130615234375, 1.59954833984375, 1.658966064453125, 1.7183837890625, 1.777801513671875, 1.83721923828125, 1.896636962890625, 1.9560546875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 4.0, 10.0, 11.0, 17.0, 18.0, 28.0, 36.0, 54.0, 118.0, 175.0, 312.0, 539.0, 913.0, 1752.0, 3711.0, 9090.0, 27232.0, 122255.0, 648416.0, 178646.0, 35754.0, 10849.0, 4167.0, 2025.0, 996.0, 582.0, 311.0, 191.0, 126.0, 65.0, 53.0, 27.0, 26.0, 15.0, 11.0, 8.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.028228759765625, -0.027362823486328125, -0.02649688720703125, -0.025630950927734375, -0.0247650146484375, -0.023899078369140625, -0.02303314208984375, -0.022167205810546875, -0.02130126953125, -0.020435333251953125, -0.01956939697265625, -0.018703460693359375, -0.0178375244140625, -0.016971588134765625, -0.01610565185546875, -0.015239715576171875, -0.014373779296875, -0.013507843017578125, -0.01264190673828125, -0.011775970458984375, -0.0109100341796875, -0.010044097900390625, -0.00917816162109375, -0.008312225341796875, -0.0074462890625, -0.006580352783203125, -0.00571441650390625, -0.004848480224609375, -0.0039825439453125, -0.003116607666015625, -0.00225067138671875, -0.001384735107421875, -0.000518798828125, 0.000347137451171875, 0.00121307373046875, 0.002079010009765625, 0.0029449462890625, 0.003810882568359375, 0.00467681884765625, 0.005542755126953125, 0.00640869140625, 0.007274627685546875, 0.00814056396484375, 0.009006500244140625, 0.0098724365234375, 0.010738372802734375, 0.01160430908203125, 0.012470245361328125, 0.013336181640625, 0.014202117919921875, 0.01506805419921875, 0.015933990478515625, 0.0167999267578125, 0.017665863037109375, 0.01853179931640625, 0.019397735595703125, 0.020263671875, 0.021129608154296875, 0.02199554443359375, 0.022861480712890625, 0.0237274169921875, 0.024593353271484375, 0.02545928955078125, 0.026325225830078125, 0.027191162109375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 1.0, 4.0, 2.0, 1.0, 9.0, 15.0, 19.0, 15.0, 19.0, 38.0, 35.0, 36.0, 74.0, 105.0, 105.0, 135.0, 74.0, 95.0, 64.0, 47.0, 29.0, 24.0, 12.0, 13.0, 9.0, 7.0, 6.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0040740966796875e-05, -2.893339842557907e-05, -2.7826055884361267e-05, -2.6718713343143463e-05, -2.561137080192566e-05, -2.4504028260707855e-05, -2.339668571949005e-05, -2.2289343178272247e-05, -2.1182000637054443e-05, -2.007465809583664e-05, -1.8967315554618835e-05, -1.785997301340103e-05, -1.6752630472183228e-05, -1.5645287930965424e-05, -1.453794538974762e-05, -1.3430602848529816e-05, -1.2323260307312012e-05, -1.1215917766094208e-05, -1.0108575224876404e-05, -9.0012326836586e-06, -7.893890142440796e-06, -6.786547601222992e-06, -5.679205060005188e-06, -4.571862518787384e-06, -3.46451997756958e-06, -2.357177436351776e-06, -1.2498348951339722e-06, -1.424923539161682e-07, 9.648501873016357e-07, 2.0721927285194397e-06, 3.1795352697372437e-06, 4.286877810955048e-06, 5.3942203521728516e-06, 6.5015628933906555e-06, 7.6089054346084595e-06, 8.716247975826263e-06, 9.823590517044067e-06, 1.0930933058261871e-05, 1.2038275599479675e-05, 1.314561814069748e-05, 1.4252960681915283e-05, 1.5360303223133087e-05, 1.646764576435089e-05, 1.7574988305568695e-05, 1.86823308467865e-05, 1.9789673388004303e-05, 2.0897015929222107e-05, 2.200435847043991e-05, 2.3111701011657715e-05, 2.421904355287552e-05, 2.5326386094093323e-05, 2.6433728635311127e-05, 2.754107117652893e-05, 2.8648413717746735e-05, 2.975575625896454e-05, 3.086309880018234e-05, 3.1970441341400146e-05, 3.307778388261795e-05, 3.4185126423835754e-05, 3.529246896505356e-05, 3.639981150627136e-05, 3.7507154047489166e-05, 3.861449658870697e-05, 3.9721839129924774e-05, 4.082918167114258e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 6.0, 10.0, 14.0, 15.0, 20.0, 21.0, 45.0, 54.0, 78.0, 177.0, 342.0, 625.0, 1404.0, 3472.0, 10521.0, 46039.0, 448712.0, 472002.0, 47824.0, 10935.0, 3444.0, 1343.0, 638.0, 308.0, 192.0, 92.0, 48.0, 40.0, 39.0, 28.0, 17.0, 10.0, 5.0, 2.0, 7.0, 1.0, 5.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.04156494140625, -0.04034280776977539, -0.03912067413330078, -0.03789854049682617, -0.03667640686035156, -0.03545427322387695, -0.034232139587402344, -0.033010005950927734, -0.031787872314453125, -0.030565738677978516, -0.029343605041503906, -0.028121471405029297, -0.026899337768554688, -0.025677204132080078, -0.02445507049560547, -0.02323293685913086, -0.02201080322265625, -0.02078866958618164, -0.01956653594970703, -0.018344402313232422, -0.017122268676757812, -0.015900135040283203, -0.014678001403808594, -0.013455867767333984, -0.012233734130859375, -0.011011600494384766, -0.009789466857910156, -0.008567333221435547, -0.0073451995849609375, -0.006123065948486328, -0.004900932312011719, -0.0036787986755371094, -0.0024566650390625, -0.0012345314025878906, -1.239776611328125e-05, 0.0012097358703613281, 0.0024318695068359375, 0.003654003143310547, 0.004876136779785156, 0.006098270416259766, 0.007320404052734375, 0.008542537689208984, 0.009764671325683594, 0.010986804962158203, 0.012208938598632812, 0.013431072235107422, 0.014653205871582031, 0.01587533950805664, 0.01709747314453125, 0.01831960678100586, 0.01954174041748047, 0.020763874053955078, 0.021986007690429688, 0.023208141326904297, 0.024430274963378906, 0.025652408599853516, 0.026874542236328125, 0.028096675872802734, 0.029318809509277344, 0.030540943145751953, 0.03176307678222656, 0.03298521041870117, 0.03420734405517578, 0.03542947769165039, 0.036651611328125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 7.0, 5.0, 10.0, 7.0, 13.0, 18.0, 26.0, 27.0, 33.0, 38.0, 52.0, 59.0, 83.0, 104.0, 113.0, 83.0, 84.0, 41.0, 31.0, 44.0, 28.0, 18.0, 21.0, 12.0, 7.0, 8.0, 6.0, 5.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00807952880859375, -0.007809638977050781, -0.0075397491455078125, -0.007269859313964844, -0.006999969482421875, -0.006730079650878906, -0.0064601898193359375, -0.006190299987792969, -0.00592041015625, -0.005650520324707031, -0.0053806304931640625, -0.005110740661621094, -0.004840850830078125, -0.004570960998535156, -0.0043010711669921875, -0.004031181335449219, -0.00376129150390625, -0.0034914016723632812, -0.0032215118408203125, -0.0029516220092773438, -0.002681732177734375, -0.0024118423461914062, -0.0021419525146484375, -0.0018720626831054688, -0.0016021728515625, -0.0013322830200195312, -0.0010623931884765625, -0.0007925033569335938, -0.000522613525390625, -0.00025272369384765625, 1.71661376953125e-05, 0.00028705596923828125, 0.00055694580078125, 0.0008268356323242188, 0.0010967254638671875, 0.0013666152954101562, 0.001636505126953125, 0.0019063949584960938, 0.0021762847900390625, 0.0024461746215820312, 0.002716064453125, 0.0029859542846679688, 0.0032558441162109375, 0.0035257339477539062, 0.003795623779296875, 0.004065513610839844, 0.0043354034423828125, 0.004605293273925781, 0.00487518310546875, 0.005145072937011719, 0.0054149627685546875, 0.005684852600097656, 0.005954742431640625, 0.006224632263183594, 0.0064945220947265625, 0.006764411926269531, 0.0070343017578125, 0.007304191589355469, 0.0075740814208984375, 0.007843971252441406, 0.008113861083984375, 0.008383750915527344, 0.008653640747070312, 0.008923530578613281, 0.00919342041015625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 11.0, 24.0, 58.0, 136.0, 245.0, 248.0, 122.0, 76.0, 35.0, 15.0, 7.0, 6.0, 3.0, 6.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.378666400909424, -3.266465425491333, -3.154264450073242, -3.0420632362365723, -2.9298622608184814, -2.8176612854003906, -2.7054600715637207, -2.59325909614563, -2.481058120727539, -2.3688571453094482, -2.2566561698913574, -2.1444549560546875, -2.0322539806365967, -1.9200530052185059, -1.8078519105911255, -1.6956508159637451, -1.5834498405456543, -1.4712488651275635, -1.359047770500183, -1.2468466758728027, -1.134645700454712, -1.022444725036621, -0.9102436304092407, -0.7980425953865051, -0.6858415603637695, -0.5736405253410339, -0.46143949031829834, -0.34923845529556274, -0.23703742027282715, -0.12483638525009155, -0.012635350227355957, 0.09956568479537964, 0.21176648139953613, 0.32396751642227173, 0.4361685514450073, 0.5483695864677429, 0.6605706214904785, 0.7727716565132141, 0.8849726915359497, 0.9971737265586853, 1.109374761581421, 1.2215757369995117, 1.333776831626892, 1.4459779262542725, 1.5581789016723633, 1.670379877090454, 1.7825809717178345, 1.8947820663452148, 2.0069830417633057, 2.1191840171813965, 2.2313852310180664, 2.3435862064361572, 2.455787181854248, 2.567988157272339, 2.6801891326904297, 2.7923903465270996, 2.9045913219451904, 3.0167922973632812, 3.128993511199951, 3.241194486618042, 3.353395462036133, 3.4655964374542236, 3.5777974128723145, 3.6899986267089844, 3.802199602127075]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 9.0, 9.0, 13.0, 15.0, 24.0, 37.0, 50.0, 76.0, 106.0, 114.0, 110.0, 113.0, 98.0, 71.0, 42.0, 36.0, 26.0, 19.0, 8.0, 12.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1013505458831787, -2.0344078540802, -1.9674649238586426, -1.900522232055664, -1.833579421043396, -1.766636610031128, -1.6996939182281494, -1.6327511072158813, -1.5658082962036133, -1.4988654851913452, -1.4319226741790771, -1.3649799823760986, -1.2980371713638306, -1.2310943603515625, -1.164151668548584, -1.097208857536316, -1.0302660465240479, -0.9633232355117798, -0.8963804841041565, -0.8294377326965332, -0.7624949216842651, -0.6955521106719971, -0.6286093592643738, -0.5616666078567505, -0.4947237968444824, -0.42778101563453674, -0.36083823442459106, -0.2938954532146454, -0.2269526720046997, -0.16000989079475403, -0.09306710958480835, -0.02612432837486267, 0.04081869125366211, 0.10776147246360779, 0.17470425367355347, 0.24164703488349915, 0.3085898160934448, 0.3755325973033905, 0.4424753785133362, 0.5094181299209595, 0.5763609409332275, 0.6433037519454956, 0.7102465033531189, 0.7771892547607422, 0.8441320657730103, 0.9110748767852783, 0.9780176281929016, 1.044960379600525, 1.111903190612793, 1.178846001625061, 1.245788812637329, 1.3127315044403076, 1.3796743154525757, 1.4466171264648438, 1.5135598182678223, 1.5805026292800903, 1.6474454402923584, 1.7143882513046265, 1.7813310623168945, 1.848273754119873, 1.9152165651321411, 1.9821593761444092, 2.0491020679473877, 2.1160449981689453, 2.182987689971924]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 6.0, 13.0, 21.0, 15.0, 26.0, 37.0, 62.0, 104.0, 157.0, 251.0, 421.0, 790.0, 1424.0, 2797.0, 5847.0, 13588.0, 41647.0, 202450.0, 606570.0, 122202.0, 29492.0, 10893.0, 4673.0, 2285.0, 1213.0, 603.0, 363.0, 203.0, 121.0, 86.0, 62.0, 48.0, 28.0, 15.0, 9.0, 12.0, 9.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68896484375, -0.6646728515625, -0.640380859375, -0.6160888671875, -0.591796875, -0.5675048828125, -0.543212890625, -0.5189208984375, -0.49462890625, -0.4703369140625, -0.446044921875, -0.4217529296875, -0.3974609375, -0.3731689453125, -0.348876953125, -0.3245849609375, -0.30029296875, -0.2760009765625, -0.251708984375, -0.2274169921875, -0.203125, -0.1788330078125, -0.154541015625, -0.1302490234375, -0.10595703125, -0.0816650390625, -0.057373046875, -0.0330810546875, -0.0087890625, 0.0155029296875, 0.039794921875, 0.0640869140625, 0.08837890625, 0.1126708984375, 0.136962890625, 0.1612548828125, 0.185546875, 0.2098388671875, 0.234130859375, 0.2584228515625, 0.28271484375, 0.3070068359375, 0.331298828125, 0.3555908203125, 0.3798828125, 0.4041748046875, 0.428466796875, 0.4527587890625, 0.47705078125, 0.5013427734375, 0.525634765625, 0.5499267578125, 0.57421875, 0.5985107421875, 0.622802734375, 0.6470947265625, 0.67138671875, 0.6956787109375, 0.719970703125, 0.7442626953125, 0.7685546875, 0.7928466796875, 0.817138671875, 0.8414306640625, 0.86572265625]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 5.0, 6.0, 9.0, 9.0, 15.0, 22.0, 24.0, 51.0, 66.0, 72.0, 88.0, 103.0, 105.0, 103.0, 80.0, 74.0, 43.0, 48.0, 21.0, 13.0, 15.0, 13.0, 8.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.71875, -4.588165283203125, -4.45758056640625, -4.326995849609375, -4.1964111328125, -4.065826416015625, -3.93524169921875, -3.804656982421875, -3.674072265625, -3.543487548828125, -3.41290283203125, -3.282318115234375, -3.1517333984375, -3.021148681640625, -2.89056396484375, -2.759979248046875, -2.62939453125, -2.498809814453125, -2.36822509765625, -2.237640380859375, -2.1070556640625, -1.976470947265625, -1.84588623046875, -1.715301513671875, -1.584716796875, -1.454132080078125, -1.32354736328125, -1.192962646484375, -1.0623779296875, -0.931793212890625, -0.80120849609375, -0.670623779296875, -0.5400390625, -0.409454345703125, -0.27886962890625, -0.148284912109375, -0.0177001953125, 0.112884521484375, 0.24346923828125, 0.374053955078125, 0.504638671875, 0.635223388671875, 0.76580810546875, 0.896392822265625, 1.0269775390625, 1.157562255859375, 1.28814697265625, 1.418731689453125, 1.54931640625, 1.679901123046875, 1.81048583984375, 1.941070556640625, 2.0716552734375, 2.202239990234375, 2.33282470703125, 2.463409423828125, 2.593994140625, 2.724578857421875, 2.85516357421875, 2.985748291015625, 3.1163330078125, 3.246917724609375, 3.37750244140625, 3.508087158203125, 3.638671875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 5.0, 7.0, 6.0, 6.0, 4.0, 10.0, 6.0, 10.0, 12.0, 11.0, 28.0, 30.0, 35.0, 55.0, 72.0, 113.0, 146.0, 244.0, 500.0, 1287.0, 8340.0, 197249.0, 814440.0, 21772.0, 2530.0, 674.0, 330.0, 169.0, 140.0, 89.0, 63.0, 51.0, 26.0, 21.0, 21.0, 13.0, 8.0, 8.0, 7.0, 5.0, 3.0, 8.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8046875, -1.748626708984375, -1.69256591796875, -1.636505126953125, -1.5804443359375, -1.524383544921875, -1.46832275390625, -1.412261962890625, -1.356201171875, -1.300140380859375, -1.24407958984375, -1.188018798828125, -1.1319580078125, -1.075897216796875, -1.01983642578125, -0.963775634765625, -0.90771484375, -0.851654052734375, -0.79559326171875, -0.739532470703125, -0.6834716796875, -0.627410888671875, -0.57135009765625, -0.515289306640625, -0.459228515625, -0.403167724609375, -0.34710693359375, -0.291046142578125, -0.2349853515625, -0.178924560546875, -0.12286376953125, -0.066802978515625, -0.0107421875, 0.045318603515625, 0.10137939453125, 0.157440185546875, 0.2135009765625, 0.269561767578125, 0.32562255859375, 0.381683349609375, 0.437744140625, 0.493804931640625, 0.54986572265625, 0.605926513671875, 0.6619873046875, 0.718048095703125, 0.77410888671875, 0.830169677734375, 0.88623046875, 0.942291259765625, 0.99835205078125, 1.054412841796875, 1.1104736328125, 1.166534423828125, 1.22259521484375, 1.278656005859375, 1.334716796875, 1.390777587890625, 1.44683837890625, 1.502899169921875, 1.5589599609375, 1.615020751953125, 1.67108154296875, 1.727142333984375, 1.783203125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 8.0, 2.0, 3.0, 4.0, 6.0, 4.0, 7.0, 14.0, 13.0, 19.0, 26.0, 24.0, 27.0, 36.0, 39.0, 46.0, 45.0, 41.0, 59.0, 51.0, 61.0, 61.0, 44.0, 49.0, 56.0, 35.0, 47.0, 29.0, 30.0, 25.0, 24.0, 11.0, 9.0, 12.0, 4.0, 8.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.193359375, -3.096710205078125, -3.00006103515625, -2.903411865234375, -2.8067626953125, -2.710113525390625, -2.61346435546875, -2.516815185546875, -2.420166015625, -2.323516845703125, -2.22686767578125, -2.130218505859375, -2.0335693359375, -1.936920166015625, -1.84027099609375, -1.743621826171875, -1.64697265625, -1.550323486328125, -1.45367431640625, -1.357025146484375, -1.2603759765625, -1.163726806640625, -1.06707763671875, -0.970428466796875, -0.873779296875, -0.777130126953125, -0.68048095703125, -0.583831787109375, -0.4871826171875, -0.390533447265625, -0.29388427734375, -0.197235107421875, -0.1005859375, -0.003936767578125, 0.09271240234375, 0.189361572265625, 0.2860107421875, 0.382659912109375, 0.47930908203125, 0.575958251953125, 0.672607421875, 0.769256591796875, 0.86590576171875, 0.962554931640625, 1.0592041015625, 1.155853271484375, 1.25250244140625, 1.349151611328125, 1.44580078125, 1.542449951171875, 1.63909912109375, 1.735748291015625, 1.8323974609375, 1.929046630859375, 2.02569580078125, 2.122344970703125, 2.218994140625, 2.315643310546875, 2.41229248046875, 2.508941650390625, 2.6055908203125, 2.702239990234375, 2.79888916015625, 2.895538330078125, 2.9921875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 0.0, 2.0, 0.0, 4.0, 11.0, 10.0, 31.0, 57.0, 113.0, 304.0, 956.0, 7756.0, 988133.0, 48459.0, 1870.0, 480.0, 193.0, 79.0, 37.0, 16.0, 16.0, 7.0, 5.0, 3.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.55859375, -1.5061492919921875, -1.453704833984375, -1.4012603759765625, -1.34881591796875, -1.2963714599609375, -1.243927001953125, -1.1914825439453125, -1.1390380859375, -1.0865936279296875, -1.034149169921875, -0.9817047119140625, -0.92926025390625, -0.8768157958984375, -0.824371337890625, -0.7719268798828125, -0.719482421875, -0.6670379638671875, -0.614593505859375, -0.5621490478515625, -0.50970458984375, -0.4572601318359375, -0.404815673828125, -0.3523712158203125, -0.2999267578125, -0.2474822998046875, -0.195037841796875, -0.1425933837890625, -0.09014892578125, -0.0377044677734375, 0.014739990234375, 0.0671844482421875, 0.11962890625, 0.1720733642578125, 0.224517822265625, 0.2769622802734375, 0.32940673828125, 0.3818511962890625, 0.434295654296875, 0.4867401123046875, 0.5391845703125, 0.5916290283203125, 0.644073486328125, 0.6965179443359375, 0.74896240234375, 0.8014068603515625, 0.853851318359375, 0.9062957763671875, 0.958740234375, 1.0111846923828125, 1.063629150390625, 1.1160736083984375, 1.16851806640625, 1.2209625244140625, 1.273406982421875, 1.3258514404296875, 1.3782958984375, 1.4307403564453125, 1.483184814453125, 1.5356292724609375, 1.58807373046875, 1.6405181884765625, 1.692962646484375, 1.7454071044921875, 1.7978515625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 5.0, 8.0, 23.0, 23.0, 24.0, 59.0, 149.0, 314.0, 197.0, 64.0, 58.0, 27.0, 19.0, 6.0, 2.0, 11.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012302398681640625, -0.00011976342648267746, -0.00011650286614894867, -0.00011324230581521988, -0.00010998174548149109, -0.0001067211851477623, -0.00010346062481403351, -0.00010020006448030472, -9.693950414657593e-05, -9.367894381284714e-05, -9.041838347911835e-05, -8.715782314538956e-05, -8.389726281166077e-05, -8.063670247793198e-05, -7.737614214420319e-05, -7.41155818104744e-05, -7.08550214767456e-05, -6.759446114301682e-05, -6.433390080928802e-05, -6.107334047555923e-05, -5.7812780141830444e-05, -5.4552219808101654e-05, -5.1291659474372864e-05, -4.8031099140644073e-05, -4.477053880691528e-05, -4.150997847318649e-05, -3.82494181394577e-05, -3.498885780572891e-05, -3.172829747200012e-05, -2.8467737138271332e-05, -2.520717680454254e-05, -2.194661647081375e-05, -1.868605613708496e-05, -1.542549580335617e-05, -1.216493546962738e-05, -8.90437513589859e-06, -5.6438148021698e-06, -2.3832544684410095e-06, 8.773058652877808e-07, 4.137866199016571e-06, 7.398426532745361e-06, 1.0658986866474152e-05, 1.3919547200202942e-05, 1.7180107533931732e-05, 2.0440667867660522e-05, 2.3701228201389313e-05, 2.6961788535118103e-05, 3.0222348868846893e-05, 3.3482909202575684e-05, 3.6743469536304474e-05, 4.0004029870033264e-05, 4.3264590203762054e-05, 4.6525150537490845e-05, 4.9785710871219635e-05, 5.3046271204948425e-05, 5.6306831538677216e-05, 5.9567391872406006e-05, 6.28279522061348e-05, 6.608851253986359e-05, 6.934907287359238e-05, 7.260963320732117e-05, 7.587019354104996e-05, 7.913075387477875e-05, 8.239131420850754e-05, 8.565187454223633e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 7.0, 2.0, 8.0, 13.0, 21.0, 39.0, 89.0, 312.0, 917.0, 4556.0, 109584.0, 920200.0, 10554.0, 1553.0, 407.0, 161.0, 58.0, 24.0, 16.0, 9.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4462890625, -1.39837646484375, -1.3504638671875, -1.30255126953125, -1.254638671875, -1.20672607421875, -1.1588134765625, -1.11090087890625, -1.06298828125, -1.01507568359375, -0.9671630859375, -0.91925048828125, -0.871337890625, -0.82342529296875, -0.7755126953125, -0.72760009765625, -0.6796875, -0.63177490234375, -0.5838623046875, -0.53594970703125, -0.488037109375, -0.44012451171875, -0.3922119140625, -0.34429931640625, -0.29638671875, -0.24847412109375, -0.2005615234375, -0.15264892578125, -0.104736328125, -0.05682373046875, -0.0089111328125, 0.03900146484375, 0.0869140625, 0.13482666015625, 0.1827392578125, 0.23065185546875, 0.278564453125, 0.32647705078125, 0.3743896484375, 0.42230224609375, 0.47021484375, 0.51812744140625, 0.5660400390625, 0.61395263671875, 0.661865234375, 0.70977783203125, 0.7576904296875, 0.80560302734375, 0.853515625, 0.90142822265625, 0.9493408203125, 0.99725341796875, 1.045166015625, 1.09307861328125, 1.1409912109375, 1.18890380859375, 1.23681640625, 1.28472900390625, 1.3326416015625, 1.38055419921875, 1.428466796875, 1.47637939453125, 1.5242919921875, 1.57220458984375, 1.6201171875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 8.0, 7.0, 5.0, 13.0, 18.0, 32.0, 74.0, 150.0, 348.0, 162.0, 78.0, 43.0, 24.0, 7.0, 7.0, 6.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50732421875, -0.49221038818359375, -0.4770965576171875, -0.46198272705078125, -0.446868896484375, -0.43175506591796875, -0.4166412353515625, -0.40152740478515625, -0.38641357421875, -0.37129974365234375, -0.3561859130859375, -0.34107208251953125, -0.325958251953125, -0.31084442138671875, -0.2957305908203125, -0.28061676025390625, -0.2655029296875, -0.25038909912109375, -0.2352752685546875, -0.22016143798828125, -0.205047607421875, -0.18993377685546875, -0.1748199462890625, -0.15970611572265625, -0.14459228515625, -0.12947845458984375, -0.1143646240234375, -0.09925079345703125, -0.084136962890625, -0.06902313232421875, -0.0539093017578125, -0.03879547119140625, -0.023681640625, -0.00856781005859375, 0.0065460205078125, 0.02165985107421875, 0.036773681640625, 0.05188751220703125, 0.0670013427734375, 0.08211517333984375, 0.09722900390625, 0.11234283447265625, 0.1274566650390625, 0.14257049560546875, 0.157684326171875, 0.17279815673828125, 0.1879119873046875, 0.20302581787109375, 0.2181396484375, 0.23325347900390625, 0.2483673095703125, 0.26348114013671875, 0.278594970703125, 0.29370880126953125, 0.3088226318359375, 0.32393646240234375, 0.33905029296875, 0.35416412353515625, 0.3692779541015625, 0.38439178466796875, 0.399505615234375, 0.41461944580078125, 0.4297332763671875, 0.44484710693359375, 0.4599609375]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 19.0, 253.0, 587.0, 118.0, 17.0, 7.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.123626232147217, -5.468524932861328, -4.813423156738281, -4.158321380615234, -3.5032200813293457, -2.848118543624878, -2.19301700592041, -1.5379157066345215, -0.8828139305114746, -0.22771239280700684, 0.42738914489746094, 1.0824906826019287, 1.7375922203063965, 2.3926937580108643, 3.047795295715332, 3.7028965950012207, 4.357998371124268, 5.013099670410156, 5.668201446533203, 6.32330322265625, 6.978404521942139, 7.633505821228027, 8.288607597351074, 8.943708419799805, 9.598810195922852, 10.253911972045898, 10.909013748168945, 11.564114570617676, 12.219216346740723, 12.87431812286377, 13.5294189453125, 14.184520721435547, 14.839622497558594, 15.49472427368164, 16.149826049804688, 16.804927825927734, 17.46002960205078, 18.115129470825195, 18.770231246948242, 19.42533302307129, 20.080434799194336, 20.735536575317383, 21.39063835144043, 22.045740127563477, 22.70083999633789, 23.355941772460938, 24.011043548583984, 24.66614532470703, 25.321247100830078, 25.976348876953125, 26.631450653076172, 27.28655242919922, 27.941654205322266, 28.59675407409668, 29.251855850219727, 29.906957626342773, 30.56205940246582, 31.217161178588867, 31.872262954711914, 32.52736282348633, 33.182464599609375, 33.83756637573242, 34.49266815185547, 35.147769927978516, 35.80287170410156]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 7.0, 11.0, 11.0, 20.0, 32.0, 32.0, 36.0, 49.0, 42.0, 57.0, 63.0, 54.0, 56.0, 66.0, 59.0, 40.0, 65.0, 51.0, 47.0, 49.0, 39.0, 21.0, 26.0, 20.0, 11.0, 14.0, 5.0, 4.0, 7.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.675444602966309, -7.437404155731201, -7.1993632316589355, -6.961322784423828, -6.723282337188721, -6.485241889953613, -6.247200965881348, -6.00916051864624, -5.771120071411133, -5.533079624176025, -5.29503870010376, -5.056998252868652, -4.818957805633545, -4.5809173583984375, -4.342876434326172, -4.1048359870910645, -3.866795063018799, -3.6287543773651123, -3.390713930130005, -3.1526732444763184, -2.914632797241211, -2.6765921115875244, -2.438551425933838, -2.2005109786987305, -1.962470293045044, -1.724429726600647, -1.48638916015625, -1.2483484745025635, -1.0103079080581665, -0.7722673416137695, -0.534226655960083, -0.29618608951568604, -0.058145999908447266, 0.1798945963382721, 0.41793519258499146, 0.6559758186340332, 0.8940163850784302, 1.1320569515228271, 1.3700976371765137, 1.6081382036209106, 1.8461787700653076, 2.084219455718994, 2.3222599029541016, 2.560300588607788, 2.7983412742614746, 3.036381721496582, 3.2744224071502686, 3.512463092803955, 3.7505035400390625, 3.988544225692749, 4.2265849113464355, 4.464625358581543, 4.70266580581665, 4.940706253051758, 5.178747177124023, 5.416787624359131, 5.654828071594238, 5.892868518829346, 6.130909442901611, 6.368949890136719, 6.606990337371826, 6.845030784606934, 7.083071708679199, 7.321112155914307, 7.559153079986572]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 9.0, 14.0, 25.0, 26.0, 37.0, 68.0, 143.0, 215.0, 445.0, 935.0, 2280.0, 5479.0, 18835.0, 167287.0, 3194785.0, 746536.0, 43484.0, 8439.0, 2771.0, 1147.0, 620.0, 303.0, 175.0, 88.0, 50.0, 26.0, 17.0, 14.0, 12.0, 6.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.767578125, -2.6712646484375, -2.574951171875, -2.4786376953125, -2.38232421875, -2.2860107421875, -2.189697265625, -2.0933837890625, -1.9970703125, -1.9007568359375, -1.804443359375, -1.7081298828125, -1.61181640625, -1.5155029296875, -1.419189453125, -1.3228759765625, -1.2265625, -1.1302490234375, -1.033935546875, -0.9376220703125, -0.84130859375, -0.7449951171875, -0.648681640625, -0.5523681640625, -0.4560546875, -0.3597412109375, -0.263427734375, -0.1671142578125, -0.07080078125, 0.0255126953125, 0.121826171875, 0.2181396484375, 0.314453125, 0.4107666015625, 0.507080078125, 0.6033935546875, 0.69970703125, 0.7960205078125, 0.892333984375, 0.9886474609375, 1.0849609375, 1.1812744140625, 1.277587890625, 1.3739013671875, 1.47021484375, 1.5665283203125, 1.662841796875, 1.7591552734375, 1.85546875, 1.9517822265625, 2.048095703125, 2.1444091796875, 2.24072265625, 2.3370361328125, 2.433349609375, 2.5296630859375, 2.6259765625, 2.7222900390625, 2.818603515625, 2.9149169921875, 3.01123046875, 3.1075439453125, 3.203857421875, 3.3001708984375, 3.396484375]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 8.0, 11.0, 11.0, 21.0, 28.0, 45.0, 51.0, 93.0, 106.0, 118.0, 115.0, 87.0, 83.0, 56.0, 55.0, 30.0, 27.0, 14.0, 15.0, 15.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.822265625, -1.73974609375, -1.6572265625, -1.57470703125, -1.4921875, -1.40966796875, -1.3271484375, -1.24462890625, -1.162109375, -1.07958984375, -0.9970703125, -0.91455078125, -0.83203125, -0.74951171875, -0.6669921875, -0.58447265625, -0.501953125, -0.41943359375, -0.3369140625, -0.25439453125, -0.171875, -0.08935546875, -0.0068359375, 0.07568359375, 0.158203125, 0.24072265625, 0.3232421875, 0.40576171875, 0.48828125, 0.57080078125, 0.6533203125, 0.73583984375, 0.818359375, 0.90087890625, 0.9833984375, 1.06591796875, 1.1484375, 1.23095703125, 1.3134765625, 1.39599609375, 1.478515625, 1.56103515625, 1.6435546875, 1.72607421875, 1.80859375, 1.89111328125, 1.9736328125, 2.05615234375, 2.138671875, 2.22119140625, 2.3037109375, 2.38623046875, 2.46875, 2.55126953125, 2.6337890625, 2.71630859375, 2.798828125, 2.88134765625, 2.9638671875, 3.04638671875, 3.12890625, 3.21142578125, 3.2939453125, 3.37646484375, 3.458984375]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 5.0, 4.0, 12.0, 14.0, 19.0, 37.0, 48.0, 77.0, 118.0, 198.0, 431.0, 1024.0, 3020.0, 11524.0, 77564.0, 3668735.0, 397268.0, 25815.0, 5339.0, 1627.0, 643.0, 312.0, 154.0, 95.0, 57.0, 39.0, 31.0, 16.0, 16.0, 7.0, 6.0, 7.0, 3.0, 1.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.669921875, -3.570037841796875, -3.47015380859375, -3.370269775390625, -3.2703857421875, -3.170501708984375, -3.07061767578125, -2.970733642578125, -2.870849609375, -2.770965576171875, -2.67108154296875, -2.571197509765625, -2.4713134765625, -2.371429443359375, -2.27154541015625, -2.171661376953125, -2.07177734375, -1.971893310546875, -1.87200927734375, -1.772125244140625, -1.6722412109375, -1.572357177734375, -1.47247314453125, -1.372589111328125, -1.272705078125, -1.172821044921875, -1.07293701171875, -0.973052978515625, -0.8731689453125, -0.773284912109375, -0.67340087890625, -0.573516845703125, -0.4736328125, -0.373748779296875, -0.27386474609375, -0.173980712890625, -0.0740966796875, 0.025787353515625, 0.12567138671875, 0.225555419921875, 0.325439453125, 0.425323486328125, 0.52520751953125, 0.625091552734375, 0.7249755859375, 0.824859619140625, 0.92474365234375, 1.024627685546875, 1.12451171875, 1.224395751953125, 1.32427978515625, 1.424163818359375, 1.5240478515625, 1.623931884765625, 1.72381591796875, 1.823699951171875, 1.923583984375, 2.023468017578125, 2.12335205078125, 2.223236083984375, 2.3231201171875, 2.423004150390625, 2.52288818359375, 2.622772216796875, 2.72265625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 6.0, 3.0, 2.0, 2.0, 8.0, 9.0, 24.0, 14.0, 22.0, 32.0, 47.0, 65.0, 109.0, 257.0, 538.0, 1005.0, 923.0, 481.0, 210.0, 101.0, 62.0, 41.0, 26.0, 23.0, 14.0, 12.0, 14.0, 4.0, 8.0, 7.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.837890625, -0.8131484985351562, -0.7884063720703125, -0.7636642456054688, -0.738922119140625, -0.7141799926757812, -0.6894378662109375, -0.6646957397460938, -0.63995361328125, -0.6152114868164062, -0.5904693603515625, -0.5657272338867188, -0.540985107421875, -0.5162429809570312, -0.4915008544921875, -0.46675872802734375, -0.4420166015625, -0.41727447509765625, -0.3925323486328125, -0.36779022216796875, -0.343048095703125, -0.31830596923828125, -0.2935638427734375, -0.26882171630859375, -0.24407958984375, -0.21933746337890625, -0.1945953369140625, -0.16985321044921875, -0.145111083984375, -0.12036895751953125, -0.0956268310546875, -0.07088470458984375, -0.046142578125, -0.02140045166015625, 0.0033416748046875, 0.02808380126953125, 0.052825927734375, 0.07756805419921875, 0.1023101806640625, 0.12705230712890625, 0.15179443359375, 0.17653656005859375, 0.2012786865234375, 0.22602081298828125, 0.250762939453125, 0.27550506591796875, 0.3002471923828125, 0.32498931884765625, 0.3497314453125, 0.37447357177734375, 0.3992156982421875, 0.42395782470703125, 0.448699951171875, 0.47344207763671875, 0.4981842041015625, 0.5229263305664062, 0.54766845703125, 0.5724105834960938, 0.5971527099609375, 0.6218948364257812, 0.646636962890625, 0.6713790893554688, 0.6961212158203125, 0.7208633422851562, 0.74560546875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 4.0, 8.0, 10.0, 25.0, 45.0, 74.0, 124.0, 186.0, 183.0, 133.0, 90.0, 50.0, 28.0, 19.0, 9.0, 7.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9403655529022217, -3.8054347038269043, -3.670504093170166, -3.5355734825134277, -3.4006426334381104, -3.265711784362793, -3.1307811737060547, -2.9958505630493164, -2.860919713973999, -2.7259888648986816, -2.5910582542419434, -2.456127643585205, -2.3211967945098877, -2.1862659454345703, -2.051335334777832, -1.9164046049118042, -1.7814738750457764, -1.6465431451797485, -1.5116124153137207, -1.3766816854476929, -1.241750955581665, -1.1068202257156372, -0.9718894958496094, -0.8369587659835815, -0.7020280361175537, -0.5670973062515259, -0.43216657638549805, -0.2972358465194702, -0.16230511665344238, -0.02737438678741455, 0.10755634307861328, 0.2424870729446411, 0.37741756439208984, 0.5123482942581177, 0.6472790241241455, 0.7822097539901733, 0.9171404838562012, 1.052071213722229, 1.1870019435882568, 1.3219326734542847, 1.4568634033203125, 1.5917941331863403, 1.7267248630523682, 1.861655592918396, 1.9965863227844238, 2.131516933441162, 2.2664477825164795, 2.401378631591797, 2.536309242248535, 2.6712398529052734, 2.806170701980591, 2.941101551055908, 3.0760321617126465, 3.2109627723693848, 3.345893621444702, 3.4808244705200195, 3.615755081176758, 3.750685691833496, 3.8856165409088135, 4.020547389984131, 4.155478000640869, 4.290408611297607, 4.425339698791504, 4.560270309448242, 4.6952009201049805]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 4.0, 12.0, 8.0, 21.0, 25.0, 35.0, 47.0, 48.0, 65.0, 79.0, 65.0, 69.0, 81.0, 99.0, 74.0, 67.0, 57.0, 31.0, 40.0, 17.0, 19.0, 16.0, 8.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3137388229370117, -2.234884738922119, -2.1560306549072266, -2.077176809310913, -1.9983227252960205, -1.919468641281128, -1.8406145572662354, -1.7617604732513428, -1.6829065084457397, -1.6040524244308472, -1.5251984596252441, -1.4463443756103516, -1.367490291595459, -1.288636326789856, -1.2097822427749634, -1.1309282779693604, -1.0520741939544678, -0.97322016954422, -0.8943661451339722, -0.8155120611190796, -0.7366580367088318, -0.657804012298584, -0.5789499282836914, -0.5000959038734436, -0.4212418794631958, -0.342387855052948, -0.2635338008403778, -0.1846797615289688, -0.10582572221755981, -0.02697169780731201, 0.05188235640525818, 0.13073641061782837, 0.20959043502807617, 0.288444459438324, 0.36729851365089417, 0.44615256786346436, 0.5250065922737122, 0.60386061668396, 0.6827147006988525, 0.7615687251091003, 0.8404227495193481, 0.919276773929596, 0.9981307983398438, 1.0769848823547363, 1.155838966369629, 1.234692931175232, 1.3135470151901245, 1.3924009799957275, 1.4712550640106201, 1.5501091480255127, 1.6289631128311157, 1.7078171968460083, 1.7866711616516113, 1.865525245666504, 1.9443793296813965, 2.023233413696289, 2.1020874977111816, 2.180941581726074, 2.259795665740967, 2.3386495113372803, 2.417503595352173, 2.4963576793670654, 2.575211763381958, 2.6540658473968506, 2.732919692993164]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 10.0, 7.0, 18.0, 15.0, 20.0, 42.0, 51.0, 80.0, 145.0, 234.0, 425.0, 974.0, 2158.0, 5967.0, 22776.0, 123739.0, 651831.0, 195367.0, 31815.0, 7861.0, 2614.0, 1129.0, 535.0, 292.0, 166.0, 95.0, 66.0, 39.0, 29.0, 14.0, 15.0, 7.0, 2.0, 3.0, 4.0, 2.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.344482421875, -0.33322906494140625, -0.3219757080078125, -0.31072235107421875, -0.299468994140625, -0.28821563720703125, -0.2769622802734375, -0.26570892333984375, -0.25445556640625, -0.24320220947265625, -0.2319488525390625, -0.22069549560546875, -0.209442138671875, -0.19818878173828125, -0.1869354248046875, -0.17568206787109375, -0.1644287109375, -0.15317535400390625, -0.1419219970703125, -0.13066864013671875, -0.119415283203125, -0.10816192626953125, -0.0969085693359375, -0.08565521240234375, -0.07440185546875, -0.06314849853515625, -0.0518951416015625, -0.04064178466796875, -0.029388427734375, -0.01813507080078125, -0.0068817138671875, 0.00437164306640625, 0.015625, 0.02687835693359375, 0.0381317138671875, 0.04938507080078125, 0.060638427734375, 0.07189178466796875, 0.0831451416015625, 0.09439849853515625, 0.10565185546875, 0.11690521240234375, 0.1281585693359375, 0.13941192626953125, 0.150665283203125, 0.16191864013671875, 0.1731719970703125, 0.18442535400390625, 0.1956787109375, 0.20693206787109375, 0.2181854248046875, 0.22943878173828125, 0.240692138671875, 0.25194549560546875, 0.2631988525390625, 0.27445220947265625, 0.28570556640625, 0.29695892333984375, 0.3082122802734375, 0.31946563720703125, 0.330718994140625, 0.34197235107421875, 0.3532257080078125, 0.36447906494140625, 0.375732421875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 10.0, 6.0, 12.0, 22.0, 39.0, 61.0, 43.0, 80.0, 93.0, 95.0, 116.0, 106.0, 93.0, 70.0, 51.0, 37.0, 25.0, 20.0, 9.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8232421875, -1.7560577392578125, -1.688873291015625, -1.6216888427734375, -1.55450439453125, -1.4873199462890625, -1.420135498046875, -1.3529510498046875, -1.2857666015625, -1.2185821533203125, -1.151397705078125, -1.0842132568359375, -1.01702880859375, -0.9498443603515625, -0.882659912109375, -0.8154754638671875, -0.748291015625, -0.6811065673828125, -0.613922119140625, -0.5467376708984375, -0.47955322265625, -0.4123687744140625, -0.345184326171875, -0.2779998779296875, -0.2108154296875, -0.1436309814453125, -0.076446533203125, -0.0092620849609375, 0.05792236328125, 0.1251068115234375, 0.192291259765625, 0.2594757080078125, 0.32666015625, 0.3938446044921875, 0.461029052734375, 0.5282135009765625, 0.59539794921875, 0.6625823974609375, 0.729766845703125, 0.7969512939453125, 0.8641357421875, 0.9313201904296875, 0.998504638671875, 1.0656890869140625, 1.13287353515625, 1.2000579833984375, 1.267242431640625, 1.3344268798828125, 1.401611328125, 1.4687957763671875, 1.535980224609375, 1.6031646728515625, 1.67034912109375, 1.7375335693359375, 1.804718017578125, 1.8719024658203125, 1.9390869140625, 2.0062713623046875, 2.073455810546875, 2.1406402587890625, 2.20782470703125, 2.2750091552734375, 2.342193603515625, 2.4093780517578125, 2.4765625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 3.0, 10.0, 14.0, 19.0, 27.0, 45.0, 62.0, 114.0, 162.0, 227.0, 421.0, 662.0, 1155.0, 1813.0, 3268.0, 5829.0, 10293.0, 19246.0, 36476.0, 70541.0, 137721.0, 242509.0, 238619.0, 134199.0, 68129.0, 35217.0, 18284.0, 10027.0, 5580.0, 3147.0, 1843.0, 1138.0, 644.0, 392.0, 246.0, 166.0, 106.0, 55.0, 54.0, 19.0, 21.0, 20.0, 5.0, 10.0, 3.0, 8.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0916748046875, -0.0887155532836914, -0.08575630187988281, -0.08279705047607422, -0.07983779907226562, -0.07687854766845703, -0.07391929626464844, -0.07096004486083984, -0.06800079345703125, -0.06504154205322266, -0.06208229064941406, -0.05912303924560547, -0.056163787841796875, -0.05320453643798828, -0.05024528503417969, -0.047286033630371094, -0.0443267822265625, -0.041367530822753906, -0.03840827941894531, -0.03544902801513672, -0.032489776611328125, -0.02953052520751953, -0.026571273803710938, -0.023612022399902344, -0.02065277099609375, -0.017693519592285156, -0.014734268188476562, -0.011775016784667969, -0.008815765380859375, -0.005856513977050781, -0.0028972625732421875, 6.198883056640625e-05, 0.003021240234375, 0.005980491638183594, 0.008939743041992188, 0.011898994445800781, 0.014858245849609375, 0.01781749725341797, 0.020776748657226562, 0.023736000061035156, 0.02669525146484375, 0.029654502868652344, 0.03261375427246094, 0.03557300567626953, 0.038532257080078125, 0.04149150848388672, 0.04445075988769531, 0.047410011291503906, 0.0503692626953125, 0.053328514099121094, 0.05628776550292969, 0.05924701690673828, 0.062206268310546875, 0.06516551971435547, 0.06812477111816406, 0.07108402252197266, 0.07404327392578125, 0.07700252532958984, 0.07996177673339844, 0.08292102813720703, 0.08588027954101562, 0.08883953094482422, 0.09179878234863281, 0.0947580337524414, 0.09771728515625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 8.0, 5.0, 14.0, 11.0, 6.0, 12.0, 16.0, 21.0, 22.0, 21.0, 34.0, 35.0, 31.0, 38.0, 33.0, 43.0, 43.0, 53.0, 40.0, 55.0, 51.0, 44.0, 44.0, 30.0, 40.0, 45.0, 40.0, 27.0, 26.0, 23.0, 13.0, 19.0, 7.0, 12.0, 4.0, 13.0, 8.0, 3.0, 3.0, 3.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.779296875, -1.7191162109375, -1.658935546875, -1.5987548828125, -1.53857421875, -1.4783935546875, -1.418212890625, -1.3580322265625, -1.2978515625, -1.2376708984375, -1.177490234375, -1.1173095703125, -1.05712890625, -0.9969482421875, -0.936767578125, -0.8765869140625, -0.81640625, -0.7562255859375, -0.696044921875, -0.6358642578125, -0.57568359375, -0.5155029296875, -0.455322265625, -0.3951416015625, -0.3349609375, -0.2747802734375, -0.214599609375, -0.1544189453125, -0.09423828125, -0.0340576171875, 0.026123046875, 0.0863037109375, 0.146484375, 0.2066650390625, 0.266845703125, 0.3270263671875, 0.38720703125, 0.4473876953125, 0.507568359375, 0.5677490234375, 0.6279296875, 0.6881103515625, 0.748291015625, 0.8084716796875, 0.86865234375, 0.9288330078125, 0.989013671875, 1.0491943359375, 1.109375, 1.1695556640625, 1.229736328125, 1.2899169921875, 1.35009765625, 1.4102783203125, 1.470458984375, 1.5306396484375, 1.5908203125, 1.6510009765625, 1.711181640625, 1.7713623046875, 1.83154296875, 1.8917236328125, 1.951904296875, 2.0120849609375, 2.072265625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 7.0, 12.0, 6.0, 18.0, 23.0, 22.0, 49.0, 72.0, 98.0, 178.0, 268.0, 463.0, 801.0, 1395.0, 2459.0, 4879.0, 10594.0, 27853.0, 103496.0, 548096.0, 263810.0, 51821.0, 16980.0, 7130.0, 3491.0, 1836.0, 1050.0, 618.0, 386.0, 246.0, 129.0, 82.0, 68.0, 40.0, 17.0, 16.0, 13.0, 10.0, 10.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0257415771484375, -0.025001049041748047, -0.024260520935058594, -0.02351999282836914, -0.022779464721679688, -0.022038936614990234, -0.02129840850830078, -0.020557880401611328, -0.019817352294921875, -0.019076824188232422, -0.01833629608154297, -0.017595767974853516, -0.016855239868164062, -0.01611471176147461, -0.015374183654785156, -0.014633655548095703, -0.01389312744140625, -0.013152599334716797, -0.012412071228027344, -0.01167154312133789, -0.010931015014648438, -0.010190486907958984, -0.009449958801269531, -0.008709430694580078, -0.007968902587890625, -0.007228374481201172, -0.006487846374511719, -0.005747318267822266, -0.0050067901611328125, -0.004266262054443359, -0.0035257339477539062, -0.002785205841064453, -0.002044677734375, -0.0013041496276855469, -0.0005636215209960938, 0.00017690658569335938, 0.0009174346923828125, 0.0016579627990722656, 0.0023984909057617188, 0.003139019012451172, 0.003879547119140625, 0.004620075225830078, 0.005360603332519531, 0.006101131439208984, 0.0068416595458984375, 0.007582187652587891, 0.008322715759277344, 0.009063243865966797, 0.00980377197265625, 0.010544300079345703, 0.011284828186035156, 0.01202535629272461, 0.012765884399414062, 0.013506412506103516, 0.014246940612792969, 0.014987468719482422, 0.015727996826171875, 0.016468524932861328, 0.01720905303955078, 0.017949581146240234, 0.018690109252929688, 0.01943063735961914, 0.020171165466308594, 0.020911693572998047, 0.0216522216796875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 1.0, 10.0, 14.0, 10.0, 7.0, 26.0, 31.0, 34.0, 72.0, 81.0, 118.0, 124.0, 115.0, 92.0, 72.0, 53.0, 34.0, 32.0, 18.0, 10.0, 10.0, 11.0, 6.0, 3.0, 3.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.553794860839844e-05, -4.414655268192291e-05, -4.275515675544739e-05, -4.136376082897186e-05, -3.997236490249634e-05, -3.858096897602081e-05, -3.718957304954529e-05, -3.579817712306976e-05, -3.440678119659424e-05, -3.301538527011871e-05, -3.162398934364319e-05, -3.0232593417167664e-05, -2.884119749069214e-05, -2.7449801564216614e-05, -2.605840563774109e-05, -2.4667009711265564e-05, -2.327561378479004e-05, -2.1884217858314514e-05, -2.049282193183899e-05, -1.9101426005363464e-05, -1.771003007888794e-05, -1.6318634152412415e-05, -1.492723822593689e-05, -1.3535842299461365e-05, -1.214444637298584e-05, -1.0753050446510315e-05, -9.36165452003479e-06, -7.970258593559265e-06, -6.57886266708374e-06, -5.187466740608215e-06, -3.7960708141326904e-06, -2.4046748876571655e-06, -1.0132789611816406e-06, 3.781169652938843e-07, 1.7695128917694092e-06, 3.160908818244934e-06, 4.552304744720459e-06, 5.943700671195984e-06, 7.335096597671509e-06, 8.726492524147034e-06, 1.0117888450622559e-05, 1.1509284377098083e-05, 1.2900680303573608e-05, 1.4292076230049133e-05, 1.5683472156524658e-05, 1.7074868083000183e-05, 1.8466264009475708e-05, 1.9857659935951233e-05, 2.1249055862426758e-05, 2.2640451788902283e-05, 2.4031847715377808e-05, 2.5423243641853333e-05, 2.6814639568328857e-05, 2.8206035494804382e-05, 2.9597431421279907e-05, 3.098882734775543e-05, 3.238022327423096e-05, 3.377161920070648e-05, 3.516301512718201e-05, 3.655441105365753e-05, 3.794580698013306e-05, 3.933720290660858e-05, 4.0728598833084106e-05, 4.211999475955963e-05, 4.3511390686035156e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 2.0, 8.0, 6.0, 7.0, 16.0, 13.0, 26.0, 44.0, 79.0, 106.0, 199.0, 389.0, 886.0, 1886.0, 5271.0, 18665.0, 108661.0, 736341.0, 143532.0, 22292.0, 5969.0, 2179.0, 968.0, 469.0, 229.0, 108.0, 68.0, 31.0, 39.0, 17.0, 16.0, 11.0, 5.0, 9.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030029296875, -0.02889871597290039, -0.02776813507080078, -0.026637554168701172, -0.025506973266601562, -0.024376392364501953, -0.023245811462402344, -0.022115230560302734, -0.020984649658203125, -0.019854068756103516, -0.018723487854003906, -0.017592906951904297, -0.016462326049804688, -0.015331745147705078, -0.014201164245605469, -0.01307058334350586, -0.01194000244140625, -0.01080942153930664, -0.009678840637207031, -0.008548259735107422, -0.0074176788330078125, -0.006287097930908203, -0.005156517028808594, -0.004025936126708984, -0.002895355224609375, -0.0017647743225097656, -0.0006341934204101562, 0.0004963874816894531, 0.0016269683837890625, 0.002757549285888672, 0.0038881301879882812, 0.005018711090087891, 0.0061492919921875, 0.007279872894287109, 0.008410453796386719, 0.009541034698486328, 0.010671615600585938, 0.011802196502685547, 0.012932777404785156, 0.014063358306884766, 0.015193939208984375, 0.016324520111083984, 0.017455101013183594, 0.018585681915283203, 0.019716262817382812, 0.020846843719482422, 0.02197742462158203, 0.02310800552368164, 0.02423858642578125, 0.02536916732788086, 0.02649974822998047, 0.027630329132080078, 0.028760910034179688, 0.029891490936279297, 0.031022071838378906, 0.032152652740478516, 0.033283233642578125, 0.034413814544677734, 0.035544395446777344, 0.03667497634887695, 0.03780555725097656, 0.03893613815307617, 0.04006671905517578, 0.04119729995727539, 0.042327880859375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 3.0, 6.0, 6.0, 4.0, 15.0, 11.0, 19.0, 25.0, 44.0, 42.0, 80.0, 79.0, 148.0, 115.0, 99.0, 75.0, 61.0, 41.0, 26.0, 12.0, 14.0, 10.0, 10.0, 11.0, 2.0, 5.0, 4.0, 6.0, 1.0, 7.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.00800323486328125, -0.007754087448120117, -0.007504940032958984, -0.0072557926177978516, -0.007006645202636719, -0.006757497787475586, -0.006508350372314453, -0.00625920295715332, -0.0060100555419921875, -0.005760908126831055, -0.005511760711669922, -0.005262613296508789, -0.005013465881347656, -0.0047643184661865234, -0.004515171051025391, -0.004266023635864258, -0.004016876220703125, -0.003767728805541992, -0.0035185813903808594, -0.0032694339752197266, -0.0030202865600585938, -0.002771139144897461, -0.002521991729736328, -0.0022728443145751953, -0.0020236968994140625, -0.0017745494842529297, -0.0015254020690917969, -0.001276254653930664, -0.0010271072387695312, -0.0007779598236083984, -0.0005288124084472656, -0.0002796649932861328, -3.0517578125e-05, 0.0002186298370361328, 0.0004677772521972656, 0.0007169246673583984, 0.0009660720825195312, 0.001215219497680664, 0.0014643669128417969, 0.0017135143280029297, 0.0019626617431640625, 0.0022118091583251953, 0.002460956573486328, 0.002710103988647461, 0.0029592514038085938, 0.0032083988189697266, 0.0034575462341308594, 0.003706693649291992, 0.003955841064453125, 0.004204988479614258, 0.004454135894775391, 0.0047032833099365234, 0.004952430725097656, 0.005201578140258789, 0.005450725555419922, 0.005699872970581055, 0.0059490203857421875, 0.00619816780090332, 0.006447315216064453, 0.006696462631225586, 0.006945610046386719, 0.0071947574615478516, 0.007443904876708984, 0.007693052291870117, 0.00794219970703125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 15.0, 38.0, 82.0, 203.0, 262.0, 207.0, 104.0, 41.0, 25.0, 11.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.895549774169922, -2.773299217224121, -2.6510486602783203, -2.5287981033325195, -2.4065475463867188, -2.284296989440918, -2.162046194076538, -2.0397956371307373, -1.9175450801849365, -1.7952945232391357, -1.673043966293335, -1.5507932901382446, -1.4285427331924438, -1.306292176246643, -1.1840415000915527, -1.061790943145752, -0.9395403861999512, -0.8172898292541504, -0.6950392127037048, -0.5727885961532593, -0.4505380392074585, -0.3282874822616577, -0.20603686571121216, -0.0837862491607666, 0.03846430778503418, 0.16071489453315735, 0.2829654812812805, 0.4052160680294037, 0.5274666547775269, 0.6497172117233276, 0.7719678282737732, 0.8942184448242188, 1.0164690017700195, 1.1387195587158203, 1.260970115661621, 1.3832207918167114, 1.5054713487625122, 1.627721905708313, 1.7499725818634033, 1.872223138809204, 1.9944736957550049, 2.1167242527008057, 2.2389748096466064, 2.3612253665924072, 2.483476161956787, 2.605726718902588, 2.7279772758483887, 2.8502278327941895, 2.9724783897399902, 3.094728946685791, 3.216979503631592, 3.3392300605773926, 3.4614806175231934, 3.583731174468994, 3.705981969833374, 3.828232526779175, 3.9504830837249756, 4.0727338790893555, 4.194984436035156, 4.317234992980957, 4.439485549926758, 4.561736106872559, 4.683986663818359, 4.80623722076416, 4.928487777709961]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 10.0, 15.0, 22.0, 29.0, 47.0, 62.0, 71.0, 90.0, 94.0, 87.0, 111.0, 98.0, 83.0, 46.0, 38.0, 34.0, 20.0, 19.0, 10.0, 2.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6790030002593994, -1.6179542541503906, -1.5569053888320923, -1.495856523513794, -1.4348077774047852, -1.3737590312957764, -1.312710165977478, -1.2516613006591797, -1.190612554550171, -1.129563808441162, -1.0685149431228638, -1.0074660778045654, -0.9464173316955566, -0.8853685259819031, -0.8243197202682495, -0.763270914554596, -0.7022221088409424, -0.6411733031272888, -0.5801244974136353, -0.5190756916999817, -0.4580268859863281, -0.39697808027267456, -0.335929274559021, -0.27488046884536743, -0.21383166313171387, -0.1527828574180603, -0.09173405170440674, -0.030685245990753174, 0.03036355972290039, 0.09141236543655396, 0.15246117115020752, 0.21350997686386108, 0.27455878257751465, 0.3356075882911682, 0.3966563940048218, 0.45770519971847534, 0.5187540054321289, 0.5798028111457825, 0.640851616859436, 0.7019004225730896, 0.7629492282867432, 0.8239980340003967, 0.8850468397140503, 0.9460956454277039, 1.0071444511413574, 1.0681931972503662, 1.1292420625686646, 1.190290927886963, 1.2513396739959717, 1.3123884201049805, 1.3734372854232788, 1.4344861507415771, 1.495534896850586, 1.5565836429595947, 1.617632508277893, 1.6786813735961914, 1.7397301197052002, 1.800778865814209, 1.8618277311325073, 1.9228765964508057, 1.9839253425598145, 2.0449740886688232, 2.106022834777832, 2.16707181930542, 2.2281205654144287]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 8.0, 9.0, 23.0, 26.0, 48.0, 56.0, 94.0, 153.0, 238.0, 419.0, 786.0, 1554.0, 3372.0, 7656.0, 20967.0, 102866.0, 766869.0, 107329.0, 21422.0, 7749.0, 3396.0, 1642.0, 839.0, 399.0, 243.0, 129.0, 96.0, 51.0, 29.0, 22.0, 19.0, 11.0, 10.0, 2.0, 5.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92138671875, -0.8930435180664062, -0.8647003173828125, -0.8363571166992188, -0.808013916015625, -0.7796707153320312, -0.7513275146484375, -0.7229843139648438, -0.69464111328125, -0.6662979125976562, -0.6379547119140625, -0.6096115112304688, -0.581268310546875, -0.5529251098632812, -0.5245819091796875, -0.49623870849609375, -0.4678955078125, -0.43955230712890625, -0.4112091064453125, -0.38286590576171875, -0.354522705078125, -0.32617950439453125, -0.2978363037109375, -0.26949310302734375, -0.24114990234375, -0.21280670166015625, -0.1844635009765625, -0.15612030029296875, -0.127777099609375, -0.09943389892578125, -0.0710906982421875, -0.04274749755859375, -0.014404296875, 0.01393890380859375, 0.0422821044921875, 0.07062530517578125, 0.098968505859375, 0.12731170654296875, 0.1556549072265625, 0.18399810791015625, 0.21234130859375, 0.24068450927734375, 0.2690277099609375, 0.29737091064453125, 0.325714111328125, 0.35405731201171875, 0.3824005126953125, 0.41074371337890625, 0.4390869140625, 0.46743011474609375, 0.4957733154296875, 0.5241165161132812, 0.552459716796875, 0.5808029174804688, 0.6091461181640625, 0.6374893188476562, 0.66583251953125, 0.6941757202148438, 0.7225189208984375, 0.7508621215820312, 0.779205322265625, 0.8075485229492188, 0.8358917236328125, 0.8642349243164062, 0.892578125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 9.0, 10.0, 6.0, 18.0, 22.0, 30.0, 44.0, 55.0, 61.0, 74.0, 80.0, 86.0, 75.0, 76.0, 86.0, 75.0, 46.0, 47.0, 18.0, 25.0, 13.0, 17.0, 10.0, 7.0, 3.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.708984375, -3.599822998046875, -3.49066162109375, -3.381500244140625, -3.2723388671875, -3.163177490234375, -3.05401611328125, -2.944854736328125, -2.835693359375, -2.726531982421875, -2.61737060546875, -2.508209228515625, -2.3990478515625, -2.289886474609375, -2.18072509765625, -2.071563720703125, -1.96240234375, -1.853240966796875, -1.74407958984375, -1.634918212890625, -1.5257568359375, -1.416595458984375, -1.30743408203125, -1.198272705078125, -1.089111328125, -0.979949951171875, -0.87078857421875, -0.761627197265625, -0.6524658203125, -0.543304443359375, -0.43414306640625, -0.324981689453125, -0.2158203125, -0.106658935546875, 0.00250244140625, 0.111663818359375, 0.2208251953125, 0.329986572265625, 0.43914794921875, 0.548309326171875, 0.657470703125, 0.766632080078125, 0.87579345703125, 0.984954833984375, 1.0941162109375, 1.203277587890625, 1.31243896484375, 1.421600341796875, 1.53076171875, 1.639923095703125, 1.74908447265625, 1.858245849609375, 1.9674072265625, 2.076568603515625, 2.18572998046875, 2.294891357421875, 2.404052734375, 2.513214111328125, 2.62237548828125, 2.731536865234375, 2.8406982421875, 2.949859619140625, 3.05902099609375, 3.168182373046875, 3.27734375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 5.0, 13.0, 18.0, 34.0, 65.0, 66.0, 143.0, 262.0, 595.0, 2155.0, 39539.0, 991145.0, 12357.0, 1262.0, 418.0, 203.0, 112.0, 55.0, 35.0, 20.0, 17.0, 15.0, 9.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.158203125, -3.060546875, -2.962890625, -2.865234375, -2.767578125, -2.669921875, -2.572265625, -2.474609375, -2.376953125, -2.279296875, -2.181640625, -2.083984375, -1.986328125, -1.888671875, -1.791015625, -1.693359375, -1.595703125, -1.498046875, -1.400390625, -1.302734375, -1.205078125, -1.107421875, -1.009765625, -0.912109375, -0.814453125, -0.716796875, -0.619140625, -0.521484375, -0.423828125, -0.326171875, -0.228515625, -0.130859375, -0.033203125, 0.064453125, 0.162109375, 0.259765625, 0.357421875, 0.455078125, 0.552734375, 0.650390625, 0.748046875, 0.845703125, 0.943359375, 1.041015625, 1.138671875, 1.236328125, 1.333984375, 1.431640625, 1.529296875, 1.626953125, 1.724609375, 1.822265625, 1.919921875, 2.017578125, 2.115234375, 2.212890625, 2.310546875, 2.408203125, 2.505859375, 2.603515625, 2.701171875, 2.798828125, 2.896484375, 2.994140625, 3.091796875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 6.0, 2.0, 9.0, 16.0, 20.0, 33.0, 49.0, 42.0, 58.0, 81.0, 87.0, 93.0, 84.0, 87.0, 77.0, 72.0, 59.0, 38.0, 29.0, 17.0, 16.0, 10.0, 11.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.30078125, -5.13623046875, -4.9716796875, -4.80712890625, -4.642578125, -4.47802734375, -4.3134765625, -4.14892578125, -3.984375, -3.81982421875, -3.6552734375, -3.49072265625, -3.326171875, -3.16162109375, -2.9970703125, -2.83251953125, -2.66796875, -2.50341796875, -2.3388671875, -2.17431640625, -2.009765625, -1.84521484375, -1.6806640625, -1.51611328125, -1.3515625, -1.18701171875, -1.0224609375, -0.85791015625, -0.693359375, -0.52880859375, -0.3642578125, -0.19970703125, -0.03515625, 0.12939453125, 0.2939453125, 0.45849609375, 0.623046875, 0.78759765625, 0.9521484375, 1.11669921875, 1.28125, 1.44580078125, 1.6103515625, 1.77490234375, 1.939453125, 2.10400390625, 2.2685546875, 2.43310546875, 2.59765625, 2.76220703125, 2.9267578125, 3.09130859375, 3.255859375, 3.42041015625, 3.5849609375, 3.74951171875, 3.9140625, 4.07861328125, 4.2431640625, 4.40771484375, 4.572265625, 4.73681640625, 4.9013671875, 5.06591796875, 5.23046875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 1.0, 7.0, 6.0, 9.0, 9.0, 7.0, 6.0, 14.0, 24.0, 25.0, 34.0, 62.0, 81.0, 149.0, 248.0, 449.0, 969.0, 2548.0, 7599.0, 29640.0, 260325.0, 685248.0, 44874.0, 10422.0, 3151.0, 1297.0, 570.0, 301.0, 164.0, 95.0, 58.0, 43.0, 31.0, 24.0, 17.0, 11.0, 4.0, 6.0, 1.0, 8.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.291015625, -0.2822303771972656, -0.27344512939453125, -0.2646598815917969, -0.2558746337890625, -0.24708938598632812, -0.23830413818359375, -0.22951889038085938, -0.220733642578125, -0.21194839477539062, -0.20316314697265625, -0.19437789916992188, -0.1855926513671875, -0.17680740356445312, -0.16802215576171875, -0.15923690795898438, -0.15045166015625, -0.14166641235351562, -0.13288116455078125, -0.12409591674804688, -0.1153106689453125, -0.10652542114257812, -0.09774017333984375, -0.08895492553710938, -0.080169677734375, -0.07138442993164062, -0.06259918212890625, -0.053813934326171875, -0.0450286865234375, -0.036243438720703125, -0.02745819091796875, -0.018672943115234375, -0.0098876953125, -0.001102447509765625, 0.00768280029296875, 0.016468048095703125, 0.0252532958984375, 0.034038543701171875, 0.04282379150390625, 0.051609039306640625, 0.060394287109375, 0.06917953491210938, 0.07796478271484375, 0.08675003051757812, 0.0955352783203125, 0.10432052612304688, 0.11310577392578125, 0.12189102172851562, 0.13067626953125, 0.13946151733398438, 0.14824676513671875, 0.15703201293945312, 0.1658172607421875, 0.17460250854492188, 0.18338775634765625, 0.19217300415039062, 0.200958251953125, 0.20974349975585938, 0.21852874755859375, 0.22731399536132812, 0.2360992431640625, 0.24488449096679688, 0.25366973876953125, 0.2624549865722656, 0.271240234375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 7.0, 2.0, 3.0, 6.0, 3.0, 10.0, 16.0, 25.0, 32.0, 51.0, 89.0, 233.0, 243.0, 107.0, 49.0, 40.0, 21.0, 18.0, 13.0, 7.0, 9.0, 3.0, 4.0, 0.0, 2.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9802322387695312e-05, -2.8242357075214386e-05, -2.668239176273346e-05, -2.5122426450252533e-05, -2.3562461137771606e-05, -2.200249582529068e-05, -2.0442530512809753e-05, -1.8882565200328827e-05, -1.73225998878479e-05, -1.5762634575366974e-05, -1.4202669262886047e-05, -1.2642703950405121e-05, -1.1082738637924194e-05, -9.522773325443268e-06, -7.962808012962341e-06, -6.402842700481415e-06, -4.842877388000488e-06, -3.2829120755195618e-06, -1.7229467630386353e-06, -1.6298145055770874e-07, 1.3969838619232178e-06, 2.9569491744041443e-06, 4.516914486885071e-06, 6.076879799365997e-06, 7.636845111846924e-06, 9.19681042432785e-06, 1.0756775736808777e-05, 1.2316741049289703e-05, 1.387670636177063e-05, 1.5436671674251556e-05, 1.6996636986732483e-05, 1.855660229921341e-05, 2.0116567611694336e-05, 2.1676532924175262e-05, 2.323649823665619e-05, 2.4796463549137115e-05, 2.6356428861618042e-05, 2.791639417409897e-05, 2.9476359486579895e-05, 3.103632479906082e-05, 3.259629011154175e-05, 3.4156255424022675e-05, 3.57162207365036e-05, 3.727618604898453e-05, 3.8836151361465454e-05, 4.039611667394638e-05, 4.195608198642731e-05, 4.3516047298908234e-05, 4.507601261138916e-05, 4.663597792387009e-05, 4.819594323635101e-05, 4.975590854883194e-05, 5.1315873861312866e-05, 5.287583917379379e-05, 5.443580448627472e-05, 5.5995769798755646e-05, 5.755573511123657e-05, 5.91157004237175e-05, 6.0675665736198425e-05, 6.223563104867935e-05, 6.379559636116028e-05, 6.53555616736412e-05, 6.691552698612213e-05, 6.847549229860306e-05, 7.003545761108398e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 5.0, 9.0, 18.0, 12.0, 26.0, 41.0, 46.0, 65.0, 126.0, 248.0, 454.0, 884.0, 2165.0, 5158.0, 15802.0, 75197.0, 794811.0, 120863.0, 21388.0, 6402.0, 2465.0, 1157.0, 502.0, 306.0, 150.0, 79.0, 42.0, 34.0, 30.0, 21.0, 10.0, 11.0, 6.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.31591796875, -0.3065185546875, -0.297119140625, -0.2877197265625, -0.2783203125, -0.2689208984375, -0.259521484375, -0.2501220703125, -0.24072265625, -0.2313232421875, -0.221923828125, -0.2125244140625, -0.203125, -0.1937255859375, -0.184326171875, -0.1749267578125, -0.16552734375, -0.1561279296875, -0.146728515625, -0.1373291015625, -0.1279296875, -0.1185302734375, -0.109130859375, -0.0997314453125, -0.09033203125, -0.0809326171875, -0.071533203125, -0.0621337890625, -0.052734375, -0.0433349609375, -0.033935546875, -0.0245361328125, -0.01513671875, -0.0057373046875, 0.003662109375, 0.0130615234375, 0.0224609375, 0.0318603515625, 0.041259765625, 0.0506591796875, 0.06005859375, 0.0694580078125, 0.078857421875, 0.0882568359375, 0.09765625, 0.1070556640625, 0.116455078125, 0.1258544921875, 0.13525390625, 0.1446533203125, 0.154052734375, 0.1634521484375, 0.1728515625, 0.1822509765625, 0.191650390625, 0.2010498046875, 0.21044921875, 0.2198486328125, 0.229248046875, 0.2386474609375, 0.248046875, 0.2574462890625, 0.266845703125, 0.2762451171875, 0.28564453125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 5.0, 3.0, 7.0, 16.0, 18.0, 13.0, 19.0, 24.0, 35.0, 43.0, 51.0, 86.0, 183.0, 152.0, 99.0, 36.0, 40.0, 42.0, 24.0, 19.0, 16.0, 12.0, 11.0, 8.0, 8.0, 4.0, 3.0, 3.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10699462890625, -0.10364055633544922, -0.10028648376464844, -0.09693241119384766, -0.09357833862304688, -0.0902242660522461, -0.08687019348144531, -0.08351612091064453, -0.08016204833984375, -0.07680797576904297, -0.07345390319824219, -0.0700998306274414, -0.06674575805664062, -0.06339168548583984, -0.06003761291503906, -0.05668354034423828, -0.0533294677734375, -0.04997539520263672, -0.04662132263183594, -0.043267250061035156, -0.039913177490234375, -0.036559104919433594, -0.03320503234863281, -0.02985095977783203, -0.02649688720703125, -0.02314281463623047, -0.019788742065429688, -0.016434669494628906, -0.013080596923828125, -0.009726524353027344, -0.0063724517822265625, -0.0030183792114257812, 0.000335693359375, 0.0036897659301757812, 0.0070438385009765625, 0.010397911071777344, 0.013751983642578125, 0.017106056213378906, 0.020460128784179688, 0.02381420135498047, 0.02716827392578125, 0.03052234649658203, 0.03387641906738281, 0.037230491638183594, 0.040584564208984375, 0.043938636779785156, 0.04729270935058594, 0.05064678192138672, 0.0540008544921875, 0.05735492706298828, 0.06070899963378906, 0.06406307220458984, 0.06741714477539062, 0.0707712173461914, 0.07412528991699219, 0.07747936248779297, 0.08083343505859375, 0.08418750762939453, 0.08754158020019531, 0.0908956527709961, 0.09424972534179688, 0.09760379791259766, 0.10095787048339844, 0.10431194305419922, 0.107666015625]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 6.0, 12.0, 23.0, 54.0, 82.0, 149.0, 185.0, 190.0, 131.0, 74.0, 44.0, 14.0, 12.0, 10.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.311061382293701, -4.1314697265625, -3.9518778324127197, -3.7722859382629395, -3.5926942825317383, -3.413102388381958, -3.2335104942321777, -3.0539188385009766, -2.8743271827697754, -2.694735288619995, -2.515143632888794, -2.3355517387390137, -2.1559600830078125, -1.9763681888580322, -1.7967764139175415, -1.6171846389770508, -1.4375927448272705, -1.2580009698867798, -1.078409194946289, -0.8988173604011536, -0.7192255854606628, -0.5396338105201721, -0.3600419759750366, -0.1804502010345459, -0.0008584260940551758, 0.17873336374759674, 0.35832515358924866, 0.5379169583320618, 0.7175087332725525, 0.8971005082130432, 1.0766923427581787, 1.2562841176986694, 1.4358758926391602, 1.6154676675796509, 1.7950594425201416, 1.9746513366699219, 2.154242992401123, 2.3338348865509033, 2.5134267807006836, 2.6930184364318848, 2.872610092163086, 3.052201986312866, 3.2317936420440674, 3.4113855361938477, 3.590977191925049, 3.770569086074829, 3.9501609802246094, 4.1297526359558105, 4.309344291687012, 4.488935947418213, 4.668528079986572, 4.848119735717773, 5.027711391448975, 5.207303047180176, 5.386895179748535, 5.566486835479736, 5.746078968048096, 5.925670623779297, 6.105262756347656, 6.284854412078857, 6.464446067810059, 6.64403772354126, 6.823629856109619, 7.00322151184082, 7.1828131675720215]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 11.0, 7.0, 8.0, 17.0, 35.0, 31.0, 47.0, 57.0, 59.0, 64.0, 83.0, 82.0, 75.0, 66.0, 71.0, 69.0, 55.0, 42.0, 34.0, 30.0, 24.0, 23.0, 11.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.78622817993164, -8.4733247756958, -8.160421371459961, -7.847517490386963, -7.534614086151123, -7.221710681915283, -6.908806800842285, -6.595903396606445, -6.2829999923706055, -5.970096588134766, -5.657193183898926, -5.344289302825928, -5.031385898590088, -4.718482494354248, -4.40557861328125, -4.09267520904541, -3.7797718048095703, -3.4668684005737305, -3.1539647579193115, -2.8410611152648926, -2.5281577110290527, -2.215254306793213, -1.902350664138794, -1.589447021484375, -1.2765436172485352, -0.9636400938034058, -0.6507365703582764, -0.337833046913147, -0.024929523468017578, 0.2879739999771118, 0.6008775234222412, 0.9137811660766602, 1.2266836166381836, 1.539587140083313, 1.8524906635284424, 2.1653943061828613, 2.478297710418701, 2.791201114654541, 3.10410475730896, 3.417008399963379, 3.7299118041992188, 4.042815208435059, 4.355718612670898, 4.6686224937438965, 4.981525897979736, 5.294429302215576, 5.607333183288574, 5.920236587524414, 6.233139991760254, 6.546043395996094, 6.858946800231934, 7.171850681304932, 7.4847540855407715, 7.797657489776611, 8.11056137084961, 8.42346477508545, 8.736368179321289, 9.049271583557129, 9.362174987792969, 9.675078392028809, 9.987981796264648, 10.300886154174805, 10.613789558410645, 10.926692962646484, 11.239596366882324]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 4.0, 13.0, 12.0, 15.0, 20.0, 50.0, 60.0, 87.0, 148.0, 256.0, 456.0, 895.0, 2026.0, 5999.0, 30868.0, 775834.0, 3264716.0, 94787.0, 12236.0, 3231.0, 1203.0, 557.0, 319.0, 184.0, 119.0, 57.0, 39.0, 29.0, 22.0, 12.0, 12.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.029296875, -2.913726806640625, -2.79815673828125, -2.682586669921875, -2.5670166015625, -2.451446533203125, -2.33587646484375, -2.220306396484375, -2.104736328125, -1.989166259765625, -1.87359619140625, -1.758026123046875, -1.6424560546875, -1.526885986328125, -1.41131591796875, -1.295745849609375, -1.18017578125, -1.064605712890625, -0.94903564453125, -0.833465576171875, -0.7178955078125, -0.602325439453125, -0.48675537109375, -0.371185302734375, -0.255615234375, -0.140045166015625, -0.02447509765625, 0.091094970703125, 0.2066650390625, 0.322235107421875, 0.43780517578125, 0.553375244140625, 0.6689453125, 0.784515380859375, 0.90008544921875, 1.015655517578125, 1.1312255859375, 1.246795654296875, 1.36236572265625, 1.477935791015625, 1.593505859375, 1.709075927734375, 1.82464599609375, 1.940216064453125, 2.0557861328125, 2.171356201171875, 2.28692626953125, 2.402496337890625, 2.51806640625, 2.633636474609375, 2.74920654296875, 2.864776611328125, 2.9803466796875, 3.095916748046875, 3.21148681640625, 3.327056884765625, 3.442626953125, 3.558197021484375, 3.67376708984375, 3.789337158203125, 3.9049072265625, 4.020477294921875, 4.13604736328125, 4.251617431640625, 4.3671875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 7.0, 21.0, 25.0, 30.0, 40.0, 60.0, 83.0, 78.0, 96.0, 91.0, 101.0, 103.0, 71.0, 52.0, 34.0, 35.0, 22.0, 10.0, 12.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.271484375, -2.198974609375, -2.12646484375, -2.053955078125, -1.9814453125, -1.908935546875, -1.83642578125, -1.763916015625, -1.69140625, -1.618896484375, -1.54638671875, -1.473876953125, -1.4013671875, -1.328857421875, -1.25634765625, -1.183837890625, -1.111328125, -1.038818359375, -0.96630859375, -0.893798828125, -0.8212890625, -0.748779296875, -0.67626953125, -0.603759765625, -0.53125, -0.458740234375, -0.38623046875, -0.313720703125, -0.2412109375, -0.168701171875, -0.09619140625, -0.023681640625, 0.048828125, 0.121337890625, 0.19384765625, 0.266357421875, 0.3388671875, 0.411376953125, 0.48388671875, 0.556396484375, 0.62890625, 0.701416015625, 0.77392578125, 0.846435546875, 0.9189453125, 0.991455078125, 1.06396484375, 1.136474609375, 1.208984375, 1.281494140625, 1.35400390625, 1.426513671875, 1.4990234375, 1.571533203125, 1.64404296875, 1.716552734375, 1.7890625, 1.861572265625, 1.93408203125, 2.006591796875, 2.0791015625, 2.151611328125, 2.22412109375, 2.296630859375, 2.369140625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 5.0, 8.0, 11.0, 25.0, 22.0, 41.0, 99.0, 200.0, 598.0, 2368.0, 14515.0, 647725.0, 3500968.0, 23215.0, 3234.0, 734.0, 272.0, 110.0, 60.0, 15.0, 19.0, 10.0, 8.0, 6.0, 8.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7734375, -4.60357666015625, -4.4337158203125, -4.26385498046875, -4.093994140625, -3.92413330078125, -3.7542724609375, -3.58441162109375, -3.41455078125, -3.24468994140625, -3.0748291015625, -2.90496826171875, -2.735107421875, -2.56524658203125, -2.3953857421875, -2.22552490234375, -2.0556640625, -1.88580322265625, -1.7159423828125, -1.54608154296875, -1.376220703125, -1.20635986328125, -1.0364990234375, -0.86663818359375, -0.69677734375, -0.52691650390625, -0.3570556640625, -0.18719482421875, -0.017333984375, 0.15252685546875, 0.3223876953125, 0.49224853515625, 0.662109375, 0.83197021484375, 1.0018310546875, 1.17169189453125, 1.341552734375, 1.51141357421875, 1.6812744140625, 1.85113525390625, 2.02099609375, 2.19085693359375, 2.3607177734375, 2.53057861328125, 2.700439453125, 2.87030029296875, 3.0401611328125, 3.21002197265625, 3.3798828125, 3.54974365234375, 3.7196044921875, 3.88946533203125, 4.059326171875, 4.22918701171875, 4.3990478515625, 4.56890869140625, 4.73876953125, 4.90863037109375, 5.0784912109375, 5.24835205078125, 5.418212890625, 5.58807373046875, 5.7579345703125, 5.92779541015625, 6.09765625]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 7.0, 9.0, 6.0, 12.0, 10.0, 19.0, 23.0, 33.0, 61.0, 77.0, 133.0, 308.0, 725.0, 1140.0, 741.0, 350.0, 148.0, 85.0, 58.0, 30.0, 21.0, 20.0, 13.0, 11.0, 8.0, 7.0, 7.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.939453125, -0.91229248046875, -0.8851318359375, -0.85797119140625, -0.830810546875, -0.80364990234375, -0.7764892578125, -0.74932861328125, -0.72216796875, -0.69500732421875, -0.6678466796875, -0.64068603515625, -0.613525390625, -0.58636474609375, -0.5592041015625, -0.53204345703125, -0.5048828125, -0.47772216796875, -0.4505615234375, -0.42340087890625, -0.396240234375, -0.36907958984375, -0.3419189453125, -0.31475830078125, -0.28759765625, -0.26043701171875, -0.2332763671875, -0.20611572265625, -0.178955078125, -0.15179443359375, -0.1246337890625, -0.09747314453125, -0.0703125, -0.04315185546875, -0.0159912109375, 0.01116943359375, 0.038330078125, 0.06549072265625, 0.0926513671875, 0.11981201171875, 0.14697265625, 0.17413330078125, 0.2012939453125, 0.22845458984375, 0.255615234375, 0.28277587890625, 0.3099365234375, 0.33709716796875, 0.3642578125, 0.39141845703125, 0.4185791015625, 0.44573974609375, 0.472900390625, 0.50006103515625, 0.5272216796875, 0.55438232421875, 0.58154296875, 0.60870361328125, 0.6358642578125, 0.66302490234375, 0.690185546875, 0.71734619140625, 0.7445068359375, 0.77166748046875, 0.798828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 10.0, 11.0, 20.0, 39.0, 55.0, 95.0, 127.0, 181.0, 145.0, 116.0, 83.0, 45.0, 22.0, 15.0, 8.0, 11.0, 4.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5279645919799805, -3.410412073135376, -3.2928597927093506, -3.175307273864746, -3.0577549934387207, -2.940202474594116, -2.8226499557495117, -2.7050976753234863, -2.587545156478882, -2.4699926376342773, -2.352440357208252, -2.2348878383636475, -2.117335319519043, -1.9997830390930176, -1.882230520248413, -1.7646781206130981, -1.6471257209777832, -1.5295733213424683, -1.4120209217071533, -1.2944684028625488, -1.1769160032272339, -1.059363603591919, -0.9418111443519592, -0.8242586851119995, -0.7067062854766846, -0.5891538858413696, -0.4716014266014099, -0.3540489971637726, -0.23649656772613525, -0.11894416809082031, -0.0013917088508605957, 0.11616075038909912, 0.23371338844299316, 0.3512658178806305, 0.4688182473182678, 0.5863707065582275, 0.7039231061935425, 0.8214755058288574, 0.9390279650688171, 1.0565804243087769, 1.1741328239440918, 1.2916852235794067, 1.4092376232147217, 1.5267901420593262, 1.6443425416946411, 1.761894941329956, 1.8794474601745605, 1.9969998598098755, 2.1145522594451904, 2.232104778289795, 2.3496570587158203, 2.467209577560425, 2.5847620964050293, 2.7023143768310547, 2.819866895675659, 2.9374194145202637, 3.054971694946289, 3.1725242137908936, 3.290076494216919, 3.4076290130615234, 3.525181293487549, 3.6427338123321533, 3.760286331176758, 3.877838611602783, 3.9953911304473877]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 6.0, 3.0, 6.0, 12.0, 13.0, 25.0, 31.0, 40.0, 47.0, 57.0, 67.0, 74.0, 72.0, 73.0, 86.0, 55.0, 52.0, 66.0, 48.0, 43.0, 33.0, 29.0, 13.0, 16.0, 7.0, 11.0, 6.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8239723443984985, -1.7498902082443237, -1.675808072090149, -1.6017259359359741, -1.5276439189910889, -1.453561782836914, -1.3794796466827393, -1.3053975105285645, -1.2313153743743896, -1.1572332382202148, -1.08315110206604, -1.0090689659118652, -0.9349868893623352, -0.8609047532081604, -0.7868226766586304, -0.7127405405044556, -0.6386584043502808, -0.564576268196106, -0.49049416184425354, -0.4164120554924011, -0.3423299193382263, -0.2682477831840515, -0.1941656768321991, -0.12008357048034668, -0.046001434326171875, 0.028080686926841736, 0.10216280817985535, 0.17624492943286896, 0.25032705068588257, 0.3244091868400574, 0.3984912931919098, 0.4725733995437622, 0.5466554164886475, 0.6207375526428223, 0.6948196887969971, 0.7689017653465271, 0.8429839015007019, 0.9170660376548767, 0.9911481142044067, 1.0652302503585815, 1.1393123865127563, 1.2133945226669312, 1.287476658821106, 1.3615587949752808, 1.435640811920166, 1.5097229480743408, 1.5838050842285156, 1.6578872203826904, 1.7319693565368652, 1.80605149269104, 1.8801336288452148, 1.9542157649993896, 2.0282979011535645, 2.1023800373077393, 2.176462173461914, 2.2505440711975098, 2.3246264457702637, 2.3987085819244385, 2.4727907180786133, 2.546872854232788, 2.620954990386963, 2.6950371265411377, 2.7691192626953125, 2.843201160430908, 2.917283296585083]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 2.0, 6.0, 4.0, 12.0, 12.0, 27.0, 37.0, 57.0, 90.0, 167.0, 277.0, 526.0, 1117.0, 2656.0, 7787.0, 30810.0, 232855.0, 662866.0, 85321.0, 15796.0, 4700.0, 1742.0, 794.0, 374.0, 192.0, 121.0, 70.0, 47.0, 30.0, 15.0, 15.0, 11.0, 4.0, 8.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.412109375, -0.39893341064453125, -0.3857574462890625, -0.37258148193359375, -0.359405517578125, -0.34622955322265625, -0.3330535888671875, -0.31987762451171875, -0.30670166015625, -0.29352569580078125, -0.2803497314453125, -0.26717376708984375, -0.253997802734375, -0.24082183837890625, -0.2276458740234375, -0.21446990966796875, -0.2012939453125, -0.18811798095703125, -0.1749420166015625, -0.16176605224609375, -0.148590087890625, -0.13541412353515625, -0.1222381591796875, -0.10906219482421875, -0.09588623046875, -0.08271026611328125, -0.0695343017578125, -0.05635833740234375, -0.043182373046875, -0.03000640869140625, -0.0168304443359375, -0.00365447998046875, 0.009521484375, 0.02269744873046875, 0.0358734130859375, 0.04904937744140625, 0.062225341796875, 0.07540130615234375, 0.0885772705078125, 0.10175323486328125, 0.11492919921875, 0.12810516357421875, 0.1412811279296875, 0.15445709228515625, 0.167633056640625, 0.18080902099609375, 0.1939849853515625, 0.20716094970703125, 0.2203369140625, 0.23351287841796875, 0.2466888427734375, 0.25986480712890625, 0.273040771484375, 0.28621673583984375, 0.2993927001953125, 0.31256866455078125, 0.32574462890625, 0.33892059326171875, 0.3520965576171875, 0.36527252197265625, 0.378448486328125, 0.39162445068359375, 0.4048004150390625, 0.41797637939453125, 0.43115234375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 12.0, 14.0, 17.0, 34.0, 51.0, 63.0, 91.0, 99.0, 107.0, 111.0, 77.0, 80.0, 61.0, 65.0, 42.0, 24.0, 10.0, 14.0, 6.0, 11.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0859375, -2.021087646484375, -1.95623779296875, -1.891387939453125, -1.8265380859375, -1.761688232421875, -1.69683837890625, -1.631988525390625, -1.567138671875, -1.502288818359375, -1.43743896484375, -1.372589111328125, -1.3077392578125, -1.242889404296875, -1.17803955078125, -1.113189697265625, -1.04833984375, -0.983489990234375, -0.91864013671875, -0.853790283203125, -0.7889404296875, -0.724090576171875, -0.65924072265625, -0.594390869140625, -0.529541015625, -0.464691162109375, -0.39984130859375, -0.334991455078125, -0.2701416015625, -0.205291748046875, -0.14044189453125, -0.075592041015625, -0.0107421875, 0.054107666015625, 0.11895751953125, 0.183807373046875, 0.2486572265625, 0.313507080078125, 0.37835693359375, 0.443206787109375, 0.508056640625, 0.572906494140625, 0.63775634765625, 0.702606201171875, 0.7674560546875, 0.832305908203125, 0.89715576171875, 0.962005615234375, 1.02685546875, 1.091705322265625, 1.15655517578125, 1.221405029296875, 1.2862548828125, 1.351104736328125, 1.41595458984375, 1.480804443359375, 1.545654296875, 1.610504150390625, 1.67535400390625, 1.740203857421875, 1.8050537109375, 1.869903564453125, 1.93475341796875, 1.999603271484375, 2.064453125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 11.0, 3.0, 18.0, 29.0, 19.0, 44.0, 67.0, 89.0, 145.0, 256.0, 401.0, 679.0, 1148.0, 1910.0, 3206.0, 5614.0, 10239.0, 19149.0, 37044.0, 74557.0, 160213.0, 292722.0, 226710.0, 106699.0, 51434.0, 25841.0, 13307.0, 7140.0, 4072.0, 2300.0, 1383.0, 850.0, 484.0, 271.0, 192.0, 107.0, 66.0, 47.0, 29.0, 19.0, 14.0, 15.0, 4.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08697509765625, -0.08394908905029297, -0.08092308044433594, -0.0778970718383789, -0.07487106323242188, -0.07184505462646484, -0.06881904602050781, -0.06579303741455078, -0.06276702880859375, -0.05974102020263672, -0.05671501159667969, -0.053689002990722656, -0.050662994384765625, -0.047636985778808594, -0.04461097717285156, -0.04158496856689453, -0.0385589599609375, -0.03553295135498047, -0.03250694274902344, -0.029480934143066406, -0.026454925537109375, -0.023428916931152344, -0.020402908325195312, -0.01737689971923828, -0.01435089111328125, -0.011324882507324219, -0.008298873901367188, -0.005272865295410156, -0.002246856689453125, 0.0007791519165039062, 0.0038051605224609375, 0.006831169128417969, 0.009857177734375, 0.012883186340332031, 0.015909194946289062, 0.018935203552246094, 0.021961212158203125, 0.024987220764160156, 0.028013229370117188, 0.03103923797607422, 0.03406524658203125, 0.03709125518798828, 0.04011726379394531, 0.043143272399902344, 0.046169281005859375, 0.049195289611816406, 0.05222129821777344, 0.05524730682373047, 0.0582733154296875, 0.06129932403564453, 0.06432533264160156, 0.0673513412475586, 0.07037734985351562, 0.07340335845947266, 0.07642936706542969, 0.07945537567138672, 0.08248138427734375, 0.08550739288330078, 0.08853340148925781, 0.09155941009521484, 0.09458541870117188, 0.0976114273071289, 0.10063743591308594, 0.10366344451904297, 0.106689453125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 4.0, 6.0, 9.0, 2.0, 8.0, 9.0, 4.0, 6.0, 17.0, 18.0, 23.0, 19.0, 28.0, 27.0, 20.0, 37.0, 36.0, 41.0, 47.0, 44.0, 46.0, 58.0, 43.0, 42.0, 43.0, 31.0, 45.0, 28.0, 31.0, 25.0, 32.0, 25.0, 23.0, 20.0, 19.0, 15.0, 14.0, 15.0, 6.0, 5.0, 5.0, 6.0, 3.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.771484375, -1.715850830078125, -1.66021728515625, -1.604583740234375, -1.5489501953125, -1.493316650390625, -1.43768310546875, -1.382049560546875, -1.326416015625, -1.270782470703125, -1.21514892578125, -1.159515380859375, -1.1038818359375, -1.048248291015625, -0.99261474609375, -0.936981201171875, -0.88134765625, -0.825714111328125, -0.77008056640625, -0.714447021484375, -0.6588134765625, -0.603179931640625, -0.54754638671875, -0.491912841796875, -0.436279296875, -0.380645751953125, -0.32501220703125, -0.269378662109375, -0.2137451171875, -0.158111572265625, -0.10247802734375, -0.046844482421875, 0.0087890625, 0.064422607421875, 0.12005615234375, 0.175689697265625, 0.2313232421875, 0.286956787109375, 0.34259033203125, 0.398223876953125, 0.453857421875, 0.509490966796875, 0.56512451171875, 0.620758056640625, 0.6763916015625, 0.732025146484375, 0.78765869140625, 0.843292236328125, 0.89892578125, 0.954559326171875, 1.01019287109375, 1.065826416015625, 1.1214599609375, 1.177093505859375, 1.23272705078125, 1.288360595703125, 1.343994140625, 1.399627685546875, 1.45526123046875, 1.510894775390625, 1.5665283203125, 1.622161865234375, 1.67779541015625, 1.733428955078125, 1.7890625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 13.0, 10.0, 10.0, 25.0, 28.0, 56.0, 74.0, 105.0, 143.0, 211.0, 337.0, 565.0, 889.0, 1655.0, 3132.0, 7255.0, 20114.0, 71003.0, 441407.0, 402935.0, 65951.0, 18799.0, 6917.0, 3039.0, 1567.0, 860.0, 499.0, 330.0, 197.0, 138.0, 86.0, 66.0, 38.0, 31.0, 21.0, 16.0, 9.0, 7.0, 2.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.028106689453125, -0.027199268341064453, -0.026291847229003906, -0.02538442611694336, -0.024477005004882812, -0.023569583892822266, -0.02266216278076172, -0.021754741668701172, -0.020847320556640625, -0.019939899444580078, -0.01903247833251953, -0.018125057220458984, -0.017217636108398438, -0.01631021499633789, -0.015402793884277344, -0.014495372772216797, -0.01358795166015625, -0.012680530548095703, -0.011773109436035156, -0.01086568832397461, -0.009958267211914062, -0.009050846099853516, -0.008143424987792969, -0.007236003875732422, -0.006328582763671875, -0.005421161651611328, -0.004513740539550781, -0.0036063194274902344, -0.0026988983154296875, -0.0017914772033691406, -0.0008840560913085938, 2.3365020751953125e-05, 0.0009307861328125, 0.0018382072448730469, 0.0027456283569335938, 0.0036530494689941406, 0.0045604705810546875, 0.005467891693115234, 0.006375312805175781, 0.007282733917236328, 0.008190155029296875, 0.009097576141357422, 0.010004997253417969, 0.010912418365478516, 0.011819839477539062, 0.01272726058959961, 0.013634681701660156, 0.014542102813720703, 0.01544952392578125, 0.016356945037841797, 0.017264366149902344, 0.01817178726196289, 0.019079208374023438, 0.019986629486083984, 0.02089405059814453, 0.021801471710205078, 0.022708892822265625, 0.023616313934326172, 0.02452373504638672, 0.025431156158447266, 0.026338577270507812, 0.02724599838256836, 0.028153419494628906, 0.029060840606689453, 0.02996826171875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 4.0, 6.0, 14.0, 5.0, 10.0, 20.0, 22.0, 26.0, 30.0, 44.0, 59.0, 75.0, 92.0, 106.0, 73.0, 88.0, 74.0, 63.0, 52.0, 33.0, 21.0, 22.0, 13.0, 14.0, 8.0, 4.0, 6.0, 4.0, 2.0, 0.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.0100345611572266e-05, -2.8935261070728302e-05, -2.777017652988434e-05, -2.6605091989040375e-05, -2.544000744819641e-05, -2.4274922907352448e-05, -2.3109838366508484e-05, -2.194475382566452e-05, -2.0779669284820557e-05, -1.9614584743976593e-05, -1.844950020313263e-05, -1.7284415662288666e-05, -1.6119331121444702e-05, -1.4954246580600739e-05, -1.3789162039756775e-05, -1.2624077498912811e-05, -1.1458992958068848e-05, -1.0293908417224884e-05, -9.12882387638092e-06, -7.963739335536957e-06, -6.798654794692993e-06, -5.6335702538490295e-06, -4.468485713005066e-06, -3.3034011721611023e-06, -2.1383166313171387e-06, -9.73232090473175e-07, 1.9185245037078857e-07, 1.3569369912147522e-06, 2.522021532058716e-06, 3.6871060729026794e-06, 4.852190613746643e-06, 6.017275154590607e-06, 7.18235969543457e-06, 8.347444236278534e-06, 9.512528777122498e-06, 1.0677613317966461e-05, 1.1842697858810425e-05, 1.3007782399654388e-05, 1.4172866940498352e-05, 1.5337951481342316e-05, 1.650303602218628e-05, 1.7668120563030243e-05, 1.8833205103874207e-05, 1.999828964471817e-05, 2.1163374185562134e-05, 2.2328458726406097e-05, 2.349354326725006e-05, 2.4658627808094025e-05, 2.5823712348937988e-05, 2.6988796889781952e-05, 2.8153881430625916e-05, 2.931896597146988e-05, 3.0484050512313843e-05, 3.1649135053157806e-05, 3.281421959400177e-05, 3.3979304134845734e-05, 3.51443886756897e-05, 3.630947321653366e-05, 3.7474557757377625e-05, 3.863964229822159e-05, 3.980472683906555e-05, 4.0969811379909515e-05, 4.213489592075348e-05, 4.329998046159744e-05, 4.4465065002441406e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 6.0, 4.0, 9.0, 12.0, 17.0, 26.0, 34.0, 44.0, 76.0, 119.0, 200.0, 323.0, 652.0, 1335.0, 3650.0, 10222.0, 39441.0, 287405.0, 610198.0, 70304.0, 15775.0, 5048.0, 1825.0, 816.0, 383.0, 202.0, 138.0, 90.0, 63.0, 46.0, 32.0, 9.0, 11.0, 13.0, 8.0, 6.0, 7.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.041015625, -0.039815425872802734, -0.03861522674560547, -0.0374150276184082, -0.03621482849121094, -0.03501462936401367, -0.033814430236816406, -0.03261423110961914, -0.031414031982421875, -0.03021383285522461, -0.029013633728027344, -0.027813434600830078, -0.026613235473632812, -0.025413036346435547, -0.02421283721923828, -0.023012638092041016, -0.02181243896484375, -0.020612239837646484, -0.01941204071044922, -0.018211841583251953, -0.017011642456054688, -0.015811443328857422, -0.014611244201660156, -0.01341104507446289, -0.012210845947265625, -0.01101064682006836, -0.009810447692871094, -0.008610248565673828, -0.0074100494384765625, -0.006209850311279297, -0.005009651184082031, -0.0038094520568847656, -0.0026092529296875, -0.0014090538024902344, -0.00020885467529296875, 0.0009913444519042969, 0.0021915435791015625, 0.003391742706298828, 0.004591941833496094, 0.005792140960693359, 0.006992340087890625, 0.00819253921508789, 0.009392738342285156, 0.010592937469482422, 0.011793136596679688, 0.012993335723876953, 0.014193534851074219, 0.015393733978271484, 0.01659393310546875, 0.017794132232666016, 0.01899433135986328, 0.020194530487060547, 0.021394729614257812, 0.022594928741455078, 0.023795127868652344, 0.02499532699584961, 0.026195526123046875, 0.02739572525024414, 0.028595924377441406, 0.029796123504638672, 0.030996322631835938, 0.0321965217590332, 0.03339672088623047, 0.034596920013427734, 0.035797119140625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 4.0, 5.0, 6.0, 14.0, 6.0, 13.0, 14.0, 15.0, 20.0, 31.0, 44.0, 61.0, 108.0, 170.0, 118.0, 104.0, 52.0, 47.0, 42.0, 21.0, 20.0, 17.0, 12.0, 6.0, 12.0, 8.0, 7.0, 3.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00946044921875, -0.0091552734375, -0.00885009765625, -0.008544921875, -0.00823974609375, -0.0079345703125, -0.00762939453125, -0.00732421875, -0.00701904296875, -0.0067138671875, -0.00640869140625, -0.006103515625, -0.00579833984375, -0.0054931640625, -0.00518798828125, -0.0048828125, -0.00457763671875, -0.0042724609375, -0.00396728515625, -0.003662109375, -0.00335693359375, -0.0030517578125, -0.00274658203125, -0.00244140625, -0.00213623046875, -0.0018310546875, -0.00152587890625, -0.001220703125, -0.00091552734375, -0.0006103515625, -0.00030517578125, 0.0, 0.00030517578125, 0.0006103515625, 0.00091552734375, 0.001220703125, 0.00152587890625, 0.0018310546875, 0.00213623046875, 0.00244140625, 0.00274658203125, 0.0030517578125, 0.00335693359375, 0.003662109375, 0.00396728515625, 0.0042724609375, 0.00457763671875, 0.0048828125, 0.00518798828125, 0.0054931640625, 0.00579833984375, 0.006103515625, 0.00640869140625, 0.0067138671875, 0.00701904296875, 0.00732421875, 0.00762939453125, 0.0079345703125, 0.00823974609375, 0.008544921875, 0.00885009765625, 0.0091552734375, 0.00946044921875, 0.009765625, 0.01007080078125]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 17.0, 42.0, 89.0, 168.0, 243.0, 203.0, 121.0, 46.0, 22.0, 13.0, 10.0, 7.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.777898073196411, -2.674182176589966, -2.5704662799835205, -2.466750383377075, -2.36303448677063, -2.2593185901641846, -2.1556026935577393, -2.051886796951294, -1.9481709003448486, -1.8444550037384033, -1.740739107131958, -1.6370232105255127, -1.5333073139190674, -1.429591417312622, -1.3258755207061768, -1.2221596240997314, -1.1184436082839966, -1.0147277116775513, -0.911011815071106, -0.8072959184646606, -0.7035800218582153, -0.5998640656471252, -0.49614816904067993, -0.3924322724342346, -0.2887163758277893, -0.185000479221344, -0.08128456771373749, 0.02243134379386902, 0.12614724040031433, 0.22986316680908203, 0.33357906341552734, 0.43729496002197266, 0.541010856628418, 0.6447267532348633, 0.7484426498413086, 0.8521585464477539, 0.9558744430541992, 1.0595903396606445, 1.1633062362670898, 1.2670221328735352, 1.3707380294799805, 1.4744539260864258, 1.578169822692871, 1.6818857192993164, 1.7856016159057617, 1.889317512512207, 1.9930334091186523, 2.0967493057250977, 2.200465202331543, 2.3041810989379883, 2.4078969955444336, 2.511612892150879, 2.615328788757324, 2.7190446853637695, 2.822760581970215, 2.92647647857666, 3.0301926136016846, 3.13390851020813, 3.237624406814575, 3.3413403034210205, 3.445056200027466, 3.548772096633911, 3.6524879932403564, 3.7562038898468018, 3.859919786453247]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 8.0, 5.0, 11.0, 16.0, 26.0, 46.0, 60.0, 75.0, 102.0, 109.0, 117.0, 91.0, 85.0, 74.0, 61.0, 41.0, 26.0, 19.0, 10.0, 9.0, 9.0, 3.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9391765594482422, -1.8735145330429077, -1.8078523874282837, -1.7421903610229492, -1.6765282154083252, -1.6108661890029907, -1.5452041625976562, -1.4795420169830322, -1.4138798713684082, -1.3482178449630737, -1.2825556993484497, -1.2168936729431152, -1.1512315273284912, -1.0855695009231567, -1.0199074745178223, -0.9542453289031982, -0.8885833024978638, -0.8229212164878845, -0.7572591304779053, -0.6915971040725708, -0.6259349584579468, -0.5602729320526123, -0.49461084604263306, -0.4289487600326538, -0.36328667402267456, -0.2976245880126953, -0.23196251690387726, -0.1663004457950592, -0.10063835978507996, -0.03497627377510071, 0.030685782432556152, 0.0963478684425354, 0.16200995445251465, 0.2276720404624939, 0.29333412647247314, 0.35899618268013, 0.42465826869010925, 0.4903203547000885, 0.5559824109077454, 0.6216444969177246, 0.6873065829277039, 0.7529686689376831, 0.8186307549476624, 0.8842928409576416, 0.9499548673629761, 1.0156170129776, 1.0812790393829346, 1.1469411849975586, 1.212603211402893, 1.2782652378082275, 1.3439273834228516, 1.409589409828186, 1.47525155544281, 1.5409135818481445, 1.6065757274627686, 1.672237753868103, 1.7378997802734375, 1.803561806678772, 1.869223952293396, 1.9348859786987305, 2.0005481243133545, 2.0662102699279785, 2.1318721771240234, 2.1975343227386475, 2.2631964683532715]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 6.0, 7.0, 16.0, 26.0, 32.0, 62.0, 101.0, 174.0, 353.0, 776.0, 2545.0, 14040.0, 246993.0, 746796.0, 30372.0, 4153.0, 1150.0, 434.0, 220.0, 114.0, 52.0, 49.0, 34.0, 18.0, 5.0, 8.0, 7.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2265625, -1.1884307861328125, -1.150299072265625, -1.1121673583984375, -1.07403564453125, -1.0359039306640625, -0.997772216796875, -0.9596405029296875, -0.9215087890625, -0.8833770751953125, -0.845245361328125, -0.8071136474609375, -0.76898193359375, -0.7308502197265625, -0.692718505859375, -0.6545867919921875, -0.616455078125, -0.5783233642578125, -0.540191650390625, -0.5020599365234375, -0.46392822265625, -0.4257965087890625, -0.387664794921875, -0.3495330810546875, -0.3114013671875, -0.2732696533203125, -0.235137939453125, -0.1970062255859375, -0.15887451171875, -0.1207427978515625, -0.082611083984375, -0.0444793701171875, -0.00634765625, 0.0317840576171875, 0.069915771484375, 0.1080474853515625, 0.14617919921875, 0.1843109130859375, 0.222442626953125, 0.2605743408203125, 0.2987060546875, 0.3368377685546875, 0.374969482421875, 0.4131011962890625, 0.45123291015625, 0.4893646240234375, 0.527496337890625, 0.5656280517578125, 0.603759765625, 0.6418914794921875, 0.680023193359375, 0.7181549072265625, 0.75628662109375, 0.7944183349609375, 0.832550048828125, 0.8706817626953125, 0.9088134765625, 0.9469451904296875, 0.985076904296875, 1.0232086181640625, 1.06134033203125, 1.0994720458984375, 1.137603759765625, 1.1757354736328125, 1.2138671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 5.0, 9.0, 11.0, 30.0, 31.0, 34.0, 61.0, 70.0, 91.0, 69.0, 105.0, 109.0, 68.0, 79.0, 64.0, 43.0, 35.0, 24.0, 17.0, 15.0, 10.0, 9.0, 6.0, 2.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.494140625, -3.373199462890625, -3.25225830078125, -3.131317138671875, -3.0103759765625, -2.889434814453125, -2.76849365234375, -2.647552490234375, -2.526611328125, -2.405670166015625, -2.28472900390625, -2.163787841796875, -2.0428466796875, -1.921905517578125, -1.80096435546875, -1.680023193359375, -1.55908203125, -1.438140869140625, -1.31719970703125, -1.196258544921875, -1.0753173828125, -0.954376220703125, -0.83343505859375, -0.712493896484375, -0.591552734375, -0.470611572265625, -0.34967041015625, -0.228729248046875, -0.1077880859375, 0.013153076171875, 0.13409423828125, 0.255035400390625, 0.3759765625, 0.496917724609375, 0.61785888671875, 0.738800048828125, 0.8597412109375, 0.980682373046875, 1.10162353515625, 1.222564697265625, 1.343505859375, 1.464447021484375, 1.58538818359375, 1.706329345703125, 1.8272705078125, 1.948211669921875, 2.06915283203125, 2.190093994140625, 2.31103515625, 2.431976318359375, 2.55291748046875, 2.673858642578125, 2.7947998046875, 2.915740966796875, 3.03668212890625, 3.157623291015625, 3.278564453125, 3.399505615234375, 3.52044677734375, 3.641387939453125, 3.7623291015625, 3.883270263671875, 4.00421142578125, 4.125152587890625, 4.24609375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 5.0, 8.0, 5.0, 10.0, 15.0, 21.0, 18.0, 23.0, 28.0, 40.0, 43.0, 60.0, 117.0, 392.0, 22435.0, 1024134.0, 764.0, 123.0, 65.0, 44.0, 49.0, 29.0, 30.0, 24.0, 15.0, 10.0, 12.0, 10.0, 9.0, 5.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.51953125, -6.30322265625, -6.0869140625, -5.87060546875, -5.654296875, -5.43798828125, -5.2216796875, -5.00537109375, -4.7890625, -4.57275390625, -4.3564453125, -4.14013671875, -3.923828125, -3.70751953125, -3.4912109375, -3.27490234375, -3.05859375, -2.84228515625, -2.6259765625, -2.40966796875, -2.193359375, -1.97705078125, -1.7607421875, -1.54443359375, -1.328125, -1.11181640625, -0.8955078125, -0.67919921875, -0.462890625, -0.24658203125, -0.0302734375, 0.18603515625, 0.40234375, 0.61865234375, 0.8349609375, 1.05126953125, 1.267578125, 1.48388671875, 1.7001953125, 1.91650390625, 2.1328125, 2.34912109375, 2.5654296875, 2.78173828125, 2.998046875, 3.21435546875, 3.4306640625, 3.64697265625, 3.86328125, 4.07958984375, 4.2958984375, 4.51220703125, 4.728515625, 4.94482421875, 5.1611328125, 5.37744140625, 5.59375, 5.81005859375, 6.0263671875, 6.24267578125, 6.458984375, 6.67529296875, 6.8916015625, 7.10791015625, 7.32421875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 1.0, 6.0, 4.0, 6.0, 10.0, 15.0, 20.0, 18.0, 22.0, 33.0, 38.0, 46.0, 55.0, 76.0, 70.0, 77.0, 84.0, 68.0, 79.0, 51.0, 35.0, 47.0, 35.0, 25.0, 18.0, 16.0, 15.0, 8.0, 5.0, 9.0, 2.0, 7.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.8984375, -3.7686767578125, -3.638916015625, -3.5091552734375, -3.37939453125, -3.2496337890625, -3.119873046875, -2.9901123046875, -2.8603515625, -2.7305908203125, -2.600830078125, -2.4710693359375, -2.34130859375, -2.2115478515625, -2.081787109375, -1.9520263671875, -1.822265625, -1.6925048828125, -1.562744140625, -1.4329833984375, -1.30322265625, -1.1734619140625, -1.043701171875, -0.9139404296875, -0.7841796875, -0.6544189453125, -0.524658203125, -0.3948974609375, -0.26513671875, -0.1353759765625, -0.005615234375, 0.1241455078125, 0.25390625, 0.3836669921875, 0.513427734375, 0.6431884765625, 0.77294921875, 0.9027099609375, 1.032470703125, 1.1622314453125, 1.2919921875, 1.4217529296875, 1.551513671875, 1.6812744140625, 1.81103515625, 1.9407958984375, 2.070556640625, 2.2003173828125, 2.330078125, 2.4598388671875, 2.589599609375, 2.7193603515625, 2.84912109375, 2.9788818359375, 3.108642578125, 3.2384033203125, 3.3681640625, 3.4979248046875, 3.627685546875, 3.7574462890625, 3.88720703125, 4.0169677734375, 4.146728515625, 4.2764892578125, 4.40625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 3.0, 4.0, 3.0, 8.0, 8.0, 14.0, 22.0, 29.0, 62.0, 106.0, 211.0, 422.0, 749.0, 1706.0, 3801.0, 10272.0, 1005235.0, 16650.0, 5042.0, 2074.0, 1083.0, 439.0, 259.0, 168.0, 68.0, 27.0, 32.0, 17.0, 12.0, 5.0, 4.0, 5.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.7080078125, -1.6626434326171875, -1.617279052734375, -1.5719146728515625, -1.52655029296875, -1.4811859130859375, -1.435821533203125, -1.3904571533203125, -1.3450927734375, -1.2997283935546875, -1.254364013671875, -1.2089996337890625, -1.16363525390625, -1.1182708740234375, -1.072906494140625, -1.0275421142578125, -0.982177734375, -0.9368133544921875, -0.891448974609375, -0.8460845947265625, -0.80072021484375, -0.7553558349609375, -0.709991455078125, -0.6646270751953125, -0.6192626953125, -0.5738983154296875, -0.528533935546875, -0.4831695556640625, -0.43780517578125, -0.3924407958984375, -0.347076416015625, -0.3017120361328125, -0.25634765625, -0.2109832763671875, -0.165618896484375, -0.1202545166015625, -0.07489013671875, -0.0295257568359375, 0.015838623046875, 0.0612030029296875, 0.1065673828125, 0.1519317626953125, 0.197296142578125, 0.2426605224609375, 0.28802490234375, 0.3333892822265625, 0.378753662109375, 0.4241180419921875, 0.469482421875, 0.5148468017578125, 0.560211181640625, 0.6055755615234375, 0.65093994140625, 0.6963043212890625, 0.741668701171875, 0.7870330810546875, 0.8323974609375, 0.8777618408203125, 0.923126220703125, 0.9684906005859375, 1.01385498046875, 1.0592193603515625, 1.104583740234375, 1.1499481201171875, 1.1953125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 20.0, 128.0, 758.0, 61.0, 9.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016689300537109375, -0.00016005337238311768, -0.0001532137393951416, -0.00014637410640716553, -0.00013953447341918945, -0.00013269484043121338, -0.0001258552074432373, -0.00011901557445526123, -0.00011217594146728516, -0.00010533630847930908, -9.849667549133301e-05, -9.165704250335693e-05, -8.481740951538086e-05, -7.797777652740479e-05, -7.113814353942871e-05, -6.429851055145264e-05, -5.745887756347656e-05, -5.061924457550049e-05, -4.3779611587524414e-05, -3.693997859954834e-05, -3.0100345611572266e-05, -2.326071262359619e-05, -1.6421079635620117e-05, -9.581446647644043e-06, -2.7418136596679688e-06, 4.0978193283081055e-06, 1.093745231628418e-05, 1.7777085304260254e-05, 2.4616718292236328e-05, 3.14563512802124e-05, 3.8295984268188477e-05, 4.513561725616455e-05, 5.1975250244140625e-05, 5.88148832321167e-05, 6.565451622009277e-05, 7.249414920806885e-05, 7.933378219604492e-05, 8.6173415184021e-05, 9.301304817199707e-05, 9.985268115997314e-05, 0.00010669231414794922, 0.00011353194713592529, 0.00012037158012390137, 0.00012721121311187744, 0.00013405084609985352, 0.0001408904790878296, 0.00014773011207580566, 0.00015456974506378174, 0.0001614093780517578, 0.0001682490110397339, 0.00017508864402770996, 0.00018192827701568604, 0.0001887679100036621, 0.00019560754299163818, 0.00020244717597961426, 0.00020928680896759033, 0.0002161264419555664, 0.00022296607494354248, 0.00022980570793151855, 0.00023664534091949463, 0.0002434849739074707, 0.0002503246068954468, 0.00025716423988342285, 0.0002640038728713989, 0.000270843505859375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 9.0, 18.0, 20.0, 41.0, 40.0, 55.0, 125.0, 206.0, 299.0, 526.0, 970.0, 1765.0, 3536.0, 7438.0, 320006.0, 698201.0, 7515.0, 3581.0, 1784.0, 1014.0, 525.0, 343.0, 173.0, 127.0, 76.0, 47.0, 27.0, 28.0, 19.0, 10.0, 7.0, 6.0, 5.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5390625, -1.4963226318359375, -1.453582763671875, -1.4108428955078125, -1.36810302734375, -1.3253631591796875, -1.282623291015625, -1.2398834228515625, -1.1971435546875, -1.1544036865234375, -1.111663818359375, -1.0689239501953125, -1.02618408203125, -0.9834442138671875, -0.940704345703125, -0.8979644775390625, -0.855224609375, -0.8124847412109375, -0.769744873046875, -0.7270050048828125, -0.68426513671875, -0.6415252685546875, -0.598785400390625, -0.5560455322265625, -0.5133056640625, -0.4705657958984375, -0.427825927734375, -0.3850860595703125, -0.34234619140625, -0.2996063232421875, -0.256866455078125, -0.2141265869140625, -0.17138671875, -0.1286468505859375, -0.085906982421875, -0.0431671142578125, -0.00042724609375, 0.0423126220703125, 0.085052490234375, 0.1277923583984375, 0.1705322265625, 0.2132720947265625, 0.256011962890625, 0.2987518310546875, 0.34149169921875, 0.3842315673828125, 0.426971435546875, 0.4697113037109375, 0.512451171875, 0.5551910400390625, 0.597930908203125, 0.6406707763671875, 0.68341064453125, 0.7261505126953125, 0.768890380859375, 0.8116302490234375, 0.8543701171875, 0.8971099853515625, 0.939849853515625, 0.9825897216796875, 1.02532958984375, 1.0680694580078125, 1.110809326171875, 1.1535491943359375, 1.1962890625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 4.0, 8.0, 21.0, 596.0, 327.0, 13.0, 7.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.599609375, -0.578155517578125, -0.55670166015625, -0.535247802734375, -0.5137939453125, -0.492340087890625, -0.47088623046875, -0.449432373046875, -0.427978515625, -0.406524658203125, -0.38507080078125, -0.363616943359375, -0.3421630859375, -0.320709228515625, -0.29925537109375, -0.277801513671875, -0.25634765625, -0.234893798828125, -0.21343994140625, -0.191986083984375, -0.1705322265625, -0.149078369140625, -0.12762451171875, -0.106170654296875, -0.084716796875, -0.063262939453125, -0.04180908203125, -0.020355224609375, 0.0010986328125, 0.022552490234375, 0.04400634765625, 0.065460205078125, 0.0869140625, 0.108367919921875, 0.12982177734375, 0.151275634765625, 0.1727294921875, 0.194183349609375, 0.21563720703125, 0.237091064453125, 0.258544921875, 0.279998779296875, 0.30145263671875, 0.322906494140625, 0.3443603515625, 0.365814208984375, 0.38726806640625, 0.408721923828125, 0.43017578125, 0.451629638671875, 0.47308349609375, 0.494537353515625, 0.5159912109375, 0.537445068359375, 0.55889892578125, 0.580352783203125, 0.601806640625, 0.623260498046875, 0.64471435546875, 0.666168212890625, 0.6876220703125, 0.709075927734375, 0.73052978515625, 0.751983642578125, 0.7734375]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 14.0, 35.0, 87.0, 251.0, 341.0, 180.0, 63.0, 16.0, 11.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9980034828186035, -2.641268253326416, -2.2845330238342285, -1.9277979135513306, -1.571062684059143, -1.2143274545669556, -0.8575923442840576, -0.5008571147918701, -0.14412188529968262, 0.2126133143901825, 0.5693485140800476, 0.9260836839675903, 1.2828189134597778, 1.6395541429519653, 1.9962892532348633, 2.353024482727051, 2.7097597122192383, 3.066494941711426, 3.4232301712036133, 3.779965400695801, 4.136700630187988, 4.493435859680176, 4.850171089172363, 5.206906318664551, 5.563641548156738, 5.920376777648926, 6.277112007141113, 6.633847236633301, 6.990582466125488, 7.347317695617676, 7.704052925109863, 8.06078815460205, 8.417523384094238, 8.774258613586426, 9.130993843078613, 9.4877290725708, 9.844464302062988, 10.201199531555176, 10.557934761047363, 10.91466999053955, 11.271405220031738, 11.628140449523926, 11.984875679016113, 12.3416109085083, 12.698346138000488, 13.055081367492676, 13.411816596984863, 13.76855182647705, 14.125286102294922, 14.48202133178711, 14.838756561279297, 15.195491790771484, 15.552227020263672, 15.90896224975586, 16.265697479248047, 16.622432708740234, 16.979167938232422, 17.33590316772461, 17.692638397216797, 18.049373626708984, 18.406108856201172, 18.76284408569336, 19.119579315185547, 19.476314544677734, 19.833049774169922]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 8.0, 10.0, 12.0, 15.0, 16.0, 14.0, 15.0, 22.0, 22.0, 30.0, 22.0, 35.0, 50.0, 43.0, 44.0, 50.0, 31.0, 60.0, 49.0, 41.0, 52.0, 45.0, 46.0, 38.0, 25.0, 33.0, 30.0, 31.0, 27.0, 22.0, 11.0, 10.0, 8.0, 4.0, 9.0, 6.0, 8.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.792844295501709, -4.644896030426025, -4.496947765350342, -4.348999500274658, -4.201051235198975, -4.053102970123291, -3.9051544666290283, -3.7572062015533447, -3.609257936477661, -3.4613096714019775, -3.313361406326294, -3.1654131412506104, -3.0174646377563477, -2.869516372680664, -2.7215681076049805, -2.573619842529297, -2.4256715774536133, -2.2777233123779297, -2.129775047302246, -1.981826663017273, -1.8338783979415894, -1.6859301328659058, -1.5379817485809326, -1.390033483505249, -1.2420852184295654, -1.0941369533538818, -0.9461886286735535, -0.7982403039932251, -0.6502920389175415, -0.5023437738418579, -0.35439544916152954, -0.20644712448120117, -0.05849885940551758, 0.0894494354724884, 0.23739773035049438, 0.38534602522850037, 0.5332943201065063, 0.6812425851821899, 0.8291909098625183, 0.9771392345428467, 1.1250874996185303, 1.2730357646942139, 1.4209840297698975, 1.5689324140548706, 1.7168806791305542, 1.8648289442062378, 2.012777328491211, 2.1607255935668945, 2.308673858642578, 2.4566221237182617, 2.6045703887939453, 2.752518653869629, 2.9004669189453125, 3.048415184020996, 3.196363687515259, 3.3443119525909424, 3.492260217666626, 3.6402084827423096, 3.788156747817993, 3.9361050128936768, 4.0840535163879395, 4.232001781463623, 4.379950046539307, 4.52789831161499, 4.675846576690674]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 1.0, 8.0, 6.0, 6.0, 12.0, 19.0, 23.0, 25.0, 35.0, 37.0, 64.0, 100.0, 151.0, 276.0, 499.0, 995.0, 1719.0, 3932.0, 11635.0, 59181.0, 1424247.0, 2578877.0, 87428.0, 15223.0, 4984.0, 2196.0, 1062.0, 602.0, 332.0, 201.0, 122.0, 85.0, 59.0, 35.0, 32.0, 20.0, 18.0, 8.0, 6.0, 6.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.177734375, -3.075531005859375, -2.97332763671875, -2.871124267578125, -2.7689208984375, -2.666717529296875, -2.56451416015625, -2.462310791015625, -2.360107421875, -2.257904052734375, -2.15570068359375, -2.053497314453125, -1.9512939453125, -1.849090576171875, -1.74688720703125, -1.644683837890625, -1.54248046875, -1.440277099609375, -1.33807373046875, -1.235870361328125, -1.1336669921875, -1.031463623046875, -0.92926025390625, -0.827056884765625, -0.724853515625, -0.622650146484375, -0.52044677734375, -0.418243408203125, -0.3160400390625, -0.213836669921875, -0.11163330078125, -0.009429931640625, 0.0927734375, 0.194976806640625, 0.29718017578125, 0.399383544921875, 0.5015869140625, 0.603790283203125, 0.70599365234375, 0.808197021484375, 0.910400390625, 1.012603759765625, 1.11480712890625, 1.217010498046875, 1.3192138671875, 1.421417236328125, 1.52362060546875, 1.625823974609375, 1.72802734375, 1.830230712890625, 1.93243408203125, 2.034637451171875, 2.1368408203125, 2.239044189453125, 2.34124755859375, 2.443450927734375, 2.545654296875, 2.647857666015625, 2.75006103515625, 2.852264404296875, 2.9544677734375, 3.056671142578125, 3.15887451171875, 3.261077880859375, 3.36328125]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 7.0, 3.0, 8.0, 20.0, 14.0, 25.0, 40.0, 44.0, 46.0, 58.0, 76.0, 83.0, 88.0, 84.0, 69.0, 73.0, 49.0, 53.0, 41.0, 27.0, 32.0, 16.0, 13.0, 10.0, 5.0, 7.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6611328125, -1.605682373046875, -1.55023193359375, -1.494781494140625, -1.4393310546875, -1.383880615234375, -1.32843017578125, -1.272979736328125, -1.217529296875, -1.162078857421875, -1.10662841796875, -1.051177978515625, -0.9957275390625, -0.940277099609375, -0.88482666015625, -0.829376220703125, -0.77392578125, -0.718475341796875, -0.66302490234375, -0.607574462890625, -0.5521240234375, -0.496673583984375, -0.44122314453125, -0.385772705078125, -0.330322265625, -0.274871826171875, -0.21942138671875, -0.163970947265625, -0.1085205078125, -0.053070068359375, 0.00238037109375, 0.057830810546875, 0.11328125, 0.168731689453125, 0.22418212890625, 0.279632568359375, 0.3350830078125, 0.390533447265625, 0.44598388671875, 0.501434326171875, 0.556884765625, 0.612335205078125, 0.66778564453125, 0.723236083984375, 0.7786865234375, 0.834136962890625, 0.88958740234375, 0.945037841796875, 1.00048828125, 1.055938720703125, 1.11138916015625, 1.166839599609375, 1.2222900390625, 1.277740478515625, 1.33319091796875, 1.388641357421875, 1.444091796875, 1.499542236328125, 1.55499267578125, 1.610443115234375, 1.6658935546875, 1.721343994140625, 1.77679443359375, 1.832244873046875, 1.8876953125]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 10.0, 13.0, 24.0, 59.0, 150.0, 424.0, 2028.0, 20653.0, 3966311.0, 196884.0, 6379.0, 933.0, 244.0, 86.0, 45.0, 14.0, 10.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.671875, -11.42236328125, -11.1728515625, -10.92333984375, -10.673828125, -10.42431640625, -10.1748046875, -9.92529296875, -9.67578125, -9.42626953125, -9.1767578125, -8.92724609375, -8.677734375, -8.42822265625, -8.1787109375, -7.92919921875, -7.6796875, -7.43017578125, -7.1806640625, -6.93115234375, -6.681640625, -6.43212890625, -6.1826171875, -5.93310546875, -5.68359375, -5.43408203125, -5.1845703125, -4.93505859375, -4.685546875, -4.43603515625, -4.1865234375, -3.93701171875, -3.6875, -3.43798828125, -3.1884765625, -2.93896484375, -2.689453125, -2.43994140625, -2.1904296875, -1.94091796875, -1.69140625, -1.44189453125, -1.1923828125, -0.94287109375, -0.693359375, -0.44384765625, -0.1943359375, 0.05517578125, 0.3046875, 0.55419921875, 0.8037109375, 1.05322265625, 1.302734375, 1.55224609375, 1.8017578125, 2.05126953125, 2.30078125, 2.55029296875, 2.7998046875, 3.04931640625, 3.298828125, 3.54833984375, 3.7978515625, 4.04736328125, 4.296875]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 3.0, 4.0, 10.0, 7.0, 4.0, 14.0, 19.0, 20.0, 34.0, 39.0, 70.0, 106.0, 219.0, 474.0, 905.0, 955.0, 535.0, 283.0, 116.0, 75.0, 40.0, 34.0, 24.0, 21.0, 14.0, 6.0, 11.0, 12.0, 5.0, 3.0, 0.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63720703125, -0.6084213256835938, -0.5796356201171875, -0.5508499145507812, -0.522064208984375, -0.49327850341796875, -0.4644927978515625, -0.43570709228515625, -0.40692138671875, -0.37813568115234375, -0.3493499755859375, -0.32056427001953125, -0.291778564453125, -0.26299285888671875, -0.2342071533203125, -0.20542144775390625, -0.1766357421875, -0.14785003662109375, -0.1190643310546875, -0.09027862548828125, -0.061492919921875, -0.03270721435546875, -0.0039215087890625, 0.02486419677734375, 0.05364990234375, 0.08243560791015625, 0.1112213134765625, 0.14000701904296875, 0.168792724609375, 0.19757843017578125, 0.2263641357421875, 0.25514984130859375, 0.283935546875, 0.31272125244140625, 0.3415069580078125, 0.37029266357421875, 0.399078369140625, 0.42786407470703125, 0.4566497802734375, 0.48543548583984375, 0.51422119140625, 0.5430068969726562, 0.5717926025390625, 0.6005783081054688, 0.629364013671875, 0.6581497192382812, 0.6869354248046875, 0.7157211303710938, 0.7445068359375, 0.7732925415039062, 0.8020782470703125, 0.8308639526367188, 0.859649658203125, 0.8884353637695312, 0.9172210693359375, 0.9460067749023438, 0.97479248046875, 1.0035781860351562, 1.0323638916015625, 1.0611495971679688, 1.089935302734375, 1.1187210083007812, 1.1475067138671875, 1.1762924194335938, 1.205078125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 9.0, 13.0, 17.0, 16.0, 24.0, 28.0, 55.0, 54.0, 73.0, 107.0, 97.0, 86.0, 93.0, 86.0, 70.0, 40.0, 29.0, 24.0, 24.0, 15.0, 9.0, 11.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6273624897003174, -2.54500412940979, -2.4626457691192627, -2.3802874088287354, -2.297929048538208, -2.2155706882476807, -2.1332123279571533, -2.050853729248047, -1.968495488166809, -1.8861371278762817, -1.8037787675857544, -1.721420407295227, -1.6390619277954102, -1.5567035675048828, -1.4743452072143555, -1.3919868469238281, -1.3096284866333008, -1.2272701263427734, -1.144911766052246, -1.0625534057617188, -0.9801949858665466, -0.8978366255760193, -0.8154782056808472, -0.7331198453903198, -0.6507614850997925, -0.5684031248092651, -0.4860447347164154, -0.4036863446235657, -0.32132798433303833, -0.238969624042511, -0.15661123394966125, -0.07425284385681152, 0.00810551643371582, 0.09046389162540436, 0.1728222668170929, 0.2551806569099426, 0.33753901720046997, 0.4198973774909973, 0.5022557973861694, 0.5846141576766968, 0.6669725179672241, 0.7493308782577515, 0.8316892385482788, 0.9140476584434509, 0.9964060187339783, 1.0787644386291504, 1.1611227989196777, 1.243481159210205, 1.3258395195007324, 1.4081978797912598, 1.490556240081787, 1.5729146003723145, 1.6552729606628418, 1.7376313209533691, 1.819989800453186, 1.9023481607437134, 1.9847065210342407, 2.0670650005340576, 2.149423360824585, 2.2317817211151123, 2.3141400814056396, 2.396498441696167, 2.4788568019866943, 2.5612151622772217, 2.643573522567749]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 1.0, 4.0, 8.0, 11.0, 13.0, 17.0, 12.0, 25.0, 32.0, 36.0, 33.0, 37.0, 43.0, 47.0, 43.0, 44.0, 57.0, 47.0, 59.0, 58.0, 57.0, 56.0, 35.0, 39.0, 40.0, 20.0, 30.0, 19.0, 20.0, 17.0, 13.0, 8.0, 9.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8371407985687256, -1.777982473373413, -1.718824028968811, -1.6596657037734985, -1.6005072593688965, -1.541348934173584, -1.4821906089782715, -1.423032283782959, -1.363873839378357, -1.3047155141830444, -1.2455570697784424, -1.1863987445831299, -1.1272404193878174, -1.0680819749832153, -1.0089236497879028, -0.9497652649879456, -0.8906068801879883, -0.831448495388031, -0.7722901105880737, -0.7131317853927612, -0.653973400592804, -0.5948150157928467, -0.5356566905975342, -0.4764983057975769, -0.41733992099761963, -0.35818153619766235, -0.29902318120002747, -0.23986481130123138, -0.1807064414024353, -0.12154805660247803, -0.06238970160484314, -0.003231346607208252, 0.055927157402038574, 0.11508552730083466, 0.17424389719963074, 0.23340226709842682, 0.2925606369972229, 0.3517190217971802, 0.41087737679481506, 0.47003573179244995, 0.5291941165924072, 0.5883525013923645, 0.6475108861923218, 0.7066692113876343, 0.7658275961875916, 0.8249859809875488, 0.8841443061828613, 0.9433026909828186, 1.0024610757827759, 1.0616194009780884, 1.1207778453826904, 1.179936170578003, 1.2390944957733154, 1.2982529401779175, 1.35741126537323, 1.416569709777832, 1.4757280349731445, 1.534886360168457, 1.594044804573059, 1.6532031297683716, 1.7123615741729736, 1.7715198993682861, 1.8306782245635986, 1.8898365497589111, 1.9489949941635132]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 8.0, 9.0, 15.0, 18.0, 16.0, 47.0, 58.0, 55.0, 98.0, 172.0, 304.0, 442.0, 810.0, 1577.0, 3669.0, 11565.0, 58575.0, 539780.0, 373595.0, 41947.0, 9302.0, 3154.0, 1429.0, 773.0, 415.0, 236.0, 143.0, 110.0, 67.0, 49.0, 29.0, 28.0, 16.0, 10.0, 8.0, 11.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.56689453125, -0.5501785278320312, -0.5334625244140625, -0.5167465209960938, -0.500030517578125, -0.48331451416015625, -0.4665985107421875, -0.44988250732421875, -0.43316650390625, -0.41645050048828125, -0.3997344970703125, -0.38301849365234375, -0.366302490234375, -0.34958648681640625, -0.3328704833984375, -0.31615447998046875, -0.2994384765625, -0.28272247314453125, -0.2660064697265625, -0.24929046630859375, -0.232574462890625, -0.21585845947265625, -0.1991424560546875, -0.18242645263671875, -0.16571044921875, -0.14899444580078125, -0.1322784423828125, -0.11556243896484375, -0.098846435546875, -0.08213043212890625, -0.0654144287109375, -0.04869842529296875, -0.031982421875, -0.01526641845703125, 0.0014495849609375, 0.01816558837890625, 0.034881591796875, 0.05159759521484375, 0.0683135986328125, 0.08502960205078125, 0.10174560546875, 0.11846160888671875, 0.1351776123046875, 0.15189361572265625, 0.168609619140625, 0.18532562255859375, 0.2020416259765625, 0.21875762939453125, 0.2354736328125, 0.25218963623046875, 0.2689056396484375, 0.28562164306640625, 0.302337646484375, 0.31905364990234375, 0.3357696533203125, 0.35248565673828125, 0.36920166015625, 0.38591766357421875, 0.4026336669921875, 0.41934967041015625, 0.436065673828125, 0.45278167724609375, 0.4694976806640625, 0.48621368408203125, 0.5029296875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 8.0, 6.0, 4.0, 13.0, 13.0, 19.0, 24.0, 32.0, 26.0, 39.0, 36.0, 47.0, 40.0, 63.0, 68.0, 70.0, 47.0, 64.0, 61.0, 59.0, 50.0, 44.0, 44.0, 35.0, 28.0, 10.0, 17.0, 13.0, 10.0, 6.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4033203125, -1.3549652099609375, -1.306610107421875, -1.2582550048828125, -1.20989990234375, -1.1615447998046875, -1.113189697265625, -1.0648345947265625, -1.0164794921875, -0.9681243896484375, -0.919769287109375, -0.8714141845703125, -0.82305908203125, -0.7747039794921875, -0.726348876953125, -0.6779937744140625, -0.629638671875, -0.5812835693359375, -0.532928466796875, -0.4845733642578125, -0.43621826171875, -0.3878631591796875, -0.339508056640625, -0.2911529541015625, -0.2427978515625, -0.1944427490234375, -0.146087646484375, -0.0977325439453125, -0.04937744140625, -0.0010223388671875, 0.047332763671875, 0.0956878662109375, 0.14404296875, 0.1923980712890625, 0.240753173828125, 0.2891082763671875, 0.33746337890625, 0.3858184814453125, 0.434173583984375, 0.4825286865234375, 0.5308837890625, 0.5792388916015625, 0.627593994140625, 0.6759490966796875, 0.72430419921875, 0.7726593017578125, 0.821014404296875, 0.8693695068359375, 0.917724609375, 0.9660797119140625, 1.014434814453125, 1.0627899169921875, 1.11114501953125, 1.1595001220703125, 1.207855224609375, 1.2562103271484375, 1.3045654296875, 1.3529205322265625, 1.401275634765625, 1.4496307373046875, 1.49798583984375, 1.5463409423828125, 1.594696044921875, 1.6430511474609375, 1.69140625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 5.0, 15.0, 17.0, 18.0, 44.0, 48.0, 61.0, 109.0, 139.0, 246.0, 369.0, 569.0, 830.0, 1341.0, 2216.0, 3444.0, 5879.0, 9913.0, 17328.0, 30389.0, 56255.0, 107541.0, 210461.0, 267376.0, 155675.0, 79552.0, 42805.0, 23303.0, 13098.0, 7754.0, 4481.0, 2715.0, 1666.0, 1063.0, 610.0, 426.0, 257.0, 182.0, 122.0, 87.0, 46.0, 31.0, 23.0, 13.0, 11.0, 8.0, 7.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.111328125, -0.10798263549804688, -0.10463714599609375, -0.10129165649414062, -0.0979461669921875, -0.09460067749023438, -0.09125518798828125, -0.08790969848632812, -0.084564208984375, -0.08121871948242188, -0.07787322998046875, -0.07452774047851562, -0.0711822509765625, -0.06783676147460938, -0.06449127197265625, -0.061145782470703125, -0.05780029296875, -0.054454803466796875, -0.05110931396484375, -0.047763824462890625, -0.0444183349609375, -0.041072845458984375, -0.03772735595703125, -0.034381866455078125, -0.031036376953125, -0.027690887451171875, -0.02434539794921875, -0.020999908447265625, -0.0176544189453125, -0.014308929443359375, -0.01096343994140625, -0.007617950439453125, -0.0042724609375, -0.000926971435546875, 0.00241851806640625, 0.005764007568359375, 0.0091094970703125, 0.012454986572265625, 0.01580047607421875, 0.019145965576171875, 0.022491455078125, 0.025836944580078125, 0.02918243408203125, 0.032527923583984375, 0.0358734130859375, 0.039218902587890625, 0.04256439208984375, 0.045909881591796875, 0.04925537109375, 0.052600860595703125, 0.05594635009765625, 0.059291839599609375, 0.0626373291015625, 0.06598281860351562, 0.06932830810546875, 0.07267379760742188, 0.076019287109375, 0.07936477661132812, 0.08271026611328125, 0.08605575561523438, 0.0894012451171875, 0.09274673461914062, 0.09609222412109375, 0.09943771362304688, 0.102783203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 6.0, 10.0, 6.0, 11.0, 17.0, 18.0, 17.0, 16.0, 15.0, 23.0, 33.0, 33.0, 34.0, 38.0, 42.0, 38.0, 37.0, 47.0, 53.0, 54.0, 35.0, 38.0, 37.0, 35.0, 37.0, 33.0, 34.0, 31.0, 23.0, 24.0, 32.0, 13.0, 12.0, 9.0, 16.0, 9.0, 6.0, 5.0, 1.0, 3.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.48828125, -2.41400146484375, -2.3397216796875, -2.26544189453125, -2.191162109375, -2.11688232421875, -2.0426025390625, -1.96832275390625, -1.89404296875, -1.81976318359375, -1.7454833984375, -1.67120361328125, -1.596923828125, -1.52264404296875, -1.4483642578125, -1.37408447265625, -1.2998046875, -1.22552490234375, -1.1512451171875, -1.07696533203125, -1.002685546875, -0.92840576171875, -0.8541259765625, -0.77984619140625, -0.70556640625, -0.63128662109375, -0.5570068359375, -0.48272705078125, -0.408447265625, -0.33416748046875, -0.2598876953125, -0.18560791015625, -0.111328125, -0.03704833984375, 0.0372314453125, 0.11151123046875, 0.185791015625, 0.26007080078125, 0.3343505859375, 0.40863037109375, 0.48291015625, 0.55718994140625, 0.6314697265625, 0.70574951171875, 0.780029296875, 0.85430908203125, 0.9285888671875, 1.00286865234375, 1.0771484375, 1.15142822265625, 1.2257080078125, 1.29998779296875, 1.374267578125, 1.44854736328125, 1.5228271484375, 1.59710693359375, 1.67138671875, 1.74566650390625, 1.8199462890625, 1.89422607421875, 1.968505859375, 2.04278564453125, 2.1170654296875, 2.19134521484375, 2.265625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 4.0, 5.0, 8.0, 12.0, 9.0, 20.0, 29.0, 46.0, 64.0, 85.0, 166.0, 305.0, 489.0, 962.0, 2434.0, 7614.0, 38901.0, 603728.0, 356492.0, 27126.0, 5967.0, 2053.0, 857.0, 480.0, 281.0, 149.0, 92.0, 55.0, 48.0, 35.0, 19.0, 8.0, 3.0, 1.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055145263671875, -0.05356550216674805, -0.051985740661621094, -0.05040597915649414, -0.04882621765136719, -0.047246456146240234, -0.04566669464111328, -0.04408693313598633, -0.042507171630859375, -0.04092741012573242, -0.03934764862060547, -0.037767887115478516, -0.03618812561035156, -0.03460836410522461, -0.033028602600097656, -0.0314488410949707, -0.02986907958984375, -0.028289318084716797, -0.026709556579589844, -0.02512979507446289, -0.023550033569335938, -0.021970272064208984, -0.02039051055908203, -0.018810749053955078, -0.017230987548828125, -0.015651226043701172, -0.014071464538574219, -0.012491703033447266, -0.010911941528320312, -0.00933218002319336, -0.007752418518066406, -0.006172657012939453, -0.0045928955078125, -0.003013134002685547, -0.0014333724975585938, 0.00014638900756835938, 0.0017261505126953125, 0.0033059120178222656, 0.004885673522949219, 0.006465435028076172, 0.008045196533203125, 0.009624958038330078, 0.011204719543457031, 0.012784481048583984, 0.014364242553710938, 0.01594400405883789, 0.017523765563964844, 0.019103527069091797, 0.02068328857421875, 0.022263050079345703, 0.023842811584472656, 0.02542257308959961, 0.027002334594726562, 0.028582096099853516, 0.03016185760498047, 0.03174161911010742, 0.033321380615234375, 0.03490114212036133, 0.03648090362548828, 0.038060665130615234, 0.03964042663574219, 0.04122018814086914, 0.042799949645996094, 0.04437971115112305, 0.04595947265625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 7.0, 3.0, 6.0, 9.0, 13.0, 11.0, 29.0, 31.0, 43.0, 62.0, 80.0, 125.0, 123.0, 121.0, 97.0, 68.0, 56.0, 34.0, 34.0, 18.0, 16.0, 4.0, 6.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.762411117553711e-05, -4.601571708917618e-05, -4.4407323002815247e-05, -4.2798928916454315e-05, -4.1190534830093384e-05, -3.958214074373245e-05, -3.797374665737152e-05, -3.636535257101059e-05, -3.475695848464966e-05, -3.314856439828873e-05, -3.1540170311927795e-05, -2.9931776225566864e-05, -2.8323382139205933e-05, -2.6714988052845e-05, -2.510659396648407e-05, -2.349819988012314e-05, -2.1889805793762207e-05, -2.0281411707401276e-05, -1.8673017621040344e-05, -1.7064623534679413e-05, -1.545622944831848e-05, -1.384783536195755e-05, -1.2239441275596619e-05, -1.0631047189235687e-05, -9.022653102874756e-06, -7.4142590165138245e-06, -5.805864930152893e-06, -4.197470843791962e-06, -2.5890767574310303e-06, -9.806826710700989e-07, 6.277114152908325e-07, 2.236105501651764e-06, 3.844499588012695e-06, 5.452893674373627e-06, 7.061287760734558e-06, 8.66968184709549e-06, 1.0278075933456421e-05, 1.1886470019817352e-05, 1.3494864106178284e-05, 1.5103258192539215e-05, 1.6711652278900146e-05, 1.8320046365261078e-05, 1.992844045162201e-05, 2.153683453798294e-05, 2.3145228624343872e-05, 2.4753622710704803e-05, 2.6362016797065735e-05, 2.7970410883426666e-05, 2.9578804969787598e-05, 3.118719905614853e-05, 3.279559314250946e-05, 3.440398722887039e-05, 3.601238131523132e-05, 3.7620775401592255e-05, 3.9229169487953186e-05, 4.083756357431412e-05, 4.244595766067505e-05, 4.405435174703598e-05, 4.566274583339691e-05, 4.727113991975784e-05, 4.8879534006118774e-05, 5.0487928092479706e-05, 5.209632217884064e-05, 5.370471626520157e-05, 5.53131103515625e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 8.0, 2.0, 11.0, 11.0, 21.0, 33.0, 48.0, 64.0, 85.0, 153.0, 206.0, 394.0, 656.0, 1343.0, 2527.0, 6532.0, 23394.0, 167618.0, 740913.0, 79931.0, 14948.0, 4943.0, 2117.0, 1035.0, 654.0, 338.0, 227.0, 127.0, 60.0, 43.0, 28.0, 24.0, 16.0, 6.0, 4.0, 7.0, 7.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.051605224609375, -0.050223350524902344, -0.04884147644042969, -0.04745960235595703, -0.046077728271484375, -0.04469585418701172, -0.04331398010253906, -0.041932106018066406, -0.04055023193359375, -0.039168357849121094, -0.03778648376464844, -0.03640460968017578, -0.035022735595703125, -0.03364086151123047, -0.03225898742675781, -0.030877113342285156, -0.0294952392578125, -0.028113365173339844, -0.026731491088867188, -0.02534961700439453, -0.023967742919921875, -0.02258586883544922, -0.021203994750976562, -0.019822120666503906, -0.01844024658203125, -0.017058372497558594, -0.015676498413085938, -0.014294624328613281, -0.012912750244140625, -0.011530876159667969, -0.010149002075195312, -0.008767127990722656, -0.00738525390625, -0.006003379821777344, -0.0046215057373046875, -0.0032396316528320312, -0.001857757568359375, -0.00047588348388671875, 0.0009059906005859375, 0.0022878646850585938, 0.00366973876953125, 0.005051612854003906, 0.0064334869384765625, 0.007815361022949219, 0.009197235107421875, 0.010579109191894531, 0.011960983276367188, 0.013342857360839844, 0.0147247314453125, 0.016106605529785156, 0.017488479614257812, 0.01887035369873047, 0.020252227783203125, 0.02163410186767578, 0.023015975952148438, 0.024397850036621094, 0.02577972412109375, 0.027161598205566406, 0.028543472290039062, 0.02992534637451172, 0.031307220458984375, 0.03268909454345703, 0.03407096862792969, 0.035452842712402344, 0.036834716796875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 9.0, 4.0, 9.0, 4.0, 15.0, 24.0, 16.0, 26.0, 53.0, 89.0, 137.0, 199.0, 165.0, 80.0, 44.0, 38.0, 19.0, 19.0, 10.0, 11.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0097198486328125, -0.009341239929199219, -0.008962631225585938, -0.008584022521972656, -0.008205413818359375, -0.007826805114746094, -0.0074481964111328125, -0.007069587707519531, -0.00669097900390625, -0.006312370300292969, -0.0059337615966796875, -0.005555152893066406, -0.005176544189453125, -0.004797935485839844, -0.0044193267822265625, -0.004040718078613281, -0.003662109375, -0.0032835006713867188, -0.0029048919677734375, -0.0025262832641601562, -0.002147674560546875, -0.0017690658569335938, -0.0013904571533203125, -0.0010118484497070312, -0.00063323974609375, -0.00025463104248046875, 0.0001239776611328125, 0.0005025863647460938, 0.000881195068359375, 0.0012598037719726562, 0.0016384124755859375, 0.0020170211791992188, 0.0023956298828125, 0.0027742385864257812, 0.0031528472900390625, 0.0035314559936523438, 0.003910064697265625, 0.004288673400878906, 0.0046672821044921875, 0.005045890808105469, 0.00542449951171875, 0.005803108215332031, 0.0061817169189453125, 0.006560325622558594, 0.006938934326171875, 0.007317543029785156, 0.0076961517333984375, 0.008074760437011719, 0.008453369140625, 0.008831977844238281, 0.009210586547851562, 0.009589195251464844, 0.009967803955078125, 0.010346412658691406, 0.010725021362304688, 0.011103630065917969, 0.01148223876953125, 0.011860847473144531, 0.012239456176757812, 0.012618064880371094, 0.012996673583984375, 0.013375282287597656, 0.013753890991210938, 0.014132499694824219, 0.0145111083984375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 14.0, 16.0, 31.0, 54.0, 77.0, 117.0, 159.0, 132.0, 138.0, 97.0, 64.0, 34.0, 29.0, 8.0, 11.0, 9.0, 2.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2069525718688965, -2.122865676879883, -2.038778781890869, -1.954691767692566, -1.8706048727035522, -1.7865179777145386, -1.7024309635162354, -1.6183440685272217, -1.534257173538208, -1.4501702785491943, -1.3660833835601807, -1.2819963693618774, -1.1979094743728638, -1.11382257938385, -1.0297355651855469, -0.9456486701965332, -0.8615617752075195, -0.7774748802185059, -0.6933879256248474, -0.609300971031189, -0.5252140760421753, -0.44112715125083923, -0.3570402264595032, -0.2729532718658447, -0.18886637687683105, -0.104779452085495, -0.020692527294158936, 0.06339439749717712, 0.14748132228851318, 0.23156824707984924, 0.3156551718711853, 0.39974212646484375, 0.4838292598724365, 0.5679161548614502, 0.6520031094551086, 0.7360900640487671, 0.8201769590377808, 0.9042638540267944, 0.9883508086204529, 1.0724377632141113, 1.156524658203125, 1.2406115531921387, 1.3246984481811523, 1.4087854623794556, 1.4928723573684692, 1.576959252357483, 1.6610462665557861, 1.7451331615447998, 1.8292200565338135, 1.9133069515228271, 1.9973938465118408, 2.0814807415008545, 2.1655678749084473, 2.249654769897461, 2.3337416648864746, 2.4178285598754883, 2.501915454864502, 2.5860023498535156, 2.6700892448425293, 2.754176139831543, 2.8382630348205566, 2.9223501682281494, 3.006437063217163, 3.0905239582061768, 3.1746108531951904]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 4.0, 7.0, 8.0, 19.0, 13.0, 21.0, 35.0, 39.0, 43.0, 41.0, 52.0, 45.0, 57.0, 67.0, 63.0, 65.0, 66.0, 77.0, 44.0, 54.0, 36.0, 36.0, 28.0, 14.0, 21.0, 13.0, 15.0, 10.0, 6.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4761707782745361, -1.4279824495315552, -1.3797941207885742, -1.3316057920455933, -1.2834174633026123, -1.235229253768921, -1.1870408058166504, -1.138852596282959, -1.090664267539978, -1.042475938796997, -0.9942876100540161, -0.9460992813110352, -0.897911012172699, -0.849722683429718, -0.8015343546867371, -0.7533460855484009, -0.7051576972007751, -0.6569693684577942, -0.6087810397148132, -0.560592770576477, -0.5124044418334961, -0.46421611309051514, -0.4160277843475342, -0.3678394854068756, -0.31965115666389465, -0.2714628279209137, -0.22327452898025513, -0.17508620023727417, -0.1268978863954544, -0.07870957255363464, -0.030521243810653687, 0.017667055130004883, 0.06585538387298584, 0.1140436977148056, 0.16223201155662537, 0.21042034029960632, 0.2586086392402649, 0.30679696798324585, 0.3549852967262268, 0.4031735956668854, 0.45136192440986633, 0.4995502531528473, 0.5477385520935059, 0.5959268808364868, 0.6441152095794678, 0.6923035383224487, 0.7404918670654297, 0.7886801362037659, 0.8368684649467468, 0.8850567936897278, 0.9332451224327087, 0.9814333915710449, 1.0296217203140259, 1.0778100490570068, 1.1259983777999878, 1.1741867065429688, 1.2223750352859497, 1.2705633640289307, 1.3187516927719116, 1.3669400215148926, 1.4151283502578735, 1.4633166790008545, 1.511504888534546, 1.5596932172775269, 1.6078815460205078]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 4.0, 3.0, 8.0, 8.0, 15.0, 26.0, 41.0, 63.0, 109.0, 236.0, 424.0, 896.0, 1993.0, 5069.0, 16577.0, 81093.0, 640000.0, 250879.0, 36223.0, 9043.0, 3166.0, 1305.0, 608.0, 315.0, 191.0, 89.0, 51.0, 39.0, 29.0, 17.0, 6.0, 8.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 5.0], "bins": [-2.201171875, -2.148468017578125, -2.09576416015625, -2.043060302734375, -1.9903564453125, -1.937652587890625, -1.88494873046875, -1.832244873046875, -1.779541015625, -1.726837158203125, -1.67413330078125, -1.621429443359375, -1.5687255859375, -1.516021728515625, -1.46331787109375, -1.410614013671875, -1.35791015625, -1.305206298828125, -1.25250244140625, -1.199798583984375, -1.1470947265625, -1.094390869140625, -1.04168701171875, -0.988983154296875, -0.936279296875, -0.883575439453125, -0.83087158203125, -0.778167724609375, -0.7254638671875, -0.672760009765625, -0.62005615234375, -0.567352294921875, -0.5146484375, -0.461944580078125, -0.40924072265625, -0.356536865234375, -0.3038330078125, -0.251129150390625, -0.19842529296875, -0.145721435546875, -0.093017578125, -0.040313720703125, 0.01239013671875, 0.065093994140625, 0.1177978515625, 0.170501708984375, 0.22320556640625, 0.275909423828125, 0.32861328125, 0.381317138671875, 0.43402099609375, 0.486724853515625, 0.5394287109375, 0.592132568359375, 0.64483642578125, 0.697540283203125, 0.750244140625, 0.802947998046875, 0.85565185546875, 0.908355712890625, 0.9610595703125, 1.013763427734375, 1.06646728515625, 1.119171142578125, 1.171875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 6.0, 3.0, 7.0, 18.0, 19.0, 27.0, 46.0, 43.0, 55.0, 54.0, 82.0, 82.0, 77.0, 91.0, 81.0, 77.0, 59.0, 50.0, 34.0, 32.0, 20.0, 17.0, 12.0, 9.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.48828125, -4.3748779296875, -4.261474609375, -4.1480712890625, -4.03466796875, -3.9212646484375, -3.807861328125, -3.6944580078125, -3.5810546875, -3.4676513671875, -3.354248046875, -3.2408447265625, -3.12744140625, -3.0140380859375, -2.900634765625, -2.7872314453125, -2.673828125, -2.5604248046875, -2.447021484375, -2.3336181640625, -2.22021484375, -2.1068115234375, -1.993408203125, -1.8800048828125, -1.7666015625, -1.6531982421875, -1.539794921875, -1.4263916015625, -1.31298828125, -1.1995849609375, -1.086181640625, -0.9727783203125, -0.859375, -0.7459716796875, -0.632568359375, -0.5191650390625, -0.40576171875, -0.2923583984375, -0.178955078125, -0.0655517578125, 0.0478515625, 0.1612548828125, 0.274658203125, 0.3880615234375, 0.50146484375, 0.6148681640625, 0.728271484375, 0.8416748046875, 0.955078125, 1.0684814453125, 1.181884765625, 1.2952880859375, 1.40869140625, 1.5220947265625, 1.635498046875, 1.7489013671875, 1.8623046875, 1.9757080078125, 2.089111328125, 2.2025146484375, 2.31591796875, 2.4293212890625, 2.542724609375, 2.6561279296875, 2.76953125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 6.0, 5.0, 1.0, 6.0, 8.0, 12.0, 1.0, 8.0, 13.0, 11.0, 15.0, 27.0, 15.0, 26.0, 28.0, 30.0, 31.0, 54.0, 106.0, 246.0, 820.0, 3942.0, 59598.0, 963599.0, 16775.0, 2136.0, 480.0, 172.0, 88.0, 47.0, 49.0, 36.0, 21.0, 19.0, 22.0, 18.0, 14.0, 4.0, 13.0, 12.0, 8.0, 5.0, 7.0, 4.0, 4.0, 6.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0], "bins": [-4.62890625, -4.4857177734375, -4.342529296875, -4.1993408203125, -4.05615234375, -3.9129638671875, -3.769775390625, -3.6265869140625, -3.4833984375, -3.3402099609375, -3.197021484375, -3.0538330078125, -2.91064453125, -2.7674560546875, -2.624267578125, -2.4810791015625, -2.337890625, -2.1947021484375, -2.051513671875, -1.9083251953125, -1.76513671875, -1.6219482421875, -1.478759765625, -1.3355712890625, -1.1923828125, -1.0491943359375, -0.906005859375, -0.7628173828125, -0.61962890625, -0.4764404296875, -0.333251953125, -0.1900634765625, -0.046875, 0.0963134765625, 0.239501953125, 0.3826904296875, 0.52587890625, 0.6690673828125, 0.812255859375, 0.9554443359375, 1.0986328125, 1.2418212890625, 1.385009765625, 1.5281982421875, 1.67138671875, 1.8145751953125, 1.957763671875, 2.1009521484375, 2.244140625, 2.3873291015625, 2.530517578125, 2.6737060546875, 2.81689453125, 2.9600830078125, 3.103271484375, 3.2464599609375, 3.3896484375, 3.5328369140625, 3.676025390625, 3.8192138671875, 3.96240234375, 4.1055908203125, 4.248779296875, 4.3919677734375, 4.53515625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 5.0, 6.0, 5.0, 5.0, 12.0, 7.0, 7.0, 8.0, 23.0, 16.0, 22.0, 21.0, 22.0, 37.0, 33.0, 38.0, 37.0, 35.0, 40.0, 34.0, 42.0, 41.0, 42.0, 47.0, 43.0, 27.0, 37.0, 32.0, 39.0, 33.0, 25.0, 30.0, 21.0, 22.0, 13.0, 9.0, 12.0, 16.0, 11.0, 10.0, 6.0, 7.0, 5.0, 4.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.216796875, -2.14556884765625, -2.0743408203125, -2.00311279296875, -1.931884765625, -1.86065673828125, -1.7894287109375, -1.71820068359375, -1.64697265625, -1.57574462890625, -1.5045166015625, -1.43328857421875, -1.362060546875, -1.29083251953125, -1.2196044921875, -1.14837646484375, -1.0771484375, -1.00592041015625, -0.9346923828125, -0.86346435546875, -0.792236328125, -0.72100830078125, -0.6497802734375, -0.57855224609375, -0.50732421875, -0.43609619140625, -0.3648681640625, -0.29364013671875, -0.222412109375, -0.15118408203125, -0.0799560546875, -0.00872802734375, 0.0625, 0.13372802734375, 0.2049560546875, 0.27618408203125, 0.347412109375, 0.41864013671875, 0.4898681640625, 0.56109619140625, 0.63232421875, 0.70355224609375, 0.7747802734375, 0.84600830078125, 0.917236328125, 0.98846435546875, 1.0596923828125, 1.13092041015625, 1.2021484375, 1.27337646484375, 1.3446044921875, 1.41583251953125, 1.487060546875, 1.55828857421875, 1.6295166015625, 1.70074462890625, 1.77197265625, 1.84320068359375, 1.9144287109375, 1.98565673828125, 2.056884765625, 2.12811279296875, 2.1993408203125, 2.27056884765625, 2.341796875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 8.0, 7.0, 15.0, 21.0, 31.0, 78.0, 107.0, 231.0, 609.0, 1939.0, 8819.0, 69854.0, 887122.0, 68157.0, 8607.0, 1898.0, 554.0, 198.0, 121.0, 64.0, 35.0, 32.0, 15.0, 14.0, 8.0, 7.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68701171875, -0.6676559448242188, -0.6483001708984375, -0.6289443969726562, -0.609588623046875, -0.5902328491210938, -0.5708770751953125, -0.5515213012695312, -0.53216552734375, -0.5128097534179688, -0.4934539794921875, -0.47409820556640625, -0.454742431640625, -0.43538665771484375, -0.4160308837890625, -0.39667510986328125, -0.3773193359375, -0.35796356201171875, -0.3386077880859375, -0.31925201416015625, -0.299896240234375, -0.28054046630859375, -0.2611846923828125, -0.24182891845703125, -0.22247314453125, -0.20311737060546875, -0.1837615966796875, -0.16440582275390625, -0.145050048828125, -0.12569427490234375, -0.1063385009765625, -0.08698272705078125, -0.067626953125, -0.04827117919921875, -0.0289154052734375, -0.00955963134765625, 0.009796142578125, 0.02915191650390625, 0.0485076904296875, 0.06786346435546875, 0.08721923828125, 0.10657501220703125, 0.1259307861328125, 0.14528656005859375, 0.164642333984375, 0.18399810791015625, 0.2033538818359375, 0.22270965576171875, 0.2420654296875, 0.26142120361328125, 0.2807769775390625, 0.30013275146484375, 0.319488525390625, 0.33884429931640625, 0.3582000732421875, 0.37755584716796875, 0.39691162109375, 0.41626739501953125, 0.4356231689453125, 0.45497894287109375, 0.474334716796875, 0.49369049072265625, 0.5130462646484375, 0.5324020385742188, 0.5517578125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 0.0, 4.0, 10.0, 8.0, 14.0, 18.0, 26.0, 48.0, 78.0, 141.0, 212.0, 185.0, 100.0, 51.0, 28.0, 29.0, 15.0, 9.0, 7.0, 2.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.958578109741211e-05, -8.684210479259491e-05, -8.409842848777771e-05, -8.135475218296051e-05, -7.861107587814331e-05, -7.586739957332611e-05, -7.312372326850891e-05, -7.038004696369171e-05, -6.763637065887451e-05, -6.489269435405731e-05, -6.214901804924011e-05, -5.940534174442291e-05, -5.666166543960571e-05, -5.391798913478851e-05, -5.1174312829971313e-05, -4.8430636525154114e-05, -4.5686960220336914e-05, -4.2943283915519714e-05, -4.0199607610702515e-05, -3.7455931305885315e-05, -3.4712255001068115e-05, -3.1968578696250916e-05, -2.9224902391433716e-05, -2.6481226086616516e-05, -2.3737549781799316e-05, -2.0993873476982117e-05, -1.8250197172164917e-05, -1.5506520867347717e-05, -1.2762844562530518e-05, -1.0019168257713318e-05, -7.275491952896118e-06, -4.5318156480789185e-06, -1.7881393432617188e-06, 9.55536961555481e-07, 3.6992132663726807e-06, 6.44288957118988e-06, 9.18656587600708e-06, 1.193024218082428e-05, 1.467391848564148e-05, 1.741759479045868e-05, 2.016127109527588e-05, 2.290494740009308e-05, 2.564862370491028e-05, 2.8392300009727478e-05, 3.113597631454468e-05, 3.387965261936188e-05, 3.662332892417908e-05, 3.936700522899628e-05, 4.2110681533813477e-05, 4.4854357838630676e-05, 4.7598034143447876e-05, 5.0341710448265076e-05, 5.3085386753082275e-05, 5.5829063057899475e-05, 5.8572739362716675e-05, 6.131641566753387e-05, 6.406009197235107e-05, 6.680376827716827e-05, 6.954744458198547e-05, 7.229112088680267e-05, 7.503479719161987e-05, 7.777847349643707e-05, 8.052214980125427e-05, 8.326582610607147e-05, 8.600950241088867e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 4.0, 9.0, 5.0, 13.0, 11.0, 16.0, 21.0, 28.0, 37.0, 62.0, 90.0, 168.0, 373.0, 813.0, 1983.0, 6509.0, 29511.0, 502911.0, 467025.0, 28923.0, 6321.0, 2055.0, 792.0, 381.0, 183.0, 95.0, 63.0, 41.0, 21.0, 18.0, 15.0, 24.0, 7.0, 6.0, 5.0, 5.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.470947265625, -0.4528312683105469, -0.43471527099609375, -0.4165992736816406, -0.3984832763671875, -0.3803672790527344, -0.36225128173828125, -0.3441352844238281, -0.326019287109375, -0.3079032897949219, -0.28978729248046875, -0.2716712951660156, -0.2535552978515625, -0.23543930053710938, -0.21732330322265625, -0.19920730590820312, -0.18109130859375, -0.16297531127929688, -0.14485931396484375, -0.12674331665039062, -0.1086273193359375, -0.09051132202148438, -0.07239532470703125, -0.054279327392578125, -0.036163330078125, -0.018047332763671875, 6.866455078125e-05, 0.018184661865234375, 0.0363006591796875, 0.054416656494140625, 0.07253265380859375, 0.09064865112304688, 0.1087646484375, 0.12688064575195312, 0.14499664306640625, 0.16311264038085938, 0.1812286376953125, 0.19934463500976562, 0.21746063232421875, 0.23557662963867188, 0.253692626953125, 0.2718086242675781, 0.28992462158203125, 0.3080406188964844, 0.3261566162109375, 0.3442726135253906, 0.36238861083984375, 0.3805046081542969, 0.39862060546875, 0.4167366027832031, 0.43485260009765625, 0.4529685974121094, 0.4710845947265625, 0.4892005920410156, 0.5073165893554688, 0.5254325866699219, 0.543548583984375, 0.5616645812988281, 0.5797805786132812, 0.5978965759277344, 0.6160125732421875, 0.6341285705566406, 0.6522445678710938, 0.6703605651855469, 0.6884765625]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 8.0, 14.0, 12.0, 17.0, 36.0, 48.0, 72.0, 101.0, 316.0, 143.0, 79.0, 52.0, 29.0, 24.0, 18.0, 9.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3740234375, -0.3648242950439453, -0.3556251525878906, -0.34642601013183594, -0.33722686767578125, -0.32802772521972656, -0.3188285827636719, -0.3096294403076172, -0.3004302978515625, -0.2912311553955078, -0.2820320129394531, -0.27283287048339844, -0.26363372802734375, -0.25443458557128906, -0.24523544311523438, -0.2360363006591797, -0.226837158203125, -0.2176380157470703, -0.20843887329101562, -0.19923973083496094, -0.19004058837890625, -0.18084144592285156, -0.17164230346679688, -0.1624431610107422, -0.1532440185546875, -0.1440448760986328, -0.13484573364257812, -0.12564659118652344, -0.11644744873046875, -0.10724830627441406, -0.09804916381835938, -0.08885002136230469, -0.07965087890625, -0.07045173645019531, -0.061252593994140625, -0.05205345153808594, -0.04285430908203125, -0.03365516662597656, -0.024456024169921875, -0.015256881713867188, -0.0060577392578125, 0.0031414031982421875, 0.012340545654296875, 0.021539688110351562, 0.03073883056640625, 0.03993797302246094, 0.049137115478515625, 0.05833625793457031, 0.067535400390625, 0.07673454284667969, 0.08593368530273438, 0.09513282775878906, 0.10433197021484375, 0.11353111267089844, 0.12273025512695312, 0.1319293975830078, 0.1411285400390625, 0.1503276824951172, 0.15952682495117188, 0.16872596740722656, 0.17792510986328125, 0.18712425231933594, 0.19632339477539062, 0.2055225372314453, 0.2147216796875]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 6.0, 9.0, 13.0, 16.0, 19.0, 29.0, 55.0, 65.0, 64.0, 103.0, 101.0, 111.0, 94.0, 106.0, 62.0, 50.0, 25.0, 29.0, 19.0, 11.0, 6.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.07796573638916, -1.9573192596435547, -1.8366727828979492, -1.7160263061523438, -1.5953797101974487, -1.4747332334518433, -1.3540867567062378, -1.2334401607513428, -1.1127936840057373, -0.9921472072601318, -0.8715006709098816, -0.7508541941642761, -0.6302076578140259, -0.5095611810684204, -0.38891470432281494, -0.2682681679725647, -0.147621750831604, -0.026975251734256744, 0.09367124736309052, 0.21431773900985718, 0.33496424555778503, 0.4556107521057129, 0.5762572288513184, 0.6969037652015686, 0.8175502419471741, 0.9381967186927795, 1.0588432550430298, 1.1794897317886353, 1.3001362085342407, 1.4207828044891357, 1.5414292812347412, 1.6620757579803467, 1.7827222347259521, 1.9033687114715576, 2.024015188217163, 2.1446616649627686, 2.265308141708374, 2.3859548568725586, 2.506601333618164, 2.6272478103637695, 2.747894287109375, 2.8685407638549805, 2.989187240600586, 3.1098337173461914, 3.230480194091797, 3.3511266708374023, 3.471773147583008, 3.5924198627471924, 3.7130661010742188, 3.833712577819824, 3.9543590545654297, 4.075005531311035, 4.195652008056641, 4.316298484802246, 4.436944961547852, 4.557591438293457, 4.678238391876221, 4.798884868621826, 4.919531345367432, 5.040177822113037, 5.160824298858643, 5.281470775604248, 5.4021172523498535, 5.522763729095459, 5.6434102058410645]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 7.0, 13.0, 9.0, 9.0, 14.0, 18.0, 32.0, 24.0, 44.0, 45.0, 50.0, 51.0, 72.0, 72.0, 57.0, 66.0, 59.0, 48.0, 58.0, 55.0, 47.0, 35.0, 24.0, 24.0, 25.0, 18.0, 10.0, 10.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.204848766326904, -7.016234397888184, -6.827620506286621, -6.6390061378479, -6.45039176940918, -6.261777400970459, -6.0731635093688965, -5.884549140930176, -5.695934772491455, -5.507320404052734, -5.318706512451172, -5.130092144012451, -4.9414777755737305, -4.75286340713501, -4.564249515533447, -4.375635147094727, -4.187021255493164, -3.9984071254730225, -3.8097927570343018, -3.62117862701416, -3.4325642585754395, -3.243950128555298, -3.0553359985351562, -2.8667216300964355, -2.678107261657715, -2.4894931316375732, -2.3008787631988525, -2.112264633178711, -1.9236502647399902, -1.7350361347198486, -1.5464218854904175, -1.3578076362609863, -1.1691932678222656, -0.9805790185928345, -0.7919647693634033, -0.6033505797386169, -0.4147363305091858, -0.22612208127975464, -0.03750789165496826, 0.1511063575744629, 0.33972060680389404, 0.5283348560333252, 0.7169491052627563, 0.9055632948875427, 1.094177484512329, 1.2827918529510498, 1.4714059829711914, 1.6600202322006226, 1.8486344814300537, 2.0372486114501953, 2.225862979888916, 2.4144771099090576, 2.6030914783477783, 2.79170560836792, 2.9803199768066406, 3.1689341068267822, 3.357548236846924, 3.5461623668670654, 3.734776735305786, 3.9233908653259277, 4.112005233764648, 4.300619602203369, 4.489233493804932, 4.677847862243652, 4.866462230682373]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 9.0, 10.0, 15.0, 19.0, 30.0, 40.0, 50.0, 68.0, 125.0, 184.0, 308.0, 550.0, 901.0, 1684.0, 3296.0, 7315.0, 20646.0, 133235.0, 2866906.0, 1077526.0, 56769.0, 13453.0, 5330.0, 2567.0, 1361.0, 778.0, 416.0, 268.0, 151.0, 70.0, 46.0, 41.0, 31.0, 29.0, 8.0, 15.0, 8.0, 7.0, 8.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.673828125, -2.587066650390625, -2.50030517578125, -2.413543701171875, -2.3267822265625, -2.240020751953125, -2.15325927734375, -2.066497802734375, -1.979736328125, -1.892974853515625, -1.80621337890625, -1.719451904296875, -1.6326904296875, -1.545928955078125, -1.45916748046875, -1.372406005859375, -1.28564453125, -1.198883056640625, -1.11212158203125, -1.025360107421875, -0.9385986328125, -0.851837158203125, -0.76507568359375, -0.678314208984375, -0.591552734375, -0.504791259765625, -0.41802978515625, -0.331268310546875, -0.2445068359375, -0.157745361328125, -0.07098388671875, 0.015777587890625, 0.1025390625, 0.189300537109375, 0.27606201171875, 0.362823486328125, 0.4495849609375, 0.536346435546875, 0.62310791015625, 0.709869384765625, 0.796630859375, 0.883392333984375, 0.97015380859375, 1.056915283203125, 1.1436767578125, 1.230438232421875, 1.31719970703125, 1.403961181640625, 1.49072265625, 1.577484130859375, 1.66424560546875, 1.751007080078125, 1.8377685546875, 1.924530029296875, 2.01129150390625, 2.098052978515625, 2.184814453125, 2.271575927734375, 2.35833740234375, 2.445098876953125, 2.5318603515625, 2.618621826171875, 2.70538330078125, 2.792144775390625, 2.87890625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 7.0, 4.0, 9.0, 11.0, 20.0, 20.0, 29.0, 36.0, 44.0, 42.0, 64.0, 64.0, 87.0, 76.0, 86.0, 62.0, 65.0, 63.0, 55.0, 41.0, 36.0, 22.0, 24.0, 12.0, 11.0, 10.0, 5.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.640625, -1.58563232421875, -1.5306396484375, -1.47564697265625, -1.420654296875, -1.36566162109375, -1.3106689453125, -1.25567626953125, -1.20068359375, -1.14569091796875, -1.0906982421875, -1.03570556640625, -0.980712890625, -0.92572021484375, -0.8707275390625, -0.81573486328125, -0.7607421875, -0.70574951171875, -0.6507568359375, -0.59576416015625, -0.540771484375, -0.48577880859375, -0.4307861328125, -0.37579345703125, -0.32080078125, -0.26580810546875, -0.2108154296875, -0.15582275390625, -0.100830078125, -0.04583740234375, 0.0091552734375, 0.06414794921875, 0.119140625, 0.17413330078125, 0.2291259765625, 0.28411865234375, 0.339111328125, 0.39410400390625, 0.4490966796875, 0.50408935546875, 0.55908203125, 0.61407470703125, 0.6690673828125, 0.72406005859375, 0.779052734375, 0.83404541015625, 0.8890380859375, 0.94403076171875, 0.9990234375, 1.05401611328125, 1.1090087890625, 1.16400146484375, 1.218994140625, 1.27398681640625, 1.3289794921875, 1.38397216796875, 1.43896484375, 1.49395751953125, 1.5489501953125, 1.60394287109375, 1.658935546875, 1.71392822265625, 1.7689208984375, 1.82391357421875, 1.87890625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 2.0, 4.0, 11.0, 13.0, 17.0, 41.0, 101.0, 284.0, 1114.0, 8566.0, 544847.0, 3622862.0, 14233.0, 1583.0, 375.0, 132.0, 45.0, 20.0, 15.0, 10.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.01953125, -5.77972412109375, -5.5399169921875, -5.30010986328125, -5.060302734375, -4.82049560546875, -4.5806884765625, -4.34088134765625, -4.10107421875, -3.86126708984375, -3.6214599609375, -3.38165283203125, -3.141845703125, -2.90203857421875, -2.6622314453125, -2.42242431640625, -2.1826171875, -1.94281005859375, -1.7030029296875, -1.46319580078125, -1.223388671875, -0.98358154296875, -0.7437744140625, -0.50396728515625, -0.26416015625, -0.02435302734375, 0.2154541015625, 0.45526123046875, 0.695068359375, 0.93487548828125, 1.1746826171875, 1.41448974609375, 1.654296875, 1.89410400390625, 2.1339111328125, 2.37371826171875, 2.613525390625, 2.85333251953125, 3.0931396484375, 3.33294677734375, 3.57275390625, 3.81256103515625, 4.0523681640625, 4.29217529296875, 4.531982421875, 4.77178955078125, 5.0115966796875, 5.25140380859375, 5.4912109375, 5.73101806640625, 5.9708251953125, 6.21063232421875, 6.450439453125, 6.69024658203125, 6.9300537109375, 7.16986083984375, 7.40966796875, 7.64947509765625, 7.8892822265625, 8.12908935546875, 8.368896484375, 8.60870361328125, 8.8485107421875, 9.08831787109375, 9.328125]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 8.0, 7.0, 13.0, 28.0, 33.0, 46.0, 70.0, 105.0, 274.0, 644.0, 1276.0, 879.0, 313.0, 139.0, 85.0, 42.0, 27.0, 31.0, 19.0, 12.0, 10.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.28125, -1.2442779541015625, -1.207305908203125, -1.1703338623046875, -1.13336181640625, -1.0963897705078125, -1.059417724609375, -1.0224456787109375, -0.9854736328125, -0.9485015869140625, -0.911529541015625, -0.8745574951171875, -0.83758544921875, -0.8006134033203125, -0.763641357421875, -0.7266693115234375, -0.689697265625, -0.6527252197265625, -0.615753173828125, -0.5787811279296875, -0.54180908203125, -0.5048370361328125, -0.467864990234375, -0.4308929443359375, -0.3939208984375, -0.3569488525390625, -0.319976806640625, -0.2830047607421875, -0.24603271484375, -0.2090606689453125, -0.172088623046875, -0.1351165771484375, -0.09814453125, -0.0611724853515625, -0.024200439453125, 0.0127716064453125, 0.04974365234375, 0.0867156982421875, 0.123687744140625, 0.1606597900390625, 0.1976318359375, 0.2346038818359375, 0.271575927734375, 0.3085479736328125, 0.34552001953125, 0.3824920654296875, 0.419464111328125, 0.4564361572265625, 0.493408203125, 0.5303802490234375, 0.567352294921875, 0.6043243408203125, 0.64129638671875, 0.6782684326171875, 0.715240478515625, 0.7522125244140625, 0.7891845703125, 0.8261566162109375, 0.863128662109375, 0.9001007080078125, 0.93707275390625, 0.9740447998046875, 1.011016845703125, 1.0479888916015625, 1.0849609375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 9.0, 14.0, 15.0, 26.0, 43.0, 48.0, 69.0, 81.0, 90.0, 85.0, 93.0, 90.0, 57.0, 65.0, 51.0, 45.0, 32.0, 20.0, 13.0, 16.0, 10.0, 4.0, 2.0, 6.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.9601361751556396, -2.886221170425415, -2.8123061656951904, -2.738391160964966, -2.664476156234741, -2.5905611515045166, -2.516646146774292, -2.4427311420440674, -2.3688161373138428, -2.294901132583618, -2.2209861278533936, -2.147071123123169, -2.0731561183929443, -1.9992411136627197, -1.9253261089324951, -1.8514111042022705, -1.777496099472046, -1.7035810947418213, -1.6296660900115967, -1.555751085281372, -1.4818360805511475, -1.4079210758209229, -1.3340060710906982, -1.2600910663604736, -1.186176061630249, -1.1122610569000244, -1.0383460521697998, -0.9644310474395752, -0.8905160427093506, -0.816601037979126, -0.7426860332489014, -0.6687710285186768, -0.594855785369873, -0.5209407806396484, -0.44702577590942383, -0.3731107711791992, -0.2991957664489746, -0.22528076171875, -0.1513657569885254, -0.07745075225830078, -0.003535747528076172, 0.07037925720214844, 0.14429426193237305, 0.21820926666259766, 0.29212427139282227, 0.3660392761230469, 0.4399542808532715, 0.5138692855834961, 0.5877842903137207, 0.6616992950439453, 0.7356142997741699, 0.8095293045043945, 0.8834443092346191, 0.9573593139648438, 1.0312743186950684, 1.105189323425293, 1.1791043281555176, 1.2530193328857422, 1.3269343376159668, 1.4008493423461914, 1.474764347076416, 1.5486793518066406, 1.6225943565368652, 1.6965093612670898, 1.7704243659973145]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 6.0, 8.0, 10.0, 11.0, 22.0, 18.0, 23.0, 26.0, 24.0, 44.0, 43.0, 49.0, 37.0, 48.0, 64.0, 46.0, 54.0, 54.0, 64.0, 49.0, 43.0, 34.0, 40.0, 34.0, 31.0, 36.0, 26.0, 11.0, 22.0, 13.0, 4.0, 0.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.814132571220398, -1.7562949657440186, -1.6984574794769287, -1.6406199932098389, -1.5827823877334595, -1.52494478225708, -1.4671072959899902, -1.4092698097229004, -1.351432204246521, -1.2935945987701416, -1.2357571125030518, -1.177919626235962, -1.1200820207595825, -1.0622444152832031, -1.0044069290161133, -0.9465693831443787, -0.888731837272644, -0.8308942914009094, -0.7730567455291748, -0.7152191996574402, -0.6573816537857056, -0.599544107913971, -0.5417065620422363, -0.4838690161705017, -0.4260314702987671, -0.36819392442703247, -0.31035637855529785, -0.25251883268356323, -0.1946812868118286, -0.136843740940094, -0.07900619506835938, -0.021168649196624756, 0.03666889667510986, 0.09450644254684448, 0.1523439884185791, 0.21018153429031372, 0.26801908016204834, 0.32585662603378296, 0.3836941719055176, 0.4415317177772522, 0.4993692636489868, 0.5572068095207214, 0.615044355392456, 0.6728819012641907, 0.7307194471359253, 0.7885569930076599, 0.8463945388793945, 0.9042320847511292, 0.9620696306228638, 1.0199072360992432, 1.077744722366333, 1.1355822086334229, 1.1934198141098022, 1.2512574195861816, 1.3090949058532715, 1.3669323921203613, 1.4247699975967407, 1.4826076030731201, 1.54044508934021, 1.5982825756072998, 1.6561201810836792, 1.7139577865600586, 1.7717952728271484, 1.8296327590942383, 1.8874703645706177]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 2.0, 8.0, 5.0, 6.0, 12.0, 25.0, 27.0, 48.0, 57.0, 72.0, 147.0, 252.0, 430.0, 1024.0, 2802.0, 10152.0, 56010.0, 613272.0, 319723.0, 33750.0, 6965.0, 2083.0, 750.0, 364.0, 189.0, 134.0, 80.0, 58.0, 32.0, 31.0, 16.0, 7.0, 8.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.469970703125, -0.4542350769042969, -0.43849945068359375, -0.4227638244628906, -0.4070281982421875, -0.3912925720214844, -0.37555694580078125, -0.3598213195800781, -0.344085693359375, -0.3283500671386719, -0.31261444091796875, -0.2968788146972656, -0.2811431884765625, -0.2654075622558594, -0.24967193603515625, -0.23393630981445312, -0.21820068359375, -0.20246505737304688, -0.18672943115234375, -0.17099380493164062, -0.1552581787109375, -0.13952255249023438, -0.12378692626953125, -0.10805130004882812, -0.092315673828125, -0.07658004760742188, -0.06084442138671875, -0.045108795166015625, -0.0293731689453125, -0.013637542724609375, 0.00209808349609375, 0.017833709716796875, 0.0335693359375, 0.049304962158203125, 0.06504058837890625, 0.08077621459960938, 0.0965118408203125, 0.11224746704101562, 0.12798309326171875, 0.14371871948242188, 0.159454345703125, 0.17518997192382812, 0.19092559814453125, 0.20666122436523438, 0.2223968505859375, 0.23813247680664062, 0.25386810302734375, 0.2696037292480469, 0.28533935546875, 0.3010749816894531, 0.31681060791015625, 0.3325462341308594, 0.3482818603515625, 0.3640174865722656, 0.37975311279296875, 0.3954887390136719, 0.411224365234375, 0.4269599914550781, 0.44269561767578125, 0.4584312438964844, 0.4741668701171875, 0.4899024963378906, 0.5056381225585938, 0.5213737487792969, 0.537109375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 7.0, 7.0, 9.0, 14.0, 21.0, 26.0, 15.0, 36.0, 40.0, 44.0, 53.0, 52.0, 53.0, 64.0, 44.0, 59.0, 73.0, 67.0, 59.0, 32.0, 46.0, 38.0, 34.0, 32.0, 24.0, 22.0, 9.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.083984375, -1.046295166015625, -1.00860595703125, -0.970916748046875, -0.9332275390625, -0.895538330078125, -0.85784912109375, -0.820159912109375, -0.782470703125, -0.744781494140625, -0.70709228515625, -0.669403076171875, -0.6317138671875, -0.594024658203125, -0.55633544921875, -0.518646240234375, -0.48095703125, -0.443267822265625, -0.40557861328125, -0.367889404296875, -0.3302001953125, -0.292510986328125, -0.25482177734375, -0.217132568359375, -0.179443359375, -0.141754150390625, -0.10406494140625, -0.066375732421875, -0.0286865234375, 0.009002685546875, 0.04669189453125, 0.084381103515625, 0.1220703125, 0.159759521484375, 0.19744873046875, 0.235137939453125, 0.2728271484375, 0.310516357421875, 0.34820556640625, 0.385894775390625, 0.423583984375, 0.461273193359375, 0.49896240234375, 0.536651611328125, 0.5743408203125, 0.612030029296875, 0.64971923828125, 0.687408447265625, 0.72509765625, 0.762786865234375, 0.80047607421875, 0.838165283203125, 0.8758544921875, 0.913543701171875, 0.95123291015625, 0.988922119140625, 1.026611328125, 1.064300537109375, 1.10198974609375, 1.139678955078125, 1.1773681640625, 1.215057373046875, 1.25274658203125, 1.290435791015625, 1.328125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 8.0, 1.0, 8.0, 15.0, 15.0, 41.0, 46.0, 58.0, 78.0, 113.0, 213.0, 317.0, 435.0, 689.0, 1059.0, 1704.0, 2791.0, 4804.0, 8403.0, 15059.0, 28024.0, 56100.0, 118148.0, 241026.0, 276096.0, 147405.0, 69456.0, 34340.0, 17942.0, 9801.0, 5647.0, 3295.0, 2025.0, 1222.0, 752.0, 472.0, 297.0, 204.0, 135.0, 108.0, 70.0, 52.0, 24.0, 19.0, 17.0, 11.0, 4.0, 10.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.08544921875, -0.08270549774169922, -0.07996177673339844, -0.07721805572509766, -0.07447433471679688, -0.0717306137084961, -0.06898689270019531, -0.06624317169189453, -0.06349945068359375, -0.06075572967529297, -0.05801200866699219, -0.055268287658691406, -0.052524566650390625, -0.049780845642089844, -0.04703712463378906, -0.04429340362548828, -0.0415496826171875, -0.03880596160888672, -0.03606224060058594, -0.033318519592285156, -0.030574798583984375, -0.027831077575683594, -0.025087356567382812, -0.02234363555908203, -0.01959991455078125, -0.01685619354248047, -0.014112472534179688, -0.011368751525878906, -0.008625030517578125, -0.005881309509277344, -0.0031375885009765625, -0.00039386749267578125, 0.002349853515625, 0.005093574523925781, 0.007837295532226562, 0.010581016540527344, 0.013324737548828125, 0.016068458557128906, 0.018812179565429688, 0.02155590057373047, 0.02429962158203125, 0.02704334259033203, 0.029787063598632812, 0.032530784606933594, 0.035274505615234375, 0.038018226623535156, 0.04076194763183594, 0.04350566864013672, 0.0462493896484375, 0.04899311065673828, 0.05173683166503906, 0.054480552673339844, 0.057224273681640625, 0.059967994689941406, 0.06271171569824219, 0.06545543670654297, 0.06819915771484375, 0.07094287872314453, 0.07368659973144531, 0.0764303207397461, 0.07917404174804688, 0.08191776275634766, 0.08466148376464844, 0.08740520477294922, 0.09014892578125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 5.0, 2.0, 7.0, 7.0, 8.0, 11.0, 11.0, 15.0, 18.0, 25.0, 25.0, 30.0, 29.0, 35.0, 42.0, 44.0, 45.0, 54.0, 50.0, 52.0, 49.0, 61.0, 44.0, 42.0, 51.0, 39.0, 36.0, 31.0, 27.0, 20.0, 18.0, 15.0, 9.0, 16.0, 6.0, 10.0, 6.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.029296875, -1.966766357421875, -1.90423583984375, -1.841705322265625, -1.7791748046875, -1.716644287109375, -1.65411376953125, -1.591583251953125, -1.529052734375, -1.466522216796875, -1.40399169921875, -1.341461181640625, -1.2789306640625, -1.216400146484375, -1.15386962890625, -1.091339111328125, -1.02880859375, -0.966278076171875, -0.90374755859375, -0.841217041015625, -0.7786865234375, -0.716156005859375, -0.65362548828125, -0.591094970703125, -0.528564453125, -0.466033935546875, -0.40350341796875, -0.340972900390625, -0.2784423828125, -0.215911865234375, -0.15338134765625, -0.090850830078125, -0.0283203125, 0.034210205078125, 0.09674072265625, 0.159271240234375, 0.2218017578125, 0.284332275390625, 0.34686279296875, 0.409393310546875, 0.471923828125, 0.534454345703125, 0.59698486328125, 0.659515380859375, 0.7220458984375, 0.784576416015625, 0.84710693359375, 0.909637451171875, 0.97216796875, 1.034698486328125, 1.09722900390625, 1.159759521484375, 1.2222900390625, 1.284820556640625, 1.34735107421875, 1.409881591796875, 1.472412109375, 1.534942626953125, 1.59747314453125, 1.660003662109375, 1.7225341796875, 1.785064697265625, 1.84759521484375, 1.910125732421875, 1.97265625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 1.0, 4.0, 5.0, 10.0, 10.0, 29.0, 47.0, 92.0, 120.0, 233.0, 404.0, 905.0, 2011.0, 5617.0, 21644.0, 133240.0, 716659.0, 135433.0, 22225.0, 6047.0, 2017.0, 826.0, 420.0, 215.0, 102.0, 100.0, 51.0, 27.0, 23.0, 11.0, 8.0, 7.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03802490234375, -0.03689002990722656, -0.035755157470703125, -0.03462028503417969, -0.03348541259765625, -0.03235054016113281, -0.031215667724609375, -0.030080795288085938, -0.0289459228515625, -0.027811050415039062, -0.026676177978515625, -0.025541305541992188, -0.02440643310546875, -0.023271560668945312, -0.022136688232421875, -0.021001815795898438, -0.019866943359375, -0.018732070922851562, -0.017597198486328125, -0.016462326049804688, -0.01532745361328125, -0.014192581176757812, -0.013057708740234375, -0.011922836303710938, -0.0107879638671875, -0.009653091430664062, -0.008518218994140625, -0.0073833465576171875, -0.00624847412109375, -0.0051136016845703125, -0.003978729248046875, -0.0028438568115234375, -0.001708984375, -0.0005741119384765625, 0.000560760498046875, 0.0016956329345703125, 0.00283050537109375, 0.0039653778076171875, 0.005100250244140625, 0.0062351226806640625, 0.0073699951171875, 0.008504867553710938, 0.009639739990234375, 0.010774612426757812, 0.01190948486328125, 0.013044357299804688, 0.014179229736328125, 0.015314102172851562, 0.016448974609375, 0.017583847045898438, 0.018718719482421875, 0.019853591918945312, 0.02098846435546875, 0.022123336791992188, 0.023258209228515625, 0.024393081665039062, 0.0255279541015625, 0.026662826538085938, 0.027797698974609375, 0.028932571411132812, 0.03006744384765625, 0.031202316284179688, 0.032337188720703125, 0.03347206115722656, 0.03460693359375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 3.0, 9.0, 10.0, 5.0, 14.0, 28.0, 26.0, 51.0, 61.0, 83.0, 90.0, 115.0, 109.0, 106.0, 68.0, 53.0, 55.0, 29.0, 21.0, 12.0, 10.0, 9.0, 8.0, 6.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.45246696472168e-05, -4.317052662372589e-05, -4.1816383600234985e-05, -4.046224057674408e-05, -3.9108097553253174e-05, -3.775395452976227e-05, -3.639981150627136e-05, -3.5045668482780457e-05, -3.369152545928955e-05, -3.2337382435798645e-05, -3.098323941230774e-05, -2.9629096388816833e-05, -2.8274953365325928e-05, -2.6920810341835022e-05, -2.5566667318344116e-05, -2.421252429485321e-05, -2.2858381271362305e-05, -2.15042382478714e-05, -2.0150095224380493e-05, -1.8795952200889587e-05, -1.744180917739868e-05, -1.6087666153907776e-05, -1.473352313041687e-05, -1.3379380106925964e-05, -1.2025237083435059e-05, -1.0671094059944153e-05, -9.316951036453247e-06, -7.962808012962341e-06, -6.6086649894714355e-06, -5.25452196598053e-06, -3.900378942489624e-06, -2.5462359189987183e-06, -1.1920928955078125e-06, 1.6205012798309326e-07, 1.516193151473999e-06, 2.8703361749649048e-06, 4.2244791984558105e-06, 5.578622221946716e-06, 6.932765245437622e-06, 8.286908268928528e-06, 9.641051292419434e-06, 1.099519431591034e-05, 1.2349337339401245e-05, 1.3703480362892151e-05, 1.5057623386383057e-05, 1.6411766409873962e-05, 1.7765909433364868e-05, 1.9120052456855774e-05, 2.047419548034668e-05, 2.1828338503837585e-05, 2.318248152732849e-05, 2.4536624550819397e-05, 2.5890767574310303e-05, 2.724491059780121e-05, 2.8599053621292114e-05, 2.995319664478302e-05, 3.1307339668273926e-05, 3.266148269176483e-05, 3.401562571525574e-05, 3.536976873874664e-05, 3.672391176223755e-05, 3.8078054785728455e-05, 3.943219780921936e-05, 4.0786340832710266e-05, 4.214048385620117e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 1.0, 7.0, 11.0, 11.0, 17.0, 31.0, 73.0, 157.0, 317.0, 813.0, 2313.0, 8127.0, 41483.0, 600122.0, 356005.0, 29430.0, 6442.0, 1949.0, 703.0, 290.0, 100.0, 48.0, 34.0, 22.0, 17.0, 5.0, 5.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056884765625, -0.05530071258544922, -0.05371665954589844, -0.052132606506347656, -0.050548553466796875, -0.048964500427246094, -0.04738044738769531, -0.04579639434814453, -0.04421234130859375, -0.04262828826904297, -0.04104423522949219, -0.039460182189941406, -0.037876129150390625, -0.036292076110839844, -0.03470802307128906, -0.03312397003173828, -0.0315399169921875, -0.02995586395263672, -0.028371810913085938, -0.026787757873535156, -0.025203704833984375, -0.023619651794433594, -0.022035598754882812, -0.02045154571533203, -0.01886749267578125, -0.01728343963623047, -0.015699386596679688, -0.014115333557128906, -0.012531280517578125, -0.010947227478027344, -0.009363174438476562, -0.007779121398925781, -0.006195068359375, -0.004611015319824219, -0.0030269622802734375, -0.0014429092407226562, 0.000141143798828125, 0.0017251968383789062, 0.0033092498779296875, 0.004893302917480469, 0.00647735595703125, 0.008061408996582031, 0.009645462036132812, 0.011229515075683594, 0.012813568115234375, 0.014397621154785156, 0.015981674194335938, 0.01756572723388672, 0.0191497802734375, 0.02073383331298828, 0.022317886352539062, 0.023901939392089844, 0.025485992431640625, 0.027070045471191406, 0.028654098510742188, 0.03023815155029297, 0.03182220458984375, 0.03340625762939453, 0.03499031066894531, 0.036574363708496094, 0.038158416748046875, 0.039742469787597656, 0.04132652282714844, 0.04291057586669922, 0.04449462890625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 2.0, 3.0, 1.0, 4.0, 3.0, 8.0, 11.0, 22.0, 18.0, 32.0, 36.0, 42.0, 60.0, 65.0, 104.0, 127.0, 116.0, 91.0, 56.0, 53.0, 31.0, 26.0, 25.0, 14.0, 11.0, 9.0, 3.0, 10.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.010101318359375, -0.009809017181396484, -0.009516716003417969, -0.009224414825439453, -0.008932113647460938, -0.008639812469482422, -0.008347511291503906, -0.00805521011352539, -0.007762908935546875, -0.007470607757568359, -0.007178306579589844, -0.006886005401611328, -0.0065937042236328125, -0.006301403045654297, -0.006009101867675781, -0.005716800689697266, -0.00542449951171875, -0.005132198333740234, -0.004839897155761719, -0.004547595977783203, -0.0042552947998046875, -0.003962993621826172, -0.0036706924438476562, -0.0033783912658691406, -0.003086090087890625, -0.0027937889099121094, -0.0025014877319335938, -0.002209186553955078, -0.0019168853759765625, -0.0016245841979980469, -0.0013322830200195312, -0.0010399818420410156, -0.0007476806640625, -0.0004553794860839844, -0.00016307830810546875, 0.00012922286987304688, 0.0004215240478515625, 0.0007138252258300781, 0.0010061264038085938, 0.0012984275817871094, 0.001590728759765625, 0.0018830299377441406, 0.0021753311157226562, 0.002467632293701172, 0.0027599334716796875, 0.003052234649658203, 0.0033445358276367188, 0.0036368370056152344, 0.00392913818359375, 0.004221439361572266, 0.004513740539550781, 0.004806041717529297, 0.0050983428955078125, 0.005390644073486328, 0.005682945251464844, 0.005975246429443359, 0.006267547607421875, 0.006559848785400391, 0.006852149963378906, 0.007144451141357422, 0.0074367523193359375, 0.007729053497314453, 0.008021354675292969, 0.008313655853271484, 0.00860595703125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 10.0, 12.0, 10.0, 34.0, 47.0, 74.0, 126.0, 154.0, 140.0, 146.0, 85.0, 69.0, 42.0, 19.0, 17.0, 12.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.02264142036438, -1.955837368965149, -1.889033317565918, -1.8222293853759766, -1.7554253339767456, -1.6886212825775146, -1.6218173503875732, -1.5550132989883423, -1.4882092475891113, -1.4214051961898804, -1.3546011447906494, -1.287797212600708, -1.220993161201477, -1.154189109802246, -1.0873851776123047, -1.0205811262130737, -0.9537770748138428, -0.8869730234146118, -0.8201690316200256, -0.7533650398254395, -0.6865609884262085, -0.6197569370269775, -0.5529529452323914, -0.4861489236354828, -0.4193449020385742, -0.35254088044166565, -0.2857368588447571, -0.2189328372478485, -0.15212881565093994, -0.08532479405403137, -0.018520772457122803, 0.04828324913978577, 0.11508750915527344, 0.181891530752182, 0.24869555234909058, 0.31549957394599915, 0.3823035955429077, 0.4491076171398163, 0.5159116387367249, 0.582715630531311, 0.649519681930542, 0.716323733329773, 0.7831277251243591, 0.8499317169189453, 0.9167357683181763, 0.9835398197174072, 1.0503437519073486, 1.1171478033065796, 1.1839518547058105, 1.2507559061050415, 1.3175599575042725, 1.3843638896942139, 1.4511679410934448, 1.5179719924926758, 1.5847759246826172, 1.6515799760818481, 1.718384027481079, 1.78518807888031, 1.851992130279541, 1.9187960624694824, 1.9856001138687134, 2.0524041652679443, 2.1192080974578857, 2.1860122680664062, 2.2528162002563477]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 6.0, 7.0, 9.0, 8.0, 21.0, 14.0, 35.0, 22.0, 44.0, 48.0, 48.0, 53.0, 65.0, 68.0, 59.0, 62.0, 79.0, 53.0, 52.0, 43.0, 44.0, 37.0, 41.0, 26.0, 19.0, 18.0, 9.0, 2.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2412394285202026, -1.2020649909973145, -1.1628905534744263, -1.123716115951538, -1.08454167842865, -1.0453672409057617, -1.0061928033828735, -0.9670184254646301, -0.9278439879417419, -0.8886695504188538, -0.8494951128959656, -0.8103206753730774, -0.771146297454834, -0.7319718599319458, -0.6927974224090576, -0.6536229848861694, -0.6144485473632812, -0.5752741098403931, -0.5360996723175049, -0.4969252645969391, -0.4577508270740509, -0.4185763895511627, -0.3794019818305969, -0.34022754430770874, -0.30105310678482056, -0.2618786692619324, -0.22270424664020538, -0.1835298240184784, -0.1443553864955902, -0.10518094897270203, -0.06600652635097504, -0.026832103729248047, 0.012342333793640137, 0.05151676386594772, 0.09069119393825531, 0.1298656165599823, 0.16904005408287048, 0.20821449160575867, 0.24738891422748566, 0.28656333684921265, 0.32573777437210083, 0.364912211894989, 0.4040866494178772, 0.443261057138443, 0.4824354946613312, 0.521609902381897, 0.5607843399047852, 0.5999587774276733, 0.6391332149505615, 0.6783076524734497, 0.7174820899963379, 0.7566565275192261, 0.7958309650421143, 0.8350054025650024, 0.8741797804832458, 0.913354218006134, 0.9525286555290222, 0.9917030930519104, 1.0308774709701538, 1.070051908493042, 1.1092263460159302, 1.1484007835388184, 1.1875752210617065, 1.2267496585845947, 1.265924096107483]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 9.0, 6.0, 12.0, 25.0, 32.0, 49.0, 72.0, 95.0, 152.0, 220.0, 336.0, 584.0, 806.0, 1357.0, 2194.0, 3637.0, 6346.0, 11963.0, 25798.0, 90622.0, 660515.0, 174572.0, 35405.0, 14788.0, 7800.0, 4314.0, 2526.0, 1570.0, 939.0, 600.0, 393.0, 263.0, 197.0, 109.0, 76.0, 63.0, 38.0, 18.0, 17.0, 14.0, 7.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4267578125, -1.385589599609375, -1.34442138671875, -1.303253173828125, -1.2620849609375, -1.220916748046875, -1.17974853515625, -1.138580322265625, -1.097412109375, -1.056243896484375, -1.01507568359375, -0.973907470703125, -0.9327392578125, -0.891571044921875, -0.85040283203125, -0.809234619140625, -0.76806640625, -0.726898193359375, -0.68572998046875, -0.644561767578125, -0.6033935546875, -0.562225341796875, -0.52105712890625, -0.479888916015625, -0.438720703125, -0.397552490234375, -0.35638427734375, -0.315216064453125, -0.2740478515625, -0.232879638671875, -0.19171142578125, -0.150543212890625, -0.109375, -0.068206787109375, -0.02703857421875, 0.014129638671875, 0.0552978515625, 0.096466064453125, 0.13763427734375, 0.178802490234375, 0.219970703125, 0.261138916015625, 0.30230712890625, 0.343475341796875, 0.3846435546875, 0.425811767578125, 0.46697998046875, 0.508148193359375, 0.54931640625, 0.590484619140625, 0.63165283203125, 0.672821044921875, 0.7139892578125, 0.755157470703125, 0.79632568359375, 0.837493896484375, 0.878662109375, 0.919830322265625, 0.96099853515625, 1.002166748046875, 1.0433349609375, 1.084503173828125, 1.12567138671875, 1.166839599609375, 1.2080078125]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 7.0, 4.0, 4.0, 8.0, 13.0, 21.0, 25.0, 33.0, 30.0, 36.0, 52.0, 43.0, 62.0, 64.0, 73.0, 59.0, 63.0, 54.0, 66.0, 57.0, 45.0, 35.0, 34.0, 28.0, 26.0, 21.0, 12.0, 7.0, 9.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.91796875, -2.83770751953125, -2.7574462890625, -2.67718505859375, -2.596923828125, -2.51666259765625, -2.4364013671875, -2.35614013671875, -2.27587890625, -2.19561767578125, -2.1153564453125, -2.03509521484375, -1.954833984375, -1.87457275390625, -1.7943115234375, -1.71405029296875, -1.6337890625, -1.55352783203125, -1.4732666015625, -1.39300537109375, -1.312744140625, -1.23248291015625, -1.1522216796875, -1.07196044921875, -0.99169921875, -0.91143798828125, -0.8311767578125, -0.75091552734375, -0.670654296875, -0.59039306640625, -0.5101318359375, -0.42987060546875, -0.349609375, -0.26934814453125, -0.1890869140625, -0.10882568359375, -0.028564453125, 0.05169677734375, 0.1319580078125, 0.21221923828125, 0.29248046875, 0.37274169921875, 0.4530029296875, 0.53326416015625, 0.613525390625, 0.69378662109375, 0.7740478515625, 0.85430908203125, 0.9345703125, 1.01483154296875, 1.0950927734375, 1.17535400390625, 1.255615234375, 1.33587646484375, 1.4161376953125, 1.49639892578125, 1.57666015625, 1.65692138671875, 1.7371826171875, 1.81744384765625, 1.897705078125, 1.97796630859375, 2.0582275390625, 2.13848876953125, 2.21875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 4.0, 8.0, 5.0, 6.0, 15.0, 22.0, 14.0, 32.0, 56.0, 50.0, 104.0, 136.0, 219.0, 314.0, 540.0, 965.0, 1952.0, 3902.0, 7892.0, 18858.0, 77701.0, 806381.0, 92159.0, 20079.0, 8518.0, 3994.0, 2017.0, 1055.0, 562.0, 323.0, 216.0, 125.0, 96.0, 63.0, 36.0, 28.0, 20.0, 28.0, 13.0, 13.0, 5.0, 0.0, 8.0, 8.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.93359375, -1.870269775390625, -1.80694580078125, -1.743621826171875, -1.6802978515625, -1.616973876953125, -1.55364990234375, -1.490325927734375, -1.427001953125, -1.363677978515625, -1.30035400390625, -1.237030029296875, -1.1737060546875, -1.110382080078125, -1.04705810546875, -0.983734130859375, -0.92041015625, -0.857086181640625, -0.79376220703125, -0.730438232421875, -0.6671142578125, -0.603790283203125, -0.54046630859375, -0.477142333984375, -0.413818359375, -0.350494384765625, -0.28717041015625, -0.223846435546875, -0.1605224609375, -0.097198486328125, -0.03387451171875, 0.029449462890625, 0.0927734375, 0.156097412109375, 0.21942138671875, 0.282745361328125, 0.3460693359375, 0.409393310546875, 0.47271728515625, 0.536041259765625, 0.599365234375, 0.662689208984375, 0.72601318359375, 0.789337158203125, 0.8526611328125, 0.915985107421875, 0.97930908203125, 1.042633056640625, 1.10595703125, 1.169281005859375, 1.23260498046875, 1.295928955078125, 1.3592529296875, 1.422576904296875, 1.48590087890625, 1.549224853515625, 1.612548828125, 1.675872802734375, 1.73919677734375, 1.802520751953125, 1.8658447265625, 1.929168701171875, 1.99249267578125, 2.055816650390625, 2.119140625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 4.0, 1.0, 8.0, 6.0, 10.0, 11.0, 11.0, 13.0, 19.0, 26.0, 36.0, 27.0, 36.0, 38.0, 38.0, 54.0, 53.0, 60.0, 63.0, 67.0, 60.0, 48.0, 43.0, 44.0, 42.0, 25.0, 29.0, 22.0, 23.0, 17.0, 20.0, 9.0, 6.0, 9.0, 6.0, 4.0, 5.0, 1.0, 0.0, 3.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.17578125, -3.08502197265625, -2.9942626953125, -2.90350341796875, -2.812744140625, -2.72198486328125, -2.6312255859375, -2.54046630859375, -2.44970703125, -2.35894775390625, -2.2681884765625, -2.17742919921875, -2.086669921875, -1.99591064453125, -1.9051513671875, -1.81439208984375, -1.7236328125, -1.63287353515625, -1.5421142578125, -1.45135498046875, -1.360595703125, -1.26983642578125, -1.1790771484375, -1.08831787109375, -0.99755859375, -0.90679931640625, -0.8160400390625, -0.72528076171875, -0.634521484375, -0.54376220703125, -0.4530029296875, -0.36224365234375, -0.271484375, -0.18072509765625, -0.0899658203125, 0.00079345703125, 0.091552734375, 0.18231201171875, 0.2730712890625, 0.36383056640625, 0.45458984375, 0.54534912109375, 0.6361083984375, 0.72686767578125, 0.817626953125, 0.90838623046875, 0.9991455078125, 1.08990478515625, 1.1806640625, 1.27142333984375, 1.3621826171875, 1.45294189453125, 1.543701171875, 1.63446044921875, 1.7252197265625, 1.81597900390625, 1.90673828125, 1.99749755859375, 2.0882568359375, 2.17901611328125, 2.269775390625, 2.36053466796875, 2.4512939453125, 2.54205322265625, 2.6328125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 9.0, 13.0, 17.0, 48.0, 73.0, 164.0, 530.0, 1897.0, 9016.0, 110470.0, 886027.0, 33799.0, 4728.0, 1166.0, 364.0, 107.0, 62.0, 29.0, 10.0, 6.0, 11.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7724609375, -0.7477874755859375, -0.723114013671875, -0.6984405517578125, -0.67376708984375, -0.6490936279296875, -0.624420166015625, -0.5997467041015625, -0.5750732421875, -0.5503997802734375, -0.525726318359375, -0.5010528564453125, -0.47637939453125, -0.4517059326171875, -0.427032470703125, -0.4023590087890625, -0.377685546875, -0.3530120849609375, -0.328338623046875, -0.3036651611328125, -0.27899169921875, -0.2543182373046875, -0.229644775390625, -0.2049713134765625, -0.1802978515625, -0.1556243896484375, -0.130950927734375, -0.1062774658203125, -0.08160400390625, -0.0569305419921875, -0.032257080078125, -0.0075836181640625, 0.01708984375, 0.0417633056640625, 0.066436767578125, 0.0911102294921875, 0.11578369140625, 0.1404571533203125, 0.165130615234375, 0.1898040771484375, 0.2144775390625, 0.2391510009765625, 0.263824462890625, 0.2884979248046875, 0.31317138671875, 0.3378448486328125, 0.362518310546875, 0.3871917724609375, 0.411865234375, 0.4365386962890625, 0.461212158203125, 0.4858856201171875, 0.51055908203125, 0.5352325439453125, 0.559906005859375, 0.5845794677734375, 0.6092529296875, 0.6339263916015625, 0.658599853515625, 0.6832733154296875, 0.70794677734375, 0.7326202392578125, 0.757293701171875, 0.7819671630859375, 0.806640625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 5.0, 4.0, 2.0, 4.0, 7.0, 14.0, 14.0, 19.0, 29.0, 37.0, 53.0, 99.0, 135.0, 172.0, 139.0, 76.0, 60.0, 44.0, 17.0, 15.0, 15.0, 16.0, 5.0, 6.0, 8.0, 6.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.684925079345703e-05, -4.5008957386016846e-05, -4.316866397857666e-05, -4.1328370571136475e-05, -3.948807716369629e-05, -3.7647783756256104e-05, -3.580749034881592e-05, -3.396719694137573e-05, -3.212690353393555e-05, -3.028661012649536e-05, -2.8446316719055176e-05, -2.660602331161499e-05, -2.4765729904174805e-05, -2.292543649673462e-05, -2.1085143089294434e-05, -1.9244849681854248e-05, -1.7404556274414062e-05, -1.5564262866973877e-05, -1.3723969459533691e-05, -1.1883676052093506e-05, -1.004338264465332e-05, -8.203089237213135e-06, -6.362795829772949e-06, -4.522502422332764e-06, -2.682209014892578e-06, -8.419156074523926e-07, 9.98377799987793e-07, 2.8386712074279785e-06, 4.678964614868164e-06, 6.51925802230835e-06, 8.359551429748535e-06, 1.019984483718872e-05, 1.2040138244628906e-05, 1.3880431652069092e-05, 1.5720725059509277e-05, 1.7561018466949463e-05, 1.940131187438965e-05, 2.1241605281829834e-05, 2.308189868927002e-05, 2.4922192096710205e-05, 2.676248550415039e-05, 2.8602778911590576e-05, 3.0443072319030762e-05, 3.228336572647095e-05, 3.412365913391113e-05, 3.596395254135132e-05, 3.7804245948791504e-05, 3.964453935623169e-05, 4.1484832763671875e-05, 4.332512617111206e-05, 4.5165419578552246e-05, 4.700571298599243e-05, 4.884600639343262e-05, 5.06862998008728e-05, 5.252659320831299e-05, 5.4366886615753174e-05, 5.620718002319336e-05, 5.8047473430633545e-05, 5.988776683807373e-05, 6.172806024551392e-05, 6.35683536529541e-05, 6.540864706039429e-05, 6.724894046783447e-05, 6.908923387527466e-05, 7.092952728271484e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 11.0, 15.0, 24.0, 31.0, 38.0, 76.0, 166.0, 285.0, 529.0, 1129.0, 2437.0, 5957.0, 18700.0, 103105.0, 777916.0, 107765.0, 19404.0, 6120.0, 2551.0, 1098.0, 548.0, 247.0, 150.0, 98.0, 39.0, 26.0, 32.0, 13.0, 7.0, 8.0, 5.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4248046875, -0.40936279296875, -0.3939208984375, -0.37847900390625, -0.363037109375, -0.34759521484375, -0.3321533203125, -0.31671142578125, -0.30126953125, -0.28582763671875, -0.2703857421875, -0.25494384765625, -0.239501953125, -0.22406005859375, -0.2086181640625, -0.19317626953125, -0.177734375, -0.16229248046875, -0.1468505859375, -0.13140869140625, -0.115966796875, -0.10052490234375, -0.0850830078125, -0.06964111328125, -0.05419921875, -0.03875732421875, -0.0233154296875, -0.00787353515625, 0.007568359375, 0.02301025390625, 0.0384521484375, 0.05389404296875, 0.0693359375, 0.08477783203125, 0.1002197265625, 0.11566162109375, 0.131103515625, 0.14654541015625, 0.1619873046875, 0.17742919921875, 0.19287109375, 0.20831298828125, 0.2237548828125, 0.23919677734375, 0.254638671875, 0.27008056640625, 0.2855224609375, 0.30096435546875, 0.31640625, 0.33184814453125, 0.3472900390625, 0.36273193359375, 0.378173828125, 0.39361572265625, 0.4090576171875, 0.42449951171875, 0.43994140625, 0.45538330078125, 0.4708251953125, 0.48626708984375, 0.501708984375, 0.51715087890625, 0.5325927734375, 0.54803466796875, 0.5634765625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 0.0, 6.0, 2.0, 10.0, 9.0, 9.0, 15.0, 20.0, 28.0, 34.0, 47.0, 68.0, 109.0, 145.0, 174.0, 99.0, 67.0, 38.0, 32.0, 16.0, 21.0, 17.0, 14.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.23828125, -0.23143959045410156, -0.22459793090820312, -0.2177562713623047, -0.21091461181640625, -0.2040729522705078, -0.19723129272460938, -0.19038963317871094, -0.1835479736328125, -0.17670631408691406, -0.16986465454101562, -0.1630229949951172, -0.15618133544921875, -0.1493396759033203, -0.14249801635742188, -0.13565635681152344, -0.128814697265625, -0.12197303771972656, -0.11513137817382812, -0.10828971862792969, -0.10144805908203125, -0.09460639953613281, -0.08776473999023438, -0.08092308044433594, -0.0740814208984375, -0.06723976135253906, -0.060398101806640625, -0.05355644226074219, -0.04671478271484375, -0.03987312316894531, -0.033031463623046875, -0.026189804077148438, -0.01934814453125, -0.012506484985351562, -0.005664825439453125, 0.0011768341064453125, 0.00801849365234375, 0.014860153198242188, 0.021701812744140625, 0.028543472290039062, 0.0353851318359375, 0.04222679138183594, 0.049068450927734375, 0.05591011047363281, 0.06275177001953125, 0.06959342956542969, 0.07643508911132812, 0.08327674865722656, 0.090118408203125, 0.09696006774902344, 0.10380172729492188, 0.11064338684082031, 0.11748504638671875, 0.12432670593261719, 0.13116836547851562, 0.13801002502441406, 0.1448516845703125, 0.15169334411621094, 0.15853500366210938, 0.1653766632080078, 0.17221832275390625, 0.1790599822998047, 0.18590164184570312, 0.19274330139160156, 0.1995849609375]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 9.0, 12.0, 19.0, 51.0, 67.0, 125.0, 141.0, 173.0, 158.0, 91.0, 62.0, 44.0, 23.0, 13.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7016072273254395, -3.549748420715332, -3.3978896141052246, -3.2460310459136963, -3.094172239303589, -2.9423134326934814, -2.790454864501953, -2.6385960578918457, -2.4867372512817383, -2.334878444671631, -2.1830196380615234, -2.031161069869995, -1.8793022632598877, -1.7274434566497803, -1.5755847692489624, -1.4237260818481445, -1.271867275238037, -1.1200084686279297, -0.9681497812271118, -0.8162910342216492, -0.6644322872161865, -0.5125735402107239, -0.36071479320526123, -0.20885610580444336, -0.05699729919433594, 0.09486144781112671, 0.24672019481658936, 0.398578941822052, 0.5504376888275146, 0.7022964358329773, 0.8541551828384399, 1.0060138702392578, 1.1578731536865234, 1.3097319602966309, 1.4615906476974487, 1.6134493350982666, 1.765308141708374, 1.9171669483184814, 2.0690255165100098, 2.220884323120117, 2.3727431297302246, 2.524601936340332, 2.6764607429504395, 2.8283193111419678, 2.980178117752075, 3.1320369243621826, 3.283895492553711, 3.4357542991638184, 3.587613105773926, 3.739471912384033, 3.8913307189941406, 4.043189525604248, 4.1950483322143555, 4.346906661987305, 4.498765468597412, 4.6506242752075195, 4.802483081817627, 4.954341888427734, 5.106200695037842, 5.258059501647949, 5.409917831420898, 5.561776638031006, 5.713635444641113, 5.865494251251221, 6.017353057861328]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 6.0, 5.0, 4.0, 6.0, 6.0, 12.0, 15.0, 17.0, 21.0, 26.0, 28.0, 21.0, 45.0, 37.0, 43.0, 46.0, 44.0, 44.0, 53.0, 57.0, 59.0, 43.0, 31.0, 41.0, 32.0, 26.0, 32.0, 25.0, 16.0, 21.0, 20.0, 26.0, 15.0, 17.0, 14.0, 10.0, 11.0, 6.0, 5.0, 9.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.724957466125488, -4.592073440551758, -4.459189414978027, -4.326305389404297, -4.193421363830566, -4.060537338256836, -3.9276533126831055, -3.794769287109375, -3.6618852615356445, -3.529001235961914, -3.3961172103881836, -3.263233184814453, -3.1303491592407227, -2.997465133666992, -2.8645811080932617, -2.7316970825195312, -2.598813056945801, -2.4659290313720703, -2.33304500579834, -2.2001609802246094, -2.067276954650879, -1.9343929290771484, -1.801508903503418, -1.6686248779296875, -1.535740852355957, -1.4028568267822266, -1.269972801208496, -1.1370887756347656, -1.0042047500610352, -0.8713207244873047, -0.7384366989135742, -0.6055526733398438, -0.4726686477661133, -0.3397846221923828, -0.20690059661865234, -0.07401657104492188, 0.058867454528808594, 0.19175148010253906, 0.32463550567626953, 0.45751953125, 0.5904035568237305, 0.7232875823974609, 0.8561716079711914, 0.9890556335449219, 1.1219396591186523, 1.2548236846923828, 1.3877077102661133, 1.5205917358398438, 1.6534757614135742, 1.7863597869873047, 1.9192438125610352, 2.0521278381347656, 2.185011863708496, 2.3178958892822266, 2.450779914855957, 2.5836639404296875, 2.716547966003418, 2.8494319915771484, 2.982316017150879, 3.1152000427246094, 3.24808406829834, 3.3809680938720703, 3.513852119445801, 3.6467361450195312, 3.7796201705932617]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 4.0, 3.0, 12.0, 10.0, 15.0, 10.0, 17.0, 28.0, 30.0, 54.0, 68.0, 128.0, 184.0, 272.0, 422.0, 728.0, 1599.0, 3455.0, 10471.0, 153885.0, 3889027.0, 116709.0, 10513.0, 3272.0, 1427.0, 747.0, 394.0, 264.0, 146.0, 106.0, 79.0, 60.0, 42.0, 44.0, 22.0, 13.0, 8.0, 12.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1875, -3.07147216796875, -2.9554443359375, -2.83941650390625, -2.723388671875, -2.60736083984375, -2.4913330078125, -2.37530517578125, -2.25927734375, -2.14324951171875, -2.0272216796875, -1.91119384765625, -1.795166015625, -1.67913818359375, -1.5631103515625, -1.44708251953125, -1.3310546875, -1.21502685546875, -1.0989990234375, -0.98297119140625, -0.866943359375, -0.75091552734375, -0.6348876953125, -0.51885986328125, -0.40283203125, -0.28680419921875, -0.1707763671875, -0.05474853515625, 0.061279296875, 0.17730712890625, 0.2933349609375, 0.40936279296875, 0.525390625, 0.64141845703125, 0.7574462890625, 0.87347412109375, 0.989501953125, 1.10552978515625, 1.2215576171875, 1.33758544921875, 1.45361328125, 1.56964111328125, 1.6856689453125, 1.80169677734375, 1.917724609375, 2.03375244140625, 2.1497802734375, 2.26580810546875, 2.3818359375, 2.49786376953125, 2.6138916015625, 2.72991943359375, 2.845947265625, 2.96197509765625, 3.0780029296875, 3.19403076171875, 3.31005859375, 3.42608642578125, 3.5421142578125, 3.65814208984375, 3.774169921875, 3.89019775390625, 4.0062255859375, 4.12225341796875, 4.23828125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 10.0, 12.0, 14.0, 26.0, 41.0, 31.0, 39.0, 50.0, 41.0, 77.0, 69.0, 64.0, 78.0, 66.0, 64.0, 46.0, 50.0, 56.0, 35.0, 30.0, 36.0, 16.0, 17.0, 10.0, 6.0, 7.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6455078125, -1.603607177734375, -1.56170654296875, -1.519805908203125, -1.4779052734375, -1.436004638671875, -1.39410400390625, -1.352203369140625, -1.310302734375, -1.268402099609375, -1.22650146484375, -1.184600830078125, -1.1427001953125, -1.100799560546875, -1.05889892578125, -1.016998291015625, -0.97509765625, -0.933197021484375, -0.89129638671875, -0.849395751953125, -0.8074951171875, -0.765594482421875, -0.72369384765625, -0.681793212890625, -0.639892578125, -0.597991943359375, -0.55609130859375, -0.514190673828125, -0.4722900390625, -0.430389404296875, -0.38848876953125, -0.346588134765625, -0.3046875, -0.262786865234375, -0.22088623046875, -0.178985595703125, -0.1370849609375, -0.095184326171875, -0.05328369140625, -0.011383056640625, 0.030517578125, 0.072418212890625, 0.11431884765625, 0.156219482421875, 0.1981201171875, 0.240020751953125, 0.28192138671875, 0.323822021484375, 0.36572265625, 0.407623291015625, 0.44952392578125, 0.491424560546875, 0.5333251953125, 0.575225830078125, 0.61712646484375, 0.659027099609375, 0.700927734375, 0.742828369140625, 0.78472900390625, 0.826629638671875, 0.8685302734375, 0.910430908203125, 0.95233154296875, 0.994232177734375, 1.0361328125]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 8.0, 15.0, 17.0, 11.0, 18.0, 35.0, 65.0, 131.0, 390.0, 1726.0, 11728.0, 572349.0, 3583217.0, 21307.0, 2349.0, 530.0, 173.0, 82.0, 48.0, 24.0, 17.0, 13.0, 8.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.546875, -6.395050048828125, -6.24322509765625, -6.091400146484375, -5.9395751953125, -5.787750244140625, -5.63592529296875, -5.484100341796875, -5.332275390625, -5.180450439453125, -5.02862548828125, -4.876800537109375, -4.7249755859375, -4.573150634765625, -4.42132568359375, -4.269500732421875, -4.11767578125, -3.965850830078125, -3.81402587890625, -3.662200927734375, -3.5103759765625, -3.358551025390625, -3.20672607421875, -3.054901123046875, -2.903076171875, -2.751251220703125, -2.59942626953125, -2.447601318359375, -2.2957763671875, -2.143951416015625, -1.99212646484375, -1.840301513671875, -1.6884765625, -1.536651611328125, -1.38482666015625, -1.233001708984375, -1.0811767578125, -0.929351806640625, -0.77752685546875, -0.625701904296875, -0.473876953125, -0.322052001953125, -0.17022705078125, -0.018402099609375, 0.1334228515625, 0.285247802734375, 0.43707275390625, 0.588897705078125, 0.74072265625, 0.892547607421875, 1.04437255859375, 1.196197509765625, 1.3480224609375, 1.499847412109375, 1.65167236328125, 1.803497314453125, 1.955322265625, 2.107147216796875, 2.25897216796875, 2.410797119140625, 2.5626220703125, 2.714447021484375, 2.86627197265625, 3.018096923828125, 3.169921875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 7.0, 3.0, 9.0, 13.0, 13.0, 12.0, 25.0, 22.0, 41.0, 87.0, 171.0, 347.0, 739.0, 1026.0, 725.0, 367.0, 191.0, 96.0, 52.0, 36.0, 22.0, 15.0, 12.0, 10.0, 10.0, 2.0, 3.0, 3.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.591796875, -0.5676803588867188, -0.5435638427734375, -0.5194473266601562, -0.495330810546875, -0.47121429443359375, -0.4470977783203125, -0.42298126220703125, -0.39886474609375, -0.37474822998046875, -0.3506317138671875, -0.32651519775390625, -0.302398681640625, -0.27828216552734375, -0.2541656494140625, -0.23004913330078125, -0.2059326171875, -0.18181610107421875, -0.1576995849609375, -0.13358306884765625, -0.109466552734375, -0.08535003662109375, -0.0612335205078125, -0.03711700439453125, -0.01300048828125, 0.01111602783203125, 0.0352325439453125, 0.05934906005859375, 0.083465576171875, 0.10758209228515625, 0.1316986083984375, 0.15581512451171875, 0.179931640625, 0.20404815673828125, 0.2281646728515625, 0.25228118896484375, 0.276397705078125, 0.30051422119140625, 0.3246307373046875, 0.34874725341796875, 0.37286376953125, 0.39698028564453125, 0.4210968017578125, 0.44521331787109375, 0.469329833984375, 0.49344635009765625, 0.5175628662109375, 0.5416793823242188, 0.5657958984375, 0.5899124145507812, 0.6140289306640625, 0.6381454467773438, 0.662261962890625, 0.6863784790039062, 0.7104949951171875, 0.7346115112304688, 0.75872802734375, 0.7828445434570312, 0.8069610595703125, 0.8310775756835938, 0.855194091796875, 0.8793106079101562, 0.9034271240234375, 0.9275436401367188, 0.95166015625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 4.0, 1.0, 2.0, 6.0, 6.0, 8.0, 4.0, 15.0, 8.0, 16.0, 16.0, 29.0, 25.0, 26.0, 44.0, 40.0, 53.0, 54.0, 56.0, 53.0, 64.0, 63.0, 67.0, 65.0, 51.0, 43.0, 33.0, 31.0, 15.0, 16.0, 18.0, 18.0, 13.0, 12.0, 10.0, 4.0, 7.0, 7.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2557870149612427, -1.2156645059585571, -1.1755421161651611, -1.1354196071624756, -1.0952972173690796, -1.055174708366394, -1.015052318572998, -0.9749298095703125, -0.9348074197769165, -0.8946849703788757, -0.854562520980835, -0.8144400715827942, -0.7743176221847534, -0.7341951727867126, -0.6940727233886719, -0.6539502143859863, -0.6138277649879456, -0.5737053155899048, -0.533582866191864, -0.49346041679382324, -0.45333796739578247, -0.4132155179977417, -0.37309303879737854, -0.33297058939933777, -0.292848140001297, -0.2527256906032562, -0.21260324120521545, -0.1724807769060135, -0.13235832750797272, -0.09223587810993195, -0.05211341381072998, -0.011990964412689209, 0.028131484985351562, 0.06825393438339233, 0.1083763912320137, 0.14849884808063507, 0.18862129747867584, 0.2287437468767166, 0.2688662111759186, 0.30898866057395935, 0.3491111099720001, 0.3892335593700409, 0.42935600876808167, 0.4694784879684448, 0.5096009373664856, 0.5497233867645264, 0.5898458361625671, 0.6299682855606079, 0.6700907349586487, 0.7102131843566895, 0.7503356337547302, 0.790458083152771, 0.8305805325508118, 0.8707029819488525, 0.9108254909515381, 0.9509478807449341, 0.9910703897476196, 1.0311928987503052, 1.0713152885437012, 1.1114377975463867, 1.1515601873397827, 1.1916826963424683, 1.2318050861358643, 1.2719275951385498, 1.3120499849319458]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 2.0, 5.0, 7.0, 13.0, 9.0, 17.0, 17.0, 20.0, 22.0, 16.0, 29.0, 32.0, 36.0, 33.0, 45.0, 44.0, 45.0, 48.0, 44.0, 38.0, 43.0, 48.0, 50.0, 56.0, 29.0, 42.0, 36.0, 29.0, 32.0, 25.0, 15.0, 16.0, 8.0, 18.0, 6.0, 7.0, 6.0, 5.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1805386543273926, -1.1423274278640747, -1.1041163206100464, -1.0659050941467285, -1.0276939868927002, -0.9894827604293823, -0.9512715339660645, -0.9130603671073914, -0.8748492002487183, -0.8366380333900452, -0.7984268665313721, -0.7602156400680542, -0.7220044732093811, -0.683793306350708, -0.6455820798873901, -0.607370913028717, -0.569159746170044, -0.5309485793113708, -0.49273738265037537, -0.4545261859893799, -0.4163150191307068, -0.3781038522720337, -0.3398926556110382, -0.3016814589500427, -0.26347029209136963, -0.22525911033153534, -0.18704792857170105, -0.14883674681186676, -0.11062556505203247, -0.07241438329219818, -0.03420320153236389, 0.004007995128631592, 0.04221928119659424, 0.08043046295642853, 0.11864164471626282, 0.1568528264760971, 0.1950640082359314, 0.23327518999576569, 0.2714863717556, 0.30969756841659546, 0.34790873527526855, 0.38611990213394165, 0.42433109879493713, 0.4625422954559326, 0.5007534623146057, 0.5389646291732788, 0.5771758556365967, 0.6153870224952698, 0.6535981893539429, 0.691809356212616, 0.7300205230712891, 0.7682317495346069, 0.80644291639328, 0.8446540832519531, 0.882865309715271, 0.9210764765739441, 0.9592876434326172, 0.9974988102912903, 1.0357099771499634, 1.0739212036132812, 1.1121323108673096, 1.1503435373306274, 1.1885547637939453, 1.2267658710479736, 1.2649770975112915]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 13.0, 10.0, 17.0, 29.0, 42.0, 60.0, 93.0, 155.0, 245.0, 386.0, 709.0, 1476.0, 6627.0, 84166.0, 874226.0, 71291.0, 5884.0, 1440.0, 649.0, 355.0, 236.0, 156.0, 100.0, 66.0, 49.0, 23.0, 14.0, 12.0, 11.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50537109375, -0.48697662353515625, -0.4685821533203125, -0.45018768310546875, -0.431793212890625, -0.41339874267578125, -0.3950042724609375, -0.37660980224609375, -0.35821533203125, -0.33982086181640625, -0.3214263916015625, -0.30303192138671875, -0.284637451171875, -0.26624298095703125, -0.2478485107421875, -0.22945404052734375, -0.2110595703125, -0.19266510009765625, -0.1742706298828125, -0.15587615966796875, -0.137481689453125, -0.11908721923828125, -0.1006927490234375, -0.08229827880859375, -0.06390380859375, -0.04550933837890625, -0.0271148681640625, -0.00872039794921875, 0.009674072265625, 0.02806854248046875, 0.0464630126953125, 0.06485748291015625, 0.083251953125, 0.10164642333984375, 0.1200408935546875, 0.13843536376953125, 0.156829833984375, 0.17522430419921875, 0.1936187744140625, 0.21201324462890625, 0.23040771484375, 0.24880218505859375, 0.2671966552734375, 0.28559112548828125, 0.303985595703125, 0.32238006591796875, 0.3407745361328125, 0.35916900634765625, 0.3775634765625, 0.39595794677734375, 0.4143524169921875, 0.43274688720703125, 0.451141357421875, 0.46953582763671875, 0.4879302978515625, 0.5063247680664062, 0.52471923828125, 0.5431137084960938, 0.5615081787109375, 0.5799026489257812, 0.598297119140625, 0.6166915893554688, 0.6350860595703125, 0.6534805297851562, 0.671875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 1.0, 3.0, 10.0, 9.0, 13.0, 17.0, 20.0, 23.0, 24.0, 27.0, 42.0, 47.0, 50.0, 46.0, 49.0, 61.0, 50.0, 55.0, 46.0, 62.0, 67.0, 44.0, 42.0, 42.0, 27.0, 37.0, 27.0, 17.0, 10.0, 11.0, 8.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-1.1650390625, -1.1351470947265625, -1.105255126953125, -1.0753631591796875, -1.04547119140625, -1.0155792236328125, -0.985687255859375, -0.9557952880859375, -0.9259033203125, -0.8960113525390625, -0.866119384765625, -0.8362274169921875, -0.80633544921875, -0.7764434814453125, -0.746551513671875, -0.7166595458984375, -0.686767578125, -0.6568756103515625, -0.626983642578125, -0.5970916748046875, -0.56719970703125, -0.5373077392578125, -0.507415771484375, -0.4775238037109375, -0.4476318359375, -0.4177398681640625, -0.387847900390625, -0.3579559326171875, -0.32806396484375, -0.2981719970703125, -0.268280029296875, -0.2383880615234375, -0.20849609375, -0.1786041259765625, -0.148712158203125, -0.1188201904296875, -0.08892822265625, -0.0590362548828125, -0.029144287109375, 0.0007476806640625, 0.0306396484375, 0.0605316162109375, 0.090423583984375, 0.1203155517578125, 0.15020751953125, 0.1800994873046875, 0.209991455078125, 0.2398834228515625, 0.269775390625, 0.2996673583984375, 0.329559326171875, 0.3594512939453125, 0.38934326171875, 0.4192352294921875, 0.449127197265625, 0.4790191650390625, 0.5089111328125, 0.5388031005859375, 0.568695068359375, 0.5985870361328125, 0.62847900390625, 0.6583709716796875, 0.688262939453125, 0.7181549072265625, 0.748046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 6.0, 10.0, 16.0, 24.0, 43.0, 65.0, 137.0, 239.0, 390.0, 811.0, 1511.0, 3021.0, 6077.0, 12813.0, 28712.0, 69274.0, 192597.0, 386736.0, 211159.0, 75781.0, 31095.0, 14129.0, 6716.0, 3367.0, 1690.0, 923.0, 510.0, 266.0, 156.0, 93.0, 66.0, 46.0, 22.0, 19.0, 13.0, 9.0, 6.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.092041015625, -0.08843803405761719, -0.08483505249023438, -0.08123207092285156, -0.07762908935546875, -0.07402610778808594, -0.07042312622070312, -0.06682014465332031, -0.0632171630859375, -0.05961418151855469, -0.056011199951171875, -0.05240821838378906, -0.04880523681640625, -0.04520225524902344, -0.041599273681640625, -0.03799629211425781, -0.034393310546875, -0.030790328979492188, -0.027187347412109375, -0.023584365844726562, -0.01998138427734375, -0.016378402709960938, -0.012775421142578125, -0.009172439575195312, -0.0055694580078125, -0.0019664764404296875, 0.001636505126953125, 0.0052394866943359375, 0.00884246826171875, 0.012445449829101562, 0.016048431396484375, 0.019651412963867188, 0.02325439453125, 0.026857376098632812, 0.030460357666015625, 0.03406333923339844, 0.03766632080078125, 0.04126930236816406, 0.044872283935546875, 0.04847526550292969, 0.0520782470703125, 0.05568122863769531, 0.059284210205078125, 0.06288719177246094, 0.06649017333984375, 0.07009315490722656, 0.07369613647460938, 0.07729911804199219, 0.080902099609375, 0.08450508117675781, 0.08810806274414062, 0.09171104431152344, 0.09531402587890625, 0.09891700744628906, 0.10251998901367188, 0.10612297058105469, 0.1097259521484375, 0.11332893371582031, 0.11693191528320312, 0.12053489685058594, 0.12413787841796875, 0.12774085998535156, 0.13134384155273438, 0.1349468231201172, 0.1385498046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 7.0, 10.0, 12.0, 17.0, 21.0, 16.0, 23.0, 16.0, 19.0, 34.0, 48.0, 43.0, 43.0, 40.0, 56.0, 42.0, 58.0, 56.0, 50.0, 52.0, 42.0, 40.0, 33.0, 40.0, 25.0, 19.0, 20.0, 22.0, 13.0, 14.0, 11.0, 17.0, 5.0, 8.0, 5.0, 7.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.517578125, -1.457763671875, -1.39794921875, -1.338134765625, -1.2783203125, -1.218505859375, -1.15869140625, -1.098876953125, -1.0390625, -0.979248046875, -0.91943359375, -0.859619140625, -0.7998046875, -0.739990234375, -0.68017578125, -0.620361328125, -0.560546875, -0.500732421875, -0.44091796875, -0.381103515625, -0.3212890625, -0.261474609375, -0.20166015625, -0.141845703125, -0.08203125, -0.022216796875, 0.03759765625, 0.097412109375, 0.1572265625, 0.217041015625, 0.27685546875, 0.336669921875, 0.396484375, 0.456298828125, 0.51611328125, 0.575927734375, 0.6357421875, 0.695556640625, 0.75537109375, 0.815185546875, 0.875, 0.934814453125, 0.99462890625, 1.054443359375, 1.1142578125, 1.174072265625, 1.23388671875, 1.293701171875, 1.353515625, 1.413330078125, 1.47314453125, 1.532958984375, 1.5927734375, 1.652587890625, 1.71240234375, 1.772216796875, 1.83203125, 1.891845703125, 1.95166015625, 2.011474609375, 2.0712890625, 2.131103515625, 2.19091796875, 2.250732421875, 2.310546875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 4.0, 9.0, 12.0, 13.0, 18.0, 33.0, 48.0, 76.0, 119.0, 208.0, 332.0, 654.0, 1190.0, 2518.0, 5671.0, 16760.0, 91637.0, 729429.0, 162760.0, 23495.0, 7244.0, 3036.0, 1459.0, 789.0, 451.0, 232.0, 116.0, 73.0, 62.0, 43.0, 22.0, 14.0, 9.0, 5.0, 2.0, 7.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0467529296875, -0.04540252685546875, -0.0440521240234375, -0.04270172119140625, -0.041351318359375, -0.04000091552734375, -0.0386505126953125, -0.03730010986328125, -0.03594970703125, -0.03459930419921875, -0.0332489013671875, -0.03189849853515625, -0.030548095703125, -0.02919769287109375, -0.0278472900390625, -0.02649688720703125, -0.025146484375, -0.02379608154296875, -0.0224456787109375, -0.02109527587890625, -0.019744873046875, -0.01839447021484375, -0.0170440673828125, -0.01569366455078125, -0.01434326171875, -0.01299285888671875, -0.0116424560546875, -0.01029205322265625, -0.008941650390625, -0.00759124755859375, -0.0062408447265625, -0.00489044189453125, -0.0035400390625, -0.00218963623046875, -0.0008392333984375, 0.00051116943359375, 0.001861572265625, 0.00321197509765625, 0.0045623779296875, 0.00591278076171875, 0.00726318359375, 0.00861358642578125, 0.0099639892578125, 0.01131439208984375, 0.012664794921875, 0.01401519775390625, 0.0153656005859375, 0.01671600341796875, 0.01806640625, 0.01941680908203125, 0.0207672119140625, 0.02211761474609375, 0.023468017578125, 0.02481842041015625, 0.0261688232421875, 0.02751922607421875, 0.02886962890625, 0.03022003173828125, 0.0315704345703125, 0.03292083740234375, 0.034271240234375, 0.03562164306640625, 0.0369720458984375, 0.03832244873046875, 0.0396728515625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 10.0, 13.0, 13.0, 28.0, 43.0, 64.0, 90.0, 155.0, 162.0, 140.0, 93.0, 66.0, 42.0, 21.0, 13.0, 11.0, 11.0, 2.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.224082946777344e-05, -7.024593651294708e-05, -6.825104355812073e-05, -6.625615060329437e-05, -6.426125764846802e-05, -6.226636469364166e-05, -6.027147173881531e-05, -5.827657878398895e-05, -5.62816858291626e-05, -5.428679287433624e-05, -5.229189991950989e-05, -5.029700696468353e-05, -4.830211400985718e-05, -4.630722105503082e-05, -4.431232810020447e-05, -4.231743514537811e-05, -4.032254219055176e-05, -3.83276492357254e-05, -3.633275628089905e-05, -3.433786332607269e-05, -3.234297037124634e-05, -3.0348077416419983e-05, -2.8353184461593628e-05, -2.6358291506767273e-05, -2.4363398551940918e-05, -2.2368505597114563e-05, -2.0373612642288208e-05, -1.8378719687461853e-05, -1.6383826732635498e-05, -1.4388933777809143e-05, -1.2394040822982788e-05, -1.0399147868156433e-05, -8.404254913330078e-06, -6.409361958503723e-06, -4.414469003677368e-06, -2.419576048851013e-06, -4.246830940246582e-07, 1.5702098608016968e-06, 3.5651028156280518e-06, 5.559995770454407e-06, 7.554888725280762e-06, 9.549781680107117e-06, 1.1544674634933472e-05, 1.3539567589759827e-05, 1.553446054458618e-05, 1.7529353499412537e-05, 1.952424645423889e-05, 2.1519139409065247e-05, 2.35140323638916e-05, 2.5508925318717957e-05, 2.750381827354431e-05, 2.9498711228370667e-05, 3.149360418319702e-05, 3.3488497138023376e-05, 3.548339009284973e-05, 3.7478283047676086e-05, 3.947317600250244e-05, 4.1468068957328796e-05, 4.346296191215515e-05, 4.5457854866981506e-05, 4.745274782180786e-05, 4.9447640776634216e-05, 5.144253373146057e-05, 5.3437426686286926e-05, 5.543231964111328e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 8.0, 10.0, 14.0, 27.0, 37.0, 53.0, 61.0, 100.0, 123.0, 232.0, 362.0, 546.0, 835.0, 1162.0, 1919.0, 3200.0, 5601.0, 11021.0, 22174.0, 51623.0, 159753.0, 478692.0, 197756.0, 60038.0, 25161.0, 12226.0, 6247.0, 3498.0, 2097.0, 1333.0, 818.0, 591.0, 373.0, 264.0, 175.0, 137.0, 97.0, 55.0, 43.0, 24.0, 17.0, 18.0, 11.0, 8.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.022186279296875, -0.021505355834960938, -0.020824432373046875, -0.020143508911132812, -0.01946258544921875, -0.018781661987304688, -0.018100738525390625, -0.017419815063476562, -0.0167388916015625, -0.016057968139648438, -0.015377044677734375, -0.014696121215820312, -0.01401519775390625, -0.013334274291992188, -0.012653350830078125, -0.011972427368164062, -0.01129150390625, -0.010610580444335938, -0.009929656982421875, -0.009248733520507812, -0.00856781005859375, -0.007886886596679688, -0.007205963134765625, -0.0065250396728515625, -0.0058441162109375, -0.0051631927490234375, -0.004482269287109375, -0.0038013458251953125, -0.00312042236328125, -0.0024394989013671875, -0.001758575439453125, -0.0010776519775390625, -0.000396728515625, 0.0002841949462890625, 0.000965118408203125, 0.0016460418701171875, 0.00232696533203125, 0.0030078887939453125, 0.003688812255859375, 0.0043697357177734375, 0.0050506591796875, 0.0057315826416015625, 0.006412506103515625, 0.0070934295654296875, 0.00777435302734375, 0.008455276489257812, 0.009136199951171875, 0.009817123413085938, 0.010498046875, 0.011178970336914062, 0.011859893798828125, 0.012540817260742188, 0.01322174072265625, 0.013902664184570312, 0.014583587646484375, 0.015264511108398438, 0.0159454345703125, 0.016626358032226562, 0.017307281494140625, 0.017988204956054688, 0.01866912841796875, 0.019350051879882812, 0.020030975341796875, 0.020711898803710938, 0.021392822265625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 6.0, 4.0, 9.0, 8.0, 12.0, 6.0, 21.0, 31.0, 28.0, 33.0, 58.0, 60.0, 81.0, 89.0, 123.0, 100.0, 71.0, 68.0, 34.0, 36.0, 24.0, 23.0, 12.0, 20.0, 11.0, 10.0, 8.0, 6.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.01230621337890625, -0.011949419975280762, -0.011592626571655273, -0.011235833168029785, -0.010879039764404297, -0.010522246360778809, -0.01016545295715332, -0.009808659553527832, -0.009451866149902344, -0.009095072746276855, -0.008738279342651367, -0.008381485939025879, -0.00802469253540039, -0.007667899131774902, -0.007311105728149414, -0.006954312324523926, -0.0065975189208984375, -0.006240725517272949, -0.005883932113647461, -0.005527138710021973, -0.005170345306396484, -0.004813551902770996, -0.004456758499145508, -0.0040999650955200195, -0.0037431716918945312, -0.003386378288269043, -0.0030295848846435547, -0.0026727914810180664, -0.002315998077392578, -0.00195920467376709, -0.0016024112701416016, -0.0012456178665161133, -0.000888824462890625, -0.0005320310592651367, -0.00017523765563964844, 0.00018155574798583984, 0.0005383491516113281, 0.0008951425552368164, 0.0012519359588623047, 0.001608729362487793, 0.0019655227661132812, 0.0023223161697387695, 0.002679109573364258, 0.003035902976989746, 0.0033926963806152344, 0.0037494897842407227, 0.004106283187866211, 0.004463076591491699, 0.0048198699951171875, 0.005176663398742676, 0.005533456802368164, 0.005890250205993652, 0.006247043609619141, 0.006603837013244629, 0.006960630416870117, 0.0073174238204956055, 0.007674217224121094, 0.008031010627746582, 0.00838780403137207, 0.008744597434997559, 0.009101390838623047, 0.009458184242248535, 0.009814977645874023, 0.010171771049499512, 0.010528564453125]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 8.0, 14.0, 15.0, 17.0, 30.0, 41.0, 55.0, 68.0, 92.0, 83.0, 88.0, 96.0, 99.0, 81.0, 59.0, 35.0, 28.0, 25.0, 23.0, 13.0, 13.0, 8.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9561367630958557, -0.9189280867576599, -0.8817194700241089, -0.8445107936859131, -0.8073021769523621, -0.7700935006141663, -0.7328848838806152, -0.6956762075424194, -0.6584675312042236, -0.6212588548660278, -0.5840502381324768, -0.546841561794281, -0.50963294506073, -0.4724242687225342, -0.43521562218666077, -0.39800697565078735, -0.36079835891723633, -0.3235897123813629, -0.2863810658454895, -0.2491724044084549, -0.21196375787258148, -0.17475511133670807, -0.13754644989967346, -0.10033780336380005, -0.06312915682792664, -0.025920506566762924, 0.011288143694400787, 0.0484967976808548, 0.08570544421672821, 0.12291409075260162, 0.16012275218963623, 0.19733139872550964, 0.23453998565673828, 0.2717486321926117, 0.3089572787284851, 0.3461659550666809, 0.38337457180023193, 0.42058324813842773, 0.45779189467430115, 0.49500054121017456, 0.5322091579437256, 0.5694178342819214, 0.6066264510154724, 0.6438351273536682, 0.6810437440872192, 0.718252420425415, 0.7554610967636108, 0.7926697134971619, 0.8298783898353577, 0.8670870661735535, 0.9042956829071045, 0.9415043592453003, 0.9787129759788513, 1.0159215927124023, 1.0531302690505981, 1.090338945388794, 1.1275476217269897, 1.1647562980651855, 1.2019649744033813, 1.2391735315322876, 1.2763822078704834, 1.3135908842086792, 1.350799560546875, 1.3880081176757812, 1.425216794013977]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 7.0, 5.0, 10.0, 18.0, 21.0, 20.0, 25.0, 31.0, 40.0, 39.0, 53.0, 52.0, 61.0, 55.0, 59.0, 52.0, 55.0, 74.0, 50.0, 49.0, 43.0, 42.0, 35.0, 25.0, 12.0, 22.0, 13.0, 11.0, 7.0, 5.0, 6.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.142427682876587, -1.1125179529190063, -1.0826082229614258, -1.0526986122131348, -1.0227888822555542, -0.9928791522979736, -0.9629694223403931, -0.9330596923828125, -0.9031500220298767, -0.8732402920722961, -0.8433306217193604, -0.8134208917617798, -0.7835111618041992, -0.7536014914512634, -0.7236917614936829, -0.6937820911407471, -0.6638723611831665, -0.6339626312255859, -0.6040529608726501, -0.5741432309150696, -0.5442335605621338, -0.5143238306045532, -0.48441410064697266, -0.4545044004917145, -0.4245947003364563, -0.3946850001811981, -0.36477530002593994, -0.3348655700683594, -0.3049558699131012, -0.275046169757843, -0.24513645470142365, -0.21522673964500427, -0.18531709909439087, -0.1554073989391327, -0.12549768388271332, -0.09558797627687454, -0.06567826867103577, -0.03576856851577759, -0.005858853459358215, 0.024050861597061157, 0.053960561752319336, 0.08387026935815811, 0.11377997696399689, 0.14368969202041626, 0.17359939217567444, 0.20350909233093262, 0.233418807387352, 0.26332852244377136, 0.29323822259902954, 0.3231479227542877, 0.3530576229095459, 0.38296735286712646, 0.41287705302238464, 0.4427867531776428, 0.4726964831352234, 0.5026061534881592, 0.5325158834457397, 0.5624256134033203, 0.5923352837562561, 0.6222450137138367, 0.6521546840667725, 0.682064414024353, 0.7119741439819336, 0.7418838739395142, 0.77179354429245]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 0.0, 10.0, 8.0, 10.0, 11.0, 24.0, 35.0, 37.0, 67.0, 107.0, 208.0, 318.0, 520.0, 863.0, 1568.0, 2782.0, 5439.0, 11041.0, 23903.0, 58227.0, 194825.0, 502601.0, 154633.0, 49755.0, 20848.0, 9704.0, 4934.0, 2561.0, 1509.0, 754.0, 511.0, 274.0, 171.0, 104.0, 61.0, 29.0, 35.0, 23.0, 9.0, 13.0, 6.0, 2.0, 5.0, 5.0, 1.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2578125, -1.215057373046875, -1.17230224609375, -1.129547119140625, -1.0867919921875, -1.044036865234375, -1.00128173828125, -0.958526611328125, -0.915771484375, -0.873016357421875, -0.83026123046875, -0.787506103515625, -0.7447509765625, -0.701995849609375, -0.65924072265625, -0.616485595703125, -0.57373046875, -0.530975341796875, -0.48822021484375, -0.445465087890625, -0.4027099609375, -0.359954833984375, -0.31719970703125, -0.274444580078125, -0.231689453125, -0.188934326171875, -0.14617919921875, -0.103424072265625, -0.0606689453125, -0.017913818359375, 0.02484130859375, 0.067596435546875, 0.1103515625, 0.153106689453125, 0.19586181640625, 0.238616943359375, 0.2813720703125, 0.324127197265625, 0.36688232421875, 0.409637451171875, 0.452392578125, 0.495147705078125, 0.53790283203125, 0.580657958984375, 0.6234130859375, 0.666168212890625, 0.70892333984375, 0.751678466796875, 0.79443359375, 0.837188720703125, 0.87994384765625, 0.922698974609375, 0.9654541015625, 1.008209228515625, 1.05096435546875, 1.093719482421875, 1.136474609375, 1.179229736328125, 1.22198486328125, 1.264739990234375, 1.3074951171875, 1.350250244140625, 1.39300537109375, 1.435760498046875, 1.478515625]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 5.0, 5.0, 2.0, 8.0, 8.0, 8.0, 9.0, 17.0, 27.0, 21.0, 27.0, 28.0, 31.0, 31.0, 31.0, 46.0, 45.0, 66.0, 50.0, 44.0, 53.0, 53.0, 48.0, 51.0, 39.0, 36.0, 32.0, 39.0, 24.0, 21.0, 21.0, 18.0, 9.0, 11.0, 15.0, 4.0, 8.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.4013671875, -1.359893798828125, -1.31842041015625, -1.276947021484375, -1.2354736328125, -1.194000244140625, -1.15252685546875, -1.111053466796875, -1.069580078125, -1.028106689453125, -0.98663330078125, -0.945159912109375, -0.9036865234375, -0.862213134765625, -0.82073974609375, -0.779266357421875, -0.73779296875, -0.696319580078125, -0.65484619140625, -0.613372802734375, -0.5718994140625, -0.530426025390625, -0.48895263671875, -0.447479248046875, -0.406005859375, -0.364532470703125, -0.32305908203125, -0.281585693359375, -0.2401123046875, -0.198638916015625, -0.15716552734375, -0.115692138671875, -0.07421875, -0.032745361328125, 0.00872802734375, 0.050201416015625, 0.0916748046875, 0.133148193359375, 0.17462158203125, 0.216094970703125, 0.257568359375, 0.299041748046875, 0.34051513671875, 0.381988525390625, 0.4234619140625, 0.464935302734375, 0.50640869140625, 0.547882080078125, 0.58935546875, 0.630828857421875, 0.67230224609375, 0.713775634765625, 0.7552490234375, 0.796722412109375, 0.83819580078125, 0.879669189453125, 0.921142578125, 0.962615966796875, 1.00408935546875, 1.045562744140625, 1.0870361328125, 1.128509521484375, 1.16998291015625, 1.211456298828125, 1.2529296875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 7.0, 9.0, 13.0, 13.0, 28.0, 40.0, 58.0, 112.0, 194.0, 367.0, 686.0, 1350.0, 2964.0, 6942.0, 17386.0, 51352.0, 259584.0, 570032.0, 92170.0, 26970.0, 10211.0, 4156.0, 1913.0, 907.0, 498.0, 251.0, 139.0, 85.0, 35.0, 32.0, 25.0, 13.0, 10.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.095703125, -2.028564453125, -1.96142578125, -1.894287109375, -1.8271484375, -1.760009765625, -1.69287109375, -1.625732421875, -1.55859375, -1.491455078125, -1.42431640625, -1.357177734375, -1.2900390625, -1.222900390625, -1.15576171875, -1.088623046875, -1.021484375, -0.954345703125, -0.88720703125, -0.820068359375, -0.7529296875, -0.685791015625, -0.61865234375, -0.551513671875, -0.484375, -0.417236328125, -0.35009765625, -0.282958984375, -0.2158203125, -0.148681640625, -0.08154296875, -0.014404296875, 0.052734375, 0.119873046875, 0.18701171875, 0.254150390625, 0.3212890625, 0.388427734375, 0.45556640625, 0.522705078125, 0.58984375, 0.656982421875, 0.72412109375, 0.791259765625, 0.8583984375, 0.925537109375, 0.99267578125, 1.059814453125, 1.126953125, 1.194091796875, 1.26123046875, 1.328369140625, 1.3955078125, 1.462646484375, 1.52978515625, 1.596923828125, 1.6640625, 1.731201171875, 1.79833984375, 1.865478515625, 1.9326171875, 1.999755859375, 2.06689453125, 2.134033203125, 2.201171875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 1.0, 14.0, 5.0, 10.0, 9.0, 20.0, 25.0, 42.0, 38.0, 46.0, 49.0, 47.0, 63.0, 79.0, 66.0, 63.0, 69.0, 58.0, 52.0, 55.0, 37.0, 39.0, 32.0, 21.0, 13.0, 16.0, 12.0, 8.0, 4.0, 2.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.490234375, -2.421234130859375, -2.35223388671875, -2.283233642578125, -2.2142333984375, -2.145233154296875, -2.07623291015625, -2.007232666015625, -1.938232421875, -1.869232177734375, -1.80023193359375, -1.731231689453125, -1.6622314453125, -1.593231201171875, -1.52423095703125, -1.455230712890625, -1.38623046875, -1.317230224609375, -1.24822998046875, -1.179229736328125, -1.1102294921875, -1.041229248046875, -0.97222900390625, -0.903228759765625, -0.834228515625, -0.765228271484375, -0.69622802734375, -0.627227783203125, -0.5582275390625, -0.489227294921875, -0.42022705078125, -0.351226806640625, -0.2822265625, -0.213226318359375, -0.14422607421875, -0.075225830078125, -0.0062255859375, 0.062774658203125, 0.13177490234375, 0.200775146484375, 0.269775390625, 0.338775634765625, 0.40777587890625, 0.476776123046875, 0.5457763671875, 0.614776611328125, 0.68377685546875, 0.752777099609375, 0.82177734375, 0.890777587890625, 0.95977783203125, 1.028778076171875, 1.0977783203125, 1.166778564453125, 1.23577880859375, 1.304779052734375, 1.373779296875, 1.442779541015625, 1.51177978515625, 1.580780029296875, 1.6497802734375, 1.718780517578125, 1.78778076171875, 1.856781005859375, 1.92578125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 6.0, 6.0, 8.0, 11.0, 15.0, 14.0, 27.0, 33.0, 49.0, 66.0, 81.0, 123.0, 172.0, 208.0, 331.0, 411.0, 611.0, 914.0, 1383.0, 2089.0, 3216.0, 4991.0, 8647.0, 15972.0, 33314.0, 77344.0, 199569.0, 412990.0, 159994.0, 63464.0, 27675.0, 13864.0, 7573.0, 4551.0, 2898.0, 1829.0, 1206.0, 854.0, 593.0, 398.0, 276.0, 204.0, 171.0, 101.0, 78.0, 51.0, 48.0, 39.0, 22.0, 21.0, 17.0, 12.0, 12.0, 5.0, 3.0, 1.0, 5.0, 2.0, 0.0, 3.0], "bins": [-0.1500244140625, -0.14524459838867188, -0.14046478271484375, -0.13568496704101562, -0.1309051513671875, -0.12612533569335938, -0.12134552001953125, -0.11656570434570312, -0.111785888671875, -0.10700607299804688, -0.10222625732421875, -0.09744644165039062, -0.0926666259765625, -0.08788681030273438, -0.08310699462890625, -0.07832717895507812, -0.07354736328125, -0.06876754760742188, -0.06398773193359375, -0.059207916259765625, -0.0544281005859375, -0.049648284912109375, -0.04486846923828125, -0.040088653564453125, -0.035308837890625, -0.030529022216796875, -0.02574920654296875, -0.020969390869140625, -0.0161895751953125, -0.011409759521484375, -0.00662994384765625, -0.001850128173828125, 0.0029296875, 0.007709503173828125, 0.01248931884765625, 0.017269134521484375, 0.0220489501953125, 0.026828765869140625, 0.03160858154296875, 0.036388397216796875, 0.041168212890625, 0.045948028564453125, 0.05072784423828125, 0.055507659912109375, 0.0602874755859375, 0.06506729125976562, 0.06984710693359375, 0.07462692260742188, 0.07940673828125, 0.08418655395507812, 0.08896636962890625, 0.09374618530273438, 0.0985260009765625, 0.10330581665039062, 0.10808563232421875, 0.11286544799804688, 0.117645263671875, 0.12242507934570312, 0.12720489501953125, 0.13198471069335938, 0.1367645263671875, 0.14154434204101562, 0.14632415771484375, 0.15110397338867188, 0.1558837890625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 1.0, 4.0, 7.0, 8.0, 6.0, 14.0, 15.0, 20.0, 32.0, 36.0, 53.0, 53.0, 83.0, 134.0, 128.0, 98.0, 71.0, 61.0, 41.0, 36.0, 22.0, 24.0, 12.0, 9.0, 6.0, 6.0, 5.0, 2.0, 1.0, 1.0, 9.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4405460357666016e-05, -4.2885541915893555e-05, -4.1365623474121094e-05, -3.984570503234863e-05, -3.832578659057617e-05, -3.680586814880371e-05, -3.528594970703125e-05, -3.376603126525879e-05, -3.224611282348633e-05, -3.072619438171387e-05, -2.9206275939941406e-05, -2.7686357498168945e-05, -2.6166439056396484e-05, -2.4646520614624023e-05, -2.3126602172851562e-05, -2.16066837310791e-05, -2.008676528930664e-05, -1.856684684753418e-05, -1.704692840576172e-05, -1.5527009963989258e-05, -1.4007091522216797e-05, -1.2487173080444336e-05, -1.0967254638671875e-05, -9.447336196899414e-06, -7.927417755126953e-06, -6.407499313354492e-06, -4.887580871582031e-06, -3.3676624298095703e-06, -1.8477439880371094e-06, -3.2782554626464844e-07, 1.1920928955078125e-06, 2.7120113372802734e-06, 4.231929779052734e-06, 5.751848220825195e-06, 7.271766662597656e-06, 8.791685104370117e-06, 1.0311603546142578e-05, 1.1831521987915039e-05, 1.33514404296875e-05, 1.4871358871459961e-05, 1.6391277313232422e-05, 1.7911195755004883e-05, 1.9431114196777344e-05, 2.0951032638549805e-05, 2.2470951080322266e-05, 2.3990869522094727e-05, 2.5510787963867188e-05, 2.703070640563965e-05, 2.855062484741211e-05, 3.007054328918457e-05, 3.159046173095703e-05, 3.311038017272949e-05, 3.463029861450195e-05, 3.6150217056274414e-05, 3.7670135498046875e-05, 3.9190053939819336e-05, 4.07099723815918e-05, 4.222989082336426e-05, 4.374980926513672e-05, 4.526972770690918e-05, 4.678964614868164e-05, 4.83095645904541e-05, 4.982948303222656e-05, 5.1349401473999023e-05, 5.2869319915771484e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 6.0, 3.0, 9.0, 10.0, 18.0, 21.0, 21.0, 38.0, 58.0, 74.0, 86.0, 162.0, 175.0, 250.0, 348.0, 521.0, 767.0, 1216.0, 1786.0, 2847.0, 4664.0, 7809.0, 13500.0, 26777.0, 60243.0, 163402.0, 432278.0, 194065.0, 69582.0, 30020.0, 15248.0, 8433.0, 4993.0, 3082.0, 1972.0, 1257.0, 858.0, 561.0, 396.0, 251.0, 216.0, 136.0, 113.0, 74.0, 51.0, 35.0, 40.0, 24.0, 22.0, 16.0, 11.0, 6.0, 9.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.2008056640625, -0.19444656372070312, -0.18808746337890625, -0.18172836303710938, -0.1753692626953125, -0.16901016235351562, -0.16265106201171875, -0.15629196166992188, -0.149932861328125, -0.14357376098632812, -0.13721466064453125, -0.13085556030273438, -0.1244964599609375, -0.11813735961914062, -0.11177825927734375, -0.10541915893554688, -0.09906005859375, -0.09270095825195312, -0.08634185791015625, -0.07998275756835938, -0.0736236572265625, -0.06726455688476562, -0.06090545654296875, -0.054546356201171875, -0.048187255859375, -0.041828155517578125, -0.03546905517578125, -0.029109954833984375, -0.0227508544921875, -0.016391754150390625, -0.01003265380859375, -0.003673553466796875, 0.002685546875, 0.009044647216796875, 0.01540374755859375, 0.021762847900390625, 0.0281219482421875, 0.034481048583984375, 0.04084014892578125, 0.047199249267578125, 0.053558349609375, 0.059917449951171875, 0.06627655029296875, 0.07263565063476562, 0.0789947509765625, 0.08535385131835938, 0.09171295166015625, 0.09807205200195312, 0.10443115234375, 0.11079025268554688, 0.11714935302734375, 0.12350845336914062, 0.1298675537109375, 0.13622665405273438, 0.14258575439453125, 0.14894485473632812, 0.155303955078125, 0.16166305541992188, 0.16802215576171875, 0.17438125610351562, 0.1807403564453125, 0.18709945678710938, 0.19345855712890625, 0.19981765747070312, 0.2061767578125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 8.0, 7.0, 4.0, 8.0, 7.0, 5.0, 12.0, 14.0, 16.0, 25.0, 37.0, 42.0, 47.0, 68.0, 100.0, 100.0, 100.0, 82.0, 72.0, 49.0, 39.0, 38.0, 27.0, 16.0, 16.0, 13.0, 11.0, 6.0, 5.0, 2.0, 4.0, 5.0, 0.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.19580078125, -0.19035911560058594, -0.18491744995117188, -0.1794757843017578, -0.17403411865234375, -0.1685924530029297, -0.16315078735351562, -0.15770912170410156, -0.1522674560546875, -0.14682579040527344, -0.14138412475585938, -0.1359424591064453, -0.13050079345703125, -0.1250591278076172, -0.11961746215820312, -0.11417579650878906, -0.108734130859375, -0.10329246520996094, -0.09785079956054688, -0.09240913391113281, -0.08696746826171875, -0.08152580261230469, -0.07608413696289062, -0.07064247131347656, -0.0652008056640625, -0.05975914001464844, -0.054317474365234375, -0.04887580871582031, -0.04343414306640625, -0.03799247741699219, -0.032550811767578125, -0.027109146118164062, -0.02166748046875, -0.016225814819335938, -0.010784149169921875, -0.0053424835205078125, 9.918212890625e-05, 0.0055408477783203125, 0.010982513427734375, 0.016424179077148438, 0.0218658447265625, 0.027307510375976562, 0.032749176025390625, 0.03819084167480469, 0.04363250732421875, 0.04907417297363281, 0.054515838623046875, 0.05995750427246094, 0.065399169921875, 0.07084083557128906, 0.07628250122070312, 0.08172416687011719, 0.08716583251953125, 0.09260749816894531, 0.09804916381835938, 0.10349082946777344, 0.1089324951171875, 0.11437416076660156, 0.11981582641601562, 0.1252574920654297, 0.13069915771484375, 0.1361408233642578, 0.14158248901367188, 0.14702415466308594, 0.1524658203125]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 6.0, 19.0, 17.0, 21.0, 21.0, 46.0, 79.0, 92.0, 123.0, 122.0, 104.0, 100.0, 80.0, 59.0, 35.0, 21.0, 13.0, 11.0, 6.0, 6.0, 5.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1356298923492432, -1.045167088508606, -0.9547043442726135, -0.8642416000366211, -0.7737787961959839, -0.6833159923553467, -0.5928532481193542, -0.5023905038833618, -0.4119277000427246, -0.3214649260044098, -0.23100215196609497, -0.14053937792778015, -0.05007660388946533, 0.04038617014884949, 0.1308489441871643, 0.22131168842315674, 0.31177449226379395, 0.40223726630210876, 0.4927000403404236, 0.583162784576416, 0.6736255884170532, 0.7640883922576904, 0.8545511364936829, 0.9450138807296753, 1.0354766845703125, 1.1259394884109497, 1.216402292251587, 1.3068649768829346, 1.3973277807235718, 1.487790584564209, 1.5782532691955566, 1.6687160730361938, 1.7591791152954102, 1.8496419191360474, 1.9401047229766846, 2.0305674076080322, 2.121030330657959, 2.2114930152893066, 2.3019556999206543, 2.392418384552002, 2.4828813076019287, 2.5733439922332764, 2.663806915283203, 2.754269599914551, 2.8447322845458984, 2.935195207595825, 3.025657892227173, 3.1161208152770996, 3.2065834999084473, 3.297046184539795, 3.3875091075897217, 3.4779717922210693, 3.568434715270996, 3.6588973999023438, 3.7493600845336914, 3.839822769165039, 3.930285692214966, 4.020748615264893, 4.11121129989624, 4.201673984527588, 4.2921366691589355, 4.382599353790283, 4.473062515258789, 4.563525199890137, 4.653987884521484]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 10.0, 8.0, 17.0, 19.0, 21.0, 24.0, 21.0, 19.0, 28.0, 25.0, 40.0, 31.0, 34.0, 41.0, 45.0, 30.0, 41.0, 36.0, 56.0, 34.0, 41.0, 37.0, 46.0, 32.0, 35.0, 28.0, 29.0, 22.0, 16.0, 18.0, 22.0, 11.0, 13.0, 13.0, 13.0, 7.0, 14.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.1453680992126465, -2.0737626552581787, -2.002157211303711, -1.9305517673492432, -1.8589463233947754, -1.7873408794403076, -1.7157355546951294, -1.6441301107406616, -1.5725246667861938, -1.500919222831726, -1.4293137788772583, -1.3577083349227905, -1.2861030101776123, -1.2144975662231445, -1.1428921222686768, -1.071286678314209, -0.9996812343597412, -0.9280757904052734, -0.8564703464508057, -0.7848649621009827, -0.7132595181465149, -0.6416540741920471, -0.5700486898422241, -0.49844324588775635, -0.4268378019332886, -0.3552323579788208, -0.2836269438266754, -0.21202151477336884, -0.14041608572006226, -0.06881064176559448, 0.0027947723865509033, 0.07440018653869629, 0.14600563049316406, 0.21761105954647064, 0.2892164885997772, 0.3608219027519226, 0.4324273467063904, 0.5040327906608582, 0.5756381750106812, 0.6472436189651489, 0.7188490629196167, 0.7904545068740845, 0.8620599508285522, 0.9336653351783752, 1.0052707195281982, 1.076876163482666, 1.1484816074371338, 1.2200870513916016, 1.2916924953460693, 1.363297939300537, 1.4349033832550049, 1.5065088272094727, 1.5781142711639404, 1.6497197151184082, 1.7213250398635864, 1.7929304838180542, 1.864535927772522, 1.9361413717269897, 2.007746696472168, 2.0793521404266357, 2.1509575843811035, 2.2225630283355713, 2.294168472290039, 2.365773916244507, 2.4373793601989746]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 7.0, 9.0, 9.0, 7.0, 15.0, 12.0, 22.0, 31.0, 41.0, 49.0, 74.0, 74.0, 105.0, 127.0, 147.0, 184.0, 193.0, 198.0, 282.0, 297.0, 380.0, 448.0, 575.0, 1043302.0, 863.0, 562.0, 421.0, 331.0, 287.0, 283.0, 208.0, 197.0, 177.0, 126.0, 127.0, 103.0, 67.0, 59.0, 52.0, 32.0, 24.0, 21.0, 23.0, 17.0, 5.0, 11.0, 7.0, 0.0, 6.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.9430489540100098, -2.8507559299468994, -2.75846266746521, -2.6661696434020996, -2.5738766193389893, -2.481583595275879, -2.3892903327941895, -2.296997308731079, -2.2047042846679688, -2.1124112606048584, -2.020117998123169, -1.9278249740600586, -1.8355319499969482, -1.7432388067245483, -1.6509456634521484, -1.558652639389038, -1.4663593769073486, -1.3740662336349487, -1.2817732095718384, -1.1894800662994385, -1.0971870422363281, -1.0048938989639282, -0.9126007556915283, -0.8203076720237732, -0.7280145883560181, -0.6357215046882629, -0.5434284210205078, -0.4511352777481079, -0.3588421940803528, -0.26654911041259766, -0.17425596714019775, -0.08196288347244263, 0.010330438613891602, 0.10262353718280792, 0.19491663575172424, 0.28720974922180176, 0.3795028328895569, 0.471795916557312, 0.5640890598297119, 0.656382143497467, 0.7486752271652222, 0.8409683108329773, 0.9332613945007324, 1.0255545377731323, 1.1178476810455322, 1.2101407051086426, 1.3024338483810425, 1.3947269916534424, 1.4870200157165527, 1.5793131589889526, 1.671606183052063, 1.763899326324463, 1.8561923503875732, 1.9484854936599731, 2.040778636932373, 2.1330716609954834, 2.2253646850585938, 2.317657709121704, 2.4099509716033936, 2.502243995666504, 2.5945370197296143, 2.6868300437927246, 2.779123306274414, 2.8714163303375244, 2.963709592819214]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 8.0, 10.0, 8.0, 8.0, 12.0, 42.0, 106.0, 409.0, 2767.0, 51459292.0, 7420.0, 950.0, 208.0, 59.0, 19.0, 18.0, 8.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.625, -62.58203125, -60.5390625, -58.49609375, -56.453125, -54.41015625, -52.3671875, -50.32421875, -48.28125, -46.23828125, -44.1953125, -42.15234375, -40.109375, -38.06640625, -36.0234375, -33.98046875, -31.9375, -29.89453125, -27.8515625, -25.80859375, -23.765625, -21.72265625, -19.6796875, -17.63671875, -15.59375, -13.55078125, -11.5078125, -9.46484375, -7.421875, -5.37890625, -3.3359375, -1.29296875, 0.75, 2.79296875, 4.8359375, 6.87890625, 8.921875, 10.96484375, 13.0078125, 15.05078125, 17.09375, 19.13671875, 21.1796875, 23.22265625, 25.265625, 27.30859375, 29.3515625, 31.39453125, 33.4375, 35.48046875, 37.5234375, 39.56640625, 41.609375, 43.65234375, 45.6953125, 47.73828125, 49.78125, 51.82421875, 53.8671875, 55.91015625, 57.953125, 59.99609375, 62.0390625, 64.08203125, 66.125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 11.0, 10.0, 17.0, 22.0, 33.0, 52.0, 70.0, 94.0, 160.0, 226.0, 341.0, 518.0, 666.0, 1129.0, 1582.0, 2253.0, 3413.0, 5039.0, 7626.0, 11476.0, 17237.0, 26520.0, 41397.0, 65130.0, 101136.0, 159101.0, 247808.0, 370819.0, 1316428.0, 2809498.0, 382911.0, 257422.0, 166384.0, 105259.0, 67229.0, 42587.0, 27429.0, 17640.0, 11458.0, 7859.0, 5062.0, 3378.0, 2222.0, 1493.0, 1036.0, 760.0, 479.0, 322.0, 245.0, 148.0, 108.0, 74.0, 52.0, 25.0, 29.0, 15.0, 4.0, 3.0, 3.0, 1.0], "bins": [-0.60009765625, -0.5819320678710938, -0.5637664794921875, -0.5456008911132812, -0.527435302734375, -0.5092697143554688, -0.4911041259765625, -0.47293853759765625, -0.45477294921875, -0.43660736083984375, -0.4184417724609375, -0.40027618408203125, -0.382110595703125, -0.36394500732421875, -0.3457794189453125, -0.32761383056640625, -0.3094482421875, -0.29128265380859375, -0.2731170654296875, -0.25495147705078125, -0.236785888671875, -0.21862030029296875, -0.2004547119140625, -0.18228912353515625, -0.16412353515625, -0.14595794677734375, -0.1277923583984375, -0.10962677001953125, -0.091461181640625, -0.07329559326171875, -0.0551300048828125, -0.03696441650390625, -0.018798828125, -0.00063323974609375, 0.0175323486328125, 0.03569793701171875, 0.053863525390625, 0.07202911376953125, 0.0901947021484375, 0.10836029052734375, 0.12652587890625, 0.14469146728515625, 0.1628570556640625, 0.18102264404296875, 0.199188232421875, 0.21735382080078125, 0.2355194091796875, 0.25368499755859375, 0.2718505859375, 0.29001617431640625, 0.3081817626953125, 0.32634735107421875, 0.344512939453125, 0.36267852783203125, 0.3808441162109375, 0.39900970458984375, 0.41717529296875, 0.43534088134765625, 0.4535064697265625, 0.47167205810546875, 0.489837646484375, 0.5080032348632812, 0.5261688232421875, 0.5443344116210938, 0.5625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 5.0, 7.0, 9.0, 10.0, 8.0, 13.0, 20.0, 14.0, 19.0, 30.0, 25.0, 28.0, 31.0, 36.0, 36.0, 37.0, 29.0, 54.0, 70.0, 1056.0, 46.0, 45.0, 46.0, 41.0, 46.0, 39.0, 29.0, 26.0, 23.0, 24.0, 20.0, 13.0, 16.0, 18.0, 11.0, 10.0, 10.0, 9.0, 6.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-16.4375, -15.9444580078125, -15.451416015625, -14.9583740234375, -14.46533203125, -13.9722900390625, -13.479248046875, -12.9862060546875, -12.4931640625, -12.0001220703125, -11.507080078125, -11.0140380859375, -10.52099609375, -10.0279541015625, -9.534912109375, -9.0418701171875, -8.548828125, -8.0557861328125, -7.562744140625, -7.0697021484375, -6.57666015625, -6.0836181640625, -5.590576171875, -5.0975341796875, -4.6044921875, -4.1114501953125, -3.618408203125, -3.1253662109375, -2.63232421875, -2.1392822265625, -1.646240234375, -1.1531982421875, -0.66015625, -0.1671142578125, 0.325927734375, 0.8189697265625, 1.31201171875, 1.8050537109375, 2.298095703125, 2.7911376953125, 3.2841796875, 3.7772216796875, 4.270263671875, 4.7633056640625, 5.25634765625, 5.7493896484375, 6.242431640625, 6.7354736328125, 7.228515625, 7.7215576171875, 8.214599609375, 8.7076416015625, 9.20068359375, 9.6937255859375, 10.186767578125, 10.6798095703125, 11.1728515625, 11.6658935546875, 12.158935546875, 12.6519775390625, 13.14501953125, 13.6380615234375, 14.131103515625, 14.6241455078125, 15.1171875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [4.0, 1.0, 6.0, 9.0, 14.0, 23.0, 28.0, 45.0, 61.0, 112.0, 179.0, 264.0, 376.0, 572.0, 829.0, 1314.0, 1955.0, 3005.0, 4377.0, 6684.0, 10571.0, 15930.0, 24642.0, 38586.0, 61789.0, 97963.0, 155001.0, 244765.0, 359059.0, 598265.0, 3489240.0, 398386.0, 281013.0, 182783.0, 114312.0, 71853.0, 45301.0, 28983.0, 18528.0, 11903.0, 7699.0, 5066.0, 3376.0, 2203.0, 1451.0, 991.0, 651.0, 433.0, 292.0, 205.0, 136.0, 93.0, 49.0, 24.0, 22.0, 11.0, 12.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.486328125, -0.47020721435546875, -0.4540863037109375, -0.43796539306640625, -0.421844482421875, -0.40572357177734375, -0.3896026611328125, -0.37348175048828125, -0.35736083984375, -0.34123992919921875, -0.3251190185546875, -0.30899810791015625, -0.292877197265625, -0.27675628662109375, -0.2606353759765625, -0.24451446533203125, -0.2283935546875, -0.21227264404296875, -0.1961517333984375, -0.18003082275390625, -0.163909912109375, -0.14778900146484375, -0.1316680908203125, -0.11554718017578125, -0.09942626953125, -0.08330535888671875, -0.0671844482421875, -0.05106353759765625, -0.034942626953125, -0.01882171630859375, -0.0027008056640625, 0.01342010498046875, 0.029541015625, 0.04566192626953125, 0.0617828369140625, 0.07790374755859375, 0.094024658203125, 0.11014556884765625, 0.1262664794921875, 0.14238739013671875, 0.15850830078125, 0.17462921142578125, 0.1907501220703125, 0.20687103271484375, 0.222991943359375, 0.23911285400390625, 0.2552337646484375, 0.27135467529296875, 0.2874755859375, 0.30359649658203125, 0.3197174072265625, 0.33583831787109375, 0.351959228515625, 0.36808013916015625, 0.3842010498046875, 0.40032196044921875, 0.41644287109375, 0.43256378173828125, 0.4486846923828125, 0.46480560302734375, 0.480926513671875, 0.49704742431640625, 0.5131683349609375, 0.5292892456054688, 0.54541015625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 3.0, 10.0, 8.0, 5.0, 13.0, 12.0, 13.0, 26.0, 22.0, 17.0, 23.0, 25.0, 37.0, 35.0, 30.0, 34.0, 36.0, 39.0, 40.0, 41.0, 1069.0, 39.0, 32.0, 42.0, 34.0, 30.0, 40.0, 28.0, 29.0, 27.0, 26.0, 23.0, 12.0, 21.0, 19.0, 15.0, 11.0, 8.0, 10.0, 9.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 5.0, 2.0, 0.0, 1.0], "bins": [-11.6015625, -11.2650146484375, -10.928466796875, -10.5919189453125, -10.25537109375, -9.9188232421875, -9.582275390625, -9.2457275390625, -8.9091796875, -8.5726318359375, -8.236083984375, -7.8995361328125, -7.56298828125, -7.2264404296875, -6.889892578125, -6.5533447265625, -6.216796875, -5.8802490234375, -5.543701171875, -5.2071533203125, -4.87060546875, -4.5340576171875, -4.197509765625, -3.8609619140625, -3.5244140625, -3.1878662109375, -2.851318359375, -2.5147705078125, -2.17822265625, -1.8416748046875, -1.505126953125, -1.1685791015625, -0.83203125, -0.4954833984375, -0.158935546875, 0.1776123046875, 0.51416015625, 0.8507080078125, 1.187255859375, 1.5238037109375, 1.8603515625, 2.1968994140625, 2.533447265625, 2.8699951171875, 3.20654296875, 3.5430908203125, 3.879638671875, 4.2161865234375, 4.552734375, 4.8892822265625, 5.225830078125, 5.5623779296875, 5.89892578125, 6.2354736328125, 6.572021484375, 6.9085693359375, 7.2451171875, 7.5816650390625, 7.918212890625, 8.2547607421875, 8.59130859375, 8.9278564453125, 9.264404296875, 9.6009521484375, 9.9375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 4.0, 4.0, 9.0, 8.0, 14.0, 18.0, 34.0, 35.0, 62.0, 100.0, 123.0, 244.0, 380.0, 673.0, 1171.0, 2084.0, 3942.0, 7406.0, 13941.0, 26245.0, 53391.0, 113481.0, 261633.0, 634567.0, 4146668.0, 577949.0, 239758.0, 104692.0, 49762.0, 24612.0, 12952.0, 6926.0, 3630.0, 2112.0, 1155.0, 645.0, 362.0, 236.0, 142.0, 77.0, 35.0, 35.0, 26.0, 20.0, 28.0, 12.0, 12.0, 11.0, 2.0, 4.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.90576171875, -0.8760147094726562, -0.8462677001953125, -0.8165206909179688, -0.786773681640625, -0.7570266723632812, -0.7272796630859375, -0.6975326538085938, -0.66778564453125, -0.6380386352539062, -0.6082916259765625, -0.5785446166992188, -0.548797607421875, -0.5190505981445312, -0.4893035888671875, -0.45955657958984375, -0.4298095703125, -0.40006256103515625, -0.3703155517578125, -0.34056854248046875, -0.310821533203125, -0.28107452392578125, -0.2513275146484375, -0.22158050537109375, -0.19183349609375, -0.16208648681640625, -0.1323394775390625, -0.10259246826171875, -0.072845458984375, -0.04309844970703125, -0.0133514404296875, 0.01639556884765625, 0.046142578125, 0.07588958740234375, 0.1056365966796875, 0.13538360595703125, 0.165130615234375, 0.19487762451171875, 0.2246246337890625, 0.25437164306640625, 0.28411865234375, 0.31386566162109375, 0.3436126708984375, 0.37335968017578125, 0.403106689453125, 0.43285369873046875, 0.4626007080078125, 0.49234771728515625, 0.5220947265625, 0.5518417358398438, 0.5815887451171875, 0.6113357543945312, 0.641082763671875, 0.6708297729492188, 0.7005767822265625, 0.7303237915039062, 0.76007080078125, 0.7898178100585938, 0.8195648193359375, 0.8493118286132812, 0.879058837890625, 0.9088058471679688, 0.9385528564453125, 0.9682998657226562, 0.998046875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 10.0, 8.0, 9.0, 10.0, 8.0, 15.0, 13.0, 8.0, 15.0, 18.0, 22.0, 28.0, 22.0, 24.0, 33.0, 32.0, 30.0, 46.0, 42.0, 44.0, 45.0, 1055.0, 45.0, 47.0, 38.0, 37.0, 28.0, 41.0, 30.0, 28.0, 23.0, 34.0, 18.0, 22.0, 14.0, 15.0, 20.0, 4.0, 10.0, 8.0, 11.0, 2.0, 4.0, 5.0, 1.0, 4.0, 5.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.1015625, -8.8297119140625, -8.557861328125, -8.2860107421875, -8.01416015625, -7.7423095703125, -7.470458984375, -7.1986083984375, -6.9267578125, -6.6549072265625, -6.383056640625, -6.1112060546875, -5.83935546875, -5.5675048828125, -5.295654296875, -5.0238037109375, -4.751953125, -4.4801025390625, -4.208251953125, -3.9364013671875, -3.66455078125, -3.3927001953125, -3.120849609375, -2.8489990234375, -2.5771484375, -2.3052978515625, -2.033447265625, -1.7615966796875, -1.48974609375, -1.2178955078125, -0.946044921875, -0.6741943359375, -0.40234375, -0.1304931640625, 0.141357421875, 0.4132080078125, 0.68505859375, 0.9569091796875, 1.228759765625, 1.5006103515625, 1.7724609375, 2.0443115234375, 2.316162109375, 2.5880126953125, 2.85986328125, 3.1317138671875, 3.403564453125, 3.6754150390625, 3.947265625, 4.2191162109375, 4.490966796875, 4.7628173828125, 5.03466796875, 5.3065185546875, 5.578369140625, 5.8502197265625, 6.1220703125, 6.3939208984375, 6.665771484375, 6.9376220703125, 7.20947265625, 7.4813232421875, 7.753173828125, 8.0250244140625, 8.296875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 17.0, 44.0, 187.0, 397.0, 261.0, 64.0, 19.0, 5.0, 7.0, 1.0, 1.0, 1.0], "bins": [-29.987051010131836, -29.449649810791016, -28.912250518798828, -28.374849319458008, -27.837448120117188, -27.300048828125, -26.76264762878418, -26.22524642944336, -25.687847137451172, -25.15044593811035, -24.613046646118164, -24.075645446777344, -23.538244247436523, -23.000843048095703, -22.463443756103516, -21.926042556762695, -21.388641357421875, -20.851240158081055, -20.313840866088867, -19.776439666748047, -19.239038467407227, -18.701637268066406, -18.16423797607422, -17.6268367767334, -17.089435577392578, -16.552034378051758, -16.01463508605957, -15.47723388671875, -14.93983268737793, -14.402432441711426, -13.865032196044922, -13.327630996704102, -12.790231704711914, -12.25283145904541, -11.71543025970459, -11.178030014038086, -10.640628814697266, -10.103228569030762, -9.565828323364258, -9.028427124023438, -8.491026878356934, -7.9536261558532715, -7.416225433349609, -6.8788251876831055, -6.341424465179443, -5.804023742675781, -5.266623497009277, -4.729222774505615, -4.191822052001953, -3.654421329498291, -3.117020845413208, -2.579620361328125, -2.042219638824463, -1.5048189163208008, -0.9674184322357178, -0.43001794815063477, 0.10738277435302734, 0.6447833776473999, 1.1821839809417725, 1.719584584236145, 2.2569851875305176, 2.7943859100341797, 3.3317863941192627, 3.8691868782043457, 4.406587600708008]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 6.0, 1.0, 8.0, 4.0, 20.0, 16.0, 18.0, 20.0, 16.0, 25.0, 22.0, 34.0, 30.0, 41.0, 33.0, 52.0, 39.0, 37.0, 43.0, 31.0, 49.0, 47.0, 45.0, 43.0, 37.0, 41.0, 31.0, 30.0, 22.0, 19.0, 27.0, 13.0, 18.0, 12.0, 10.0, 14.0, 13.0, 7.0, 10.0, 3.0, 7.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.266138076782227, -15.759446144104004, -15.252753257751465, -14.746061325073242, -14.239368438720703, -13.73267650604248, -13.225984573364258, -12.719291687011719, -12.212599754333496, -11.705907821655273, -11.199214935302734, -10.692523002624512, -10.185831069946289, -9.67913818359375, -9.172446250915527, -8.665754318237305, -8.159061431884766, -7.652369022369385, -7.145676612854004, -6.638984680175781, -6.1322922706604, -5.6255998611450195, -5.118907928466797, -4.612215518951416, -4.105523109436035, -3.5988306999206543, -3.0921385288238525, -2.585446357727051, -2.07875394821167, -1.572061538696289, -1.0653693675994873, -0.5586771965026855, -0.0519866943359375, 0.4547055959701538, 0.9613978862762451, 1.4680901765823364, 1.9747824668884277, 2.4814748764038086, 2.9881670475006104, 3.494859218597412, 4.001551628112793, 4.508244037628174, 5.014936447143555, 5.521628379821777, 6.028320789337158, 6.535013198852539, 7.041705131530762, 7.548397541046143, 8.055089950561523, 8.561781883239746, 9.068474769592285, 9.575166702270508, 10.081859588623047, 10.58855152130127, 11.095243453979492, 11.601936340332031, 12.108628273010254, 12.615320205688477, 13.122013092041016, 13.628705024719238, 14.135396957397461, 14.64208984375, 15.148781776428223, 15.655473709106445, 16.162166595458984]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [5.0, 1.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 7.0, 4.0, 10.0, 14.0, 15.0, 34.0, 41.0, 86.0, 182.0, 356.0, 449.0, 697.0, 1571.0, 3278.0, 7640.0, 20834.0, 65492.0, 2559631.0, 1440040.0, 64110.0, 19390.0, 5932.0, 2255.0, 960.0, 555.0, 286.0, 175.0, 88.0, 52.0, 28.0, 14.0, 12.0, 8.0, 13.0, 2.0, 5.0, 2.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.261474609375, -0.2527427673339844, -0.24401092529296875, -0.23527908325195312, -0.2265472412109375, -0.21781539916992188, -0.20908355712890625, -0.20035171508789062, -0.191619873046875, -0.18288803100585938, -0.17415618896484375, -0.16542434692382812, -0.1566925048828125, -0.14796066284179688, -0.13922882080078125, -0.13049697875976562, -0.12176513671875, -0.11303329467773438, -0.10430145263671875, -0.09556961059570312, -0.0868377685546875, -0.07810592651367188, -0.06937408447265625, -0.060642242431640625, -0.051910400390625, -0.043178558349609375, -0.03444671630859375, -0.025714874267578125, -0.0169830322265625, -0.008251190185546875, 0.00048065185546875, 0.009212493896484375, 0.0179443359375, 0.026676177978515625, 0.03540802001953125, 0.044139862060546875, 0.0528717041015625, 0.061603546142578125, 0.07033538818359375, 0.07906723022460938, 0.087799072265625, 0.09653091430664062, 0.10526275634765625, 0.11399459838867188, 0.1227264404296875, 0.13145828247070312, 0.14019012451171875, 0.14892196655273438, 0.15765380859375, 0.16638565063476562, 0.17511749267578125, 0.18384933471679688, 0.1925811767578125, 0.20131301879882812, 0.21004486083984375, 0.21877670288085938, 0.227508544921875, 0.23624038696289062, 0.24497222900390625, 0.2537040710449219, 0.2624359130859375, 0.2711677551269531, 0.27989959716796875, 0.2886314392089844, 0.29736328125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 6.0, 6.0, 7.0, 8.0, 12.0, 19.0, 18.0, 19.0, 23.0, 23.0, 37.0, 36.0, 62.0, 57.0, 64.0, 86.0, 74.0, 69.0, 67.0, 55.0, 56.0, 38.0, 23.0, 27.0, 31.0, 18.0, 13.0, 15.0, 10.0, 5.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0721435546875, -0.06974124908447266, -0.06733894348144531, -0.06493663787841797, -0.06253433227539062, -0.06013202667236328, -0.05772972106933594, -0.055327415466308594, -0.05292510986328125, -0.050522804260253906, -0.04812049865722656, -0.04571819305419922, -0.043315887451171875, -0.04091358184814453, -0.03851127624511719, -0.036108970642089844, -0.0337066650390625, -0.031304359436035156, -0.028902053833007812, -0.02649974822998047, -0.024097442626953125, -0.02169513702392578, -0.019292831420898438, -0.016890525817871094, -0.01448822021484375, -0.012085914611816406, -0.009683609008789062, -0.007281303405761719, -0.004878997802734375, -0.0024766921997070312, -7.43865966796875e-05, 0.0023279190063476562, 0.004730224609375, 0.007132530212402344, 0.009534835815429688, 0.011937141418457031, 0.014339447021484375, 0.01674175262451172, 0.019144058227539062, 0.021546363830566406, 0.02394866943359375, 0.026350975036621094, 0.028753280639648438, 0.03115558624267578, 0.033557891845703125, 0.03596019744873047, 0.03836250305175781, 0.040764808654785156, 0.0431671142578125, 0.045569419860839844, 0.04797172546386719, 0.05037403106689453, 0.052776336669921875, 0.05517864227294922, 0.05758094787597656, 0.059983253479003906, 0.06238555908203125, 0.0647878646850586, 0.06719017028808594, 0.06959247589111328, 0.07199478149414062, 0.07439708709716797, 0.07679939270019531, 0.07920169830322266, 0.08160400390625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 10.0, 8.0, 10.0, 12.0, 11.0, 15.0, 23.0, 23.0, 24.0, 33.0, 47.0, 65.0, 72.0, 168.0, 594.0, 7950.0, 4064934.0, 117402.0, 2388.0, 226.0, 90.0, 46.0, 36.0, 20.0, 12.0, 13.0, 10.0, 10.0, 6.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3828125, -0.3721199035644531, -0.36142730712890625, -0.3507347106933594, -0.3400421142578125, -0.3293495178222656, -0.31865692138671875, -0.3079643249511719, -0.297271728515625, -0.2865791320800781, -0.27588653564453125, -0.2651939392089844, -0.2545013427734375, -0.24380874633789062, -0.23311614990234375, -0.22242355346679688, -0.21173095703125, -0.20103836059570312, -0.19034576416015625, -0.17965316772460938, -0.1689605712890625, -0.15826797485351562, -0.14757537841796875, -0.13688278198242188, -0.126190185546875, -0.11549758911132812, -0.10480499267578125, -0.09411239624023438, -0.0834197998046875, -0.07272720336914062, -0.06203460693359375, -0.051342010498046875, -0.0406494140625, -0.029956817626953125, -0.01926422119140625, -0.008571624755859375, 0.0021209716796875, 0.012813568115234375, 0.02350616455078125, 0.034198760986328125, 0.044891357421875, 0.055583953857421875, 0.06627655029296875, 0.07696914672851562, 0.0876617431640625, 0.09835433959960938, 0.10904693603515625, 0.11973953247070312, 0.13043212890625, 0.14112472534179688, 0.15181732177734375, 0.16250991821289062, 0.1732025146484375, 0.18389511108398438, 0.19458770751953125, 0.20528030395507812, 0.215972900390625, 0.22666549682617188, 0.23735809326171875, 0.24805068969726562, 0.2587432861328125, 0.2694358825683594, 0.28012847900390625, 0.2908210754394531, 0.301513671875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 2.0, 3.0, 0.0, 2.0, 10.0, 4.0, 7.0, 9.0, 14.0, 22.0, 30.0, 46.0, 69.0, 161.0, 536.0, 1922.0, 737.0, 186.0, 92.0, 53.0, 37.0, 34.0, 22.0, 10.0, 17.0, 8.0, 9.0, 6.0, 12.0, 3.0, 3.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12744140625, -0.12225532531738281, -0.11706924438476562, -0.11188316345214844, -0.10669708251953125, -0.10151100158691406, -0.09632492065429688, -0.09113883972167969, -0.0859527587890625, -0.08076667785644531, -0.07558059692382812, -0.07039451599121094, -0.06520843505859375, -0.06002235412597656, -0.054836273193359375, -0.04965019226074219, -0.044464111328125, -0.03927803039550781, -0.034091949462890625, -0.028905868530273438, -0.02371978759765625, -0.018533706665039062, -0.013347625732421875, -0.008161544799804688, -0.0029754638671875, 0.0022106170654296875, 0.007396697998046875, 0.012582778930664062, 0.01776885986328125, 0.022954940795898438, 0.028141021728515625, 0.03332710266113281, 0.03851318359375, 0.04369926452636719, 0.048885345458984375, 0.05407142639160156, 0.05925750732421875, 0.06444358825683594, 0.06962966918945312, 0.07481575012207031, 0.0800018310546875, 0.08518791198730469, 0.09037399291992188, 0.09556007385253906, 0.10074615478515625, 0.10593223571777344, 0.11111831665039062, 0.11630439758300781, 0.121490478515625, 0.1266765594482422, 0.13186264038085938, 0.13704872131347656, 0.14223480224609375, 0.14742088317871094, 0.15260696411132812, 0.1577930450439453, 0.1629791259765625, 0.1681652069091797, 0.17335128784179688, 0.17853736877441406, 0.18372344970703125, 0.18890953063964844, 0.19409561157226562, 0.1992816925048828, 0.2044677734375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1019.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13934482634067535, 0.09552453458309174, 0.33039391040802, 0.5652632713317871, 0.8001326322555542, 1.0350019931793213, 1.2698713541030884, 1.5047407150268555, 1.7396100759506226, 1.9744794368743896, 2.209348678588867, 2.444218158721924, 2.6790876388549805, 2.913956880569458, 3.1488261222839355, 3.383695602416992, 3.6185648441314697, 3.8534340858459473, 4.088303565979004, 4.3231730461120605, 4.558042526245117, 4.792911529541016, 5.027781009674072, 5.262650489807129, 5.4975199699401855, 5.732389450073242, 5.967258453369141, 6.202127933502197, 6.436997413635254, 6.6718668937683105, 6.906736373901367, 7.141605377197266, 7.376474380493164, 7.611343860626221, 7.846213340759277, 8.081082344055176, 8.31595230102539, 8.550821304321289, 8.785690307617188, 9.020560264587402, 9.2554292678833, 9.4902982711792, 9.725168228149414, 9.960037231445312, 10.194906234741211, 10.429776191711426, 10.664645195007324, 10.899515151977539, 11.134384155273438, 11.369253158569336, 11.60412311553955, 11.83899211883545, 12.073862075805664, 12.308731079101562, 12.543600082397461, 12.778470039367676, 13.013339042663574, 13.248208045959473, 13.483078002929688, 13.717947006225586, 13.952816009521484, 14.1876859664917, 14.422554969787598, 14.657424926757812, 14.892293930053711]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 9.0, 2.0, 6.0, 11.0, 19.0, 21.0, 23.0, 18.0, 35.0, 38.0, 55.0, 54.0, 51.0, 71.0, 60.0, 60.0, 60.0, 56.0, 52.0, 57.0, 39.0, 36.0, 37.0, 23.0, 27.0, 23.0, 14.0, 15.0, 4.0, 4.0, 8.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3183482885360718, -0.30499112606048584, -0.2916339337825775, -0.2782767713069916, -0.26491957902908325, -0.2515624165534973, -0.23820523917675018, -0.22484806180000305, -0.21149089932441711, -0.19813372194766998, -0.18477654457092285, -0.17141938209533691, -0.15806220471858978, -0.14470502734184265, -0.13134784996509552, -0.11799068003892899, -0.10463349521160126, -0.09127631783485413, -0.07791914790868759, -0.06456197053194046, -0.05120479688048363, -0.037847623229026794, -0.024490445852279663, -0.011133275926113129, 0.0022239014506340027, 0.01558107603341341, 0.028938250616192818, 0.0422954261302948, 0.05565259978175163, 0.06900977343320847, 0.0823669508099556, 0.09572412073612213, 0.10908129811286926, 0.1224384754896164, 0.13579565286636353, 0.14915281534194946, 0.1625099927186966, 0.17586717009544373, 0.18922434747219086, 0.202581524848938, 0.21593868732452393, 0.22929586470127106, 0.2426530420780182, 0.2560102045536041, 0.26936739683151245, 0.2827245593070984, 0.2960817217826843, 0.30943891406059265, 0.322796106338501, 0.3361532688140869, 0.34951046109199524, 0.3628676235675812, 0.3762248158454895, 0.38958197832107544, 0.4029391407966614, 0.4162963330745697, 0.42965349555015564, 0.4430106580257416, 0.4563678503036499, 0.46972501277923584, 0.48308220505714417, 0.4964393675327301, 0.5097965598106384, 0.5231537222862244, 0.5365108847618103]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 6.0, 4.0, 8.0, 9.0, 16.0, 23.0, 21.0, 37.0, 50.0, 69.0, 80.0, 130.0, 183.0, 259.0, 425.0, 657.0, 1005.0, 1744.0, 3091.0, 6618.0, 17153.0, 68495.0, 689836.0, 205841.0, 31964.0, 10466.0, 4501.0, 2242.0, 1309.0, 773.0, 470.0, 341.0, 176.0, 134.0, 108.0, 69.0, 51.0, 38.0, 37.0, 25.0, 23.0, 15.0, 12.0, 7.0, 8.0, 4.0, 2.0, 2.0, 5.0, 2.0, 5.0, 6.0, 3.0, 1.0, 3.0], "bins": [-0.49658203125, -0.4809417724609375, -0.465301513671875, -0.4496612548828125, -0.43402099609375, -0.4183807373046875, -0.402740478515625, -0.3871002197265625, -0.3714599609375, -0.3558197021484375, -0.340179443359375, -0.3245391845703125, -0.30889892578125, -0.2932586669921875, -0.277618408203125, -0.2619781494140625, -0.246337890625, -0.2306976318359375, -0.215057373046875, -0.1994171142578125, -0.18377685546875, -0.1681365966796875, -0.152496337890625, -0.1368560791015625, -0.1212158203125, -0.1055755615234375, -0.089935302734375, -0.0742950439453125, -0.05865478515625, -0.0430145263671875, -0.027374267578125, -0.0117340087890625, 0.00390625, 0.0195465087890625, 0.035186767578125, 0.0508270263671875, 0.06646728515625, 0.0821075439453125, 0.097747802734375, 0.1133880615234375, 0.1290283203125, 0.1446685791015625, 0.160308837890625, 0.1759490966796875, 0.19158935546875, 0.2072296142578125, 0.222869873046875, 0.2385101318359375, 0.254150390625, 0.2697906494140625, 0.285430908203125, 0.3010711669921875, 0.31671142578125, 0.3323516845703125, 0.347991943359375, 0.3636322021484375, 0.3792724609375, 0.3949127197265625, 0.410552978515625, 0.4261932373046875, 0.44183349609375, 0.4574737548828125, 0.473114013671875, 0.4887542724609375, 0.50439453125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 7.0, 4.0, 8.0, 7.0, 13.0, 18.0, 13.0, 22.0, 21.0, 23.0, 40.0, 34.0, 54.0, 55.0, 71.0, 64.0, 82.0, 77.0, 50.0, 61.0, 57.0, 43.0, 25.0, 26.0, 28.0, 24.0, 22.0, 13.0, 8.0, 9.0, 6.0, 2.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07073974609375, -0.0684061050415039, -0.06607246398925781, -0.06373882293701172, -0.061405181884765625, -0.05907154083251953, -0.05673789978027344, -0.054404258728027344, -0.05207061767578125, -0.049736976623535156, -0.04740333557128906, -0.04506969451904297, -0.042736053466796875, -0.04040241241455078, -0.03806877136230469, -0.035735130310058594, -0.0334014892578125, -0.031067848205566406, -0.028734207153320312, -0.02640056610107422, -0.024066925048828125, -0.02173328399658203, -0.019399642944335938, -0.017066001892089844, -0.01473236083984375, -0.012398719787597656, -0.010065078735351562, -0.007731437683105469, -0.005397796630859375, -0.0030641555786132812, -0.0007305145263671875, 0.0016031265258789062, 0.003936767578125, 0.006270408630371094, 0.008604049682617188, 0.010937690734863281, 0.013271331787109375, 0.015604972839355469, 0.017938613891601562, 0.020272254943847656, 0.02260589599609375, 0.024939537048339844, 0.027273178100585938, 0.02960681915283203, 0.031940460205078125, 0.03427410125732422, 0.03660774230957031, 0.038941383361816406, 0.0412750244140625, 0.043608665466308594, 0.04594230651855469, 0.04827594757080078, 0.050609588623046875, 0.05294322967529297, 0.05527687072753906, 0.057610511779785156, 0.05994415283203125, 0.062277793884277344, 0.06461143493652344, 0.06694507598876953, 0.06927871704101562, 0.07161235809326172, 0.07394599914550781, 0.0762796401977539, 0.07861328125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 8.0, 8.0, 11.0, 11.0, 13.0, 23.0, 29.0, 32.0, 56.0, 70.0, 137.0, 198.0, 327.0, 526.0, 990.0, 2055.0, 4614.0, 13296.0, 50917.0, 288772.0, 558567.0, 93751.0, 21667.0, 6774.0, 2635.0, 1315.0, 636.0, 408.0, 248.0, 139.0, 97.0, 64.0, 42.0, 31.0, 22.0, 12.0, 18.0, 9.0, 12.0, 7.0, 2.0, 3.0, 0.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19873046875, -0.1919231414794922, -0.18511581420898438, -0.17830848693847656, -0.17150115966796875, -0.16469383239746094, -0.15788650512695312, -0.1510791778564453, -0.1442718505859375, -0.1374645233154297, -0.13065719604492188, -0.12384986877441406, -0.11704254150390625, -0.11023521423339844, -0.10342788696289062, -0.09662055969238281, -0.089813232421875, -0.08300590515136719, -0.07619857788085938, -0.06939125061035156, -0.06258392333984375, -0.05577659606933594, -0.048969268798828125, -0.04216194152832031, -0.0353546142578125, -0.028547286987304688, -0.021739959716796875, -0.014932632446289062, -0.00812530517578125, -0.0013179779052734375, 0.005489349365234375, 0.012296676635742188, 0.01910400390625, 0.025911331176757812, 0.032718658447265625, 0.03952598571777344, 0.04633331298828125, 0.05314064025878906, 0.059947967529296875, 0.06675529479980469, 0.0735626220703125, 0.08036994934082031, 0.08717727661132812, 0.09398460388183594, 0.10079193115234375, 0.10759925842285156, 0.11440658569335938, 0.12121391296386719, 0.128021240234375, 0.1348285675048828, 0.14163589477539062, 0.14844322204589844, 0.15525054931640625, 0.16205787658691406, 0.16886520385742188, 0.1756725311279297, 0.1824798583984375, 0.1892871856689453, 0.19609451293945312, 0.20290184020996094, 0.20970916748046875, 0.21651649475097656, 0.22332382202148438, 0.2301311492919922, 0.2369384765625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 6.0, 12.0, 6.0, 9.0, 9.0, 9.0, 18.0, 13.0, 21.0, 24.0, 42.0, 25.0, 55.0, 46.0, 54.0, 51.0, 47.0, 45.0, 45.0, 45.0, 47.0, 45.0, 39.0, 36.0, 31.0, 26.0, 27.0, 27.0, 29.0, 17.0, 22.0, 12.0, 11.0, 13.0, 11.0, 5.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.139404296875, -0.13364791870117188, -0.12789154052734375, -0.12213516235351562, -0.1163787841796875, -0.11062240600585938, -0.10486602783203125, -0.09910964965820312, -0.093353271484375, -0.08759689331054688, -0.08184051513671875, -0.07608413696289062, -0.0703277587890625, -0.06457138061523438, -0.05881500244140625, -0.053058624267578125, -0.04730224609375, -0.041545867919921875, -0.03578948974609375, -0.030033111572265625, -0.0242767333984375, -0.018520355224609375, -0.01276397705078125, -0.007007598876953125, -0.001251220703125, 0.004505157470703125, 0.01026153564453125, 0.016017913818359375, 0.0217742919921875, 0.027530670166015625, 0.03328704833984375, 0.039043426513671875, 0.0447998046875, 0.050556182861328125, 0.05631256103515625, 0.062068939208984375, 0.0678253173828125, 0.07358169555664062, 0.07933807373046875, 0.08509445190429688, 0.090850830078125, 0.09660720825195312, 0.10236358642578125, 0.10811996459960938, 0.1138763427734375, 0.11963272094726562, 0.12538909912109375, 0.13114547729492188, 0.13690185546875, 0.14265823364257812, 0.14841461181640625, 0.15417098999023438, 0.1599273681640625, 0.16568374633789062, 0.17144012451171875, 0.17719650268554688, 0.182952880859375, 0.18870925903320312, 0.19446563720703125, 0.20022201538085938, 0.2059783935546875, 0.21173477172851562, 0.21749114990234375, 0.22324752807617188, 0.22900390625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 9.0, 9.0, 11.0, 19.0, 20.0, 37.0, 46.0, 91.0, 127.0, 203.0, 355.0, 531.0, 967.0, 2115.0, 5101.0, 14245.0, 57609.0, 624553.0, 286891.0, 37372.0, 10534.0, 3963.0, 1692.0, 840.0, 457.0, 281.0, 146.0, 104.0, 61.0, 46.0, 31.0, 29.0, 16.0, 12.0, 4.0, 2.0, 8.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046875, -0.045250892639160156, -0.04362678527832031, -0.04200267791748047, -0.040378570556640625, -0.03875446319580078, -0.03713035583496094, -0.035506248474121094, -0.03388214111328125, -0.032258033752441406, -0.030633926391601562, -0.02900981903076172, -0.027385711669921875, -0.02576160430908203, -0.024137496948242188, -0.022513389587402344, -0.0208892822265625, -0.019265174865722656, -0.017641067504882812, -0.01601696014404297, -0.014392852783203125, -0.012768745422363281, -0.011144638061523438, -0.009520530700683594, -0.00789642333984375, -0.006272315979003906, -0.0046482086181640625, -0.0030241012573242188, -0.001399993896484375, 0.00022411346435546875, 0.0018482208251953125, 0.0034723281860351562, 0.005096435546875, 0.006720542907714844, 0.008344650268554688, 0.009968757629394531, 0.011592864990234375, 0.013216972351074219, 0.014841079711914062, 0.016465187072753906, 0.01808929443359375, 0.019713401794433594, 0.021337509155273438, 0.02296161651611328, 0.024585723876953125, 0.02620983123779297, 0.027833938598632812, 0.029458045959472656, 0.0310821533203125, 0.032706260681152344, 0.03433036804199219, 0.03595447540283203, 0.037578582763671875, 0.03920269012451172, 0.04082679748535156, 0.042450904846191406, 0.04407501220703125, 0.045699119567871094, 0.04732322692871094, 0.04894733428955078, 0.050571441650390625, 0.05219554901123047, 0.05381965637207031, 0.055443763732910156, 0.05706787109375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 1.0, 3.0, 3.0, 2.0, 6.0, 15.0, 13.0, 36.0, 70.0, 171.0, 267.0, 199.0, 96.0, 41.0, 27.0, 7.0, 12.0, 7.0, 4.0, 1.0, 4.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.919269561767578e-05, -1.8605031073093414e-05, -1.8017366528511047e-05, -1.742970198392868e-05, -1.6842037439346313e-05, -1.6254372894763947e-05, -1.566670835018158e-05, -1.5079043805599213e-05, -1.4491379261016846e-05, -1.3903714716434479e-05, -1.3316050171852112e-05, -1.2728385627269745e-05, -1.2140721082687378e-05, -1.1553056538105011e-05, -1.0965391993522644e-05, -1.0377727448940277e-05, -9.79006290435791e-06, -9.202398359775543e-06, -8.614733815193176e-06, -8.02706927061081e-06, -7.439404726028442e-06, -6.8517401814460754e-06, -6.2640756368637085e-06, -5.6764110922813416e-06, -5.088746547698975e-06, -4.501082003116608e-06, -3.913417458534241e-06, -3.3257529139518738e-06, -2.738088369369507e-06, -2.15042382478714e-06, -1.562759280204773e-06, -9.75094735622406e-07, -3.8743019104003906e-07, 2.0023435354232788e-07, 7.878988981246948e-07, 1.3755634427070618e-06, 1.9632279872894287e-06, 2.5508925318717957e-06, 3.1385570764541626e-06, 3.7262216210365295e-06, 4.3138861656188965e-06, 4.9015507102012634e-06, 5.48921525478363e-06, 6.076879799365997e-06, 6.664544343948364e-06, 7.252208888530731e-06, 7.839873433113098e-06, 8.427537977695465e-06, 9.015202522277832e-06, 9.602867066860199e-06, 1.0190531611442566e-05, 1.0778196156024933e-05, 1.13658607006073e-05, 1.1953525245189667e-05, 1.2541189789772034e-05, 1.31288543343544e-05, 1.3716518878936768e-05, 1.4304183423519135e-05, 1.4891847968101501e-05, 1.547951251268387e-05, 1.6067177057266235e-05, 1.6654841601848602e-05, 1.724250614643097e-05, 1.7830170691013336e-05, 1.8417835235595703e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 7.0, 8.0, 10.0, 14.0, 22.0, 42.0, 47.0, 58.0, 118.0, 174.0, 233.0, 559.0, 943.0, 1879.0, 4043.0, 10183.0, 31133.0, 255433.0, 675821.0, 44652.0, 13200.0, 5067.0, 2326.0, 1144.0, 574.0, 328.0, 184.0, 118.0, 80.0, 50.0, 30.0, 18.0, 18.0, 11.0, 6.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.106689453125, -0.10356330871582031, -0.10043716430664062, -0.09731101989746094, -0.09418487548828125, -0.09105873107910156, -0.08793258666992188, -0.08480644226074219, -0.0816802978515625, -0.07855415344238281, -0.07542800903320312, -0.07230186462402344, -0.06917572021484375, -0.06604957580566406, -0.06292343139648438, -0.05979728698730469, -0.056671142578125, -0.05354499816894531, -0.050418853759765625, -0.04729270935058594, -0.04416656494140625, -0.04104042053222656, -0.037914276123046875, -0.03478813171386719, -0.0316619873046875, -0.028535842895507812, -0.025409698486328125, -0.022283554077148438, -0.01915740966796875, -0.016031265258789062, -0.012905120849609375, -0.009778976440429688, -0.00665283203125, -0.0035266876220703125, -0.000400543212890625, 0.0027256011962890625, 0.00585174560546875, 0.008977890014648438, 0.012104034423828125, 0.015230178833007812, 0.0183563232421875, 0.021482467651367188, 0.024608612060546875, 0.027734756469726562, 0.03086090087890625, 0.03398704528808594, 0.037113189697265625, 0.04023933410644531, 0.043365478515625, 0.04649162292480469, 0.049617767333984375, 0.05274391174316406, 0.05587005615234375, 0.05899620056152344, 0.062122344970703125, 0.06524848937988281, 0.0683746337890625, 0.07150077819824219, 0.07462692260742188, 0.07775306701660156, 0.08087921142578125, 0.08400535583496094, 0.08713150024414062, 0.09025764465332031, 0.0933837890625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 5.0, 0.0, 6.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 8.0, 6.0, 9.0, 23.0, 33.0, 38.0, 83.0, 176.0, 227.0, 148.0, 93.0, 41.0, 30.0, 16.0, 9.0, 11.0, 7.0, 7.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0648193359375, -0.06216239929199219, -0.059505462646484375, -0.05684852600097656, -0.05419158935546875, -0.05153465270996094, -0.048877716064453125, -0.04622077941894531, -0.0435638427734375, -0.04090690612792969, -0.038249969482421875, -0.03559303283691406, -0.03293609619140625, -0.030279159545898438, -0.027622222900390625, -0.024965286254882812, -0.022308349609375, -0.019651412963867188, -0.016994476318359375, -0.014337539672851562, -0.01168060302734375, -0.009023666381835938, -0.006366729736328125, -0.0037097930908203125, -0.0010528564453125, 0.0016040802001953125, 0.004261016845703125, 0.0069179534912109375, 0.00957489013671875, 0.012231826782226562, 0.014888763427734375, 0.017545700073242188, 0.02020263671875, 0.022859573364257812, 0.025516510009765625, 0.028173446655273438, 0.03083038330078125, 0.03348731994628906, 0.036144256591796875, 0.03880119323730469, 0.0414581298828125, 0.04411506652832031, 0.046772003173828125, 0.04942893981933594, 0.05208587646484375, 0.05474281311035156, 0.057399749755859375, 0.06005668640136719, 0.062713623046875, 0.06537055969238281, 0.06802749633789062, 0.07068443298339844, 0.07334136962890625, 0.07599830627441406, 0.07865524291992188, 0.08131217956542969, 0.0839691162109375, 0.08662605285644531, 0.08928298950195312, 0.09193992614746094, 0.09459686279296875, 0.09725379943847656, 0.09991073608398438, 0.10256767272949219, 0.105224609375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 4.0, 15.0, 23.0, 63.0, 115.0, 239.0, 355.0, 136.0, 42.0, 12.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3835206031799316, -2.3141560554504395, -2.2447917461395264, -2.175427198410034, -2.106062889099121, -2.036698341369629, -1.9673339128494263, -1.8979694843292236, -1.828605055809021, -1.7592406272888184, -1.6898761987686157, -1.620511770248413, -1.551147222518921, -1.4817829132080078, -1.4124183654785156, -1.343053936958313, -1.2736895084381104, -1.2043250799179077, -1.134960651397705, -1.0655962228775024, -0.996231734752655, -0.9268673062324524, -0.857502818107605, -0.7881383895874023, -0.7187739610671997, -0.6494095325469971, -0.5800451040267944, -0.510680615901947, -0.4413161873817444, -0.37195175886154175, -0.3025873005390167, -0.2332228422164917, -0.16385817527770996, -0.09449373185634613, -0.0251292884349823, 0.04423515498638153, 0.11359959840774536, 0.182964026927948, 0.252328485250473, 0.32169294357299805, 0.3910573720932007, 0.4604218006134033, 0.529786229133606, 0.5991507172584534, 0.668515145778656, 0.7378795742988586, 0.807244062423706, 0.8766084909439087, 0.9459729194641113, 1.015337347984314, 1.0847017765045166, 1.1540662050247192, 1.2234306335449219, 1.292795181274414, 1.3621596097946167, 1.4315240383148193, 1.500888466835022, 1.5702528953552246, 1.6396173238754272, 1.7089817523956299, 1.778346300125122, 1.8477106094360352, 1.9170751571655273, 1.98643958568573, 2.0558040142059326]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 6.0, 1.0, 3.0, 11.0, 5.0, 13.0, 9.0, 14.0, 16.0, 18.0, 18.0, 22.0, 21.0, 22.0, 31.0, 22.0, 34.0, 36.0, 41.0, 25.0, 41.0, 35.0, 35.0, 32.0, 41.0, 37.0, 32.0, 32.0, 36.0, 35.0, 35.0, 35.0, 24.0, 20.0, 20.0, 24.0, 22.0, 16.0, 17.0, 11.0, 10.0, 9.0, 5.0, 11.0, 8.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.7971649169921875, -0.7715793251991272, -0.7459936738014221, -0.7204080820083618, -0.6948224306106567, -0.6692368388175964, -0.6436512470245361, -0.618065595626831, -0.592479944229126, -0.5668943524360657, -0.5413087010383606, -0.5157231092453003, -0.4901374578475952, -0.4645518660545349, -0.4389662444591522, -0.41338062286376953, -0.38779503107070923, -0.36220940947532654, -0.33662378787994385, -0.31103819608688354, -0.28545254468917847, -0.25986695289611816, -0.23428133130073547, -0.20869570970535278, -0.1831100881099701, -0.1575244665145874, -0.1319388449192047, -0.10635323822498322, -0.08076761662960052, -0.055181995034217834, -0.029596388339996338, -0.0040107667446136475, 0.02157491445541382, 0.04716053232550621, 0.0727461501955986, 0.0983317643404007, 0.12391738593578339, 0.14950300753116608, 0.17508861422538757, 0.20067423582077026, 0.22625985741615295, 0.25184547901153564, 0.27743110060691833, 0.303016722202301, 0.32860231399536133, 0.3541879653930664, 0.3797735571861267, 0.4053591787815094, 0.4309448003768921, 0.4565304219722748, 0.48211604356765747, 0.5077016353607178, 0.5332872867584229, 0.5588728785514832, 0.5844584703445435, 0.6100441217422485, 0.6356297731399536, 0.6612153649330139, 0.686801016330719, 0.7123866081237793, 0.7379722595214844, 0.7635578513145447, 0.789143443107605, 0.8147290945053101, 0.8403146862983704]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 1.0, 7.0, 5.0, 9.0, 16.0, 26.0, 32.0, 36.0, 61.0, 87.0, 136.0, 225.0, 345.0, 654.0, 1388.0, 3542.0, 10050.0, 37449.0, 391089.0, 3645533.0, 78673.0, 16489.0, 4845.0, 1726.0, 729.0, 410.0, 226.0, 134.0, 106.0, 82.0, 54.0, 33.0, 19.0, 16.0, 9.0, 5.0, 7.0, 3.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.430908203125, -0.4170989990234375, -0.403289794921875, -0.3894805908203125, -0.37567138671875, -0.3618621826171875, -0.348052978515625, -0.3342437744140625, -0.3204345703125, -0.3066253662109375, -0.292816162109375, -0.2790069580078125, -0.26519775390625, -0.2513885498046875, -0.237579345703125, -0.2237701416015625, -0.2099609375, -0.1961517333984375, -0.182342529296875, -0.1685333251953125, -0.15472412109375, -0.1409149169921875, -0.127105712890625, -0.1132965087890625, -0.0994873046875, -0.0856781005859375, -0.071868896484375, -0.0580596923828125, -0.04425048828125, -0.0304412841796875, -0.016632080078125, -0.0028228759765625, 0.010986328125, 0.0247955322265625, 0.038604736328125, 0.0524139404296875, 0.06622314453125, 0.0800323486328125, 0.093841552734375, 0.1076507568359375, 0.1214599609375, 0.1352691650390625, 0.149078369140625, 0.1628875732421875, 0.17669677734375, 0.1905059814453125, 0.204315185546875, 0.2181243896484375, 0.23193359375, 0.2457427978515625, 0.259552001953125, 0.2733612060546875, 0.28717041015625, 0.3009796142578125, 0.314788818359375, 0.3285980224609375, 0.3424072265625, 0.3562164306640625, 0.370025634765625, 0.3838348388671875, 0.39764404296875, 0.4114532470703125, 0.425262451171875, 0.4390716552734375, 0.452880859375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 10.0, 12.0, 7.0, 10.0, 20.0, 21.0, 18.0, 19.0, 26.0, 40.0, 59.0, 59.0, 75.0, 76.0, 69.0, 88.0, 76.0, 45.0, 55.0, 47.0, 36.0, 30.0, 20.0, 18.0, 25.0, 12.0, 9.0, 5.0, 3.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07464599609375, -0.07220458984375, -0.06976318359375, -0.06732177734375, -0.06488037109375, -0.06243896484375, -0.05999755859375, -0.05755615234375, -0.05511474609375, -0.05267333984375, -0.05023193359375, -0.04779052734375, -0.04534912109375, -0.04290771484375, -0.04046630859375, -0.03802490234375, -0.03558349609375, -0.03314208984375, -0.03070068359375, -0.02825927734375, -0.02581787109375, -0.02337646484375, -0.02093505859375, -0.01849365234375, -0.01605224609375, -0.01361083984375, -0.01116943359375, -0.00872802734375, -0.00628662109375, -0.00384521484375, -0.00140380859375, 0.00103759765625, 0.00347900390625, 0.00592041015625, 0.00836181640625, 0.01080322265625, 0.01324462890625, 0.01568603515625, 0.01812744140625, 0.02056884765625, 0.02301025390625, 0.02545166015625, 0.02789306640625, 0.03033447265625, 0.03277587890625, 0.03521728515625, 0.03765869140625, 0.04010009765625, 0.04254150390625, 0.04498291015625, 0.04742431640625, 0.04986572265625, 0.05230712890625, 0.05474853515625, 0.05718994140625, 0.05963134765625, 0.06207275390625, 0.06451416015625, 0.06695556640625, 0.06939697265625, 0.07183837890625, 0.07427978515625, 0.07672119140625, 0.07916259765625, 0.08160400390625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 5.0, 1.0, 5.0, 2.0, 4.0, 9.0, 12.0, 10.0, 16.0, 26.0, 42.0, 57.0, 102.0, 215.0, 463.0, 1418.0, 7006.0, 61583.0, 3518417.0, 573520.0, 26060.0, 3808.0, 877.0, 317.0, 139.0, 81.0, 38.0, 27.0, 15.0, 4.0, 6.0, 5.0, 4.0, 2.0, 1.0], "bins": [-0.60107421875, -0.5885066986083984, -0.5759391784667969, -0.5633716583251953, -0.5508041381835938, -0.5382366180419922, -0.5256690979003906, -0.5131015777587891, -0.5005340576171875, -0.48796653747558594, -0.4753990173339844, -0.4628314971923828, -0.45026397705078125, -0.4376964569091797, -0.4251289367675781, -0.41256141662597656, -0.399993896484375, -0.38742637634277344, -0.3748588562011719, -0.3622913360595703, -0.34972381591796875, -0.3371562957763672, -0.3245887756347656, -0.31202125549316406, -0.2994537353515625, -0.28688621520996094, -0.2743186950683594, -0.2617511749267578, -0.24918365478515625, -0.2366161346435547, -0.22404861450195312, -0.21148109436035156, -0.19891357421875, -0.18634605407714844, -0.17377853393554688, -0.1612110137939453, -0.14864349365234375, -0.1360759735107422, -0.12350845336914062, -0.11094093322753906, -0.0983734130859375, -0.08580589294433594, -0.07323837280273438, -0.06067085266113281, -0.04810333251953125, -0.03553581237792969, -0.022968292236328125, -0.010400772094726562, 0.002166748046875, 0.014734268188476562, 0.027301788330078125, 0.03986930847167969, 0.05243682861328125, 0.06500434875488281, 0.07757186889648438, 0.09013938903808594, 0.1027069091796875, 0.11527442932128906, 0.12784194946289062, 0.1404094696044922, 0.15297698974609375, 0.1655445098876953, 0.17811203002929688, 0.19067955017089844, 0.2032470703125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 7.0, 6.0, 11.0, 16.0, 23.0, 25.0, 37.0, 43.0, 75.0, 80.0, 147.0, 282.0, 643.0, 1085.0, 620.0, 315.0, 178.0, 144.0, 88.0, 62.0, 37.0, 38.0, 35.0, 19.0, 12.0, 10.0, 10.0, 7.0, 8.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08905029296875, -0.08569622039794922, -0.08234214782714844, -0.07898807525634766, -0.07563400268554688, -0.0722799301147461, -0.06892585754394531, -0.06557178497314453, -0.06221771240234375, -0.05886363983154297, -0.05550956726074219, -0.052155494689941406, -0.048801422119140625, -0.045447349548339844, -0.04209327697753906, -0.03873920440673828, -0.0353851318359375, -0.03203105926513672, -0.028676986694335938, -0.025322914123535156, -0.021968841552734375, -0.018614768981933594, -0.015260696411132812, -0.011906623840332031, -0.00855255126953125, -0.005198478698730469, -0.0018444061279296875, 0.0015096664428710938, 0.004863739013671875, 0.008217811584472656, 0.011571884155273438, 0.014925956726074219, 0.018280029296875, 0.02163410186767578, 0.024988174438476562, 0.028342247009277344, 0.031696319580078125, 0.035050392150878906, 0.03840446472167969, 0.04175853729248047, 0.04511260986328125, 0.04846668243408203, 0.05182075500488281, 0.055174827575683594, 0.058528900146484375, 0.061882972717285156, 0.06523704528808594, 0.06859111785888672, 0.0719451904296875, 0.07529926300048828, 0.07865333557128906, 0.08200740814208984, 0.08536148071289062, 0.0887155532836914, 0.09206962585449219, 0.09542369842529297, 0.09877777099609375, 0.10213184356689453, 0.10548591613769531, 0.1088399887084961, 0.11219406127929688, 0.11554813385009766, 0.11890220642089844, 0.12225627899169922, 0.1256103515625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [48.0, 627.0, 315.0, 22.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13389800488948822, -0.0545707568526268, 0.02475649118423462, 0.10408373177051544, 0.18341098725795746, 0.2627382278442383, 0.3420654535293579, 0.4213927388191223, 0.5007199645042419, 0.5800471901893616, 0.659374475479126, 0.7387017011642456, 0.8180289268493652, 0.8973562121391296, 0.9766834378242493, 1.0560107231140137, 1.1353379487991333, 1.214665174484253, 1.2939924001693726, 1.3733196258544922, 1.4526469707489014, 1.531974196434021, 1.6113014221191406, 1.6906287670135498, 1.7699559926986694, 1.849283218383789, 1.9286104440689087, 2.0079376697540283, 2.0872650146484375, 2.1665921211242676, 2.2459194660186768, 2.325246810913086, 2.404574155807495, 2.4839015007019043, 2.5632286071777344, 2.6425559520721436, 2.7218830585479736, 2.801210403442383, 2.880537509918213, 2.959864854812622, 3.0391921997070312, 3.1185195446014404, 3.1978466510772705, 3.2771739959716797, 3.3565011024475098, 3.435828447341919, 3.515155792236328, 3.594482898712158, 3.6738100051879883, 3.7531373500823975, 3.8324644565582275, 3.9117918014526367, 3.991118907928467, 4.070446014404297, 4.149773597717285, 4.229100704193115, 4.3084282875061035, 4.387755393981934, 4.467082977294922, 4.546410083770752, 4.625737190246582, 4.70506477355957, 4.7843918800354, 4.8637189865112305, 4.9430460929870605]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 6.0, 5.0, 7.0, 6.0, 8.0, 11.0, 17.0, 12.0, 16.0, 19.0, 23.0, 22.0, 31.0, 35.0, 53.0, 37.0, 46.0, 37.0, 50.0, 59.0, 63.0, 50.0, 59.0, 48.0, 44.0, 47.0, 33.0, 32.0, 20.0, 21.0, 17.0, 14.0, 15.0, 9.0, 8.0, 7.0, 7.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.3771207928657532, -0.36677661538124084, -0.3564324676990509, -0.3460882902145386, -0.33574414253234863, -0.3253999650478363, -0.31505581736564636, -0.30471163988113403, -0.2943674921989441, -0.28402331471443176, -0.2736791670322418, -0.2633349895477295, -0.25299084186553955, -0.24264666438102722, -0.2323025017976761, -0.22195833921432495, -0.21161416172981262, -0.2012699991464615, -0.19092583656311035, -0.18058167397975922, -0.17023751139640808, -0.15989333391189575, -0.14954917132854462, -0.13920500874519348, -0.12886084616184235, -0.11851668357849121, -0.10817252099514008, -0.09782835096120834, -0.08748418837785721, -0.07714002579450607, -0.06679585576057434, -0.056451693177223206, -0.04610753059387207, -0.035763368010520935, -0.0254192017018795, -0.015075037255883217, -0.004730872809886932, 0.005613289773464203, 0.015957456082105637, 0.02630162239074707, 0.036645784974098206, 0.04698994755744934, 0.057334113866090775, 0.06767828017473221, 0.07802244275808334, 0.08836660534143448, 0.09871077537536621, 0.10905493795871735, 0.11939910054206848, 0.12974326312541962, 0.14008742570877075, 0.1504315882921219, 0.16077575087547302, 0.17111992835998535, 0.1814640909433365, 0.19180825352668762, 0.20215241611003876, 0.2124965786933899, 0.22284074127674103, 0.23318490386009216, 0.2435290813446045, 0.25387322902679443, 0.26421740651130676, 0.2745615839958191, 0.28490573167800903]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 8.0, 7.0, 15.0, 9.0, 19.0, 34.0, 58.0, 73.0, 117.0, 185.0, 441.0, 688.0, 1339.0, 2676.0, 5749.0, 13908.0, 36959.0, 118728.0, 440241.0, 301646.0, 79718.0, 26460.0, 10415.0, 4409.0, 2137.0, 1074.0, 607.0, 348.0, 189.0, 119.0, 64.0, 38.0, 29.0, 11.0, 14.0, 9.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2301025390625, -0.2221240997314453, -0.21414566040039062, -0.20616722106933594, -0.19818878173828125, -0.19021034240722656, -0.18223190307617188, -0.1742534637451172, -0.1662750244140625, -0.1582965850830078, -0.15031814575195312, -0.14233970642089844, -0.13436126708984375, -0.12638282775878906, -0.11840438842773438, -0.11042594909667969, -0.102447509765625, -0.09446907043457031, -0.08649063110351562, -0.07851219177246094, -0.07053375244140625, -0.06255531311035156, -0.054576873779296875, -0.04659843444824219, -0.0386199951171875, -0.030641555786132812, -0.022663116455078125, -0.014684677124023438, -0.00670623779296875, 0.0012722015380859375, 0.009250640869140625, 0.017229080200195312, 0.02520751953125, 0.03318595886230469, 0.041164398193359375, 0.04914283752441406, 0.05712127685546875, 0.06509971618652344, 0.07307815551757812, 0.08105659484863281, 0.0890350341796875, 0.09701347351074219, 0.10499191284179688, 0.11297035217285156, 0.12094879150390625, 0.12892723083496094, 0.13690567016601562, 0.1448841094970703, 0.152862548828125, 0.1608409881591797, 0.16881942749023438, 0.17679786682128906, 0.18477630615234375, 0.19275474548339844, 0.20073318481445312, 0.2087116241455078, 0.2166900634765625, 0.2246685028076172, 0.23264694213867188, 0.24062538146972656, 0.24860382080078125, 0.25658226013183594, 0.2645606994628906, 0.2725391387939453, 0.280517578125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 9.0, 10.0, 9.0, 13.0, 26.0, 24.0, 29.0, 24.0, 41.0, 55.0, 61.0, 72.0, 80.0, 85.0, 100.0, 57.0, 60.0, 45.0, 48.0, 26.0, 29.0, 19.0, 22.0, 18.0, 11.0, 5.0, 9.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0687255859375, -0.0662984848022461, -0.06387138366699219, -0.06144428253173828, -0.059017181396484375, -0.05659008026123047, -0.05416297912597656, -0.051735877990722656, -0.04930877685546875, -0.046881675720214844, -0.04445457458496094, -0.04202747344970703, -0.039600372314453125, -0.03717327117919922, -0.03474617004394531, -0.032319068908691406, -0.0298919677734375, -0.027464866638183594, -0.025037765502929688, -0.02261066436767578, -0.020183563232421875, -0.01775646209716797, -0.015329360961914062, -0.012902259826660156, -0.01047515869140625, -0.008048057556152344, -0.0056209564208984375, -0.0031938552856445312, -0.000766754150390625, 0.0016603469848632812, 0.0040874481201171875, 0.006514549255371094, 0.008941650390625, 0.011368751525878906, 0.013795852661132812, 0.01622295379638672, 0.018650054931640625, 0.02107715606689453, 0.023504257202148438, 0.025931358337402344, 0.02835845947265625, 0.030785560607910156, 0.03321266174316406, 0.03563976287841797, 0.038066864013671875, 0.04049396514892578, 0.04292106628417969, 0.045348167419433594, 0.0477752685546875, 0.050202369689941406, 0.05262947082519531, 0.05505657196044922, 0.057483673095703125, 0.05991077423095703, 0.06233787536621094, 0.06476497650146484, 0.06719207763671875, 0.06961917877197266, 0.07204627990722656, 0.07447338104248047, 0.07690048217773438, 0.07932758331298828, 0.08175468444824219, 0.0841817855834961, 0.08660888671875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 4.0, 5.0, 6.0, 6.0, 10.0, 8.0, 20.0, 26.0, 23.0, 26.0, 43.0, 44.0, 43.0, 75.0, 123.0, 232.0, 581.0, 2476.0, 35663.0, 857170.0, 144339.0, 5886.0, 890.0, 287.0, 170.0, 111.0, 68.0, 59.0, 47.0, 18.0, 10.0, 21.0, 16.0, 13.0, 7.0, 4.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.68505859375, -0.6647262573242188, -0.6443939208984375, -0.6240615844726562, -0.603729248046875, -0.5833969116210938, -0.5630645751953125, -0.5427322387695312, -0.52239990234375, -0.5020675659179688, -0.4817352294921875, -0.46140289306640625, -0.441070556640625, -0.42073822021484375, -0.4004058837890625, -0.38007354736328125, -0.3597412109375, -0.33940887451171875, -0.3190765380859375, -0.29874420166015625, -0.278411865234375, -0.25807952880859375, -0.2377471923828125, -0.21741485595703125, -0.19708251953125, -0.17675018310546875, -0.1564178466796875, -0.13608551025390625, -0.115753173828125, -0.09542083740234375, -0.0750885009765625, -0.05475616455078125, -0.034423828125, -0.01409149169921875, 0.0062408447265625, 0.02657318115234375, 0.046905517578125, 0.06723785400390625, 0.0875701904296875, 0.10790252685546875, 0.12823486328125, 0.14856719970703125, 0.1688995361328125, 0.18923187255859375, 0.209564208984375, 0.22989654541015625, 0.2502288818359375, 0.27056121826171875, 0.2908935546875, 0.31122589111328125, 0.3315582275390625, 0.35189056396484375, 0.372222900390625, 0.39255523681640625, 0.4128875732421875, 0.43321990966796875, 0.45355224609375, 0.47388458251953125, 0.4942169189453125, 0.5145492553710938, 0.534881591796875, 0.5552139282226562, 0.5755462646484375, 0.5958786010742188, 0.6162109375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 5.0, 4.0, 4.0, 2.0, 6.0, 13.0, 7.0, 14.0, 12.0, 19.0, 15.0, 16.0, 25.0, 28.0, 26.0, 27.0, 23.0, 23.0, 39.0, 37.0, 31.0, 39.0, 35.0, 47.0, 33.0, 32.0, 40.0, 44.0, 38.0, 43.0, 35.0, 48.0, 36.0, 29.0, 29.0, 13.0, 16.0, 17.0, 10.0, 10.0, 10.0, 10.0, 4.0, 3.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1280517578125, -0.12412643432617188, -0.12020111083984375, -0.11627578735351562, -0.1123504638671875, -0.10842514038085938, -0.10449981689453125, -0.10057449340820312, -0.096649169921875, -0.09272384643554688, -0.08879852294921875, -0.08487319946289062, -0.0809478759765625, -0.07702255249023438, -0.07309722900390625, -0.06917190551757812, -0.06524658203125, -0.061321258544921875, -0.05739593505859375, -0.053470611572265625, -0.0495452880859375, -0.045619964599609375, -0.04169464111328125, -0.037769317626953125, -0.033843994140625, -0.029918670654296875, -0.02599334716796875, -0.022068023681640625, -0.0181427001953125, -0.014217376708984375, -0.01029205322265625, -0.006366729736328125, -0.00244140625, 0.001483917236328125, 0.00540924072265625, 0.009334564208984375, 0.0132598876953125, 0.017185211181640625, 0.02111053466796875, 0.025035858154296875, 0.028961181640625, 0.032886505126953125, 0.03681182861328125, 0.040737152099609375, 0.0446624755859375, 0.048587799072265625, 0.05251312255859375, 0.056438446044921875, 0.06036376953125, 0.06428909301757812, 0.06821441650390625, 0.07213973999023438, 0.0760650634765625, 0.07999038696289062, 0.08391571044921875, 0.08784103393554688, 0.091766357421875, 0.09569168090820312, 0.09961700439453125, 0.10354232788085938, 0.1074676513671875, 0.11139297485351562, 0.11531829833984375, 0.11924362182617188, 0.1231689453125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 4.0, 1.0, 7.0, 8.0, 21.0, 16.0, 23.0, 39.0, 43.0, 49.0, 110.0, 182.0, 334.0, 659.0, 1619.0, 4444.0, 18102.0, 337829.0, 655269.0, 21420.0, 4950.0, 1783.0, 753.0, 346.0, 184.0, 104.0, 74.0, 49.0, 37.0, 27.0, 17.0, 14.0, 5.0, 15.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.348388671875, -0.335968017578125, -0.32354736328125, -0.311126708984375, -0.2987060546875, -0.286285400390625, -0.27386474609375, -0.261444091796875, -0.2490234375, -0.236602783203125, -0.22418212890625, -0.211761474609375, -0.1993408203125, -0.186920166015625, -0.17449951171875, -0.162078857421875, -0.149658203125, -0.137237548828125, -0.12481689453125, -0.112396240234375, -0.0999755859375, -0.087554931640625, -0.07513427734375, -0.062713623046875, -0.05029296875, -0.037872314453125, -0.02545166015625, -0.013031005859375, -0.0006103515625, 0.011810302734375, 0.02423095703125, 0.036651611328125, 0.049072265625, 0.061492919921875, 0.07391357421875, 0.086334228515625, 0.0987548828125, 0.111175537109375, 0.12359619140625, 0.136016845703125, 0.1484375, 0.160858154296875, 0.17327880859375, 0.185699462890625, 0.1981201171875, 0.210540771484375, 0.22296142578125, 0.235382080078125, 0.247802734375, 0.260223388671875, 0.27264404296875, 0.285064697265625, 0.2974853515625, 0.309906005859375, 0.32232666015625, 0.334747314453125, 0.34716796875, 0.359588623046875, 0.37200927734375, 0.384429931640625, 0.3968505859375, 0.409271240234375, 0.42169189453125, 0.434112548828125, 0.446533203125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 0.0, 7.0, 15.0, 14.0, 46.0, 70.0, 213.0, 358.0, 137.0, 62.0, 34.0, 15.0, 15.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9485435485839844e-05, -5.769822746515274e-05, -5.591101944446564e-05, -5.4123811423778534e-05, -5.233660340309143e-05, -5.054939538240433e-05, -4.8762187361717224e-05, -4.697497934103012e-05, -4.518777132034302e-05, -4.3400563299655914e-05, -4.161335527896881e-05, -3.982614725828171e-05, -3.8038939237594604e-05, -3.62517312169075e-05, -3.44645231962204e-05, -3.2677315175533295e-05, -3.089010715484619e-05, -2.9102899134159088e-05, -2.7315691113471985e-05, -2.552848309278488e-05, -2.374127507209778e-05, -2.1954067051410675e-05, -2.0166859030723572e-05, -1.837965101003647e-05, -1.6592442989349365e-05, -1.4805234968662262e-05, -1.3018026947975159e-05, -1.1230818927288055e-05, -9.443610906600952e-06, -7.656402885913849e-06, -5.869194865226746e-06, -4.081986844539642e-06, -2.294778823852539e-06, -5.075708031654358e-07, 1.2796372175216675e-06, 3.0668452382087708e-06, 4.854053258895874e-06, 6.641261279582977e-06, 8.42846930027008e-06, 1.0215677320957184e-05, 1.2002885341644287e-05, 1.379009336233139e-05, 1.5577301383018494e-05, 1.7364509403705597e-05, 1.91517174243927e-05, 2.0938925445079803e-05, 2.2726133465766907e-05, 2.451334148645401e-05, 2.6300549507141113e-05, 2.8087757527828217e-05, 2.987496554851532e-05, 3.166217356920242e-05, 3.3449381589889526e-05, 3.523658961057663e-05, 3.702379763126373e-05, 3.8811005651950836e-05, 4.059821367263794e-05, 4.238542169332504e-05, 4.4172629714012146e-05, 4.595983773469925e-05, 4.774704575538635e-05, 4.9534253776073456e-05, 5.132146179676056e-05, 5.310866981744766e-05, 5.4895877838134766e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 0.0, 4.0, 1.0, 6.0, 5.0, 13.0, 9.0, 28.0, 40.0, 73.0, 271.0, 1436.0, 16171.0, 1006004.0, 22282.0, 1720.0, 294.0, 76.0, 37.0, 23.0, 6.0, 13.0, 13.0, 8.0, 4.0, 1.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.73681640625, -0.7160873413085938, -0.6953582763671875, -0.6746292114257812, -0.653900146484375, -0.6331710815429688, -0.6124420166015625, -0.5917129516601562, -0.57098388671875, -0.5502548217773438, -0.5295257568359375, -0.5087966918945312, -0.488067626953125, -0.46733856201171875, -0.4466094970703125, -0.42588043212890625, -0.4051513671875, -0.38442230224609375, -0.3636932373046875, -0.34296417236328125, -0.322235107421875, -0.30150604248046875, -0.2807769775390625, -0.26004791259765625, -0.23931884765625, -0.21858978271484375, -0.1978607177734375, -0.17713165283203125, -0.156402587890625, -0.13567352294921875, -0.1149444580078125, -0.09421539306640625, -0.073486328125, -0.05275726318359375, -0.0320281982421875, -0.01129913330078125, 0.009429931640625, 0.03015899658203125, 0.0508880615234375, 0.07161712646484375, 0.09234619140625, 0.11307525634765625, 0.1338043212890625, 0.15453338623046875, 0.175262451171875, 0.19599151611328125, 0.2167205810546875, 0.23744964599609375, 0.2581787109375, 0.27890777587890625, 0.2996368408203125, 0.32036590576171875, 0.341094970703125, 0.36182403564453125, 0.3825531005859375, 0.40328216552734375, 0.42401123046875, 0.44474029541015625, 0.4654693603515625, 0.48619842529296875, 0.506927490234375, 0.5276565551757812, 0.5483856201171875, 0.5691146850585938, 0.58984375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 7.0, 5.0, 12.0, 16.0, 31.0, 34.0, 53.0, 87.0, 228.0, 249.0, 103.0, 32.0, 45.0, 22.0, 17.0, 12.0, 10.0, 5.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11859130859375, -0.11450862884521484, -0.11042594909667969, -0.10634326934814453, -0.10226058959960938, -0.09817790985107422, -0.09409523010253906, -0.0900125503540039, -0.08592987060546875, -0.0818471908569336, -0.07776451110839844, -0.07368183135986328, -0.06959915161132812, -0.06551647186279297, -0.06143379211425781, -0.057351112365722656, -0.0532684326171875, -0.049185752868652344, -0.04510307312011719, -0.04102039337158203, -0.036937713623046875, -0.03285503387451172, -0.028772354125976562, -0.024689674377441406, -0.02060699462890625, -0.016524314880371094, -0.012441635131835938, -0.008358955383300781, -0.004276275634765625, -0.00019359588623046875, 0.0038890838623046875, 0.007971763610839844, 0.012054443359375, 0.016137123107910156, 0.020219802856445312, 0.02430248260498047, 0.028385162353515625, 0.03246784210205078, 0.03655052185058594, 0.040633201599121094, 0.04471588134765625, 0.048798561096191406, 0.05288124084472656, 0.05696392059326172, 0.061046600341796875, 0.06512928009033203, 0.06921195983886719, 0.07329463958740234, 0.0773773193359375, 0.08145999908447266, 0.08554267883300781, 0.08962535858154297, 0.09370803833007812, 0.09779071807861328, 0.10187339782714844, 0.1059560775756836, 0.11003875732421875, 0.1141214370727539, 0.11820411682128906, 0.12228679656982422, 0.12636947631835938, 0.13045215606689453, 0.1345348358154297, 0.13861751556396484, 0.1427001953125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [380.0, 642.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4372916519641876, -0.0263272225856781, 0.3846372067928314, 0.7956016063690186, 1.2065660953521729, 1.6175305843353271, 2.0284948348999023, 2.4394593238830566, 2.850423812866211, 3.2613883018493652, 3.6723527908325195, 4.083316802978516, 4.494281768798828, 4.905245780944824, 5.3162102699279785, 5.727174758911133, 6.138139247894287, 6.549103736877441, 6.960068225860596, 7.37103271484375, 7.781996726989746, 8.192961692810059, 8.603925704956055, 9.014890670776367, 9.425854682922363, 9.83681869506836, 10.247783660888672, 10.658747673034668, 11.06971263885498, 11.480676651000977, 11.891641616821289, 12.302605628967285, 12.713569641113281, 13.124533653259277, 13.53549861907959, 13.946462631225586, 14.357427597045898, 14.768391609191895, 15.17935562133789, 15.590320587158203, 16.001285552978516, 16.412250518798828, 16.823213577270508, 17.23417854309082, 17.645143508911133, 18.056108474731445, 18.467071533203125, 18.878036499023438, 19.28900146484375, 19.699966430664062, 20.110929489135742, 20.521894454956055, 20.932859420776367, 21.34382438659668, 21.75478744506836, 22.165752410888672, 22.57671546936035, 22.987680435180664, 23.398643493652344, 23.809608459472656, 24.22057342529297, 24.63153839111328, 25.04250144958496, 25.453466415405273, 25.864431381225586]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 8.0, 9.0, 16.0, 16.0, 14.0, 24.0, 28.0, 40.0, 31.0, 26.0, 47.0, 48.0, 63.0, 45.0, 46.0, 51.0, 58.0, 57.0, 55.0, 39.0, 39.0, 35.0, 35.0, 30.0, 19.0, 22.0, 23.0, 13.0, 12.0, 11.0, 10.0, 7.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7143536806106567, -0.6932075023651123, -0.6720612645149231, -0.6509150862693787, -0.6297688484191895, -0.608622670173645, -0.5874764919281006, -0.5663302540779114, -0.5451840162277222, -0.5240378379821777, -0.5028916001319885, -0.4817454218864441, -0.4605991840362549, -0.43945300579071045, -0.41830679774284363, -0.3971605896949768, -0.3760144114494324, -0.35486820340156555, -0.33372199535369873, -0.3125758171081543, -0.2914295792579651, -0.27028340101242065, -0.24913719296455383, -0.227990984916687, -0.2068447768688202, -0.18569856882095337, -0.16455236077308655, -0.14340616762638092, -0.1222599595785141, -0.10111375153064728, -0.07996755838394165, -0.05882135033607483, -0.03767514228820801, -0.016528937965631485, 0.004617266356945038, 0.025763466954231262, 0.046909675002098083, 0.0680558830499649, 0.08920207619667053, 0.11034828424453735, 0.13149449229240417, 0.152640700340271, 0.17378690838813782, 0.19493310153484344, 0.21607930958271027, 0.2372255176305771, 0.2583717107772827, 0.27951791882514954, 0.30066412687301636, 0.3218103349208832, 0.34295654296875, 0.36410272121429443, 0.38524895906448364, 0.4063951373100281, 0.4275413453578949, 0.4486875534057617, 0.46983376145362854, 0.49097996950149536, 0.5121261477470398, 0.533272385597229, 0.5544185638427734, 0.5755648016929626, 0.5967109799385071, 0.6178572177886963, 0.6390033960342407]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 10.0, 15.0, 26.0, 28.0, 41.0, 64.0, 89.0, 136.0, 210.0, 358.0, 624.0, 1309.0, 3251.0, 13630.0, 168223.0, 3937895.0, 56392.0, 7578.0, 2156.0, 878.0, 507.0, 309.0, 198.0, 124.0, 67.0, 66.0, 23.0, 21.0, 18.0, 4.0, 6.0, 11.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.57861328125, -0.5607147216796875, -0.542816162109375, -0.5249176025390625, -0.50701904296875, -0.4891204833984375, -0.471221923828125, -0.4533233642578125, -0.4354248046875, -0.4175262451171875, -0.399627685546875, -0.3817291259765625, -0.36383056640625, -0.3459320068359375, -0.328033447265625, -0.3101348876953125, -0.292236328125, -0.2743377685546875, -0.256439208984375, -0.2385406494140625, -0.22064208984375, -0.2027435302734375, -0.184844970703125, -0.1669464111328125, -0.1490478515625, -0.1311492919921875, -0.113250732421875, -0.0953521728515625, -0.07745361328125, -0.0595550537109375, -0.041656494140625, -0.0237579345703125, -0.005859375, 0.0120391845703125, 0.029937744140625, 0.0478363037109375, 0.06573486328125, 0.0836334228515625, 0.101531982421875, 0.1194305419921875, 0.1373291015625, 0.1552276611328125, 0.173126220703125, 0.1910247802734375, 0.20892333984375, 0.2268218994140625, 0.244720458984375, 0.2626190185546875, 0.280517578125, 0.2984161376953125, 0.316314697265625, 0.3342132568359375, 0.35211181640625, 0.3700103759765625, 0.387908935546875, 0.4058074951171875, 0.4237060546875, 0.4416046142578125, 0.459503173828125, 0.4774017333984375, 0.49530029296875, 0.5131988525390625, 0.531097412109375, 0.5489959716796875, 0.56689453125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 7.0, 7.0, 15.0, 11.0, 26.0, 25.0, 36.0, 37.0, 52.0, 56.0, 73.0, 92.0, 110.0, 91.0, 76.0, 57.0, 44.0, 55.0, 31.0, 32.0, 29.0, 12.0, 13.0, 5.0, 6.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08978271484375, -0.08702564239501953, -0.08426856994628906, -0.0815114974975586, -0.07875442504882812, -0.07599735260009766, -0.07324028015136719, -0.07048320770263672, -0.06772613525390625, -0.06496906280517578, -0.06221199035644531, -0.059454917907714844, -0.056697845458984375, -0.053940773010253906, -0.05118370056152344, -0.04842662811279297, -0.0456695556640625, -0.04291248321533203, -0.04015541076660156, -0.037398338317871094, -0.034641265869140625, -0.031884193420410156, -0.029127120971679688, -0.02637004852294922, -0.02361297607421875, -0.02085590362548828, -0.018098831176757812, -0.015341758728027344, -0.012584686279296875, -0.009827613830566406, -0.0070705413818359375, -0.004313468933105469, -0.001556396484375, 0.0012006759643554688, 0.0039577484130859375, 0.006714820861816406, 0.009471893310546875, 0.012228965759277344, 0.014986038208007812, 0.01774311065673828, 0.02050018310546875, 0.02325725555419922, 0.026014328002929688, 0.028771400451660156, 0.031528472900390625, 0.034285545349121094, 0.03704261779785156, 0.03979969024658203, 0.0425567626953125, 0.04531383514404297, 0.04807090759277344, 0.050827980041503906, 0.053585052490234375, 0.056342124938964844, 0.05909919738769531, 0.06185626983642578, 0.06461334228515625, 0.06737041473388672, 0.07012748718261719, 0.07288455963134766, 0.07564163208007812, 0.0783987045288086, 0.08115577697753906, 0.08391284942626953, 0.086669921875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 8.0, 12.0, 24.0, 62.0, 113.0, 163.0, 311.0, 828.0, 4600.0, 63806.0, 3764836.0, 343728.0, 12986.0, 1750.0, 547.0, 230.0, 129.0, 69.0, 42.0, 17.0, 13.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.75732421875, -0.7407608032226562, -0.7241973876953125, -0.7076339721679688, -0.691070556640625, -0.6745071411132812, -0.6579437255859375, -0.6413803100585938, -0.62481689453125, -0.6082534790039062, -0.5916900634765625, -0.5751266479492188, -0.558563232421875, -0.5419998168945312, -0.5254364013671875, -0.5088729858398438, -0.4923095703125, -0.47574615478515625, -0.4591827392578125, -0.44261932373046875, -0.426055908203125, -0.40949249267578125, -0.3929290771484375, -0.37636566162109375, -0.35980224609375, -0.34323883056640625, -0.3266754150390625, -0.31011199951171875, -0.293548583984375, -0.27698516845703125, -0.2604217529296875, -0.24385833740234375, -0.227294921875, -0.21073150634765625, -0.1941680908203125, -0.17760467529296875, -0.161041259765625, -0.14447784423828125, -0.1279144287109375, -0.11135101318359375, -0.09478759765625, -0.07822418212890625, -0.0616607666015625, -0.04509735107421875, -0.028533935546875, -0.01197052001953125, 0.0045928955078125, 0.02115631103515625, 0.0377197265625, 0.05428314208984375, 0.0708465576171875, 0.08740997314453125, 0.103973388671875, 0.12053680419921875, 0.1371002197265625, 0.15366363525390625, 0.17022705078125, 0.18679046630859375, 0.2033538818359375, 0.21991729736328125, 0.236480712890625, 0.25304412841796875, 0.2696075439453125, 0.28617095947265625, 0.302734375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 4.0, 3.0, 14.0, 12.0, 18.0, 33.0, 46.0, 51.0, 74.0, 107.0, 194.0, 322.0, 738.0, 1036.0, 492.0, 282.0, 198.0, 123.0, 93.0, 57.0, 60.0, 36.0, 22.0, 17.0, 12.0, 11.0, 9.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10687255859375, -0.1026601791381836, -0.09844779968261719, -0.09423542022705078, -0.09002304077148438, -0.08581066131591797, -0.08159828186035156, -0.07738590240478516, -0.07317352294921875, -0.06896114349365234, -0.06474876403808594, -0.06053638458251953, -0.056324005126953125, -0.05211162567138672, -0.04789924621582031, -0.043686866760253906, -0.0394744873046875, -0.035262107849121094, -0.031049728393554688, -0.02683734893798828, -0.022624969482421875, -0.01841259002685547, -0.014200210571289062, -0.009987831115722656, -0.00577545166015625, -0.0015630722045898438, 0.0026493072509765625, 0.006861686706542969, 0.011074066162109375, 0.015286445617675781, 0.019498825073242188, 0.023711204528808594, 0.027923583984375, 0.032135963439941406, 0.03634834289550781, 0.04056072235107422, 0.044773101806640625, 0.04898548126220703, 0.05319786071777344, 0.057410240173339844, 0.06162261962890625, 0.06583499908447266, 0.07004737854003906, 0.07425975799560547, 0.07847213745117188, 0.08268451690673828, 0.08689689636230469, 0.0911092758178711, 0.0953216552734375, 0.0995340347290039, 0.10374641418457031, 0.10795879364013672, 0.11217117309570312, 0.11638355255126953, 0.12059593200683594, 0.12480831146240234, 0.12902069091796875, 0.13323307037353516, 0.13744544982910156, 0.14165782928466797, 0.14587020874023438, 0.15008258819580078, 0.1542949676513672, 0.1585073471069336, 0.1627197265625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 15.0, 25.0, 75.0, 125.0, 213.0, 220.0, 149.0, 87.0, 32.0, 23.0, 18.0, 7.0, 9.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3275172710418701, -0.3021373152732849, -0.2767573297023773, -0.2513773739337921, -0.22599738836288452, -0.20061743259429932, -0.17523746192455292, -0.14985749125480652, -0.12447752058506012, -0.09909754991531372, -0.07371757924556732, -0.04833761602640152, -0.02295764535665512, 0.002422317862510681, 0.02780228853225708, 0.05318225920200348, 0.07856222987174988, 0.10394220054149628, 0.12932217121124268, 0.15470212697982788, 0.18008211255073547, 0.20546206831932068, 0.23084203898906708, 0.2562220096588135, 0.2816019654273987, 0.3069819211959839, 0.3323619067668915, 0.3577418625354767, 0.3831218481063843, 0.4085018038749695, 0.4338817596435547, 0.4592617452144623, 0.4846417307853699, 0.5100216865539551, 0.5354016423225403, 0.5607816576957703, 0.5861616134643555, 0.6115415692329407, 0.6369215250015259, 0.6623015403747559, 0.6876814961433411, 0.7130614519119263, 0.7384414076805115, 0.7638214230537415, 0.7892013788223267, 0.8145813345909119, 0.8399612903594971, 0.865341305732727, 0.8907212018966675, 0.9161011576652527, 0.9414811134338379, 0.9668611288070679, 0.9922410845756531, 1.0176210403442383, 1.0430010557174683, 1.0683809518814087, 1.0937609672546387, 1.1191409826278687, 1.144520878791809, 1.169900894165039, 1.1952807903289795, 1.2206608057022095, 1.2460408210754395, 1.2714207172393799, 1.2968007326126099]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 2.0, 7.0, 12.0, 4.0, 9.0, 11.0, 15.0, 19.0, 14.0, 21.0, 18.0, 17.0, 27.0, 22.0, 36.0, 37.0, 33.0, 31.0, 36.0, 35.0, 51.0, 46.0, 38.0, 33.0, 43.0, 40.0, 31.0, 36.0, 28.0, 44.0, 28.0, 23.0, 25.0, 18.0, 19.0, 25.0, 9.0, 15.0, 8.0, 8.0, 3.0, 5.0, 6.0, 3.0, 5.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2619420289993286, -0.25254446268081665, -0.24314691126346588, -0.23374934494495392, -0.22435179352760315, -0.2149542272090912, -0.20555666089057922, -0.19615910947322845, -0.18676155805587769, -0.17736399173736572, -0.16796644032001495, -0.158568874001503, -0.14917132258415222, -0.13977375626564026, -0.1303761899471283, -0.12097863852977753, -0.11158107221126556, -0.1021835133433342, -0.09278595447540283, -0.08338838815689087, -0.0739908367395401, -0.06459327042102814, -0.05519571155309677, -0.045798152685165405, -0.03640059381723404, -0.027003034949302673, -0.017605474218726158, -0.008207913488149643, 0.001189645379781723, 0.010587204247713089, 0.019984766840934753, 0.02938232570886612, 0.038779884576797485, 0.04817744344472885, 0.05757500231266022, 0.06697256863117218, 0.07637012004852295, 0.08576768636703491, 0.09516524523496628, 0.10456280410289764, 0.11396036297082901, 0.12335792183876038, 0.13275548815727234, 0.1421530395746231, 0.15155060589313507, 0.16094815731048584, 0.1703457236289978, 0.17974328994750977, 0.18914084136486053, 0.1985384076833725, 0.20793595910072327, 0.21733352541923523, 0.226731076836586, 0.23612864315509796, 0.24552619457244873, 0.2549237608909607, 0.26432132720947266, 0.2737188935279846, 0.2831164598464966, 0.29251399636268616, 0.3019115626811981, 0.3113091289997101, 0.32070669531822205, 0.3301042318344116, 0.3395017981529236]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 5.0, 6.0, 10.0, 8.0, 10.0, 14.0, 14.0, 31.0, 28.0, 43.0, 60.0, 86.0, 102.0, 146.0, 209.0, 307.0, 493.0, 720.0, 1209.0, 1975.0, 3449.0, 6154.0, 11419.0, 22295.0, 46276.0, 105619.0, 254471.0, 322464.0, 146639.0, 62668.0, 28913.0, 14351.0, 7727.0, 4117.0, 2430.0, 1383.0, 839.0, 578.0, 395.0, 264.0, 182.0, 109.0, 101.0, 65.0, 45.0, 36.0, 24.0, 15.0, 13.0, 9.0, 20.0, 6.0, 3.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1573486328125, -0.15213584899902344, -0.14692306518554688, -0.1417102813720703, -0.13649749755859375, -0.1312847137451172, -0.12607192993164062, -0.12085914611816406, -0.1156463623046875, -0.11043357849121094, -0.10522079467773438, -0.10000801086425781, -0.09479522705078125, -0.08958244323730469, -0.08436965942382812, -0.07915687561035156, -0.073944091796875, -0.06873130798339844, -0.06351852416992188, -0.05830574035644531, -0.05309295654296875, -0.04788017272949219, -0.042667388916015625, -0.03745460510253906, -0.0322418212890625, -0.027029037475585938, -0.021816253662109375, -0.016603469848632812, -0.01139068603515625, -0.0061779022216796875, -0.000965118408203125, 0.0042476654052734375, 0.00946044921875, 0.014673233032226562, 0.019886016845703125, 0.025098800659179688, 0.03031158447265625, 0.03552436828613281, 0.040737152099609375, 0.04594993591308594, 0.0511627197265625, 0.05637550354003906, 0.061588287353515625, 0.06680107116699219, 0.07201385498046875, 0.07722663879394531, 0.08243942260742188, 0.08765220642089844, 0.092864990234375, 0.09807777404785156, 0.10329055786132812, 0.10850334167480469, 0.11371612548828125, 0.11892890930175781, 0.12414169311523438, 0.12935447692871094, 0.1345672607421875, 0.13978004455566406, 0.14499282836914062, 0.1502056121826172, 0.15541839599609375, 0.1606311798095703, 0.16584396362304688, 0.17105674743652344, 0.17626953125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 17.0, 11.0, 21.0, 28.0, 29.0, 39.0, 54.0, 68.0, 83.0, 91.0, 93.0, 85.0, 88.0, 51.0, 56.0, 53.0, 34.0, 32.0, 16.0, 17.0, 13.0, 7.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.068359375, -0.06578445434570312, -0.06320953369140625, -0.060634613037109375, -0.0580596923828125, -0.055484771728515625, -0.05290985107421875, -0.050334930419921875, -0.047760009765625, -0.045185089111328125, -0.04261016845703125, -0.040035247802734375, -0.0374603271484375, -0.034885406494140625, -0.03231048583984375, -0.029735565185546875, -0.02716064453125, -0.024585723876953125, -0.02201080322265625, -0.019435882568359375, -0.0168609619140625, -0.014286041259765625, -0.01171112060546875, -0.009136199951171875, -0.006561279296875, -0.003986358642578125, -0.00141143798828125, 0.001163482666015625, 0.0037384033203125, 0.006313323974609375, 0.00888824462890625, 0.011463165283203125, 0.0140380859375, 0.016613006591796875, 0.01918792724609375, 0.021762847900390625, 0.0243377685546875, 0.026912689208984375, 0.02948760986328125, 0.032062530517578125, 0.034637451171875, 0.037212371826171875, 0.03978729248046875, 0.042362213134765625, 0.0449371337890625, 0.047512054443359375, 0.05008697509765625, 0.052661895751953125, 0.05523681640625, 0.057811737060546875, 0.06038665771484375, 0.06296157836914062, 0.0655364990234375, 0.06811141967773438, 0.07068634033203125, 0.07326126098632812, 0.075836181640625, 0.07841110229492188, 0.08098602294921875, 0.08356094360351562, 0.0861358642578125, 0.08871078491210938, 0.09128570556640625, 0.09386062622070312, 0.096435546875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 6.0, 10.0, 10.0, 15.0, 15.0, 27.0, 33.0, 49.0, 59.0, 119.0, 182.0, 284.0, 450.0, 827.0, 1630.0, 3943.0, 9794.0, 28716.0, 92925.0, 310791.0, 404685.0, 131130.0, 40101.0, 13165.0, 4979.0, 2097.0, 1051.0, 532.0, 309.0, 184.0, 127.0, 99.0, 72.0, 42.0, 23.0, 19.0, 14.0, 14.0, 9.0, 3.0, 3.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2265625, -0.2197265625, -0.212890625, -0.2060546875, -0.19921875, -0.1923828125, -0.185546875, -0.1787109375, -0.171875, -0.1650390625, -0.158203125, -0.1513671875, -0.14453125, -0.1376953125, -0.130859375, -0.1240234375, -0.1171875, -0.1103515625, -0.103515625, -0.0966796875, -0.08984375, -0.0830078125, -0.076171875, -0.0693359375, -0.0625, -0.0556640625, -0.048828125, -0.0419921875, -0.03515625, -0.0283203125, -0.021484375, -0.0146484375, -0.0078125, -0.0009765625, 0.005859375, 0.0126953125, 0.01953125, 0.0263671875, 0.033203125, 0.0400390625, 0.046875, 0.0537109375, 0.060546875, 0.0673828125, 0.07421875, 0.0810546875, 0.087890625, 0.0947265625, 0.1015625, 0.1083984375, 0.115234375, 0.1220703125, 0.12890625, 0.1357421875, 0.142578125, 0.1494140625, 0.15625, 0.1630859375, 0.169921875, 0.1767578125, 0.18359375, 0.1904296875, 0.197265625, 0.2041015625, 0.2109375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 9.0, 9.0, 13.0, 12.0, 28.0, 23.0, 28.0, 26.0, 34.0, 29.0, 40.0, 35.0, 53.0, 46.0, 58.0, 57.0, 61.0, 52.0, 49.0, 53.0, 31.0, 41.0, 29.0, 41.0, 29.0, 33.0, 13.0, 20.0, 9.0, 8.0, 7.0, 8.0, 5.0, 2.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.136962890625, -0.1326580047607422, -0.12835311889648438, -0.12404823303222656, -0.11974334716796875, -0.11543846130371094, -0.11113357543945312, -0.10682868957519531, -0.1025238037109375, -0.09821891784667969, -0.09391403198242188, -0.08960914611816406, -0.08530426025390625, -0.08099937438964844, -0.07669448852539062, -0.07238960266113281, -0.068084716796875, -0.06377983093261719, -0.059474945068359375, -0.05517005920410156, -0.05086517333984375, -0.04656028747558594, -0.042255401611328125, -0.03795051574707031, -0.0336456298828125, -0.029340744018554688, -0.025035858154296875, -0.020730972290039062, -0.01642608642578125, -0.012121200561523438, -0.007816314697265625, -0.0035114288330078125, 0.00079345703125, 0.0050983428955078125, 0.009403228759765625, 0.013708114624023438, 0.01801300048828125, 0.022317886352539062, 0.026622772216796875, 0.030927658081054688, 0.0352325439453125, 0.03953742980957031, 0.043842315673828125, 0.04814720153808594, 0.05245208740234375, 0.05675697326660156, 0.061061859130859375, 0.06536674499511719, 0.069671630859375, 0.07397651672363281, 0.07828140258789062, 0.08258628845214844, 0.08689117431640625, 0.09119606018066406, 0.09550094604492188, 0.09980583190917969, 0.1041107177734375, 0.10841560363769531, 0.11272048950195312, 0.11702537536621094, 0.12133026123046875, 0.12563514709472656, 0.12994003295898438, 0.1342449188232422, 0.1385498046875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 1.0, 2.0, 7.0, 6.0, 10.0, 22.0, 17.0, 44.0, 85.0, 154.0, 324.0, 827.0, 2165.0, 6870.0, 32680.0, 702417.0, 273178.0, 21694.0, 5171.0, 1721.0, 588.0, 270.0, 135.0, 53.0, 26.0, 27.0, 12.0, 6.0, 6.0, 7.0, 2.0, 6.0, 4.0, 6.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3984375, -0.3859405517578125, -0.373443603515625, -0.3609466552734375, -0.34844970703125, -0.3359527587890625, -0.323455810546875, -0.3109588623046875, -0.2984619140625, -0.2859649658203125, -0.273468017578125, -0.2609710693359375, -0.24847412109375, -0.2359771728515625, -0.223480224609375, -0.2109832763671875, -0.198486328125, -0.1859893798828125, -0.173492431640625, -0.1609954833984375, -0.14849853515625, -0.1360015869140625, -0.123504638671875, -0.1110076904296875, -0.0985107421875, -0.0860137939453125, -0.073516845703125, -0.0610198974609375, -0.04852294921875, -0.0360260009765625, -0.023529052734375, -0.0110321044921875, 0.00146484375, 0.0139617919921875, 0.026458740234375, 0.0389556884765625, 0.05145263671875, 0.0639495849609375, 0.076446533203125, 0.0889434814453125, 0.1014404296875, 0.1139373779296875, 0.126434326171875, 0.1389312744140625, 0.15142822265625, 0.1639251708984375, 0.176422119140625, 0.1889190673828125, 0.201416015625, 0.2139129638671875, 0.226409912109375, 0.2389068603515625, 0.25140380859375, 0.2639007568359375, 0.276397705078125, 0.2888946533203125, 0.3013916015625, 0.3138885498046875, 0.326385498046875, 0.3388824462890625, 0.35137939453125, 0.3638763427734375, 0.376373291015625, 0.3888702392578125, 0.4013671875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 5.0, 2.0, 9.0, 13.0, 21.0, 23.0, 40.0, 54.0, 105.0, 185.0, 191.0, 133.0, 75.0, 48.0, 27.0, 12.0, 15.0, 5.0, 6.0, 2.0, 7.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.069639205932617e-05, -2.9797665774822235e-05, -2.88989394903183e-05, -2.800021320581436e-05, -2.7101486921310425e-05, -2.6202760636806488e-05, -2.530403435230255e-05, -2.4405308067798615e-05, -2.3506581783294678e-05, -2.260785549879074e-05, -2.1709129214286804e-05, -2.0810402929782867e-05, -1.991167664527893e-05, -1.9012950360774994e-05, -1.8114224076271057e-05, -1.721549779176712e-05, -1.6316771507263184e-05, -1.5418045222759247e-05, -1.451931893825531e-05, -1.3620592653751373e-05, -1.2721866369247437e-05, -1.18231400847435e-05, -1.0924413800239563e-05, -1.0025687515735626e-05, -9.12696123123169e-06, -8.228234946727753e-06, -7.329508662223816e-06, -6.430782377719879e-06, -5.532056093215942e-06, -4.633329808712006e-06, -3.734603524208069e-06, -2.835877239704132e-06, -1.9371509552001953e-06, -1.0384246706962585e-06, -1.3969838619232178e-07, 7.59027898311615e-07, 1.6577541828155518e-06, 2.5564804673194885e-06, 3.4552067518234253e-06, 4.353933036327362e-06, 5.252659320831299e-06, 6.151385605335236e-06, 7.050111889839172e-06, 7.948838174343109e-06, 8.847564458847046e-06, 9.746290743350983e-06, 1.064501702785492e-05, 1.1543743312358856e-05, 1.2442469596862793e-05, 1.334119588136673e-05, 1.4239922165870667e-05, 1.5138648450374603e-05, 1.603737473487854e-05, 1.6936101019382477e-05, 1.7834827303886414e-05, 1.873355358839035e-05, 1.9632279872894287e-05, 2.0531006157398224e-05, 2.142973244190216e-05, 2.2328458726406097e-05, 2.3227185010910034e-05, 2.412591129541397e-05, 2.5024637579917908e-05, 2.5923363864421844e-05, 2.682209014892578e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 3.0, 4.0, 8.0, 9.0, 10.0, 10.0, 11.0, 24.0, 39.0, 55.0, 95.0, 171.0, 245.0, 393.0, 756.0, 1519.0, 3178.0, 6997.0, 19216.0, 88435.0, 773975.0, 115965.0, 22452.0, 7890.0, 3433.0, 1642.0, 834.0, 459.0, 266.0, 142.0, 95.0, 61.0, 44.0, 28.0, 25.0, 14.0, 8.0, 5.0, 10.0, 5.0, 2.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2449951171875, -0.2367076873779297, -0.22842025756835938, -0.22013282775878906, -0.21184539794921875, -0.20355796813964844, -0.19527053833007812, -0.1869831085205078, -0.1786956787109375, -0.1704082489013672, -0.16212081909179688, -0.15383338928222656, -0.14554595947265625, -0.13725852966308594, -0.12897109985351562, -0.12068367004394531, -0.112396240234375, -0.10410881042480469, -0.09582138061523438, -0.08753395080566406, -0.07924652099609375, -0.07095909118652344, -0.06267166137695312, -0.05438423156738281, -0.0460968017578125, -0.03780937194824219, -0.029521942138671875, -0.021234512329101562, -0.01294708251953125, -0.0046596527099609375, 0.003627777099609375, 0.011915206909179688, 0.02020263671875, 0.028490066528320312, 0.036777496337890625, 0.04506492614746094, 0.05335235595703125, 0.06163978576660156, 0.06992721557617188, 0.07821464538574219, 0.0865020751953125, 0.09478950500488281, 0.10307693481445312, 0.11136436462402344, 0.11965179443359375, 0.12793922424316406, 0.13622665405273438, 0.1445140838623047, 0.152801513671875, 0.1610889434814453, 0.16937637329101562, 0.17766380310058594, 0.18595123291015625, 0.19423866271972656, 0.20252609252929688, 0.2108135223388672, 0.2191009521484375, 0.2273883819580078, 0.23567581176757812, 0.24396324157714844, 0.25225067138671875, 0.26053810119628906, 0.2688255310058594, 0.2771129608154297, 0.285400390625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 5.0, 3.0, 2.0, 12.0, 11.0, 10.0, 9.0, 13.0, 13.0, 12.0, 18.0, 22.0, 26.0, 45.0, 54.0, 60.0, 94.0, 109.0, 104.0, 68.0, 62.0, 46.0, 33.0, 32.0, 22.0, 21.0, 16.0, 22.0, 11.0, 10.0, 1.0, 5.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.079833984375, -0.0774698257446289, -0.07510566711425781, -0.07274150848388672, -0.07037734985351562, -0.06801319122314453, -0.06564903259277344, -0.06328487396240234, -0.06092071533203125, -0.058556556701660156, -0.05619239807128906, -0.05382823944091797, -0.051464080810546875, -0.04909992218017578, -0.04673576354980469, -0.044371604919433594, -0.0420074462890625, -0.039643287658691406, -0.03727912902832031, -0.03491497039794922, -0.032550811767578125, -0.03018665313720703, -0.027822494506835938, -0.025458335876464844, -0.02309417724609375, -0.020730018615722656, -0.018365859985351562, -0.01600170135498047, -0.013637542724609375, -0.011273384094238281, -0.008909225463867188, -0.006545066833496094, -0.004180908203125, -0.0018167495727539062, 0.0005474090576171875, 0.0029115676879882812, 0.005275726318359375, 0.007639884948730469, 0.010004043579101562, 0.012368202209472656, 0.01473236083984375, 0.017096519470214844, 0.019460678100585938, 0.02182483673095703, 0.024188995361328125, 0.02655315399169922, 0.028917312622070312, 0.031281471252441406, 0.0336456298828125, 0.036009788513183594, 0.03837394714355469, 0.04073810577392578, 0.043102264404296875, 0.04546642303466797, 0.04783058166503906, 0.050194740295410156, 0.05255889892578125, 0.054923057556152344, 0.05728721618652344, 0.05965137481689453, 0.062015533447265625, 0.06437969207763672, 0.06674385070800781, 0.0691080093383789, 0.07147216796875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 10.0, 26.0, 114.0, 466.0, 313.0, 66.0, 16.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.142932415008545, -4.066018104553223, -3.9891035556793213, -3.912189245223999, -3.8352746963500977, -3.7583603858947754, -3.681445837020874, -3.6045315265655518, -3.5276169776916504, -3.450702667236328, -3.3737881183624268, -3.2968738079071045, -3.219959259033203, -3.143044948577881, -3.0661303997039795, -2.9892160892486572, -2.912301778793335, -2.8353874683380127, -2.7584729194641113, -2.681558609008789, -2.6046440601348877, -2.5277297496795654, -2.450815200805664, -2.373900890350342, -2.2969865798950195, -2.2200722694396973, -2.143157720565796, -2.0662434101104736, -1.9893288612365723, -1.91241455078125, -1.8355001211166382, -1.7585856914520264, -1.6816712617874146, -1.6047568321228027, -1.527842402458191, -1.450927972793579, -1.3740136623382568, -1.2970991134643555, -1.2201848030090332, -1.1432703733444214, -1.0663559436798096, -0.9894415140151978, -0.9125270843505859, -0.8356127142906189, -0.7586982846260071, -0.6817838549613953, -0.6048694849014282, -0.5279550552368164, -0.4510406255722046, -0.3741261959075928, -0.29721179604530334, -0.22029738128185272, -0.1433829665184021, -0.06646853685379028, 0.010445863008499146, 0.08736026287078857, 0.1642746925354004, 0.241189107298851, 0.31810352206230164, 0.39501792192459106, 0.4719323515892029, 0.5488467812538147, 0.6257611513137817, 0.7026755809783936, 0.7795900106430054]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 9.0, 8.0, 7.0, 8.0, 10.0, 15.0, 15.0, 18.0, 18.0, 27.0, 30.0, 33.0, 36.0, 33.0, 36.0, 36.0, 49.0, 43.0, 53.0, 46.0, 49.0, 46.0, 47.0, 35.0, 38.0, 49.0, 30.0, 31.0, 23.0, 25.0, 19.0, 15.0, 11.0, 15.0, 8.0, 7.0, 5.0, 2.0, 2.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.4178602695465088, -0.404879629611969, -0.3918989896774292, -0.3789183497428894, -0.3659376800060272, -0.3529570400714874, -0.33997640013694763, -0.32699576020240784, -0.31401512026786804, -0.30103448033332825, -0.28805384039878845, -0.27507317066192627, -0.2620925307273865, -0.24911189079284668, -0.23613125085830688, -0.2231506109237671, -0.2101699560880661, -0.1971893161535263, -0.18420866131782532, -0.17122802138328552, -0.15824738144874573, -0.14526674151420593, -0.13228608667850494, -0.11930544674396515, -0.10632479935884476, -0.09334415197372437, -0.08036351203918457, -0.06738286465406418, -0.054402220994234085, -0.04142157733440399, -0.0284409299492836, -0.015460290014743805, -0.002479642629623413, 0.010501001961529255, 0.023481646552681923, 0.036462292075157166, 0.04944293573498726, 0.06242357939481735, 0.07540422677993774, 0.08838486671447754, 0.10136551409959793, 0.11434616148471832, 0.12732680141925812, 0.1403074562549591, 0.1532880961894989, 0.1662687361240387, 0.1792493760585785, 0.1922300159931183, 0.20521067082881927, 0.21819131076335907, 0.23117196559906006, 0.24415260553359985, 0.25713324546813965, 0.27011388540267944, 0.28309452533721924, 0.29607516527175903, 0.3090558350086212, 0.322036474943161, 0.3350171148777008, 0.347997784614563, 0.3609784245491028, 0.3739590644836426, 0.3869397044181824, 0.39992034435272217, 0.41290098428726196]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 8.0, 4.0, 9.0, 24.0, 27.0, 33.0, 42.0, 97.0, 143.0, 234.0, 384.0, 681.0, 1367.0, 3006.0, 7835.0, 23183.0, 89334.0, 823388.0, 2935425.0, 240040.0, 45794.0, 13683.0, 5026.0, 2066.0, 1005.0, 549.0, 293.0, 207.0, 110.0, 89.0, 55.0, 43.0, 22.0, 20.0, 13.0, 15.0, 9.0, 8.0, 4.0, 4.0, 1.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13037109375, -0.125, -0.11962890625, -0.1142578125, -0.10888671875, -0.103515625, -0.09814453125, -0.0927734375, -0.08740234375, -0.08203125, -0.07666015625, -0.0712890625, -0.06591796875, -0.060546875, -0.05517578125, -0.0498046875, -0.04443359375, -0.0390625, -0.03369140625, -0.0283203125, -0.02294921875, -0.017578125, -0.01220703125, -0.0068359375, -0.00146484375, 0.00390625, 0.00927734375, 0.0146484375, 0.02001953125, 0.025390625, 0.03076171875, 0.0361328125, 0.04150390625, 0.046875, 0.05224609375, 0.0576171875, 0.06298828125, 0.068359375, 0.07373046875, 0.0791015625, 0.08447265625, 0.08984375, 0.09521484375, 0.1005859375, 0.10595703125, 0.111328125, 0.11669921875, 0.1220703125, 0.12744140625, 0.1328125, 0.13818359375, 0.1435546875, 0.14892578125, 0.154296875, 0.15966796875, 0.1650390625, 0.17041015625, 0.17578125, 0.18115234375, 0.1865234375, 0.19189453125, 0.197265625, 0.20263671875, 0.2080078125, 0.21337890625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 5.0, 5.0, 9.0, 13.0, 17.0, 33.0, 41.0, 54.0, 54.0, 75.0, 73.0, 96.0, 76.0, 86.0, 82.0, 68.0, 65.0, 37.0, 33.0, 27.0, 14.0, 18.0, 5.0, 7.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06689453125, -0.0642538070678711, -0.06161308288574219, -0.05897235870361328, -0.056331634521484375, -0.05369091033935547, -0.05105018615722656, -0.048409461975097656, -0.04576873779296875, -0.043128013610839844, -0.04048728942871094, -0.03784656524658203, -0.035205841064453125, -0.03256511688232422, -0.029924392700195312, -0.027283668518066406, -0.0246429443359375, -0.022002220153808594, -0.019361495971679688, -0.01672077178955078, -0.014080047607421875, -0.011439323425292969, -0.008798599243164062, -0.006157875061035156, -0.00351715087890625, -0.0008764266967773438, 0.0017642974853515625, 0.004405021667480469, 0.007045745849609375, 0.009686470031738281, 0.012327194213867188, 0.014967918395996094, 0.017608642578125, 0.020249366760253906, 0.022890090942382812, 0.02553081512451172, 0.028171539306640625, 0.03081226348876953, 0.03345298767089844, 0.036093711853027344, 0.03873443603515625, 0.041375160217285156, 0.04401588439941406, 0.04665660858154297, 0.049297332763671875, 0.05193805694580078, 0.05457878112792969, 0.057219505310058594, 0.0598602294921875, 0.0625009536743164, 0.06514167785644531, 0.06778240203857422, 0.07042312622070312, 0.07306385040283203, 0.07570457458496094, 0.07834529876708984, 0.08098602294921875, 0.08362674713134766, 0.08626747131347656, 0.08890819549560547, 0.09154891967773438, 0.09418964385986328, 0.09683036804199219, 0.0994710922241211, 0.10211181640625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 7.0, 8.0, 16.0, 12.0, 25.0, 29.0, 36.0, 62.0, 72.0, 137.0, 206.0, 313.0, 604.0, 1479.0, 5044.0, 29982.0, 378162.0, 3457392.0, 288391.0, 24994.0, 4430.0, 1309.0, 600.0, 332.0, 210.0, 134.0, 87.0, 63.0, 41.0, 29.0, 30.0, 14.0, 11.0, 9.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.3603515625, -0.3509807586669922, -0.3416099548339844, -0.33223915100097656, -0.32286834716796875, -0.31349754333496094, -0.3041267395019531, -0.2947559356689453, -0.2853851318359375, -0.2760143280029297, -0.2666435241699219, -0.25727272033691406, -0.24790191650390625, -0.23853111267089844, -0.22916030883789062, -0.2197895050048828, -0.210418701171875, -0.2010478973388672, -0.19167709350585938, -0.18230628967285156, -0.17293548583984375, -0.16356468200683594, -0.15419387817382812, -0.1448230743408203, -0.1354522705078125, -0.1260814666748047, -0.11671066284179688, -0.10733985900878906, -0.09796905517578125, -0.08859825134277344, -0.07922744750976562, -0.06985664367675781, -0.06048583984375, -0.05111503601074219, -0.041744232177734375, -0.03237342834472656, -0.02300262451171875, -0.013631820678710938, -0.004261016845703125, 0.0051097869873046875, 0.0144805908203125, 0.023851394653320312, 0.033222198486328125, 0.04259300231933594, 0.05196380615234375, 0.06133460998535156, 0.07070541381835938, 0.08007621765136719, 0.089447021484375, 0.09881782531738281, 0.10818862915039062, 0.11755943298339844, 0.12693023681640625, 0.13630104064941406, 0.14567184448242188, 0.1550426483154297, 0.1644134521484375, 0.1737842559814453, 0.18315505981445312, 0.19252586364746094, 0.20189666748046875, 0.21126747131347656, 0.22063827514648438, 0.2300090789794922, 0.2393798828125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 11.0, 13.0, 20.0, 19.0, 39.0, 42.0, 70.0, 97.0, 141.0, 208.0, 315.0, 470.0, 633.0, 613.0, 408.0, 285.0, 196.0, 144.0, 93.0, 66.0, 51.0, 46.0, 22.0, 16.0, 17.0, 7.0, 7.0, 7.0, 0.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08856201171875, -0.08467960357666016, -0.08079719543457031, -0.07691478729248047, -0.07303237915039062, -0.06914997100830078, -0.06526756286621094, -0.061385154724121094, -0.05750274658203125, -0.053620338439941406, -0.04973793029785156, -0.04585552215576172, -0.041973114013671875, -0.03809070587158203, -0.03420829772949219, -0.030325889587402344, -0.0264434814453125, -0.022561073303222656, -0.018678665161132812, -0.014796257019042969, -0.010913848876953125, -0.007031440734863281, -0.0031490325927734375, 0.0007333755493164062, 0.00461578369140625, 0.008498191833496094, 0.012380599975585938, 0.01626300811767578, 0.020145416259765625, 0.02402782440185547, 0.027910232543945312, 0.031792640686035156, 0.035675048828125, 0.039557456970214844, 0.04343986511230469, 0.04732227325439453, 0.051204681396484375, 0.05508708953857422, 0.05896949768066406, 0.0628519058227539, 0.06673431396484375, 0.0706167221069336, 0.07449913024902344, 0.07838153839111328, 0.08226394653320312, 0.08614635467529297, 0.09002876281738281, 0.09391117095947266, 0.0977935791015625, 0.10167598724365234, 0.10555839538574219, 0.10944080352783203, 0.11332321166992188, 0.11720561981201172, 0.12108802795410156, 0.1249704360961914, 0.12885284423828125, 0.1327352523803711, 0.13661766052246094, 0.14050006866455078, 0.14438247680664062, 0.14826488494873047, 0.1521472930908203, 0.15602970123291016, 0.159912109375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 10.0, 27.0, 60.0, 113.0, 220.0, 263.0, 167.0, 71.0, 37.0, 20.0, 5.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9384273290634155, -0.8979194164276123, -0.8574115037918091, -0.8169035911560059, -0.7763956785202026, -0.7358877658843994, -0.6953797936439514, -0.6548718810081482, -0.614363968372345, -0.5738560557365417, -0.5333481431007385, -0.4928402006626129, -0.4523322880268097, -0.41182437539100647, -0.37131643295288086, -0.33080852031707764, -0.2903006076812744, -0.2497926950454712, -0.20928476750850677, -0.16877683997154236, -0.12826892733573914, -0.08776101469993591, -0.0472530871629715, -0.00674515962600708, 0.03376275300979614, 0.07427067309617996, 0.11477859318256378, 0.1552865207195282, 0.19579443335533142, 0.23630234599113464, 0.27681028842926025, 0.3173182010650635, 0.35782623291015625, 0.3983341455459595, 0.4388420581817627, 0.4793500006198883, 0.5198578834533691, 0.5603657960891724, 0.6008737683296204, 0.6413816809654236, 0.6818895936012268, 0.72239750623703, 0.7629054188728333, 0.8034133315086365, 0.8439213037490845, 0.8844292163848877, 0.9249371290206909, 0.9654450416564941, 1.0059529542922974, 1.0464608669281006, 1.0869687795639038, 1.127476692199707, 1.1679846048355103, 1.2084925174713135, 1.2490004301071167, 1.28950834274292, 1.3300163745880127, 1.370524287223816, 1.4110321998596191, 1.4515401124954224, 1.4920480251312256, 1.5325559377670288, 1.573063850402832, 1.6135718822479248, 1.6540796756744385]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 7.0, 5.0, 4.0, 4.0, 7.0, 15.0, 27.0, 22.0, 22.0, 25.0, 43.0, 37.0, 55.0, 55.0, 52.0, 59.0, 52.0, 58.0, 63.0, 44.0, 51.0, 46.0, 42.0, 45.0, 35.0, 35.0, 31.0, 15.0, 12.0, 6.0, 11.0, 4.0, 8.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35754793882369995, -0.343615859746933, -0.329683780670166, -0.31575167179107666, -0.3018195927143097, -0.2878875136375427, -0.27395543456077576, -0.2600233554840088, -0.24609127640724182, -0.23215919733047485, -0.2182271033525467, -0.20429502427577972, -0.19036294519901276, -0.1764308512210846, -0.16249877214431763, -0.14856669306755066, -0.1346345990896225, -0.12070251256227493, -0.10677043348550797, -0.0928383469581604, -0.07890626788139343, -0.06497418135404587, -0.0510420948266983, -0.037110015749931335, -0.02317792922258377, -0.00924584548920393, 0.004686238244175911, 0.018618322908878326, 0.03255040571093559, 0.04648248851299286, 0.060414575040340424, 0.07434665411710739, 0.08827874064445496, 0.10221082717180252, 0.11614290624856949, 0.13007499277591705, 0.14400707185268402, 0.15793916583061218, 0.17187124490737915, 0.18580332398414612, 0.19973540306091309, 0.21366748213768005, 0.22759957611560822, 0.24153165519237518, 0.25546374917030334, 0.2693958282470703, 0.2833279073238373, 0.29725998640060425, 0.3111920952796936, 0.32512417435646057, 0.33905625343322754, 0.3529883623123169, 0.36692044138908386, 0.38085252046585083, 0.3947845995426178, 0.40871667861938477, 0.42264875769615173, 0.4365808367729187, 0.45051291584968567, 0.46444499492645264, 0.478377103805542, 0.49230918288230896, 0.5062412619590759, 0.5201733112335205, 0.5341054201126099]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 6.0, 5.0, 4.0, 9.0, 10.0, 17.0, 19.0, 13.0, 39.0, 37.0, 54.0, 79.0, 150.0, 199.0, 425.0, 908.0, 1863.0, 4469.0, 11211.0, 30439.0, 86516.0, 236083.0, 372522.0, 193369.0, 69373.0, 24636.0, 9133.0, 3593.0, 1646.0, 765.0, 378.0, 188.0, 107.0, 90.0, 69.0, 35.0, 25.0, 14.0, 18.0, 11.0, 7.0, 8.0, 9.0, 5.0, 4.0, 3.0, 6.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23486328125, -0.2282276153564453, -0.22159194946289062, -0.21495628356933594, -0.20832061767578125, -0.20168495178222656, -0.19504928588867188, -0.1884136199951172, -0.1817779541015625, -0.1751422882080078, -0.16850662231445312, -0.16187095642089844, -0.15523529052734375, -0.14859962463378906, -0.14196395874023438, -0.1353282928466797, -0.128692626953125, -0.12205696105957031, -0.11542129516601562, -0.10878562927246094, -0.10214996337890625, -0.09551429748535156, -0.08887863159179688, -0.08224296569824219, -0.0756072998046875, -0.06897163391113281, -0.062335968017578125, -0.05570030212402344, -0.04906463623046875, -0.04242897033691406, -0.035793304443359375, -0.029157638549804688, -0.02252197265625, -0.015886306762695312, -0.009250640869140625, -0.0026149749755859375, 0.00402069091796875, 0.010656356811523438, 0.017292022705078125, 0.023927688598632812, 0.0305633544921875, 0.03719902038574219, 0.043834686279296875, 0.05047035217285156, 0.05710601806640625, 0.06374168395996094, 0.07037734985351562, 0.07701301574707031, 0.083648681640625, 0.09028434753417969, 0.09692001342773438, 0.10355567932128906, 0.11019134521484375, 0.11682701110839844, 0.12346267700195312, 0.1300983428955078, 0.1367340087890625, 0.1433696746826172, 0.15000534057617188, 0.15664100646972656, 0.16327667236328125, 0.16991233825683594, 0.17654800415039062, 0.1831836700439453, 0.1898193359375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 7.0, 4.0, 8.0, 17.0, 17.0, 25.0, 21.0, 53.0, 60.0, 71.0, 85.0, 72.0, 89.0, 86.0, 66.0, 80.0, 64.0, 46.0, 33.0, 26.0, 27.0, 10.0, 17.0, 8.0, 5.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059356689453125, -0.05695772171020508, -0.054558753967285156, -0.052159786224365234, -0.04976081848144531, -0.04736185073852539, -0.04496288299560547, -0.04256391525268555, -0.040164947509765625, -0.0377659797668457, -0.03536701202392578, -0.03296804428100586, -0.030569076538085938, -0.028170108795166016, -0.025771141052246094, -0.023372173309326172, -0.02097320556640625, -0.018574237823486328, -0.016175270080566406, -0.013776302337646484, -0.011377334594726562, -0.00897836685180664, -0.006579399108886719, -0.004180431365966797, -0.001781463623046875, 0.0006175041198730469, 0.0030164718627929688, 0.005415439605712891, 0.007814407348632812, 0.010213375091552734, 0.012612342834472656, 0.015011310577392578, 0.0174102783203125, 0.019809246063232422, 0.022208213806152344, 0.024607181549072266, 0.027006149291992188, 0.02940511703491211, 0.03180408477783203, 0.03420305252075195, 0.036602020263671875, 0.0390009880065918, 0.04139995574951172, 0.04379892349243164, 0.04619789123535156, 0.048596858978271484, 0.050995826721191406, 0.05339479446411133, 0.05579376220703125, 0.05819272994995117, 0.060591697692871094, 0.06299066543579102, 0.06538963317871094, 0.06778860092163086, 0.07018756866455078, 0.0725865364074707, 0.07498550415039062, 0.07738447189331055, 0.07978343963623047, 0.08218240737915039, 0.08458137512207031, 0.08698034286499023, 0.08937931060791016, 0.09177827835083008, 0.09417724609375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 4.0, 8.0, 11.0, 14.0, 29.0, 37.0, 36.0, 62.0, 107.0, 156.0, 241.0, 336.0, 571.0, 912.0, 1692.0, 3276.0, 7620.0, 19375.0, 55400.0, 169752.0, 397038.0, 256763.0, 85140.0, 28982.0, 10943.0, 4644.0, 2234.0, 1180.0, 680.0, 406.0, 275.0, 197.0, 126.0, 92.0, 69.0, 35.0, 22.0, 30.0, 15.0, 17.0, 7.0, 2.0, 7.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23876953125, -0.23123550415039062, -0.22370147705078125, -0.21616744995117188, -0.2086334228515625, -0.20109939575195312, -0.19356536865234375, -0.18603134155273438, -0.178497314453125, -0.17096328735351562, -0.16342926025390625, -0.15589523315429688, -0.1483612060546875, -0.14082717895507812, -0.13329315185546875, -0.12575912475585938, -0.11822509765625, -0.11069107055664062, -0.10315704345703125, -0.09562301635742188, -0.0880889892578125, -0.08055496215820312, -0.07302093505859375, -0.06548690795898438, -0.057952880859375, -0.050418853759765625, -0.04288482666015625, -0.035350799560546875, -0.0278167724609375, -0.020282745361328125, -0.01274871826171875, -0.005214691162109375, 0.0023193359375, 0.009853363037109375, 0.01738739013671875, 0.024921417236328125, 0.0324554443359375, 0.039989471435546875, 0.04752349853515625, 0.055057525634765625, 0.062591552734375, 0.07012557983398438, 0.07765960693359375, 0.08519363403320312, 0.0927276611328125, 0.10026168823242188, 0.10779571533203125, 0.11532974243164062, 0.12286376953125, 0.13039779663085938, 0.13793182373046875, 0.14546585083007812, 0.1529998779296875, 0.16053390502929688, 0.16806793212890625, 0.17560195922851562, 0.183135986328125, 0.19067001342773438, 0.19820404052734375, 0.20573806762695312, 0.2132720947265625, 0.22080612182617188, 0.22834014892578125, 0.23587417602539062, 0.243408203125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 11.0, 14.0, 11.0, 19.0, 24.0, 17.0, 19.0, 23.0, 28.0, 36.0, 28.0, 38.0, 47.0, 34.0, 42.0, 49.0, 36.0, 42.0, 41.0, 64.0, 31.0, 46.0, 36.0, 31.0, 26.0, 35.0, 27.0, 25.0, 14.0, 24.0, 18.0, 9.0, 14.0, 8.0, 11.0, 5.0, 3.0, 2.0, 4.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11578369140625, -0.11197948455810547, -0.10817527770996094, -0.1043710708618164, -0.10056686401367188, -0.09676265716552734, -0.09295845031738281, -0.08915424346923828, -0.08535003662109375, -0.08154582977294922, -0.07774162292480469, -0.07393741607666016, -0.07013320922851562, -0.0663290023803711, -0.06252479553222656, -0.05872058868408203, -0.0549163818359375, -0.05111217498779297, -0.04730796813964844, -0.043503761291503906, -0.039699554443359375, -0.035895347595214844, -0.03209114074707031, -0.02828693389892578, -0.02448272705078125, -0.02067852020263672, -0.016874313354492188, -0.013070106506347656, -0.009265899658203125, -0.005461692810058594, -0.0016574859619140625, 0.0021467208862304688, 0.005950927734375, 0.009755134582519531, 0.013559341430664062, 0.017363548278808594, 0.021167755126953125, 0.024971961975097656, 0.028776168823242188, 0.03258037567138672, 0.03638458251953125, 0.04018878936767578, 0.04399299621582031, 0.047797203063964844, 0.051601409912109375, 0.055405616760253906, 0.05920982360839844, 0.06301403045654297, 0.0668182373046875, 0.07062244415283203, 0.07442665100097656, 0.0782308578491211, 0.08203506469726562, 0.08583927154541016, 0.08964347839355469, 0.09344768524169922, 0.09725189208984375, 0.10105609893798828, 0.10486030578613281, 0.10866451263427734, 0.11246871948242188, 0.1162729263305664, 0.12007713317871094, 0.12388134002685547, 0.127685546875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 3.0, 10.0, 11.0, 22.0, 42.0, 66.0, 135.0, 206.0, 407.0, 929.0, 2276.0, 7602.0, 65999.0, 943473.0, 20068.0, 4401.0, 1523.0, 668.0, 295.0, 158.0, 103.0, 65.0, 21.0, 20.0, 19.0, 2.0, 4.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9560546875, -0.9254989624023438, -0.8949432373046875, -0.8643875122070312, -0.833831787109375, -0.8032760620117188, -0.7727203369140625, -0.7421646118164062, -0.71160888671875, -0.6810531616210938, -0.6504974365234375, -0.6199417114257812, -0.589385986328125, -0.5588302612304688, -0.5282745361328125, -0.49771881103515625, -0.4671630859375, -0.43660736083984375, -0.4060516357421875, -0.37549591064453125, -0.344940185546875, -0.31438446044921875, -0.2838287353515625, -0.25327301025390625, -0.22271728515625, -0.19216156005859375, -0.1616058349609375, -0.13105010986328125, -0.100494384765625, -0.06993865966796875, -0.0393829345703125, -0.00882720947265625, 0.021728515625, 0.05228424072265625, 0.0828399658203125, 0.11339569091796875, 0.143951416015625, 0.17450714111328125, 0.2050628662109375, 0.23561859130859375, 0.26617431640625, 0.29673004150390625, 0.3272857666015625, 0.35784149169921875, 0.388397216796875, 0.41895294189453125, 0.4495086669921875, 0.48006439208984375, 0.5106201171875, 0.5411758422851562, 0.5717315673828125, 0.6022872924804688, 0.632843017578125, 0.6633987426757812, 0.6939544677734375, 0.7245101928710938, 0.75506591796875, 0.7856216430664062, 0.8161773681640625, 0.8467330932617188, 0.877288818359375, 0.9078445434570312, 0.9384002685546875, 0.9689559936523438, 0.99951171875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 9.0, 23.0, 100.0, 402.0, 331.0, 72.0, 22.0, 7.0, 5.0, 6.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.673833847045898e-05, -9.37972217798233e-05, -9.085610508918762e-05, -8.791498839855194e-05, -8.497387170791626e-05, -8.203275501728058e-05, -7.90916383266449e-05, -7.615052163600922e-05, -7.320940494537354e-05, -7.026828825473785e-05, -6.732717156410217e-05, -6.438605487346649e-05, -6.144493818283081e-05, -5.850382149219513e-05, -5.556270480155945e-05, -5.262158811092377e-05, -4.9680471420288086e-05, -4.6739354729652405e-05, -4.3798238039016724e-05, -4.085712134838104e-05, -3.791600465774536e-05, -3.497488796710968e-05, -3.2033771276474e-05, -2.9092654585838318e-05, -2.6151537895202637e-05, -2.3210421204566956e-05, -2.0269304513931274e-05, -1.7328187823295593e-05, -1.4387071132659912e-05, -1.1445954442024231e-05, -8.50483775138855e-06, -5.563721060752869e-06, -2.6226043701171875e-06, 3.1851232051849365e-07, 3.259629011154175e-06, 6.200745701789856e-06, 9.141862392425537e-06, 1.2082979083061218e-05, 1.50240957736969e-05, 1.796521246433258e-05, 2.0906329154968262e-05, 2.3847445845603943e-05, 2.6788562536239624e-05, 2.9729679226875305e-05, 3.2670795917510986e-05, 3.561191260814667e-05, 3.855302929878235e-05, 4.149414598941803e-05, 4.443526268005371e-05, 4.737637937068939e-05, 5.031749606132507e-05, 5.3258612751960754e-05, 5.6199729442596436e-05, 5.914084613323212e-05, 6.20819628238678e-05, 6.502307951450348e-05, 6.796419620513916e-05, 7.090531289577484e-05, 7.384642958641052e-05, 7.67875462770462e-05, 7.972866296768188e-05, 8.266977965831757e-05, 8.561089634895325e-05, 8.855201303958893e-05, 9.149312973022461e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 8.0, 3.0, 9.0, 12.0, 7.0, 18.0, 29.0, 36.0, 53.0, 80.0, 118.0, 186.0, 354.0, 640.0, 1217.0, 2439.0, 5741.0, 17560.0, 91401.0, 670682.0, 212286.0, 30028.0, 8490.0, 3346.0, 1614.0, 862.0, 524.0, 274.0, 185.0, 117.0, 77.0, 53.0, 29.0, 22.0, 15.0, 11.0, 10.0, 4.0, 5.0, 9.0, 9.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1905517578125, -0.1836681365966797, -0.17678451538085938, -0.16990089416503906, -0.16301727294921875, -0.15613365173339844, -0.14925003051757812, -0.1423664093017578, -0.1354827880859375, -0.1285991668701172, -0.12171554565429688, -0.11483192443847656, -0.10794830322265625, -0.10106468200683594, -0.09418106079101562, -0.08729743957519531, -0.080413818359375, -0.07353019714355469, -0.06664657592773438, -0.05976295471191406, -0.05287933349609375, -0.04599571228027344, -0.039112091064453125, -0.03222846984863281, -0.0253448486328125, -0.018461227416992188, -0.011577606201171875, -0.0046939849853515625, 0.00218963623046875, 0.009073257446289062, 0.015956878662109375, 0.022840499877929688, 0.02972412109375, 0.03660774230957031, 0.043491363525390625, 0.05037498474121094, 0.05725860595703125, 0.06414222717285156, 0.07102584838867188, 0.07790946960449219, 0.0847930908203125, 0.09167671203613281, 0.09856033325195312, 0.10544395446777344, 0.11232757568359375, 0.11921119689941406, 0.12609481811523438, 0.1329784393310547, 0.139862060546875, 0.1467456817626953, 0.15362930297851562, 0.16051292419433594, 0.16739654541015625, 0.17428016662597656, 0.18116378784179688, 0.1880474090576172, 0.1949310302734375, 0.2018146514892578, 0.20869827270507812, 0.21558189392089844, 0.22246551513671875, 0.22934913635253906, 0.23623275756835938, 0.2431163787841797, 0.25]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 4.0, 2.0, 4.0, 10.0, 17.0, 20.0, 28.0, 37.0, 76.0, 113.0, 137.0, 148.0, 114.0, 102.0, 79.0, 33.0, 17.0, 12.0, 12.0, 8.0, 5.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10833740234375, -0.10499858856201172, -0.10165977478027344, -0.09832096099853516, -0.09498214721679688, -0.0916433334350586, -0.08830451965332031, -0.08496570587158203, -0.08162689208984375, -0.07828807830810547, -0.07494926452636719, -0.0716104507446289, -0.06827163696289062, -0.06493282318115234, -0.06159400939941406, -0.05825519561767578, -0.0549163818359375, -0.05157756805419922, -0.04823875427246094, -0.044899940490722656, -0.041561126708984375, -0.038222312927246094, -0.03488349914550781, -0.03154468536376953, -0.02820587158203125, -0.02486705780029297, -0.021528244018554688, -0.018189430236816406, -0.014850616455078125, -0.011511802673339844, -0.008172988891601562, -0.004834175109863281, -0.001495361328125, 0.0018434524536132812, 0.0051822662353515625, 0.008521080017089844, 0.011859893798828125, 0.015198707580566406, 0.018537521362304688, 0.02187633514404297, 0.02521514892578125, 0.02855396270751953, 0.03189277648925781, 0.035231590270996094, 0.038570404052734375, 0.041909217834472656, 0.04524803161621094, 0.04858684539794922, 0.0519256591796875, 0.05526447296142578, 0.05860328674316406, 0.061942100524902344, 0.06528091430664062, 0.0686197280883789, 0.07195854187011719, 0.07529735565185547, 0.07863616943359375, 0.08197498321533203, 0.08531379699707031, 0.0886526107788086, 0.09199142456054688, 0.09533023834228516, 0.09866905212402344, 0.10200786590576172, 0.1053466796875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 16.0, 58.0, 168.0, 254.0, 265.0, 143.0, 60.0, 10.0, 17.0, 5.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.6344008445739746, -2.575676918029785, -2.5169529914855957, -2.458228826522827, -2.3995048999786377, -2.3407809734344482, -2.282057046890259, -2.2233331203460693, -2.164608955383301, -2.1058850288391113, -2.047161102294922, -1.9884370565414429, -1.9297130107879639, -1.8709890842437744, -1.812265157699585, -1.753541111946106, -1.694817304611206, -1.6360933780670166, -1.5773693323135376, -1.5186454057693481, -1.4599213600158691, -1.4011974334716797, -1.3424735069274902, -1.2837494611740112, -1.2250254154205322, -1.1663014888763428, -1.1075774431228638, -1.0488535165786743, -0.9901295304298401, -0.9314055442810059, -0.8726815581321716, -0.8139575719833374, -0.755233645439148, -0.6965096592903137, -0.6377856731414795, -0.57906174659729, -0.5203377604484558, -0.4616137742996216, -0.40288978815078735, -0.3441658318042755, -0.2854418456554413, -0.22671787440776825, -0.16799390316009521, -0.10926991701126099, -0.05054594576358795, 0.008178025484085083, 0.06690201163291931, 0.12562596797943115, 0.18434995412826538, 0.24307392537593842, 0.30179789662361145, 0.3605218827724457, 0.4192458391189575, 0.47796982526779175, 0.536693811416626, 0.5954177379608154, 0.6541417837142944, 0.7128657698631287, 0.7715897560119629, 0.8303136825561523, 0.8890376687049866, 0.9477616548538208, 1.0064857006072998, 1.0652096271514893, 1.1239335536956787]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 7.0, 10.0, 12.0, 19.0, 20.0, 23.0, 32.0, 36.0, 30.0, 35.0, 36.0, 46.0, 55.0, 52.0, 49.0, 52.0, 49.0, 41.0, 45.0, 39.0, 41.0, 37.0, 33.0, 31.0, 26.0, 24.0, 20.0, 16.0, 12.0, 18.0, 11.0, 8.0, 0.0, 4.0, 7.0, 5.0, 9.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4254211187362671, -0.4117816090583801, -0.39814212918281555, -0.3845026195049286, -0.370863139629364, -0.35722362995147705, -0.3435841202735901, -0.3299446403980255, -0.31630516052246094, -0.302665650844574, -0.2890261709690094, -0.27538666129112244, -0.26174718141555786, -0.2481076717376709, -0.23446817696094513, -0.22082868218421936, -0.2071891725063324, -0.19354967772960663, -0.17991018295288086, -0.1662706732749939, -0.15263119339942932, -0.13899168372154236, -0.1253521889448166, -0.11171269416809082, -0.09807319939136505, -0.08443370461463928, -0.07079420983791351, -0.05715470761060715, -0.04351521283388138, -0.02987571805715561, -0.016236215829849243, -0.002596721053123474, 0.011042773723602295, 0.024682270362973213, 0.03832176700234413, 0.0519612655043602, 0.06560076028108597, 0.07924025505781174, 0.0928797572851181, 0.10651925206184387, 0.12015874683856964, 0.1337982416152954, 0.14743773639202118, 0.16107723116874695, 0.1747167408466339, 0.1883562207221985, 0.20199573040008545, 0.21563522517681122, 0.229274719953537, 0.24291421473026276, 0.2565537095069885, 0.2701932191848755, 0.28383269906044006, 0.297472208738327, 0.3111116886138916, 0.32475119829177856, 0.3383907079696655, 0.3520302176475525, 0.36566969752311707, 0.37930920720100403, 0.3929486870765686, 0.40658819675445557, 0.42022770643234253, 0.4338671863079071, 0.4475066661834717]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 7.0, 5.0, 9.0, 11.0, 21.0, 31.0, 47.0, 65.0, 95.0, 214.0, 718.0, 3653.0, 43867.0, 3717948.0, 411184.0, 14008.0, 1671.0, 365.0, 144.0, 65.0, 39.0, 37.0, 29.0, 17.0, 14.0, 9.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.56103515625, -0.5449066162109375, -0.528778076171875, -0.5126495361328125, -0.49652099609375, -0.4803924560546875, -0.464263916015625, -0.4481353759765625, -0.4320068359375, -0.4158782958984375, -0.399749755859375, -0.3836212158203125, -0.36749267578125, -0.3513641357421875, -0.335235595703125, -0.3191070556640625, -0.302978515625, -0.2868499755859375, -0.270721435546875, -0.2545928955078125, -0.23846435546875, -0.2223358154296875, -0.206207275390625, -0.1900787353515625, -0.1739501953125, -0.1578216552734375, -0.141693115234375, -0.1255645751953125, -0.10943603515625, -0.0933074951171875, -0.077178955078125, -0.0610504150390625, -0.044921875, -0.0287933349609375, -0.012664794921875, 0.0034637451171875, 0.01959228515625, 0.0357208251953125, 0.051849365234375, 0.0679779052734375, 0.0841064453125, 0.1002349853515625, 0.116363525390625, 0.1324920654296875, 0.14862060546875, 0.1647491455078125, 0.180877685546875, 0.1970062255859375, 0.213134765625, 0.2292633056640625, 0.245391845703125, 0.2615203857421875, 0.27764892578125, 0.2937774658203125, 0.309906005859375, 0.3260345458984375, 0.3421630859375, 0.3582916259765625, 0.374420166015625, 0.3905487060546875, 0.40667724609375, 0.4228057861328125, 0.438934326171875, 0.4550628662109375, 0.47119140625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 1.0, 11.0, 7.0, 10.0, 13.0, 14.0, 27.0, 37.0, 37.0, 47.0, 58.0, 51.0, 47.0, 59.0, 57.0, 70.0, 66.0, 63.0, 58.0, 53.0, 48.0, 21.0, 32.0, 21.0, 16.0, 23.0, 16.0, 6.0, 7.0, 9.0, 2.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051483154296875, -0.049512386322021484, -0.04754161834716797, -0.04557085037231445, -0.04360008239746094, -0.04162931442260742, -0.039658546447753906, -0.03768777847290039, -0.035717010498046875, -0.03374624252319336, -0.031775474548339844, -0.029804706573486328, -0.027833938598632812, -0.025863170623779297, -0.02389240264892578, -0.021921634674072266, -0.01995086669921875, -0.017980098724365234, -0.01600933074951172, -0.014038562774658203, -0.012067794799804688, -0.010097026824951172, -0.008126258850097656, -0.006155490875244141, -0.004184722900390625, -0.0022139549255371094, -0.00024318695068359375, 0.0017275810241699219, 0.0036983489990234375, 0.005669116973876953, 0.007639884948730469, 0.009610652923583984, 0.0115814208984375, 0.013552188873291016, 0.015522956848144531, 0.017493724822998047, 0.019464492797851562, 0.021435260772705078, 0.023406028747558594, 0.02537679672241211, 0.027347564697265625, 0.02931833267211914, 0.031289100646972656, 0.03325986862182617, 0.03523063659667969, 0.0372014045715332, 0.03917217254638672, 0.041142940521240234, 0.04311370849609375, 0.045084476470947266, 0.04705524444580078, 0.0490260124206543, 0.05099678039550781, 0.05296754837036133, 0.054938316345214844, 0.05690908432006836, 0.058879852294921875, 0.06085062026977539, 0.0628213882446289, 0.06479215621948242, 0.06676292419433594, 0.06873369216918945, 0.07070446014404297, 0.07267522811889648, 0.07464599609375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 0.0, 3.0, 6.0, 16.0, 16.0, 19.0, 26.0, 42.0, 80.0, 95.0, 206.0, 375.0, 674.0, 1297.0, 2972.0, 7661.0, 27752.0, 159160.0, 2226157.0, 1602175.0, 129331.0, 23887.0, 6830.0, 2680.0, 1260.0, 655.0, 369.0, 205.0, 96.0, 102.0, 36.0, 32.0, 19.0, 18.0, 5.0, 6.0, 4.0, 2.0, 2.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.265625, -0.25704193115234375, -0.2484588623046875, -0.23987579345703125, -0.231292724609375, -0.22270965576171875, -0.2141265869140625, -0.20554351806640625, -0.19696044921875, -0.18837738037109375, -0.1797943115234375, -0.17121124267578125, -0.162628173828125, -0.15404510498046875, -0.1454620361328125, -0.13687896728515625, -0.1282958984375, -0.11971282958984375, -0.1111297607421875, -0.10254669189453125, -0.093963623046875, -0.08538055419921875, -0.0767974853515625, -0.06821441650390625, -0.05963134765625, -0.05104827880859375, -0.0424652099609375, -0.03388214111328125, -0.025299072265625, -0.01671600341796875, -0.0081329345703125, 0.00045013427734375, 0.009033203125, 0.01761627197265625, 0.0261993408203125, 0.03478240966796875, 0.043365478515625, 0.05194854736328125, 0.0605316162109375, 0.06911468505859375, 0.07769775390625, 0.08628082275390625, 0.0948638916015625, 0.10344696044921875, 0.112030029296875, 0.12061309814453125, 0.1291961669921875, 0.13777923583984375, 0.1463623046875, 0.15494537353515625, 0.1635284423828125, 0.17211151123046875, 0.180694580078125, 0.18927764892578125, 0.1978607177734375, 0.20644378662109375, 0.21502685546875, 0.22360992431640625, 0.2321929931640625, 0.24077606201171875, 0.249359130859375, 0.25794219970703125, 0.2665252685546875, 0.27510833740234375, 0.28369140625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 0.0, 3.0, 10.0, 11.0, 15.0, 28.0, 33.0, 41.0, 43.0, 68.0, 101.0, 106.0, 175.0, 224.0, 286.0, 429.0, 589.0, 528.0, 403.0, 253.0, 189.0, 139.0, 97.0, 93.0, 48.0, 47.0, 31.0, 28.0, 13.0, 8.0, 5.0, 8.0, 4.0, 7.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10919189453125, -0.10540485382080078, -0.10161781311035156, -0.09783077239990234, -0.09404373168945312, -0.0902566909790039, -0.08646965026855469, -0.08268260955810547, -0.07889556884765625, -0.07510852813720703, -0.07132148742675781, -0.0675344467163086, -0.06374740600585938, -0.059960365295410156, -0.05617332458496094, -0.05238628387451172, -0.0485992431640625, -0.04481220245361328, -0.04102516174316406, -0.037238121032714844, -0.033451080322265625, -0.029664039611816406, -0.025876998901367188, -0.02208995819091797, -0.01830291748046875, -0.014515876770019531, -0.010728836059570312, -0.006941795349121094, -0.003154754638671875, 0.0006322860717773438, 0.0044193267822265625, 0.008206367492675781, 0.011993408203125, 0.01578044891357422, 0.019567489624023438, 0.023354530334472656, 0.027141571044921875, 0.030928611755371094, 0.03471565246582031, 0.03850269317626953, 0.04228973388671875, 0.04607677459716797, 0.04986381530761719, 0.053650856018066406, 0.057437896728515625, 0.061224937438964844, 0.06501197814941406, 0.06879901885986328, 0.0725860595703125, 0.07637310028076172, 0.08016014099121094, 0.08394718170166016, 0.08773422241210938, 0.0915212631225586, 0.09530830383300781, 0.09909534454345703, 0.10288238525390625, 0.10666942596435547, 0.11045646667480469, 0.1142435073852539, 0.11803054809570312, 0.12181758880615234, 0.12560462951660156, 0.12939167022705078, 0.1331787109375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 9.0, 54.0, 112.0, 236.0, 315.0, 168.0, 68.0, 20.0, 12.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.037745714187622, -2.979569911956787, -2.921393871307373, -2.863218069076538, -2.805042266845703, -2.746866226196289, -2.688690423965454, -2.630514621734619, -2.572338581085205, -2.51416277885437, -2.455986738204956, -2.397810935974121, -2.339635133743286, -2.281459331512451, -2.223283290863037, -2.165107488632202, -2.106931686401367, -2.0487558841705322, -1.9905799627304077, -1.9324040412902832, -1.8742282390594482, -1.8160523176193237, -1.7578763961791992, -1.6997005939483643, -1.6415246725082397, -1.5833487510681152, -1.5251729488372803, -1.4669970273971558, -1.4088211059570312, -1.3506453037261963, -1.2924693822860718, -1.2342934608459473, -1.1761176586151123, -1.1179417371749878, -1.0597659349441528, -1.0015900135040283, -0.9434141516685486, -0.8852382898330688, -0.8270623683929443, -0.7688865065574646, -0.7107106447219849, -0.6525347828865051, -0.5943589210510254, -0.5361829996109009, -0.47800713777542114, -0.4198312759399414, -0.3616553843021393, -0.30347949266433716, -0.24530363082885742, -0.1871277540922165, -0.12895187735557556, -0.07077600061893463, -0.012600123882293701, 0.045575737953186035, 0.10375162959098816, 0.16192752122879028, 0.22010338306427002, 0.27827924489974976, 0.3364551365375519, 0.394631028175354, 0.45280689001083374, 0.5109827518463135, 0.569158673286438, 0.6273345351219177, 0.6855103969573975]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 4.0, 12.0, 7.0, 11.0, 9.0, 15.0, 13.0, 31.0, 26.0, 37.0, 49.0, 44.0, 54.0, 62.0, 63.0, 59.0, 63.0, 58.0, 46.0, 56.0, 37.0, 50.0, 48.0, 30.0, 21.0, 29.0, 19.0, 16.0, 11.0, 13.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3577038645744324, -0.3420743942260742, -0.3264448940753937, -0.3108154237270355, -0.295185923576355, -0.2795564532279968, -0.26392698287963867, -0.24829748272895813, -0.23266799747943878, -0.21703851222991943, -0.20140902698040009, -0.18577954173088074, -0.17015007138252258, -0.15452057123184204, -0.1388911008834839, -0.12326161563396454, -0.10763213038444519, -0.09200264513492584, -0.0763731598854065, -0.06074368208646774, -0.045114196836948395, -0.029484711587429047, -0.013855233788490295, 0.0017742514610290527, 0.0174037367105484, 0.03303322196006775, 0.0486627034842968, 0.06429218500852585, 0.0799216702580452, 0.09555115550756454, 0.1111806333065033, 0.12681011855602264, 0.142439603805542, 0.15806908905506134, 0.1736985743045807, 0.18932804465293884, 0.20495754480361938, 0.22058701515197754, 0.2362165004014969, 0.25184598565101624, 0.2674754858016968, 0.28310495615005493, 0.2987344563007355, 0.31436392664909363, 0.32999342679977417, 0.3456228971481323, 0.3612523674964905, 0.376881867647171, 0.3925113379955292, 0.40814080834388733, 0.42377030849456787, 0.439399778842926, 0.45502927899360657, 0.4706587493419647, 0.48628824949264526, 0.5019177198410034, 0.5175471901893616, 0.5331766605377197, 0.5488061308860779, 0.5644356608390808, 0.580065131187439, 0.5956946015357971, 0.6113240718841553, 0.6269536018371582, 0.6425830721855164]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 9.0, 5.0, 6.0, 5.0, 13.0, 12.0, 17.0, 30.0, 35.0, 67.0, 108.0, 165.0, 267.0, 501.0, 1135.0, 2276.0, 5620.0, 14710.0, 44575.0, 160968.0, 452710.0, 259598.0, 69897.0, 21988.0, 7673.0, 3199.0, 1397.0, 648.0, 363.0, 183.0, 128.0, 70.0, 55.0, 33.0, 23.0, 21.0, 13.0, 8.0, 6.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25439453125, -0.24520492553710938, -0.23601531982421875, -0.22682571411132812, -0.2176361083984375, -0.20844650268554688, -0.19925689697265625, -0.19006729125976562, -0.180877685546875, -0.17168807983398438, -0.16249847412109375, -0.15330886840820312, -0.1441192626953125, -0.13492965698242188, -0.12574005126953125, -0.11655044555664062, -0.10736083984375, -0.09817123413085938, -0.08898162841796875, -0.07979202270507812, -0.0706024169921875, -0.061412811279296875, -0.05222320556640625, -0.043033599853515625, -0.033843994140625, -0.024654388427734375, -0.01546478271484375, -0.006275177001953125, 0.0029144287109375, 0.012104034423828125, 0.02129364013671875, 0.030483245849609375, 0.0396728515625, 0.048862457275390625, 0.05805206298828125, 0.06724166870117188, 0.0764312744140625, 0.08562088012695312, 0.09481048583984375, 0.10400009155273438, 0.113189697265625, 0.12237930297851562, 0.13156890869140625, 0.14075851440429688, 0.1499481201171875, 0.15913772583007812, 0.16832733154296875, 0.17751693725585938, 0.18670654296875, 0.19589614868164062, 0.20508575439453125, 0.21427536010742188, 0.2234649658203125, 0.23265457153320312, 0.24184417724609375, 0.2510337829589844, 0.260223388671875, 0.2694129943847656, 0.27860260009765625, 0.2877922058105469, 0.2969818115234375, 0.3061714172363281, 0.31536102294921875, 0.3245506286621094, 0.333740234375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 6.0, 5.0, 9.0, 8.0, 9.0, 11.0, 25.0, 34.0, 51.0, 55.0, 45.0, 49.0, 61.0, 67.0, 66.0, 56.0, 50.0, 61.0, 66.0, 52.0, 50.0, 40.0, 32.0, 29.0, 16.0, 16.0, 9.0, 6.0, 9.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052154541015625, -0.05016279220581055, -0.048171043395996094, -0.04617929458618164, -0.04418754577636719, -0.042195796966552734, -0.04020404815673828, -0.03821229934692383, -0.036220550537109375, -0.03422880172729492, -0.03223705291748047, -0.030245304107666016, -0.028253555297851562, -0.02626180648803711, -0.024270057678222656, -0.022278308868408203, -0.02028656005859375, -0.018294811248779297, -0.016303062438964844, -0.01431131362915039, -0.012319564819335938, -0.010327816009521484, -0.008336067199707031, -0.006344318389892578, -0.004352569580078125, -0.002360820770263672, -0.00036907196044921875, 0.0016226768493652344, 0.0036144256591796875, 0.005606174468994141, 0.007597923278808594, 0.009589672088623047, 0.0115814208984375, 0.013573169708251953, 0.015564918518066406, 0.01755666732788086, 0.019548416137695312, 0.021540164947509766, 0.02353191375732422, 0.025523662567138672, 0.027515411376953125, 0.029507160186767578, 0.03149890899658203, 0.033490657806396484, 0.03548240661621094, 0.03747415542602539, 0.039465904235839844, 0.0414576530456543, 0.04344940185546875, 0.0454411506652832, 0.047432899475097656, 0.04942464828491211, 0.05141639709472656, 0.053408145904541016, 0.05539989471435547, 0.05739164352416992, 0.059383392333984375, 0.06137514114379883, 0.06336688995361328, 0.06535863876342773, 0.06735038757324219, 0.06934213638305664, 0.0713338851928711, 0.07332563400268555, 0.0753173828125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 3.0, 5.0, 7.0, 9.0, 16.0, 14.0, 19.0, 29.0, 38.0, 40.0, 54.0, 113.0, 162.0, 232.0, 353.0, 619.0, 1177.0, 2701.0, 8254.0, 35490.0, 212471.0, 602449.0, 147096.0, 26014.0, 6568.0, 2121.0, 956.0, 508.0, 306.0, 193.0, 141.0, 115.0, 77.0, 56.0, 38.0, 33.0, 14.0, 17.0, 14.0, 16.0, 7.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.360595703125, -0.3483314514160156, -0.33606719970703125, -0.3238029479980469, -0.3115386962890625, -0.2992744445800781, -0.28701019287109375, -0.2747459411621094, -0.262481689453125, -0.2502174377441406, -0.23795318603515625, -0.22568893432617188, -0.2134246826171875, -0.20116043090820312, -0.18889617919921875, -0.17663192749023438, -0.16436767578125, -0.15210342407226562, -0.13983917236328125, -0.12757492065429688, -0.1153106689453125, -0.10304641723632812, -0.09078216552734375, -0.07851791381835938, -0.066253662109375, -0.053989410400390625, -0.04172515869140625, -0.029460906982421875, -0.0171966552734375, -0.004932403564453125, 0.00733184814453125, 0.019596099853515625, 0.0318603515625, 0.044124603271484375, 0.05638885498046875, 0.06865310668945312, 0.0809173583984375, 0.09318161010742188, 0.10544586181640625, 0.11771011352539062, 0.129974365234375, 0.14223861694335938, 0.15450286865234375, 0.16676712036132812, 0.1790313720703125, 0.19129562377929688, 0.20355987548828125, 0.21582412719726562, 0.22808837890625, 0.24035263061523438, 0.25261688232421875, 0.2648811340332031, 0.2771453857421875, 0.2894096374511719, 0.30167388916015625, 0.3139381408691406, 0.326202392578125, 0.3384666442871094, 0.35073089599609375, 0.3629951477050781, 0.3752593994140625, 0.3875236511230469, 0.39978790283203125, 0.4120521545410156, 0.42431640625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 6.0, 0.0, 9.0, 5.0, 5.0, 8.0, 11.0, 20.0, 8.0, 16.0, 21.0, 21.0, 20.0, 31.0, 31.0, 28.0, 38.0, 42.0, 29.0, 43.0, 35.0, 39.0, 43.0, 56.0, 48.0, 36.0, 33.0, 38.0, 33.0, 27.0, 34.0, 33.0, 24.0, 17.0, 20.0, 13.0, 15.0, 14.0, 17.0, 8.0, 8.0, 10.0, 5.0, 3.0, 2.0, 1.0, 0.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10076904296875, -0.09700298309326172, -0.09323692321777344, -0.08947086334228516, -0.08570480346679688, -0.0819387435913086, -0.07817268371582031, -0.07440662384033203, -0.07064056396484375, -0.06687450408935547, -0.06310844421386719, -0.059342384338378906, -0.055576324462890625, -0.051810264587402344, -0.04804420471191406, -0.04427814483642578, -0.0405120849609375, -0.03674602508544922, -0.03297996520996094, -0.029213905334472656, -0.025447845458984375, -0.021681785583496094, -0.017915725708007812, -0.014149665832519531, -0.01038360595703125, -0.006617546081542969, -0.0028514862060546875, 0.0009145736694335938, 0.004680633544921875, 0.008446693420410156, 0.012212753295898438, 0.01597881317138672, 0.019744873046875, 0.02351093292236328, 0.027276992797851562, 0.031043052673339844, 0.034809112548828125, 0.038575172424316406, 0.04234123229980469, 0.04610729217529297, 0.04987335205078125, 0.05363941192626953, 0.05740547180175781, 0.061171531677246094, 0.06493759155273438, 0.06870365142822266, 0.07246971130371094, 0.07623577117919922, 0.0800018310546875, 0.08376789093017578, 0.08753395080566406, 0.09130001068115234, 0.09506607055664062, 0.0988321304321289, 0.10259819030761719, 0.10636425018310547, 0.11013031005859375, 0.11389636993408203, 0.11766242980957031, 0.1214284896850586, 0.12519454956054688, 0.12896060943603516, 0.13272666931152344, 0.13649272918701172, 0.1402587890625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 8.0, 5.0, 8.0, 18.0, 20.0, 30.0, 37.0, 58.0, 92.0, 114.0, 173.0, 290.0, 480.0, 903.0, 1836.0, 4252.0, 11792.0, 41450.0, 235707.0, 579726.0, 129847.0, 26578.0, 8392.0, 3188.0, 1559.0, 813.0, 428.0, 217.0, 167.0, 114.0, 66.0, 49.0, 31.0, 33.0, 21.0, 13.0, 16.0, 6.0, 5.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1260986328125, -0.12220001220703125, -0.1183013916015625, -0.11440277099609375, -0.110504150390625, -0.10660552978515625, -0.1027069091796875, -0.09880828857421875, -0.09490966796875, -0.09101104736328125, -0.0871124267578125, -0.08321380615234375, -0.079315185546875, -0.07541656494140625, -0.0715179443359375, -0.06761932373046875, -0.063720703125, -0.05982208251953125, -0.0559234619140625, -0.05202484130859375, -0.048126220703125, -0.04422760009765625, -0.0403289794921875, -0.03643035888671875, -0.03253173828125, -0.02863311767578125, -0.0247344970703125, -0.02083587646484375, -0.016937255859375, -0.01303863525390625, -0.0091400146484375, -0.00524139404296875, -0.0013427734375, 0.00255584716796875, 0.0064544677734375, 0.01035308837890625, 0.014251708984375, 0.01815032958984375, 0.0220489501953125, 0.02594757080078125, 0.02984619140625, 0.03374481201171875, 0.0376434326171875, 0.04154205322265625, 0.045440673828125, 0.04933929443359375, 0.0532379150390625, 0.05713653564453125, 0.06103515625, 0.06493377685546875, 0.0688323974609375, 0.07273101806640625, 0.076629638671875, 0.08052825927734375, 0.0844268798828125, 0.08832550048828125, 0.09222412109375, 0.09612274169921875, 0.1000213623046875, 0.10391998291015625, 0.107818603515625, 0.11171722412109375, 0.1156158447265625, 0.11951446533203125, 0.1234130859375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 11.0, 6.0, 19.0, 35.0, 54.0, 115.0, 153.0, 195.0, 157.0, 110.0, 66.0, 34.0, 13.0, 14.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.485513687133789e-05, -2.388283610343933e-05, -2.291053533554077e-05, -2.1938234567642212e-05, -2.0965933799743652e-05, -1.9993633031845093e-05, -1.9021332263946533e-05, -1.8049031496047974e-05, -1.7076730728149414e-05, -1.6104429960250854e-05, -1.5132129192352295e-05, -1.4159828424453735e-05, -1.3187527656555176e-05, -1.2215226888656616e-05, -1.1242926120758057e-05, -1.0270625352859497e-05, -9.298324584960938e-06, -8.326023817062378e-06, -7.353723049163818e-06, -6.381422281265259e-06, -5.409121513366699e-06, -4.43682074546814e-06, -3.46451997756958e-06, -2.4922192096710205e-06, -1.519918441772461e-06, -5.476176738739014e-07, 4.246830940246582e-07, 1.3969838619232178e-06, 2.3692846298217773e-06, 3.341585397720337e-06, 4.3138861656188965e-06, 5.286186933517456e-06, 6.258487701416016e-06, 7.230788469314575e-06, 8.203089237213135e-06, 9.175390005111694e-06, 1.0147690773010254e-05, 1.1119991540908813e-05, 1.2092292308807373e-05, 1.3064593076705933e-05, 1.4036893844604492e-05, 1.5009194612503052e-05, 1.598149538040161e-05, 1.695379614830017e-05, 1.792609691619873e-05, 1.889839768409729e-05, 1.987069845199585e-05, 2.084299921989441e-05, 2.181529998779297e-05, 2.278760075569153e-05, 2.3759901523590088e-05, 2.4732202291488647e-05, 2.5704503059387207e-05, 2.6676803827285767e-05, 2.7649104595184326e-05, 2.8621405363082886e-05, 2.9593706130981445e-05, 3.0566006898880005e-05, 3.1538307666778564e-05, 3.2510608434677124e-05, 3.3482909202575684e-05, 3.445520997047424e-05, 3.54275107383728e-05, 3.639981150627136e-05, 3.737211227416992e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 6.0, 1.0, 5.0, 2.0, 11.0, 21.0, 20.0, 35.0, 81.0, 148.0, 279.0, 595.0, 1789.0, 10595.0, 275213.0, 735302.0, 20263.0, 2745.0, 765.0, 311.0, 154.0, 94.0, 38.0, 31.0, 22.0, 8.0, 5.0, 6.0, 5.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2415771484375, -0.23113441467285156, -0.22069168090820312, -0.2102489471435547, -0.19980621337890625, -0.1893634796142578, -0.17892074584960938, -0.16847801208496094, -0.1580352783203125, -0.14759254455566406, -0.13714981079101562, -0.1267070770263672, -0.11626434326171875, -0.10582160949707031, -0.09537887573242188, -0.08493614196777344, -0.074493408203125, -0.06405067443847656, -0.053607940673828125, -0.04316520690917969, -0.03272247314453125, -0.022279739379882812, -0.011837005615234375, -0.0013942718505859375, 0.0090484619140625, 0.019491195678710938, 0.029933929443359375, 0.04037666320800781, 0.05081939697265625, 0.06126213073730469, 0.07170486450195312, 0.08214759826660156, 0.09259033203125, 0.10303306579589844, 0.11347579956054688, 0.12391853332519531, 0.13436126708984375, 0.1448040008544922, 0.15524673461914062, 0.16568946838378906, 0.1761322021484375, 0.18657493591308594, 0.19701766967773438, 0.2074604034423828, 0.21790313720703125, 0.2283458709716797, 0.23878860473632812, 0.24923133850097656, 0.259674072265625, 0.27011680603027344, 0.2805595397949219, 0.2910022735595703, 0.30144500732421875, 0.3118877410888672, 0.3223304748535156, 0.33277320861816406, 0.3432159423828125, 0.35365867614746094, 0.3641014099121094, 0.3745441436767578, 0.38498687744140625, 0.3954296112060547, 0.4058723449707031, 0.41631507873535156, 0.4267578125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 0.0, 8.0, 3.0, 7.0, 5.0, 10.0, 9.0, 10.0, 14.0, 14.0, 29.0, 36.0, 28.0, 43.0, 39.0, 49.0, 56.0, 64.0, 68.0, 78.0, 80.0, 64.0, 44.0, 52.0, 35.0, 26.0, 28.0, 14.0, 13.0, 12.0, 14.0, 16.0, 5.0, 5.0, 8.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04052734375, -0.03913116455078125, -0.0377349853515625, -0.03633880615234375, -0.034942626953125, -0.03354644775390625, -0.0321502685546875, -0.03075408935546875, -0.02935791015625, -0.02796173095703125, -0.0265655517578125, -0.02516937255859375, -0.023773193359375, -0.02237701416015625, -0.0209808349609375, -0.01958465576171875, -0.0181884765625, -0.01679229736328125, -0.0153961181640625, -0.01399993896484375, -0.012603759765625, -0.01120758056640625, -0.0098114013671875, -0.00841522216796875, -0.00701904296875, -0.00562286376953125, -0.0042266845703125, -0.00283050537109375, -0.001434326171875, -3.814697265625e-05, 0.0013580322265625, 0.00275421142578125, 0.004150390625, 0.00554656982421875, 0.0069427490234375, 0.00833892822265625, 0.009735107421875, 0.01113128662109375, 0.0125274658203125, 0.01392364501953125, 0.01531982421875, 0.01671600341796875, 0.0181121826171875, 0.01950836181640625, 0.020904541015625, 0.02230072021484375, 0.0236968994140625, 0.02509307861328125, 0.0264892578125, 0.02788543701171875, 0.0292816162109375, 0.03067779541015625, 0.032073974609375, 0.03347015380859375, 0.0348663330078125, 0.03626251220703125, 0.03765869140625, 0.03905487060546875, 0.0404510498046875, 0.04184722900390625, 0.043243408203125, 0.04463958740234375, 0.0460357666015625, 0.04743194580078125, 0.048828125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 4.0, 4.0, 7.0, 17.0, 34.0, 41.0, 49.0, 80.0, 97.0, 118.0, 117.0, 115.0, 91.0, 64.0, 44.0, 34.0, 24.0, 11.0, 13.0, 8.0, 7.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.613517165184021, -0.593284547328949, -0.5730518698692322, -0.5528192520141602, -0.5325866341590881, -0.5123539566993713, -0.4921213388442993, -0.4718886911869049, -0.4516560435295105, -0.4314233958721161, -0.41119077801704407, -0.39095813035964966, -0.37072548270225525, -0.35049283504486084, -0.3302602171897888, -0.3100275695323944, -0.2897949516773224, -0.269562304019928, -0.24932967126369476, -0.22909703850746155, -0.20886439085006714, -0.18863175809383392, -0.1683991253376007, -0.1481664776802063, -0.12793384492397308, -0.10770120471715927, -0.08746856451034546, -0.06723593175411224, -0.04700329154729843, -0.02677065134048462, -0.006538018584251404, 0.013694629073143005, 0.03392726182937622, 0.05415990203619003, 0.07439254224300385, 0.09462517499923706, 0.11485781520605087, 0.13509045541286469, 0.1553230881690979, 0.1755557358264923, 0.19578836858272552, 0.21602100133895874, 0.23625364899635315, 0.25648629665374756, 0.2767189145088196, 0.296951562166214, 0.3171842098236084, 0.3374168276786804, 0.35764947533607483, 0.37788212299346924, 0.39811474084854126, 0.41834738850593567, 0.4385800361633301, 0.4588126540184021, 0.4790453016757965, 0.4992779493331909, 0.5195105671882629, 0.539743185043335, 0.5599758625030518, 0.5802084803581238, 0.6004410982131958, 0.6206737756729126, 0.6409063935279846, 0.6611390113830566, 0.6813716888427734]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 9.0, 9.0, 18.0, 15.0, 19.0, 19.0, 18.0, 18.0, 24.0, 27.0, 27.0, 33.0, 33.0, 35.0, 47.0, 43.0, 56.0, 39.0, 48.0, 46.0, 33.0, 47.0, 46.0, 31.0, 36.0, 40.0, 24.0, 29.0, 11.0, 17.0, 17.0, 18.0, 17.0, 12.0, 9.0, 5.0, 7.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32443588972091675, -0.31215420365333557, -0.2998725175857544, -0.28759080171585083, -0.27530911564826965, -0.2630274295806885, -0.2507457435131073, -0.23846404254436493, -0.22618234157562256, -0.21390065550804138, -0.201618954539299, -0.18933726847171783, -0.17705556750297546, -0.1647738814353943, -0.1524921953678131, -0.14021049439907074, -0.12792880833148956, -0.11564711481332779, -0.10336542129516602, -0.09108373522758484, -0.07880203425884247, -0.06652034819126129, -0.05423865467309952, -0.041956961154937744, -0.02967526763677597, -0.017393574118614197, -0.005111882463097572, 0.007169809192419052, 0.019451502710580826, 0.0317331962287426, 0.044014886021614075, 0.05629657953977585, 0.06857827305793762, 0.0808599665760994, 0.09314166009426117, 0.10542334616184235, 0.11770504713058472, 0.1299867331981659, 0.14226841926574707, 0.15455012023448944, 0.1668318212032318, 0.179113507270813, 0.19139520823955536, 0.20367689430713654, 0.2159585952758789, 0.22824028134346008, 0.24052196741104126, 0.2528036832809448, 0.2650853395462036, 0.2773670256137848, 0.28964871168136597, 0.30193042755126953, 0.3142121136188507, 0.3264937996864319, 0.33877548575401306, 0.35105717182159424, 0.3633388876914978, 0.375620573759079, 0.38790225982666016, 0.4001839756965637, 0.4124656617641449, 0.4247473478317261, 0.43702903389930725, 0.4493107199668884, 0.461592435836792]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 6.0, 6.0, 10.0, 20.0, 27.0, 66.0, 119.0, 246.0, 560.0, 1409.0, 4861.0, 21385.0, 133924.0, 3235440.0, 719802.0, 59266.0, 11969.0, 3194.0, 1092.0, 430.0, 231.0, 100.0, 56.0, 32.0, 17.0, 5.0, 9.0, 6.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29638671875, -0.2870635986328125, -0.277740478515625, -0.2684173583984375, -0.25909423828125, -0.2497711181640625, -0.240447998046875, -0.2311248779296875, -0.2218017578125, -0.2124786376953125, -0.203155517578125, -0.1938323974609375, -0.18450927734375, -0.1751861572265625, -0.165863037109375, -0.1565399169921875, -0.147216796875, -0.1378936767578125, -0.128570556640625, -0.1192474365234375, -0.10992431640625, -0.1006011962890625, -0.091278076171875, -0.0819549560546875, -0.0726318359375, -0.0633087158203125, -0.053985595703125, -0.0446624755859375, -0.03533935546875, -0.0260162353515625, -0.016693115234375, -0.0073699951171875, 0.001953125, 0.0112762451171875, 0.020599365234375, 0.0299224853515625, 0.03924560546875, 0.0485687255859375, 0.057891845703125, 0.0672149658203125, 0.0765380859375, 0.0858612060546875, 0.095184326171875, 0.1045074462890625, 0.11383056640625, 0.1231536865234375, 0.132476806640625, 0.1417999267578125, 0.151123046875, 0.1604461669921875, 0.169769287109375, 0.1790924072265625, 0.18841552734375, 0.1977386474609375, 0.207061767578125, 0.2163848876953125, 0.2257080078125, 0.2350311279296875, 0.244354248046875, 0.2536773681640625, 0.26300048828125, 0.2723236083984375, 0.281646728515625, 0.2909698486328125, 0.30029296875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 5.0, 7.0, 8.0, 14.0, 23.0, 38.0, 35.0, 37.0, 50.0, 49.0, 60.0, 56.0, 61.0, 61.0, 73.0, 62.0, 68.0, 44.0, 47.0, 47.0, 45.0, 26.0, 17.0, 18.0, 12.0, 15.0, 10.0, 5.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06280517578125, -0.06077098846435547, -0.05873680114746094, -0.056702613830566406, -0.054668426513671875, -0.052634239196777344, -0.05060005187988281, -0.04856586456298828, -0.04653167724609375, -0.04449748992919922, -0.04246330261230469, -0.040429115295410156, -0.038394927978515625, -0.036360740661621094, -0.03432655334472656, -0.03229236602783203, -0.0302581787109375, -0.02822399139404297, -0.026189804077148438, -0.024155616760253906, -0.022121429443359375, -0.020087242126464844, -0.018053054809570312, -0.01601886749267578, -0.01398468017578125, -0.011950492858886719, -0.009916305541992188, -0.007882118225097656, -0.005847930908203125, -0.0038137435913085938, -0.0017795562744140625, 0.00025463104248046875, 0.002288818359375, 0.004323005676269531, 0.0063571929931640625, 0.008391380310058594, 0.010425567626953125, 0.012459754943847656, 0.014493942260742188, 0.01652812957763672, 0.01856231689453125, 0.02059650421142578, 0.022630691528320312, 0.024664878845214844, 0.026699066162109375, 0.028733253479003906, 0.030767440795898438, 0.03280162811279297, 0.0348358154296875, 0.03687000274658203, 0.03890419006347656, 0.040938377380371094, 0.042972564697265625, 0.045006752014160156, 0.04704093933105469, 0.04907512664794922, 0.05110931396484375, 0.05314350128173828, 0.05517768859863281, 0.057211875915527344, 0.059246063232421875, 0.061280250549316406, 0.06331443786621094, 0.06534862518310547, 0.0673828125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 5.0, 8.0, 23.0, 29.0, 72.0, 102.0, 177.0, 275.0, 614.0, 1305.0, 3949.0, 19902.0, 253541.0, 3678795.0, 211969.0, 17518.0, 3633.0, 1216.0, 534.0, 267.0, 159.0, 69.0, 44.0, 29.0, 15.0, 11.0, 5.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.428955078125, -0.4157447814941406, -0.40253448486328125, -0.3893241882324219, -0.3761138916015625, -0.3629035949707031, -0.34969329833984375, -0.3364830017089844, -0.323272705078125, -0.3100624084472656, -0.29685211181640625, -0.2836418151855469, -0.2704315185546875, -0.2572212219238281, -0.24401092529296875, -0.23080062866210938, -0.21759033203125, -0.20438003540039062, -0.19116973876953125, -0.17795944213867188, -0.1647491455078125, -0.15153884887695312, -0.13832855224609375, -0.12511825561523438, -0.111907958984375, -0.09869766235351562, -0.08548736572265625, -0.07227706909179688, -0.0590667724609375, -0.045856475830078125, -0.03264617919921875, -0.019435882568359375, -0.0062255859375, 0.006984710693359375, 0.02019500732421875, 0.033405303955078125, 0.0466156005859375, 0.059825897216796875, 0.07303619384765625, 0.08624649047851562, 0.099456787109375, 0.11266708374023438, 0.12587738037109375, 0.13908767700195312, 0.1522979736328125, 0.16550827026367188, 0.17871856689453125, 0.19192886352539062, 0.20513916015625, 0.21834945678710938, 0.23155975341796875, 0.24477005004882812, 0.2579803466796875, 0.2711906433105469, 0.28440093994140625, 0.2976112365722656, 0.310821533203125, 0.3240318298339844, 0.33724212646484375, 0.3504524230957031, 0.3636627197265625, 0.3768730163574219, 0.39008331298828125, 0.4032936096191406, 0.41650390625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 9.0, 5.0, 7.0, 9.0, 14.0, 17.0, 20.0, 27.0, 50.0, 65.0, 117.0, 144.0, 209.0, 300.0, 505.0, 765.0, 679.0, 361.0, 223.0, 136.0, 132.0, 87.0, 54.0, 36.0, 34.0, 21.0, 17.0, 12.0, 9.0, 9.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.18896484375, -0.1844320297241211, -0.1798992156982422, -0.17536640167236328, -0.17083358764648438, -0.16630077362060547, -0.16176795959472656, -0.15723514556884766, -0.15270233154296875, -0.14816951751708984, -0.14363670349121094, -0.13910388946533203, -0.13457107543945312, -0.13003826141357422, -0.1255054473876953, -0.1209726333618164, -0.1164398193359375, -0.1119070053100586, -0.10737419128417969, -0.10284137725830078, -0.09830856323242188, -0.09377574920654297, -0.08924293518066406, -0.08471012115478516, -0.08017730712890625, -0.07564449310302734, -0.07111167907714844, -0.06657886505126953, -0.062046051025390625, -0.05751323699951172, -0.05298042297363281, -0.048447608947753906, -0.043914794921875, -0.039381980895996094, -0.03484916687011719, -0.03031635284423828, -0.025783538818359375, -0.02125072479248047, -0.016717910766601562, -0.012185096740722656, -0.00765228271484375, -0.0031194686889648438, 0.0014133453369140625, 0.005946159362792969, 0.010478973388671875, 0.015011787414550781, 0.019544601440429688, 0.024077415466308594, 0.0286102294921875, 0.033143043518066406, 0.03767585754394531, 0.04220867156982422, 0.046741485595703125, 0.05127429962158203, 0.05580711364746094, 0.060339927673339844, 0.06487274169921875, 0.06940555572509766, 0.07393836975097656, 0.07847118377685547, 0.08300399780273438, 0.08753681182861328, 0.09206962585449219, 0.0966024398803711, 0.10113525390625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 23.0, 63.0, 130.0, 329.0, 277.0, 107.0, 45.0, 15.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1658518314361572, -2.100003719329834, -2.0341556072235107, -1.9683074951171875, -1.9024595022201538, -1.8366113901138306, -1.7707632780075073, -1.704915165901184, -1.6390671730041504, -1.5732190608978271, -1.507370948791504, -1.4415228366851807, -1.375674843788147, -1.3098267316818237, -1.2439786195755005, -1.1781305074691772, -1.112282395362854, -1.0464342832565308, -0.9805862307548523, -0.914738118648529, -0.8488900661468506, -0.7830419540405273, -0.7171938419342041, -0.6513457298278809, -0.5854976773262024, -0.5196495652198792, -0.4538015127182007, -0.38795340061187744, -0.3221053183078766, -0.25625723600387573, -0.1904091238975525, -0.12456104159355164, -0.05871295928955078, 0.00713513046503067, 0.07298322021961212, 0.13883131742477417, 0.20467939972877502, 0.2705274820327759, 0.3363755941390991, 0.4022236764431, 0.46807175874710083, 0.5339198708534241, 0.5997679233551025, 0.6656160354614258, 0.731464147567749, 0.7973122000694275, 0.8631603121757507, 0.9290083646774292, 0.9948564767837524, 1.0607045888900757, 1.126552700996399, 1.1924006938934326, 1.2582488059997559, 1.324096918106079, 1.3899450302124023, 1.4557931423187256, 1.5216412544250488, 1.587489366531372, 1.6533374786376953, 1.7191855907440186, 1.7850335836410522, 1.8508816957473755, 1.9167298078536987, 1.982577919960022, 2.0484259128570557]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 3.0, 3.0, 5.0, 14.0, 18.0, 21.0, 25.0, 23.0, 35.0, 44.0, 49.0, 67.0, 54.0, 72.0, 69.0, 70.0, 55.0, 49.0, 54.0, 49.0, 45.0, 38.0, 32.0, 27.0, 21.0, 20.0, 12.0, 8.0, 4.0, 5.0, 3.0, 3.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5232751369476318, -0.5064801573753357, -0.48968514800071716, -0.47289013862609863, -0.4560951590538025, -0.43930017948150635, -0.4225051701068878, -0.4057101607322693, -0.38891518115997314, -0.372120201587677, -0.35532519221305847, -0.33853018283843994, -0.3217352032661438, -0.30494022369384766, -0.2881452143192291, -0.2713502049446106, -0.25455522537231445, -0.23776023089885712, -0.22096523642539978, -0.20417024195194244, -0.1873752474784851, -0.17058025300502777, -0.15378525853157043, -0.1369902640581131, -0.12019526958465576, -0.10340027511119843, -0.08660528063774109, -0.06981028616428375, -0.053015291690826416, -0.03622029721736908, -0.019425302743911743, -0.0026303082704544067, 0.014164745807647705, 0.03095974028110504, 0.04775473475456238, 0.06454972922801971, 0.08134472370147705, 0.09813971817493439, 0.11493471264839172, 0.13172970712184906, 0.1485247015953064, 0.16531969606876373, 0.18211469054222107, 0.1989096850156784, 0.21570467948913574, 0.23249967396259308, 0.24929466843605042, 0.26608967781066895, 0.2828846573829651, 0.29967963695526123, 0.31647464632987976, 0.3332696557044983, 0.35006463527679443, 0.3668596148490906, 0.3836546242237091, 0.40044963359832764, 0.4172446131706238, 0.4340395927429199, 0.45083460211753845, 0.467629611492157, 0.4844245910644531, 0.5012195706367493, 0.5180145502090454, 0.5348095893859863, 0.5516045689582825]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 8.0, 8.0, 13.0, 18.0, 26.0, 32.0, 31.0, 43.0, 82.0, 134.0, 167.0, 303.0, 448.0, 791.0, 1620.0, 3604.0, 9051.0, 25751.0, 83563.0, 291127.0, 423458.0, 142531.0, 41845.0, 14034.0, 5154.0, 2141.0, 1022.0, 536.0, 324.0, 183.0, 156.0, 103.0, 69.0, 44.0, 39.0, 25.0, 10.0, 19.0, 13.0, 9.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.265380859375, -0.25762367248535156, -0.24986648559570312, -0.2421092987060547, -0.23435211181640625, -0.2265949249267578, -0.21883773803710938, -0.21108055114746094, -0.2033233642578125, -0.19556617736816406, -0.18780899047851562, -0.1800518035888672, -0.17229461669921875, -0.1645374298095703, -0.15678024291992188, -0.14902305603027344, -0.141265869140625, -0.13350868225097656, -0.12575149536132812, -0.11799430847167969, -0.11023712158203125, -0.10247993469238281, -0.09472274780273438, -0.08696556091308594, -0.0792083740234375, -0.07145118713378906, -0.06369400024414062, -0.05593681335449219, -0.04817962646484375, -0.04042243957519531, -0.032665252685546875, -0.024908065795898438, -0.01715087890625, -0.009393692016601562, -0.001636505126953125, 0.0061206817626953125, 0.01387786865234375, 0.021635055541992188, 0.029392242431640625, 0.03714942932128906, 0.0449066162109375, 0.05266380310058594, 0.060420989990234375, 0.06817817687988281, 0.07593536376953125, 0.08369255065917969, 0.09144973754882812, 0.09920692443847656, 0.106964111328125, 0.11472129821777344, 0.12247848510742188, 0.1302356719970703, 0.13799285888671875, 0.1457500457763672, 0.15350723266601562, 0.16126441955566406, 0.1690216064453125, 0.17677879333496094, 0.18453598022460938, 0.1922931671142578, 0.20005035400390625, 0.2078075408935547, 0.21556472778320312, 0.22332191467285156, 0.2310791015625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 9.0, 14.0, 21.0, 27.0, 47.0, 56.0, 52.0, 74.0, 73.0, 89.0, 90.0, 82.0, 80.0, 86.0, 62.0, 45.0, 28.0, 21.0, 14.0, 11.0, 10.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07977294921875, -0.07714176177978516, -0.07451057434082031, -0.07187938690185547, -0.06924819946289062, -0.06661701202392578, -0.06398582458496094, -0.061354637145996094, -0.05872344970703125, -0.056092262268066406, -0.05346107482910156, -0.05082988739013672, -0.048198699951171875, -0.04556751251220703, -0.04293632507324219, -0.040305137634277344, -0.0376739501953125, -0.035042762756347656, -0.03241157531738281, -0.02978038787841797, -0.027149200439453125, -0.02451801300048828, -0.021886825561523438, -0.019255638122558594, -0.01662445068359375, -0.013993263244628906, -0.011362075805664062, -0.008730888366699219, -0.006099700927734375, -0.0034685134887695312, -0.0008373260498046875, 0.0017938613891601562, 0.004425048828125, 0.007056236267089844, 0.009687423706054688, 0.012318611145019531, 0.014949798583984375, 0.01758098602294922, 0.020212173461914062, 0.022843360900878906, 0.02547454833984375, 0.028105735778808594, 0.030736923217773438, 0.03336811065673828, 0.035999298095703125, 0.03863048553466797, 0.04126167297363281, 0.043892860412597656, 0.0465240478515625, 0.049155235290527344, 0.05178642272949219, 0.05441761016845703, 0.057048797607421875, 0.05967998504638672, 0.06231117248535156, 0.0649423599243164, 0.06757354736328125, 0.0702047348022461, 0.07283592224121094, 0.07546710968017578, 0.07809829711914062, 0.08072948455810547, 0.08336067199707031, 0.08599185943603516, 0.088623046875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 11.0, 21.0, 28.0, 36.0, 63.0, 132.0, 217.0, 496.0, 1366.0, 4590.0, 16599.0, 78541.0, 440532.0, 411361.0, 72453.0, 15510.0, 4225.0, 1310.0, 499.0, 218.0, 119.0, 71.0, 45.0, 41.0, 16.0, 12.0, 14.0, 8.0, 3.0, 6.0, 2.0, 2.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30517578125, -0.2946434020996094, -0.28411102294921875, -0.2735786437988281, -0.2630462646484375, -0.2525138854980469, -0.24198150634765625, -0.23144912719726562, -0.220916748046875, -0.21038436889648438, -0.19985198974609375, -0.18931961059570312, -0.1787872314453125, -0.16825485229492188, -0.15772247314453125, -0.14719009399414062, -0.13665771484375, -0.12612533569335938, -0.11559295654296875, -0.10506057739257812, -0.0945281982421875, -0.08399581909179688, -0.07346343994140625, -0.06293106079101562, -0.052398681640625, -0.041866302490234375, -0.03133392333984375, -0.020801544189453125, -0.0102691650390625, 0.000263214111328125, 0.01079559326171875, 0.021327972412109375, 0.0318603515625, 0.042392730712890625, 0.05292510986328125, 0.06345748901367188, 0.0739898681640625, 0.08452224731445312, 0.09505462646484375, 0.10558700561523438, 0.116119384765625, 0.12665176391601562, 0.13718414306640625, 0.14771652221679688, 0.1582489013671875, 0.16878128051757812, 0.17931365966796875, 0.18984603881835938, 0.20037841796875, 0.21091079711914062, 0.22144317626953125, 0.23197555541992188, 0.2425079345703125, 0.2530403137207031, 0.26357269287109375, 0.2741050720214844, 0.284637451171875, 0.2951698303222656, 0.30570220947265625, 0.3162345886230469, 0.3267669677734375, 0.3372993469238281, 0.34783172607421875, 0.3583641052246094, 0.368896484375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 1.0, 3.0, 0.0, 4.0, 8.0, 4.0, 9.0, 12.0, 13.0, 13.0, 14.0, 18.0, 15.0, 25.0, 30.0, 30.0, 26.0, 39.0, 29.0, 35.0, 46.0, 39.0, 28.0, 34.0, 43.0, 31.0, 46.0, 49.0, 55.0, 32.0, 36.0, 34.0, 35.0, 23.0, 22.0, 19.0, 11.0, 21.0, 12.0, 16.0, 10.0, 10.0, 5.0, 4.0, 3.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.119140625, -0.11549091339111328, -0.11184120178222656, -0.10819149017333984, -0.10454177856445312, -0.1008920669555664, -0.09724235534667969, -0.09359264373779297, -0.08994293212890625, -0.08629322052001953, -0.08264350891113281, -0.0789937973022461, -0.07534408569335938, -0.07169437408447266, -0.06804466247558594, -0.06439495086669922, -0.0607452392578125, -0.05709552764892578, -0.05344581604003906, -0.049796104431152344, -0.046146392822265625, -0.042496681213378906, -0.03884696960449219, -0.03519725799560547, -0.03154754638671875, -0.02789783477783203, -0.024248123168945312, -0.020598411560058594, -0.016948699951171875, -0.013298988342285156, -0.009649276733398438, -0.005999565124511719, -0.002349853515625, 0.0012998580932617188, 0.0049495697021484375, 0.008599281311035156, 0.012248992919921875, 0.015898704528808594, 0.019548416137695312, 0.02319812774658203, 0.02684783935546875, 0.03049755096435547, 0.03414726257324219, 0.037796974182128906, 0.041446685791015625, 0.045096397399902344, 0.04874610900878906, 0.05239582061767578, 0.0560455322265625, 0.05969524383544922, 0.06334495544433594, 0.06699466705322266, 0.07064437866210938, 0.0742940902709961, 0.07794380187988281, 0.08159351348876953, 0.08524322509765625, 0.08889293670654297, 0.09254264831542969, 0.0961923599243164, 0.09984207153320312, 0.10349178314208984, 0.10714149475097656, 0.11079120635986328, 0.11444091796875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 2.0, 7.0, 10.0, 12.0, 24.0, 45.0, 87.0, 131.0, 259.0, 576.0, 1258.0, 3353.0, 11024.0, 52482.0, 418134.0, 481066.0, 61526.0, 12153.0, 3720.0, 1374.0, 655.0, 290.0, 141.0, 71.0, 57.0, 38.0, 19.0, 13.0, 9.0, 4.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.1749267578125, -0.17044639587402344, -0.16596603393554688, -0.1614856719970703, -0.15700531005859375, -0.1525249481201172, -0.14804458618164062, -0.14356422424316406, -0.1390838623046875, -0.13460350036621094, -0.13012313842773438, -0.1256427764892578, -0.12116241455078125, -0.11668205261230469, -0.11220169067382812, -0.10772132873535156, -0.103240966796875, -0.09876060485839844, -0.09428024291992188, -0.08979988098144531, -0.08531951904296875, -0.08083915710449219, -0.07635879516601562, -0.07187843322753906, -0.0673980712890625, -0.06291770935058594, -0.058437347412109375, -0.05395698547363281, -0.04947662353515625, -0.04499626159667969, -0.040515899658203125, -0.03603553771972656, -0.03155517578125, -0.027074813842773438, -0.022594451904296875, -0.018114089965820312, -0.01363372802734375, -0.009153366088867188, -0.004673004150390625, -0.0001926422119140625, 0.0042877197265625, 0.008768081665039062, 0.013248443603515625, 0.017728805541992188, 0.02220916748046875, 0.026689529418945312, 0.031169891357421875, 0.03565025329589844, 0.040130615234375, 0.04461097717285156, 0.049091339111328125, 0.05357170104980469, 0.05805206298828125, 0.06253242492675781, 0.06701278686523438, 0.07149314880371094, 0.0759735107421875, 0.08045387268066406, 0.08493423461914062, 0.08941459655761719, 0.09389495849609375, 0.09837532043457031, 0.10285568237304688, 0.10733604431152344, 0.11181640625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 11.0, 8.0, 14.0, 16.0, 20.0, 35.0, 42.0, 78.0, 92.0, 124.0, 117.0, 146.0, 94.0, 62.0, 45.0, 23.0, 25.0, 13.0, 8.0, 11.0, 8.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6570091247558594e-05, -1.5941448509693146e-05, -1.5312805771827698e-05, -1.468416303396225e-05, -1.4055520296096802e-05, -1.3426877558231354e-05, -1.2798234820365906e-05, -1.2169592082500458e-05, -1.154094934463501e-05, -1.0912306606769562e-05, -1.0283663868904114e-05, -9.655021131038666e-06, -9.026378393173218e-06, -8.39773565530777e-06, -7.769092917442322e-06, -7.140450179576874e-06, -6.511807441711426e-06, -5.883164703845978e-06, -5.25452196598053e-06, -4.625879228115082e-06, -3.997236490249634e-06, -3.368593752384186e-06, -2.739951014518738e-06, -2.11130827665329e-06, -1.4826655387878418e-06, -8.540228009223938e-07, -2.253800630569458e-07, 4.032626748085022e-07, 1.0319054126739502e-06, 1.6605481505393982e-06, 2.289190888404846e-06, 2.917833626270294e-06, 3.546476364135742e-06, 4.17511910200119e-06, 4.803761839866638e-06, 5.432404577732086e-06, 6.061047315597534e-06, 6.689690053462982e-06, 7.31833279132843e-06, 7.946975529193878e-06, 8.575618267059326e-06, 9.204261004924774e-06, 9.832903742790222e-06, 1.046154648065567e-05, 1.1090189218521118e-05, 1.1718831956386566e-05, 1.2347474694252014e-05, 1.2976117432117462e-05, 1.360476016998291e-05, 1.4233402907848358e-05, 1.4862045645713806e-05, 1.5490688383579254e-05, 1.6119331121444702e-05, 1.674797385931015e-05, 1.7376616597175598e-05, 1.8005259335041046e-05, 1.8633902072906494e-05, 1.9262544810771942e-05, 1.989118754863739e-05, 2.0519830286502838e-05, 2.1148473024368286e-05, 2.1777115762233734e-05, 2.2405758500099182e-05, 2.303440123796463e-05, 2.3663043975830078e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 7.0, 10.0, 5.0, 22.0, 23.0, 27.0, 51.0, 62.0, 118.0, 228.0, 420.0, 988.0, 2662.0, 9723.0, 74850.0, 765146.0, 172479.0, 15587.0, 3641.0, 1313.0, 533.0, 276.0, 154.0, 83.0, 45.0, 30.0, 27.0, 12.0, 14.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19189453125, -0.18601608276367188, -0.18013763427734375, -0.17425918579101562, -0.1683807373046875, -0.16250228881835938, -0.15662384033203125, -0.15074539184570312, -0.144866943359375, -0.13898849487304688, -0.13311004638671875, -0.12723159790039062, -0.1213531494140625, -0.11547470092773438, -0.10959625244140625, -0.10371780395507812, -0.09783935546875, -0.09196090698242188, -0.08608245849609375, -0.08020401000976562, -0.0743255615234375, -0.06844711303710938, -0.06256866455078125, -0.056690216064453125, -0.050811767578125, -0.044933319091796875, -0.03905487060546875, -0.033176422119140625, -0.0272979736328125, -0.021419525146484375, -0.01554107666015625, -0.009662628173828125, -0.0037841796875, 0.002094268798828125, 0.00797271728515625, 0.013851165771484375, 0.0197296142578125, 0.025608062744140625, 0.03148651123046875, 0.037364959716796875, 0.043243408203125, 0.049121856689453125, 0.05500030517578125, 0.060878753662109375, 0.0667572021484375, 0.07263565063476562, 0.07851409912109375, 0.08439254760742188, 0.09027099609375, 0.09614944458007812, 0.10202789306640625, 0.10790634155273438, 0.1137847900390625, 0.11966323852539062, 0.12554168701171875, 0.13142013549804688, 0.137298583984375, 0.14317703247070312, 0.14905548095703125, 0.15493392944335938, 0.1608123779296875, 0.16669082641601562, 0.17256927490234375, 0.17844772338867188, 0.184326171875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 6.0, 19.0, 15.0, 35.0, 39.0, 69.0, 77.0, 106.0, 113.0, 108.0, 114.0, 86.0, 66.0, 40.0, 26.0, 18.0, 16.0, 11.0, 10.0, 7.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059112548828125, -0.05684041976928711, -0.05456829071044922, -0.05229616165161133, -0.05002403259277344, -0.04775190353393555, -0.045479774475097656, -0.043207645416259766, -0.040935516357421875, -0.038663387298583984, -0.036391258239746094, -0.0341191291809082, -0.03184700012207031, -0.029574871063232422, -0.02730274200439453, -0.02503061294555664, -0.02275848388671875, -0.02048635482788086, -0.01821422576904297, -0.015942096710205078, -0.013669967651367188, -0.011397838592529297, -0.009125709533691406, -0.006853580474853516, -0.004581451416015625, -0.0023093223571777344, -3.719329833984375e-05, 0.002234935760498047, 0.0045070648193359375, 0.006779193878173828, 0.009051322937011719, 0.01132345199584961, 0.0135955810546875, 0.01586771011352539, 0.01813983917236328, 0.020411968231201172, 0.022684097290039062, 0.024956226348876953, 0.027228355407714844, 0.029500484466552734, 0.031772613525390625, 0.034044742584228516, 0.036316871643066406, 0.0385890007019043, 0.04086112976074219, 0.04313325881958008, 0.04540538787841797, 0.04767751693725586, 0.04994964599609375, 0.05222177505493164, 0.05449390411376953, 0.05676603317260742, 0.05903816223144531, 0.0613102912902832, 0.0635824203491211, 0.06585454940795898, 0.06812667846679688, 0.07039880752563477, 0.07267093658447266, 0.07494306564331055, 0.07721519470214844, 0.07948732376098633, 0.08175945281982422, 0.08403158187866211, 0.0863037109375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 11.0, 13.0, 33.0, 95.0, 177.0, 250.0, 234.0, 114.0, 38.0, 24.0, 12.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.3420050144195557, -2.293875217437744, -2.2457454204559326, -2.197615385055542, -2.1494855880737305, -2.101355791091919, -2.0532259941101074, -2.005095958709717, -1.9569661617279053, -1.9088363647460938, -1.8607064485549927, -1.8125766515731812, -1.76444673538208, -1.7163169384002686, -1.668187141418457, -1.620057225227356, -1.5719274282455444, -1.523797631263733, -1.4756677150726318, -1.4275379180908203, -1.3794080018997192, -1.3312782049179077, -1.2831482887268066, -1.2350184917449951, -1.1868886947631836, -1.138758897781372, -1.090628981590271, -1.0424991846084595, -0.9943692684173584, -0.9462394714355469, -0.8981096148490906, -0.8499797582626343, -0.8018497228622437, -0.7537198662757874, -0.705590009689331, -0.6574602127075195, -0.6093302965164185, -0.5612004995346069, -0.5130706429481506, -0.46494078636169434, -0.41681092977523804, -0.36868107318878174, -0.32055121660232544, -0.27242138981819153, -0.22429153323173523, -0.17616167664527893, -0.12803184986114502, -0.07990199327468872, -0.03177213668823242, 0.01635771244764328, 0.06448756158351898, 0.11261740326881409, 0.16074725985527039, 0.20887711644172668, 0.2570069432258606, 0.3051367998123169, 0.3532666563987732, 0.4013965129852295, 0.4495263695716858, 0.4976561963558197, 0.5457860231399536, 0.5939159393310547, 0.6420457363128662, 0.6901755928993225, 0.7383054494857788]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 4.0, 13.0, 13.0, 12.0, 15.0, 9.0, 27.0, 29.0, 42.0, 49.0, 49.0, 55.0, 51.0, 53.0, 57.0, 49.0, 57.0, 49.0, 53.0, 53.0, 46.0, 37.0, 29.0, 23.0, 30.0, 23.0, 12.0, 15.0, 15.0, 8.0, 14.0, 3.0, 3.0, 0.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3458029627799988, -0.32993677258491516, -0.31407058238983154, -0.29820436239242554, -0.2823381721973419, -0.2664719820022583, -0.2506057620048523, -0.23473957180976868, -0.21887338161468506, -0.20300719141960144, -0.18714098632335663, -0.17127478122711182, -0.1554085910320282, -0.13954240083694458, -0.12367619574069977, -0.10780999809503555, -0.09194380044937134, -0.07607760280370712, -0.06021140515804291, -0.04434520751237869, -0.028479009866714478, -0.012612812221050262, 0.0032533854246139526, 0.019119583070278168, 0.03498578071594238, 0.0508519783616066, 0.06671817600727081, 0.08258437365293503, 0.09845057129859924, 0.11431676894426346, 0.13018296658992767, 0.14604917168617249, 0.1619153618812561, 0.17778155207633972, 0.19364775717258453, 0.20951396226882935, 0.22538015246391296, 0.24124634265899658, 0.2571125626564026, 0.2729787528514862, 0.2888449430465698, 0.30471113324165344, 0.32057732343673706, 0.33644354343414307, 0.3523097336292267, 0.3681759238243103, 0.3840421438217163, 0.3999083340167999, 0.41577452421188354, 0.43164071440696716, 0.4475069046020508, 0.4633731245994568, 0.4792393147945404, 0.495105504989624, 0.51097172498703, 0.5268378853797913, 0.5427041053771973, 0.5585703253746033, 0.5744364857673645, 0.5903027057647705, 0.6061688661575317, 0.6220350861549377, 0.6379013061523438, 0.653767466545105, 0.669633686542511]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 9.0, 10.0, 8.0, 7.0, 10.0, 24.0, 30.0, 38.0, 90.0, 101.0, 150.0, 270.0, 416.0, 806.0, 1543.0, 3359.0, 7401.0, 19153.0, 61299.0, 327604.0, 3224594.0, 436066.0, 71448.0, 22394.0, 8829.0, 3971.0, 2051.0, 1057.0, 522.0, 361.0, 229.0, 133.0, 87.0, 77.0, 31.0, 33.0, 21.0, 13.0, 14.0, 9.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0], "bins": [-0.2218017578125, -0.21556472778320312, -0.20932769775390625, -0.20309066772460938, -0.1968536376953125, -0.19061660766601562, -0.18437957763671875, -0.17814254760742188, -0.171905517578125, -0.16566848754882812, -0.15943145751953125, -0.15319442749023438, -0.1469573974609375, -0.14072036743164062, -0.13448333740234375, -0.12824630737304688, -0.12200927734375, -0.11577224731445312, -0.10953521728515625, -0.10329818725585938, -0.0970611572265625, -0.09082412719726562, -0.08458709716796875, -0.07835006713867188, -0.072113037109375, -0.06587600708007812, -0.05963897705078125, -0.053401947021484375, -0.0471649169921875, -0.040927886962890625, -0.03469085693359375, -0.028453826904296875, -0.022216796875, -0.015979766845703125, -0.00974273681640625, -0.003505706787109375, 0.0027313232421875, 0.008968353271484375, 0.01520538330078125, 0.021442413330078125, 0.027679443359375, 0.033916473388671875, 0.04015350341796875, 0.046390533447265625, 0.0526275634765625, 0.058864593505859375, 0.06510162353515625, 0.07133865356445312, 0.07757568359375, 0.08381271362304688, 0.09004974365234375, 0.09628677368164062, 0.1025238037109375, 0.10876083374023438, 0.11499786376953125, 0.12123489379882812, 0.127471923828125, 0.13370895385742188, 0.13994598388671875, 0.14618301391601562, 0.1524200439453125, 0.15865707397460938, 0.16489410400390625, 0.17113113403320312, 0.1773681640625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 12.0, 11.0, 16.0, 30.0, 32.0, 53.0, 49.0, 60.0, 62.0, 62.0, 73.0, 55.0, 69.0, 67.0, 85.0, 57.0, 50.0, 33.0, 34.0, 25.0, 21.0, 12.0, 6.0, 9.0, 5.0, 1.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.065673828125, -0.06337261199951172, -0.06107139587402344, -0.058770179748535156, -0.056468963623046875, -0.054167747497558594, -0.05186653137207031, -0.04956531524658203, -0.04726409912109375, -0.04496288299560547, -0.04266166687011719, -0.040360450744628906, -0.038059234619140625, -0.035758018493652344, -0.03345680236816406, -0.03115558624267578, -0.0288543701171875, -0.02655315399169922, -0.024251937866210938, -0.021950721740722656, -0.019649505615234375, -0.017348289489746094, -0.015047073364257812, -0.012745857238769531, -0.01044464111328125, -0.008143424987792969, -0.0058422088623046875, -0.0035409927368164062, -0.001239776611328125, 0.0010614395141601562, 0.0033626556396484375, 0.005663871765136719, 0.007965087890625, 0.010266304016113281, 0.012567520141601562, 0.014868736267089844, 0.017169952392578125, 0.019471168518066406, 0.021772384643554688, 0.02407360076904297, 0.02637481689453125, 0.02867603302001953, 0.030977249145507812, 0.033278465270996094, 0.035579681396484375, 0.037880897521972656, 0.04018211364746094, 0.04248332977294922, 0.0447845458984375, 0.04708576202392578, 0.04938697814941406, 0.051688194274902344, 0.053989410400390625, 0.056290626525878906, 0.05859184265136719, 0.06089305877685547, 0.06319427490234375, 0.06549549102783203, 0.06779670715332031, 0.0700979232788086, 0.07239913940429688, 0.07470035552978516, 0.07700157165527344, 0.07930278778076172, 0.08160400390625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 9.0, 14.0, 18.0, 33.0, 50.0, 72.0, 127.0, 277.0, 729.0, 2428.0, 16416.0, 496315.0, 3627032.0, 44471.0, 4487.0, 1057.0, 354.0, 171.0, 98.0, 51.0, 26.0, 18.0, 15.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5146484375, -0.49639129638671875, -0.4781341552734375, -0.45987701416015625, -0.441619873046875, -0.42336273193359375, -0.4051055908203125, -0.38684844970703125, -0.36859130859375, -0.35033416748046875, -0.3320770263671875, -0.31381988525390625, -0.295562744140625, -0.27730560302734375, -0.2590484619140625, -0.24079132080078125, -0.2225341796875, -0.20427703857421875, -0.1860198974609375, -0.16776275634765625, -0.149505615234375, -0.13124847412109375, -0.1129913330078125, -0.09473419189453125, -0.07647705078125, -0.05821990966796875, -0.0399627685546875, -0.02170562744140625, -0.003448486328125, 0.01480865478515625, 0.0330657958984375, 0.05132293701171875, 0.069580078125, 0.08783721923828125, 0.1060943603515625, 0.12435150146484375, 0.142608642578125, 0.16086578369140625, 0.1791229248046875, 0.19738006591796875, 0.21563720703125, 0.23389434814453125, 0.2521514892578125, 0.27040863037109375, 0.288665771484375, 0.30692291259765625, 0.3251800537109375, 0.34343719482421875, 0.3616943359375, 0.37995147705078125, 0.3982086181640625, 0.41646575927734375, 0.434722900390625, 0.45298004150390625, 0.4712371826171875, 0.48949432373046875, 0.50775146484375, 0.5260086059570312, 0.5442657470703125, 0.5625228881835938, 0.580780029296875, 0.5990371704101562, 0.6172943115234375, 0.6355514526367188, 0.65380859375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 0.0, 3.0, 6.0, 4.0, 10.0, 9.0, 18.0, 20.0, 17.0, 29.0, 46.0, 60.0, 73.0, 121.0, 158.0, 250.0, 473.0, 823.0, 721.0, 383.0, 256.0, 171.0, 111.0, 84.0, 63.0, 39.0, 39.0, 20.0, 17.0, 12.0, 7.0, 7.0, 5.0, 8.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1458740234375, -0.14143753051757812, -0.13700103759765625, -0.13256454467773438, -0.1281280517578125, -0.12369155883789062, -0.11925506591796875, -0.11481857299804688, -0.110382080078125, -0.10594558715820312, -0.10150909423828125, -0.09707260131835938, -0.0926361083984375, -0.08819961547851562, -0.08376312255859375, -0.07932662963867188, -0.07489013671875, -0.07045364379882812, -0.06601715087890625, -0.061580657958984375, -0.0571441650390625, -0.052707672119140625, -0.04827117919921875, -0.043834686279296875, -0.039398193359375, -0.034961700439453125, -0.03052520751953125, -0.026088714599609375, -0.0216522216796875, -0.017215728759765625, -0.01277923583984375, -0.008342742919921875, -0.00390625, 0.000530242919921875, 0.00496673583984375, 0.009403228759765625, 0.0138397216796875, 0.018276214599609375, 0.02271270751953125, 0.027149200439453125, 0.031585693359375, 0.036022186279296875, 0.04045867919921875, 0.044895172119140625, 0.0493316650390625, 0.053768157958984375, 0.05820465087890625, 0.06264114379882812, 0.06707763671875, 0.07151412963867188, 0.07595062255859375, 0.08038711547851562, 0.0848236083984375, 0.08926010131835938, 0.09369659423828125, 0.09813308715820312, 0.102569580078125, 0.10700607299804688, 0.11144256591796875, 0.11587905883789062, 0.1203155517578125, 0.12475204467773438, 0.12918853759765625, 0.13362503051757812, 0.1380615234375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 4.0, 14.0, 12.0, 22.0, 48.0, 78.0, 109.0, 152.0, 157.0, 136.0, 83.0, 58.0, 54.0, 23.0, 20.0, 14.0, 3.0, 6.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.329711675643921, -1.2974512577056885, -1.2651907205581665, -1.232930302619934, -1.200669765472412, -1.1684093475341797, -1.1361488103866577, -1.1038883924484253, -1.0716278553009033, -1.039367437362671, -1.007106900215149, -0.9748464226722717, -0.9425859451293945, -0.9103255271911621, -0.8780650496482849, -0.8458045721054077, -0.8135441541671753, -0.7812836766242981, -0.7490231990814209, -0.7167627215385437, -0.6845022439956665, -0.6522418260574341, -0.6199813485145569, -0.5877208709716797, -0.5554603934288025, -0.5231999158859253, -0.4909394383430481, -0.4586789906024933, -0.4264185130596161, -0.3941580355167389, -0.3618975877761841, -0.3296371102333069, -0.29737669229507446, -0.26511621475219727, -0.23285575211048126, -0.20059528946876526, -0.16833481192588806, -0.13607433438301086, -0.10381387174129486, -0.07155340909957886, -0.03929293155670166, -0.00703246146440506, 0.02522800862789154, 0.05748847872018814, 0.08974894881248474, 0.12200942635536194, 0.15426988899707794, 0.18653035163879395, 0.21879082918167114, 0.25105130672454834, 0.28331178426742554, 0.31557223200798035, 0.34783270955085754, 0.38009318709373474, 0.41235363483428955, 0.44461411237716675, 0.47687458992004395, 0.5091350674629211, 0.5413955450057983, 0.5736560225486755, 0.6059165000915527, 0.6381769180297852, 0.6704373955726624, 0.7026978731155396, 0.7349583506584167]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 3.0, 8.0, 11.0, 11.0, 17.0, 11.0, 25.0, 17.0, 23.0, 34.0, 25.0, 24.0, 30.0, 41.0, 28.0, 49.0, 44.0, 51.0, 38.0, 38.0, 29.0, 36.0, 45.0, 36.0, 53.0, 32.0, 38.0, 35.0, 24.0, 21.0, 13.0, 19.0, 9.0, 16.0, 11.0, 11.0, 7.0, 9.0, 9.0, 4.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.4203031063079834, -0.4076533913612366, -0.39500370621681213, -0.3823539912700653, -0.3697042763233185, -0.35705459117889404, -0.3444048762321472, -0.3317551612854004, -0.31910547614097595, -0.3064557611942291, -0.2938060760498047, -0.28115636110305786, -0.26850664615631104, -0.2558569610118866, -0.24320724606513977, -0.23055754601955414, -0.2179078310728073, -0.20525813102722168, -0.19260841608047485, -0.17995871603488922, -0.1673090159893036, -0.15465930104255676, -0.14200960099697113, -0.1293599009513855, -0.11671019345521927, -0.10406048595905304, -0.09141078591346741, -0.07876107841730118, -0.06611137092113495, -0.053461670875549316, -0.04081196337938309, -0.028162263333797455, -0.015512555837631226, -0.00286285113543272, 0.009786853566765785, 0.022436559200286865, 0.035086262971162796, 0.04773596674203873, 0.060385674238204956, 0.07303537428379059, 0.08568508177995682, 0.09833478927612305, 0.11098448932170868, 0.12363419681787491, 0.13628390431404114, 0.14893360435962677, 0.1615833044052124, 0.17423301935195923, 0.18688271939754486, 0.1995324194431305, 0.21218213438987732, 0.22483183443546295, 0.23748153448104858, 0.2501312494277954, 0.26278096437454224, 0.2754306495189667, 0.2880803644657135, 0.3007300794124603, 0.31337976455688477, 0.3260294795036316, 0.3386791944503784, 0.35132887959480286, 0.3639785945415497, 0.3766282796859741, 0.38927799463272095]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 4.0, 4.0, 9.0, 9.0, 9.0, 13.0, 20.0, 26.0, 41.0, 58.0, 112.0, 186.0, 290.0, 533.0, 941.0, 2024.0, 4577.0, 12529.0, 39765.0, 149735.0, 466834.0, 269430.0, 68532.0, 20199.0, 6931.0, 2858.0, 1261.0, 683.0, 339.0, 197.0, 131.0, 80.0, 63.0, 39.0, 30.0, 19.0, 15.0, 9.0, 10.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.315673828125, -0.30467987060546875, -0.2936859130859375, -0.28269195556640625, -0.271697998046875, -0.26070404052734375, -0.2497100830078125, -0.23871612548828125, -0.22772216796875, -0.21672821044921875, -0.2057342529296875, -0.19474029541015625, -0.183746337890625, -0.17275238037109375, -0.1617584228515625, -0.15076446533203125, -0.1397705078125, -0.12877655029296875, -0.1177825927734375, -0.10678863525390625, -0.095794677734375, -0.08480072021484375, -0.0738067626953125, -0.06281280517578125, -0.05181884765625, -0.04082489013671875, -0.0298309326171875, -0.01883697509765625, -0.007843017578125, 0.00315093994140625, 0.0141448974609375, 0.02513885498046875, 0.0361328125, 0.04712677001953125, 0.0581207275390625, 0.06911468505859375, 0.080108642578125, 0.09110260009765625, 0.1020965576171875, 0.11309051513671875, 0.12408447265625, 0.13507843017578125, 0.1460723876953125, 0.15706634521484375, 0.168060302734375, 0.17905426025390625, 0.1900482177734375, 0.20104217529296875, 0.2120361328125, 0.22303009033203125, 0.2340240478515625, 0.24501800537109375, 0.256011962890625, 0.26700592041015625, 0.2779998779296875, 0.28899383544921875, 0.29998779296875, 0.31098175048828125, 0.3219757080078125, 0.33296966552734375, 0.343963623046875, 0.35495758056640625, 0.3659515380859375, 0.37694549560546875, 0.387939453125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 9.0, 11.0, 16.0, 9.0, 29.0, 41.0, 39.0, 57.0, 58.0, 56.0, 69.0, 79.0, 66.0, 67.0, 73.0, 60.0, 62.0, 49.0, 40.0, 36.0, 27.0, 17.0, 13.0, 6.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0771484375, -0.07477283477783203, -0.07239723205566406, -0.0700216293334961, -0.06764602661132812, -0.06527042388916016, -0.06289482116699219, -0.06051921844482422, -0.05814361572265625, -0.05576801300048828, -0.05339241027832031, -0.051016807556152344, -0.048641204833984375, -0.046265602111816406, -0.04388999938964844, -0.04151439666748047, -0.0391387939453125, -0.03676319122314453, -0.03438758850097656, -0.032011985778808594, -0.029636383056640625, -0.027260780334472656, -0.024885177612304688, -0.02250957489013672, -0.02013397216796875, -0.01775836944580078, -0.015382766723632812, -0.013007164001464844, -0.010631561279296875, -0.008255958557128906, -0.0058803558349609375, -0.0035047531127929688, -0.001129150390625, 0.0012464523315429688, 0.0036220550537109375, 0.005997657775878906, 0.008373260498046875, 0.010748863220214844, 0.013124465942382812, 0.015500068664550781, 0.01787567138671875, 0.02025127410888672, 0.022626876831054688, 0.025002479553222656, 0.027378082275390625, 0.029753684997558594, 0.03212928771972656, 0.03450489044189453, 0.0368804931640625, 0.03925609588623047, 0.04163169860839844, 0.044007301330566406, 0.046382904052734375, 0.048758506774902344, 0.05113410949707031, 0.05350971221923828, 0.05588531494140625, 0.05826091766357422, 0.06063652038574219, 0.06301212310791016, 0.06538772583007812, 0.0677633285522461, 0.07013893127441406, 0.07251453399658203, 0.07489013671875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 7.0, 6.0, 16.0, 13.0, 22.0, 24.0, 56.0, 97.0, 203.0, 347.0, 746.0, 2001.0, 9585.0, 78912.0, 686539.0, 241128.0, 22938.0, 3800.0, 1128.0, 473.0, 216.0, 110.0, 71.0, 36.0, 28.0, 20.0, 10.0, 8.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.501953125, -0.4831695556640625, -0.464385986328125, -0.4456024169921875, -0.42681884765625, -0.4080352783203125, -0.389251708984375, -0.3704681396484375, -0.3516845703125, -0.3329010009765625, -0.314117431640625, -0.2953338623046875, -0.27655029296875, -0.2577667236328125, -0.238983154296875, -0.2201995849609375, -0.201416015625, -0.1826324462890625, -0.163848876953125, -0.1450653076171875, -0.12628173828125, -0.1074981689453125, -0.088714599609375, -0.0699310302734375, -0.0511474609375, -0.0323638916015625, -0.013580322265625, 0.0052032470703125, 0.02398681640625, 0.0427703857421875, 0.061553955078125, 0.0803375244140625, 0.09912109375, 0.1179046630859375, 0.136688232421875, 0.1554718017578125, 0.17425537109375, 0.1930389404296875, 0.211822509765625, 0.2306060791015625, 0.2493896484375, 0.2681732177734375, 0.286956787109375, 0.3057403564453125, 0.32452392578125, 0.3433074951171875, 0.362091064453125, 0.3808746337890625, 0.399658203125, 0.4184417724609375, 0.437225341796875, 0.4560089111328125, 0.47479248046875, 0.4935760498046875, 0.512359619140625, 0.5311431884765625, 0.5499267578125, 0.5687103271484375, 0.587493896484375, 0.6062774658203125, 0.62506103515625, 0.6438446044921875, 0.662628173828125, 0.6814117431640625, 0.7001953125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 8.0, 8.0, 5.0, 10.0, 15.0, 15.0, 9.0, 22.0, 25.0, 25.0, 30.0, 33.0, 48.0, 32.0, 40.0, 39.0, 37.0, 52.0, 50.0, 47.0, 55.0, 38.0, 41.0, 40.0, 36.0, 28.0, 34.0, 28.0, 25.0, 26.0, 19.0, 14.0, 11.0, 12.0, 8.0, 14.0, 11.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1566162109375, -0.1521472930908203, -0.14767837524414062, -0.14320945739746094, -0.13874053955078125, -0.13427162170410156, -0.12980270385742188, -0.1253337860107422, -0.1208648681640625, -0.11639595031738281, -0.11192703247070312, -0.10745811462402344, -0.10298919677734375, -0.09852027893066406, -0.09405136108398438, -0.08958244323730469, -0.085113525390625, -0.08064460754394531, -0.07617568969726562, -0.07170677185058594, -0.06723785400390625, -0.06276893615722656, -0.058300018310546875, -0.05383110046386719, -0.0493621826171875, -0.04489326477050781, -0.040424346923828125, -0.03595542907714844, -0.03148651123046875, -0.027017593383789062, -0.022548675537109375, -0.018079757690429688, -0.01361083984375, -0.009141921997070312, -0.004673004150390625, -0.0002040863037109375, 0.00426483154296875, 0.008733749389648438, 0.013202667236328125, 0.017671585083007812, 0.0221405029296875, 0.026609420776367188, 0.031078338623046875, 0.03554725646972656, 0.04001617431640625, 0.04448509216308594, 0.048954010009765625, 0.05342292785644531, 0.057891845703125, 0.06236076354980469, 0.06682968139648438, 0.07129859924316406, 0.07576751708984375, 0.08023643493652344, 0.08470535278320312, 0.08917427062988281, 0.0936431884765625, 0.09811210632324219, 0.10258102416992188, 0.10704994201660156, 0.11151885986328125, 0.11598777770996094, 0.12045669555664062, 0.12492561340332031, 0.12939453125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 4.0, 2.0, 5.0, 11.0, 10.0, 18.0, 23.0, 30.0, 45.0, 73.0, 109.0, 142.0, 300.0, 612.0, 1242.0, 2832.0, 7864.0, 31301.0, 662882.0, 307108.0, 22708.0, 6559.0, 2401.0, 1024.0, 501.0, 268.0, 174.0, 104.0, 66.0, 29.0, 27.0, 26.0, 16.0, 8.0, 7.0, 8.0, 7.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.347900390625, -0.3366432189941406, -0.32538604736328125, -0.3141288757324219, -0.3028717041015625, -0.2916145324707031, -0.28035736083984375, -0.2691001892089844, -0.257843017578125, -0.24658584594726562, -0.23532867431640625, -0.22407150268554688, -0.2128143310546875, -0.20155715942382812, -0.19029998779296875, -0.17904281616210938, -0.16778564453125, -0.15652847290039062, -0.14527130126953125, -0.13401412963867188, -0.1227569580078125, -0.11149978637695312, -0.10024261474609375, -0.08898544311523438, -0.077728271484375, -0.06647109985351562, -0.05521392822265625, -0.043956756591796875, -0.0326995849609375, -0.021442413330078125, -0.01018524169921875, 0.001071929931640625, 0.0123291015625, 0.023586273193359375, 0.03484344482421875, 0.046100616455078125, 0.0573577880859375, 0.06861495971679688, 0.07987213134765625, 0.09112930297851562, 0.102386474609375, 0.11364364624023438, 0.12490081787109375, 0.13615798950195312, 0.1474151611328125, 0.15867233276367188, 0.16992950439453125, 0.18118667602539062, 0.19244384765625, 0.20370101928710938, 0.21495819091796875, 0.22621536254882812, 0.2374725341796875, 0.24872970581054688, 0.25998687744140625, 0.2712440490722656, 0.282501220703125, 0.2937583923339844, 0.30501556396484375, 0.3162727355957031, 0.3275299072265625, 0.3387870788574219, 0.35004425048828125, 0.3613014221191406, 0.37255859375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 7.0, 6.0, 5.0, 4.0, 8.0, 7.0, 8.0, 14.0, 34.0, 45.0, 99.0, 200.0, 225.0, 136.0, 73.0, 44.0, 24.0, 16.0, 9.0, 11.0, 6.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.4405460357666016e-05, -4.314351826906204e-05, -4.188157618045807e-05, -4.0619634091854095e-05, -3.935769200325012e-05, -3.809574991464615e-05, -3.6833807826042175e-05, -3.55718657374382e-05, -3.430992364883423e-05, -3.3047981560230255e-05, -3.178603947162628e-05, -3.052409738302231e-05, -2.9262155294418335e-05, -2.800021320581436e-05, -2.6738271117210388e-05, -2.5476329028606415e-05, -2.421438694000244e-05, -2.2952444851398468e-05, -2.1690502762794495e-05, -2.042856067419052e-05, -1.9166618585586548e-05, -1.7904676496982574e-05, -1.66427344083786e-05, -1.5380792319774628e-05, -1.4118850231170654e-05, -1.2856908142566681e-05, -1.1594966053962708e-05, -1.0333023965358734e-05, -9.07108187675476e-06, -7.809139788150787e-06, -6.547197699546814e-06, -5.2852556109428406e-06, -4.023313522338867e-06, -2.761371433734894e-06, -1.4994293451309204e-06, -2.3748725652694702e-07, 1.0244548320770264e-06, 2.2863969206809998e-06, 3.548339009284973e-06, 4.8102810978889465e-06, 6.07222318649292e-06, 7.334165275096893e-06, 8.596107363700867e-06, 9.85804945230484e-06, 1.1119991540908813e-05, 1.2381933629512787e-05, 1.364387571811676e-05, 1.4905817806720734e-05, 1.6167759895324707e-05, 1.742970198392868e-05, 1.8691644072532654e-05, 1.9953586161136627e-05, 2.12155282497406e-05, 2.2477470338344574e-05, 2.3739412426948547e-05, 2.500135451555252e-05, 2.6263296604156494e-05, 2.7525238692760468e-05, 2.878718078136444e-05, 3.0049122869968414e-05, 3.131106495857239e-05, 3.257300704717636e-05, 3.3834949135780334e-05, 3.509689122438431e-05, 3.635883331298828e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 10.0, 12.0, 9.0, 24.0, 17.0, 44.0, 63.0, 91.0, 220.0, 636.0, 2456.0, 16533.0, 966291.0, 55578.0, 4857.0, 1012.0, 339.0, 139.0, 70.0, 38.0, 27.0, 25.0, 13.0, 12.0, 6.0, 6.0, 5.0, 2.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9638671875, -0.9343948364257812, -0.9049224853515625, -0.8754501342773438, -0.845977783203125, -0.8165054321289062, -0.7870330810546875, -0.7575607299804688, -0.72808837890625, -0.6986160278320312, -0.6691436767578125, -0.6396713256835938, -0.610198974609375, -0.5807266235351562, -0.5512542724609375, -0.5217819213867188, -0.4923095703125, -0.46283721923828125, -0.4333648681640625, -0.40389251708984375, -0.374420166015625, -0.34494781494140625, -0.3154754638671875, -0.28600311279296875, -0.25653076171875, -0.22705841064453125, -0.1975860595703125, -0.16811370849609375, -0.138641357421875, -0.10916900634765625, -0.0796966552734375, -0.05022430419921875, -0.020751953125, 0.00872039794921875, 0.0381927490234375, 0.06766510009765625, 0.097137451171875, 0.12660980224609375, 0.1560821533203125, 0.18555450439453125, 0.21502685546875, 0.24449920654296875, 0.2739715576171875, 0.30344390869140625, 0.332916259765625, 0.36238861083984375, 0.3918609619140625, 0.42133331298828125, 0.4508056640625, 0.48027801513671875, 0.5097503662109375, 0.5392227172851562, 0.568695068359375, 0.5981674194335938, 0.6276397705078125, 0.6571121215820312, 0.68658447265625, 0.7160568237304688, 0.7455291748046875, 0.7750015258789062, 0.804473876953125, 0.8339462280273438, 0.8634185791015625, 0.8928909301757812, 0.92236328125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 3.0, 8.0, 7.0, 2.0, 11.0, 11.0, 23.0, 39.0, 77.0, 144.0, 266.0, 165.0, 77.0, 55.0, 16.0, 20.0, 11.0, 13.0, 7.0, 8.0, 5.0, 8.0, 1.0, 3.0, 3.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.198486328125, -0.192596435546875, -0.18670654296875, -0.180816650390625, -0.1749267578125, -0.169036865234375, -0.16314697265625, -0.157257080078125, -0.1513671875, -0.145477294921875, -0.13958740234375, -0.133697509765625, -0.1278076171875, -0.121917724609375, -0.11602783203125, -0.110137939453125, -0.104248046875, -0.098358154296875, -0.09246826171875, -0.086578369140625, -0.0806884765625, -0.074798583984375, -0.06890869140625, -0.063018798828125, -0.05712890625, -0.051239013671875, -0.04534912109375, -0.039459228515625, -0.0335693359375, -0.027679443359375, -0.02178955078125, -0.015899658203125, -0.010009765625, -0.004119873046875, 0.00177001953125, 0.007659912109375, 0.0135498046875, 0.019439697265625, 0.02532958984375, 0.031219482421875, 0.037109375, 0.042999267578125, 0.04888916015625, 0.054779052734375, 0.0606689453125, 0.066558837890625, 0.07244873046875, 0.078338623046875, 0.084228515625, 0.090118408203125, 0.09600830078125, 0.101898193359375, 0.1077880859375, 0.113677978515625, 0.11956787109375, 0.125457763671875, 0.13134765625, 0.137237548828125, 0.14312744140625, 0.149017333984375, 0.1549072265625, 0.160797119140625, 0.16668701171875, 0.172576904296875, 0.178466796875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 14.0, 10.0, 22.0, 41.0, 62.0, 109.0, 124.0, 169.0, 153.0, 104.0, 78.0, 35.0, 28.0, 14.0, 8.0, 4.0, 6.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2782760858535767, -1.226572036743164, -1.174867868423462, -1.1231638193130493, -1.0714597702026367, -1.0197556018829346, -0.968051552772522, -0.9163475036621094, -0.864643394947052, -0.8129392862319946, -0.761235237121582, -0.7095311284065247, -0.6578270196914673, -0.6061229705810547, -0.5544188618659973, -0.5027147531509399, -0.45101070404052734, -0.39930662512779236, -0.3476025462150574, -0.2958984375, -0.24419435858726501, -0.19249027967453003, -0.14078617095947266, -0.08908209204673767, -0.037378013134002686, 0.014326073229312897, 0.06603015959262848, 0.11773425340652466, 0.16943833231925964, 0.22114241123199463, 0.272846519947052, 0.324550598859787, 0.3762545585632324, 0.4279586374759674, 0.4796627163887024, 0.5313668251037598, 0.5830708742141724, 0.6347749829292297, 0.6864790916442871, 0.7381831407546997, 0.7898872494697571, 0.8415913581848145, 0.893295407295227, 0.9449995160102844, 0.9967036247253418, 1.0484076738357544, 1.100111722946167, 1.1518158912658691, 1.2035199403762817, 1.2552239894866943, 1.3069281578063965, 1.358632206916809, 1.4103362560272217, 1.4620404243469238, 1.5137444734573364, 1.565448522567749, 1.6171526908874512, 1.6688567399978638, 1.720560908317566, 1.7722649574279785, 1.8239690065383911, 1.8756730556488037, 1.9273772239685059, 1.9790812730789185, 2.030785322189331]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 2.0, 5.0, 3.0, 8.0, 7.0, 9.0, 8.0, 19.0, 8.0, 19.0, 14.0, 11.0, 18.0, 21.0, 31.0, 24.0, 27.0, 31.0, 40.0, 34.0, 49.0, 32.0, 50.0, 31.0, 39.0, 44.0, 41.0, 31.0, 38.0, 38.0, 30.0, 31.0, 31.0, 18.0, 14.0, 22.0, 24.0, 20.0, 13.0, 15.0, 9.0, 7.0, 7.0, 11.0, 6.0, 7.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5394516587257385, -0.5219951868057251, -0.5045387744903564, -0.487082302570343, -0.4696258306503296, -0.45216938853263855, -0.4347129464149475, -0.4172564744949341, -0.39980003237724304, -0.382343590259552, -0.3648871183395386, -0.34743067622184753, -0.3299742341041565, -0.31251776218414307, -0.295061320066452, -0.277604877948761, -0.26014840602874756, -0.24269194900989532, -0.2252354919910431, -0.20777904987335205, -0.19032259285449982, -0.17286613583564758, -0.15540969371795654, -0.1379532366991043, -0.12049677968025208, -0.10304032266139984, -0.0855838730931282, -0.06812742352485657, -0.050670966506004333, -0.0332145094871521, -0.015758059918880463, 0.0016983896493911743, 0.019154906272888184, 0.03661135956645012, 0.054067812860012054, 0.07152426242828369, 0.08898071944713593, 0.10643717646598816, 0.1238936260342598, 0.14135007560253143, 0.15880653262138367, 0.1762629896402359, 0.19371944665908813, 0.21117588877677917, 0.2286323457956314, 0.24608880281448364, 0.2635452449321747, 0.2810016870498657, 0.29845815896987915, 0.3159146010875702, 0.3333710730075836, 0.35082751512527466, 0.3682839870452881, 0.3857404291629791, 0.40319687128067017, 0.4206533432006836, 0.43810978531837463, 0.4555662274360657, 0.4730226993560791, 0.49047914147377014, 0.5079355835914612, 0.5253920555114746, 0.542848527431488, 0.5603049397468567, 0.5777614116668701]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 7.0, 7.0, 8.0, 10.0, 26.0, 30.0, 46.0, 72.0, 96.0, 128.0, 179.0, 354.0, 662.0, 1281.0, 2925.0, 6633.0, 16213.0, 48175.0, 248477.0, 3012812.0, 731227.0, 81022.0, 25601.0, 9821.0, 4216.0, 1964.0, 982.0, 518.0, 337.0, 159.0, 94.0, 65.0, 45.0, 23.0, 26.0, 13.0, 3.0, 9.0, 3.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2127685546875, -0.20560264587402344, -0.19843673706054688, -0.1912708282470703, -0.18410491943359375, -0.1769390106201172, -0.16977310180664062, -0.16260719299316406, -0.1554412841796875, -0.14827537536621094, -0.14110946655273438, -0.1339435577392578, -0.12677764892578125, -0.11961174011230469, -0.11244583129882812, -0.10527992248535156, -0.098114013671875, -0.09094810485839844, -0.08378219604492188, -0.07661628723144531, -0.06945037841796875, -0.06228446960449219, -0.055118560791015625, -0.04795265197753906, -0.0407867431640625, -0.03362083435058594, -0.026454925537109375, -0.019289016723632812, -0.01212310791015625, -0.0049571990966796875, 0.002208709716796875, 0.009374618530273438, 0.01654052734375, 0.023706436157226562, 0.030872344970703125, 0.03803825378417969, 0.04520416259765625, 0.05237007141113281, 0.059535980224609375, 0.06670188903808594, 0.0738677978515625, 0.08103370666503906, 0.08819961547851562, 0.09536552429199219, 0.10253143310546875, 0.10969734191894531, 0.11686325073242188, 0.12402915954589844, 0.131195068359375, 0.13836097717285156, 0.14552688598632812, 0.1526927947998047, 0.15985870361328125, 0.1670246124267578, 0.17419052124023438, 0.18135643005371094, 0.1885223388671875, 0.19568824768066406, 0.20285415649414062, 0.2100200653076172, 0.21718597412109375, 0.2243518829345703, 0.23151779174804688, 0.23868370056152344, 0.245849609375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 6.0, 4.0, 9.0, 9.0, 13.0, 25.0, 30.0, 41.0, 31.0, 34.0, 49.0, 51.0, 42.0, 59.0, 56.0, 77.0, 69.0, 48.0, 50.0, 47.0, 36.0, 45.0, 36.0, 32.0, 24.0, 20.0, 19.0, 15.0, 7.0, 8.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.087646484375, -0.08486747741699219, -0.08208847045898438, -0.07930946350097656, -0.07653045654296875, -0.07375144958496094, -0.07097244262695312, -0.06819343566894531, -0.0654144287109375, -0.06263542175292969, -0.059856414794921875, -0.05707740783691406, -0.05429840087890625, -0.05151939392089844, -0.048740386962890625, -0.04596138000488281, -0.043182373046875, -0.04040336608886719, -0.037624359130859375, -0.03484535217285156, -0.03206634521484375, -0.029287338256835938, -0.026508331298828125, -0.023729324340820312, -0.0209503173828125, -0.018171310424804688, -0.015392303466796875, -0.012613296508789062, -0.00983428955078125, -0.0070552825927734375, -0.004276275634765625, -0.0014972686767578125, 0.00128173828125, 0.0040607452392578125, 0.006839752197265625, 0.009618759155273438, 0.01239776611328125, 0.015176773071289062, 0.017955780029296875, 0.020734786987304688, 0.0235137939453125, 0.026292800903320312, 0.029071807861328125, 0.03185081481933594, 0.03462982177734375, 0.03740882873535156, 0.040187835693359375, 0.04296684265136719, 0.045745849609375, 0.04852485656738281, 0.051303863525390625, 0.05408287048339844, 0.05686187744140625, 0.05964088439941406, 0.062419891357421875, 0.06519889831542969, 0.0679779052734375, 0.07075691223144531, 0.07353591918945312, 0.07631492614746094, 0.07909393310546875, 0.08187294006347656, 0.08465194702148438, 0.08743095397949219, 0.0902099609375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 1.0, 0.0, 8.0, 6.0, 12.0, 12.0, 20.0, 44.0, 47.0, 81.0, 125.0, 200.0, 304.0, 543.0, 961.0, 1965.0, 4735.0, 13335.0, 53172.0, 497166.0, 3421295.0, 157460.0, 28021.0, 8275.0, 3203.0, 1451.0, 752.0, 407.0, 229.0, 139.0, 116.0, 57.0, 34.0, 24.0, 24.0, 13.0, 7.0, 11.0, 8.0, 8.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.3798828125, -0.367340087890625, -0.35479736328125, -0.342254638671875, -0.3297119140625, -0.317169189453125, -0.30462646484375, -0.292083740234375, -0.279541015625, -0.266998291015625, -0.25445556640625, -0.241912841796875, -0.2293701171875, -0.216827392578125, -0.20428466796875, -0.191741943359375, -0.17919921875, -0.166656494140625, -0.15411376953125, -0.141571044921875, -0.1290283203125, -0.116485595703125, -0.10394287109375, -0.091400146484375, -0.078857421875, -0.066314697265625, -0.05377197265625, -0.041229248046875, -0.0286865234375, -0.016143798828125, -0.00360107421875, 0.008941650390625, 0.021484375, 0.034027099609375, 0.04656982421875, 0.059112548828125, 0.0716552734375, 0.084197998046875, 0.09674072265625, 0.109283447265625, 0.121826171875, 0.134368896484375, 0.14691162109375, 0.159454345703125, 0.1719970703125, 0.184539794921875, 0.19708251953125, 0.209625244140625, 0.22216796875, 0.234710693359375, 0.24725341796875, 0.259796142578125, 0.2723388671875, 0.284881591796875, 0.29742431640625, 0.309967041015625, 0.322509765625, 0.335052490234375, 0.34759521484375, 0.360137939453125, 0.3726806640625, 0.385223388671875, 0.39776611328125, 0.410308837890625, 0.4228515625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 9.0, 2.0, 12.0, 18.0, 30.0, 35.0, 35.0, 53.0, 100.0, 182.0, 348.0, 890.0, 1207.0, 542.0, 232.0, 113.0, 91.0, 56.0, 26.0, 21.0, 25.0, 9.0, 9.0, 8.0, 11.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24853515625, -0.2397308349609375, -0.230926513671875, -0.2221221923828125, -0.21331787109375, -0.2045135498046875, -0.195709228515625, -0.1869049072265625, -0.1781005859375, -0.1692962646484375, -0.160491943359375, -0.1516876220703125, -0.14288330078125, -0.1340789794921875, -0.125274658203125, -0.1164703369140625, -0.107666015625, -0.0988616943359375, -0.090057373046875, -0.0812530517578125, -0.07244873046875, -0.0636444091796875, -0.054840087890625, -0.0460357666015625, -0.0372314453125, -0.0284271240234375, -0.019622802734375, -0.0108184814453125, -0.00201416015625, 0.0067901611328125, 0.015594482421875, 0.0243988037109375, 0.033203125, 0.0420074462890625, 0.050811767578125, 0.0596160888671875, 0.06842041015625, 0.0772247314453125, 0.086029052734375, 0.0948333740234375, 0.1036376953125, 0.1124420166015625, 0.121246337890625, 0.1300506591796875, 0.13885498046875, 0.1476593017578125, 0.156463623046875, 0.1652679443359375, 0.174072265625, 0.1828765869140625, 0.191680908203125, 0.2004852294921875, 0.20928955078125, 0.2180938720703125, 0.226898193359375, 0.2357025146484375, 0.2445068359375, 0.2533111572265625, 0.262115478515625, 0.2709197998046875, 0.27972412109375, 0.2885284423828125, 0.297332763671875, 0.3061370849609375, 0.31494140625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 10.0, 17.0, 29.0, 54.0, 125.0, 190.0, 216.0, 157.0, 94.0, 43.0, 29.0, 8.0, 9.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.029994249343872, -1.970624327659607, -1.9112544059753418, -1.8518844842910767, -1.7925145626068115, -1.7331446409225464, -1.6737747192382812, -1.6144049167633057, -1.555034875869751, -1.4956649541854858, -1.4362950325012207, -1.3769251108169556, -1.3175551891326904, -1.2581852674484253, -1.1988153457641602, -1.1394455432891846, -1.0800756216049194, -1.0207056999206543, -0.9613357782363892, -0.901965856552124, -0.8425959348678589, -0.7832260131835938, -0.7238561511039734, -0.6644862294197083, -0.6051163077354431, -0.545746386051178, -0.48637646436691284, -0.4270065724849701, -0.36763665080070496, -0.3082667291164398, -0.24889683723449707, -0.18952691555023193, -0.1301569938659668, -0.07078707963228226, -0.011417165398597717, 0.047952741384506226, 0.10732266306877136, 0.1666925847530365, 0.22606247663497925, 0.2854323983192444, 0.3448023200035095, 0.40417224168777466, 0.4635421633720398, 0.5229120254516602, 0.5822819471359253, 0.6416518688201904, 0.7010217905044556, 0.7603917121887207, 0.8197616338729858, 0.879131555557251, 0.9385014772415161, 0.9978713989257812, 1.0572413206100464, 1.1166112422943115, 1.175981044769287, 1.2353510856628418, 1.2947208881378174, 1.3540908098220825, 1.4134607315063477, 1.4728306531906128, 1.532200574874878, 1.591570496559143, 1.6509404182434082, 1.7103102207183838, 1.7696802616119385]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 6.0, 2.0, 11.0, 9.0, 9.0, 17.0, 13.0, 17.0, 22.0, 21.0, 19.0, 32.0, 25.0, 33.0, 33.0, 39.0, 43.0, 56.0, 34.0, 45.0, 58.0, 43.0, 53.0, 40.0, 36.0, 43.0, 35.0, 35.0, 28.0, 27.0, 23.0, 11.0, 19.0, 13.0, 13.0, 7.0, 12.0, 3.0, 7.0, 6.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.6707677245140076, -0.6523903608322144, -0.6340130567550659, -0.6156356930732727, -0.5972583889961243, -0.578881025314331, -0.5605037212371826, -0.5421263575553894, -0.5237489938735962, -0.505371630191803, -0.48699432611465454, -0.4686169922351837, -0.4502396583557129, -0.4318622946739197, -0.41348496079444885, -0.395107626914978, -0.3767303228378296, -0.35835298895835876, -0.33997565507888794, -0.3215983211994171, -0.3032209873199463, -0.2848436236381531, -0.26646628975868225, -0.24808895587921143, -0.2297116219997406, -0.21133428812026978, -0.19295695424079895, -0.17457960546016693, -0.1562022715806961, -0.13782493770122528, -0.11944759637117386, -0.10107025504112244, -0.08269298076629639, -0.06431564688682556, -0.04593830555677414, -0.027560967952013016, -0.009183630347251892, 0.009193703532218933, 0.027571044862270355, 0.04594838619232178, 0.0643257200717926, 0.08270305395126343, 0.10108039528131485, 0.11945773661136627, 0.1378350704908371, 0.15621240437030792, 0.17458975315093994, 0.19296708703041077, 0.2113444209098816, 0.22972175478935242, 0.24809908866882324, 0.26647642254829407, 0.2848537564277649, 0.3032311201095581, 0.32160845398902893, 0.33998578786849976, 0.3583631217479706, 0.3767404556274414, 0.39511778950691223, 0.41349512338638306, 0.43187248706817627, 0.4502497911453247, 0.4686271548271179, 0.48700448870658875, 0.5053818225860596]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 11.0, 12.0, 21.0, 21.0, 20.0, 30.0, 50.0, 74.0, 154.0, 245.0, 500.0, 1244.0, 3471.0, 10639.0, 39486.0, 189311.0, 594887.0, 159194.0, 34323.0, 9523.0, 3149.0, 1149.0, 489.0, 223.0, 114.0, 81.0, 41.0, 26.0, 16.0, 10.0, 12.0, 6.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.460693359375, -0.446044921875, -0.431396484375, -0.416748046875, -0.402099609375, -0.387451171875, -0.372802734375, -0.358154296875, -0.343505859375, -0.328857421875, -0.314208984375, -0.299560546875, -0.284912109375, -0.270263671875, -0.255615234375, -0.240966796875, -0.226318359375, -0.211669921875, -0.197021484375, -0.182373046875, -0.167724609375, -0.153076171875, -0.138427734375, -0.123779296875, -0.109130859375, -0.094482421875, -0.079833984375, -0.065185546875, -0.050537109375, -0.035888671875, -0.021240234375, -0.006591796875, 0.008056640625, 0.022705078125, 0.037353515625, 0.052001953125, 0.066650390625, 0.081298828125, 0.095947265625, 0.110595703125, 0.125244140625, 0.139892578125, 0.154541015625, 0.169189453125, 0.183837890625, 0.198486328125, 0.213134765625, 0.227783203125, 0.242431640625, 0.257080078125, 0.271728515625, 0.286376953125, 0.301025390625, 0.315673828125, 0.330322265625, 0.344970703125, 0.359619140625, 0.374267578125, 0.388916015625, 0.403564453125, 0.418212890625, 0.432861328125, 0.447509765625, 0.462158203125, 0.476806640625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 9.0, 13.0, 17.0, 23.0, 31.0, 42.0, 41.0, 45.0, 47.0, 45.0, 46.0, 72.0, 70.0, 55.0, 71.0, 63.0, 65.0, 54.0, 38.0, 47.0, 31.0, 20.0, 22.0, 11.0, 17.0, 7.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1129150390625, -0.10968208312988281, -0.10644912719726562, -0.10321617126464844, -0.09998321533203125, -0.09675025939941406, -0.09351730346679688, -0.09028434753417969, -0.0870513916015625, -0.08381843566894531, -0.08058547973632812, -0.07735252380371094, -0.07411956787109375, -0.07088661193847656, -0.06765365600585938, -0.06442070007324219, -0.061187744140625, -0.05795478820800781, -0.054721832275390625, -0.05148887634277344, -0.04825592041015625, -0.04502296447753906, -0.041790008544921875, -0.03855705261230469, -0.0353240966796875, -0.03209114074707031, -0.028858184814453125, -0.025625228881835938, -0.02239227294921875, -0.019159317016601562, -0.015926361083984375, -0.012693405151367188, -0.00946044921875, -0.0062274932861328125, -0.002994537353515625, 0.0002384185791015625, 0.00347137451171875, 0.0067043304443359375, 0.009937286376953125, 0.013170242309570312, 0.0164031982421875, 0.019636154174804688, 0.022869110107421875, 0.026102066040039062, 0.02933502197265625, 0.03256797790527344, 0.035800933837890625, 0.03903388977050781, 0.042266845703125, 0.04549980163574219, 0.048732757568359375, 0.05196571350097656, 0.05519866943359375, 0.05843162536621094, 0.061664581298828125, 0.06489753723144531, 0.0681304931640625, 0.07136344909667969, 0.07459640502929688, 0.07782936096191406, 0.08106231689453125, 0.08429527282714844, 0.08752822875976562, 0.09076118469238281, 0.093994140625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 1.0, 9.0, 5.0, 6.0, 14.0, 16.0, 24.0, 38.0, 50.0, 101.0, 211.0, 574.0, 2340.0, 22070.0, 897075.0, 118674.0, 5638.0, 1038.0, 289.0, 130.0, 68.0, 50.0, 35.0, 20.0, 13.0, 7.0, 14.0, 8.0, 7.0, 4.0, 3.0, 5.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1982421875, -1.153411865234375, -1.10858154296875, -1.063751220703125, -1.0189208984375, -0.974090576171875, -0.92926025390625, -0.884429931640625, -0.839599609375, -0.794769287109375, -0.74993896484375, -0.705108642578125, -0.6602783203125, -0.615447998046875, -0.57061767578125, -0.525787353515625, -0.48095703125, -0.436126708984375, -0.39129638671875, -0.346466064453125, -0.3016357421875, -0.256805419921875, -0.21197509765625, -0.167144775390625, -0.122314453125, -0.077484130859375, -0.03265380859375, 0.012176513671875, 0.0570068359375, 0.101837158203125, 0.14666748046875, 0.191497802734375, 0.236328125, 0.281158447265625, 0.32598876953125, 0.370819091796875, 0.4156494140625, 0.460479736328125, 0.50531005859375, 0.550140380859375, 0.594970703125, 0.639801025390625, 0.68463134765625, 0.729461669921875, 0.7742919921875, 0.819122314453125, 0.86395263671875, 0.908782958984375, 0.95361328125, 0.998443603515625, 1.04327392578125, 1.088104248046875, 1.1329345703125, 1.177764892578125, 1.22259521484375, 1.267425537109375, 1.312255859375, 1.357086181640625, 1.40191650390625, 1.446746826171875, 1.4915771484375, 1.536407470703125, 1.58123779296875, 1.626068115234375, 1.6708984375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 6.0, 2.0, 4.0, 5.0, 6.0, 10.0, 14.0, 16.0, 22.0, 28.0, 36.0, 38.0, 41.0, 38.0, 55.0, 70.0, 60.0, 57.0, 56.0, 59.0, 59.0, 42.0, 33.0, 37.0, 34.0, 34.0, 21.0, 25.0, 14.0, 15.0, 14.0, 12.0, 9.0, 6.0, 2.0, 3.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.242919921875, -0.23511505126953125, -0.2273101806640625, -0.21950531005859375, -0.211700439453125, -0.20389556884765625, -0.1960906982421875, -0.18828582763671875, -0.18048095703125, -0.17267608642578125, -0.1648712158203125, -0.15706634521484375, -0.149261474609375, -0.14145660400390625, -0.1336517333984375, -0.12584686279296875, -0.1180419921875, -0.11023712158203125, -0.1024322509765625, -0.09462738037109375, -0.086822509765625, -0.07901763916015625, -0.0712127685546875, -0.06340789794921875, -0.05560302734375, -0.04779815673828125, -0.0399932861328125, -0.03218841552734375, -0.024383544921875, -0.01657867431640625, -0.0087738037109375, -0.00096893310546875, 0.0068359375, 0.01464080810546875, 0.0224456787109375, 0.03025054931640625, 0.038055419921875, 0.04586029052734375, 0.0536651611328125, 0.06147003173828125, 0.06927490234375, 0.07707977294921875, 0.0848846435546875, 0.09268951416015625, 0.100494384765625, 0.10829925537109375, 0.1161041259765625, 0.12390899658203125, 0.1317138671875, 0.13951873779296875, 0.1473236083984375, 0.15512847900390625, 0.162933349609375, 0.17073822021484375, 0.1785430908203125, 0.18634796142578125, 0.19415283203125, 0.20195770263671875, 0.2097625732421875, 0.21756744384765625, 0.225372314453125, 0.23317718505859375, 0.2409820556640625, 0.24878692626953125, 0.256591796875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 7.0, 3.0, 7.0, 13.0, 21.0, 36.0, 70.0, 97.0, 185.0, 394.0, 770.0, 1693.0, 4707.0, 16272.0, 120320.0, 770383.0, 110344.0, 15613.0, 4401.0, 1687.0, 754.0, 342.0, 168.0, 100.0, 62.0, 31.0, 24.0, 16.0, 8.0, 10.0, 6.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.183349609375, -0.1778736114501953, -0.17239761352539062, -0.16692161560058594, -0.16144561767578125, -0.15596961975097656, -0.15049362182617188, -0.1450176239013672, -0.1395416259765625, -0.1340656280517578, -0.12858963012695312, -0.12311363220214844, -0.11763763427734375, -0.11216163635253906, -0.10668563842773438, -0.10120964050292969, -0.095733642578125, -0.09025764465332031, -0.08478164672851562, -0.07930564880371094, -0.07382965087890625, -0.06835365295410156, -0.06287765502929688, -0.05740165710449219, -0.0519256591796875, -0.04644966125488281, -0.040973663330078125, -0.03549766540527344, -0.03002166748046875, -0.024545669555664062, -0.019069671630859375, -0.013593673706054688, -0.00811767578125, -0.0026416778564453125, 0.002834320068359375, 0.008310317993164062, 0.01378631591796875, 0.019262313842773438, 0.024738311767578125, 0.030214309692382812, 0.0356903076171875, 0.04116630554199219, 0.046642303466796875, 0.05211830139160156, 0.05759429931640625, 0.06307029724121094, 0.06854629516601562, 0.07402229309082031, 0.079498291015625, 0.08497428894042969, 0.09045028686523438, 0.09592628479003906, 0.10140228271484375, 0.10687828063964844, 0.11235427856445312, 0.11783027648925781, 0.1233062744140625, 0.1287822723388672, 0.13425827026367188, 0.13973426818847656, 0.14521026611328125, 0.15068626403808594, 0.15616226196289062, 0.1616382598876953, 0.1671142578125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 5.0, 0.0, 2.0, 3.0, 2.0, 15.0, 18.0, 17.0, 31.0, 32.0, 54.0, 93.0, 157.0, 186.0, 156.0, 90.0, 53.0, 26.0, 21.0, 13.0, 10.0, 7.0, 9.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3663043975830078e-05, -2.282857894897461e-05, -2.199411392211914e-05, -2.1159648895263672e-05, -2.0325183868408203e-05, -1.9490718841552734e-05, -1.8656253814697266e-05, -1.7821788787841797e-05, -1.6987323760986328e-05, -1.615285873413086e-05, -1.531839370727539e-05, -1.4483928680419922e-05, -1.3649463653564453e-05, -1.2814998626708984e-05, -1.1980533599853516e-05, -1.1146068572998047e-05, -1.0311603546142578e-05, -9.47713851928711e-06, -8.64267349243164e-06, -7.808208465576172e-06, -6.973743438720703e-06, -6.139278411865234e-06, -5.304813385009766e-06, -4.470348358154297e-06, -3.635883331298828e-06, -2.8014183044433594e-06, -1.9669532775878906e-06, -1.1324882507324219e-06, -2.980232238769531e-07, 5.364418029785156e-07, 1.3709068298339844e-06, 2.205371856689453e-06, 3.039836883544922e-06, 3.874301910400391e-06, 4.708766937255859e-06, 5.543231964111328e-06, 6.377696990966797e-06, 7.212162017822266e-06, 8.046627044677734e-06, 8.881092071533203e-06, 9.715557098388672e-06, 1.055002212524414e-05, 1.138448715209961e-05, 1.2218952178955078e-05, 1.3053417205810547e-05, 1.3887882232666016e-05, 1.4722347259521484e-05, 1.5556812286376953e-05, 1.6391277313232422e-05, 1.722574234008789e-05, 1.806020736694336e-05, 1.8894672393798828e-05, 1.9729137420654297e-05, 2.0563602447509766e-05, 2.1398067474365234e-05, 2.2232532501220703e-05, 2.3066997528076172e-05, 2.390146255493164e-05, 2.473592758178711e-05, 2.5570392608642578e-05, 2.6404857635498047e-05, 2.7239322662353516e-05, 2.8073787689208984e-05, 2.8908252716064453e-05, 2.9742717742919922e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 14.0, 17.0, 24.0, 65.0, 143.0, 446.0, 2570.0, 47139.0, 975922.0, 19984.0, 1639.0, 341.0, 111.0, 65.0, 21.0, 14.0, 6.0, 12.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51611328125, -0.5019302368164062, -0.4877471923828125, -0.47356414794921875, -0.459381103515625, -0.44519805908203125, -0.4310150146484375, -0.41683197021484375, -0.40264892578125, -0.38846588134765625, -0.3742828369140625, -0.36009979248046875, -0.345916748046875, -0.33173370361328125, -0.3175506591796875, -0.30336761474609375, -0.2891845703125, -0.27500152587890625, -0.2608184814453125, -0.24663543701171875, -0.232452392578125, -0.21826934814453125, -0.2040863037109375, -0.18990325927734375, -0.17572021484375, -0.16153717041015625, -0.1473541259765625, -0.13317108154296875, -0.118988037109375, -0.10480499267578125, -0.0906219482421875, -0.07643890380859375, -0.062255859375, -0.04807281494140625, -0.0338897705078125, -0.01970672607421875, -0.005523681640625, 0.00865936279296875, 0.0228424072265625, 0.03702545166015625, 0.05120849609375, 0.06539154052734375, 0.0795745849609375, 0.09375762939453125, 0.107940673828125, 0.12212371826171875, 0.1363067626953125, 0.15048980712890625, 0.1646728515625, 0.17885589599609375, 0.1930389404296875, 0.20722198486328125, 0.221405029296875, 0.23558807373046875, 0.2497711181640625, 0.26395416259765625, 0.27813720703125, 0.29232025146484375, 0.3065032958984375, 0.32068634033203125, 0.334869384765625, 0.34905242919921875, 0.3632354736328125, 0.37741851806640625, 0.3916015625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 7.0, 9.0, 3.0, 22.0, 25.0, 27.0, 40.0, 43.0, 65.0, 78.0, 99.0, 102.0, 93.0, 96.0, 81.0, 49.0, 34.0, 27.0, 18.0, 11.0, 10.0, 5.0, 7.0, 2.0, 8.0, 3.0, 5.0, 6.0, 5.0, 5.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.060211181640625, -0.05801820755004883, -0.055825233459472656, -0.053632259368896484, -0.05143928527832031, -0.04924631118774414, -0.04705333709716797, -0.0448603630065918, -0.042667388916015625, -0.04047441482543945, -0.03828144073486328, -0.03608846664428711, -0.03389549255371094, -0.031702518463134766, -0.029509544372558594, -0.027316570281982422, -0.02512359619140625, -0.022930622100830078, -0.020737648010253906, -0.018544673919677734, -0.016351699829101562, -0.01415872573852539, -0.011965751647949219, -0.009772777557373047, -0.007579803466796875, -0.005386829376220703, -0.0031938552856445312, -0.0010008811950683594, 0.0011920928955078125, 0.0033850669860839844, 0.005578041076660156, 0.007771015167236328, 0.0099639892578125, 0.012156963348388672, 0.014349937438964844, 0.016542911529541016, 0.018735885620117188, 0.02092885971069336, 0.02312183380126953, 0.025314807891845703, 0.027507781982421875, 0.029700756072998047, 0.03189373016357422, 0.03408670425415039, 0.03627967834472656, 0.038472652435302734, 0.040665626525878906, 0.04285860061645508, 0.04505157470703125, 0.04724454879760742, 0.049437522888183594, 0.051630496978759766, 0.05382347106933594, 0.05601644515991211, 0.05820941925048828, 0.06040239334106445, 0.06259536743164062, 0.0647883415222168, 0.06698131561279297, 0.06917428970336914, 0.07136726379394531, 0.07356023788452148, 0.07575321197509766, 0.07794618606567383, 0.08013916015625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 8.0, 11.0, 18.0, 24.0, 68.0, 97.0, 157.0, 176.0, 205.0, 95.0, 78.0, 23.0, 22.0, 10.0, 8.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0946606397628784, -1.0392156839370728, -0.9837707281112671, -0.9283257722854614, -0.8728808164596558, -0.8174358606338501, -0.7619909048080444, -0.7065459489822388, -0.6511009931564331, -0.5956560373306274, -0.5402110815048218, -0.4847661256790161, -0.42932116985321045, -0.3738762140274048, -0.3184312582015991, -0.26298630237579346, -0.2075413465499878, -0.15209639072418213, -0.09665143489837646, -0.0412064790725708, 0.014238476753234863, 0.06968343257904053, 0.1251283884048462, 0.18057334423065186, 0.23601830005645752, 0.2914632558822632, 0.34690821170806885, 0.4023531675338745, 0.4577981233596802, 0.5132430791854858, 0.5686880350112915, 0.6241329908370972, 0.6795778274536133, 0.735022783279419, 0.7904677391052246, 0.8459126949310303, 0.9013576507568359, 0.9568026065826416, 1.0122475624084473, 1.067692518234253, 1.1231374740600586, 1.1785824298858643, 1.23402738571167, 1.2894723415374756, 1.3449172973632812, 1.400362253189087, 1.4558072090148926, 1.5112521648406982, 1.566697120666504, 1.6221420764923096, 1.6775870323181152, 1.733031988143921, 1.7884769439697266, 1.8439218997955322, 1.899366855621338, 1.9548118114471436, 2.010256767272949, 2.065701723098755, 2.1211466789245605, 2.176591634750366, 2.232036590576172, 2.2874815464019775, 2.342926502227783, 2.398371458053589, 2.4538164138793945]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 8.0, 4.0, 8.0, 8.0, 16.0, 8.0, 14.0, 16.0, 16.0, 13.0, 17.0, 32.0, 34.0, 35.0, 34.0, 35.0, 46.0, 45.0, 30.0, 38.0, 42.0, 34.0, 31.0, 42.0, 46.0, 34.0, 40.0, 36.0, 29.0, 27.0, 34.0, 21.0, 21.0, 20.0, 17.0, 8.0, 11.0, 17.0, 10.0, 6.0, 7.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.5861512422561646, -0.5680791139602661, -0.5500070452690125, -0.531934916973114, -0.5138627886772156, -0.4957906901836395, -0.4777185916900635, -0.45964646339416504, -0.441574364900589, -0.42350226640701294, -0.4054301381111145, -0.38735803961753845, -0.3692859411239624, -0.35121381282806396, -0.3331417143344879, -0.31506961584091187, -0.2969974875450134, -0.2789253890514374, -0.26085326075553894, -0.2427811622619629, -0.22470904886722565, -0.2066369354724884, -0.18856483697891235, -0.1704927235841751, -0.15242061018943787, -0.13434849679470062, -0.11627639085054398, -0.09820428490638733, -0.08013217151165009, -0.06206005811691284, -0.043987952172756195, -0.02591584622859955, -0.007843732833862305, 0.01022837683558464, 0.028300486505031586, 0.04637259617447853, 0.06444470584392548, 0.08251681923866272, 0.10058892518281937, 0.11866103112697601, 0.13673314452171326, 0.1548052579164505, 0.17287737131118774, 0.1909494698047638, 0.20902158319950104, 0.22709369659423828, 0.24516579508781433, 0.2632378935813904, 0.2813100218772888, 0.29938212037086487, 0.3174542486667633, 0.33552634716033936, 0.3535984754562378, 0.37167057394981384, 0.3897426724433899, 0.40781480073928833, 0.4258868992328644, 0.44395899772644043, 0.46203112602233887, 0.4801032245159149, 0.49817532300949097, 0.5162474513053894, 0.5343195796012878, 0.5523916482925415, 0.5704637765884399]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 16.0, 13.0, 39.0, 45.0, 111.0, 151.0, 389.0, 1069.0, 3950.0, 18020.0, 190441.0, 3768620.0, 187341.0, 18295.0, 3922.0, 1124.0, 369.0, 178.0, 82.0, 34.0, 32.0, 14.0, 6.0, 8.0, 7.0, 10.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.331298828125, -0.3177757263183594, -0.30425262451171875, -0.2907295227050781, -0.2772064208984375, -0.2636833190917969, -0.25016021728515625, -0.23663711547851562, -0.223114013671875, -0.20959091186523438, -0.19606781005859375, -0.18254470825195312, -0.1690216064453125, -0.15549850463867188, -0.14197540283203125, -0.12845230102539062, -0.11492919921875, -0.10140609741210938, -0.08788299560546875, -0.07435989379882812, -0.0608367919921875, -0.047313690185546875, -0.03379058837890625, -0.020267486572265625, -0.006744384765625, 0.006778717041015625, 0.02030181884765625, 0.033824920654296875, 0.0473480224609375, 0.060871124267578125, 0.07439422607421875, 0.08791732788085938, 0.1014404296875, 0.11496353149414062, 0.12848663330078125, 0.14200973510742188, 0.1555328369140625, 0.16905593872070312, 0.18257904052734375, 0.19610214233398438, 0.209625244140625, 0.22314834594726562, 0.23667144775390625, 0.2501945495605469, 0.2637176513671875, 0.2772407531738281, 0.29076385498046875, 0.3042869567871094, 0.31781005859375, 0.3313331604003906, 0.34485626220703125, 0.3583793640136719, 0.3719024658203125, 0.3854255676269531, 0.39894866943359375, 0.4124717712402344, 0.425994873046875, 0.4395179748535156, 0.45304107666015625, 0.4665641784667969, 0.4800872802734375, 0.4936103820800781, 0.5071334838867188, 0.5206565856933594, 0.5341796875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 3.0, 13.0, 14.0, 26.0, 27.0, 37.0, 29.0, 44.0, 45.0, 59.0, 53.0, 68.0, 58.0, 50.0, 65.0, 63.0, 55.0, 39.0, 63.0, 36.0, 33.0, 21.0, 28.0, 26.0, 10.0, 9.0, 11.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11212158203125, -0.1087656021118164, -0.10540962219238281, -0.10205364227294922, -0.09869766235351562, -0.09534168243408203, -0.09198570251464844, -0.08862972259521484, -0.08527374267578125, -0.08191776275634766, -0.07856178283691406, -0.07520580291748047, -0.07184982299804688, -0.06849384307861328, -0.06513786315917969, -0.061781883239746094, -0.0584259033203125, -0.055069923400878906, -0.05171394348144531, -0.04835796356201172, -0.045001983642578125, -0.04164600372314453, -0.03829002380371094, -0.034934043884277344, -0.03157806396484375, -0.028222084045410156, -0.024866104125976562, -0.02151012420654297, -0.018154144287109375, -0.014798164367675781, -0.011442184448242188, -0.008086204528808594, -0.004730224609375, -0.0013742446899414062, 0.0019817352294921875, 0.005337715148925781, 0.008693695068359375, 0.012049674987792969, 0.015405654907226562, 0.018761634826660156, 0.02211761474609375, 0.025473594665527344, 0.028829574584960938, 0.03218555450439453, 0.035541534423828125, 0.03889751434326172, 0.04225349426269531, 0.045609474182128906, 0.0489654541015625, 0.052321434020996094, 0.05567741394042969, 0.05903339385986328, 0.062389373779296875, 0.06574535369873047, 0.06910133361816406, 0.07245731353759766, 0.07581329345703125, 0.07916927337646484, 0.08252525329589844, 0.08588123321533203, 0.08923721313476562, 0.09259319305419922, 0.09594917297363281, 0.0993051528930664, 0.1026611328125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 8.0, 6.0, 6.0, 11.0, 9.0, 12.0, 28.0, 39.0, 41.0, 61.0, 86.0, 119.0, 191.0, 237.0, 465.0, 680.0, 1219.0, 2172.0, 4674.0, 12172.0, 47103.0, 498484.0, 3443235.0, 143206.0, 24477.0, 7867.0, 3427.0, 1638.0, 952.0, 562.0, 329.0, 246.0, 162.0, 90.0, 78.0, 47.0, 34.0, 26.0, 26.0, 17.0, 12.0, 9.0, 8.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.458251953125, -0.4440574645996094, -0.42986297607421875, -0.4156684875488281, -0.4014739990234375, -0.3872795104980469, -0.37308502197265625, -0.3588905334472656, -0.344696044921875, -0.3305015563964844, -0.31630706787109375, -0.3021125793457031, -0.2879180908203125, -0.2737236022949219, -0.25952911376953125, -0.24533462524414062, -0.23114013671875, -0.21694564819335938, -0.20275115966796875, -0.18855667114257812, -0.1743621826171875, -0.16016769409179688, -0.14597320556640625, -0.13177871704101562, -0.117584228515625, -0.10338973999023438, -0.08919525146484375, -0.07500076293945312, -0.0608062744140625, -0.046611785888671875, -0.03241729736328125, -0.018222808837890625, -0.0040283203125, 0.010166168212890625, 0.02436065673828125, 0.038555145263671875, 0.0527496337890625, 0.06694412231445312, 0.08113861083984375, 0.09533309936523438, 0.109527587890625, 0.12372207641601562, 0.13791656494140625, 0.15211105346679688, 0.1663055419921875, 0.18050003051757812, 0.19469451904296875, 0.20888900756835938, 0.22308349609375, 0.23727798461914062, 0.25147247314453125, 0.2656669616699219, 0.2798614501953125, 0.2940559387207031, 0.30825042724609375, 0.3224449157714844, 0.336639404296875, 0.3508338928222656, 0.36502838134765625, 0.3792228698730469, 0.3934173583984375, 0.4076118469238281, 0.42180633544921875, 0.4360008239746094, 0.4501953125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 6.0, 10.0, 18.0, 23.0, 37.0, 74.0, 115.0, 298.0, 845.0, 1556.0, 598.0, 215.0, 126.0, 49.0, 34.0, 14.0, 12.0, 13.0, 5.0, 4.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42041015625, -0.4070091247558594, -0.39360809326171875, -0.3802070617675781, -0.3668060302734375, -0.3534049987792969, -0.34000396728515625, -0.3266029357910156, -0.313201904296875, -0.2998008728027344, -0.28639984130859375, -0.2729988098144531, -0.2595977783203125, -0.24619674682617188, -0.23279571533203125, -0.21939468383789062, -0.20599365234375, -0.19259262084960938, -0.17919158935546875, -0.16579055786132812, -0.1523895263671875, -0.13898849487304688, -0.12558746337890625, -0.11218643188476562, -0.098785400390625, -0.08538436889648438, -0.07198333740234375, -0.058582305908203125, -0.0451812744140625, -0.031780242919921875, -0.01837921142578125, -0.004978179931640625, 0.0084228515625, 0.021823883056640625, 0.03522491455078125, 0.048625946044921875, 0.0620269775390625, 0.07542800903320312, 0.08882904052734375, 0.10223007202148438, 0.115631103515625, 0.12903213500976562, 0.14243316650390625, 0.15583419799804688, 0.1692352294921875, 0.18263626098632812, 0.19603729248046875, 0.20943832397460938, 0.22283935546875, 0.23624038696289062, 0.24964141845703125, 0.2630424499511719, 0.2764434814453125, 0.2898445129394531, 0.30324554443359375, 0.3166465759277344, 0.330047607421875, 0.3434486389160156, 0.35684967041015625, 0.3702507019042969, 0.3836517333984375, 0.3970527648925781, 0.41045379638671875, 0.4238548278808594, 0.437255859375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 6.0, 8.0, 15.0, 32.0, 50.0, 115.0, 199.0, 250.0, 168.0, 83.0, 36.0, 19.0, 11.0, 8.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.069161295890808, -0.9986083507537842, -0.9280553460121155, -0.8575024008750916, -0.7869493961334229, -0.7163964509963989, -0.645843505859375, -0.5752905607223511, -0.5047375559806824, -0.43418458104133606, -0.36363160610198975, -0.2930786609649658, -0.2225256860256195, -0.1519727110862732, -0.08141976594924927, -0.010866791009902954, 0.05968618392944336, 0.13023915886878967, 0.2007921189069748, 0.2713450789451599, 0.3418980538845062, 0.41245102882385254, 0.48300397396087646, 0.5535569190979004, 0.6241099238395691, 0.694662868976593, 0.7652158737182617, 0.8357688188552856, 0.9063217639923096, 0.9768747687339783, 1.0474276542663574, 1.117980718612671, 1.1885337829589844, 1.2590867280960083, 1.3296396732330322, 1.4001927375793457, 1.4707456827163696, 1.5412986278533936, 1.6118515729904175, 1.6824045181274414, 1.7529575824737549, 1.8235105276107788, 1.8940634727478027, 1.9646165370941162, 2.0351693630218506, 2.105722427368164, 2.1762752532958984, 2.246828317642212, 2.3173813819885254, 2.387934446334839, 2.4584872722625732, 2.5290403366088867, 2.599593162536621, 2.6701462268829346, 2.740699291229248, 2.8112521171569824, 2.881804943084717, 2.9523580074310303, 3.0229108333587646, 3.093463897705078, 3.1640167236328125, 3.234569787979126, 3.3051228523254395, 3.375675678253174, 3.4462287425994873]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 5.0, 9.0, 7.0, 4.0, 14.0, 6.0, 20.0, 21.0, 13.0, 20.0, 19.0, 19.0, 34.0, 47.0, 47.0, 31.0, 37.0, 54.0, 43.0, 43.0, 49.0, 44.0, 55.0, 33.0, 52.0, 41.0, 33.0, 20.0, 32.0, 23.0, 26.0, 17.0, 19.0, 15.0, 16.0, 9.0, 7.0, 6.0, 5.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.8471047878265381, -0.8246310949325562, -0.8021573424339294, -0.7796836495399475, -0.7572098970413208, -0.7347362041473389, -0.7122625112533569, -0.689788818359375, -0.6673150658607483, -0.6448413729667664, -0.6223676204681396, -0.5998939275741577, -0.5774202346801758, -0.5549464821815491, -0.5324727892875671, -0.5099990367889404, -0.4875253438949585, -0.4650516211986542, -0.44257789850234985, -0.4201042056083679, -0.3976304829120636, -0.3751567602157593, -0.35268306732177734, -0.330209344625473, -0.3077356219291687, -0.2852618992328644, -0.26278817653656006, -0.24031448364257812, -0.2178407609462738, -0.19536703824996948, -0.17289333045482635, -0.15041962265968323, -0.12794584035873413, -0.1054721251130104, -0.08299840986728668, -0.06052469462156296, -0.03805097937583923, -0.015577264130115509, 0.006896451115608215, 0.029370158910751343, 0.051843881607055664, 0.07431759685277939, 0.09679131209850311, 0.11926502734422684, 0.14173874258995056, 0.16421246528625488, 0.186686173081398, 0.20915988087654114, 0.23163360357284546, 0.2541073262691498, 0.2765810489654541, 0.29905474185943604, 0.32152846455574036, 0.3440021872520447, 0.3664758801460266, 0.38894960284233093, 0.41142332553863525, 0.4338970482349396, 0.4563707709312439, 0.47884446382522583, 0.5013182163238525, 0.5237919092178345, 0.5462656021118164, 0.5687392950057983, 0.591213047504425]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 8.0, 5.0, 12.0, 12.0, 27.0, 22.0, 27.0, 30.0, 56.0, 77.0, 131.0, 234.0, 403.0, 856.0, 1837.0, 4266.0, 11322.0, 31810.0, 98713.0, 318975.0, 386451.0, 129368.0, 40235.0, 13989.0, 5249.0, 2283.0, 944.0, 482.0, 261.0, 130.0, 97.0, 57.0, 55.0, 27.0, 18.0, 21.0, 11.0, 8.0, 12.0, 5.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.345458984375, -0.3335914611816406, -0.32172393798828125, -0.3098564147949219, -0.2979888916015625, -0.2861213684082031, -0.27425384521484375, -0.2623863220214844, -0.250518798828125, -0.23865127563476562, -0.22678375244140625, -0.21491622924804688, -0.2030487060546875, -0.19118118286132812, -0.17931365966796875, -0.16744613647460938, -0.15557861328125, -0.14371109008789062, -0.13184356689453125, -0.11997604370117188, -0.1081085205078125, -0.09624099731445312, -0.08437347412109375, -0.07250595092773438, -0.060638427734375, -0.048770904541015625, -0.03690338134765625, -0.025035858154296875, -0.0131683349609375, -0.001300811767578125, 0.01056671142578125, 0.022434234619140625, 0.0343017578125, 0.046169281005859375, 0.05803680419921875, 0.06990432739257812, 0.0817718505859375, 0.09363937377929688, 0.10550689697265625, 0.11737442016601562, 0.129241943359375, 0.14110946655273438, 0.15297698974609375, 0.16484451293945312, 0.1767120361328125, 0.18857955932617188, 0.20044708251953125, 0.21231460571289062, 0.22418212890625, 0.23604965209960938, 0.24791717529296875, 0.2597846984863281, 0.2716522216796875, 0.2835197448730469, 0.29538726806640625, 0.3072547912597656, 0.319122314453125, 0.3309898376464844, 0.34285736083984375, 0.3547248840332031, 0.3665924072265625, 0.3784599304199219, 0.39032745361328125, 0.4021949768066406, 0.4140625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 7.0, 8.0, 21.0, 26.0, 29.0, 43.0, 42.0, 56.0, 48.0, 77.0, 68.0, 70.0, 79.0, 63.0, 73.0, 57.0, 43.0, 45.0, 43.0, 34.0, 23.0, 11.0, 11.0, 9.0, 8.0, 7.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.148681640625, -0.14441680908203125, -0.1401519775390625, -0.13588714599609375, -0.131622314453125, -0.12735748291015625, -0.1230926513671875, -0.11882781982421875, -0.11456298828125, -0.11029815673828125, -0.1060333251953125, -0.10176849365234375, -0.097503662109375, -0.09323883056640625, -0.0889739990234375, -0.08470916748046875, -0.0804443359375, -0.07617950439453125, -0.0719146728515625, -0.06764984130859375, -0.063385009765625, -0.05912017822265625, -0.0548553466796875, -0.05059051513671875, -0.04632568359375, -0.04206085205078125, -0.0377960205078125, -0.03353118896484375, -0.029266357421875, -0.02500152587890625, -0.0207366943359375, -0.01647186279296875, -0.01220703125, -0.00794219970703125, -0.0036773681640625, 0.00058746337890625, 0.004852294921875, 0.00911712646484375, 0.0133819580078125, 0.01764678955078125, 0.02191162109375, 0.02617645263671875, 0.0304412841796875, 0.03470611572265625, 0.038970947265625, 0.04323577880859375, 0.0475006103515625, 0.05176544189453125, 0.0560302734375, 0.06029510498046875, 0.0645599365234375, 0.06882476806640625, 0.073089599609375, 0.07735443115234375, 0.0816192626953125, 0.08588409423828125, 0.09014892578125, 0.09441375732421875, 0.0986785888671875, 0.10294342041015625, 0.107208251953125, 0.11147308349609375, 0.1157379150390625, 0.12000274658203125, 0.124267578125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 7.0, 4.0, 6.0, 9.0, 13.0, 19.0, 27.0, 45.0, 80.0, 146.0, 381.0, 1020.0, 3801.0, 23816.0, 369151.0, 607088.0, 35653.0, 5234.0, 1234.0, 395.0, 174.0, 83.0, 52.0, 22.0, 19.0, 13.0, 14.0, 10.0, 3.0, 5.0, 4.0, 3.0, 6.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.05078125, -1.018035888671875, -0.98529052734375, -0.952545166015625, -0.9197998046875, -0.887054443359375, -0.85430908203125, -0.821563720703125, -0.788818359375, -0.756072998046875, -0.72332763671875, -0.690582275390625, -0.6578369140625, -0.625091552734375, -0.59234619140625, -0.559600830078125, -0.52685546875, -0.494110107421875, -0.46136474609375, -0.428619384765625, -0.3958740234375, -0.363128662109375, -0.33038330078125, -0.297637939453125, -0.264892578125, -0.232147216796875, -0.19940185546875, -0.166656494140625, -0.1339111328125, -0.101165771484375, -0.06842041015625, -0.035675048828125, -0.0029296875, 0.029815673828125, 0.06256103515625, 0.095306396484375, 0.1280517578125, 0.160797119140625, 0.19354248046875, 0.226287841796875, 0.259033203125, 0.291778564453125, 0.32452392578125, 0.357269287109375, 0.3900146484375, 0.422760009765625, 0.45550537109375, 0.488250732421875, 0.52099609375, 0.553741455078125, 0.58648681640625, 0.619232177734375, 0.6519775390625, 0.684722900390625, 0.71746826171875, 0.750213623046875, 0.782958984375, 0.815704345703125, 0.84844970703125, 0.881195068359375, 0.9139404296875, 0.946685791015625, 0.97943115234375, 1.012176513671875, 1.044921875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 0.0, 1.0, 5.0, 3.0, 9.0, 6.0, 3.0, 11.0, 16.0, 13.0, 13.0, 12.0, 22.0, 18.0, 27.0, 28.0, 32.0, 33.0, 35.0, 31.0, 35.0, 44.0, 53.0, 53.0, 51.0, 54.0, 40.0, 52.0, 36.0, 45.0, 33.0, 34.0, 21.0, 22.0, 16.0, 20.0, 11.0, 14.0, 8.0, 12.0, 6.0, 10.0, 1.0, 2.0, 4.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.28955078125, -0.28052520751953125, -0.2714996337890625, -0.26247406005859375, -0.253448486328125, -0.24442291259765625, -0.2353973388671875, -0.22637176513671875, -0.21734619140625, -0.20832061767578125, -0.1992950439453125, -0.19026947021484375, -0.181243896484375, -0.17221832275390625, -0.1631927490234375, -0.15416717529296875, -0.1451416015625, -0.13611602783203125, -0.1270904541015625, -0.11806488037109375, -0.109039306640625, -0.10001373291015625, -0.0909881591796875, -0.08196258544921875, -0.07293701171875, -0.06391143798828125, -0.0548858642578125, -0.04586029052734375, -0.036834716796875, -0.02780914306640625, -0.0187835693359375, -0.00975799560546875, -0.000732421875, 0.00829315185546875, 0.0173187255859375, 0.02634429931640625, 0.035369873046875, 0.04439544677734375, 0.0534210205078125, 0.06244659423828125, 0.07147216796875, 0.08049774169921875, 0.0895233154296875, 0.09854888916015625, 0.107574462890625, 0.11660003662109375, 0.1256256103515625, 0.13465118408203125, 0.1436767578125, 0.15270233154296875, 0.1617279052734375, 0.17075347900390625, 0.179779052734375, 0.18880462646484375, 0.1978302001953125, 0.20685577392578125, 0.21588134765625, 0.22490692138671875, 0.2339324951171875, 0.24295806884765625, 0.251983642578125, 0.26100921630859375, 0.2700347900390625, 0.27906036376953125, 0.2880859375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 9.0, 3.0, 2.0, 6.0, 5.0, 14.0, 14.0, 26.0, 36.0, 58.0, 121.0, 194.0, 362.0, 679.0, 1263.0, 2417.0, 5159.0, 11315.0, 28548.0, 131961.0, 763581.0, 65448.0, 20523.0, 8689.0, 3956.0, 1966.0, 957.0, 544.0, 295.0, 154.0, 98.0, 55.0, 35.0, 21.0, 11.0, 11.0, 9.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.351806640625, -0.3412513732910156, -0.33069610595703125, -0.3201408386230469, -0.3095855712890625, -0.2990303039550781, -0.28847503662109375, -0.2779197692871094, -0.267364501953125, -0.2568092346191406, -0.24625396728515625, -0.23569869995117188, -0.2251434326171875, -0.21458816528320312, -0.20403289794921875, -0.19347763061523438, -0.18292236328125, -0.17236709594726562, -0.16181182861328125, -0.15125656127929688, -0.1407012939453125, -0.13014602661132812, -0.11959075927734375, -0.10903549194335938, -0.098480224609375, -0.08792495727539062, -0.07736968994140625, -0.06681442260742188, -0.0562591552734375, -0.045703887939453125, -0.03514862060546875, -0.024593353271484375, -0.0140380859375, -0.003482818603515625, 0.00707244873046875, 0.017627716064453125, 0.0281829833984375, 0.038738250732421875, 0.04929351806640625, 0.059848785400390625, 0.070404052734375, 0.08095932006835938, 0.09151458740234375, 0.10206985473632812, 0.1126251220703125, 0.12318038940429688, 0.13373565673828125, 0.14429092407226562, 0.15484619140625, 0.16540145874023438, 0.17595672607421875, 0.18651199340820312, 0.1970672607421875, 0.20762252807617188, 0.21817779541015625, 0.22873306274414062, 0.239288330078125, 0.24984359741210938, 0.26039886474609375, 0.2709541320800781, 0.2815093994140625, 0.2920646667480469, 0.30261993408203125, 0.3131752014160156, 0.32373046875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 6.0, 5.0, 6.0, 8.0, 6.0, 11.0, 7.0, 21.0, 40.0, 60.0, 112.0, 204.0, 206.0, 120.0, 52.0, 31.0, 23.0, 8.0, 15.0, 5.0, 10.0, 5.0, 5.0, 3.0, 5.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.4955482482910156e-05, -5.3239986300468445e-05, -5.1524490118026733e-05, -4.980899393558502e-05, -4.809349775314331e-05, -4.63780015707016e-05, -4.466250538825989e-05, -4.2947009205818176e-05, -4.1231513023376465e-05, -3.9516016840934753e-05, -3.780052065849304e-05, -3.608502447605133e-05, -3.436952829360962e-05, -3.265403211116791e-05, -3.0938535928726196e-05, -2.9223039746284485e-05, -2.7507543563842773e-05, -2.5792047381401062e-05, -2.407655119895935e-05, -2.236105501651764e-05, -2.0645558834075928e-05, -1.8930062651634216e-05, -1.7214566469192505e-05, -1.5499070286750793e-05, -1.3783574104309082e-05, -1.206807792186737e-05, -1.035258173942566e-05, -8.637085556983948e-06, -6.921589374542236e-06, -5.206093192100525e-06, -3.4905970096588135e-06, -1.775100827217102e-06, -5.960464477539063e-08, 1.6558915376663208e-06, 3.3713877201080322e-06, 5.086883902549744e-06, 6.802380084991455e-06, 8.517876267433167e-06, 1.0233372449874878e-05, 1.194886863231659e-05, 1.36643648147583e-05, 1.5379860997200012e-05, 1.7095357179641724e-05, 1.8810853362083435e-05, 2.0526349544525146e-05, 2.2241845726966858e-05, 2.395734190940857e-05, 2.567283809185028e-05, 2.7388334274291992e-05, 2.9103830456733704e-05, 3.0819326639175415e-05, 3.2534822821617126e-05, 3.425031900405884e-05, 3.596581518650055e-05, 3.768131136894226e-05, 3.939680755138397e-05, 4.1112303733825684e-05, 4.2827799916267395e-05, 4.4543296098709106e-05, 4.625879228115082e-05, 4.797428846359253e-05, 4.968978464603424e-05, 5.140528082847595e-05, 5.3120777010917664e-05, 5.4836273193359375e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 6.0, 7.0, 11.0, 9.0, 12.0, 23.0, 35.0, 47.0, 89.0, 195.0, 475.0, 1543.0, 5834.0, 31765.0, 933446.0, 62713.0, 8890.0, 2192.0, 673.0, 255.0, 117.0, 61.0, 29.0, 15.0, 24.0, 14.0, 14.0, 10.0, 6.0, 7.0, 3.0, 5.0, 5.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0654296875, -1.0346755981445312, -1.0039215087890625, -0.9731674194335938, -0.942413330078125, -0.9116592407226562, -0.8809051513671875, -0.8501510620117188, -0.81939697265625, -0.7886428833007812, -0.7578887939453125, -0.7271347045898438, -0.696380615234375, -0.6656265258789062, -0.6348724365234375, -0.6041183471679688, -0.5733642578125, -0.5426101684570312, -0.5118560791015625, -0.48110198974609375, -0.450347900390625, -0.41959381103515625, -0.3888397216796875, -0.35808563232421875, -0.32733154296875, -0.29657745361328125, -0.2658233642578125, -0.23506927490234375, -0.204315185546875, -0.17356109619140625, -0.1428070068359375, -0.11205291748046875, -0.081298828125, -0.05054473876953125, -0.0197906494140625, 0.01096343994140625, 0.041717529296875, 0.07247161865234375, 0.1032257080078125, 0.13397979736328125, 0.16473388671875, 0.19548797607421875, 0.2262420654296875, 0.25699615478515625, 0.287750244140625, 0.31850433349609375, 0.3492584228515625, 0.38001251220703125, 0.4107666015625, 0.44152069091796875, 0.4722747802734375, 0.5030288696289062, 0.533782958984375, 0.5645370483398438, 0.5952911376953125, 0.6260452270507812, 0.65679931640625, 0.6875534057617188, 0.7183074951171875, 0.7490615844726562, 0.779815673828125, 0.8105697631835938, 0.8413238525390625, 0.8720779418945312, 0.90283203125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 3.0, 4.0, 4.0, 1.0, 5.0, 5.0, 7.0, 10.0, 7.0, 4.0, 9.0, 10.0, 13.0, 18.0, 11.0, 25.0, 36.0, 91.0, 247.0, 245.0, 79.0, 41.0, 25.0, 13.0, 12.0, 10.0, 4.0, 9.0, 6.0, 9.0, 10.0, 7.0, 2.0, 2.0, 4.0, 6.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.250732421875, -0.24236297607421875, -0.2339935302734375, -0.22562408447265625, -0.217254638671875, -0.20888519287109375, -0.2005157470703125, -0.19214630126953125, -0.18377685546875, -0.17540740966796875, -0.1670379638671875, -0.15866851806640625, -0.150299072265625, -0.14192962646484375, -0.1335601806640625, -0.12519073486328125, -0.1168212890625, -0.10845184326171875, -0.1000823974609375, -0.09171295166015625, -0.083343505859375, -0.07497406005859375, -0.0666046142578125, -0.05823516845703125, -0.04986572265625, -0.04149627685546875, -0.0331268310546875, -0.02475738525390625, -0.016387939453125, -0.00801849365234375, 0.0003509521484375, 0.00872039794921875, 0.01708984375, 0.02545928955078125, 0.0338287353515625, 0.04219818115234375, 0.050567626953125, 0.05893707275390625, 0.0673065185546875, 0.07567596435546875, 0.08404541015625, 0.09241485595703125, 0.1007843017578125, 0.10915374755859375, 0.117523193359375, 0.12589263916015625, 0.1342620849609375, 0.14263153076171875, 0.1510009765625, 0.15937042236328125, 0.1677398681640625, 0.17610931396484375, 0.184478759765625, 0.19284820556640625, 0.2012176513671875, 0.20958709716796875, 0.21795654296875, 0.22632598876953125, 0.2346954345703125, 0.24306488037109375, 0.251434326171875, 0.25980377197265625, 0.2681732177734375, 0.27654266357421875, 0.284912109375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 19.0, 34.0, 95.0, 351.0, 371.0, 97.0, 33.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9791492223739624, -1.800457239151001, -1.621765375137329, -1.4430735111236572, -1.2643815279006958, -1.0856895446777344, -0.9069976806640625, -0.7283056974411011, -0.5496138334274292, -0.37092190980911255, -0.1922299861907959, -0.013538062572479248, 0.1651538610458374, 0.34384578466415405, 0.5225377082824707, 0.7012296915054321, 0.879921555519104, 1.0586135387420654, 1.2373054027557373, 1.4159972667694092, 1.5946892499923706, 1.773381233215332, 1.952073097229004, 2.130764961242676, 2.3094568252563477, 2.4881486892700195, 2.6668405532836914, 2.8455326557159424, 3.0242245197296143, 3.202916383743286, 3.381608486175537, 3.560300350189209, 3.738992691040039, 3.917684555053711, 4.096376419067383, 4.275068283081055, 4.453760147094727, 4.632452487945557, 4.8111443519592285, 4.9898362159729, 5.168528079986572, 5.347219944000244, 5.525911808013916, 5.704603672027588, 5.883296012878418, 6.06198787689209, 6.240679740905762, 6.419371604919434, 6.5980634689331055, 6.776755332946777, 6.955447196960449, 7.134139060974121, 7.312830924987793, 7.491523265838623, 7.670215129852295, 7.848906993865967, 8.027599334716797, 8.206291198730469, 8.38498306274414, 8.563674926757812, 8.742366790771484, 8.921058654785156, 9.099750518798828, 9.2784423828125, 9.457134246826172]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 4.0, 5.0, 7.0, 4.0, 15.0, 11.0, 14.0, 21.0, 25.0, 27.0, 22.0, 28.0, 31.0, 33.0, 43.0, 35.0, 42.0, 39.0, 41.0, 36.0, 52.0, 45.0, 40.0, 44.0, 51.0, 44.0, 35.0, 38.0, 27.0, 18.0, 17.0, 18.0, 16.0, 10.0, 11.0, 14.0, 8.0, 5.0, 6.0, 4.0, 2.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8864017128944397, -0.8581781387329102, -0.8299545645713806, -0.8017309308052063, -0.7735073566436768, -0.7452837824821472, -0.7170602083206177, -0.6888365745544434, -0.6606130003929138, -0.6323894262313843, -0.6041658520698547, -0.5759422183036804, -0.5477186441421509, -0.5194950699806213, -0.4912714958190918, -0.46304789185523987, -0.4348243176937103, -0.4066007435321808, -0.37837713956832886, -0.3501535654067993, -0.3219299614429474, -0.29370638728141785, -0.2654827833175659, -0.23725920915603638, -0.20903562009334564, -0.1808120310306549, -0.15258844196796417, -0.12436486035585403, -0.0961412712931633, -0.06791768968105316, -0.03969410061836243, -0.011470511555671692, 0.016753077507019043, 0.04497666656970978, 0.07320025563240051, 0.10142383724451065, 0.12964743375778198, 0.15787100791931152, 0.18609459698200226, 0.214318186044693, 0.24254177510738373, 0.27076536417007446, 0.298988938331604, 0.32721254229545593, 0.3554361164569855, 0.3836597204208374, 0.41188329458236694, 0.4401068687438965, 0.4683304727077484, 0.49655404686927795, 0.5247776508331299, 0.5530012249946594, 0.581224799156189, 0.6094484329223633, 0.6376720070838928, 0.6658955812454224, 0.6941191554069519, 0.7223427295684814, 0.750566303730011, 0.7787899374961853, 0.8070135116577148, 0.8352370858192444, 0.8634606599807739, 0.8916842937469482, 0.9199078679084778]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 9.0, 8.0, 19.0, 15.0, 23.0, 31.0, 52.0, 69.0, 117.0, 194.0, 276.0, 480.0, 752.0, 1314.0, 2375.0, 4753.0, 10439.0, 25688.0, 101195.0, 819386.0, 2822978.0, 319361.0, 51966.0, 17400.0, 7313.0, 3508.0, 1800.0, 1038.0, 633.0, 379.0, 228.0, 139.0, 104.0, 77.0, 47.0, 26.0, 21.0, 23.0, 12.0, 11.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.1993408203125, -0.19276046752929688, -0.18618011474609375, -0.17959976196289062, -0.1730194091796875, -0.16643905639648438, -0.15985870361328125, -0.15327835083007812, -0.146697998046875, -0.14011764526367188, -0.13353729248046875, -0.12695693969726562, -0.1203765869140625, -0.11379623413085938, -0.10721588134765625, -0.10063552856445312, -0.09405517578125, -0.08747482299804688, -0.08089447021484375, -0.07431411743164062, -0.0677337646484375, -0.061153411865234375, -0.05457305908203125, -0.047992706298828125, -0.041412353515625, -0.034832000732421875, -0.02825164794921875, -0.021671295166015625, -0.0150909423828125, -0.008510589599609375, -0.00193023681640625, 0.004650115966796875, 0.01123046875, 0.017810821533203125, 0.02439117431640625, 0.030971527099609375, 0.0375518798828125, 0.044132232666015625, 0.05071258544921875, 0.057292938232421875, 0.063873291015625, 0.07045364379882812, 0.07703399658203125, 0.08361434936523438, 0.0901947021484375, 0.09677505493164062, 0.10335540771484375, 0.10993576049804688, 0.11651611328125, 0.12309646606445312, 0.12967681884765625, 0.13625717163085938, 0.1428375244140625, 0.14941787719726562, 0.15599822998046875, 0.16257858276367188, 0.169158935546875, 0.17573928833007812, 0.18231964111328125, 0.18889999389648438, 0.1954803466796875, 0.20206069946289062, 0.20864105224609375, 0.21522140502929688, 0.2218017578125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 5.0, 6.0, 13.0, 14.0, 22.0, 19.0, 24.0, 29.0, 48.0, 45.0, 45.0, 53.0, 53.0, 50.0, 56.0, 65.0, 61.0, 68.0, 57.0, 57.0, 35.0, 40.0, 34.0, 30.0, 20.0, 11.0, 11.0, 11.0, 5.0, 8.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1431884765625, -0.1390829086303711, -0.1349773406982422, -0.13087177276611328, -0.12676620483398438, -0.12266063690185547, -0.11855506896972656, -0.11444950103759766, -0.11034393310546875, -0.10623836517333984, -0.10213279724121094, -0.09802722930908203, -0.09392166137695312, -0.08981609344482422, -0.08571052551269531, -0.0816049575805664, -0.0774993896484375, -0.0733938217163086, -0.06928825378417969, -0.06518268585205078, -0.061077117919921875, -0.05697154998779297, -0.05286598205566406, -0.048760414123535156, -0.04465484619140625, -0.040549278259277344, -0.03644371032714844, -0.03233814239501953, -0.028232574462890625, -0.02412700653076172, -0.020021438598632812, -0.015915870666503906, -0.011810302734375, -0.007704734802246094, -0.0035991668701171875, 0.0005064010620117188, 0.004611968994140625, 0.008717536926269531, 0.012823104858398438, 0.016928672790527344, 0.02103424072265625, 0.025139808654785156, 0.029245376586914062, 0.03335094451904297, 0.037456512451171875, 0.04156208038330078, 0.04566764831542969, 0.049773216247558594, 0.0538787841796875, 0.057984352111816406, 0.06208992004394531, 0.06619548797607422, 0.07030105590820312, 0.07440662384033203, 0.07851219177246094, 0.08261775970458984, 0.08672332763671875, 0.09082889556884766, 0.09493446350097656, 0.09904003143310547, 0.10314559936523438, 0.10725116729736328, 0.11135673522949219, 0.1154623031616211, 0.11956787109375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 7.0, 10.0, 13.0, 15.0, 20.0, 21.0, 28.0, 55.0, 53.0, 67.0, 106.0, 147.0, 206.0, 274.0, 393.0, 659.0, 1156.0, 2114.0, 4927.0, 13397.0, 52893.0, 510415.0, 3415647.0, 149228.0, 26844.0, 8133.0, 3233.0, 1568.0, 847.0, 538.0, 372.0, 242.0, 174.0, 129.0, 83.0, 71.0, 54.0, 42.0, 17.0, 25.0, 20.0, 7.0, 12.0, 5.0, 3.0, 2.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.404296875, -0.3913688659667969, -0.37844085693359375, -0.3655128479003906, -0.3525848388671875, -0.3396568298339844, -0.32672882080078125, -0.3138008117675781, -0.300872802734375, -0.2879447937011719, -0.27501678466796875, -0.2620887756347656, -0.2491607666015625, -0.23623275756835938, -0.22330474853515625, -0.21037673950195312, -0.19744873046875, -0.18452072143554688, -0.17159271240234375, -0.15866470336914062, -0.1457366943359375, -0.13280868530273438, -0.11988067626953125, -0.10695266723632812, -0.094024658203125, -0.08109664916992188, -0.06816864013671875, -0.055240631103515625, -0.0423126220703125, -0.029384613037109375, -0.01645660400390625, -0.003528594970703125, 0.0093994140625, 0.022327423095703125, 0.03525543212890625, 0.048183441162109375, 0.0611114501953125, 0.07403945922851562, 0.08696746826171875, 0.09989547729492188, 0.112823486328125, 0.12575149536132812, 0.13867950439453125, 0.15160751342773438, 0.1645355224609375, 0.17746353149414062, 0.19039154052734375, 0.20331954956054688, 0.21624755859375, 0.22917556762695312, 0.24210357666015625, 0.2550315856933594, 0.2679595947265625, 0.2808876037597656, 0.29381561279296875, 0.3067436218261719, 0.319671630859375, 0.3325996398925781, 0.34552764892578125, 0.3584556579589844, 0.3713836669921875, 0.3843116760253906, 0.39723968505859375, 0.4101676940917969, 0.423095703125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 7.0, 10.0, 13.0, 27.0, 42.0, 73.0, 173.0, 402.0, 1264.0, 1324.0, 342.0, 164.0, 89.0, 53.0, 29.0, 18.0, 14.0, 11.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.41064453125, -0.3985786437988281, -0.38651275634765625, -0.3744468688964844, -0.3623809814453125, -0.3503150939941406, -0.33824920654296875, -0.3261833190917969, -0.314117431640625, -0.3020515441894531, -0.28998565673828125, -0.2779197692871094, -0.2658538818359375, -0.2537879943847656, -0.24172210693359375, -0.22965621948242188, -0.21759033203125, -0.20552444458007812, -0.19345855712890625, -0.18139266967773438, -0.1693267822265625, -0.15726089477539062, -0.14519500732421875, -0.13312911987304688, -0.121063232421875, -0.10899734497070312, -0.09693145751953125, -0.08486557006835938, -0.0727996826171875, -0.060733795166015625, -0.04866790771484375, -0.036602020263671875, -0.0245361328125, -0.012470245361328125, -0.00040435791015625, 0.011661529541015625, 0.0237274169921875, 0.035793304443359375, 0.04785919189453125, 0.059925079345703125, 0.071990966796875, 0.08405685424804688, 0.09612274169921875, 0.10818862915039062, 0.1202545166015625, 0.13232040405273438, 0.14438629150390625, 0.15645217895507812, 0.16851806640625, 0.18058395385742188, 0.19264984130859375, 0.20471572875976562, 0.2167816162109375, 0.22884750366210938, 0.24091339111328125, 0.2529792785644531, 0.265045166015625, 0.2771110534667969, 0.28917694091796875, 0.3012428283691406, 0.3133087158203125, 0.3253746032714844, 0.33744049072265625, 0.3495063781738281, 0.361572265625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 5.0, 7.0, 7.0, 10.0, 36.0, 66.0, 134.0, 238.0, 196.0, 133.0, 87.0, 35.0, 25.0, 12.0, 10.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4871758222579956, -1.427170753479004, -1.3671656847000122, -1.3071606159210205, -1.2471556663513184, -1.187150478363037, -1.127145528793335, -1.0671404600143433, -1.0071353912353516, -0.9471303224563599, -0.8871252536773682, -0.8271202445030212, -0.7671151757240295, -0.7071101069450378, -0.6471050977706909, -0.5871000289916992, -0.5270949602127075, -0.4670898914337158, -0.4070848524570465, -0.3470798134803772, -0.2870747447013855, -0.2270696759223938, -0.1670646369457245, -0.10705959796905518, -0.04705452919006348, 0.012950524687767029, 0.07295557856559753, 0.13296063244342804, 0.19296568632125854, 0.25297075510025024, 0.31297579407691956, 0.37298083305358887, 0.4329860210418701, 0.4929910898208618, 0.5529961585998535, 0.6130011677742004, 0.6730062365531921, 0.7330113053321838, 0.7930163145065308, 0.8530213832855225, 0.9130264520645142, 0.9730315208435059, 1.0330365896224976, 1.0930416584014893, 1.1530466079711914, 1.2130517959594727, 1.2730567455291748, 1.3330618143081665, 1.3930668830871582, 1.45307195186615, 1.5130770206451416, 1.5730820894241333, 1.633087158203125, 1.6930921077728271, 1.7530971765518188, 1.8131022453308105, 1.8731073141098022, 1.933112382888794, 1.9931174516677856, 2.0531225204467773, 2.1131274700164795, 2.1731326580047607, 2.233137607574463, 2.293142795562744, 2.3531477451324463]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 3.0, 7.0, 6.0, 9.0, 5.0, 16.0, 11.0, 9.0, 24.0, 16.0, 25.0, 20.0, 22.0, 37.0, 27.0, 38.0, 36.0, 36.0, 47.0, 41.0, 39.0, 51.0, 48.0, 47.0, 41.0, 37.0, 34.0, 42.0, 35.0, 26.0, 27.0, 19.0, 22.0, 17.0, 12.0, 23.0, 12.0, 7.0, 11.0, 3.0, 9.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6181201338768005, -0.5986501574516296, -0.579180121421814, -0.5597101449966431, -0.5402401685714722, -0.5207701921463013, -0.5013002157211304, -0.4818301796913147, -0.4623602032661438, -0.4428902268409729, -0.4234202206134796, -0.40395021438598633, -0.38448023796081543, -0.36501026153564453, -0.34554025530815125, -0.32607024908065796, -0.30660027265548706, -0.28713029623031616, -0.2676602900028229, -0.24819029867649078, -0.2287203073501587, -0.2092503160238266, -0.1897803246974945, -0.17031033337116241, -0.15084034204483032, -0.13137035071849823, -0.11190035939216614, -0.09243036806583405, -0.07296037673950195, -0.05349038541316986, -0.03402039408683777, -0.014550402760505676, 0.004919588565826416, 0.02438957989215851, 0.0438595712184906, 0.06332956254482269, 0.08279955387115479, 0.10226954519748688, 0.12173953652381897, 0.14120952785015106, 0.16067951917648315, 0.18014951050281525, 0.19961950182914734, 0.21908949315547943, 0.23855948448181152, 0.2580294609069824, 0.2774994671344757, 0.296969473361969, 0.3164394497871399, 0.3359094262123108, 0.3553794324398041, 0.37484943866729736, 0.39431941509246826, 0.41378939151763916, 0.43325939774513245, 0.45272940397262573, 0.47219938039779663, 0.49166935682296753, 0.5111393928527832, 0.5306093692779541, 0.550079345703125, 0.5695493221282959, 0.5890192985534668, 0.6084893345832825, 0.6279593110084534]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 5.0, 8.0, 3.0, 9.0, 7.0, 15.0, 15.0, 32.0, 54.0, 83.0, 118.0, 200.0, 380.0, 820.0, 1800.0, 4694.0, 13358.0, 40713.0, 144806.0, 504953.0, 242422.0, 63114.0, 19346.0, 6805.0, 2523.0, 1098.0, 516.0, 253.0, 159.0, 72.0, 59.0, 29.0, 24.0, 13.0, 9.0, 12.0, 10.0, 13.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.483154296875, -0.4699821472167969, -0.45680999755859375, -0.4436378479003906, -0.4304656982421875, -0.4172935485839844, -0.40412139892578125, -0.3909492492675781, -0.377777099609375, -0.3646049499511719, -0.35143280029296875, -0.3382606506347656, -0.3250885009765625, -0.3119163513183594, -0.29874420166015625, -0.2855720520019531, -0.27239990234375, -0.2592277526855469, -0.24605560302734375, -0.23288345336914062, -0.2197113037109375, -0.20653915405273438, -0.19336700439453125, -0.18019485473632812, -0.167022705078125, -0.15385055541992188, -0.14067840576171875, -0.12750625610351562, -0.1143341064453125, -0.10116195678710938, -0.08798980712890625, -0.07481765747070312, -0.0616455078125, -0.048473358154296875, -0.03530120849609375, -0.022129058837890625, -0.0089569091796875, 0.004215240478515625, 0.01738739013671875, 0.030559539794921875, 0.043731689453125, 0.056903839111328125, 0.07007598876953125, 0.08324813842773438, 0.0964202880859375, 0.10959243774414062, 0.12276458740234375, 0.13593673706054688, 0.14910888671875, 0.16228103637695312, 0.17545318603515625, 0.18862533569335938, 0.2017974853515625, 0.21496963500976562, 0.22814178466796875, 0.24131393432617188, 0.254486083984375, 0.2676582336425781, 0.28083038330078125, 0.2940025329589844, 0.3071746826171875, 0.3203468322753906, 0.33351898193359375, 0.3466911315917969, 0.35986328125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 8.0, 10.0, 19.0, 32.0, 48.0, 40.0, 46.0, 59.0, 55.0, 71.0, 83.0, 66.0, 77.0, 66.0, 70.0, 56.0, 43.0, 43.0, 39.0, 18.0, 16.0, 11.0, 9.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16455078125, -0.15961074829101562, -0.15467071533203125, -0.14973068237304688, -0.1447906494140625, -0.13985061645507812, -0.13491058349609375, -0.12997055053710938, -0.125030517578125, -0.12009048461914062, -0.11515045166015625, -0.11021041870117188, -0.1052703857421875, -0.10033035278320312, -0.09539031982421875, -0.09045028686523438, -0.08551025390625, -0.08057022094726562, -0.07563018798828125, -0.07069015502929688, -0.0657501220703125, -0.060810089111328125, -0.05587005615234375, -0.050930023193359375, -0.045989990234375, -0.041049957275390625, -0.03610992431640625, -0.031169891357421875, -0.0262298583984375, -0.021289825439453125, -0.01634979248046875, -0.011409759521484375, -0.0064697265625, -0.001529693603515625, 0.00341033935546875, 0.008350372314453125, 0.0132904052734375, 0.018230438232421875, 0.02317047119140625, 0.028110504150390625, 0.033050537109375, 0.037990570068359375, 0.04293060302734375, 0.047870635986328125, 0.0528106689453125, 0.057750701904296875, 0.06269073486328125, 0.06763076782226562, 0.07257080078125, 0.07751083374023438, 0.08245086669921875, 0.08739089965820312, 0.0923309326171875, 0.09727096557617188, 0.10221099853515625, 0.10715103149414062, 0.112091064453125, 0.11703109741210938, 0.12197113037109375, 0.12691116333007812, 0.1318511962890625, 0.13679122924804688, 0.14173126220703125, 0.14667129516601562, 0.151611328125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 6.0, 4.0, 3.0, 2.0, 8.0, 7.0, 10.0, 18.0, 20.0, 21.0, 29.0, 43.0, 71.0, 115.0, 258.0, 578.0, 1618.0, 5876.0, 27937.0, 187648.0, 690903.0, 108679.0, 18334.0, 4140.0, 1240.0, 443.0, 189.0, 103.0, 63.0, 46.0, 31.0, 19.0, 26.0, 10.0, 11.0, 14.0, 9.0, 8.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.77783203125, -0.7564468383789062, -0.7350616455078125, -0.7136764526367188, -0.692291259765625, -0.6709060668945312, -0.6495208740234375, -0.6281356811523438, -0.60675048828125, -0.5853652954101562, -0.5639801025390625, -0.5425949096679688, -0.521209716796875, -0.49982452392578125, -0.4784393310546875, -0.45705413818359375, -0.4356689453125, -0.41428375244140625, -0.3928985595703125, -0.37151336669921875, -0.350128173828125, -0.32874298095703125, -0.3073577880859375, -0.28597259521484375, -0.26458740234375, -0.24320220947265625, -0.2218170166015625, -0.20043182373046875, -0.179046630859375, -0.15766143798828125, -0.1362762451171875, -0.11489105224609375, -0.093505859375, -0.07212066650390625, -0.0507354736328125, -0.02935028076171875, -0.007965087890625, 0.01342010498046875, 0.0348052978515625, 0.05619049072265625, 0.07757568359375, 0.09896087646484375, 0.1203460693359375, 0.14173126220703125, 0.163116455078125, 0.18450164794921875, 0.2058868408203125, 0.22727203369140625, 0.2486572265625, 0.27004241943359375, 0.2914276123046875, 0.31281280517578125, 0.334197998046875, 0.35558319091796875, 0.3769683837890625, 0.39835357666015625, 0.41973876953125, 0.44112396240234375, 0.4625091552734375, 0.48389434814453125, 0.505279541015625, 0.5266647338867188, 0.5480499267578125, 0.5694351196289062, 0.5908203125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 8.0, 10.0, 8.0, 9.0, 16.0, 16.0, 18.0, 27.0, 26.0, 29.0, 36.0, 34.0, 39.0, 38.0, 59.0, 48.0, 53.0, 42.0, 38.0, 49.0, 41.0, 49.0, 40.0, 31.0, 31.0, 27.0, 30.0, 25.0, 13.0, 27.0, 16.0, 12.0, 14.0, 13.0, 4.0, 4.0, 8.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0], "bins": [-0.365966796875, -0.35646820068359375, -0.3469696044921875, -0.33747100830078125, -0.327972412109375, -0.31847381591796875, -0.3089752197265625, -0.29947662353515625, -0.28997802734375, -0.28047943115234375, -0.2709808349609375, -0.26148223876953125, -0.251983642578125, -0.24248504638671875, -0.2329864501953125, -0.22348785400390625, -0.2139892578125, -0.20449066162109375, -0.1949920654296875, -0.18549346923828125, -0.175994873046875, -0.16649627685546875, -0.1569976806640625, -0.14749908447265625, -0.13800048828125, -0.12850189208984375, -0.1190032958984375, -0.10950469970703125, -0.100006103515625, -0.09050750732421875, -0.0810089111328125, -0.07151031494140625, -0.06201171875, -0.05251312255859375, -0.0430145263671875, -0.03351593017578125, -0.024017333984375, -0.01451873779296875, -0.0050201416015625, 0.00447845458984375, 0.01397705078125, 0.02347564697265625, 0.0329742431640625, 0.04247283935546875, 0.051971435546875, 0.06147003173828125, 0.0709686279296875, 0.08046722412109375, 0.0899658203125, 0.09946441650390625, 0.1089630126953125, 0.11846160888671875, 0.127960205078125, 0.13745880126953125, 0.1469573974609375, 0.15645599365234375, 0.16595458984375, 0.17545318603515625, 0.1849517822265625, 0.19445037841796875, 0.203948974609375, 0.21344757080078125, 0.2229461669921875, 0.23244476318359375, 0.241943359375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 8.0, 10.0, 9.0, 20.0, 19.0, 41.0, 55.0, 101.0, 154.0, 271.0, 504.0, 843.0, 1521.0, 3018.0, 6859.0, 19890.0, 104713.0, 767232.0, 109186.0, 20349.0, 7054.0, 3150.0, 1608.0, 784.0, 462.0, 244.0, 176.0, 84.0, 67.0, 33.0, 25.0, 16.0, 14.0, 8.0, 8.0, 8.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.336181640625, -0.32614898681640625, -0.3161163330078125, -0.30608367919921875, -0.296051025390625, -0.28601837158203125, -0.2759857177734375, -0.26595306396484375, -0.25592041015625, -0.24588775634765625, -0.2358551025390625, -0.22582244873046875, -0.215789794921875, -0.20575714111328125, -0.1957244873046875, -0.18569183349609375, -0.1756591796875, -0.16562652587890625, -0.1555938720703125, -0.14556121826171875, -0.135528564453125, -0.12549591064453125, -0.1154632568359375, -0.10543060302734375, -0.09539794921875, -0.08536529541015625, -0.0753326416015625, -0.06529998779296875, -0.055267333984375, -0.04523468017578125, -0.0352020263671875, -0.02516937255859375, -0.01513671875, -0.00510406494140625, 0.0049285888671875, 0.01496124267578125, 0.024993896484375, 0.03502655029296875, 0.0450592041015625, 0.05509185791015625, 0.06512451171875, 0.07515716552734375, 0.0851898193359375, 0.09522247314453125, 0.105255126953125, 0.11528778076171875, 0.1253204345703125, 0.13535308837890625, 0.1453857421875, 0.15541839599609375, 0.1654510498046875, 0.17548370361328125, 0.185516357421875, 0.19554901123046875, 0.2055816650390625, 0.21561431884765625, 0.22564697265625, 0.23567962646484375, 0.2457122802734375, 0.25574493408203125, 0.265777587890625, 0.27581024169921875, 0.2858428955078125, 0.29587554931640625, 0.305908203125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 15.0, 10.0, 18.0, 33.0, 58.0, 74.0, 247.0, 251.0, 118.0, 44.0, 26.0, 20.0, 20.0, 12.0, 9.0, 6.0, 3.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.109476089477539e-05, -5.9351325035095215e-05, -5.760788917541504e-05, -5.586445331573486e-05, -5.412101745605469e-05, -5.237758159637451e-05, -5.0634145736694336e-05, -4.889070987701416e-05, -4.7147274017333984e-05, -4.540383815765381e-05, -4.366040229797363e-05, -4.191696643829346e-05, -4.017353057861328e-05, -3.8430094718933105e-05, -3.668665885925293e-05, -3.4943222999572754e-05, -3.319978713989258e-05, -3.14563512802124e-05, -2.9712915420532227e-05, -2.796947956085205e-05, -2.6226043701171875e-05, -2.44826078414917e-05, -2.2739171981811523e-05, -2.0995736122131348e-05, -1.9252300262451172e-05, -1.7508864402770996e-05, -1.576542854309082e-05, -1.4021992683410645e-05, -1.2278556823730469e-05, -1.0535120964050293e-05, -8.791685104370117e-06, -7.048249244689941e-06, -5.304813385009766e-06, -3.56137752532959e-06, -1.817941665649414e-06, -7.450580596923828e-08, 1.6689300537109375e-06, 3.4123659133911133e-06, 5.155801773071289e-06, 6.899237632751465e-06, 8.64267349243164e-06, 1.0386109352111816e-05, 1.2129545211791992e-05, 1.3872981071472168e-05, 1.5616416931152344e-05, 1.735985279083252e-05, 1.9103288650512695e-05, 2.084672451019287e-05, 2.2590160369873047e-05, 2.4333596229553223e-05, 2.60770320892334e-05, 2.7820467948913574e-05, 2.956390380859375e-05, 3.1307339668273926e-05, 3.30507755279541e-05, 3.479421138763428e-05, 3.653764724731445e-05, 3.828108310699463e-05, 4.0024518966674805e-05, 4.176795482635498e-05, 4.3511390686035156e-05, 4.525482654571533e-05, 4.699826240539551e-05, 4.8741698265075684e-05, 5.048513412475586e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 7.0, 3.0, 9.0, 19.0, 25.0, 41.0, 90.0, 197.0, 641.0, 2150.0, 12518.0, 895258.0, 128860.0, 6641.0, 1350.0, 409.0, 167.0, 60.0, 39.0, 12.0, 12.0, 6.0, 14.0, 9.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.029296875, -0.997955322265625, -0.96661376953125, -0.935272216796875, -0.9039306640625, -0.872589111328125, -0.84124755859375, -0.809906005859375, -0.778564453125, -0.747222900390625, -0.71588134765625, -0.684539794921875, -0.6531982421875, -0.621856689453125, -0.59051513671875, -0.559173583984375, -0.52783203125, -0.496490478515625, -0.46514892578125, -0.433807373046875, -0.4024658203125, -0.371124267578125, -0.33978271484375, -0.308441162109375, -0.277099609375, -0.245758056640625, -0.21441650390625, -0.183074951171875, -0.1517333984375, -0.120391845703125, -0.08905029296875, -0.057708740234375, -0.0263671875, 0.004974365234375, 0.03631591796875, 0.067657470703125, 0.0989990234375, 0.130340576171875, 0.16168212890625, 0.193023681640625, 0.224365234375, 0.255706787109375, 0.28704833984375, 0.318389892578125, 0.3497314453125, 0.381072998046875, 0.41241455078125, 0.443756103515625, 0.47509765625, 0.506439208984375, 0.53778076171875, 0.569122314453125, 0.6004638671875, 0.631805419921875, 0.66314697265625, 0.694488525390625, 0.725830078125, 0.757171630859375, 0.78851318359375, 0.819854736328125, 0.8511962890625, 0.882537841796875, 0.91387939453125, 0.945220947265625, 0.9765625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 4.0, 6.0, 11.0, 12.0, 9.0, 17.0, 40.0, 55.0, 133.0, 253.0, 187.0, 101.0, 64.0, 28.0, 18.0, 14.0, 7.0, 14.0, 5.0, 5.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.278564453125, -0.2692298889160156, -0.25989532470703125, -0.2505607604980469, -0.2412261962890625, -0.23189163208007812, -0.22255706787109375, -0.21322250366210938, -0.203887939453125, -0.19455337524414062, -0.18521881103515625, -0.17588424682617188, -0.1665496826171875, -0.15721511840820312, -0.14788055419921875, -0.13854598999023438, -0.12921142578125, -0.11987686157226562, -0.11054229736328125, -0.10120773315429688, -0.0918731689453125, -0.08253860473632812, -0.07320404052734375, -0.06386947631835938, -0.054534912109375, -0.045200347900390625, -0.03586578369140625, -0.026531219482421875, -0.0171966552734375, -0.007862091064453125, 0.00147247314453125, 0.010807037353515625, 0.0201416015625, 0.029476165771484375, 0.03881072998046875, 0.048145294189453125, 0.0574798583984375, 0.06681442260742188, 0.07614898681640625, 0.08548355102539062, 0.094818115234375, 0.10415267944335938, 0.11348724365234375, 0.12282180786132812, 0.1321563720703125, 0.14149093627929688, 0.15082550048828125, 0.16016006469726562, 0.16949462890625, 0.17882919311523438, 0.18816375732421875, 0.19749832153320312, 0.2068328857421875, 0.21616744995117188, 0.22550201416015625, 0.23483657836914062, 0.244171142578125, 0.2535057067871094, 0.26284027099609375, 0.2721748352050781, 0.2815093994140625, 0.2908439636230469, 0.30017852783203125, 0.3095130920410156, 0.31884765625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 7.0, 10.0, 24.0, 54.0, 161.0, 338.0, 270.0, 87.0, 25.0, 18.0, 8.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.888499140739441, -1.7612011432647705, -1.6339031457901, -1.5066051483154297, -1.3793072700500488, -1.2520091533660889, -1.124711275100708, -0.9974132776260376, -0.8701152801513672, -0.7428172826766968, -0.6155192852020264, -0.48822134733200073, -0.3609233498573303, -0.2336253523826599, -0.10632741451263428, 0.020970582962036133, 0.14826858043670654, 0.27556657791137695, 0.402864545583725, 0.530162513256073, 0.6574605107307434, 0.7847585082054138, 0.9120564460754395, 1.0393544435501099, 1.1666524410247803, 1.2939504384994507, 1.421248435974121, 1.548546314239502, 1.675844430923462, 1.8031423091888428, 1.9304403066635132, 2.0577383041381836, 2.1850361824035645, 2.3123340606689453, 2.4396321773529053, 2.566930055618286, 2.694228172302246, 2.821526050567627, 2.948823928833008, 3.0761220455169678, 3.2034201622009277, 3.3307180404663086, 3.4580161571502686, 3.5853140354156494, 3.7126121520996094, 3.8399100303649902, 3.967207908630371, 4.09450626373291, 4.221803665161133, 4.349101543426514, 4.4763994216918945, 4.603697776794434, 4.7309956550598145, 4.858293533325195, 4.985591411590576, 5.112889289855957, 5.240187644958496, 5.367485523223877, 5.494783401489258, 5.622081756591797, 5.749379634857178, 5.876677513122559, 6.0039753913879395, 6.13127326965332, 6.258571624755859]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 10.0, 8.0, 6.0, 8.0, 21.0, 13.0, 13.0, 23.0, 20.0, 20.0, 28.0, 33.0, 35.0, 35.0, 30.0, 34.0, 44.0, 45.0, 35.0, 33.0, 44.0, 48.0, 37.0, 36.0, 41.0, 39.0, 40.0, 28.0, 31.0, 19.0, 21.0, 19.0, 21.0, 9.0, 11.0, 12.0, 9.0, 5.0, 8.0, 7.0, 4.0, 3.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0], "bins": [-0.9722538590431213, -0.9452389478683472, -0.9182240962982178, -0.8912091851234436, -0.8641942739486694, -0.83717942237854, -0.8101645112037659, -0.7831496000289917, -0.7561347484588623, -0.7291198372840881, -0.7021049857139587, -0.6750900745391846, -0.6480752229690552, -0.621060311794281, -0.5940454006195068, -0.5670305490493774, -0.5400156378746033, -0.5130007266998291, -0.4859858751296997, -0.45897096395492554, -0.43195608258247375, -0.404941201210022, -0.3779262900352478, -0.350911408662796, -0.32389652729034424, -0.29688164591789246, -0.2698667645454407, -0.2428518533706665, -0.21583697199821472, -0.18882209062576294, -0.16180719435214996, -0.134792298078537, -0.1077774167060852, -0.08076252788305283, -0.05374763906002045, -0.026732750236988068, 0.0002821385860443115, 0.027297019958496094, 0.05431191623210907, 0.08132681250572205, 0.10834169387817383, 0.1353565752506256, 0.1623714715242386, 0.18938636779785156, 0.21640124917030334, 0.24341613054275513, 0.2704310417175293, 0.2974459230899811, 0.32446080446243286, 0.35147568583488464, 0.3784905672073364, 0.4055054783821106, 0.4325203597545624, 0.45953524112701416, 0.48655015230178833, 0.5135650634765625, 0.5405799150466919, 0.5675948262214661, 0.5946096777915955, 0.6216245889663696, 0.648639440536499, 0.6756543517112732, 0.7026692628860474, 0.7296841144561768, 0.7566990256309509]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 9.0, 14.0, 30.0, 29.0, 76.0, 128.0, 328.0, 716.0, 2074.0, 9735.0, 167017.0, 3931515.0, 73270.0, 6602.0, 1622.0, 563.0, 244.0, 139.0, 76.0, 48.0, 22.0, 10.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3984375, -0.382110595703125, -0.36578369140625, -0.349456787109375, -0.3331298828125, -0.316802978515625, -0.30047607421875, -0.284149169921875, -0.267822265625, -0.251495361328125, -0.23516845703125, -0.218841552734375, -0.2025146484375, -0.186187744140625, -0.16986083984375, -0.153533935546875, -0.13720703125, -0.120880126953125, -0.10455322265625, -0.088226318359375, -0.0718994140625, -0.055572509765625, -0.03924560546875, -0.022918701171875, -0.006591796875, 0.009735107421875, 0.02606201171875, 0.042388916015625, 0.0587158203125, 0.075042724609375, 0.09136962890625, 0.107696533203125, 0.1240234375, 0.140350341796875, 0.15667724609375, 0.173004150390625, 0.1893310546875, 0.205657958984375, 0.22198486328125, 0.238311767578125, 0.254638671875, 0.270965576171875, 0.28729248046875, 0.303619384765625, 0.3199462890625, 0.336273193359375, 0.35260009765625, 0.368927001953125, 0.38525390625, 0.401580810546875, 0.41790771484375, 0.434234619140625, 0.4505615234375, 0.466888427734375, 0.48321533203125, 0.499542236328125, 0.515869140625, 0.532196044921875, 0.54852294921875, 0.564849853515625, 0.5811767578125, 0.597503662109375, 0.61383056640625, 0.630157470703125, 0.646484375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 13.0, 8.0, 9.0, 16.0, 28.0, 31.0, 35.0, 39.0, 55.0, 53.0, 62.0, 60.0, 72.0, 63.0, 65.0, 59.0, 62.0, 50.0, 60.0, 41.0, 33.0, 24.0, 13.0, 18.0, 11.0, 9.0, 7.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.156982421875, -0.15195083618164062, -0.14691925048828125, -0.14188766479492188, -0.1368560791015625, -0.13182449340820312, -0.12679290771484375, -0.12176132202148438, -0.116729736328125, -0.11169815063476562, -0.10666656494140625, -0.10163497924804688, -0.0966033935546875, -0.09157180786132812, -0.08654022216796875, -0.08150863647460938, -0.07647705078125, -0.07144546508789062, -0.06641387939453125, -0.061382293701171875, -0.0563507080078125, -0.051319122314453125, -0.04628753662109375, -0.041255950927734375, -0.036224365234375, -0.031192779541015625, -0.02616119384765625, -0.021129608154296875, -0.0160980224609375, -0.011066436767578125, -0.00603485107421875, -0.001003265380859375, 0.0040283203125, 0.009059906005859375, 0.01409149169921875, 0.019123077392578125, 0.0241546630859375, 0.029186248779296875, 0.03421783447265625, 0.039249420166015625, 0.044281005859375, 0.049312591552734375, 0.05434417724609375, 0.059375762939453125, 0.0644073486328125, 0.06943893432617188, 0.07447052001953125, 0.07950210571289062, 0.08453369140625, 0.08956527709960938, 0.09459686279296875, 0.09962844848632812, 0.1046600341796875, 0.10969161987304688, 0.11472320556640625, 0.11975479125976562, 0.124786376953125, 0.12981796264648438, 0.13484954833984375, 0.13988113403320312, 0.1449127197265625, 0.14994430541992188, 0.15497589111328125, 0.16000747680664062, 0.1650390625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 3.0, 9.0, 8.0, 12.0, 19.0, 23.0, 32.0, 46.0, 75.0, 107.0, 152.0, 278.0, 463.0, 872.0, 1691.0, 4101.0, 12825.0, 68540.0, 3405119.0, 647746.0, 37255.0, 8657.0, 3067.0, 1382.0, 703.0, 417.0, 235.0, 135.0, 90.0, 80.0, 35.0, 23.0, 23.0, 18.0, 14.0, 4.0, 8.0, 5.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46435546875, -0.45021820068359375, -0.4360809326171875, -0.42194366455078125, -0.407806396484375, -0.39366912841796875, -0.3795318603515625, -0.36539459228515625, -0.35125732421875, -0.33712005615234375, -0.3229827880859375, -0.30884552001953125, -0.294708251953125, -0.28057098388671875, -0.2664337158203125, -0.25229644775390625, -0.2381591796875, -0.22402191162109375, -0.2098846435546875, -0.19574737548828125, -0.181610107421875, -0.16747283935546875, -0.1533355712890625, -0.13919830322265625, -0.12506103515625, -0.11092376708984375, -0.0967864990234375, -0.08264923095703125, -0.068511962890625, -0.05437469482421875, -0.0402374267578125, -0.02610015869140625, -0.011962890625, 0.00217437744140625, 0.0163116455078125, 0.03044891357421875, 0.044586181640625, 0.05872344970703125, 0.0728607177734375, 0.08699798583984375, 0.10113525390625, 0.11527252197265625, 0.1294097900390625, 0.14354705810546875, 0.157684326171875, 0.17182159423828125, 0.1859588623046875, 0.20009613037109375, 0.2142333984375, 0.22837066650390625, 0.2425079345703125, 0.25664520263671875, 0.270782470703125, 0.28491973876953125, 0.2990570068359375, 0.31319427490234375, 0.32733154296875, 0.34146881103515625, 0.3556060791015625, 0.36974334716796875, 0.383880615234375, 0.39801788330078125, 0.4121551513671875, 0.42629241943359375, 0.4404296875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 4.0, 2.0, 8.0, 12.0, 23.0, 38.0, 82.0, 206.0, 645.0, 2064.0, 607.0, 206.0, 65.0, 43.0, 22.0, 21.0, 6.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.248291015625, -0.23728179931640625, -0.2262725830078125, -0.21526336669921875, -0.204254150390625, -0.19324493408203125, -0.1822357177734375, -0.17122650146484375, -0.16021728515625, -0.14920806884765625, -0.1381988525390625, -0.12718963623046875, -0.116180419921875, -0.10517120361328125, -0.0941619873046875, -0.08315277099609375, -0.0721435546875, -0.06113433837890625, -0.0501251220703125, -0.03911590576171875, -0.028106689453125, -0.01709747314453125, -0.0060882568359375, 0.00492095947265625, 0.01593017578125, 0.02693939208984375, 0.0379486083984375, 0.04895782470703125, 0.059967041015625, 0.07097625732421875, 0.0819854736328125, 0.09299468994140625, 0.10400390625, 0.11501312255859375, 0.1260223388671875, 0.13703155517578125, 0.148040771484375, 0.15904998779296875, 0.1700592041015625, 0.18106842041015625, 0.19207763671875, 0.20308685302734375, 0.2140960693359375, 0.22510528564453125, 0.236114501953125, 0.24712371826171875, 0.2581329345703125, 0.26914215087890625, 0.2801513671875, 0.29116058349609375, 0.3021697998046875, 0.31317901611328125, 0.324188232421875, 0.33519744873046875, 0.3462066650390625, 0.35721588134765625, 0.36822509765625, 0.37923431396484375, 0.3902435302734375, 0.40125274658203125, 0.412261962890625, 0.42327117919921875, 0.4342803955078125, 0.44528961181640625, 0.456298828125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 7.0, 4.0, 16.0, 28.0, 38.0, 50.0, 108.0, 177.0, 195.0, 144.0, 93.0, 49.0, 30.0, 33.0, 12.0, 14.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8778213858604431, -0.8453740477561951, -0.812926709651947, -0.780479371547699, -0.7480320930480957, -0.7155847549438477, -0.6831374168395996, -0.6506900787353516, -0.6182427406311035, -0.5857954025268555, -0.5533480644226074, -0.5209007263183594, -0.4884534180164337, -0.45600607991218567, -0.42355877161026, -0.39111143350601196, -0.3586640954017639, -0.32621675729751587, -0.2937694191932678, -0.26132211089134216, -0.22887477278709412, -0.19642743468284607, -0.16398011147975922, -0.13153278827667236, -0.09908545017242432, -0.06663811951875687, -0.034190788865089417, -0.0017434582114219666, 0.030703872442245483, 0.06315121054649353, 0.09559853374958038, 0.12804585695266724, 0.16049325466156006, 0.1929405927658081, 0.22538791596889496, 0.2578352391719818, 0.29028257727622986, 0.3227299153804779, 0.35517722368240356, 0.3876245617866516, 0.42007189989089966, 0.4525192379951477, 0.48496657609939575, 0.5174139142036438, 0.5498611927032471, 0.5823085308074951, 0.6147558689117432, 0.6472032070159912, 0.6796505451202393, 0.7120978832244873, 0.7445452213287354, 0.7769925594329834, 0.8094398975372314, 0.8418872356414795, 0.8743345141410828, 0.9067818522453308, 0.9392291903495789, 0.9716765284538269, 1.0041238069534302, 1.0365711450576782, 1.0690184831619263, 1.1014658212661743, 1.1339131593704224, 1.1663604974746704, 1.1988078355789185]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 7.0, 3.0, 7.0, 8.0, 6.0, 14.0, 10.0, 16.0, 13.0, 19.0, 20.0, 22.0, 18.0, 20.0, 22.0, 35.0, 30.0, 28.0, 41.0, 35.0, 32.0, 31.0, 37.0, 32.0, 47.0, 38.0, 34.0, 42.0, 41.0, 40.0, 30.0, 37.0, 27.0, 21.0, 22.0, 15.0, 18.0, 17.0, 8.0, 12.0, 14.0, 9.0, 7.0, 8.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37005430459976196, -0.3578120172023773, -0.3455697000026703, -0.33332741260528564, -0.3210850954055786, -0.30884280800819397, -0.2966005206108093, -0.2843582034111023, -0.27211591601371765, -0.259873628616333, -0.24763131141662598, -0.23538902401924133, -0.2231467217206955, -0.21090441942214966, -0.19866211712360382, -0.18641981482505798, -0.17417751252651215, -0.1619352102279663, -0.14969290792942047, -0.13745060563087463, -0.12520831823349, -0.11296601593494415, -0.10072371363639832, -0.08848141878843307, -0.07623911648988724, -0.0639968141913414, -0.05175451934337616, -0.03951221704483032, -0.027269918471574783, -0.015027619898319244, -0.002785317599773407, 0.009456977248191833, 0.02169927954673767, 0.03394157811999321, 0.04618387669324875, 0.058426178991794586, 0.07066847383975983, 0.08291077613830566, 0.0951530784368515, 0.10739537328481674, 0.11963767558336258, 0.13187997043132782, 0.14412227272987366, 0.1563645750284195, 0.16860687732696533, 0.18084916472434998, 0.193091481924057, 0.20533376932144165, 0.2175760716199875, 0.22981837391853333, 0.24206067621707916, 0.254302978515625, 0.26654526591300964, 0.2787875533103943, 0.2910298705101013, 0.30327215790748596, 0.315514475107193, 0.32775676250457764, 0.33999907970428467, 0.3522413671016693, 0.36448368430137634, 0.376725971698761, 0.388968288898468, 0.40121057629585266, 0.4134528636932373]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 9.0, 8.0, 12.0, 17.0, 31.0, 35.0, 77.0, 92.0, 150.0, 342.0, 651.0, 1395.0, 3074.0, 7677.0, 20586.0, 60109.0, 202920.0, 484736.0, 180811.0, 54321.0, 18807.0, 7057.0, 3037.0, 1293.0, 619.0, 284.0, 149.0, 88.0, 53.0, 31.0, 21.0, 16.0, 11.0, 10.0, 5.0, 4.0, 5.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.36181640625, -0.3510017395019531, -0.34018707275390625, -0.3293724060058594, -0.3185577392578125, -0.3077430725097656, -0.29692840576171875, -0.2861137390136719, -0.275299072265625, -0.2644844055175781, -0.25366973876953125, -0.24285507202148438, -0.2320404052734375, -0.22122573852539062, -0.21041107177734375, -0.19959640502929688, -0.18878173828125, -0.17796707153320312, -0.16715240478515625, -0.15633773803710938, -0.1455230712890625, -0.13470840454101562, -0.12389373779296875, -0.11307907104492188, -0.102264404296875, -0.09144973754882812, -0.08063507080078125, -0.06982040405273438, -0.0590057373046875, -0.048191070556640625, -0.03737640380859375, -0.026561737060546875, -0.0157470703125, -0.004932403564453125, 0.00588226318359375, 0.016696929931640625, 0.0275115966796875, 0.038326263427734375, 0.04914093017578125, 0.059955596923828125, 0.070770263671875, 0.08158493041992188, 0.09239959716796875, 0.10321426391601562, 0.1140289306640625, 0.12484359741210938, 0.13565826416015625, 0.14647293090820312, 0.15728759765625, 0.16810226440429688, 0.17891693115234375, 0.18973159790039062, 0.2005462646484375, 0.21136093139648438, 0.22217559814453125, 0.23299026489257812, 0.243804931640625, 0.2546195983886719, 0.26543426513671875, 0.2762489318847656, 0.2870635986328125, 0.2978782653808594, 0.30869293212890625, 0.3195075988769531, 0.330322265625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 9.0, 8.0, 13.0, 7.0, 25.0, 35.0, 35.0, 38.0, 53.0, 64.0, 57.0, 64.0, 70.0, 63.0, 64.0, 64.0, 70.0, 56.0, 32.0, 55.0, 37.0, 27.0, 18.0, 14.0, 11.0, 9.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.167724609375, -0.1625213623046875, -0.157318115234375, -0.1521148681640625, -0.14691162109375, -0.1417083740234375, -0.136505126953125, -0.1313018798828125, -0.1260986328125, -0.1208953857421875, -0.115692138671875, -0.1104888916015625, -0.10528564453125, -0.1000823974609375, -0.094879150390625, -0.0896759033203125, -0.08447265625, -0.0792694091796875, -0.074066162109375, -0.0688629150390625, -0.06365966796875, -0.0584564208984375, -0.053253173828125, -0.0480499267578125, -0.0428466796875, -0.0376434326171875, -0.032440185546875, -0.0272369384765625, -0.02203369140625, -0.0168304443359375, -0.011627197265625, -0.0064239501953125, -0.001220703125, 0.0039825439453125, 0.009185791015625, 0.0143890380859375, 0.01959228515625, 0.0247955322265625, 0.029998779296875, 0.0352020263671875, 0.0404052734375, 0.0456085205078125, 0.050811767578125, 0.0560150146484375, 0.06121826171875, 0.0664215087890625, 0.071624755859375, 0.0768280029296875, 0.08203125, 0.0872344970703125, 0.092437744140625, 0.0976409912109375, 0.10284423828125, 0.1080474853515625, 0.113250732421875, 0.1184539794921875, 0.1236572265625, 0.1288604736328125, 0.134063720703125, 0.1392669677734375, 0.14447021484375, 0.1496734619140625, 0.154876708984375, 0.1600799560546875, 0.165283203125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 5.0, 4.0, 4.0, 3.0, 4.0, 12.0, 14.0, 20.0, 34.0, 60.0, 158.0, 392.0, 1431.0, 6954.0, 74122.0, 835812.0, 117564.0, 9402.0, 1738.0, 461.0, 164.0, 85.0, 48.0, 18.0, 14.0, 12.0, 10.0, 3.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90283203125, -0.8723068237304688, -0.8417816162109375, -0.8112564086914062, -0.780731201171875, -0.7502059936523438, -0.7196807861328125, -0.6891555786132812, -0.65863037109375, -0.6281051635742188, -0.5975799560546875, -0.5670547485351562, -0.536529541015625, -0.5060043334960938, -0.4754791259765625, -0.44495391845703125, -0.4144287109375, -0.38390350341796875, -0.3533782958984375, -0.32285308837890625, -0.292327880859375, -0.26180267333984375, -0.2312774658203125, -0.20075225830078125, -0.17022705078125, -0.13970184326171875, -0.1091766357421875, -0.07865142822265625, -0.048126220703125, -0.01760101318359375, 0.0129241943359375, 0.04344940185546875, 0.073974609375, 0.10449981689453125, 0.1350250244140625, 0.16555023193359375, 0.196075439453125, 0.22660064697265625, 0.2571258544921875, 0.28765106201171875, 0.31817626953125, 0.34870147705078125, 0.3792266845703125, 0.40975189208984375, 0.440277099609375, 0.47080230712890625, 0.5013275146484375, 0.5318527221679688, 0.5623779296875, 0.5929031372070312, 0.6234283447265625, 0.6539535522460938, 0.684478759765625, 0.7150039672851562, 0.7455291748046875, 0.7760543823242188, 0.80657958984375, 0.8371047973632812, 0.8676300048828125, 0.8981552124023438, 0.928680419921875, 0.9592056274414062, 0.9897308349609375, 1.0202560424804688, 1.05078125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 11.0, 6.0, 7.0, 8.0, 13.0, 14.0, 17.0, 18.0, 35.0, 31.0, 33.0, 32.0, 37.0, 49.0, 48.0, 48.0, 51.0, 53.0, 67.0, 46.0, 54.0, 36.0, 46.0, 31.0, 37.0, 30.0, 26.0, 26.0, 17.0, 17.0, 9.0, 15.0, 9.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.335693359375, -0.32537078857421875, -0.3150482177734375, -0.30472564697265625, -0.294403076171875, -0.28408050537109375, -0.2737579345703125, -0.26343536376953125, -0.25311279296875, -0.24279022216796875, -0.2324676513671875, -0.22214508056640625, -0.211822509765625, -0.20149993896484375, -0.1911773681640625, -0.18085479736328125, -0.1705322265625, -0.16020965576171875, -0.1498870849609375, -0.13956451416015625, -0.129241943359375, -0.11891937255859375, -0.1085968017578125, -0.09827423095703125, -0.08795166015625, -0.07762908935546875, -0.0673065185546875, -0.05698394775390625, -0.046661376953125, -0.03633880615234375, -0.0260162353515625, -0.01569366455078125, -0.00537109375, 0.00495147705078125, 0.0152740478515625, 0.02559661865234375, 0.035919189453125, 0.04624176025390625, 0.0565643310546875, 0.06688690185546875, 0.07720947265625, 0.08753204345703125, 0.0978546142578125, 0.10817718505859375, 0.118499755859375, 0.12882232666015625, 0.1391448974609375, 0.14946746826171875, 0.1597900390625, 0.17011260986328125, 0.1804351806640625, 0.19075775146484375, 0.201080322265625, 0.21140289306640625, 0.2217254638671875, 0.23204803466796875, 0.24237060546875, 0.25269317626953125, 0.2630157470703125, 0.27333831787109375, 0.283660888671875, 0.29398345947265625, 0.3043060302734375, 0.31462860107421875, 0.324951171875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 10.0, 16.0, 14.0, 24.0, 25.0, 36.0, 67.0, 82.0, 145.0, 234.0, 323.0, 518.0, 811.0, 1380.0, 2507.0, 6043.0, 22524.0, 275088.0, 686013.0, 37379.0, 8002.0, 3112.0, 1622.0, 942.0, 571.0, 371.0, 231.0, 157.0, 92.0, 69.0, 47.0, 28.0, 20.0, 13.0, 13.0, 3.0, 6.0, 5.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.345947265625, -0.33663177490234375, -0.3273162841796875, -0.31800079345703125, -0.308685302734375, -0.29936981201171875, -0.2900543212890625, -0.28073883056640625, -0.27142333984375, -0.26210784912109375, -0.2527923583984375, -0.24347686767578125, -0.234161376953125, -0.22484588623046875, -0.2155303955078125, -0.20621490478515625, -0.1968994140625, -0.18758392333984375, -0.1782684326171875, -0.16895294189453125, -0.159637451171875, -0.15032196044921875, -0.1410064697265625, -0.13169097900390625, -0.12237548828125, -0.11305999755859375, -0.1037445068359375, -0.09442901611328125, -0.085113525390625, -0.07579803466796875, -0.0664825439453125, -0.05716705322265625, -0.0478515625, -0.03853607177734375, -0.0292205810546875, -0.01990509033203125, -0.010589599609375, -0.00127410888671875, 0.0080413818359375, 0.01735687255859375, 0.02667236328125, 0.03598785400390625, 0.0453033447265625, 0.05461883544921875, 0.063934326171875, 0.07324981689453125, 0.0825653076171875, 0.09188079833984375, 0.1011962890625, 0.11051177978515625, 0.1198272705078125, 0.12914276123046875, 0.138458251953125, 0.14777374267578125, 0.1570892333984375, 0.16640472412109375, 0.17572021484375, 0.18503570556640625, 0.1943511962890625, 0.20366668701171875, 0.212982177734375, 0.22229766845703125, 0.2316131591796875, 0.24092864990234375, 0.250244140625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 4.0, 5.0, 8.0, 11.0, 10.0, 11.0, 22.0, 23.0, 53.0, 80.0, 167.0, 230.0, 157.0, 66.0, 55.0, 26.0, 19.0, 19.0, 17.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.357099533081055e-05, -4.246830940246582e-05, -4.1365623474121094e-05, -4.026293754577637e-05, -3.916025161743164e-05, -3.8057565689086914e-05, -3.695487976074219e-05, -3.585219383239746e-05, -3.4749507904052734e-05, -3.364682197570801e-05, -3.254413604736328e-05, -3.1441450119018555e-05, -3.0338764190673828e-05, -2.92360782623291e-05, -2.8133392333984375e-05, -2.703070640563965e-05, -2.5928020477294922e-05, -2.4825334548950195e-05, -2.372264862060547e-05, -2.2619962692260742e-05, -2.1517276763916016e-05, -2.041459083557129e-05, -1.9311904907226562e-05, -1.8209218978881836e-05, -1.710653305053711e-05, -1.6003847122192383e-05, -1.4901161193847656e-05, -1.379847526550293e-05, -1.2695789337158203e-05, -1.1593103408813477e-05, -1.049041748046875e-05, -9.387731552124023e-06, -8.285045623779297e-06, -7.18235969543457e-06, -6.079673767089844e-06, -4.976987838745117e-06, -3.874301910400391e-06, -2.771615982055664e-06, -1.6689300537109375e-06, -5.662441253662109e-07, 5.364418029785156e-07, 1.6391277313232422e-06, 2.7418136596679688e-06, 3.844499588012695e-06, 4.947185516357422e-06, 6.0498714447021484e-06, 7.152557373046875e-06, 8.255243301391602e-06, 9.357929229736328e-06, 1.0460615158081055e-05, 1.1563301086425781e-05, 1.2665987014770508e-05, 1.3768672943115234e-05, 1.4871358871459961e-05, 1.5974044799804688e-05, 1.7076730728149414e-05, 1.817941665649414e-05, 1.9282102584838867e-05, 2.0384788513183594e-05, 2.148747444152832e-05, 2.2590160369873047e-05, 2.3692846298217773e-05, 2.47955322265625e-05, 2.5898218154907227e-05, 2.7000904083251953e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 0.0, 3.0, 3.0, 7.0, 7.0, 15.0, 27.0, 67.0, 178.0, 509.0, 1839.0, 16303.0, 1017515.0, 9861.0, 1545.0, 419.0, 133.0, 56.0, 28.0, 17.0, 8.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.802734375, -0.766937255859375, -0.73114013671875, -0.695343017578125, -0.6595458984375, -0.623748779296875, -0.58795166015625, -0.552154541015625, -0.516357421875, -0.480560302734375, -0.44476318359375, -0.408966064453125, -0.3731689453125, -0.337371826171875, -0.30157470703125, -0.265777587890625, -0.22998046875, -0.194183349609375, -0.15838623046875, -0.122589111328125, -0.0867919921875, -0.050994873046875, -0.01519775390625, 0.020599365234375, 0.056396484375, 0.092193603515625, 0.12799072265625, 0.163787841796875, 0.1995849609375, 0.235382080078125, 0.27117919921875, 0.306976318359375, 0.3427734375, 0.378570556640625, 0.41436767578125, 0.450164794921875, 0.4859619140625, 0.521759033203125, 0.55755615234375, 0.593353271484375, 0.629150390625, 0.664947509765625, 0.70074462890625, 0.736541748046875, 0.7723388671875, 0.808135986328125, 0.84393310546875, 0.879730224609375, 0.91552734375, 0.951324462890625, 0.98712158203125, 1.022918701171875, 1.0587158203125, 1.094512939453125, 1.13031005859375, 1.166107177734375, 1.201904296875, 1.237701416015625, 1.27349853515625, 1.309295654296875, 1.3450927734375, 1.380889892578125, 1.41668701171875, 1.452484130859375, 1.48828125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 5.0, 3.0, 4.0, 4.0, 12.0, 19.0, 56.0, 123.0, 286.0, 255.0, 107.0, 63.0, 30.0, 11.0, 9.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.396240234375, -0.3865776062011719, -0.37691497802734375, -0.3672523498535156, -0.3575897216796875, -0.3479270935058594, -0.33826446533203125, -0.3286018371582031, -0.318939208984375, -0.3092765808105469, -0.29961395263671875, -0.2899513244628906, -0.2802886962890625, -0.2706260681152344, -0.26096343994140625, -0.2513008117675781, -0.24163818359375, -0.23197555541992188, -0.22231292724609375, -0.21265029907226562, -0.2029876708984375, -0.19332504272460938, -0.18366241455078125, -0.17399978637695312, -0.164337158203125, -0.15467453002929688, -0.14501190185546875, -0.13534927368164062, -0.1256866455078125, -0.11602401733398438, -0.10636138916015625, -0.09669876098632812, -0.0870361328125, -0.07737350463867188, -0.06771087646484375, -0.058048248291015625, -0.0483856201171875, -0.038722991943359375, -0.02906036376953125, -0.019397735595703125, -0.009735107421875, -7.2479248046875e-05, 0.00959014892578125, 0.019252777099609375, 0.0289154052734375, 0.038578033447265625, 0.04824066162109375, 0.057903289794921875, 0.06756591796875, 0.07722854614257812, 0.08689117431640625, 0.09655380249023438, 0.1062164306640625, 0.11587905883789062, 0.12554168701171875, 0.13520431518554688, 0.144866943359375, 0.15452957153320312, 0.16419219970703125, 0.17385482788085938, 0.1835174560546875, 0.19318008422851562, 0.20284271240234375, 0.21250534057617188, 0.22216796875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 4.0, 5.0, 15.0, 18.0, 52.0, 100.0, 220.0, 263.0, 191.0, 85.0, 23.0, 20.0, 4.0, 3.0, 1.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9868803024291992, -0.8993257880210876, -0.8117712140083313, -0.7242166996002197, -0.6366621255874634, -0.5491076111793518, -0.46155309677124023, -0.3739985227584839, -0.2864440083503723, -0.19888946413993835, -0.11133493483066559, -0.023780405521392822, 0.06377413868904114, 0.1513286828994751, 0.23888319730758667, 0.326437771320343, 0.4139922857284546, 0.5015468001365662, 0.5891013741493225, 0.6766558885574341, 0.7642104625701904, 0.851764976978302, 0.9393194913864136, 1.02687406539917, 1.1144285202026367, 1.201983094215393, 1.2895375490188599, 1.3770921230316162, 1.4646466970443726, 1.552201271057129, 1.6397557258605957, 1.727310299873352, 1.8148648738861084, 1.9024194478988647, 1.9899739027023315, 2.077528476715088, 2.1650829315185547, 2.2526376247406006, 2.3401920795440674, 2.4277467727661133, 2.51530122756958, 2.602855682373047, 2.6904103755950928, 2.7779648303985596, 2.8655192852020264, 2.9530739784240723, 3.040628433227539, 3.128182888031006, 3.2157373428344727, 3.3032917976379395, 3.3908464908599854, 3.478400945663452, 3.565955400466919, 3.653510093688965, 3.7410645484924316, 3.8286190032958984, 3.9161736965179443, 4.00372838973999, 4.091282844543457, 4.178837299346924, 4.266391754150391, 4.353946208953857, 4.441500663757324, 4.529055595397949, 4.616610050201416]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 7.0, 1.0, 1.0, 4.0, 5.0, 2.0, 7.0, 6.0, 4.0, 13.0, 14.0, 17.0, 21.0, 23.0, 21.0, 16.0, 26.0, 32.0, 33.0, 31.0, 23.0, 32.0, 32.0, 40.0, 40.0, 40.0, 32.0, 46.0, 43.0, 35.0, 32.0, 30.0, 41.0, 36.0, 24.0, 33.0, 19.0, 19.0, 16.0, 15.0, 20.0, 16.0, 13.0, 6.0, 3.0, 13.0, 7.0, 11.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7170867919921875, -0.6934553384780884, -0.6698238253593445, -0.6461923718452454, -0.6225608587265015, -0.5989294052124023, -0.5752979516983032, -0.5516664981842041, -0.5280349850654602, -0.5044035315513611, -0.4807720184326172, -0.45714056491851807, -0.43350908160209656, -0.40987759828567505, -0.3862461447715759, -0.3626146614551544, -0.3389831781387329, -0.3153516948223114, -0.2917202115058899, -0.26808875799179077, -0.24445727467536926, -0.22082579135894775, -0.19719432294368744, -0.17356285452842712, -0.14993137121200562, -0.1262998878955841, -0.10266841948032379, -0.07903694361448288, -0.05540546774864197, -0.031773991882801056, -0.008142516016960144, 0.015488952398300171, 0.03912043571472168, 0.06275191158056259, 0.0863833874464035, 0.11001486331224442, 0.13364633917808533, 0.15727782249450684, 0.18090929090976715, 0.20454075932502747, 0.22817224264144897, 0.2518037259578705, 0.275435209274292, 0.2990666627883911, 0.3226981461048126, 0.34632962942123413, 0.36996108293533325, 0.39359256625175476, 0.41722404956817627, 0.4408555328845978, 0.4644870162010193, 0.4881184697151184, 0.5117499828338623, 0.5353814363479614, 0.5590128898620605, 0.5826443433761597, 0.6062758564949036, 0.6299073100090027, 0.6535388231277466, 0.6771702766418457, 0.7008017301559448, 0.7244332432746887, 0.7480646967887878, 0.7716962099075317, 0.7953276634216309]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 10.0, 16.0, 21.0, 42.0, 98.0, 207.0, 463.0, 1449.0, 5421.0, 29493.0, 2798238.0, 1324918.0, 27099.0, 4730.0, 1228.0, 478.0, 208.0, 70.0, 48.0, 17.0, 16.0, 7.0, 6.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.359130859375, -0.3441429138183594, -0.32915496826171875, -0.3141670227050781, -0.2991790771484375, -0.2841911315917969, -0.26920318603515625, -0.2542152404785156, -0.239227294921875, -0.22423934936523438, -0.20925140380859375, -0.19426345825195312, -0.1792755126953125, -0.16428756713867188, -0.14929962158203125, -0.13431167602539062, -0.11932373046875, -0.10433578491210938, -0.08934783935546875, -0.07435989379882812, -0.0593719482421875, -0.044384002685546875, -0.02939605712890625, -0.014408111572265625, 0.000579833984375, 0.015567779541015625, 0.03055572509765625, 0.045543670654296875, 0.0605316162109375, 0.07551956176757812, 0.09050750732421875, 0.10549545288085938, 0.1204833984375, 0.13547134399414062, 0.15045928955078125, 0.16544723510742188, 0.1804351806640625, 0.19542312622070312, 0.21041107177734375, 0.22539901733398438, 0.240386962890625, 0.2553749084472656, 0.27036285400390625, 0.2853507995605469, 0.3003387451171875, 0.3153266906738281, 0.33031463623046875, 0.3453025817871094, 0.36029052734375, 0.3752784729003906, 0.39026641845703125, 0.4052543640136719, 0.4202423095703125, 0.4352302551269531, 0.45021820068359375, 0.4652061462402344, 0.480194091796875, 0.4951820373535156, 0.5101699829101562, 0.5251579284667969, 0.5401458740234375, 0.5551338195800781, 0.5701217651367188, 0.5851097106933594, 0.60009765625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 11.0, 18.0, 22.0, 18.0, 30.0, 38.0, 54.0, 47.0, 58.0, 58.0, 77.0, 71.0, 81.0, 76.0, 62.0, 50.0, 47.0, 40.0, 37.0, 25.0, 26.0, 15.0, 8.0, 11.0, 9.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.170166015625, -0.16481590270996094, -0.15946578979492188, -0.1541156768798828, -0.14876556396484375, -0.1434154510498047, -0.13806533813476562, -0.13271522521972656, -0.1273651123046875, -0.12201499938964844, -0.11666488647460938, -0.11131477355957031, -0.10596466064453125, -0.10061454772949219, -0.09526443481445312, -0.08991432189941406, -0.084564208984375, -0.07921409606933594, -0.07386398315429688, -0.06851387023925781, -0.06316375732421875, -0.05781364440917969, -0.052463531494140625, -0.04711341857910156, -0.0417633056640625, -0.03641319274902344, -0.031063079833984375, -0.025712966918945312, -0.02036285400390625, -0.015012741088867188, -0.009662628173828125, -0.0043125152587890625, 0.00103759765625, 0.0063877105712890625, 0.011737823486328125, 0.017087936401367188, 0.02243804931640625, 0.027788162231445312, 0.033138275146484375, 0.03848838806152344, 0.0438385009765625, 0.04918861389160156, 0.054538726806640625, 0.05988883972167969, 0.06523895263671875, 0.07058906555175781, 0.07593917846679688, 0.08128929138183594, 0.086639404296875, 0.09198951721191406, 0.09733963012695312, 0.10268974304199219, 0.10803985595703125, 0.11338996887207031, 0.11874008178710938, 0.12409019470214844, 0.1294403076171875, 0.13479042053222656, 0.14014053344726562, 0.1454906463623047, 0.15084075927734375, 0.1561908721923828, 0.16154098510742188, 0.16689109802246094, 0.1722412109375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 7.0, 7.0, 5.0, 9.0, 14.0, 21.0, 23.0, 43.0, 45.0, 69.0, 92.0, 149.0, 181.0, 298.0, 589.0, 1218.0, 3265.0, 10881.0, 62709.0, 3688481.0, 390246.0, 25661.0, 6009.0, 2046.0, 877.0, 441.0, 290.0, 182.0, 118.0, 75.0, 65.0, 50.0, 22.0, 27.0, 20.0, 15.0, 7.0, 9.0, 3.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.55517578125, -0.5396575927734375, -0.524139404296875, -0.5086212158203125, -0.49310302734375, -0.4775848388671875, -0.462066650390625, -0.4465484619140625, -0.4310302734375, -0.4155120849609375, -0.399993896484375, -0.3844757080078125, -0.36895751953125, -0.3534393310546875, -0.337921142578125, -0.3224029541015625, -0.306884765625, -0.2913665771484375, -0.275848388671875, -0.2603302001953125, -0.24481201171875, -0.2292938232421875, -0.213775634765625, -0.1982574462890625, -0.1827392578125, -0.1672210693359375, -0.151702880859375, -0.1361846923828125, -0.12066650390625, -0.1051483154296875, -0.089630126953125, -0.0741119384765625, -0.05859375, -0.0430755615234375, -0.027557373046875, -0.0120391845703125, 0.00347900390625, 0.0189971923828125, 0.034515380859375, 0.0500335693359375, 0.0655517578125, 0.0810699462890625, 0.096588134765625, 0.1121063232421875, 0.12762451171875, 0.1431427001953125, 0.158660888671875, 0.1741790771484375, 0.189697265625, 0.2052154541015625, 0.220733642578125, 0.2362518310546875, 0.25177001953125, 0.2672882080078125, 0.282806396484375, 0.2983245849609375, 0.3138427734375, 0.3293609619140625, 0.344879150390625, 0.3603973388671875, 0.37591552734375, 0.3914337158203125, 0.406951904296875, 0.4224700927734375, 0.43798828125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 5.0, 6.0, 12.0, 11.0, 28.0, 50.0, 128.0, 399.0, 2214.0, 837.0, 192.0, 91.0, 40.0, 21.0, 12.0, 11.0, 10.0, 0.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2159423828125, -0.2049999237060547, -0.19405746459960938, -0.18311500549316406, -0.17217254638671875, -0.16123008728027344, -0.15028762817382812, -0.1393451690673828, -0.1284027099609375, -0.11746025085449219, -0.10651779174804688, -0.09557533264160156, -0.08463287353515625, -0.07369041442871094, -0.06274795532226562, -0.05180549621582031, -0.040863037109375, -0.029920578002929688, -0.018978118896484375, -0.008035659790039062, 0.00290679931640625, 0.013849258422851562, 0.024791717529296875, 0.03573417663574219, 0.0466766357421875, 0.05761909484863281, 0.06856155395507812, 0.07950401306152344, 0.09044647216796875, 0.10138893127441406, 0.11233139038085938, 0.12327384948730469, 0.13421630859375, 0.1451587677001953, 0.15610122680664062, 0.16704368591308594, 0.17798614501953125, 0.18892860412597656, 0.19987106323242188, 0.2108135223388672, 0.2217559814453125, 0.2326984405517578, 0.24364089965820312, 0.25458335876464844, 0.26552581787109375, 0.27646827697753906, 0.2874107360839844, 0.2983531951904297, 0.309295654296875, 0.3202381134033203, 0.3311805725097656, 0.34212303161621094, 0.35306549072265625, 0.36400794982910156, 0.3749504089355469, 0.3858928680419922, 0.3968353271484375, 0.4077777862548828, 0.4187202453613281, 0.42966270446777344, 0.44060516357421875, 0.45154762268066406, 0.4624900817871094, 0.4734325408935547, 0.484375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 8.0, 9.0, 19.0, 59.0, 130.0, 234.0, 256.0, 161.0, 63.0, 30.0, 16.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53953617811203, -0.49449628591537476, -0.4494563937187195, -0.4044164717197418, -0.35937657952308655, -0.3143366873264313, -0.2692967653274536, -0.22425687313079834, -0.17921698093414307, -0.1341770887374878, -0.08913718163967133, -0.04409727454185486, 0.000942617654800415, 0.04598250985145569, 0.09102243185043335, 0.13606232404708862, 0.1811022162437439, 0.22614210844039917, 0.27118200063705444, 0.3162219226360321, 0.3612618148326874, 0.40630170702934265, 0.4513416290283203, 0.4963815212249756, 0.5414214134216309, 0.5864613056182861, 0.6315011978149414, 0.6765410900115967, 0.721580982208252, 0.7666208744049072, 0.8116608262062073, 0.8567007184028625, 0.901740550994873, 0.9467804431915283, 0.9918203353881836, 1.0368602275848389, 1.0819001197814941, 1.1269400119781494, 1.1719799041748047, 1.21701979637146, 1.2620596885681152, 1.3070995807647705, 1.3521394729614258, 1.397179365158081, 1.4422192573547363, 1.4872591495513916, 1.5322990417480469, 1.5773389339447021, 1.622378945350647, 1.6674188375473022, 1.7124587297439575, 1.7574986219406128, 1.802538514137268, 1.8475784063339233, 1.8926184177398682, 1.9376583099365234, 1.9826982021331787, 2.027738094329834, 2.0727779865264893, 2.1178178787231445, 2.1628577709198, 2.207897663116455, 2.2529375553131104, 2.2979774475097656, 2.343017339706421]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 7.0, 3.0, 3.0, 5.0, 11.0, 10.0, 15.0, 13.0, 19.0, 25.0, 28.0, 23.0, 36.0, 28.0, 43.0, 57.0, 46.0, 41.0, 46.0, 63.0, 62.0, 48.0, 60.0, 39.0, 41.0, 32.0, 38.0, 35.0, 34.0, 22.0, 18.0, 17.0, 9.0, 7.0, 6.0, 8.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5333893895149231, -0.5170274376869202, -0.5006654858589172, -0.4843035340309143, -0.4679415822029114, -0.45157963037490845, -0.4352177083492279, -0.418855756521225, -0.40249380469322205, -0.3861318528652191, -0.3697699010372162, -0.35340794920921326, -0.3370460271835327, -0.3206840753555298, -0.30432212352752686, -0.2879601716995239, -0.271598219871521, -0.25523626804351807, -0.23887431621551514, -0.2225123792886734, -0.20615042746067047, -0.18978847563266754, -0.1734265387058258, -0.15706458687782288, -0.14070263504981995, -0.12434068322181702, -0.10797873884439468, -0.09161679446697235, -0.07525484263896942, -0.05889289081096649, -0.04253094643354416, -0.026169002056121826, -0.009807109832763672, 0.006554838269948959, 0.02291678637266159, 0.03927873447537422, 0.05564068257808685, 0.07200263440608978, 0.08836457878351212, 0.10472652316093445, 0.12108847498893738, 0.1374504268169403, 0.15381237864494324, 0.17017431557178497, 0.1865362673997879, 0.20289821922779083, 0.21926015615463257, 0.2356221079826355, 0.2519840598106384, 0.26834601163864136, 0.2847079634666443, 0.3010699152946472, 0.31743186712265015, 0.3337938189506531, 0.3501557409763336, 0.36651769280433655, 0.3828796446323395, 0.3992415964603424, 0.41560354828834534, 0.43196550011634827, 0.4483274221420288, 0.46468937397003174, 0.48105132579803467, 0.4974132776260376, 0.5137752294540405]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 7.0, 2.0, 9.0, 18.0, 26.0, 36.0, 72.0, 132.0, 259.0, 658.0, 1928.0, 6953.0, 33524.0, 273130.0, 639616.0, 74257.0, 12910.0, 3201.0, 994.0, 399.0, 172.0, 107.0, 63.0, 33.0, 21.0, 16.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6669921875, -0.6480484008789062, -0.6291046142578125, -0.6101608276367188, -0.591217041015625, -0.5722732543945312, -0.5533294677734375, -0.5343856811523438, -0.51544189453125, -0.49649810791015625, -0.4775543212890625, -0.45861053466796875, -0.439666748046875, -0.42072296142578125, -0.4017791748046875, -0.38283538818359375, -0.3638916015625, -0.34494781494140625, -0.3260040283203125, -0.30706024169921875, -0.288116455078125, -0.26917266845703125, -0.2502288818359375, -0.23128509521484375, -0.21234130859375, -0.19339752197265625, -0.1744537353515625, -0.15550994873046875, -0.136566162109375, -0.11762237548828125, -0.0986785888671875, -0.07973480224609375, -0.060791015625, -0.04184722900390625, -0.0229034423828125, -0.00395965576171875, 0.014984130859375, 0.03392791748046875, 0.0528717041015625, 0.07181549072265625, 0.09075927734375, 0.10970306396484375, 0.1286468505859375, 0.14759063720703125, 0.166534423828125, 0.18547821044921875, 0.2044219970703125, 0.22336578369140625, 0.2423095703125, 0.26125335693359375, 0.2801971435546875, 0.29914093017578125, 0.318084716796875, 0.33702850341796875, 0.3559722900390625, 0.37491607666015625, 0.39385986328125, 0.41280364990234375, 0.4317474365234375, 0.45069122314453125, 0.469635009765625, 0.48857879638671875, 0.5075225830078125, 0.5264663696289062, 0.54541015625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 8.0, 14.0, 18.0, 23.0, 24.0, 41.0, 49.0, 48.0, 54.0, 80.0, 68.0, 77.0, 76.0, 83.0, 57.0, 63.0, 40.0, 43.0, 38.0, 35.0, 22.0, 15.0, 14.0, 8.0, 6.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1802978515625, -0.17447662353515625, -0.1686553955078125, -0.16283416748046875, -0.157012939453125, -0.15119171142578125, -0.1453704833984375, -0.13954925537109375, -0.13372802734375, -0.12790679931640625, -0.1220855712890625, -0.11626434326171875, -0.110443115234375, -0.10462188720703125, -0.0988006591796875, -0.09297943115234375, -0.087158203125, -0.08133697509765625, -0.0755157470703125, -0.06969451904296875, -0.063873291015625, -0.05805206298828125, -0.0522308349609375, -0.04640960693359375, -0.04058837890625, -0.03476715087890625, -0.0289459228515625, -0.02312469482421875, -0.017303466796875, -0.01148223876953125, -0.0056610107421875, 0.00016021728515625, 0.0059814453125, 0.01180267333984375, 0.0176239013671875, 0.02344512939453125, 0.029266357421875, 0.03508758544921875, 0.0409088134765625, 0.04673004150390625, 0.05255126953125, 0.05837249755859375, 0.0641937255859375, 0.07001495361328125, 0.075836181640625, 0.08165740966796875, 0.0874786376953125, 0.09329986572265625, 0.09912109375, 0.10494232177734375, 0.1107635498046875, 0.11658477783203125, 0.122406005859375, 0.12822723388671875, 0.1340484619140625, 0.13986968994140625, 0.14569091796875, 0.15151214599609375, 0.1573333740234375, 0.16315460205078125, 0.168975830078125, 0.17479705810546875, 0.1806182861328125, 0.18643951416015625, 0.1922607421875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 10.0, 14.0, 26.0, 40.0, 47.0, 107.0, 189.0, 491.0, 1162.0, 3744.0, 15739.0, 87370.0, 691818.0, 208935.0, 29295.0, 6569.0, 1778.0, 644.0, 259.0, 122.0, 73.0, 36.0, 31.0, 17.0, 8.0, 7.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.671875, -0.6530532836914062, -0.6342315673828125, -0.6154098510742188, -0.596588134765625, -0.5777664184570312, -0.5589447021484375, -0.5401229858398438, -0.52130126953125, -0.5024795532226562, -0.4836578369140625, -0.46483612060546875, -0.446014404296875, -0.42719268798828125, -0.4083709716796875, -0.38954925537109375, -0.3707275390625, -0.35190582275390625, -0.3330841064453125, -0.31426239013671875, -0.295440673828125, -0.27661895751953125, -0.2577972412109375, -0.23897552490234375, -0.22015380859375, -0.20133209228515625, -0.1825103759765625, -0.16368865966796875, -0.144866943359375, -0.12604522705078125, -0.1072235107421875, -0.08840179443359375, -0.069580078125, -0.05075836181640625, -0.0319366455078125, -0.01311492919921875, 0.005706787109375, 0.02452850341796875, 0.0433502197265625, 0.06217193603515625, 0.08099365234375, 0.09981536865234375, 0.1186370849609375, 0.13745880126953125, 0.156280517578125, 0.17510223388671875, 0.1939239501953125, 0.21274566650390625, 0.2315673828125, 0.25038909912109375, 0.2692108154296875, 0.28803253173828125, 0.306854248046875, 0.32567596435546875, 0.3444976806640625, 0.36331939697265625, 0.38214111328125, 0.40096282958984375, 0.4197845458984375, 0.43860626220703125, 0.457427978515625, 0.47624969482421875, 0.4950714111328125, 0.5138931274414062, 0.53271484375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 10.0, 12.0, 11.0, 15.0, 13.0, 16.0, 17.0, 19.0, 32.0, 25.0, 26.0, 44.0, 42.0, 38.0, 50.0, 64.0, 59.0, 53.0, 49.0, 54.0, 44.0, 50.0, 43.0, 19.0, 35.0, 27.0, 29.0, 28.0, 18.0, 12.0, 8.0, 13.0, 8.0, 13.0, 6.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28515625, -0.27512359619140625, -0.2650909423828125, -0.25505828857421875, -0.245025634765625, -0.23499298095703125, -0.2249603271484375, -0.21492767333984375, -0.20489501953125, -0.19486236572265625, -0.1848297119140625, -0.17479705810546875, -0.164764404296875, -0.15473175048828125, -0.1446990966796875, -0.13466644287109375, -0.1246337890625, -0.11460113525390625, -0.1045684814453125, -0.09453582763671875, -0.084503173828125, -0.07447052001953125, -0.0644378662109375, -0.05440521240234375, -0.04437255859375, -0.03433990478515625, -0.0243072509765625, -0.01427459716796875, -0.004241943359375, 0.00579071044921875, 0.0158233642578125, 0.02585601806640625, 0.035888671875, 0.04592132568359375, 0.0559539794921875, 0.06598663330078125, 0.076019287109375, 0.08605194091796875, 0.0960845947265625, 0.10611724853515625, 0.11614990234375, 0.12618255615234375, 0.1362152099609375, 0.14624786376953125, 0.156280517578125, 0.16631317138671875, 0.1763458251953125, 0.18637847900390625, 0.1964111328125, 0.20644378662109375, 0.2164764404296875, 0.22650909423828125, 0.236541748046875, 0.24657440185546875, 0.2566070556640625, 0.26663970947265625, 0.27667236328125, 0.28670501708984375, 0.2967376708984375, 0.30677032470703125, 0.316802978515625, 0.32683563232421875, 0.3368682861328125, 0.34690093994140625, 0.35693359375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 3.0, 10.0, 12.0, 19.0, 20.0, 37.0, 69.0, 119.0, 206.0, 404.0, 785.0, 1731.0, 3958.0, 10413.0, 30807.0, 112083.0, 473927.0, 308991.0, 71068.0, 21123.0, 7237.0, 2883.0, 1330.0, 572.0, 305.0, 179.0, 101.0, 55.0, 35.0, 29.0, 17.0, 13.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08258056640625, -0.07961368560791016, -0.07664680480957031, -0.07367992401123047, -0.07071304321289062, -0.06774616241455078, -0.06477928161621094, -0.061812400817871094, -0.05884552001953125, -0.055878639221191406, -0.05291175842285156, -0.04994487762451172, -0.046977996826171875, -0.04401111602783203, -0.04104423522949219, -0.038077354431152344, -0.0351104736328125, -0.032143592834472656, -0.029176712036132812, -0.02620983123779297, -0.023242950439453125, -0.02027606964111328, -0.017309188842773438, -0.014342308044433594, -0.01137542724609375, -0.008408546447753906, -0.0054416656494140625, -0.0024747848510742188, 0.000492095947265625, 0.0034589767456054688, 0.0064258575439453125, 0.009392738342285156, 0.012359619140625, 0.015326499938964844, 0.018293380737304688, 0.02126026153564453, 0.024227142333984375, 0.02719402313232422, 0.030160903930664062, 0.033127784729003906, 0.03609466552734375, 0.039061546325683594, 0.04202842712402344, 0.04499530792236328, 0.047962188720703125, 0.05092906951904297, 0.05389595031738281, 0.056862831115722656, 0.0598297119140625, 0.06279659271240234, 0.06576347351074219, 0.06873035430908203, 0.07169723510742188, 0.07466411590576172, 0.07763099670410156, 0.0805978775024414, 0.08356475830078125, 0.0865316390991211, 0.08949851989746094, 0.09246540069580078, 0.09543228149414062, 0.09839916229248047, 0.10136604309082031, 0.10433292388916016, 0.1072998046875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 2.0, 13.0, 7.0, 23.0, 21.0, 44.0, 62.0, 84.0, 133.0, 143.0, 143.0, 97.0, 73.0, 43.0, 28.0, 16.0, 14.0, 10.0, 11.0, 7.0, 4.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.181529998779297e-05, -2.1236948668956757e-05, -2.0658597350120544e-05, -2.0080246031284332e-05, -1.950189471244812e-05, -1.8923543393611908e-05, -1.8345192074775696e-05, -1.7766840755939484e-05, -1.718848943710327e-05, -1.661013811826706e-05, -1.6031786799430847e-05, -1.5453435480594635e-05, -1.4875084161758423e-05, -1.429673284292221e-05, -1.3718381524085999e-05, -1.3140030205249786e-05, -1.2561678886413574e-05, -1.1983327567577362e-05, -1.140497624874115e-05, -1.0826624929904938e-05, -1.0248273611068726e-05, -9.669922292232513e-06, -9.091570973396301e-06, -8.513219654560089e-06, -7.934868335723877e-06, -7.356517016887665e-06, -6.778165698051453e-06, -6.1998143792152405e-06, -5.621463060379028e-06, -5.043111741542816e-06, -4.464760422706604e-06, -3.886409103870392e-06, -3.3080577850341797e-06, -2.7297064661979675e-06, -2.1513551473617554e-06, -1.5730038285255432e-06, -9.94652509689331e-07, -4.163011908531189e-07, 1.6205012798309326e-07, 7.404014468193054e-07, 1.3187527656555176e-06, 1.8971040844917297e-06, 2.475455403327942e-06, 3.053806722164154e-06, 3.632158041000366e-06, 4.210509359836578e-06, 4.7888606786727905e-06, 5.367211997509003e-06, 5.945563316345215e-06, 6.523914635181427e-06, 7.102265954017639e-06, 7.680617272853851e-06, 8.258968591690063e-06, 8.837319910526276e-06, 9.415671229362488e-06, 9.9940225481987e-06, 1.0572373867034912e-05, 1.1150725185871124e-05, 1.1729076504707336e-05, 1.2307427823543549e-05, 1.288577914237976e-05, 1.3464130461215973e-05, 1.4042481780052185e-05, 1.4620833098888397e-05, 1.519918441772461e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 3.0, 13.0, 17.0, 26.0, 33.0, 66.0, 133.0, 335.0, 963.0, 3131.0, 17025.0, 203891.0, 756509.0, 56445.0, 7225.0, 1684.0, 520.0, 239.0, 110.0, 56.0, 33.0, 20.0, 18.0, 12.0, 7.0, 14.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2220458984375, -0.21556663513183594, -0.20908737182617188, -0.2026081085205078, -0.19612884521484375, -0.1896495819091797, -0.18317031860351562, -0.17669105529785156, -0.1702117919921875, -0.16373252868652344, -0.15725326538085938, -0.1507740020751953, -0.14429473876953125, -0.1378154754638672, -0.13133621215820312, -0.12485694885253906, -0.118377685546875, -0.11189842224121094, -0.10541915893554688, -0.09893989562988281, -0.09246063232421875, -0.08598136901855469, -0.07950210571289062, -0.07302284240722656, -0.0665435791015625, -0.06006431579589844, -0.053585052490234375, -0.04710578918457031, -0.04062652587890625, -0.03414726257324219, -0.027667999267578125, -0.021188735961914062, -0.01470947265625, -0.008230209350585938, -0.001750946044921875, 0.0047283172607421875, 0.01120758056640625, 0.017686843872070312, 0.024166107177734375, 0.030645370483398438, 0.0371246337890625, 0.04360389709472656, 0.050083160400390625, 0.05656242370605469, 0.06304168701171875, 0.06952095031738281, 0.07600021362304688, 0.08247947692871094, 0.088958740234375, 0.09543800354003906, 0.10191726684570312, 0.10839653015136719, 0.11487579345703125, 0.12135505676269531, 0.12783432006835938, 0.13431358337402344, 0.1407928466796875, 0.14727210998535156, 0.15375137329101562, 0.1602306365966797, 0.16670989990234375, 0.1731891632080078, 0.17966842651367188, 0.18614768981933594, 0.192626953125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 6.0, 1.0, 6.0, 3.0, 2.0, 5.0, 13.0, 14.0, 18.0, 14.0, 24.0, 19.0, 30.0, 42.0, 39.0, 75.0, 60.0, 57.0, 66.0, 81.0, 84.0, 63.0, 69.0, 41.0, 34.0, 30.0, 33.0, 18.0, 15.0, 13.0, 8.0, 5.0, 5.0, 1.0, 3.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07122802734375, -0.06891632080078125, -0.0666046142578125, -0.06429290771484375, -0.061981201171875, -0.05966949462890625, -0.0573577880859375, -0.05504608154296875, -0.052734375, -0.05042266845703125, -0.0481109619140625, -0.04579925537109375, -0.043487548828125, -0.04117584228515625, -0.0388641357421875, -0.03655242919921875, -0.03424072265625, -0.03192901611328125, -0.0296173095703125, -0.02730560302734375, -0.024993896484375, -0.02268218994140625, -0.0203704833984375, -0.01805877685546875, -0.0157470703125, -0.01343536376953125, -0.0111236572265625, -0.00881195068359375, -0.006500244140625, -0.00418853759765625, -0.0018768310546875, 0.00043487548828125, 0.00274658203125, 0.00505828857421875, 0.0073699951171875, 0.00968170166015625, 0.011993408203125, 0.01430511474609375, 0.0166168212890625, 0.01892852783203125, 0.021240234375, 0.02355194091796875, 0.0258636474609375, 0.02817535400390625, 0.030487060546875, 0.03279876708984375, 0.0351104736328125, 0.03742218017578125, 0.03973388671875, 0.04204559326171875, 0.0443572998046875, 0.04666900634765625, 0.048980712890625, 0.05129241943359375, 0.0536041259765625, 0.05591583251953125, 0.0582275390625, 0.06053924560546875, 0.0628509521484375, 0.06516265869140625, 0.067474365234375, 0.06978607177734375, 0.0720977783203125, 0.07440948486328125, 0.07672119140625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 8.0, 58.0, 258.0, 513.0, 147.0, 23.0, 4.0, 4.0], "bins": [-9.007247924804688, -8.855456352233887, -8.70366382598877, -8.551872253417969, -8.400079727172852, -8.24828815460205, -8.09649658203125, -7.944704055786133, -7.792912483215332, -7.641120433807373, -7.489328384399414, -7.337536811828613, -7.185744762420654, -7.033952713012695, -6.882160663604736, -6.730368614196777, -6.578576564788818, -6.426784515380859, -6.2749924659729, -6.1232008934021, -5.971408843994141, -5.819616794586182, -5.667824745178223, -5.516032695770264, -5.364240646362305, -5.212448596954346, -5.060656547546387, -4.908864974975586, -4.757072925567627, -4.605280876159668, -4.453488826751709, -4.30169677734375, -4.149905204772949, -3.9981131553649902, -3.8463213443756104, -3.6945292949676514, -3.5427374839782715, -3.3909454345703125, -3.2391533851623535, -3.0873613357543945, -2.9355692863464355, -2.7837772369384766, -2.6319854259490967, -2.4801933765411377, -2.328401565551758, -2.176609516143799, -2.02481746673584, -1.8730255365371704, -1.721233606338501, -1.5694416761398315, -1.417649745941162, -1.2658576965332031, -1.1140657663345337, -0.9622738361358643, -0.81048184633255, -0.6586898565292358, -0.5068979263305664, -0.3551059663295746, -0.20331400632858276, -0.05152204632759094, 0.10026991367340088, 0.2520618438720703, 0.4038538336753845, 0.5556458234786987, 0.7074377536773682]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 5.0, 6.0, 7.0, 10.0, 9.0, 21.0, 31.0, 31.0, 25.0, 31.0, 38.0, 37.0, 44.0, 41.0, 43.0, 44.0, 50.0, 47.0, 47.0, 42.0, 42.0, 43.0, 36.0, 39.0, 32.0, 28.0, 22.0, 27.0, 14.0, 24.0, 6.0, 22.0, 10.0, 4.0, 13.0, 8.0, 4.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8458569049835205, -0.8200733065605164, -0.794289767742157, -0.7685061693191528, -0.7427226305007935, -0.7169390320777893, -0.6911554336547852, -0.6653718948364258, -0.6395882964134216, -0.6138046979904175, -0.5880211591720581, -0.562237560749054, -0.5364539623260498, -0.5106704235076904, -0.4848868250846863, -0.4591032564640045, -0.43331968784332275, -0.407536119222641, -0.38175255060195923, -0.3559689521789551, -0.3301853835582733, -0.30440181493759155, -0.2786182165145874, -0.25283464789390564, -0.22705107927322388, -0.20126751065254211, -0.17548392713069916, -0.1497003436088562, -0.12391677498817444, -0.09813320636749268, -0.07234962284564972, -0.04656603932380676, -0.020782411098480225, 0.005001164972782135, 0.030784741044044495, 0.056568317115306854, 0.08235189318656921, 0.10813546180725098, 0.13391904532909393, 0.1597026288509369, 0.18548619747161865, 0.21126976609230042, 0.23705334961414337, 0.26283693313598633, 0.2886205017566681, 0.31440407037734985, 0.340187668800354, 0.36597123742103577, 0.39175480604171753, 0.4175383746623993, 0.44332194328308105, 0.4691055417060852, 0.49488911032676697, 0.5206726789474487, 0.5464562773704529, 0.572239875793457, 0.5980234146118164, 0.6238070130348206, 0.6495905518531799, 0.6753741502761841, 0.7011576890945435, 0.7269412875175476, 0.7527248859405518, 0.7785084247589111, 0.8042920231819153]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 4.0, 8.0, 8.0, 9.0, 14.0, 34.0, 58.0, 85.0, 181.0, 363.0, 696.0, 1652.0, 3877.0, 9647.0, 35278.0, 513145.0, 3388222.0, 203073.0, 25254.0, 7662.0, 2762.0, 1160.0, 532.0, 262.0, 138.0, 57.0, 42.0, 28.0, 11.0, 9.0, 3.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.271484375, -0.26190948486328125, -0.2523345947265625, -0.24275970458984375, -0.233184814453125, -0.22360992431640625, -0.2140350341796875, -0.20446014404296875, -0.19488525390625, -0.18531036376953125, -0.1757354736328125, -0.16616058349609375, -0.156585693359375, -0.14701080322265625, -0.1374359130859375, -0.12786102294921875, -0.1182861328125, -0.10871124267578125, -0.0991363525390625, -0.08956146240234375, -0.079986572265625, -0.07041168212890625, -0.0608367919921875, -0.05126190185546875, -0.04168701171875, -0.03211212158203125, -0.0225372314453125, -0.01296234130859375, -0.003387451171875, 0.00618743896484375, 0.0157623291015625, 0.02533721923828125, 0.034912109375, 0.04448699951171875, 0.0540618896484375, 0.06363677978515625, 0.073211669921875, 0.08278656005859375, 0.0923614501953125, 0.10193634033203125, 0.11151123046875, 0.12108612060546875, 0.1306610107421875, 0.14023590087890625, 0.149810791015625, 0.15938568115234375, 0.1689605712890625, 0.17853546142578125, 0.1881103515625, 0.19768524169921875, 0.2072601318359375, 0.21683502197265625, 0.226409912109375, 0.23598480224609375, 0.2455596923828125, 0.25513458251953125, 0.26470947265625, 0.27428436279296875, 0.2838592529296875, 0.29343414306640625, 0.303009033203125, 0.31258392333984375, 0.3221588134765625, 0.33173370361328125, 0.34130859375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 10.0, 5.0, 12.0, 14.0, 32.0, 34.0, 37.0, 35.0, 58.0, 54.0, 70.0, 75.0, 66.0, 84.0, 74.0, 54.0, 59.0, 41.0, 40.0, 42.0, 33.0, 27.0, 16.0, 10.0, 9.0, 3.0, 7.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1751708984375, -0.16968536376953125, -0.1641998291015625, -0.15871429443359375, -0.153228759765625, -0.14774322509765625, -0.1422576904296875, -0.13677215576171875, -0.13128662109375, -0.12580108642578125, -0.1203155517578125, -0.11483001708984375, -0.109344482421875, -0.10385894775390625, -0.0983734130859375, -0.09288787841796875, -0.08740234375, -0.08191680908203125, -0.0764312744140625, -0.07094573974609375, -0.065460205078125, -0.05997467041015625, -0.0544891357421875, -0.04900360107421875, -0.04351806640625, -0.03803253173828125, -0.0325469970703125, -0.02706146240234375, -0.021575927734375, -0.01609039306640625, -0.0106048583984375, -0.00511932373046875, 0.0003662109375, 0.00585174560546875, 0.0113372802734375, 0.01682281494140625, 0.022308349609375, 0.02779388427734375, 0.0332794189453125, 0.03876495361328125, 0.04425048828125, 0.04973602294921875, 0.0552215576171875, 0.06070709228515625, 0.066192626953125, 0.07167816162109375, 0.0771636962890625, 0.08264923095703125, 0.088134765625, 0.09362030029296875, 0.0991058349609375, 0.10459136962890625, 0.110076904296875, 0.11556243896484375, 0.1210479736328125, 0.12653350830078125, 0.13201904296875, 0.13750457763671875, 0.1429901123046875, 0.14847564697265625, 0.153961181640625, 0.15944671630859375, 0.1649322509765625, 0.17041778564453125, 0.1759033203125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 7.0, 9.0, 8.0, 27.0, 17.0, 34.0, 38.0, 51.0, 62.0, 85.0, 103.0, 175.0, 215.0, 284.0, 402.0, 603.0, 936.0, 1473.0, 2406.0, 4037.0, 7302.0, 15445.0, 37590.0, 123946.0, 1253301.0, 2493194.0, 168223.0, 45675.0, 18062.0, 8400.0, 4610.0, 2686.0, 1633.0, 971.0, 639.0, 441.0, 314.0, 237.0, 161.0, 105.0, 102.0, 74.0, 50.0, 43.0, 27.0, 29.0, 18.0, 16.0, 7.0, 9.0, 4.0, 1.0, 0.0, 0.0, 2.0, 3.0], "bins": [-0.207763671875, -0.20148658752441406, -0.19520950317382812, -0.1889324188232422, -0.18265533447265625, -0.1763782501220703, -0.17010116577148438, -0.16382408142089844, -0.1575469970703125, -0.15126991271972656, -0.14499282836914062, -0.1387157440185547, -0.13243865966796875, -0.1261615753173828, -0.11988449096679688, -0.11360740661621094, -0.107330322265625, -0.10105323791503906, -0.09477615356445312, -0.08849906921386719, -0.08222198486328125, -0.07594490051269531, -0.06966781616210938, -0.06339073181152344, -0.0571136474609375, -0.05083656311035156, -0.044559478759765625, -0.03828239440917969, -0.03200531005859375, -0.025728225708007812, -0.019451141357421875, -0.013174057006835938, -0.00689697265625, -0.0006198883056640625, 0.005657196044921875, 0.011934280395507812, 0.01821136474609375, 0.024488449096679688, 0.030765533447265625, 0.03704261779785156, 0.0433197021484375, 0.04959678649902344, 0.055873870849609375, 0.06215095520019531, 0.06842803955078125, 0.07470512390136719, 0.08098220825195312, 0.08725929260253906, 0.093536376953125, 0.09981346130371094, 0.10609054565429688, 0.11236763000488281, 0.11864471435546875, 0.12492179870605469, 0.13119888305664062, 0.13747596740722656, 0.1437530517578125, 0.15003013610839844, 0.15630722045898438, 0.1625843048095703, 0.16886138916015625, 0.1751384735107422, 0.18141555786132812, 0.18769264221191406, 0.1939697265625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 1.0, 6.0, 12.0, 16.0, 12.0, 21.0, 23.0, 61.0, 90.0, 136.0, 353.0, 828.0, 1405.0, 572.0, 233.0, 95.0, 60.0, 44.0, 23.0, 20.0, 17.0, 10.0, 4.0, 4.0, 7.0, 7.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2481689453125, -0.2405071258544922, -0.23284530639648438, -0.22518348693847656, -0.21752166748046875, -0.20985984802246094, -0.20219802856445312, -0.1945362091064453, -0.1868743896484375, -0.1792125701904297, -0.17155075073242188, -0.16388893127441406, -0.15622711181640625, -0.14856529235839844, -0.14090347290039062, -0.1332416534423828, -0.125579833984375, -0.11791801452636719, -0.11025619506835938, -0.10259437561035156, -0.09493255615234375, -0.08727073669433594, -0.07960891723632812, -0.07194709777832031, -0.0642852783203125, -0.05662345886230469, -0.048961639404296875, -0.04129981994628906, -0.03363800048828125, -0.025976181030273438, -0.018314361572265625, -0.010652542114257812, -0.00299072265625, 0.0046710968017578125, 0.012332916259765625, 0.019994735717773438, 0.02765655517578125, 0.03531837463378906, 0.042980194091796875, 0.05064201354980469, 0.0583038330078125, 0.06596565246582031, 0.07362747192382812, 0.08128929138183594, 0.08895111083984375, 0.09661293029785156, 0.10427474975585938, 0.11193656921386719, 0.119598388671875, 0.1272602081298828, 0.13492202758789062, 0.14258384704589844, 0.15024566650390625, 0.15790748596191406, 0.16556930541992188, 0.1732311248779297, 0.1808929443359375, 0.1885547637939453, 0.19621658325195312, 0.20387840270996094, 0.21154022216796875, 0.21920204162597656, 0.22686386108398438, 0.2345256805419922, 0.2421875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 5.0, 12.0, 15.0, 20.0, 37.0, 68.0, 111.0, 173.0, 204.0, 143.0, 84.0, 51.0, 26.0, 21.0, 11.0, 6.0, 4.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9763112664222717, -0.9373905658721924, -0.898469865322113, -0.8595491647720337, -0.8206284046173096, -0.781707763671875, -0.7427870035171509, -0.7038663029670715, -0.6649456024169922, -0.6260249018669128, -0.5871042013168335, -0.5481835007667542, -0.5092628002166748, -0.47034206986427307, -0.43142133951187134, -0.392500638961792, -0.35357993841171265, -0.3146592378616333, -0.27573853731155396, -0.23681780695915222, -0.19789710640907288, -0.15897640585899353, -0.12005569040775299, -0.08113497495651245, -0.042214274406433105, -0.003293566405773163, 0.03562714159488678, 0.07454784959554672, 0.11346855759620667, 0.152389258146286, 0.19130997359752655, 0.2302306890487671, 0.26915132999420166, 0.308072030544281, 0.34699273109436035, 0.3859134614467621, 0.42483416199684143, 0.4637548625469208, 0.5026755928993225, 0.5415962934494019, 0.5805169939994812, 0.6194376945495605, 0.6583583950996399, 0.6972790956497192, 0.7361998558044434, 0.7751204967498779, 0.814041256904602, 0.8529619574546814, 0.8918826580047607, 0.9308033585548401, 0.9697240591049194, 1.0086448192596436, 1.0475654602050781, 1.0864862203598022, 1.1254068613052368, 1.164327621459961, 1.2032482624053955, 1.2421690225601196, 1.2810896635055542, 1.3200104236602783, 1.358931064605713, 1.397851824760437, 1.4367724657058716, 1.4756932258605957, 1.5146139860153198]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 5.0, 9.0, 5.0, 8.0, 11.0, 10.0, 15.0, 10.0, 18.0, 20.0, 17.0, 21.0, 22.0, 25.0, 35.0, 28.0, 25.0, 42.0, 40.0, 43.0, 32.0, 43.0, 44.0, 35.0, 42.0, 29.0, 37.0, 40.0, 39.0, 32.0, 25.0, 28.0, 27.0, 14.0, 14.0, 21.0, 19.0, 14.0, 10.0, 6.0, 9.0, 7.0, 9.0, 4.0, 5.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.5011609792709351, -0.4860773980617523, -0.4709937870502472, -0.45591020584106445, -0.4408266246318817, -0.4257430136203766, -0.41065943241119385, -0.3955758213996887, -0.380492240190506, -0.36540865898132324, -0.3503250479698181, -0.3352414667606354, -0.32015788555145264, -0.3050742745399475, -0.28999069333076477, -0.27490711212158203, -0.2598235011100769, -0.24473990499973297, -0.22965632379055023, -0.2145727276802063, -0.19948913156986237, -0.18440553545951843, -0.1693219542503357, -0.15423835813999176, -0.13915479183197021, -0.12407120317220688, -0.10898760706186295, -0.09390401840209961, -0.07882042229175568, -0.06373683363199234, -0.048653244972229004, -0.03356964886188507, -0.018486052751541138, -0.0034024612978100777, 0.011681130155920982, 0.026764720678329468, 0.0418483130633831, 0.05693190544843674, 0.07201549410820007, 0.087099090218544, 0.10218267887830734, 0.11726626753807068, 0.1323498636484146, 0.14743345975875854, 0.16251704096794128, 0.17760063707828522, 0.19268423318862915, 0.2077678143978119, 0.22285141050815582, 0.23793500661849976, 0.2530185878276825, 0.26810216903686523, 0.28318578004837036, 0.2982693612575531, 0.31335294246673584, 0.32843655347824097, 0.3435201346874237, 0.35860371589660645, 0.3736873269081116, 0.3887709081172943, 0.40385448932647705, 0.4189381003379822, 0.4340216815471649, 0.44910526275634766, 0.4641888737678528]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 8.0, 6.0, 11.0, 11.0, 4.0, 23.0, 37.0, 42.0, 53.0, 114.0, 195.0, 350.0, 753.0, 1844.0, 4712.0, 13523.0, 41652.0, 151757.0, 516803.0, 228324.0, 59409.0, 18297.0, 6308.0, 2294.0, 978.0, 467.0, 207.0, 111.0, 73.0, 54.0, 39.0, 21.0, 21.0, 16.0, 9.0, 10.0, 11.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.495361328125, -0.4806365966796875, -0.465911865234375, -0.4511871337890625, -0.43646240234375, -0.4217376708984375, -0.407012939453125, -0.3922882080078125, -0.3775634765625, -0.3628387451171875, -0.348114013671875, -0.3333892822265625, -0.31866455078125, -0.3039398193359375, -0.289215087890625, -0.2744903564453125, -0.259765625, -0.2450408935546875, -0.230316162109375, -0.2155914306640625, -0.20086669921875, -0.1861419677734375, -0.171417236328125, -0.1566925048828125, -0.1419677734375, -0.1272430419921875, -0.112518310546875, -0.0977935791015625, -0.08306884765625, -0.0683441162109375, -0.053619384765625, -0.0388946533203125, -0.024169921875, -0.0094451904296875, 0.005279541015625, 0.0200042724609375, 0.03472900390625, 0.0494537353515625, 0.064178466796875, 0.0789031982421875, 0.0936279296875, 0.1083526611328125, 0.123077392578125, 0.1378021240234375, 0.15252685546875, 0.1672515869140625, 0.181976318359375, 0.1967010498046875, 0.21142578125, 0.2261505126953125, 0.240875244140625, 0.2555999755859375, 0.27032470703125, 0.2850494384765625, 0.299774169921875, 0.3144989013671875, 0.3292236328125, 0.3439483642578125, 0.358673095703125, 0.3733978271484375, 0.38812255859375, 0.4028472900390625, 0.417572021484375, 0.4322967529296875, 0.447021484375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 12.0, 14.0, 14.0, 25.0, 43.0, 29.0, 59.0, 61.0, 72.0, 82.0, 67.0, 79.0, 65.0, 81.0, 57.0, 54.0, 51.0, 35.0, 35.0, 21.0, 16.0, 8.0, 7.0, 4.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1768798828125, -0.1710071563720703, -0.16513442993164062, -0.15926170349121094, -0.15338897705078125, -0.14751625061035156, -0.14164352416992188, -0.1357707977294922, -0.1298980712890625, -0.12402534484863281, -0.11815261840820312, -0.11227989196777344, -0.10640716552734375, -0.10053443908691406, -0.09466171264648438, -0.08878898620605469, -0.082916259765625, -0.07704353332519531, -0.07117080688476562, -0.06529808044433594, -0.05942535400390625, -0.05355262756347656, -0.047679901123046875, -0.04180717468261719, -0.0359344482421875, -0.030061721801757812, -0.024188995361328125, -0.018316268920898438, -0.01244354248046875, -0.0065708160400390625, -0.000698089599609375, 0.0051746368408203125, 0.01104736328125, 0.016920089721679688, 0.022792816162109375, 0.028665542602539062, 0.03453826904296875, 0.04041099548339844, 0.046283721923828125, 0.05215644836425781, 0.0580291748046875, 0.06390190124511719, 0.06977462768554688, 0.07564735412597656, 0.08152008056640625, 0.08739280700683594, 0.09326553344726562, 0.09913825988769531, 0.105010986328125, 0.11088371276855469, 0.11675643920898438, 0.12262916564941406, 0.12850189208984375, 0.13437461853027344, 0.14024734497070312, 0.1461200714111328, 0.1519927978515625, 0.1578655242919922, 0.16373825073242188, 0.16961097717285156, 0.17548370361328125, 0.18135643005371094, 0.18722915649414062, 0.1931018829345703, 0.198974609375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 0.0, 1.0, 5.0, 6.0, 7.0, 5.0, 9.0, 12.0, 10.0, 14.0, 32.0, 33.0, 41.0, 77.0, 156.0, 394.0, 1334.0, 5675.0, 34521.0, 343507.0, 595296.0, 56186.0, 8441.0, 1737.0, 566.0, 200.0, 93.0, 47.0, 23.0, 29.0, 21.0, 21.0, 9.0, 9.0, 8.0, 6.0, 8.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.92041015625, -0.894927978515625, -0.86944580078125, -0.843963623046875, -0.8184814453125, -0.792999267578125, -0.76751708984375, -0.742034912109375, -0.716552734375, -0.691070556640625, -0.66558837890625, -0.640106201171875, -0.6146240234375, -0.589141845703125, -0.56365966796875, -0.538177490234375, -0.5126953125, -0.487213134765625, -0.46173095703125, -0.436248779296875, -0.4107666015625, -0.385284423828125, -0.35980224609375, -0.334320068359375, -0.308837890625, -0.283355712890625, -0.25787353515625, -0.232391357421875, -0.2069091796875, -0.181427001953125, -0.15594482421875, -0.130462646484375, -0.10498046875, -0.079498291015625, -0.05401611328125, -0.028533935546875, -0.0030517578125, 0.022430419921875, 0.04791259765625, 0.073394775390625, 0.098876953125, 0.124359130859375, 0.14984130859375, 0.175323486328125, 0.2008056640625, 0.226287841796875, 0.25177001953125, 0.277252197265625, 0.302734375, 0.328216552734375, 0.35369873046875, 0.379180908203125, 0.4046630859375, 0.430145263671875, 0.45562744140625, 0.481109619140625, 0.506591796875, 0.532073974609375, 0.55755615234375, 0.583038330078125, 0.6085205078125, 0.634002685546875, 0.65948486328125, 0.684967041015625, 0.71044921875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 8.0, 3.0, 6.0, 2.0, 7.0, 16.0, 12.0, 22.0, 17.0, 18.0, 22.0, 25.0, 25.0, 33.0, 29.0, 35.0, 47.0, 49.0, 44.0, 42.0, 46.0, 45.0, 51.0, 49.0, 47.0, 43.0, 47.0, 29.0, 34.0, 24.0, 18.0, 18.0, 20.0, 16.0, 9.0, 10.0, 13.0, 5.0, 8.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.327880859375, -0.3178291320800781, -0.30777740478515625, -0.2977256774902344, -0.2876739501953125, -0.2776222229003906, -0.26757049560546875, -0.2575187683105469, -0.247467041015625, -0.23741531372070312, -0.22736358642578125, -0.21731185913085938, -0.2072601318359375, -0.19720840454101562, -0.18715667724609375, -0.17710494995117188, -0.16705322265625, -0.15700149536132812, -0.14694976806640625, -0.13689804077148438, -0.1268463134765625, -0.11679458618164062, -0.10674285888671875, -0.09669113159179688, -0.086639404296875, -0.07658767700195312, -0.06653594970703125, -0.056484222412109375, -0.0464324951171875, -0.036380767822265625, -0.02632904052734375, -0.016277313232421875, -0.0062255859375, 0.003826141357421875, 0.01387786865234375, 0.023929595947265625, 0.0339813232421875, 0.044033050537109375, 0.05408477783203125, 0.06413650512695312, 0.074188232421875, 0.08423995971679688, 0.09429168701171875, 0.10434341430664062, 0.1143951416015625, 0.12444686889648438, 0.13449859619140625, 0.14455032348632812, 0.15460205078125, 0.16465377807617188, 0.17470550537109375, 0.18475723266601562, 0.1948089599609375, 0.20486068725585938, 0.21491241455078125, 0.22496414184570312, 0.235015869140625, 0.24506759643554688, 0.25511932373046875, 0.2651710510253906, 0.2752227783203125, 0.2852745056152344, 0.29532623291015625, 0.3053779602050781, 0.3154296875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 3.0, 9.0, 14.0, 24.0, 32.0, 80.0, 124.0, 264.0, 731.0, 2427.0, 11000.0, 92991.0, 788766.0, 132990.0, 14630.0, 3033.0, 858.0, 275.0, 134.0, 74.0, 36.0, 19.0, 16.0, 6.0, 9.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.154296875, -0.14714431762695312, -0.13999176025390625, -0.13283920288085938, -0.1256866455078125, -0.11853408813476562, -0.11138153076171875, -0.10422897338867188, -0.097076416015625, -0.08992385864257812, -0.08277130126953125, -0.07561874389648438, -0.0684661865234375, -0.061313629150390625, -0.05416107177734375, -0.047008514404296875, -0.03985595703125, -0.032703399658203125, -0.02555084228515625, -0.018398284912109375, -0.0112457275390625, -0.004093170166015625, 0.00305938720703125, 0.010211944580078125, 0.017364501953125, 0.024517059326171875, 0.03166961669921875, 0.038822174072265625, 0.0459747314453125, 0.053127288818359375, 0.06027984619140625, 0.06743240356445312, 0.0745849609375, 0.08173751831054688, 0.08889007568359375, 0.09604263305664062, 0.1031951904296875, 0.11034774780273438, 0.11750030517578125, 0.12465286254882812, 0.131805419921875, 0.13895797729492188, 0.14611053466796875, 0.15326309204101562, 0.1604156494140625, 0.16756820678710938, 0.17472076416015625, 0.18187332153320312, 0.18902587890625, 0.19617843627929688, 0.20333099365234375, 0.21048355102539062, 0.2176361083984375, 0.22478866577148438, 0.23194122314453125, 0.23909378051757812, 0.246246337890625, 0.2533988952636719, 0.26055145263671875, 0.2677040100097656, 0.2748565673828125, 0.2820091247558594, 0.28916168212890625, 0.2963142395019531, 0.303466796875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 10.0, 13.0, 22.0, 27.0, 36.0, 71.0, 102.0, 244.0, 181.0, 107.0, 46.0, 39.0, 31.0, 14.0, 16.0, 9.0, 11.0, 4.0, 7.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.124641418457031e-05, -4.003103822469711e-05, -3.8815662264823914e-05, -3.7600286304950714e-05, -3.6384910345077515e-05, -3.5169534385204315e-05, -3.3954158425331116e-05, -3.2738782465457916e-05, -3.152340650558472e-05, -3.0308030545711517e-05, -2.9092654585838318e-05, -2.787727862596512e-05, -2.666190266609192e-05, -2.544652670621872e-05, -2.423115074634552e-05, -2.301577478647232e-05, -2.180039882659912e-05, -2.058502286672592e-05, -1.9369646906852722e-05, -1.8154270946979523e-05, -1.6938894987106323e-05, -1.5723519027233124e-05, -1.4508143067359924e-05, -1.3292767107486725e-05, -1.2077391147613525e-05, -1.0862015187740326e-05, -9.646639227867126e-06, -8.431263267993927e-06, -7.2158873081207275e-06, -6.000511348247528e-06, -4.785135388374329e-06, -3.569759428501129e-06, -2.3543834686279297e-06, -1.1390075087547302e-06, 7.636845111846924e-08, 1.2917444109916687e-06, 2.507120370864868e-06, 3.7224963307380676e-06, 4.937872290611267e-06, 6.1532482504844666e-06, 7.368624210357666e-06, 8.584000170230865e-06, 9.799376130104065e-06, 1.1014752089977264e-05, 1.2230128049850464e-05, 1.3445504009723663e-05, 1.4660879969596863e-05, 1.5876255929470062e-05, 1.7091631889343262e-05, 1.830700784921646e-05, 1.952238380908966e-05, 2.073775976896286e-05, 2.195313572883606e-05, 2.316851168870926e-05, 2.438388764858246e-05, 2.5599263608455658e-05, 2.6814639568328857e-05, 2.8030015528202057e-05, 2.9245391488075256e-05, 3.0460767447948456e-05, 3.1676143407821655e-05, 3.2891519367694855e-05, 3.4106895327568054e-05, 3.5322271287441254e-05, 3.653764724731445e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 6.0, 3.0, 9.0, 6.0, 11.0, 21.0, 24.0, 26.0, 47.0, 72.0, 128.0, 331.0, 905.0, 3787.0, 29590.0, 734432.0, 261354.0, 14275.0, 2317.0, 648.0, 267.0, 109.0, 46.0, 40.0, 32.0, 13.0, 11.0, 5.0, 7.0, 8.0, 7.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.356201171875, -0.3462638854980469, -0.33632659912109375, -0.3263893127441406, -0.3164520263671875, -0.3065147399902344, -0.29657745361328125, -0.2866401672363281, -0.276702880859375, -0.2667655944824219, -0.25682830810546875, -0.24689102172851562, -0.2369537353515625, -0.22701644897460938, -0.21707916259765625, -0.20714187622070312, -0.19720458984375, -0.18726730346679688, -0.17733001708984375, -0.16739273071289062, -0.1574554443359375, -0.14751815795898438, -0.13758087158203125, -0.12764358520507812, -0.117706298828125, -0.10776901245117188, -0.09783172607421875, -0.08789443969726562, -0.0779571533203125, -0.06801986694335938, -0.05808258056640625, -0.048145294189453125, -0.0382080078125, -0.028270721435546875, -0.01833343505859375, -0.008396148681640625, 0.0015411376953125, 0.011478424072265625, 0.02141571044921875, 0.031352996826171875, 0.041290283203125, 0.051227569580078125, 0.06116485595703125, 0.07110214233398438, 0.0810394287109375, 0.09097671508789062, 0.10091400146484375, 0.11085128784179688, 0.12078857421875, 0.13072586059570312, 0.14066314697265625, 0.15060043334960938, 0.1605377197265625, 0.17047500610351562, 0.18041229248046875, 0.19034957885742188, 0.200286865234375, 0.21022415161132812, 0.22016143798828125, 0.23009872436523438, 0.2400360107421875, 0.24997329711914062, 0.25991058349609375, 0.2698478698730469, 0.27978515625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 0.0, 2.0, 0.0, 3.0, 9.0, 1.0, 5.0, 7.0, 10.0, 15.0, 20.0, 28.0, 30.0, 39.0, 57.0, 60.0, 69.0, 87.0, 89.0, 82.0, 85.0, 63.0, 54.0, 25.0, 30.0, 30.0, 14.0, 19.0, 24.0, 11.0, 6.0, 6.0, 3.0, 5.0, 2.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0826416015625, -0.0796346664428711, -0.07662773132324219, -0.07362079620361328, -0.07061386108398438, -0.06760692596435547, -0.06459999084472656, -0.061593055725097656, -0.05858612060546875, -0.055579185485839844, -0.05257225036621094, -0.04956531524658203, -0.046558380126953125, -0.04355144500732422, -0.04054450988769531, -0.037537574768066406, -0.0345306396484375, -0.031523704528808594, -0.028516769409179688, -0.02550983428955078, -0.022502899169921875, -0.01949596405029297, -0.016489028930664062, -0.013482093811035156, -0.01047515869140625, -0.007468223571777344, -0.0044612884521484375, -0.0014543533325195312, 0.001552581787109375, 0.004559516906738281, 0.0075664520263671875, 0.010573387145996094, 0.013580322265625, 0.016587257385253906, 0.019594192504882812, 0.02260112762451172, 0.025608062744140625, 0.02861499786376953, 0.03162193298339844, 0.034628868103027344, 0.03763580322265625, 0.040642738342285156, 0.04364967346191406, 0.04665660858154297, 0.049663543701171875, 0.05267047882080078, 0.05567741394042969, 0.058684349060058594, 0.0616912841796875, 0.0646982192993164, 0.06770515441894531, 0.07071208953857422, 0.07371902465820312, 0.07672595977783203, 0.07973289489746094, 0.08273983001708984, 0.08574676513671875, 0.08875370025634766, 0.09176063537597656, 0.09476757049560547, 0.09777450561523438, 0.10078144073486328, 0.10378837585449219, 0.1067953109741211, 0.10980224609375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 7.0, 15.0, 45.0, 109.0, 335.0, 301.0, 135.0, 41.0, 10.0, 8.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.869244575500488, -5.749422550201416, -5.629600524902344, -5.50977897644043, -5.389956951141357, -5.270134925842285, -5.150312900543213, -5.030490875244141, -4.910669326782227, -4.790847301483154, -4.671025276184082, -4.551203727722168, -4.431381702423096, -4.311559677124023, -4.191737651824951, -4.071915626525879, -3.9520936012268066, -3.8322715759277344, -3.712449789047241, -3.592627763748169, -3.472805976867676, -3.3529839515686035, -3.2331619262695312, -3.113340139389038, -2.993518352508545, -2.8736963272094727, -2.7538745403289795, -2.6340525150299072, -2.514230728149414, -2.394408702850342, -2.2745866775512695, -2.1547648906707764, -2.034943103790283, -1.9151211977005005, -1.7952992916107178, -1.6754772663116455, -1.5556553602218628, -1.43583345413208, -1.3160115480422974, -1.1961896419525146, -1.0763676166534424, -0.9565457105636597, -0.8367237448692322, -0.7169018387794495, -0.597079873085022, -0.47725796699523926, -0.35743606090545654, -0.23761409521102905, -0.11779212951660156, 0.002029798924922943, 0.12185172736644745, 0.24167364835739136, 0.36149558424949646, 0.48131752014160156, 0.6011394262313843, 0.7209613919258118, 0.8407832980155945, 0.9606052041053772, 1.0804271697998047, 1.2002490758895874, 1.3200709819793701, 1.4398930072784424, 1.5597147941589355, 1.6795368194580078, 1.7993587255477905]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 1.0, 8.0, 11.0, 14.0, 11.0, 13.0, 12.0, 23.0, 24.0, 14.0, 23.0, 24.0, 25.0, 33.0, 28.0, 31.0, 51.0, 39.0, 46.0, 45.0, 31.0, 50.0, 40.0, 36.0, 54.0, 30.0, 35.0, 27.0, 23.0, 21.0, 25.0, 24.0, 16.0, 20.0, 16.0, 11.0, 17.0, 12.0, 5.0, 6.0, 4.0, 11.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.836789071559906, -0.8119509220123291, -0.7871127128601074, -0.7622745037078857, -0.7374363541603088, -0.7125982046127319, -0.6877599954605103, -0.6629217863082886, -0.6380836367607117, -0.6132454872131348, -0.5884072780609131, -0.5635690689086914, -0.5387309193611145, -0.5138927698135376, -0.4890545606613159, -0.4642163813114166, -0.43937820196151733, -0.41454002261161804, -0.38970184326171875, -0.36486366391181946, -0.34002548456192017, -0.3151873052120209, -0.2903491258621216, -0.2655109465122223, -0.240672767162323, -0.2158345878124237, -0.19099640846252441, -0.16615822911262512, -0.14132004976272583, -0.11648187041282654, -0.09164369106292725, -0.06680551171302795, -0.04196739196777344, -0.017129212617874146, 0.0077089667320251465, 0.03254714608192444, 0.05738532543182373, 0.08222350478172302, 0.10706168413162231, 0.1318998634815216, 0.1567380428314209, 0.1815762221813202, 0.20641440153121948, 0.23125258088111877, 0.25609076023101807, 0.28092893958091736, 0.30576711893081665, 0.33060529828071594, 0.35544347763061523, 0.3802816569805145, 0.4051198363304138, 0.4299580156803131, 0.4547961950302124, 0.4796343743801117, 0.504472553730011, 0.5293107032775879, 0.5541489124298096, 0.5789871215820312, 0.6038252711296082, 0.6286634206771851, 0.6535016298294067, 0.6783398389816284, 0.7031779885292053, 0.7280161380767822, 0.7528543472290039]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 0.0, 1.0, 7.0, 8.0, 16.0, 17.0, 29.0, 62.0, 108.0, 189.0, 314.0, 648.0, 1472.0, 3541.0, 8383.0, 26899.0, 239040.0, 3455236.0, 404299.0, 36918.0, 10591.0, 3699.0, 1502.0, 662.0, 300.0, 156.0, 72.0, 40.0, 24.0, 12.0, 12.0, 5.0, 4.0, 3.0, 5.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.26953125, -0.25939178466796875, -0.2492523193359375, -0.23911285400390625, -0.228973388671875, -0.21883392333984375, -0.2086944580078125, -0.19855499267578125, -0.18841552734375, -0.17827606201171875, -0.1681365966796875, -0.15799713134765625, -0.147857666015625, -0.13771820068359375, -0.1275787353515625, -0.11743927001953125, -0.1072998046875, -0.09716033935546875, -0.0870208740234375, -0.07688140869140625, -0.066741943359375, -0.05660247802734375, -0.0464630126953125, -0.03632354736328125, -0.02618408203125, -0.01604461669921875, -0.0059051513671875, 0.00423431396484375, 0.014373779296875, 0.02451324462890625, 0.0346527099609375, 0.04479217529296875, 0.054931640625, 0.06507110595703125, 0.0752105712890625, 0.08535003662109375, 0.095489501953125, 0.10562896728515625, 0.1157684326171875, 0.12590789794921875, 0.13604736328125, 0.14618682861328125, 0.1563262939453125, 0.16646575927734375, 0.176605224609375, 0.18674468994140625, 0.1968841552734375, 0.20702362060546875, 0.2171630859375, 0.22730255126953125, 0.2374420166015625, 0.24758148193359375, 0.257720947265625, 0.26786041259765625, 0.2779998779296875, 0.28813934326171875, 0.29827880859375, 0.30841827392578125, 0.3185577392578125, 0.32869720458984375, 0.338836669921875, 0.34897613525390625, 0.3591156005859375, 0.36925506591796875, 0.37939453125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 11.0, 12.0, 27.0, 39.0, 29.0, 46.0, 58.0, 57.0, 74.0, 75.0, 78.0, 83.0, 65.0, 55.0, 74.0, 53.0, 44.0, 35.0, 23.0, 21.0, 13.0, 10.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1849365234375, -0.17911911010742188, -0.17330169677734375, -0.16748428344726562, -0.1616668701171875, -0.15584945678710938, -0.15003204345703125, -0.14421463012695312, -0.138397216796875, -0.13257980346679688, -0.12676239013671875, -0.12094497680664062, -0.1151275634765625, -0.10931015014648438, -0.10349273681640625, -0.09767532348632812, -0.09185791015625, -0.08604049682617188, -0.08022308349609375, -0.07440567016601562, -0.0685882568359375, -0.06277084350585938, -0.05695343017578125, -0.051136016845703125, -0.045318603515625, -0.039501190185546875, -0.03368377685546875, -0.027866363525390625, -0.0220489501953125, -0.016231536865234375, -0.01041412353515625, -0.004596710205078125, 0.001220703125, 0.007038116455078125, 0.01285552978515625, 0.018672943115234375, 0.0244903564453125, 0.030307769775390625, 0.03612518310546875, 0.041942596435546875, 0.047760009765625, 0.053577423095703125, 0.05939483642578125, 0.06521224975585938, 0.0710296630859375, 0.07684707641601562, 0.08266448974609375, 0.08848190307617188, 0.09429931640625, 0.10011672973632812, 0.10593414306640625, 0.11175155639648438, 0.1175689697265625, 0.12338638305664062, 0.12920379638671875, 0.13502120971679688, 0.140838623046875, 0.14665603637695312, 0.15247344970703125, 0.15829086303710938, 0.1641082763671875, 0.16992568969726562, 0.17574310302734375, 0.18156051635742188, 0.1873779296875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 3.0, 2.0, 11.0, 10.0, 11.0, 16.0, 22.0, 29.0, 29.0, 41.0, 43.0, 63.0, 99.0, 138.0, 185.0, 342.0, 525.0, 835.0, 1714.0, 3592.0, 9889.0, 43830.0, 1134220.0, 2921103.0, 57254.0, 11662.0, 4068.0, 1888.0, 965.0, 571.0, 352.0, 209.0, 139.0, 108.0, 76.0, 41.0, 47.0, 26.0, 30.0, 21.0, 15.0, 14.0, 8.0, 9.0, 4.0, 5.0, 4.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.537109375, -0.5208663940429688, -0.5046234130859375, -0.48838043212890625, -0.472137451171875, -0.45589447021484375, -0.4396514892578125, -0.42340850830078125, -0.40716552734375, -0.39092254638671875, -0.3746795654296875, -0.35843658447265625, -0.342193603515625, -0.32595062255859375, -0.3097076416015625, -0.29346466064453125, -0.2772216796875, -0.26097869873046875, -0.2447357177734375, -0.22849273681640625, -0.212249755859375, -0.19600677490234375, -0.1797637939453125, -0.16352081298828125, -0.14727783203125, -0.13103485107421875, -0.1147918701171875, -0.09854888916015625, -0.082305908203125, -0.06606292724609375, -0.0498199462890625, -0.03357696533203125, -0.017333984375, -0.00109100341796875, 0.0151519775390625, 0.03139495849609375, 0.047637939453125, 0.06388092041015625, 0.0801239013671875, 0.09636688232421875, 0.11260986328125, 0.12885284423828125, 0.1450958251953125, 0.16133880615234375, 0.177581787109375, 0.19382476806640625, 0.2100677490234375, 0.22631072998046875, 0.2425537109375, 0.25879669189453125, 0.2750396728515625, 0.29128265380859375, 0.307525634765625, 0.32376861572265625, 0.3400115966796875, 0.35625457763671875, 0.37249755859375, 0.38874053955078125, 0.4049835205078125, 0.42122650146484375, 0.437469482421875, 0.45371246337890625, 0.4699554443359375, 0.48619842529296875, 0.50244140625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 2.0, 7.0, 11.0, 23.0, 53.0, 158.0, 822.0, 2381.0, 397.0, 117.0, 48.0, 20.0, 7.0, 10.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6552734375, -0.635009765625, -0.61474609375, -0.594482421875, -0.57421875, -0.553955078125, -0.53369140625, -0.513427734375, -0.4931640625, -0.472900390625, -0.45263671875, -0.432373046875, -0.412109375, -0.391845703125, -0.37158203125, -0.351318359375, -0.3310546875, -0.310791015625, -0.29052734375, -0.270263671875, -0.25, -0.229736328125, -0.20947265625, -0.189208984375, -0.1689453125, -0.148681640625, -0.12841796875, -0.108154296875, -0.087890625, -0.067626953125, -0.04736328125, -0.027099609375, -0.0068359375, 0.013427734375, 0.03369140625, 0.053955078125, 0.07421875, 0.094482421875, 0.11474609375, 0.135009765625, 0.1552734375, 0.175537109375, 0.19580078125, 0.216064453125, 0.236328125, 0.256591796875, 0.27685546875, 0.297119140625, 0.3173828125, 0.337646484375, 0.35791015625, 0.378173828125, 0.3984375, 0.418701171875, 0.43896484375, 0.459228515625, 0.4794921875, 0.499755859375, 0.52001953125, 0.540283203125, 0.560546875, 0.580810546875, 0.60107421875, 0.621337890625, 0.6416015625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 5.0, 10.0, 15.0, 36.0, 96.0, 215.0, 279.0, 172.0, 92.0, 39.0, 22.0, 16.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.5497100353240967, -2.47336483001709, -2.397019386291504, -2.320674180984497, -2.2443289756774902, -2.1679837703704834, -2.0916385650634766, -2.0152931213378906, -1.9389479160308838, -1.862602710723877, -1.7862573862075806, -1.7099120616912842, -1.6335668563842773, -1.5572216510772705, -1.4808763265609741, -1.4045310020446777, -1.328185796737671, -1.251840591430664, -1.1754952669143677, -1.0991499423980713, -1.0228047370910645, -0.9464594721794128, -0.8701142072677612, -0.7937689423561096, -0.717423677444458, -0.6410784125328064, -0.5647331476211548, -0.4883878827095032, -0.41204261779785156, -0.33569735288619995, -0.25935208797454834, -0.18300682306289673, -0.10666179656982422, -0.030316531658172607, 0.046028733253479004, 0.12237399816513062, 0.19871926307678223, 0.27506452798843384, 0.35140979290008545, 0.42775505781173706, 0.5041003227233887, 0.5804455876350403, 0.6567908525466919, 0.7331361174583435, 0.8094813823699951, 0.8858266472816467, 0.9621719121932983, 1.0385172367095947, 1.1148624420166016, 1.1912076473236084, 1.2675529718399048, 1.3438982963562012, 1.420243501663208, 1.4965887069702148, 1.5729340314865112, 1.6492793560028076, 1.7256245613098145, 1.8019697666168213, 1.8783150911331177, 1.954660415649414, 2.031005620956421, 2.1073508262634277, 2.1836962699890137, 2.2600414752960205, 2.3363866806030273]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 9.0, 8.0, 10.0, 6.0, 10.0, 16.0, 21.0, 27.0, 37.0, 31.0, 41.0, 43.0, 47.0, 43.0, 32.0, 49.0, 48.0, 46.0, 51.0, 38.0, 47.0, 37.0, 42.0, 46.0, 34.0, 33.0, 33.0, 21.0, 26.0, 11.0, 18.0, 16.0, 13.0, 7.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6365352869033813, -0.6102188229560852, -0.5839023590087891, -0.5575858950614929, -0.5312694311141968, -0.5049529671669006, -0.4786365032196045, -0.45232003927230835, -0.4260035753250122, -0.39968711137771606, -0.3733706474304199, -0.3470541834831238, -0.32073771953582764, -0.2944212555885315, -0.26810479164123535, -0.24178831279277802, -0.21547183394432068, -0.18915536999702454, -0.1628389060497284, -0.13652244210243225, -0.11020597070455551, -0.08388949930667877, -0.05757303535938263, -0.03125657141208649, -0.004940107464790344, 0.021376358345150948, 0.04769282415509224, 0.07400929182767868, 0.10032575577497482, 0.12664222717285156, 0.1529586911201477, 0.17927515506744385, 0.20559161901474, 0.23190808296203613, 0.2582245469093323, 0.2845410108566284, 0.31085747480392456, 0.3371739387512207, 0.36349040269851685, 0.389806866645813, 0.41612333059310913, 0.4424397945404053, 0.4687562584877014, 0.49507272243499756, 0.5213891863822937, 0.5477056503295898, 0.574022114276886, 0.6003385782241821, 0.626655101776123, 0.6529715657234192, 0.6792880296707153, 0.7056044936180115, 0.7319209575653076, 0.7582374215126038, 0.7845538854598999, 0.810870349407196, 0.8371868133544922, 0.8635032773017883, 0.8898197412490845, 0.9161362051963806, 0.9424526691436768, 0.9687691330909729, 0.995085597038269, 1.02140212059021, 1.0477185249328613]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 8.0, 8.0, 6.0, 17.0, 29.0, 40.0, 55.0, 93.0, 157.0, 366.0, 784.0, 2028.0, 5478.0, 17450.0, 65590.0, 357150.0, 480804.0, 85527.0, 21921.0, 6856.0, 2346.0, 967.0, 386.0, 169.0, 112.0, 67.0, 50.0, 18.0, 15.0, 18.0, 10.0, 7.0, 5.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52587890625, -0.5099868774414062, -0.4940948486328125, -0.47820281982421875, -0.462310791015625, -0.44641876220703125, -0.4305267333984375, -0.41463470458984375, -0.39874267578125, -0.38285064697265625, -0.3669586181640625, -0.35106658935546875, -0.335174560546875, -0.31928253173828125, -0.3033905029296875, -0.28749847412109375, -0.2716064453125, -0.25571441650390625, -0.2398223876953125, -0.22393035888671875, -0.208038330078125, -0.19214630126953125, -0.1762542724609375, -0.16036224365234375, -0.14447021484375, -0.12857818603515625, -0.1126861572265625, -0.09679412841796875, -0.080902099609375, -0.06501007080078125, -0.0491180419921875, -0.03322601318359375, -0.017333984375, -0.00144195556640625, 0.0144500732421875, 0.03034210205078125, 0.046234130859375, 0.06212615966796875, 0.0780181884765625, 0.09391021728515625, 0.10980224609375, 0.12569427490234375, 0.1415863037109375, 0.15747833251953125, 0.173370361328125, 0.18926239013671875, 0.2051544189453125, 0.22104644775390625, 0.2369384765625, 0.25283050537109375, 0.2687225341796875, 0.28461456298828125, 0.300506591796875, 0.31639862060546875, 0.3322906494140625, 0.34818267822265625, 0.36407470703125, 0.37996673583984375, 0.3958587646484375, 0.41175079345703125, 0.427642822265625, 0.44353485107421875, 0.4594268798828125, 0.47531890869140625, 0.4912109375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 5.0, 12.0, 14.0, 27.0, 30.0, 35.0, 43.0, 70.0, 62.0, 78.0, 71.0, 69.0, 87.0, 70.0, 63.0, 59.0, 61.0, 40.0, 36.0, 23.0, 20.0, 9.0, 7.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.182861328125, -0.1766834259033203, -0.17050552368164062, -0.16432762145996094, -0.15814971923828125, -0.15197181701660156, -0.14579391479492188, -0.1396160125732422, -0.1334381103515625, -0.1272602081298828, -0.12108230590820312, -0.11490440368652344, -0.10872650146484375, -0.10254859924316406, -0.09637069702148438, -0.09019279479980469, -0.084014892578125, -0.07783699035644531, -0.07165908813476562, -0.06548118591308594, -0.05930328369140625, -0.05312538146972656, -0.046947479248046875, -0.04076957702636719, -0.0345916748046875, -0.028413772583007812, -0.022235870361328125, -0.016057968139648438, -0.00988006591796875, -0.0037021636962890625, 0.002475738525390625, 0.008653640747070312, 0.01483154296875, 0.021009445190429688, 0.027187347412109375, 0.03336524963378906, 0.03954315185546875, 0.04572105407714844, 0.051898956298828125, 0.05807685852050781, 0.0642547607421875, 0.07043266296386719, 0.07661056518554688, 0.08278846740722656, 0.08896636962890625, 0.09514427185058594, 0.10132217407226562, 0.10750007629394531, 0.113677978515625, 0.11985588073730469, 0.12603378295898438, 0.13221168518066406, 0.13838958740234375, 0.14456748962402344, 0.15074539184570312, 0.1569232940673828, 0.1631011962890625, 0.1692790985107422, 0.17545700073242188, 0.18163490295410156, 0.18781280517578125, 0.19399070739746094, 0.20016860961914062, 0.2063465118408203, 0.2125244140625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 6.0, 7.0, 7.0, 13.0, 16.0, 30.0, 39.0, 104.0, 261.0, 628.0, 1834.0, 5785.0, 20213.0, 81421.0, 441058.0, 396713.0, 73839.0, 18477.0, 5276.0, 1727.0, 601.0, 253.0, 103.0, 52.0, 34.0, 19.0, 6.0, 7.0, 7.0, 6.0, 4.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5537109375, -0.5395011901855469, -0.5252914428710938, -0.5110816955566406, -0.4968719482421875, -0.4826622009277344, -0.46845245361328125, -0.4542427062988281, -0.440032958984375, -0.4258232116699219, -0.41161346435546875, -0.3974037170410156, -0.3831939697265625, -0.3689842224121094, -0.35477447509765625, -0.3405647277832031, -0.32635498046875, -0.3121452331542969, -0.29793548583984375, -0.2837257385253906, -0.2695159912109375, -0.2553062438964844, -0.24109649658203125, -0.22688674926757812, -0.212677001953125, -0.19846725463867188, -0.18425750732421875, -0.17004776000976562, -0.1558380126953125, -0.14162826538085938, -0.12741851806640625, -0.11320877075195312, -0.0989990234375, -0.08478927612304688, -0.07057952880859375, -0.056369781494140625, -0.0421600341796875, -0.027950286865234375, -0.01374053955078125, 0.000469207763671875, 0.014678955078125, 0.028888702392578125, 0.04309844970703125, 0.057308197021484375, 0.0715179443359375, 0.08572769165039062, 0.09993743896484375, 0.11414718627929688, 0.12835693359375, 0.14256668090820312, 0.15677642822265625, 0.17098617553710938, 0.1851959228515625, 0.19940567016601562, 0.21361541748046875, 0.22782516479492188, 0.242034912109375, 0.2562446594238281, 0.27045440673828125, 0.2846641540527344, 0.2988739013671875, 0.3130836486816406, 0.32729339599609375, 0.3415031433105469, 0.355712890625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 2.0, 4.0, 6.0, 6.0, 9.0, 11.0, 17.0, 19.0, 18.0, 17.0, 24.0, 32.0, 38.0, 32.0, 46.0, 49.0, 40.0, 34.0, 51.0, 47.0, 53.0, 40.0, 42.0, 46.0, 51.0, 42.0, 27.0, 38.0, 22.0, 23.0, 22.0, 22.0, 12.0, 9.0, 12.0, 13.0, 6.0, 2.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.25244140625, -0.24321365356445312, -0.23398590087890625, -0.22475814819335938, -0.2155303955078125, -0.20630264282226562, -0.19707489013671875, -0.18784713745117188, -0.178619384765625, -0.16939163208007812, -0.16016387939453125, -0.15093612670898438, -0.1417083740234375, -0.13248062133789062, -0.12325286865234375, -0.11402511596679688, -0.10479736328125, -0.09556961059570312, -0.08634185791015625, -0.07711410522460938, -0.0678863525390625, -0.058658599853515625, -0.04943084716796875, -0.040203094482421875, -0.030975341796875, -0.021747589111328125, -0.01251983642578125, -0.003292083740234375, 0.0059356689453125, 0.015163421630859375, 0.02439117431640625, 0.033618927001953125, 0.0428466796875, 0.052074432373046875, 0.06130218505859375, 0.07052993774414062, 0.0797576904296875, 0.08898544311523438, 0.09821319580078125, 0.10744094848632812, 0.116668701171875, 0.12589645385742188, 0.13512420654296875, 0.14435195922851562, 0.1535797119140625, 0.16280746459960938, 0.17203521728515625, 0.18126296997070312, 0.19049072265625, 0.19971847534179688, 0.20894622802734375, 0.21817398071289062, 0.2274017333984375, 0.23662948608398438, 0.24585723876953125, 0.2550849914550781, 0.264312744140625, 0.2735404968261719, 0.28276824951171875, 0.2919960021972656, 0.3012237548828125, 0.3104515075683594, 0.31967926025390625, 0.3289070129394531, 0.338134765625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 7.0, 13.0, 15.0, 18.0, 38.0, 67.0, 101.0, 162.0, 273.0, 372.0, 615.0, 1165.0, 2156.0, 3987.0, 8669.0, 21010.0, 68897.0, 493327.0, 357989.0, 55921.0, 18011.0, 7590.0, 3641.0, 1888.0, 1088.0, 552.0, 371.0, 198.0, 141.0, 103.0, 70.0, 32.0, 19.0, 14.0, 14.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.157958984375, -0.15285110473632812, -0.14774322509765625, -0.14263534545898438, -0.1375274658203125, -0.13241958618164062, -0.12731170654296875, -0.12220382690429688, -0.117095947265625, -0.11198806762695312, -0.10688018798828125, -0.10177230834960938, -0.0966644287109375, -0.09155654907226562, -0.08644866943359375, -0.08134078979492188, -0.07623291015625, -0.07112503051757812, -0.06601715087890625, -0.060909271240234375, -0.0558013916015625, -0.050693511962890625, -0.04558563232421875, -0.040477752685546875, -0.035369873046875, -0.030261993408203125, -0.02515411376953125, -0.020046234130859375, -0.0149383544921875, -0.009830474853515625, -0.00472259521484375, 0.000385284423828125, 0.0054931640625, 0.010601043701171875, 0.01570892333984375, 0.020816802978515625, 0.0259246826171875, 0.031032562255859375, 0.03614044189453125, 0.041248321533203125, 0.046356201171875, 0.051464080810546875, 0.05657196044921875, 0.061679840087890625, 0.0667877197265625, 0.07189559936523438, 0.07700347900390625, 0.08211135864257812, 0.08721923828125, 0.09232711791992188, 0.09743499755859375, 0.10254287719726562, 0.1076507568359375, 0.11275863647460938, 0.11786651611328125, 0.12297439575195312, 0.128082275390625, 0.13319015502929688, 0.13829803466796875, 0.14340591430664062, 0.1485137939453125, 0.15362167358398438, 0.15872955322265625, 0.16383743286132812, 0.1689453125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 1.0, 3.0, 4.0, 12.0, 12.0, 11.0, 20.0, 28.0, 53.0, 62.0, 114.0, 162.0, 174.0, 113.0, 66.0, 36.0, 30.0, 22.0, 16.0, 9.0, 9.0, 7.0, 6.0, 7.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.777576446533203e-05, -2.6850029826164246e-05, -2.592429518699646e-05, -2.4998560547828674e-05, -2.407282590866089e-05, -2.3147091269493103e-05, -2.2221356630325317e-05, -2.1295621991157532e-05, -2.0369887351989746e-05, -1.944415271282196e-05, -1.8518418073654175e-05, -1.759268343448639e-05, -1.6666948795318604e-05, -1.5741214156150818e-05, -1.4815479516983032e-05, -1.3889744877815247e-05, -1.2964010238647461e-05, -1.2038275599479675e-05, -1.111254096031189e-05, -1.0186806321144104e-05, -9.261071681976318e-06, -8.335337042808533e-06, -7.409602403640747e-06, -6.4838677644729614e-06, -5.558133125305176e-06, -4.63239848613739e-06, -3.7066638469696045e-06, -2.780929207801819e-06, -1.8551945686340332e-06, -9.294599294662476e-07, -3.725290298461914e-09, 9.220093488693237e-07, 1.8477439880371094e-06, 2.773478627204895e-06, 3.6992132663726807e-06, 4.624947905540466e-06, 5.550682544708252e-06, 6.476417183876038e-06, 7.402151823043823e-06, 8.327886462211609e-06, 9.253621101379395e-06, 1.017935574054718e-05, 1.1105090379714966e-05, 1.2030825018882751e-05, 1.2956559658050537e-05, 1.3882294297218323e-05, 1.4808028936386108e-05, 1.5733763575553894e-05, 1.665949821472168e-05, 1.7585232853889465e-05, 1.851096749305725e-05, 1.9436702132225037e-05, 2.0362436771392822e-05, 2.1288171410560608e-05, 2.2213906049728394e-05, 2.313964068889618e-05, 2.4065375328063965e-05, 2.499110996723175e-05, 2.5916844606399536e-05, 2.6842579245567322e-05, 2.7768313884735107e-05, 2.8694048523902893e-05, 2.961978316307068e-05, 3.0545517802238464e-05, 3.147125244140625e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 4.0, 0.0, 4.0, 2.0, 8.0, 3.0, 9.0, 14.0, 11.0, 22.0, 30.0, 48.0, 119.0, 306.0, 792.0, 2309.0, 7668.0, 46644.0, 893189.0, 82262.0, 10621.0, 2803.0, 1007.0, 351.0, 142.0, 66.0, 36.0, 23.0, 9.0, 15.0, 7.0, 8.0, 3.0, 2.0, 5.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38671875, -0.3740806579589844, -0.36144256591796875, -0.3488044738769531, -0.3361663818359375, -0.3235282897949219, -0.31089019775390625, -0.2982521057128906, -0.285614013671875, -0.2729759216308594, -0.26033782958984375, -0.24769973754882812, -0.2350616455078125, -0.22242355346679688, -0.20978546142578125, -0.19714736938476562, -0.18450927734375, -0.17187118530273438, -0.15923309326171875, -0.14659500122070312, -0.1339569091796875, -0.12131881713867188, -0.10868072509765625, -0.09604263305664062, -0.083404541015625, -0.07076644897460938, -0.05812835693359375, -0.045490264892578125, -0.0328521728515625, -0.020214080810546875, -0.00757598876953125, 0.005062103271484375, 0.0177001953125, 0.030338287353515625, 0.04297637939453125, 0.055614471435546875, 0.0682525634765625, 0.08089065551757812, 0.09352874755859375, 0.10616683959960938, 0.118804931640625, 0.13144302368164062, 0.14408111572265625, 0.15671920776367188, 0.1693572998046875, 0.18199539184570312, 0.19463348388671875, 0.20727157592773438, 0.21990966796875, 0.23254776000976562, 0.24518585205078125, 0.2578239440917969, 0.2704620361328125, 0.2831001281738281, 0.29573822021484375, 0.3083763122558594, 0.321014404296875, 0.3336524963378906, 0.34629058837890625, 0.3589286804199219, 0.3715667724609375, 0.3842048645019531, 0.39684295654296875, 0.4094810485839844, 0.422119140625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 6.0, 8.0, 4.0, 10.0, 4.0, 13.0, 17.0, 22.0, 28.0, 63.0, 80.0, 128.0, 177.0, 175.0, 84.0, 56.0, 38.0, 17.0, 11.0, 8.0, 9.0, 8.0, 10.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.177734375, -0.17260360717773438, -0.16747283935546875, -0.16234207153320312, -0.1572113037109375, -0.15208053588867188, -0.14694976806640625, -0.14181900024414062, -0.136688232421875, -0.13155746459960938, -0.12642669677734375, -0.12129592895507812, -0.1161651611328125, -0.11103439331054688, -0.10590362548828125, -0.10077285766601562, -0.09564208984375, -0.09051132202148438, -0.08538055419921875, -0.08024978637695312, -0.0751190185546875, -0.06998825073242188, -0.06485748291015625, -0.059726715087890625, -0.054595947265625, -0.049465179443359375, -0.04433441162109375, -0.039203643798828125, -0.0340728759765625, -0.028942108154296875, -0.02381134033203125, -0.018680572509765625, -0.0135498046875, -0.008419036865234375, -0.00328826904296875, 0.001842498779296875, 0.0069732666015625, 0.012104034423828125, 0.01723480224609375, 0.022365570068359375, 0.027496337890625, 0.032627105712890625, 0.03775787353515625, 0.042888641357421875, 0.0480194091796875, 0.053150177001953125, 0.05828094482421875, 0.06341171264648438, 0.06854248046875, 0.07367324829101562, 0.07880401611328125, 0.08393478393554688, 0.0890655517578125, 0.09419631958007812, 0.09932708740234375, 0.10445785522460938, 0.109588623046875, 0.11471939086914062, 0.11985015869140625, 0.12498092651367188, 0.1301116943359375, 0.13524246215820312, 0.14037322998046875, 0.14550399780273438, 0.150634765625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 14.0, 61.0, 174.0, 409.0, 245.0, 82.0, 18.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8761684894561768, -3.745697021484375, -3.6152255535125732, -3.4847540855407715, -3.3542826175689697, -3.223811149597168, -3.093339443206787, -2.9628682136535645, -2.8323965072631836, -2.701925039291382, -2.57145357131958, -2.4409821033477783, -2.3105106353759766, -2.180039167404175, -2.049567699432373, -1.9190961122512817, -1.7886247634887695, -1.6581532955169678, -1.527681827545166, -1.3972103595733643, -1.2667388916015625, -1.1362674236297607, -1.0057958364486694, -0.8753243684768677, -0.7448529005050659, -0.6143814325332642, -0.48390993475914, -0.35343843698501587, -0.2229669690132141, -0.09249550104141235, 0.03797602653503418, 0.16844749450683594, 0.2989187240600586, 0.42939019203186035, 0.5598616600036621, 0.6903331875801086, 0.8208046555519104, 0.9512761235237122, 1.0817476511001587, 1.2122191190719604, 1.3426905870437622, 1.473162055015564, 1.6036335229873657, 1.734105110168457, 1.8645765781402588, 1.9950480461120605, 2.1255195140838623, 2.255990982055664, 2.386462450027466, 2.5169339179992676, 2.6474053859710693, 2.777876853942871, 2.908348321914673, 3.0388197898864746, 3.1692914962768555, 3.299762725830078, 3.430234432220459, 3.5607059001922607, 3.6911773681640625, 3.8216488361358643, 3.952120304107666, 4.082592010498047, 4.2130632400512695, 4.34353494644165, 4.474006175994873]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 5.0, 6.0, 14.0, 9.0, 8.0, 15.0, 14.0, 26.0, 27.0, 25.0, 31.0, 36.0, 28.0, 45.0, 32.0, 51.0, 49.0, 41.0, 40.0, 42.0, 28.0, 34.0, 42.0, 47.0, 36.0, 28.0, 28.0, 27.0, 34.0, 21.0, 20.0, 22.0, 13.0, 21.0, 9.0, 7.0, 13.0, 4.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7876015901565552, -0.7645955085754395, -0.7415894269943237, -0.718583345413208, -0.6955773234367371, -0.6725712418556213, -0.6495651602745056, -0.6265590786933899, -0.6035529971122742, -0.5805469155311584, -0.5575408339500427, -0.5345348119735718, -0.511528730392456, -0.48852264881134033, -0.4655165672302246, -0.4425104856491089, -0.41950443387031555, -0.39649835228919983, -0.3734923005104065, -0.35048621892929077, -0.32748013734817505, -0.3044740557670593, -0.281468003988266, -0.25846192240715027, -0.23545585572719574, -0.2124497890472412, -0.1894437074661255, -0.16643764078617096, -0.14343157410621643, -0.12042549252510071, -0.09741942584514618, -0.07441334426403046, -0.05140727758407593, -0.02840120531618595, -0.005395133048295975, 0.017610937356948853, 0.04061701148748398, 0.0636230856180191, 0.08662915229797363, 0.10963523387908936, 0.13264130055904388, 0.1556473672389984, 0.17865344882011414, 0.20165951550006866, 0.2246655821800232, 0.24767166376113892, 0.27067774534225464, 0.29368382692337036, 0.3166898787021637, 0.3396959602832794, 0.36270201206207275, 0.3857080936431885, 0.4087141752243042, 0.4317202568054199, 0.45472630858421326, 0.477732390165329, 0.5007384419441223, 0.523744523525238, 0.5467506051063538, 0.5697566270828247, 0.5927627086639404, 0.6157687902450562, 0.6387748718261719, 0.6617809534072876, 0.6847870349884033]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 10.0, 8.0, 9.0, 6.0, 13.0, 22.0, 39.0, 43.0, 99.0, 126.0, 200.0, 339.0, 616.0, 1151.0, 2178.0, 5122.0, 13437.0, 50319.0, 927270.0, 3030288.0, 126735.0, 22963.0, 7458.0, 2945.0, 1399.0, 638.0, 371.0, 192.0, 124.0, 63.0, 53.0, 13.0, 11.0, 9.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.400390625, -0.3893241882324219, -0.37825775146484375, -0.3671913146972656, -0.3561248779296875, -0.3450584411621094, -0.33399200439453125, -0.3229255676269531, -0.311859130859375, -0.3007926940917969, -0.28972625732421875, -0.2786598205566406, -0.2675933837890625, -0.2565269470214844, -0.24546051025390625, -0.23439407348632812, -0.22332763671875, -0.21226119995117188, -0.20119476318359375, -0.19012832641601562, -0.1790618896484375, -0.16799545288085938, -0.15692901611328125, -0.14586257934570312, -0.134796142578125, -0.12372970581054688, -0.11266326904296875, -0.10159683227539062, -0.0905303955078125, -0.07946395874023438, -0.06839752197265625, -0.057331085205078125, -0.0462646484375, -0.035198211669921875, -0.02413177490234375, -0.013065338134765625, -0.0019989013671875, 0.009067535400390625, 0.02013397216796875, 0.031200408935546875, 0.042266845703125, 0.053333282470703125, 0.06439971923828125, 0.07546615600585938, 0.0865325927734375, 0.09759902954101562, 0.10866546630859375, 0.11973190307617188, 0.13079833984375, 0.14186477661132812, 0.15293121337890625, 0.16399765014648438, 0.1750640869140625, 0.18613052368164062, 0.19719696044921875, 0.20826339721679688, 0.219329833984375, 0.23039627075195312, 0.24146270751953125, 0.2525291442871094, 0.2635955810546875, 0.2746620178222656, 0.28572845458984375, 0.2967948913574219, 0.307861328125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 3.0, 16.0, 7.0, 20.0, 21.0, 22.0, 30.0, 25.0, 44.0, 47.0, 46.0, 46.0, 72.0, 59.0, 66.0, 58.0, 72.0, 43.0, 44.0, 39.0, 38.0, 55.0, 28.0, 24.0, 25.0, 17.0, 9.0, 5.0, 6.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1805419921875, -0.1759786605834961, -0.1714153289794922, -0.16685199737548828, -0.16228866577148438, -0.15772533416748047, -0.15316200256347656, -0.14859867095947266, -0.14403533935546875, -0.13947200775146484, -0.13490867614746094, -0.13034534454345703, -0.12578201293945312, -0.12121868133544922, -0.11665534973144531, -0.1120920181274414, -0.1075286865234375, -0.1029653549194336, -0.09840202331542969, -0.09383869171142578, -0.08927536010742188, -0.08471202850341797, -0.08014869689941406, -0.07558536529541016, -0.07102203369140625, -0.06645870208740234, -0.06189537048339844, -0.05733203887939453, -0.052768707275390625, -0.04820537567138672, -0.04364204406738281, -0.039078712463378906, -0.034515380859375, -0.029952049255371094, -0.025388717651367188, -0.02082538604736328, -0.016262054443359375, -0.011698722839355469, -0.0071353912353515625, -0.0025720596313476562, 0.00199127197265625, 0.006554603576660156, 0.011117935180664062, 0.01568126678466797, 0.020244598388671875, 0.02480792999267578, 0.029371261596679688, 0.033934593200683594, 0.0384979248046875, 0.043061256408691406, 0.04762458801269531, 0.05218791961669922, 0.056751251220703125, 0.06131458282470703, 0.06587791442871094, 0.07044124603271484, 0.07500457763671875, 0.07956790924072266, 0.08413124084472656, 0.08869457244873047, 0.09325790405273438, 0.09782123565673828, 0.10238456726074219, 0.1069478988647461, 0.11151123046875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 2.0, 12.0, 12.0, 11.0, 20.0, 26.0, 30.0, 35.0, 53.0, 82.0, 113.0, 159.0, 215.0, 349.0, 504.0, 887.0, 1774.0, 3712.0, 10967.0, 50110.0, 1498248.0, 2548559.0, 57274.0, 12069.0, 4289.0, 1842.0, 1029.0, 579.0, 379.0, 264.0, 172.0, 137.0, 87.0, 69.0, 57.0, 39.0, 33.0, 22.0, 16.0, 11.0, 7.0, 8.0, 8.0, 3.0, 0.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.501953125, -0.48577880859375, -0.4696044921875, -0.45343017578125, -0.437255859375, -0.42108154296875, -0.4049072265625, -0.38873291015625, -0.37255859375, -0.35638427734375, -0.3402099609375, -0.32403564453125, -0.307861328125, -0.29168701171875, -0.2755126953125, -0.25933837890625, -0.2431640625, -0.22698974609375, -0.2108154296875, -0.19464111328125, -0.178466796875, -0.16229248046875, -0.1461181640625, -0.12994384765625, -0.11376953125, -0.09759521484375, -0.0814208984375, -0.06524658203125, -0.049072265625, -0.03289794921875, -0.0167236328125, -0.00054931640625, 0.015625, 0.03179931640625, 0.0479736328125, 0.06414794921875, 0.080322265625, 0.09649658203125, 0.1126708984375, 0.12884521484375, 0.14501953125, 0.16119384765625, 0.1773681640625, 0.19354248046875, 0.209716796875, 0.22589111328125, 0.2420654296875, 0.25823974609375, 0.2744140625, 0.29058837890625, 0.3067626953125, 0.32293701171875, 0.339111328125, 0.35528564453125, 0.3714599609375, 0.38763427734375, 0.40380859375, 0.41998291015625, 0.4361572265625, 0.45233154296875, 0.468505859375, 0.48468017578125, 0.5008544921875, 0.51702880859375, 0.533203125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 9.0, 7.0, 19.0, 31.0, 67.0, 151.0, 519.0, 2091.0, 759.0, 202.0, 91.0, 49.0, 25.0, 16.0, 6.0, 7.0, 3.0, 9.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.311767578125, -0.2966804504394531, -0.28159332275390625, -0.2665061950683594, -0.2514190673828125, -0.23633193969726562, -0.22124481201171875, -0.20615768432617188, -0.191070556640625, -0.17598342895507812, -0.16089630126953125, -0.14580917358398438, -0.1307220458984375, -0.11563491821289062, -0.10054779052734375, -0.08546066284179688, -0.07037353515625, -0.055286407470703125, -0.04019927978515625, -0.025112152099609375, -0.0100250244140625, 0.005062103271484375, 0.02014923095703125, 0.035236358642578125, 0.050323486328125, 0.06541061401367188, 0.08049774169921875, 0.09558486938476562, 0.1106719970703125, 0.12575912475585938, 0.14084625244140625, 0.15593338012695312, 0.1710205078125, 0.18610763549804688, 0.20119476318359375, 0.21628189086914062, 0.2313690185546875, 0.24645614624023438, 0.26154327392578125, 0.2766304016113281, 0.291717529296875, 0.3068046569824219, 0.32189178466796875, 0.3369789123535156, 0.3520660400390625, 0.3671531677246094, 0.38224029541015625, 0.3973274230957031, 0.41241455078125, 0.4275016784667969, 0.44258880615234375, 0.4576759338378906, 0.4727630615234375, 0.4878501892089844, 0.5029373168945312, 0.5180244445800781, 0.533111572265625, 0.5481986999511719, 0.5632858276367188, 0.5783729553222656, 0.5934600830078125, 0.6085472106933594, 0.6236343383789062, 0.6387214660644531, 0.65380859375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 12.0, 17.0, 42.0, 93.0, 176.0, 267.0, 170.0, 105.0, 46.0, 26.0, 19.0, 11.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2815996408462524, -1.2031147480010986, -1.1246298551559448, -1.046144962310791, -0.9676600694656372, -0.8891751766204834, -0.8106902241706848, -0.732205331325531, -0.6537204384803772, -0.5752355456352234, -0.4967506527900696, -0.4182657301425934, -0.3397808372974396, -0.26129594445228577, -0.18281102180480957, -0.10432612895965576, -0.025841236114501953, 0.05264366418123245, 0.13112856447696686, 0.20961347222328186, 0.28809836506843567, 0.3665832579135895, 0.4450681805610657, 0.5235530734062195, 0.6020379662513733, 0.6805228590965271, 0.7590077519416809, 0.8374927043914795, 0.9159775972366333, 0.9944624900817871, 1.072947382926941, 1.1514322757720947, 1.229917049407959, 1.3084019422531128, 1.3868868350982666, 1.4653717279434204, 1.5438566207885742, 1.622341513633728, 1.7008264064788818, 1.7793114185333252, 1.8577961921691895, 1.9362810850143433, 2.014765977859497, 2.0932509899139404, 2.1717357635498047, 2.250220775604248, 2.3287055492401123, 2.4071905612945557, 2.48567533493042, 2.5641603469848633, 2.6426451206207275, 2.721130132675171, 2.799614906311035, 2.8780999183654785, 2.9565846920013428, 3.035069704055786, 3.1135547161102295, 3.192039728164673, 3.270524501800537, 3.3490095138549805, 3.4274942874908447, 3.505979299545288, 3.5844640731811523, 3.6629490852355957, 3.74143385887146]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 7.0, 15.0, 10.0, 12.0, 24.0, 23.0, 25.0, 28.0, 36.0, 48.0, 47.0, 38.0, 55.0, 59.0, 64.0, 46.0, 44.0, 56.0, 47.0, 30.0, 45.0, 40.0, 30.0, 38.0, 31.0, 25.0, 19.0, 17.0, 13.0, 5.0, 5.0, 5.0, 2.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7702376842498779, -0.7382128834724426, -0.7061881422996521, -0.6741633415222168, -0.6421386003494263, -0.610113799571991, -0.5780889987945557, -0.5460642576217651, -0.5140394568443298, -0.4820146858692169, -0.449989914894104, -0.4179651141166687, -0.3859403431415558, -0.35391557216644287, -0.32189077138900757, -0.28986600041389465, -0.25784122943878174, -0.22581645846366882, -0.19379167258739471, -0.1617668867111206, -0.1297421157360077, -0.09771734476089478, -0.06569255888462067, -0.03366777300834656, -0.0016430020332336426, 0.03038177639245987, 0.06240655481815338, 0.0944313332438469, 0.1264561116695404, 0.15848088264465332, 0.19050566852092743, 0.22253045439720154, 0.254555344581604, 0.2865801155567169, 0.31860488653182983, 0.35062968730926514, 0.38265445828437805, 0.41467922925949097, 0.44670403003692627, 0.4787288010120392, 0.5107535719871521, 0.5427783727645874, 0.5748031139373779, 0.6068279147148132, 0.6388527154922485, 0.6708774566650391, 0.7029022574424744, 0.7349270582199097, 0.7669517993927002, 0.7989766001701355, 0.831001341342926, 0.8630261421203613, 0.8950508832931519, 0.9270756840705872, 0.9591004848480225, 0.991125226020813, 1.0231499671936035, 1.055174708366394, 1.0871995687484741, 1.1192243099212646, 1.1512490510940552, 1.1832737922668457, 1.2152986526489258, 1.2473233938217163, 1.2793482542037964]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 3.0, 6.0, 7.0, 14.0, 22.0, 35.0, 53.0, 66.0, 135.0, 214.0, 363.0, 846.0, 2078.0, 6092.0, 19727.0, 77012.0, 487296.0, 367244.0, 62166.0, 16578.0, 5175.0, 1831.0, 722.0, 352.0, 168.0, 139.0, 59.0, 40.0, 36.0, 21.0, 17.0, 8.0, 9.0, 9.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.685546875, -0.6664657592773438, -0.6473846435546875, -0.6283035278320312, -0.609222412109375, -0.5901412963867188, -0.5710601806640625, -0.5519790649414062, -0.53289794921875, -0.5138168334960938, -0.4947357177734375, -0.47565460205078125, -0.456573486328125, -0.43749237060546875, -0.4184112548828125, -0.39933013916015625, -0.3802490234375, -0.36116790771484375, -0.3420867919921875, -0.32300567626953125, -0.303924560546875, -0.28484344482421875, -0.2657623291015625, -0.24668121337890625, -0.22760009765625, -0.20851898193359375, -0.1894378662109375, -0.17035675048828125, -0.151275634765625, -0.13219451904296875, -0.1131134033203125, -0.09403228759765625, -0.074951171875, -0.05587005615234375, -0.0367889404296875, -0.01770782470703125, 0.001373291015625, 0.02045440673828125, 0.0395355224609375, 0.05861663818359375, 0.07769775390625, 0.09677886962890625, 0.1158599853515625, 0.13494110107421875, 0.154022216796875, 0.17310333251953125, 0.1921844482421875, 0.21126556396484375, 0.2303466796875, 0.24942779541015625, 0.2685089111328125, 0.28759002685546875, 0.306671142578125, 0.32575225830078125, 0.3448333740234375, 0.36391448974609375, 0.38299560546875, 0.40207672119140625, 0.4211578369140625, 0.44023895263671875, 0.459320068359375, 0.47840118408203125, 0.4974822998046875, 0.5165634155273438, 0.53564453125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 12.0, 9.0, 16.0, 18.0, 28.0, 45.0, 56.0, 47.0, 77.0, 72.0, 96.0, 86.0, 71.0, 70.0, 75.0, 44.0, 49.0, 35.0, 36.0, 23.0, 14.0, 14.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.199462890625, -0.1926898956298828, -0.18591690063476562, -0.17914390563964844, -0.17237091064453125, -0.16559791564941406, -0.15882492065429688, -0.1520519256591797, -0.1452789306640625, -0.1385059356689453, -0.13173294067382812, -0.12495994567871094, -0.11818695068359375, -0.11141395568847656, -0.10464096069335938, -0.09786796569824219, -0.091094970703125, -0.08432197570800781, -0.07754898071289062, -0.07077598571777344, -0.06400299072265625, -0.05722999572753906, -0.050457000732421875, -0.04368400573730469, -0.0369110107421875, -0.030138015747070312, -0.023365020751953125, -0.016592025756835938, -0.00981903076171875, -0.0030460357666015625, 0.003726959228515625, 0.010499954223632812, 0.01727294921875, 0.024045944213867188, 0.030818939208984375, 0.03759193420410156, 0.04436492919921875, 0.05113792419433594, 0.057910919189453125, 0.06468391418457031, 0.0714569091796875, 0.07822990417480469, 0.08500289916992188, 0.09177589416503906, 0.09854888916015625, 0.10532188415527344, 0.11209487915039062, 0.11886787414550781, 0.125640869140625, 0.1324138641357422, 0.13918685913085938, 0.14595985412597656, 0.15273284912109375, 0.15950584411621094, 0.16627883911132812, 0.1730518341064453, 0.1798248291015625, 0.1865978240966797, 0.19337081909179688, 0.20014381408691406, 0.20691680908203125, 0.21368980407714844, 0.22046279907226562, 0.2272357940673828, 0.2340087890625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 4.0, 6.0, 9.0, 11.0, 14.0, 24.0, 29.0, 52.0, 95.0, 176.0, 296.0, 542.0, 1292.0, 2597.0, 5864.0, 14236.0, 36183.0, 111882.0, 454693.0, 296893.0, 77421.0, 26974.0, 10622.0, 4539.0, 2002.0, 1022.0, 465.0, 278.0, 133.0, 67.0, 47.0, 21.0, 10.0, 11.0, 10.0, 4.0, 3.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0], "bins": [-0.403076171875, -0.39116668701171875, -0.3792572021484375, -0.36734771728515625, -0.355438232421875, -0.34352874755859375, -0.3316192626953125, -0.31970977783203125, -0.30780029296875, -0.29589080810546875, -0.2839813232421875, -0.27207183837890625, -0.260162353515625, -0.24825286865234375, -0.2363433837890625, -0.22443389892578125, -0.2125244140625, -0.20061492919921875, -0.1887054443359375, -0.17679595947265625, -0.164886474609375, -0.15297698974609375, -0.1410675048828125, -0.12915802001953125, -0.11724853515625, -0.10533905029296875, -0.0934295654296875, -0.08152008056640625, -0.069610595703125, -0.05770111083984375, -0.0457916259765625, -0.03388214111328125, -0.02197265625, -0.01006317138671875, 0.0018463134765625, 0.01375579833984375, 0.025665283203125, 0.03757476806640625, 0.0494842529296875, 0.06139373779296875, 0.07330322265625, 0.08521270751953125, 0.0971221923828125, 0.10903167724609375, 0.120941162109375, 0.13285064697265625, 0.1447601318359375, 0.15666961669921875, 0.1685791015625, 0.18048858642578125, 0.1923980712890625, 0.20430755615234375, 0.216217041015625, 0.22812652587890625, 0.2400360107421875, 0.25194549560546875, 0.26385498046875, 0.27576446533203125, 0.2876739501953125, 0.29958343505859375, 0.311492919921875, 0.32340240478515625, 0.3353118896484375, 0.34722137451171875, 0.359130859375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 6.0, 3.0, 5.0, 4.0, 4.0, 7.0, 7.0, 11.0, 16.0, 13.0, 17.0, 16.0, 26.0, 28.0, 40.0, 33.0, 35.0, 47.0, 57.0, 36.0, 37.0, 55.0, 52.0, 41.0, 56.0, 40.0, 34.0, 42.0, 40.0, 31.0, 28.0, 26.0, 16.0, 19.0, 22.0, 8.0, 11.0, 12.0, 5.0, 3.0, 2.0, 1.0, 3.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.308837890625, -0.29869842529296875, -0.2885589599609375, -0.27841949462890625, -0.268280029296875, -0.25814056396484375, -0.2480010986328125, -0.23786163330078125, -0.22772216796875, -0.21758270263671875, -0.2074432373046875, -0.19730377197265625, -0.187164306640625, -0.17702484130859375, -0.1668853759765625, -0.15674591064453125, -0.1466064453125, -0.13646697998046875, -0.1263275146484375, -0.11618804931640625, -0.106048583984375, -0.09590911865234375, -0.0857696533203125, -0.07563018798828125, -0.06549072265625, -0.05535125732421875, -0.0452117919921875, -0.03507232666015625, -0.024932861328125, -0.01479339599609375, -0.0046539306640625, 0.00548553466796875, 0.015625, 0.02576446533203125, 0.0359039306640625, 0.04604339599609375, 0.056182861328125, 0.06632232666015625, 0.0764617919921875, 0.08660125732421875, 0.09674072265625, 0.10688018798828125, 0.1170196533203125, 0.12715911865234375, 0.137298583984375, 0.14743804931640625, 0.1575775146484375, 0.16771697998046875, 0.1778564453125, 0.18799591064453125, 0.1981353759765625, 0.20827484130859375, 0.218414306640625, 0.22855377197265625, 0.2386932373046875, 0.24883270263671875, 0.25897216796875, 0.26911163330078125, 0.2792510986328125, 0.28939056396484375, 0.299530029296875, 0.30966949462890625, 0.3198089599609375, 0.32994842529296875, 0.340087890625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 7.0, 10.0, 10.0, 13.0, 22.0, 28.0, 43.0, 59.0, 91.0, 141.0, 214.0, 351.0, 558.0, 903.0, 1614.0, 3037.0, 6440.0, 16251.0, 54351.0, 403927.0, 469663.0, 59454.0, 17198.0, 6786.0, 3243.0, 1600.0, 931.0, 583.0, 355.0, 217.0, 162.0, 87.0, 78.0, 32.0, 29.0, 22.0, 18.0, 19.0, 8.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2034912109375, -0.19733047485351562, -0.19116973876953125, -0.18500900268554688, -0.1788482666015625, -0.17268753051757812, -0.16652679443359375, -0.16036605834960938, -0.154205322265625, -0.14804458618164062, -0.14188385009765625, -0.13572311401367188, -0.1295623779296875, -0.12340164184570312, -0.11724090576171875, -0.11108016967773438, -0.10491943359375, -0.09875869750976562, -0.09259796142578125, -0.08643722534179688, -0.0802764892578125, -0.07411575317382812, -0.06795501708984375, -0.061794281005859375, -0.055633544921875, -0.049472808837890625, -0.04331207275390625, -0.037151336669921875, -0.0309906005859375, -0.024829864501953125, -0.01866912841796875, -0.012508392333984375, -0.00634765625, -0.000186920166015625, 0.00597381591796875, 0.012134552001953125, 0.0182952880859375, 0.024456024169921875, 0.03061676025390625, 0.036777496337890625, 0.042938232421875, 0.049098968505859375, 0.05525970458984375, 0.061420440673828125, 0.0675811767578125, 0.07374191284179688, 0.07990264892578125, 0.08606338500976562, 0.09222412109375, 0.09838485717773438, 0.10454559326171875, 0.11070632934570312, 0.1168670654296875, 0.12302780151367188, 0.12918853759765625, 0.13534927368164062, 0.141510009765625, 0.14767074584960938, 0.15383148193359375, 0.15999221801757812, 0.1661529541015625, 0.17231369018554688, 0.17847442626953125, 0.18463516235351562, 0.1907958984375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 9.0, 8.0, 17.0, 26.0, 41.0, 84.0, 168.0, 275.0, 171.0, 74.0, 44.0, 20.0, 19.0, 9.0, 6.0, 7.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.67572021484375e-05, -6.514694541692734e-05, -6.353668868541718e-05, -6.192643195390701e-05, -6.031617522239685e-05, -5.870591849088669e-05, -5.7095661759376526e-05, -5.5485405027866364e-05, -5.38751482963562e-05, -5.226489156484604e-05, -5.0654634833335876e-05, -4.9044378101825714e-05, -4.743412137031555e-05, -4.582386463880539e-05, -4.421360790729523e-05, -4.2603351175785065e-05, -4.09930944442749e-05, -3.938283771276474e-05, -3.777258098125458e-05, -3.6162324249744415e-05, -3.455206751823425e-05, -3.294181078672409e-05, -3.133155405521393e-05, -2.9721297323703766e-05, -2.8111040592193604e-05, -2.650078386068344e-05, -2.489052712917328e-05, -2.3280270397663116e-05, -2.1670013666152954e-05, -2.0059756934642792e-05, -1.844950020313263e-05, -1.6839243471622467e-05, -1.5228986740112305e-05, -1.3618730008602142e-05, -1.200847327709198e-05, -1.0398216545581818e-05, -8.787959814071655e-06, -7.177703082561493e-06, -5.5674463510513306e-06, -3.957189619541168e-06, -2.346932888031006e-06, -7.366761565208435e-07, 8.735805749893188e-07, 2.483837306499481e-06, 4.0940940380096436e-06, 5.704350769519806e-06, 7.314607501029968e-06, 8.92486423254013e-06, 1.0535120964050293e-05, 1.2145377695560455e-05, 1.3755634427070618e-05, 1.536589115858078e-05, 1.6976147890090942e-05, 1.8586404621601105e-05, 2.0196661353111267e-05, 2.180691808462143e-05, 2.3417174816131592e-05, 2.5027431547641754e-05, 2.6637688279151917e-05, 2.824794501066208e-05, 2.985820174217224e-05, 3.1468458473682404e-05, 3.3078715205192566e-05, 3.468897193670273e-05, 3.629922866821289e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 4.0, 6.0, 4.0, 12.0, 21.0, 36.0, 43.0, 123.0, 326.0, 840.0, 2695.0, 12818.0, 333140.0, 676778.0, 16893.0, 3162.0, 967.0, 387.0, 128.0, 66.0, 34.0, 21.0, 12.0, 3.0, 5.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.55322265625, -0.5364913940429688, -0.5197601318359375, -0.5030288696289062, -0.486297607421875, -0.46956634521484375, -0.4528350830078125, -0.43610382080078125, -0.41937255859375, -0.40264129638671875, -0.3859100341796875, -0.36917877197265625, -0.352447509765625, -0.33571624755859375, -0.3189849853515625, -0.30225372314453125, -0.2855224609375, -0.26879119873046875, -0.2520599365234375, -0.23532867431640625, -0.218597412109375, -0.20186614990234375, -0.1851348876953125, -0.16840362548828125, -0.15167236328125, -0.13494110107421875, -0.1182098388671875, -0.10147857666015625, -0.084747314453125, -0.06801605224609375, -0.0512847900390625, -0.03455352783203125, -0.017822265625, -0.00109100341796875, 0.0156402587890625, 0.03237152099609375, 0.049102783203125, 0.06583404541015625, 0.0825653076171875, 0.09929656982421875, 0.11602783203125, 0.13275909423828125, 0.1494903564453125, 0.16622161865234375, 0.182952880859375, 0.19968414306640625, 0.2164154052734375, 0.23314666748046875, 0.2498779296875, 0.26660919189453125, 0.2833404541015625, 0.30007171630859375, 0.316802978515625, 0.33353424072265625, 0.3502655029296875, 0.36699676513671875, 0.38372802734375, 0.40045928955078125, 0.4171905517578125, 0.43392181396484375, 0.450653076171875, 0.46738433837890625, 0.4841156005859375, 0.5008468627929688, 0.517578125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 0.0, 7.0, 6.0, 13.0, 12.0, 16.0, 29.0, 37.0, 61.0, 66.0, 103.0, 153.0, 147.0, 89.0, 70.0, 54.0, 39.0, 16.0, 21.0, 8.0, 8.0, 8.0, 7.0, 4.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1807861328125, -0.1749553680419922, -0.16912460327148438, -0.16329383850097656, -0.15746307373046875, -0.15163230895996094, -0.14580154418945312, -0.1399707794189453, -0.1341400146484375, -0.1283092498779297, -0.12247848510742188, -0.11664772033691406, -0.11081695556640625, -0.10498619079589844, -0.09915542602539062, -0.09332466125488281, -0.087493896484375, -0.08166313171386719, -0.07583236694335938, -0.07000160217285156, -0.06417083740234375, -0.05834007263183594, -0.052509307861328125, -0.04667854309082031, -0.0408477783203125, -0.03501701354980469, -0.029186248779296875, -0.023355484008789062, -0.01752471923828125, -0.011693954467773438, -0.005863189697265625, -3.24249267578125e-05, 0.00579833984375, 0.011629104614257812, 0.017459869384765625, 0.023290634155273438, 0.02912139892578125, 0.03495216369628906, 0.040782928466796875, 0.04661369323730469, 0.0524444580078125, 0.05827522277832031, 0.06410598754882812, 0.06993675231933594, 0.07576751708984375, 0.08159828186035156, 0.08742904663085938, 0.09325981140136719, 0.099090576171875, 0.10492134094238281, 0.11075210571289062, 0.11658287048339844, 0.12241363525390625, 0.12824440002441406, 0.13407516479492188, 0.1399059295654297, 0.1457366943359375, 0.1515674591064453, 0.15739822387695312, 0.16322898864746094, 0.16905975341796875, 0.17489051818847656, 0.18072128295898438, 0.1865520477294922, 0.1923828125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 10.0, 13.0, 26.0, 56.0, 98.0, 190.0, 218.0, 181.0, 105.0, 61.0, 23.0, 11.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.101652145385742, -2.024793863296509, -1.947935700416565, -1.8710774183273315, -1.7942192554473877, -1.7173609733581543, -1.640502691268921, -1.5636444091796875, -1.4867862462997437, -1.4099279642105103, -1.3330698013305664, -1.256211519241333, -1.1793532371520996, -1.1024950742721558, -1.0256367921829224, -0.9487785696983337, -0.8719203472137451, -0.7950621247291565, -0.7182039022445679, -0.6413456201553345, -0.5644873976707458, -0.4876291751861572, -0.4107709228992462, -0.3339126706123352, -0.2570544481277466, -0.18019621074199677, -0.10333797335624695, -0.02647973597049713, 0.050378501415252686, 0.1272367238998413, 0.20409497618675232, 0.28095322847366333, 0.35781168937683105, 0.4346699118614197, 0.5115281343460083, 0.5883864164352417, 0.6652446389198303, 0.742102861404419, 0.8189611434936523, 0.895819365978241, 0.9726775884628296, 1.049535870552063, 1.1263940334320068, 1.2032523155212402, 1.2801105976104736, 1.3569687604904175, 1.4338270425796509, 1.5106852054595947, 1.5875434875488281, 1.6644017696380615, 1.7412599325180054, 1.8181182146072388, 1.8949763774871826, 1.971834659576416, 2.0486929416656494, 2.125551223754883, 2.202409267425537, 2.2792675495147705, 2.356125831604004, 2.432983875274658, 2.5098421573638916, 2.586700439453125, 2.6635587215423584, 2.740417003631592, 2.817275285720825]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 2.0, 5.0, 5.0, 11.0, 7.0, 15.0, 11.0, 9.0, 18.0, 22.0, 23.0, 22.0, 19.0, 29.0, 33.0, 43.0, 28.0, 38.0, 33.0, 43.0, 38.0, 33.0, 43.0, 33.0, 44.0, 36.0, 31.0, 32.0, 32.0, 26.0, 24.0, 27.0, 24.0, 27.0, 21.0, 13.0, 16.0, 9.0, 16.0, 8.0, 10.0, 9.0, 3.0, 8.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.6852008700370789, -0.6619501113891602, -0.6386994123458862, -0.6154486536979675, -0.5921978950500488, -0.5689471960067749, -0.5456964373588562, -0.5224456787109375, -0.4991949498653412, -0.4759442210197449, -0.45269346237182617, -0.42944273352622986, -0.40619200468063354, -0.38294124603271484, -0.35969051718711853, -0.3364397883415222, -0.3131890296936035, -0.2899383008480072, -0.2666875422000885, -0.2434368133544922, -0.22018606960773468, -0.19693532586097717, -0.17368459701538086, -0.15043385326862335, -0.12718310952186584, -0.10393236577510834, -0.08068162947893143, -0.05743089318275452, -0.03418014943599701, -0.010929405689239502, 0.012321323156356812, 0.03557206690311432, 0.0588228702545166, 0.08207361400127411, 0.10532435029745102, 0.12857508659362793, 0.15182583034038544, 0.17507657408714294, 0.19832730293273926, 0.22157804667949677, 0.24482879042625427, 0.2680795192718506, 0.2913302779197693, 0.3145810067653656, 0.3378317356109619, 0.3610824942588806, 0.38433322310447693, 0.40758395195007324, 0.43083471059799194, 0.45408543944358826, 0.47733619809150696, 0.5005869269371033, 0.523837685585022, 0.5470883846282959, 0.5703391432762146, 0.5935899019241333, 0.6168406009674072, 0.6400913596153259, 0.6633420586585999, 0.6865928173065186, 0.7098435759544373, 0.733094334602356, 0.7563450336456299, 0.7795957922935486, 0.8028465509414673]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 10.0, 8.0, 15.0, 28.0, 40.0, 76.0, 126.0, 267.0, 631.0, 1510.0, 4471.0, 13943.0, 84661.0, 3322519.0, 718048.0, 36300.0, 7652.0, 2437.0, 860.0, 304.0, 169.0, 82.0, 39.0, 25.0, 22.0, 11.0, 8.0, 11.0, 1.0, 5.0, 2.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.404541015625, -0.3875312805175781, -0.37052154541015625, -0.3535118103027344, -0.3365020751953125, -0.3194923400878906, -0.30248260498046875, -0.2854728698730469, -0.268463134765625, -0.2514533996582031, -0.23444366455078125, -0.21743392944335938, -0.2004241943359375, -0.18341445922851562, -0.16640472412109375, -0.14939498901367188, -0.13238525390625, -0.11537551879882812, -0.09836578369140625, -0.08135604858398438, -0.0643463134765625, -0.047336578369140625, -0.03032684326171875, -0.013317108154296875, 0.003692626953125, 0.020702362060546875, 0.03771209716796875, 0.054721832275390625, 0.0717315673828125, 0.08874130249023438, 0.10575103759765625, 0.12276077270507812, 0.1397705078125, 0.15678024291992188, 0.17378997802734375, 0.19079971313476562, 0.2078094482421875, 0.22481918334960938, 0.24182891845703125, 0.2588386535644531, 0.275848388671875, 0.2928581237792969, 0.30986785888671875, 0.3268775939941406, 0.3438873291015625, 0.3608970642089844, 0.37790679931640625, 0.3949165344238281, 0.41192626953125, 0.4289360046386719, 0.44594573974609375, 0.4629554748535156, 0.4799652099609375, 0.4969749450683594, 0.5139846801757812, 0.5309944152832031, 0.548004150390625, 0.5650138854980469, 0.5820236206054688, 0.5990333557128906, 0.6160430908203125, 0.6330528259277344, 0.6500625610351562, 0.6670722961425781, 0.68408203125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 0.0, 3.0, 5.0, 9.0, 7.0, 18.0, 13.0, 25.0, 30.0, 47.0, 46.0, 72.0, 67.0, 76.0, 78.0, 77.0, 73.0, 77.0, 54.0, 46.0, 45.0, 36.0, 27.0, 27.0, 20.0, 14.0, 6.0, 6.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.178955078125, -0.1725940704345703, -0.16623306274414062, -0.15987205505371094, -0.15351104736328125, -0.14715003967285156, -0.14078903198242188, -0.1344280242919922, -0.1280670166015625, -0.12170600891113281, -0.11534500122070312, -0.10898399353027344, -0.10262298583984375, -0.09626197814941406, -0.08990097045898438, -0.08353996276855469, -0.077178955078125, -0.07081794738769531, -0.06445693969726562, -0.05809593200683594, -0.05173492431640625, -0.04537391662597656, -0.039012908935546875, -0.03265190124511719, -0.0262908935546875, -0.019929885864257812, -0.013568878173828125, -0.0072078704833984375, -0.00084686279296875, 0.0055141448974609375, 0.011875152587890625, 0.018236160278320312, 0.02459716796875, 0.030958175659179688, 0.037319183349609375, 0.04368019104003906, 0.05004119873046875, 0.05640220642089844, 0.06276321411132812, 0.06912422180175781, 0.0754852294921875, 0.08184623718261719, 0.08820724487304688, 0.09456825256347656, 0.10092926025390625, 0.10729026794433594, 0.11365127563476562, 0.12001228332519531, 0.126373291015625, 0.1327342987060547, 0.13909530639648438, 0.14545631408691406, 0.15181732177734375, 0.15817832946777344, 0.16453933715820312, 0.1709003448486328, 0.1772613525390625, 0.1836223602294922, 0.18998336791992188, 0.19634437561035156, 0.20270538330078125, 0.20906639099121094, 0.21542739868164062, 0.2217884063720703, 0.2281494140625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 6.0, 5.0, 7.0, 10.0, 9.0, 12.0, 11.0, 14.0, 19.0, 25.0, 29.0, 42.0, 72.0, 65.0, 90.0, 115.0, 162.0, 220.0, 407.0, 650.0, 1175.0, 2707.0, 7832.0, 33953.0, 345216.0, 3663783.0, 109442.0, 18397.0, 5062.0, 1965.0, 988.0, 518.0, 360.0, 222.0, 162.0, 132.0, 97.0, 75.0, 55.0, 49.0, 28.0, 29.0, 18.0, 12.0, 11.0, 14.0, 8.0, 5.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51806640625, -0.49909210205078125, -0.4801177978515625, -0.46114349365234375, -0.442169189453125, -0.42319488525390625, -0.4042205810546875, -0.38524627685546875, -0.36627197265625, -0.34729766845703125, -0.3283233642578125, -0.30934906005859375, -0.290374755859375, -0.27140045166015625, -0.2524261474609375, -0.23345184326171875, -0.2144775390625, -0.19550323486328125, -0.1765289306640625, -0.15755462646484375, -0.138580322265625, -0.11960601806640625, -0.1006317138671875, -0.08165740966796875, -0.06268310546875, -0.04370880126953125, -0.0247344970703125, -0.00576019287109375, 0.013214111328125, 0.03218841552734375, 0.0511627197265625, 0.07013702392578125, 0.089111328125, 0.10808563232421875, 0.1270599365234375, 0.14603424072265625, 0.165008544921875, 0.18398284912109375, 0.2029571533203125, 0.22193145751953125, 0.24090576171875, 0.25988006591796875, 0.2788543701171875, 0.29782867431640625, 0.316802978515625, 0.33577728271484375, 0.3547515869140625, 0.37372589111328125, 0.3927001953125, 0.41167449951171875, 0.4306488037109375, 0.44962310791015625, 0.468597412109375, 0.48757171630859375, 0.5065460205078125, 0.5255203247070312, 0.54449462890625, 0.5634689331054688, 0.5824432373046875, 0.6014175415039062, 0.620391845703125, 0.6393661499023438, 0.6583404541015625, 0.6773147583007812, 0.6962890625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 0.0, 6.0, 12.0, 19.0, 28.0, 54.0, 99.0, 240.0, 778.0, 1966.0, 536.0, 150.0, 65.0, 37.0, 35.0, 20.0, 14.0, 6.0, 1.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.40234375, -0.38350677490234375, -0.3646697998046875, -0.34583282470703125, -0.326995849609375, -0.30815887451171875, -0.2893218994140625, -0.27048492431640625, -0.25164794921875, -0.23281097412109375, -0.2139739990234375, -0.19513702392578125, -0.176300048828125, -0.15746307373046875, -0.1386260986328125, -0.11978912353515625, -0.1009521484375, -0.08211517333984375, -0.0632781982421875, -0.04444122314453125, -0.025604248046875, -0.00676727294921875, 0.0120697021484375, 0.03090667724609375, 0.04974365234375, 0.06858062744140625, 0.0874176025390625, 0.10625457763671875, 0.125091552734375, 0.14392852783203125, 0.1627655029296875, 0.18160247802734375, 0.200439453125, 0.21927642822265625, 0.2381134033203125, 0.25695037841796875, 0.275787353515625, 0.29462432861328125, 0.3134613037109375, 0.33229827880859375, 0.35113525390625, 0.36997222900390625, 0.3888092041015625, 0.40764617919921875, 0.426483154296875, 0.44532012939453125, 0.4641571044921875, 0.48299407958984375, 0.5018310546875, 0.5206680297851562, 0.5395050048828125, 0.5583419799804688, 0.577178955078125, 0.5960159301757812, 0.6148529052734375, 0.6336898803710938, 0.65252685546875, 0.6713638305664062, 0.6902008056640625, 0.7090377807617188, 0.727874755859375, 0.7467117309570312, 0.7655487060546875, 0.7843856811523438, 0.80322265625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 11.0, 12.0, 21.0, 46.0, 103.0, 234.0, 266.0, 153.0, 77.0, 36.0, 22.0, 10.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.733350992202759, -2.6292102336883545, -2.52506947517395, -2.420928716659546, -2.3167879581451416, -2.2126471996307373, -2.108506202697754, -2.0043654441833496, -1.9002248048782349, -1.7960840463638306, -1.6919432878494263, -1.5878024101257324, -1.4836616516113281, -1.3795208930969238, -1.2753801345825195, -1.1712393760681152, -1.067098617553711, -0.9629578590393066, -0.8588171005249023, -0.7546762824058533, -0.650535523891449, -0.5463947653770447, -0.4422539472579956, -0.3381131887435913, -0.233972430229187, -0.12983165681362152, -0.02569088339805603, 0.07844990491867065, 0.18259066343307495, 0.28673142194747925, 0.3908722400665283, 0.4950129985809326, 0.5991537570953369, 0.7032945156097412, 0.8074352741241455, 0.9115760922431946, 1.015716791152954, 1.1198575496673584, 1.2239984273910522, 1.3281391859054565, 1.4322799444198608, 1.5364207029342651, 1.6405614614486694, 1.7447023391723633, 1.8488430976867676, 1.9529838562011719, 2.057124614715576, 2.1612653732299805, 2.2654061317443848, 2.369546890258789, 2.4736876487731934, 2.5778284072875977, 2.681969165802002, 2.7861099243164062, 2.8902506828308105, 2.994391441345215, 3.098532199859619, 3.2026729583740234, 3.3068137168884277, 3.410954475402832, 3.5150952339172363, 3.6192359924316406, 3.723376750946045, 3.827517509460449, 3.9316585063934326]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 12.0, 16.0, 29.0, 30.0, 26.0, 31.0, 25.0, 33.0, 62.0, 54.0, 42.0, 52.0, 55.0, 64.0, 62.0, 52.0, 44.0, 40.0, 38.0, 40.0, 33.0, 26.0, 29.0, 33.0, 20.0, 18.0, 11.0, 8.0, 5.0, 7.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3170136213302612, -1.2788667678833008, -1.2407199144363403, -1.2025730609893799, -1.1644262075424194, -1.126279354095459, -1.0881325006484985, -1.049985647201538, -1.0118389129638672, -0.9736920595169067, -0.9355452060699463, -0.8973983526229858, -0.8592514991760254, -0.8211046457290649, -0.7829578518867493, -0.7448109984397888, -0.7066640853881836, -0.6685172319412231, -0.6303703784942627, -0.5922235250473022, -0.5540766716003418, -0.5159298181533813, -0.4777830243110657, -0.4396361708641052, -0.4014893174171448, -0.3633424639701843, -0.3251956105232239, -0.2870487868785858, -0.24890193343162537, -0.21075507998466492, -0.17260824143886566, -0.1344614028930664, -0.0963144302368164, -0.058167584240436554, -0.0200207382440567, 0.01812610775232315, 0.056272953748703, 0.09441980719566345, 0.1325666457414627, 0.17071348428726196, 0.2088603377342224, 0.24700719118118286, 0.2851540446281433, 0.32330086827278137, 0.3614477217197418, 0.39959457516670227, 0.43774139881134033, 0.4758882522583008, 0.5140351057052612, 0.5521819591522217, 0.5903288125991821, 0.6284756660461426, 0.666622519493103, 0.7047693729400635, 0.7429161667823792, 0.7810630202293396, 0.8192098736763, 0.8573567271232605, 0.895503580570221, 0.9336504340171814, 0.9717972278594971, 1.0099440813064575, 1.048090934753418, 1.0862377882003784, 1.1243846416473389]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 9.0, 12.0, 14.0, 22.0, 46.0, 88.0, 195.0, 314.0, 857.0, 2048.0, 5889.0, 19396.0, 82150.0, 513045.0, 344471.0, 57754.0, 14565.0, 4670.0, 1601.0, 731.0, 335.0, 130.0, 90.0, 33.0, 38.0, 14.0, 8.0, 6.0, 5.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76513671875, -0.7411422729492188, -0.7171478271484375, -0.6931533813476562, -0.669158935546875, -0.6451644897460938, -0.6211700439453125, -0.5971755981445312, -0.57318115234375, -0.5491867065429688, -0.5251922607421875, -0.5011978149414062, -0.477203369140625, -0.45320892333984375, -0.4292144775390625, -0.40522003173828125, -0.3812255859375, -0.35723114013671875, -0.3332366943359375, -0.30924224853515625, -0.285247802734375, -0.26125335693359375, -0.2372589111328125, -0.21326446533203125, -0.18927001953125, -0.16527557373046875, -0.1412811279296875, -0.11728668212890625, -0.093292236328125, -0.06929779052734375, -0.0453033447265625, -0.02130889892578125, 0.002685546875, 0.02667999267578125, 0.0506744384765625, 0.07466888427734375, 0.098663330078125, 0.12265777587890625, 0.1466522216796875, 0.17064666748046875, 0.19464111328125, 0.21863555908203125, 0.2426300048828125, 0.26662445068359375, 0.290618896484375, 0.31461334228515625, 0.3386077880859375, 0.36260223388671875, 0.3865966796875, 0.41059112548828125, 0.4345855712890625, 0.45858001708984375, 0.482574462890625, 0.5065689086914062, 0.5305633544921875, 0.5545578002929688, 0.57855224609375, 0.6025466918945312, 0.6265411376953125, 0.6505355834960938, 0.674530029296875, 0.6985244750976562, 0.7225189208984375, 0.7465133666992188, 0.7705078125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 7.0, 7.0, 6.0, 18.0, 25.0, 20.0, 25.0, 27.0, 40.0, 55.0, 50.0, 84.0, 70.0, 70.0, 63.0, 69.0, 62.0, 55.0, 42.0, 35.0, 44.0, 31.0, 17.0, 22.0, 22.0, 16.0, 7.0, 9.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1416015625, -0.13545608520507812, -0.12931060791015625, -0.12316513061523438, -0.1170196533203125, -0.11087417602539062, -0.10472869873046875, -0.09858322143554688, -0.092437744140625, -0.08629226684570312, -0.08014678955078125, -0.07400131225585938, -0.0678558349609375, -0.061710357666015625, -0.05556488037109375, -0.049419403076171875, -0.04327392578125, -0.037128448486328125, -0.03098297119140625, -0.024837493896484375, -0.0186920166015625, -0.012546539306640625, -0.00640106201171875, -0.000255584716796875, 0.005889892578125, 0.012035369873046875, 0.01818084716796875, 0.024326324462890625, 0.0304718017578125, 0.036617279052734375, 0.04276275634765625, 0.048908233642578125, 0.0550537109375, 0.061199188232421875, 0.06734466552734375, 0.07349014282226562, 0.0796356201171875, 0.08578109741210938, 0.09192657470703125, 0.09807205200195312, 0.104217529296875, 0.11036300659179688, 0.11650848388671875, 0.12265396118164062, 0.1287994384765625, 0.13494491577148438, 0.14109039306640625, 0.14723587036132812, 0.15338134765625, 0.15952682495117188, 0.16567230224609375, 0.17181777954101562, 0.1779632568359375, 0.18410873413085938, 0.19025421142578125, 0.19639968872070312, 0.202545166015625, 0.20869064331054688, 0.21483612060546875, 0.22098159790039062, 0.2271270751953125, 0.23327255249023438, 0.23941802978515625, 0.24556350708007812, 0.251708984375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 3.0, 9.0, 7.0, 11.0, 21.0, 21.0, 46.0, 68.0, 130.0, 297.0, 782.0, 2042.0, 6403.0, 24055.0, 121707.0, 679346.0, 170826.0, 30709.0, 8039.0, 2518.0, 853.0, 328.0, 146.0, 72.0, 33.0, 23.0, 17.0, 6.0, 13.0, 5.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8349609375, -0.8085250854492188, -0.7820892333984375, -0.7556533813476562, -0.729217529296875, -0.7027816772460938, -0.6763458251953125, -0.6499099731445312, -0.62347412109375, -0.5970382690429688, -0.5706024169921875, -0.5441665649414062, -0.517730712890625, -0.49129486083984375, -0.4648590087890625, -0.43842315673828125, -0.4119873046875, -0.38555145263671875, -0.3591156005859375, -0.33267974853515625, -0.306243896484375, -0.27980804443359375, -0.2533721923828125, -0.22693634033203125, -0.20050048828125, -0.17406463623046875, -0.1476287841796875, -0.12119293212890625, -0.094757080078125, -0.06832122802734375, -0.0418853759765625, -0.01544952392578125, 0.010986328125, 0.03742218017578125, 0.0638580322265625, 0.09029388427734375, 0.116729736328125, 0.14316558837890625, 0.1696014404296875, 0.19603729248046875, 0.22247314453125, 0.24890899658203125, 0.2753448486328125, 0.30178070068359375, 0.328216552734375, 0.35465240478515625, 0.3810882568359375, 0.40752410888671875, 0.4339599609375, 0.46039581298828125, 0.4868316650390625, 0.5132675170898438, 0.539703369140625, 0.5661392211914062, 0.5925750732421875, 0.6190109252929688, 0.64544677734375, 0.6718826293945312, 0.6983184814453125, 0.7247543334960938, 0.751190185546875, 0.7776260375976562, 0.8040618896484375, 0.8304977416992188, 0.85693359375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 3.0, 5.0, 5.0, 5.0, 14.0, 3.0, 6.0, 14.0, 13.0, 26.0, 20.0, 27.0, 27.0, 32.0, 28.0, 42.0, 37.0, 45.0, 38.0, 53.0, 56.0, 48.0, 43.0, 55.0, 42.0, 59.0, 37.0, 36.0, 24.0, 25.0, 13.0, 13.0, 22.0, 12.0, 12.0, 8.0, 15.0, 8.0, 7.0, 5.0, 7.0, 1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.394775390625, -0.3826560974121094, -0.37053680419921875, -0.3584175109863281, -0.3462982177734375, -0.3341789245605469, -0.32205963134765625, -0.3099403381347656, -0.297821044921875, -0.2857017517089844, -0.27358245849609375, -0.2614631652832031, -0.2493438720703125, -0.23722457885742188, -0.22510528564453125, -0.21298599243164062, -0.20086669921875, -0.18874740600585938, -0.17662811279296875, -0.16450881958007812, -0.1523895263671875, -0.14027023315429688, -0.12815093994140625, -0.11603164672851562, -0.103912353515625, -0.09179306030273438, -0.07967376708984375, -0.06755447387695312, -0.0554351806640625, -0.043315887451171875, -0.03119659423828125, -0.019077301025390625, -0.0069580078125, 0.005161285400390625, 0.01728057861328125, 0.029399871826171875, 0.0415191650390625, 0.053638458251953125, 0.06575775146484375, 0.07787704467773438, 0.089996337890625, 0.10211563110351562, 0.11423492431640625, 0.12635421752929688, 0.1384735107421875, 0.15059280395507812, 0.16271209716796875, 0.17483139038085938, 0.18695068359375, 0.19906997680664062, 0.21118927001953125, 0.22330856323242188, 0.2354278564453125, 0.24754714965820312, 0.25966644287109375, 0.2717857360839844, 0.283905029296875, 0.2960243225097656, 0.30814361572265625, 0.3202629089355469, 0.3323822021484375, 0.3445014953613281, 0.35662078857421875, 0.3687400817871094, 0.380859375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 8.0, 7.0, 20.0, 29.0, 39.0, 50.0, 108.0, 159.0, 252.0, 451.0, 809.0, 1531.0, 3029.0, 6402.0, 15035.0, 38179.0, 168763.0, 667336.0, 95968.0, 28146.0, 11589.0, 5240.0, 2554.0, 1265.0, 647.0, 359.0, 219.0, 121.0, 75.0, 49.0, 29.0, 21.0, 23.0, 15.0, 10.0, 6.0, 3.0, 2.0, 5.0, 1.0, 2.0], "bins": [-0.368896484375, -0.3597545623779297, -0.3506126403808594, -0.34147071838378906, -0.33232879638671875, -0.32318687438964844, -0.3140449523925781, -0.3049030303955078, -0.2957611083984375, -0.2866191864013672, -0.2774772644042969, -0.26833534240722656, -0.25919342041015625, -0.25005149841308594, -0.24090957641601562, -0.2317676544189453, -0.222625732421875, -0.2134838104248047, -0.20434188842773438, -0.19519996643066406, -0.18605804443359375, -0.17691612243652344, -0.16777420043945312, -0.1586322784423828, -0.1494903564453125, -0.1403484344482422, -0.13120651245117188, -0.12206459045410156, -0.11292266845703125, -0.10378074645996094, -0.09463882446289062, -0.08549690246582031, -0.07635498046875, -0.06721305847167969, -0.058071136474609375, -0.04892921447753906, -0.03978729248046875, -0.030645370483398438, -0.021503448486328125, -0.012361526489257812, -0.0032196044921875, 0.0059223175048828125, 0.015064239501953125, 0.024206161499023438, 0.03334808349609375, 0.04249000549316406, 0.051631927490234375, 0.06077384948730469, 0.069915771484375, 0.07905769348144531, 0.08819961547851562, 0.09734153747558594, 0.10648345947265625, 0.11562538146972656, 0.12476730346679688, 0.1339092254638672, 0.1430511474609375, 0.1521930694580078, 0.16133499145507812, 0.17047691345214844, 0.17961883544921875, 0.18876075744628906, 0.19790267944335938, 0.2070446014404297, 0.2161865234375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 5.0, 8.0, 8.0, 7.0, 12.0, 17.0, 26.0, 45.0, 58.0, 147.0, 328.0, 152.0, 65.0, 37.0, 14.0, 7.0, 17.0, 7.0, 11.0, 5.0, 7.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.909536361694336e-05, -7.64140859246254e-05, -7.373280823230743e-05, -7.105153053998947e-05, -6.837025284767151e-05, -6.568897515535355e-05, -6.300769746303558e-05, -6.032641977071762e-05, -5.764514207839966e-05, -5.4963864386081696e-05, -5.228258669376373e-05, -4.960130900144577e-05, -4.692003130912781e-05, -4.4238753616809845e-05, -4.155747592449188e-05, -3.887619823217392e-05, -3.619492053985596e-05, -3.3513642847537994e-05, -3.083236515522003e-05, -2.815108746290207e-05, -2.5469809770584106e-05, -2.2788532078266144e-05, -2.010725438594818e-05, -1.742597669363022e-05, -1.4744699001312256e-05, -1.2063421308994293e-05, -9.38214361667633e-06, -6.700865924358368e-06, -4.019588232040405e-06, -1.3383105397224426e-06, 1.34296715259552e-06, 4.024244844913483e-06, 6.705522537231445e-06, 9.386800229549408e-06, 1.206807792186737e-05, 1.4749355614185333e-05, 1.7430633306503296e-05, 2.011191099882126e-05, 2.279318869113922e-05, 2.5474466383457184e-05, 2.8155744075775146e-05, 3.083702176809311e-05, 3.351829946041107e-05, 3.6199577152729034e-05, 3.8880854845047e-05, 4.156213253736496e-05, 4.424341022968292e-05, 4.6924687922000885e-05, 4.960596561431885e-05, 5.228724330663681e-05, 5.496852099895477e-05, 5.7649798691272736e-05, 6.03310763835907e-05, 6.301235407590866e-05, 6.569363176822662e-05, 6.837490946054459e-05, 7.105618715286255e-05, 7.373746484518051e-05, 7.641874253749847e-05, 7.910002022981644e-05, 8.17812979221344e-05, 8.446257561445236e-05, 8.714385330677032e-05, 8.982513099908829e-05, 9.250640869140625e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 3.0, 3.0, 6.0, 6.0, 10.0, 13.0, 17.0, 19.0, 31.0, 52.0, 125.0, 323.0, 959.0, 3469.0, 17970.0, 653768.0, 352111.0, 15036.0, 3140.0, 862.0, 324.0, 128.0, 65.0, 21.0, 25.0, 15.0, 9.0, 5.0, 6.0, 7.0, 5.0, 4.0, 1.0, 6.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.94384765625, -0.9175949096679688, -0.8913421630859375, -0.8650894165039062, -0.838836669921875, -0.8125839233398438, -0.7863311767578125, -0.7600784301757812, -0.73382568359375, -0.7075729370117188, -0.6813201904296875, -0.6550674438476562, -0.628814697265625, -0.6025619506835938, -0.5763092041015625, -0.5500564575195312, -0.5238037109375, -0.49755096435546875, -0.4712982177734375, -0.44504547119140625, -0.418792724609375, -0.39253997802734375, -0.3662872314453125, -0.34003448486328125, -0.31378173828125, -0.28752899169921875, -0.2612762451171875, -0.23502349853515625, -0.208770751953125, -0.18251800537109375, -0.1562652587890625, -0.13001251220703125, -0.103759765625, -0.07750701904296875, -0.0512542724609375, -0.02500152587890625, 0.001251220703125, 0.02750396728515625, 0.0537567138671875, 0.08000946044921875, 0.10626220703125, 0.13251495361328125, 0.1587677001953125, 0.18502044677734375, 0.211273193359375, 0.23752593994140625, 0.2637786865234375, 0.29003143310546875, 0.3162841796875, 0.34253692626953125, 0.3687896728515625, 0.39504241943359375, 0.421295166015625, 0.44754791259765625, 0.4738006591796875, 0.5000534057617188, 0.52630615234375, 0.5525588989257812, 0.5788116455078125, 0.6050643920898438, 0.631317138671875, 0.6575698852539062, 0.6838226318359375, 0.7100753784179688, 0.736328125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 6.0, 3.0, 4.0, 5.0, 3.0, 4.0, 10.0, 10.0, 14.0, 19.0, 22.0, 34.0, 41.0, 68.0, 97.0, 175.0, 168.0, 104.0, 61.0, 36.0, 22.0, 18.0, 16.0, 10.0, 11.0, 4.0, 7.0, 5.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.22607421875, -0.2185211181640625, -0.210968017578125, -0.2034149169921875, -0.19586181640625, -0.1883087158203125, -0.180755615234375, -0.1732025146484375, -0.1656494140625, -0.1580963134765625, -0.150543212890625, -0.1429901123046875, -0.13543701171875, -0.1278839111328125, -0.120330810546875, -0.1127777099609375, -0.105224609375, -0.0976715087890625, -0.090118408203125, -0.0825653076171875, -0.07501220703125, -0.0674591064453125, -0.059906005859375, -0.0523529052734375, -0.0447998046875, -0.0372467041015625, -0.029693603515625, -0.0221405029296875, -0.01458740234375, -0.0070343017578125, 0.000518798828125, 0.0080718994140625, 0.015625, 0.0231781005859375, 0.030731201171875, 0.0382843017578125, 0.04583740234375, 0.0533905029296875, 0.060943603515625, 0.0684967041015625, 0.0760498046875, 0.0836029052734375, 0.091156005859375, 0.0987091064453125, 0.10626220703125, 0.1138153076171875, 0.121368408203125, 0.1289215087890625, 0.136474609375, 0.1440277099609375, 0.151580810546875, 0.1591339111328125, 0.16668701171875, 0.1742401123046875, 0.181793212890625, 0.1893463134765625, 0.1968994140625, 0.2044525146484375, 0.212005615234375, 0.2195587158203125, 0.22711181640625, 0.2346649169921875, 0.242218017578125, 0.2497711181640625, 0.25732421875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 13.0, 27.0, 104.0, 253.0, 334.0, 163.0, 61.0, 24.0, 13.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.436753749847412, -4.246328353881836, -4.05590295791626, -3.8654775619506836, -3.6750521659851074, -3.4846267700195312, -3.294201374053955, -3.103775978088379, -2.9133505821228027, -2.7229251861572266, -2.5324997901916504, -2.342074394226074, -2.151648998260498, -1.9612236022949219, -1.7707982063293457, -1.5803728103637695, -1.3899474143981934, -1.1995220184326172, -1.009096622467041, -0.8186712265014648, -0.6282458305358887, -0.4378204345703125, -0.24739503860473633, -0.056969642639160156, 0.13345575332641602, 0.3238811492919922, 0.5143065452575684, 0.7047319412231445, 0.8951573371887207, 1.0855827331542969, 1.276008129119873, 1.4664335250854492, 1.6568584442138672, 1.8472838401794434, 2.0377092361450195, 2.2281346321105957, 2.418560028076172, 2.608985424041748, 2.799410820007324, 2.9898362159729004, 3.1802616119384766, 3.3706870079040527, 3.561112403869629, 3.751537799835205, 3.9419631958007812, 4.132388591766357, 4.322813987731934, 4.51323938369751, 4.703664779663086, 4.894090175628662, 5.084515571594238, 5.2749409675598145, 5.465366363525391, 5.655791759490967, 5.846217155456543, 6.036642551422119, 6.227067947387695, 6.4174933433532715, 6.607918739318848, 6.798344135284424, 6.98876953125, 7.179194927215576, 7.369620323181152, 7.5600457191467285, 7.750471115112305]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 7.0, 4.0, 5.0, 5.0, 3.0, 8.0, 7.0, 13.0, 7.0, 12.0, 20.0, 13.0, 22.0, 21.0, 24.0, 40.0, 22.0, 23.0, 26.0, 30.0, 36.0, 47.0, 40.0, 38.0, 34.0, 32.0, 36.0, 39.0, 32.0, 38.0, 30.0, 26.0, 35.0, 25.0, 28.0, 30.0, 26.0, 19.0, 21.0, 14.0, 9.0, 16.0, 9.0, 7.0, 0.0, 5.0, 8.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.0179200172424316, -0.9860931038856506, -0.9542661905288696, -0.9224392771720886, -0.8906123638153076, -0.8587854504585266, -0.8269585371017456, -0.7951316237449646, -0.7633047103881836, -0.7314777970314026, -0.6996508836746216, -0.6678239703178406, -0.6359970569610596, -0.6041701436042786, -0.5723432302474976, -0.5405163168907166, -0.5086894035339355, -0.47686249017715454, -0.44503557682037354, -0.41320866346359253, -0.3813817501068115, -0.3495548367500305, -0.3177279233932495, -0.2859010100364685, -0.2540740966796875, -0.2222471833229065, -0.1904202699661255, -0.15859335660934448, -0.12676644325256348, -0.09493952989578247, -0.06311261653900146, -0.03128570318222046, 0.0005412101745605469, 0.03236812353134155, 0.06419503688812256, 0.09602195024490356, 0.12784886360168457, 0.15967577695846558, 0.19150269031524658, 0.2233296036720276, 0.2551565170288086, 0.2869834303855896, 0.3188103437423706, 0.3506372570991516, 0.3824641704559326, 0.4142910838127136, 0.44611799716949463, 0.47794491052627563, 0.5097718238830566, 0.5415987372398376, 0.5734256505966187, 0.6052525639533997, 0.6370794773101807, 0.6689063906669617, 0.7007333040237427, 0.7325602173805237, 0.7643871307373047, 0.7962140440940857, 0.8280409574508667, 0.8598678708076477, 0.8916947841644287, 0.9235216975212097, 0.9553486108779907, 0.9871755242347717, 1.0190024375915527]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 6.0, 5.0, 11.0, 13.0, 19.0, 39.0, 58.0, 68.0, 172.0, 319.0, 546.0, 1101.0, 2431.0, 5698.0, 16174.0, 70562.0, 1885807.0, 2103395.0, 81668.0, 16335.0, 5361.0, 2258.0, 1048.0, 526.0, 269.0, 149.0, 75.0, 33.0, 30.0, 26.0, 15.0, 12.0, 9.0, 4.0, 6.0, 7.0, 2.0, 8.0, 1.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.42626953125, -0.407745361328125, -0.38922119140625, -0.370697021484375, -0.3521728515625, -0.333648681640625, -0.31512451171875, -0.296600341796875, -0.278076171875, -0.259552001953125, -0.24102783203125, -0.222503662109375, -0.2039794921875, -0.185455322265625, -0.16693115234375, -0.148406982421875, -0.1298828125, -0.111358642578125, -0.09283447265625, -0.074310302734375, -0.0557861328125, -0.037261962890625, -0.01873779296875, -0.000213623046875, 0.018310546875, 0.036834716796875, 0.05535888671875, 0.073883056640625, 0.0924072265625, 0.110931396484375, 0.12945556640625, 0.147979736328125, 0.16650390625, 0.185028076171875, 0.20355224609375, 0.222076416015625, 0.2406005859375, 0.259124755859375, 0.27764892578125, 0.296173095703125, 0.314697265625, 0.333221435546875, 0.35174560546875, 0.370269775390625, 0.3887939453125, 0.407318115234375, 0.42584228515625, 0.444366455078125, 0.462890625, 0.481414794921875, 0.49993896484375, 0.518463134765625, 0.5369873046875, 0.555511474609375, 0.57403564453125, 0.592559814453125, 0.611083984375, 0.629608154296875, 0.64813232421875, 0.666656494140625, 0.6851806640625, 0.703704833984375, 0.72222900390625, 0.740753173828125, 0.75927734375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 4.0, 6.0, 9.0, 10.0, 24.0, 20.0, 26.0, 38.0, 57.0, 63.0, 67.0, 74.0, 87.0, 60.0, 91.0, 65.0, 53.0, 59.0, 55.0, 41.0, 27.0, 22.0, 23.0, 8.0, 8.0, 7.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2064208984375, -0.1988658905029297, -0.19131088256835938, -0.18375587463378906, -0.17620086669921875, -0.16864585876464844, -0.16109085083007812, -0.1535358428955078, -0.1459808349609375, -0.1384258270263672, -0.13087081909179688, -0.12331581115722656, -0.11576080322265625, -0.10820579528808594, -0.10065078735351562, -0.09309577941894531, -0.085540771484375, -0.07798576354980469, -0.07043075561523438, -0.06287574768066406, -0.05532073974609375, -0.04776573181152344, -0.040210723876953125, -0.03265571594238281, -0.0251007080078125, -0.017545700073242188, -0.009990692138671875, -0.0024356842041015625, 0.00511932373046875, 0.012674331665039062, 0.020229339599609375, 0.027784347534179688, 0.03533935546875, 0.04289436340332031, 0.050449371337890625, 0.05800437927246094, 0.06555938720703125, 0.07311439514160156, 0.08066940307617188, 0.08822441101074219, 0.0957794189453125, 0.10333442687988281, 0.11088943481445312, 0.11844444274902344, 0.12599945068359375, 0.13355445861816406, 0.14110946655273438, 0.1486644744873047, 0.156219482421875, 0.1637744903564453, 0.17132949829101562, 0.17888450622558594, 0.18643951416015625, 0.19399452209472656, 0.20154953002929688, 0.2091045379638672, 0.2166595458984375, 0.2242145538330078, 0.23176956176757812, 0.23932456970214844, 0.24687957763671875, 0.25443458557128906, 0.2619895935058594, 0.2695446014404297, 0.277099609375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 6.0, 9.0, 8.0, 10.0, 23.0, 28.0, 24.0, 42.0, 65.0, 95.0, 134.0, 172.0, 226.0, 268.0, 342.0, 593.0, 860.0, 1349.0, 2128.0, 4275.0, 8824.0, 20973.0, 66397.0, 398223.0, 3352028.0, 250711.0, 51790.0, 17558.0, 7462.0, 3720.0, 1988.0, 1244.0, 813.0, 509.0, 401.0, 254.0, 199.0, 122.0, 93.0, 80.0, 66.0, 47.0, 31.0, 31.0, 17.0, 11.0, 11.0, 9.0, 7.0, 3.0, 2.0, 1.0, 2.0, 3.0], "bins": [-0.53857421875, -0.522918701171875, -0.50726318359375, -0.491607666015625, -0.4759521484375, -0.460296630859375, -0.44464111328125, -0.428985595703125, -0.413330078125, -0.397674560546875, -0.38201904296875, -0.366363525390625, -0.3507080078125, -0.335052490234375, -0.31939697265625, -0.303741455078125, -0.2880859375, -0.272430419921875, -0.25677490234375, -0.241119384765625, -0.2254638671875, -0.209808349609375, -0.19415283203125, -0.178497314453125, -0.162841796875, -0.147186279296875, -0.13153076171875, -0.115875244140625, -0.1002197265625, -0.084564208984375, -0.06890869140625, -0.053253173828125, -0.03759765625, -0.021942138671875, -0.00628662109375, 0.009368896484375, 0.0250244140625, 0.040679931640625, 0.05633544921875, 0.071990966796875, 0.087646484375, 0.103302001953125, 0.11895751953125, 0.134613037109375, 0.1502685546875, 0.165924072265625, 0.18157958984375, 0.197235107421875, 0.212890625, 0.228546142578125, 0.24420166015625, 0.259857177734375, 0.2755126953125, 0.291168212890625, 0.30682373046875, 0.322479248046875, 0.338134765625, 0.353790283203125, 0.36944580078125, 0.385101318359375, 0.4007568359375, 0.416412353515625, 0.43206787109375, 0.447723388671875, 0.46337890625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 6.0, 14.0, 19.0, 15.0, 30.0, 57.0, 111.0, 178.0, 419.0, 1470.0, 1040.0, 305.0, 159.0, 74.0, 53.0, 29.0, 27.0, 20.0, 15.0, 11.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6787109375, -0.6592483520507812, -0.6397857666015625, -0.6203231811523438, -0.600860595703125, -0.5813980102539062, -0.5619354248046875, -0.5424728393554688, -0.52301025390625, -0.5035476684570312, -0.4840850830078125, -0.46462249755859375, -0.445159912109375, -0.42569732666015625, -0.4062347412109375, -0.38677215576171875, -0.3673095703125, -0.34784698486328125, -0.3283843994140625, -0.30892181396484375, -0.289459228515625, -0.26999664306640625, -0.2505340576171875, -0.23107147216796875, -0.21160888671875, -0.19214630126953125, -0.1726837158203125, -0.15322113037109375, -0.133758544921875, -0.11429595947265625, -0.0948333740234375, -0.07537078857421875, -0.055908203125, -0.03644561767578125, -0.0169830322265625, 0.00247955322265625, 0.021942138671875, 0.04140472412109375, 0.0608673095703125, 0.08032989501953125, 0.09979248046875, 0.11925506591796875, 0.1387176513671875, 0.15818023681640625, 0.177642822265625, 0.19710540771484375, 0.2165679931640625, 0.23603057861328125, 0.2554931640625, 0.27495574951171875, 0.2944183349609375, 0.31388092041015625, 0.333343505859375, 0.35280609130859375, 0.3722686767578125, 0.39173126220703125, 0.41119384765625, 0.43065643310546875, 0.4501190185546875, 0.46958160400390625, 0.489044189453125, 0.5085067749023438, 0.5279693603515625, 0.5474319458007812, 0.56689453125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 10.0, 23.0, 38.0, 53.0, 121.0, 203.0, 231.0, 138.0, 75.0, 38.0, 26.0, 10.0, 20.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3636971712112427, -1.251868486404419, -1.1400399208068848, -1.028211236000061, -0.9163825511932373, -0.8045539259910583, -0.6927253007888794, -0.5808966159820557, -0.4690679907798767, -0.35723933577537537, -0.24541069567203522, -0.13358205556869507, -0.021753400564193726, 0.09007525444030762, 0.20190387964248657, 0.3137325644493103, 0.42556118965148926, 0.5373898148536682, 0.6492184996604919, 0.7610471248626709, 0.8728758096694946, 0.9847044348716736, 1.0965330600738525, 1.2083617448806763, 1.3201904296875, 1.4320191144943237, 1.543847680091858, 1.6556763648986816, 1.7675050497055054, 1.879333734512329, 1.9911623001098633, 2.1029911041259766, 2.2148196697235107, 2.326648235321045, 2.438477039337158, 2.5503056049346924, 2.6621341705322266, 2.77396297454834, 2.885791540145874, 2.997620105743408, 3.1094489097595215, 3.2212774753570557, 3.333106279373169, 3.444934844970703, 3.5567634105682373, 3.6685922145843506, 3.7804207801818848, 3.892249584197998, 4.004077911376953, 4.115906715393066, 4.2277350425720215, 4.339563846588135, 4.451392650604248, 4.563220977783203, 4.675049781799316, 4.78687858581543, 4.898707389831543, 5.010536193847656, 5.122364521026611, 5.234193325042725, 5.346022129058838, 5.457850456237793, 5.569679260253906, 5.6815080642700195, 5.793336391448975]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 10.0, 4.0, 5.0, 9.0, 10.0, 15.0, 22.0, 19.0, 22.0, 31.0, 25.0, 31.0, 27.0, 39.0, 51.0, 36.0, 53.0, 45.0, 37.0, 42.0, 33.0, 37.0, 33.0, 40.0, 37.0, 36.0, 39.0, 36.0, 27.0, 26.0, 20.0, 22.0, 17.0, 11.0, 14.0, 9.0, 3.0, 9.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1318732500076294, -1.094403862953186, -1.0569344758987427, -1.0194650888442993, -0.9819956421852112, -0.9445262551307678, -0.9070568084716797, -0.8695874214172363, -0.832118034362793, -0.7946486473083496, -0.7571792602539062, -0.7197098135948181, -0.6822404265403748, -0.6447710394859314, -0.6073015928268433, -0.5698322057723999, -0.5323628187179565, -0.4948934316635132, -0.45742401480674744, -0.4199545979499817, -0.38248521089553833, -0.34501582384109497, -0.3075464069843292, -0.2700769901275635, -0.23260760307312012, -0.19513820111751556, -0.157668799161911, -0.12019939720630646, -0.0827299952507019, -0.04526059329509735, -0.007791191339492798, 0.02967822551727295, 0.06714761257171631, 0.10461701452732086, 0.14208641648292542, 0.17955581843852997, 0.21702522039413452, 0.2544946074485779, 0.29196402430534363, 0.3294334411621094, 0.36690282821655273, 0.4043722152709961, 0.44184163212776184, 0.4793110489845276, 0.516780436038971, 0.5542498230934143, 0.5917192697525024, 0.6291886568069458, 0.6666580438613892, 0.7041274309158325, 0.7415968179702759, 0.779066264629364, 0.8165356516838074, 0.8540050387382507, 0.8914744853973389, 0.9289438724517822, 0.9664132595062256, 1.003882646560669, 1.0413520336151123, 1.0788214206695557, 1.116290807723999, 1.153760313987732, 1.1912297010421753, 1.2286990880966187, 1.266168475151062]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 7.0, 7.0, 11.0, 17.0, 20.0, 24.0, 52.0, 71.0, 97.0, 170.0, 332.0, 615.0, 1202.0, 2827.0, 6887.0, 18898.0, 57012.0, 203384.0, 516690.0, 165263.0, 47819.0, 16090.0, 6058.0, 2573.0, 1112.0, 590.0, 279.0, 150.0, 80.0, 56.0, 46.0, 35.0, 15.0, 13.0, 16.0, 7.0, 11.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65234375, -0.62939453125, -0.6064453125, -0.58349609375, -0.560546875, -0.53759765625, -0.5146484375, -0.49169921875, -0.46875, -0.44580078125, -0.4228515625, -0.39990234375, -0.376953125, -0.35400390625, -0.3310546875, -0.30810546875, -0.28515625, -0.26220703125, -0.2392578125, -0.21630859375, -0.193359375, -0.17041015625, -0.1474609375, -0.12451171875, -0.1015625, -0.07861328125, -0.0556640625, -0.03271484375, -0.009765625, 0.01318359375, 0.0361328125, 0.05908203125, 0.08203125, 0.10498046875, 0.1279296875, 0.15087890625, 0.173828125, 0.19677734375, 0.2197265625, 0.24267578125, 0.265625, 0.28857421875, 0.3115234375, 0.33447265625, 0.357421875, 0.38037109375, 0.4033203125, 0.42626953125, 0.44921875, 0.47216796875, 0.4951171875, 0.51806640625, 0.541015625, 0.56396484375, 0.5869140625, 0.60986328125, 0.6328125, 0.65576171875, 0.6787109375, 0.70166015625, 0.724609375, 0.74755859375, 0.7705078125, 0.79345703125, 0.81640625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 5.0, 6.0, 9.0, 11.0, 23.0, 36.0, 39.0, 49.0, 56.0, 64.0, 68.0, 84.0, 70.0, 84.0, 74.0, 66.0, 47.0, 51.0, 27.0, 46.0, 27.0, 17.0, 18.0, 13.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2244873046875, -0.21610069274902344, -0.20771408081054688, -0.1993274688720703, -0.19094085693359375, -0.1825542449951172, -0.17416763305664062, -0.16578102111816406, -0.1573944091796875, -0.14900779724121094, -0.14062118530273438, -0.1322345733642578, -0.12384796142578125, -0.11546134948730469, -0.10707473754882812, -0.09868812561035156, -0.090301513671875, -0.08191490173339844, -0.07352828979492188, -0.06514167785644531, -0.05675506591796875, -0.04836845397949219, -0.039981842041015625, -0.03159523010253906, -0.0232086181640625, -0.014822006225585938, -0.006435394287109375, 0.0019512176513671875, 0.01033782958984375, 0.018724441528320312, 0.027111053466796875, 0.03549766540527344, 0.04388427734375, 0.05227088928222656, 0.060657501220703125, 0.06904411315917969, 0.07743072509765625, 0.08581733703613281, 0.09420394897460938, 0.10259056091308594, 0.1109771728515625, 0.11936378479003906, 0.12775039672851562, 0.1361370086669922, 0.14452362060546875, 0.1529102325439453, 0.16129684448242188, 0.16968345642089844, 0.178070068359375, 0.18645668029785156, 0.19484329223632812, 0.2032299041748047, 0.21161651611328125, 0.2200031280517578, 0.22838973999023438, 0.23677635192871094, 0.2451629638671875, 0.25354957580566406, 0.2619361877441406, 0.2703227996826172, 0.27870941162109375, 0.2870960235595703, 0.2954826354980469, 0.30386924743652344, 0.312255859375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 9.0, 16.0, 17.0, 30.0, 39.0, 76.0, 113.0, 222.0, 475.0, 1108.0, 3038.0, 9742.0, 40079.0, 270006.0, 620503.0, 78654.0, 16665.0, 4661.0, 1691.0, 676.0, 314.0, 160.0, 97.0, 45.0, 31.0, 27.0, 14.0, 16.0, 4.0, 1.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3115234375, -1.277191162109375, -1.24285888671875, -1.208526611328125, -1.1741943359375, -1.139862060546875, -1.10552978515625, -1.071197509765625, -1.036865234375, -1.002532958984375, -0.96820068359375, -0.933868408203125, -0.8995361328125, -0.865203857421875, -0.83087158203125, -0.796539306640625, -0.76220703125, -0.727874755859375, -0.69354248046875, -0.659210205078125, -0.6248779296875, -0.590545654296875, -0.55621337890625, -0.521881103515625, -0.487548828125, -0.453216552734375, -0.41888427734375, -0.384552001953125, -0.3502197265625, -0.315887451171875, -0.28155517578125, -0.247222900390625, -0.212890625, -0.178558349609375, -0.14422607421875, -0.109893798828125, -0.0755615234375, -0.041229248046875, -0.00689697265625, 0.027435302734375, 0.061767578125, 0.096099853515625, 0.13043212890625, 0.164764404296875, 0.1990966796875, 0.233428955078125, 0.26776123046875, 0.302093505859375, 0.33642578125, 0.370758056640625, 0.40509033203125, 0.439422607421875, 0.4737548828125, 0.508087158203125, 0.54241943359375, 0.576751708984375, 0.611083984375, 0.645416259765625, 0.67974853515625, 0.714080810546875, 0.7484130859375, 0.782745361328125, 0.81707763671875, 0.851409912109375, 0.8857421875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 4.0, 6.0, 10.0, 10.0, 12.0, 18.0, 21.0, 23.0, 19.0, 30.0, 44.0, 41.0, 56.0, 55.0, 50.0, 73.0, 68.0, 76.0, 64.0, 53.0, 53.0, 41.0, 38.0, 19.0, 30.0, 21.0, 19.0, 8.0, 7.0, 9.0, 8.0, 6.0, 1.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.447509765625, -0.4283332824707031, -0.40915679931640625, -0.3899803161621094, -0.3708038330078125, -0.3516273498535156, -0.33245086669921875, -0.3132743835449219, -0.294097900390625, -0.2749214172363281, -0.25574493408203125, -0.23656845092773438, -0.2173919677734375, -0.19821548461914062, -0.17903900146484375, -0.15986251831054688, -0.14068603515625, -0.12150955200195312, -0.10233306884765625, -0.08315658569335938, -0.0639801025390625, -0.044803619384765625, -0.02562713623046875, -0.006450653076171875, 0.012725830078125, 0.031902313232421875, 0.05107879638671875, 0.07025527954101562, 0.0894317626953125, 0.10860824584960938, 0.12778472900390625, 0.14696121215820312, 0.1661376953125, 0.18531417846679688, 0.20449066162109375, 0.22366714477539062, 0.2428436279296875, 0.2620201110839844, 0.28119659423828125, 0.3003730773925781, 0.319549560546875, 0.3387260437011719, 0.35790252685546875, 0.3770790100097656, 0.3962554931640625, 0.4154319763183594, 0.43460845947265625, 0.4537849426269531, 0.47296142578125, 0.4921379089355469, 0.5113143920898438, 0.5304908752441406, 0.5496673583984375, 0.5688438415527344, 0.5880203247070312, 0.6071968078613281, 0.626373291015625, 0.6455497741699219, 0.6647262573242188, 0.6839027404785156, 0.7030792236328125, 0.7222557067871094, 0.7414321899414062, 0.7606086730957031, 0.77978515625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 4.0, 6.0, 4.0, 2.0, 9.0, 12.0, 13.0, 18.0, 21.0, 41.0, 63.0, 73.0, 158.0, 243.0, 408.0, 733.0, 1345.0, 2637.0, 5794.0, 14777.0, 53762.0, 686778.0, 230428.0, 31885.0, 10403.0, 4313.0, 1980.0, 1117.0, 565.0, 359.0, 215.0, 113.0, 90.0, 49.0, 40.0, 18.0, 18.0, 11.0, 10.0, 12.0, 11.0, 8.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.5703125, -0.5534515380859375, -0.536590576171875, -0.5197296142578125, -0.50286865234375, -0.4860076904296875, -0.469146728515625, -0.4522857666015625, -0.4354248046875, -0.4185638427734375, -0.401702880859375, -0.3848419189453125, -0.36798095703125, -0.3511199951171875, -0.334259033203125, -0.3173980712890625, -0.300537109375, -0.2836761474609375, -0.266815185546875, -0.2499542236328125, -0.23309326171875, -0.2162322998046875, -0.199371337890625, -0.1825103759765625, -0.1656494140625, -0.1487884521484375, -0.131927490234375, -0.1150665283203125, -0.09820556640625, -0.0813446044921875, -0.064483642578125, -0.0476226806640625, -0.03076171875, -0.0139007568359375, 0.002960205078125, 0.0198211669921875, 0.03668212890625, 0.0535430908203125, 0.070404052734375, 0.0872650146484375, 0.1041259765625, 0.1209869384765625, 0.137847900390625, 0.1547088623046875, 0.17156982421875, 0.1884307861328125, 0.205291748046875, 0.2221527099609375, 0.239013671875, 0.2558746337890625, 0.272735595703125, 0.2895965576171875, 0.30645751953125, 0.3233184814453125, 0.340179443359375, 0.3570404052734375, 0.3739013671875, 0.3907623291015625, 0.407623291015625, 0.4244842529296875, 0.44134521484375, 0.4582061767578125, 0.475067138671875, 0.4919281005859375, 0.5087890625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 1.0, 8.0, 8.0, 13.0, 13.0, 28.0, 50.0, 57.0, 137.0, 372.0, 140.0, 53.0, 30.0, 21.0, 17.0, 11.0, 6.0, 8.0, 6.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.219480514526367e-05, -7.854495197534561e-05, -7.489509880542755e-05, -7.124524563550949e-05, -6.759539246559143e-05, -6.394553929567337e-05, -6.029568612575531e-05, -5.664583295583725e-05, -5.299597978591919e-05, -4.934612661600113e-05, -4.569627344608307e-05, -4.204642027616501e-05, -3.839656710624695e-05, -3.474671393632889e-05, -3.109686076641083e-05, -2.7447007596492767e-05, -2.3797154426574707e-05, -2.0147301256656647e-05, -1.6497448086738586e-05, -1.2847594916820526e-05, -9.197741746902466e-06, -5.5478885769844055e-06, -1.8980354070663452e-06, 1.751817762851715e-06, 5.401670932769775e-06, 9.051524102687836e-06, 1.2701377272605896e-05, 1.6351230442523956e-05, 2.0001083612442017e-05, 2.3650936782360077e-05, 2.7300789952278137e-05, 3.09506431221962e-05, 3.460049629211426e-05, 3.825034946203232e-05, 4.190020263195038e-05, 4.555005580186844e-05, 4.91999089717865e-05, 5.284976214170456e-05, 5.649961531162262e-05, 6.014946848154068e-05, 6.379932165145874e-05, 6.74491748213768e-05, 7.109902799129486e-05, 7.474888116121292e-05, 7.839873433113098e-05, 8.204858750104904e-05, 8.56984406709671e-05, 8.934829384088516e-05, 9.299814701080322e-05, 9.664800018072128e-05, 0.00010029785335063934, 0.0001039477065205574, 0.00010759755969047546, 0.00011124741286039352, 0.00011489726603031158, 0.00011854711920022964, 0.0001221969723701477, 0.00012584682554006577, 0.00012949667870998383, 0.00013314653187990189, 0.00013679638504981995, 0.000140446238219738, 0.00014409609138965607, 0.00014774594455957413, 0.0001513957977294922]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 4.0, 9.0, 4.0, 12.0, 20.0, 25.0, 52.0, 108.0, 239.0, 642.0, 1896.0, 7846.0, 57464.0, 912977.0, 56564.0, 7665.0, 1901.0, 622.0, 237.0, 106.0, 55.0, 40.0, 16.0, 15.0, 12.0, 5.0, 3.0, 4.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.841796875, -0.810028076171875, -0.77825927734375, -0.746490478515625, -0.7147216796875, -0.682952880859375, -0.65118408203125, -0.619415283203125, -0.587646484375, -0.555877685546875, -0.52410888671875, -0.492340087890625, -0.4605712890625, -0.428802490234375, -0.39703369140625, -0.365264892578125, -0.33349609375, -0.301727294921875, -0.26995849609375, -0.238189697265625, -0.2064208984375, -0.174652099609375, -0.14288330078125, -0.111114501953125, -0.079345703125, -0.047576904296875, -0.01580810546875, 0.015960693359375, 0.0477294921875, 0.079498291015625, 0.11126708984375, 0.143035888671875, 0.1748046875, 0.206573486328125, 0.23834228515625, 0.270111083984375, 0.3018798828125, 0.333648681640625, 0.36541748046875, 0.397186279296875, 0.428955078125, 0.460723876953125, 0.49249267578125, 0.524261474609375, 0.5560302734375, 0.587799072265625, 0.61956787109375, 0.651336669921875, 0.68310546875, 0.714874267578125, 0.74664306640625, 0.778411865234375, 0.8101806640625, 0.841949462890625, 0.87371826171875, 0.905487060546875, 0.937255859375, 0.969024658203125, 1.00079345703125, 1.032562255859375, 1.0643310546875, 1.096099853515625, 1.12786865234375, 1.159637451171875, 1.19140625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 3.0, 4.0, 1.0, 6.0, 6.0, 12.0, 11.0, 9.0, 14.0, 13.0, 14.0, 27.0, 47.0, 73.0, 134.0, 202.0, 178.0, 85.0, 52.0, 24.0, 20.0, 13.0, 11.0, 10.0, 6.0, 5.0, 4.0, 3.0, 4.0, 3.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.451416015625, -0.43939971923828125, -0.4273834228515625, -0.41536712646484375, -0.403350830078125, -0.39133453369140625, -0.3793182373046875, -0.36730194091796875, -0.35528564453125, -0.34326934814453125, -0.3312530517578125, -0.31923675537109375, -0.307220458984375, -0.29520416259765625, -0.2831878662109375, -0.27117156982421875, -0.2591552734375, -0.24713897705078125, -0.2351226806640625, -0.22310638427734375, -0.211090087890625, -0.19907379150390625, -0.1870574951171875, -0.17504119873046875, -0.16302490234375, -0.15100860595703125, -0.1389923095703125, -0.12697601318359375, -0.114959716796875, -0.10294342041015625, -0.0909271240234375, -0.07891082763671875, -0.06689453125, -0.05487823486328125, -0.0428619384765625, -0.03084564208984375, -0.018829345703125, -0.00681304931640625, 0.0052032470703125, 0.01721954345703125, 0.02923583984375, 0.04125213623046875, 0.0532684326171875, 0.06528472900390625, 0.077301025390625, 0.08931732177734375, 0.1013336181640625, 0.11334991455078125, 0.1253662109375, 0.13738250732421875, 0.1493988037109375, 0.16141510009765625, 0.173431396484375, 0.18544769287109375, 0.1974639892578125, 0.20948028564453125, 0.22149658203125, 0.23351287841796875, 0.2455291748046875, 0.25754547119140625, 0.269561767578125, 0.28157806396484375, 0.2935943603515625, 0.30561065673828125, 0.317626953125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 14.0, 21.0, 51.0, 129.0, 266.0, 294.0, 144.0, 48.0, 20.0, 9.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.544559001922607, -5.323216438293457, -5.101874351501465, -4.8805317878723145, -4.659189224243164, -4.437847137451172, -4.2165045738220215, -3.995162010192871, -3.7738196849823, -3.5524773597717285, -3.331134796142578, -3.109792470932007, -2.8884501457214355, -2.667107582092285, -2.445765256881714, -2.2244229316711426, -2.003080368041992, -1.7817379236221313, -1.5603954792022705, -1.3390531539916992, -1.1177107095718384, -0.8963682651519775, -0.6750259399414062, -0.4536834955215454, -0.23234105110168457, -0.010998636484146118, 0.21034377813339233, 0.4316861629486084, 0.6530286073684692, 0.8743710517883301, 1.0957133769989014, 1.3170558214187622, 1.5383987426757812, 1.759741187095642, 1.981083631515503, 2.202425956726074, 2.4237685203552246, 2.645110845565796, 2.866453170776367, 3.0877957344055176, 3.309138059616089, 3.53048038482666, 3.7518229484558105, 3.973165273666382, 4.194507598876953, 4.4158501625061035, 4.637192726135254, 4.858534812927246, 5.0798773765563965, 5.301219940185547, 5.522562026977539, 5.7439045906066895, 5.96524715423584, 6.186589241027832, 6.407931804656982, 6.629274368286133, 6.850616455078125, 7.071959018707275, 7.293301105499268, 7.514643669128418, 7.735986232757568, 7.957328796386719, 8.178670883178711, 8.400012969970703, 8.621356010437012]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 4.0, 9.0, 10.0, 14.0, 12.0, 18.0, 18.0, 19.0, 20.0, 20.0, 26.0, 34.0, 35.0, 33.0, 46.0, 32.0, 42.0, 53.0, 38.0, 42.0, 34.0, 32.0, 38.0, 34.0, 47.0, 27.0, 25.0, 32.0, 34.0, 20.0, 20.0, 25.0, 12.0, 20.0, 14.0, 18.0, 8.0, 7.0, 5.0, 4.0, 7.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2888944149017334, -1.2482882738113403, -1.2076821327209473, -1.1670759916305542, -1.1264698505401611, -1.0858638286590576, -1.0452576875686646, -1.0046515464782715, -0.9640454053878784, -0.9234392642974854, -0.8828331232070923, -0.842227041721344, -0.8016209006309509, -0.7610147595405579, -0.7204086780548096, -0.6798025369644165, -0.6391963958740234, -0.5985902547836304, -0.5579841136932373, -0.517378032207489, -0.47677189111709595, -0.4361657500267029, -0.3955596387386322, -0.3549535274505615, -0.31434738636016846, -0.2737412452697754, -0.2331351339817047, -0.19252900779247284, -0.15192288160324097, -0.1113167554140091, -0.07071062922477722, -0.030104517936706543, 0.010501503944396973, 0.051107630133628845, 0.09171375632286072, 0.1323198825120926, 0.17292600870132446, 0.21353213489055634, 0.2541382610797882, 0.2947443723678589, 0.33535051345825195, 0.375956654548645, 0.4165627658367157, 0.4571688771247864, 0.49777501821517944, 0.5383811593055725, 0.5789872407913208, 0.6195933818817139, 0.6601995229721069, 0.7008056640625, 0.7414118051528931, 0.7820178866386414, 0.8226240277290344, 0.8632301688194275, 0.9038362503051758, 0.9444423913955688, 0.9850485324859619, 1.025654673576355, 1.066260814666748, 1.1068669557571411, 1.1474730968475342, 1.1880791187286377, 1.2286852598190308, 1.2692914009094238, 1.309897541999817]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 6.0, 17.0, 25.0, 57.0, 103.0, 257.0, 672.0, 2300.0, 10928.0, 93677.0, 3866715.0, 200723.0, 14368.0, 2898.0, 855.0, 320.0, 123.0, 86.0, 56.0, 37.0, 16.0, 15.0, 7.0, 5.0, 10.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84912109375, -0.8115463256835938, -0.7739715576171875, -0.7363967895507812, -0.698822021484375, -0.6612472534179688, -0.6236724853515625, -0.5860977172851562, -0.54852294921875, -0.5109481811523438, -0.4733734130859375, -0.43579864501953125, -0.398223876953125, -0.36064910888671875, -0.3230743408203125, -0.28549957275390625, -0.2479248046875, -0.21035003662109375, -0.1727752685546875, -0.13520050048828125, -0.097625732421875, -0.06005096435546875, -0.0224761962890625, 0.01509857177734375, 0.05267333984375, 0.09024810791015625, 0.1278228759765625, 0.16539764404296875, 0.202972412109375, 0.24054718017578125, 0.2781219482421875, 0.31569671630859375, 0.353271484375, 0.39084625244140625, 0.4284210205078125, 0.46599578857421875, 0.503570556640625, 0.5411453247070312, 0.5787200927734375, 0.6162948608398438, 0.65386962890625, 0.6914443969726562, 0.7290191650390625, 0.7665939331054688, 0.804168701171875, 0.8417434692382812, 0.8793182373046875, 0.9168930053710938, 0.9544677734375, 0.9920425415039062, 1.0296173095703125, 1.0671920776367188, 1.104766845703125, 1.1423416137695312, 1.1799163818359375, 1.2174911499023438, 1.25506591796875, 1.2926406860351562, 1.3302154541015625, 1.3677902221679688, 1.405364990234375, 1.4429397583007812, 1.4805145263671875, 1.5180892944335938, 1.5556640625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 9.0, 13.0, 17.0, 10.0, 29.0, 41.0, 44.0, 68.0, 57.0, 71.0, 63.0, 79.0, 67.0, 76.0, 58.0, 54.0, 49.0, 40.0, 38.0, 32.0, 23.0, 19.0, 12.0, 9.0, 9.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2100830078125, -0.20171165466308594, -0.19334030151367188, -0.1849689483642578, -0.17659759521484375, -0.1682262420654297, -0.15985488891601562, -0.15148353576660156, -0.1431121826171875, -0.13474082946777344, -0.12636947631835938, -0.11799812316894531, -0.10962677001953125, -0.10125541687011719, -0.09288406372070312, -0.08451271057128906, -0.076141357421875, -0.06777000427246094, -0.059398651123046875, -0.05102729797363281, -0.04265594482421875, -0.03428459167480469, -0.025913238525390625, -0.017541885375976562, -0.0091705322265625, -0.0007991790771484375, 0.007572174072265625, 0.015943527221679688, 0.02431488037109375, 0.03268623352050781, 0.041057586669921875, 0.04942893981933594, 0.05780029296875, 0.06617164611816406, 0.07454299926757812, 0.08291435241699219, 0.09128570556640625, 0.09965705871582031, 0.10802841186523438, 0.11639976501464844, 0.1247711181640625, 0.13314247131347656, 0.14151382446289062, 0.1498851776123047, 0.15825653076171875, 0.1666278839111328, 0.17499923706054688, 0.18337059020996094, 0.191741943359375, 0.20011329650878906, 0.20848464965820312, 0.2168560028076172, 0.22522735595703125, 0.2335987091064453, 0.24197006225585938, 0.25034141540527344, 0.2587127685546875, 0.26708412170410156, 0.2754554748535156, 0.2838268280029297, 0.29219818115234375, 0.3005695343017578, 0.3089408874511719, 0.31731224060058594, 0.32568359375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 10.0, 16.0, 16.0, 19.0, 34.0, 33.0, 69.0, 75.0, 115.0, 202.0, 319.0, 496.0, 812.0, 1336.0, 2515.0, 4744.0, 10317.0, 24701.0, 79791.0, 619051.0, 3181482.0, 193081.0, 43865.0, 15959.0, 7168.0, 3425.0, 1817.0, 1071.0, 625.0, 398.0, 222.0, 153.0, 102.0, 79.0, 48.0, 32.0, 24.0, 24.0, 12.0, 10.0, 5.0, 1.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6396484375, -0.6185150146484375, -0.597381591796875, -0.5762481689453125, -0.55511474609375, -0.5339813232421875, -0.512847900390625, -0.4917144775390625, -0.4705810546875, -0.4494476318359375, -0.428314208984375, -0.4071807861328125, -0.38604736328125, -0.3649139404296875, -0.343780517578125, -0.3226470947265625, -0.301513671875, -0.2803802490234375, -0.259246826171875, -0.2381134033203125, -0.21697998046875, -0.1958465576171875, -0.174713134765625, -0.1535797119140625, -0.1324462890625, -0.1113128662109375, -0.090179443359375, -0.0690460205078125, -0.04791259765625, -0.0267791748046875, -0.005645751953125, 0.0154876708984375, 0.03662109375, 0.0577545166015625, 0.078887939453125, 0.1000213623046875, 0.12115478515625, 0.1422882080078125, 0.163421630859375, 0.1845550537109375, 0.2056884765625, 0.2268218994140625, 0.247955322265625, 0.2690887451171875, 0.29022216796875, 0.3113555908203125, 0.332489013671875, 0.3536224365234375, 0.374755859375, 0.3958892822265625, 0.417022705078125, 0.4381561279296875, 0.45928955078125, 0.4804229736328125, 0.501556396484375, 0.5226898193359375, 0.5438232421875, 0.5649566650390625, 0.586090087890625, 0.6072235107421875, 0.62835693359375, 0.6494903564453125, 0.670623779296875, 0.6917572021484375, 0.712890625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 0.0, 6.0, 3.0, 14.0, 16.0, 22.0, 25.0, 24.0, 36.0, 70.0, 129.0, 226.0, 519.0, 1280.0, 932.0, 342.0, 147.0, 83.0, 59.0, 43.0, 22.0, 23.0, 15.0, 11.0, 6.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7138671875, -0.6899032592773438, -0.6659393310546875, -0.6419754028320312, -0.618011474609375, -0.5940475463867188, -0.5700836181640625, -0.5461196899414062, -0.52215576171875, -0.49819183349609375, -0.4742279052734375, -0.45026397705078125, -0.426300048828125, -0.40233612060546875, -0.3783721923828125, -0.35440826416015625, -0.3304443359375, -0.30648040771484375, -0.2825164794921875, -0.25855255126953125, -0.234588623046875, -0.21062469482421875, -0.1866607666015625, -0.16269683837890625, -0.13873291015625, -0.11476898193359375, -0.0908050537109375, -0.06684112548828125, -0.042877197265625, -0.01891326904296875, 0.0050506591796875, 0.02901458740234375, 0.052978515625, 0.07694244384765625, 0.1009063720703125, 0.12487030029296875, 0.148834228515625, 0.17279815673828125, 0.1967620849609375, 0.22072601318359375, 0.24468994140625, 0.26865386962890625, 0.2926177978515625, 0.31658172607421875, 0.340545654296875, 0.36450958251953125, 0.3884735107421875, 0.41243743896484375, 0.4364013671875, 0.46036529541015625, 0.4843292236328125, 0.5082931518554688, 0.532257080078125, 0.5562210083007812, 0.5801849365234375, 0.6041488647460938, 0.62811279296875, 0.6520767211914062, 0.6760406494140625, 0.7000045776367188, 0.723968505859375, 0.7479324340820312, 0.7718963623046875, 0.7958602905273438, 0.81982421875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 6.0, 13.0, 32.0, 30.0, 72.0, 121.0, 199.0, 223.0, 129.0, 68.0, 49.0, 18.0, 11.0, 7.0, 8.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.123235702514648, -3.9775922298431396, -3.83194899559021, -3.686305522918701, -3.5406622886657715, -3.3950188159942627, -3.249375343322754, -3.103732109069824, -2.9580888748168945, -2.8124454021453857, -2.666802167892456, -2.5211586952209473, -2.3755154609680176, -2.229871988296509, -2.084228515625, -1.9385852813720703, -1.7929418087005615, -1.6472984552383423, -1.501655101776123, -1.3560116291046143, -1.2103683948516846, -1.0647249221801758, -0.9190815687179565, -0.7734382152557373, -0.6277948617935181, -0.48215150833129883, -0.3365081250667572, -0.19086474180221558, -0.04522138833999634, 0.1004219651222229, 0.24606537818908691, 0.39170873165130615, 0.5373520851135254, 0.6829954385757446, 0.8286387920379639, 0.9742822051048279, 1.1199254989624023, 1.2655689716339111, 1.4112123250961304, 1.5568556785583496, 1.7024990320205688, 1.848142385482788, 1.9937857389450073, 2.1394290924072266, 2.2850725650787354, 2.430715799331665, 2.576359272003174, 2.7220025062561035, 2.8676459789276123, 3.013289451599121, 3.158932685852051, 3.3045761585235596, 3.4502193927764893, 3.595862865447998, 3.7415060997009277, 3.8871495723724365, 4.032793045043945, 4.178436279296875, 4.324079990386963, 4.469723224639893, 4.615366458892822, 4.761009693145752, 4.90665340423584, 5.0522966384887695, 5.197939872741699]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 4.0, 4.0, 4.0, 9.0, 9.0, 12.0, 14.0, 17.0, 17.0, 22.0, 20.0, 28.0, 21.0, 34.0, 29.0, 33.0, 39.0, 33.0, 27.0, 30.0, 46.0, 36.0, 33.0, 42.0, 37.0, 39.0, 39.0, 27.0, 28.0, 32.0, 31.0, 26.0, 24.0, 27.0, 16.0, 22.0, 17.0, 11.0, 11.0, 12.0, 8.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0], "bins": [-1.5099338293075562, -1.465242624282837, -1.4205515384674072, -1.375860333442688, -1.3311691284179688, -1.2864779233932495, -1.2417867183685303, -1.1970956325531006, -1.1524044275283813, -1.107713222503662, -1.0630221366882324, -1.0183309316635132, -0.973639726638794, -0.9289485216140747, -0.8842573761940002, -0.8395662307739258, -0.7948750257492065, -0.7501838207244873, -0.7054926753044128, -0.6608015298843384, -0.6161103248596191, -0.5714191198348999, -0.5267279744148254, -0.4820367991924286, -0.43734562397003174, -0.3926544487476349, -0.34796327352523804, -0.3032720983028412, -0.25858092308044434, -0.21388974785804749, -0.16919857263565063, -0.12450739741325378, -0.07981610298156738, -0.03512492775917053, 0.009566247463226318, 0.05425742268562317, 0.09894859790802002, 0.14363977313041687, 0.18833094835281372, 0.23302212357521057, 0.2777132987976074, 0.3224044740200043, 0.3670956492424011, 0.411786824464798, 0.4564779996871948, 0.5011692047119141, 0.5458603501319885, 0.590551495552063, 0.6352427005767822, 0.6799339056015015, 0.7246250510215759, 0.7693161964416504, 0.8140074014663696, 0.8586986064910889, 0.9033897519111633, 0.9480808973312378, 0.992772102355957, 1.0374633073806763, 1.0821545124053955, 1.1268455982208252, 1.1715368032455444, 1.2162280082702637, 1.2609190940856934, 1.3056102991104126, 1.3503015041351318]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 2.0, 8.0, 20.0, 15.0, 28.0, 49.0, 75.0, 131.0, 287.0, 847.0, 2507.0, 9102.0, 38694.0, 252301.0, 628015.0, 91281.0, 18182.0, 4740.0, 1348.0, 474.0, 181.0, 85.0, 57.0, 43.0, 26.0, 20.0, 12.0, 11.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.078125, -1.0317535400390625, -0.985382080078125, -0.9390106201171875, -0.89263916015625, -0.8462677001953125, -0.799896240234375, -0.7535247802734375, -0.7071533203125, -0.6607818603515625, -0.614410400390625, -0.5680389404296875, -0.52166748046875, -0.4752960205078125, -0.428924560546875, -0.3825531005859375, -0.336181640625, -0.2898101806640625, -0.243438720703125, -0.1970672607421875, -0.15069580078125, -0.1043243408203125, -0.057952880859375, -0.0115814208984375, 0.0347900390625, 0.0811614990234375, 0.127532958984375, 0.1739044189453125, 0.22027587890625, 0.2666473388671875, 0.313018798828125, 0.3593902587890625, 0.40576171875, 0.4521331787109375, 0.498504638671875, 0.5448760986328125, 0.59124755859375, 0.6376190185546875, 0.683990478515625, 0.7303619384765625, 0.7767333984375, 0.8231048583984375, 0.869476318359375, 0.9158477783203125, 0.96221923828125, 1.0085906982421875, 1.054962158203125, 1.1013336181640625, 1.147705078125, 1.1940765380859375, 1.240447998046875, 1.2868194580078125, 1.33319091796875, 1.3795623779296875, 1.425933837890625, 1.4723052978515625, 1.5186767578125, 1.5650482177734375, 1.611419677734375, 1.6577911376953125, 1.70416259765625, 1.7505340576171875, 1.796905517578125, 1.8432769775390625, 1.8896484375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 4.0, 11.0, 10.0, 13.0, 30.0, 22.0, 33.0, 34.0, 40.0, 45.0, 64.0, 72.0, 66.0, 58.0, 66.0, 53.0, 75.0, 54.0, 40.0, 41.0, 37.0, 32.0, 25.0, 17.0, 19.0, 10.0, 10.0, 5.0, 10.0, 2.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18310546875, -0.17441558837890625, -0.1657257080078125, -0.15703582763671875, -0.148345947265625, -0.13965606689453125, -0.1309661865234375, -0.12227630615234375, -0.11358642578125, -0.10489654541015625, -0.0962066650390625, -0.08751678466796875, -0.078826904296875, -0.07013702392578125, -0.0614471435546875, -0.05275726318359375, -0.0440673828125, -0.03537750244140625, -0.0266876220703125, -0.01799774169921875, -0.009307861328125, -0.00061798095703125, 0.0080718994140625, 0.01676177978515625, 0.02545166015625, 0.03414154052734375, 0.0428314208984375, 0.05152130126953125, 0.060211181640625, 0.06890106201171875, 0.0775909423828125, 0.08628082275390625, 0.094970703125, 0.10366058349609375, 0.1123504638671875, 0.12104034423828125, 0.129730224609375, 0.13842010498046875, 0.1471099853515625, 0.15579986572265625, 0.16448974609375, 0.17317962646484375, 0.1818695068359375, 0.19055938720703125, 0.199249267578125, 0.20793914794921875, 0.2166290283203125, 0.22531890869140625, 0.2340087890625, 0.24269866943359375, 0.2513885498046875, 0.26007843017578125, 0.268768310546875, 0.27745819091796875, 0.2861480712890625, 0.29483795166015625, 0.30352783203125, 0.31221771240234375, 0.3209075927734375, 0.32959747314453125, 0.338287353515625, 0.34697723388671875, 0.3556671142578125, 0.36435699462890625, 0.373046875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 6.0, 6.0, 9.0, 10.0, 12.0, 21.0, 26.0, 46.0, 85.0, 123.0, 235.0, 434.0, 1063.0, 2621.0, 7778.0, 28328.0, 143932.0, 685746.0, 138277.0, 27423.0, 7680.0, 2660.0, 1012.0, 459.0, 255.0, 113.0, 61.0, 33.0, 24.0, 30.0, 8.0, 7.0, 12.0, 3.0, 3.0, 3.0, 0.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.7841796875, -1.7365875244140625, -1.688995361328125, -1.6414031982421875, -1.59381103515625, -1.5462188720703125, -1.498626708984375, -1.4510345458984375, -1.4034423828125, -1.3558502197265625, -1.308258056640625, -1.2606658935546875, -1.21307373046875, -1.1654815673828125, -1.117889404296875, -1.0702972412109375, -1.022705078125, -0.9751129150390625, -0.927520751953125, -0.8799285888671875, -0.83233642578125, -0.7847442626953125, -0.737152099609375, -0.6895599365234375, -0.6419677734375, -0.5943756103515625, -0.546783447265625, -0.4991912841796875, -0.45159912109375, -0.4040069580078125, -0.356414794921875, -0.3088226318359375, -0.26123046875, -0.2136383056640625, -0.166046142578125, -0.1184539794921875, -0.07086181640625, -0.0232696533203125, 0.024322509765625, 0.0719146728515625, 0.1195068359375, 0.1670989990234375, 0.214691162109375, 0.2622833251953125, 0.30987548828125, 0.3574676513671875, 0.405059814453125, 0.4526519775390625, 0.500244140625, 0.5478363037109375, 0.595428466796875, 0.6430206298828125, 0.69061279296875, 0.7382049560546875, 0.785797119140625, 0.8333892822265625, 0.8809814453125, 0.9285736083984375, 0.976165771484375, 1.0237579345703125, 1.07135009765625, 1.1189422607421875, 1.166534423828125, 1.2141265869140625, 1.26171875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 8.0, 4.0, 4.0, 5.0, 7.0, 15.0, 17.0, 26.0, 31.0, 40.0, 35.0, 52.0, 47.0, 59.0, 66.0, 61.0, 87.0, 74.0, 73.0, 50.0, 49.0, 37.0, 33.0, 30.0, 20.0, 15.0, 13.0, 12.0, 10.0, 4.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7939453125, -0.76544189453125, -0.7369384765625, -0.70843505859375, -0.679931640625, -0.65142822265625, -0.6229248046875, -0.59442138671875, -0.56591796875, -0.53741455078125, -0.5089111328125, -0.48040771484375, -0.451904296875, -0.42340087890625, -0.3948974609375, -0.36639404296875, -0.337890625, -0.30938720703125, -0.2808837890625, -0.25238037109375, -0.223876953125, -0.19537353515625, -0.1668701171875, -0.13836669921875, -0.10986328125, -0.08135986328125, -0.0528564453125, -0.02435302734375, 0.004150390625, 0.03265380859375, 0.0611572265625, 0.08966064453125, 0.1181640625, 0.14666748046875, 0.1751708984375, 0.20367431640625, 0.232177734375, 0.26068115234375, 0.2891845703125, 0.31768798828125, 0.34619140625, 0.37469482421875, 0.4031982421875, 0.43170166015625, 0.460205078125, 0.48870849609375, 0.5172119140625, 0.54571533203125, 0.57421875, 0.60272216796875, 0.6312255859375, 0.65972900390625, 0.688232421875, 0.71673583984375, 0.7452392578125, 0.77374267578125, 0.80224609375, 0.83074951171875, 0.8592529296875, 0.88775634765625, 0.916259765625, 0.94476318359375, 0.9732666015625, 1.00177001953125, 1.0302734375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 4.0, 8.0, 7.0, 10.0, 19.0, 32.0, 33.0, 56.0, 114.0, 155.0, 272.0, 413.0, 762.0, 1255.0, 2521.0, 5467.0, 15750.0, 126349.0, 837147.0, 40521.0, 9434.0, 3904.0, 1882.0, 972.0, 567.0, 315.0, 186.0, 120.0, 90.0, 62.0, 37.0, 26.0, 18.0, 11.0, 7.0, 9.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94287109375, -0.9117355346679688, -0.8805999755859375, -0.8494644165039062, -0.818328857421875, -0.7871932983398438, -0.7560577392578125, -0.7249221801757812, -0.69378662109375, -0.6626510620117188, -0.6315155029296875, -0.6003799438476562, -0.569244384765625, -0.5381088256835938, -0.5069732666015625, -0.47583770751953125, -0.4447021484375, -0.41356658935546875, -0.3824310302734375, -0.35129547119140625, -0.320159912109375, -0.28902435302734375, -0.2578887939453125, -0.22675323486328125, -0.19561767578125, -0.16448211669921875, -0.1333465576171875, -0.10221099853515625, -0.071075439453125, -0.03993988037109375, -0.0088043212890625, 0.02233123779296875, 0.053466796875, 0.08460235595703125, 0.1157379150390625, 0.14687347412109375, 0.178009033203125, 0.20914459228515625, 0.2402801513671875, 0.27141571044921875, 0.30255126953125, 0.33368682861328125, 0.3648223876953125, 0.39595794677734375, 0.427093505859375, 0.45822906494140625, 0.4893646240234375, 0.5205001831054688, 0.5516357421875, 0.5827713012695312, 0.6139068603515625, 0.6450424194335938, 0.676177978515625, 0.7073135375976562, 0.7384490966796875, 0.7695846557617188, 0.80072021484375, 0.8318557739257812, 0.8629913330078125, 0.8941268920898438, 0.925262451171875, 0.9563980102539062, 0.9875335693359375, 1.0186691284179688, 1.0498046875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 8.0, 13.0, 10.0, 16.0, 40.0, 67.0, 116.0, 369.0, 178.0, 63.0, 38.0, 19.0, 16.0, 7.0, 8.0, 4.0, 3.0, 3.0, 2.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00019943714141845703, -0.0001942794770002365, -0.000189121812582016, -0.00018396414816379547, -0.00017880648374557495, -0.00017364881932735443, -0.0001684911549091339, -0.0001633334904909134, -0.00015817582607269287, -0.00015301816165447235, -0.00014786049723625183, -0.0001427028328180313, -0.0001375451683998108, -0.00013238750398159027, -0.00012722983956336975, -0.00012207217514514923, -0.00011691451072692871, -0.00011175684630870819, -0.00010659918189048767, -0.00010144151747226715, -9.628385305404663e-05, -9.112618863582611e-05, -8.596852421760559e-05, -8.081085979938507e-05, -7.565319538116455e-05, -7.049553096294403e-05, -6.533786654472351e-05, -6.018020212650299e-05, -5.502253770828247e-05, -4.986487329006195e-05, -4.470720887184143e-05, -3.954954445362091e-05, -3.439188003540039e-05, -2.923421561717987e-05, -2.407655119895935e-05, -1.891888678073883e-05, -1.376122236251831e-05, -8.60355794429779e-06, -3.4458935260772705e-06, 1.7117708921432495e-06, 6.8694353103637695e-06, 1.202709972858429e-05, 1.718476414680481e-05, 2.234242856502533e-05, 2.750009298324585e-05, 3.265775740146637e-05, 3.781542181968689e-05, 4.297308623790741e-05, 4.813075065612793e-05, 5.328841507434845e-05, 5.844607949256897e-05, 6.360374391078949e-05, 6.876140832901001e-05, 7.391907274723053e-05, 7.907673716545105e-05, 8.423440158367157e-05, 8.939206600189209e-05, 9.454973042011261e-05, 9.970739483833313e-05, 0.00010486505925655365, 0.00011002272367477417, 0.00011518038809299469, 0.00012033805251121521, 0.00012549571692943573, 0.00013065338134765625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 5.0, 5.0, 8.0, 17.0, 16.0, 22.0, 45.0, 81.0, 156.0, 342.0, 772.0, 2180.0, 8011.0, 95359.0, 918172.0, 17359.0, 3734.0, 1222.0, 522.0, 230.0, 137.0, 68.0, 31.0, 16.0, 19.0, 7.0, 7.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9609375, -1.89813232421875, -1.8353271484375, -1.77252197265625, -1.709716796875, -1.64691162109375, -1.5841064453125, -1.52130126953125, -1.45849609375, -1.39569091796875, -1.3328857421875, -1.27008056640625, -1.207275390625, -1.14447021484375, -1.0816650390625, -1.01885986328125, -0.9560546875, -0.89324951171875, -0.8304443359375, -0.76763916015625, -0.704833984375, -0.64202880859375, -0.5792236328125, -0.51641845703125, -0.45361328125, -0.39080810546875, -0.3280029296875, -0.26519775390625, -0.202392578125, -0.13958740234375, -0.0767822265625, -0.01397705078125, 0.048828125, 0.11163330078125, 0.1744384765625, 0.23724365234375, 0.300048828125, 0.36285400390625, 0.4256591796875, 0.48846435546875, 0.55126953125, 0.61407470703125, 0.6768798828125, 0.73968505859375, 0.802490234375, 0.86529541015625, 0.9281005859375, 0.99090576171875, 1.0537109375, 1.11651611328125, 1.1793212890625, 1.24212646484375, 1.304931640625, 1.36773681640625, 1.4305419921875, 1.49334716796875, 1.55615234375, 1.61895751953125, 1.6817626953125, 1.74456787109375, 1.807373046875, 1.87017822265625, 1.9329833984375, 1.99578857421875, 2.05859375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 5.0, 9.0, 8.0, 14.0, 28.0, 43.0, 107.0, 261.0, 285.0, 95.0, 58.0, 27.0, 15.0, 8.0, 7.0, 9.0, 1.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.96923828125, -0.93994140625, -0.91064453125, -0.88134765625, -0.85205078125, -0.82275390625, -0.79345703125, -0.76416015625, -0.73486328125, -0.70556640625, -0.67626953125, -0.64697265625, -0.61767578125, -0.58837890625, -0.55908203125, -0.52978515625, -0.50048828125, -0.47119140625, -0.44189453125, -0.41259765625, -0.38330078125, -0.35400390625, -0.32470703125, -0.29541015625, -0.26611328125, -0.23681640625, -0.20751953125, -0.17822265625, -0.14892578125, -0.11962890625, -0.09033203125, -0.06103515625, -0.03173828125, -0.00244140625, 0.02685546875, 0.05615234375, 0.08544921875, 0.11474609375, 0.14404296875, 0.17333984375, 0.20263671875, 0.23193359375, 0.26123046875, 0.29052734375, 0.31982421875, 0.34912109375, 0.37841796875, 0.40771484375, 0.43701171875, 0.46630859375, 0.49560546875, 0.52490234375, 0.55419921875, 0.58349609375, 0.61279296875, 0.64208984375, 0.67138671875, 0.70068359375, 0.72998046875, 0.75927734375, 0.78857421875, 0.81787109375, 0.84716796875, 0.87646484375, 0.90576171875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 8.0, 8.0, 23.0, 61.0, 184.0, 303.0, 254.0, 95.0, 35.0, 16.0, 8.0, 4.0, 1.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.263287544250488, -8.952272415161133, -8.641256332397461, -8.330241203308105, -8.019225120544434, -7.708209991455078, -7.3971943855285645, -7.086178779602051, -6.775163650512695, -6.464148044586182, -6.153132438659668, -5.8421173095703125, -5.531101703643799, -5.220086097717285, -4.9090704917907715, -4.598054885864258, -4.287039279937744, -3.9760236740112305, -3.665008306503296, -3.3539927005767822, -3.0429773330688477, -2.731961727142334, -2.4209461212158203, -2.1099307537078857, -1.798915147781372, -1.487899661064148, -1.1768841743469238, -0.8658685684204102, -0.554853081703186, -0.24383759498596191, 0.06717801094055176, 0.37819337844848633, 0.689208984375, 1.0002244710922241, 1.3112399578094482, 1.622255563735962, 1.933271050453186, 2.24428653717041, 2.555302143096924, 2.8663175106048584, 3.177333116531372, 3.4883487224578857, 3.7993640899658203, 4.110379695892334, 4.421395301818848, 4.732410430908203, 5.043426513671875, 5.3544416427612305, 5.665457248687744, 5.976472854614258, 6.2874884605407715, 6.598504066467285, 6.909519195556641, 7.220534801483154, 7.531550407409668, 7.842565536499023, 8.153581619262695, 8.46459674835205, 8.775612831115723, 9.086627960205078, 9.39764404296875, 9.708659172058105, 10.019674301147461, 10.330690383911133, 10.641705513000488]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 6.0, 5.0, 2.0, 7.0, 17.0, 11.0, 15.0, 13.0, 25.0, 28.0, 39.0, 32.0, 35.0, 33.0, 43.0, 46.0, 59.0, 52.0, 38.0, 51.0, 46.0, 50.0, 40.0, 43.0, 36.0, 35.0, 36.0, 30.0, 22.0, 23.0, 17.0, 11.0, 12.0, 15.0, 5.0, 5.0, 9.0, 4.0, 2.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.738277554512024, -1.6682192087173462, -1.598160743713379, -1.5281023979187012, -1.4580440521240234, -1.3879857063293457, -1.3179272413253784, -1.2478688955307007, -1.1778104305267334, -1.1077520847320557, -1.0376936197280884, -0.9676352739334106, -0.8975769281387329, -0.8275185227394104, -0.7574601173400879, -0.6874017715454102, -0.6173434257507324, -0.5472850203514099, -0.4772266745567322, -0.40716826915740967, -0.33710989356040955, -0.2670515179634094, -0.19699311256408691, -0.1269347369670868, -0.05687636137008667, 0.013182021677494049, 0.08324040472507477, 0.15329879522323608, 0.2233571708202362, 0.29341554641723633, 0.36347395181655884, 0.43353232741355896, 0.5035908222198486, 0.5736492276191711, 0.6437075734138489, 0.7137659788131714, 0.7838243246078491, 0.8538827300071716, 0.9239411354064941, 0.9939994812011719, 1.0640578269958496, 1.1341161727905273, 1.2041746377944946, 1.2742329835891724, 1.34429132938385, 1.4143497943878174, 1.4844081401824951, 1.5544664859771729, 1.6245249509811401, 1.6945832967758179, 1.7646417617797852, 1.834700107574463, 1.9047584533691406, 1.9748167991638184, 2.044875144958496, 2.114933729171753, 2.1849920749664307, 2.2550504207611084, 2.325108766555786, 2.395167350769043, 2.4652256965637207, 2.5352840423583984, 2.605342388153076, 2.675400733947754, 2.7454590797424316]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 10.0, 16.0, 42.0, 50.0, 110.0, 206.0, 486.0, 1355.0, 4161.0, 19192.0, 392933.0, 3698173.0, 64959.0, 8693.0, 2363.0, 813.0, 318.0, 169.0, 104.0, 40.0, 26.0, 13.0, 19.0, 10.0, 5.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94970703125, -0.9070816040039062, -0.8644561767578125, -0.8218307495117188, -0.779205322265625, -0.7365798950195312, -0.6939544677734375, -0.6513290405273438, -0.60870361328125, -0.5660781860351562, -0.5234527587890625, -0.48082733154296875, -0.438201904296875, -0.39557647705078125, -0.3529510498046875, -0.31032562255859375, -0.2677001953125, -0.22507476806640625, -0.1824493408203125, -0.13982391357421875, -0.097198486328125, -0.05457305908203125, -0.0119476318359375, 0.03067779541015625, 0.07330322265625, 0.11592864990234375, 0.1585540771484375, 0.20117950439453125, 0.243804931640625, 0.28643035888671875, 0.3290557861328125, 0.37168121337890625, 0.414306640625, 0.45693206787109375, 0.4995574951171875, 0.5421829223632812, 0.584808349609375, 0.6274337768554688, 0.6700592041015625, 0.7126846313476562, 0.75531005859375, 0.7979354858398438, 0.8405609130859375, 0.8831863403320312, 0.925811767578125, 0.9684371948242188, 1.0110626220703125, 1.0536880493164062, 1.0963134765625, 1.1389389038085938, 1.1815643310546875, 1.2241897583007812, 1.266815185546875, 1.3094406127929688, 1.3520660400390625, 1.3946914672851562, 1.43731689453125, 1.4799423217773438, 1.5225677490234375, 1.5651931762695312, 1.607818603515625, 1.6504440307617188, 1.6930694580078125, 1.7356948852539062, 1.7783203125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 9.0, 7.0, 6.0, 13.0, 16.0, 19.0, 32.0, 19.0, 26.0, 18.0, 37.0, 37.0, 60.0, 48.0, 48.0, 51.0, 48.0, 65.0, 56.0, 44.0, 53.0, 43.0, 46.0, 29.0, 39.0, 30.0, 20.0, 25.0, 12.0, 15.0, 8.0, 5.0, 4.0, 7.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.183837890625, -0.17615127563476562, -0.16846466064453125, -0.16077804565429688, -0.1530914306640625, -0.14540481567382812, -0.13771820068359375, -0.13003158569335938, -0.122344970703125, -0.11465835571289062, -0.10697174072265625, -0.09928512573242188, -0.0915985107421875, -0.08391189575195312, -0.07622528076171875, -0.06853866577148438, -0.06085205078125, -0.053165435791015625, -0.04547882080078125, -0.037792205810546875, -0.0301055908203125, -0.022418975830078125, -0.01473236083984375, -0.007045745849609375, 0.000640869140625, 0.008327484130859375, 0.01601409912109375, 0.023700714111328125, 0.0313873291015625, 0.039073944091796875, 0.04676055908203125, 0.054447174072265625, 0.0621337890625, 0.06982040405273438, 0.07750701904296875, 0.08519363403320312, 0.0928802490234375, 0.10056686401367188, 0.10825347900390625, 0.11594009399414062, 0.123626708984375, 0.13131332397460938, 0.13899993896484375, 0.14668655395507812, 0.1543731689453125, 0.16205978393554688, 0.16974639892578125, 0.17743301391601562, 0.18511962890625, 0.19280624389648438, 0.20049285888671875, 0.20817947387695312, 0.2158660888671875, 0.22355270385742188, 0.23123931884765625, 0.23892593383789062, 0.246612548828125, 0.2542991638183594, 0.26198577880859375, 0.2696723937988281, 0.2773590087890625, 0.2850456237792969, 0.29273223876953125, 0.3004188537597656, 0.30810546875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 7.0, 9.0, 16.0, 7.0, 14.0, 26.0, 19.0, 42.0, 54.0, 89.0, 134.0, 169.0, 276.0, 470.0, 822.0, 1596.0, 3503.0, 8379.0, 26190.0, 135344.0, 3401878.0, 536264.0, 53679.0, 14607.0, 5414.0, 2395.0, 1204.0, 644.0, 357.0, 222.0, 137.0, 81.0, 65.0, 55.0, 35.0, 31.0, 11.0, 14.0, 6.0, 7.0, 3.0, 4.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9365234375, -0.9039459228515625, -0.871368408203125, -0.8387908935546875, -0.80621337890625, -0.7736358642578125, -0.741058349609375, -0.7084808349609375, -0.6759033203125, -0.6433258056640625, -0.610748291015625, -0.5781707763671875, -0.54559326171875, -0.5130157470703125, -0.480438232421875, -0.4478607177734375, -0.415283203125, -0.3827056884765625, -0.350128173828125, -0.3175506591796875, -0.28497314453125, -0.2523956298828125, -0.219818115234375, -0.1872406005859375, -0.1546630859375, -0.1220855712890625, -0.089508056640625, -0.0569305419921875, -0.02435302734375, 0.0082244873046875, 0.040802001953125, 0.0733795166015625, 0.10595703125, 0.1385345458984375, 0.171112060546875, 0.2036895751953125, 0.23626708984375, 0.2688446044921875, 0.301422119140625, 0.3339996337890625, 0.3665771484375, 0.3991546630859375, 0.431732177734375, 0.4643096923828125, 0.49688720703125, 0.5294647216796875, 0.562042236328125, 0.5946197509765625, 0.627197265625, 0.6597747802734375, 0.692352294921875, 0.7249298095703125, 0.75750732421875, 0.7900848388671875, 0.822662353515625, 0.8552398681640625, 0.8878173828125, 0.9203948974609375, 0.952972412109375, 0.9855499267578125, 1.01812744140625, 1.0507049560546875, 1.083282470703125, 1.1158599853515625, 1.1484375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 8.0, 2.0, 18.0, 19.0, 21.0, 46.0, 88.0, 152.0, 382.0, 1122.0, 1303.0, 464.0, 169.0, 108.0, 50.0, 42.0, 22.0, 15.0, 13.0, 11.0, 11.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.12890625, -1.0976409912109375, -1.066375732421875, -1.0351104736328125, -1.00384521484375, -0.9725799560546875, -0.941314697265625, -0.9100494384765625, -0.8787841796875, -0.8475189208984375, -0.816253662109375, -0.7849884033203125, -0.75372314453125, -0.7224578857421875, -0.691192626953125, -0.6599273681640625, -0.628662109375, -0.5973968505859375, -0.566131591796875, -0.5348663330078125, -0.50360107421875, -0.4723358154296875, -0.441070556640625, -0.4098052978515625, -0.3785400390625, -0.3472747802734375, -0.316009521484375, -0.2847442626953125, -0.25347900390625, -0.2222137451171875, -0.190948486328125, -0.1596832275390625, -0.12841796875, -0.0971527099609375, -0.065887451171875, -0.0346221923828125, -0.00335693359375, 0.0279083251953125, 0.059173583984375, 0.0904388427734375, 0.1217041015625, 0.1529693603515625, 0.184234619140625, 0.2154998779296875, 0.24676513671875, 0.2780303955078125, 0.309295654296875, 0.3405609130859375, 0.371826171875, 0.4030914306640625, 0.434356689453125, 0.4656219482421875, 0.49688720703125, 0.5281524658203125, 0.559417724609375, 0.5906829833984375, 0.6219482421875, 0.6532135009765625, 0.684478759765625, 0.7157440185546875, 0.74700927734375, 0.7782745361328125, 0.809539794921875, 0.8408050537109375, 0.8720703125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 0.0, 4.0, 7.0, 13.0, 20.0, 55.0, 125.0, 232.0, 275.0, 137.0, 68.0, 24.0, 13.0, 11.0, 6.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.797265529632568, -7.581241607666016, -7.365218162536621, -7.149194240570068, -6.933170795440674, -6.717146873474121, -6.501123428344727, -6.285099506378174, -6.069075584411621, -5.853051662445068, -5.637028217315674, -5.421004295349121, -5.204980850219727, -4.988956928253174, -4.772933006286621, -4.556909561157227, -4.340886116027832, -4.124862194061279, -3.9088387489318848, -3.692814826965332, -3.4767911434173584, -3.2607674598693848, -3.044743776321411, -2.8287200927734375, -2.6126961708068848, -2.396672487258911, -2.1806488037109375, -1.9646250009536743, -1.7486011981964111, -1.5325775146484375, -1.3165538311004639, -1.1005300283432007, -0.8845062255859375, -0.6684824824333191, -0.45245876908302307, -0.23643505573272705, -0.020411312580108643, 0.19561243057250977, 0.4116361141204834, 0.6276599168777466, 0.8436836004257202, 1.0597072839736938, 1.275731086730957, 1.4917547702789307, 1.7077784538269043, 1.9238022565841675, 2.1398258209228516, 2.3558497428894043, 2.571873426437378, 2.7878971099853516, 3.003920793533325, 3.219944477081299, 3.4359683990478516, 3.651992082595825, 3.868015766143799, 4.084039688110352, 4.300063133239746, 4.516087055206299, 4.732110500335693, 4.948134422302246, 5.164157867431641, 5.380181789398193, 5.596205711364746, 5.812229156494141, 6.028253078460693]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 12.0, 8.0, 10.0, 24.0, 26.0, 37.0, 44.0, 36.0, 47.0, 57.0, 61.0, 69.0, 57.0, 63.0, 61.0, 61.0, 53.0, 47.0, 45.0, 28.0, 30.0, 28.0, 26.0, 21.0, 11.0, 6.0, 7.0, 6.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.7288873195648193, -2.6537890434265137, -2.578690767288208, -2.5035927295684814, -2.428494453430176, -2.35339617729187, -2.2782979011535645, -2.203199625015259, -2.128101348876953, -2.0530030727386475, -1.9779049158096313, -1.9028066396713257, -1.8277084827423096, -1.752610206604004, -1.6775119304656982, -1.6024136543273926, -1.527315616607666, -1.4522173404693604, -1.3771191835403442, -1.3020209074020386, -1.2269227504730225, -1.1518244743347168, -1.0767261981964111, -1.0016279220581055, -0.9265297651290894, -0.8514315485954285, -0.7763333320617676, -0.7012350559234619, -0.626136839389801, -0.5510386228561401, -0.47594037652015686, -0.4008421301841736, -0.3257436752319336, -0.2506454586982727, -0.17554721236228943, -0.10044898092746735, -0.025350749492645264, 0.049747467041015625, 0.1248457133769989, 0.19994395971298218, 0.27504217624664307, 0.35014039278030396, 0.42523863911628723, 0.5003368854522705, 0.5754351019859314, 0.6505333185195923, 0.725631594657898, 0.8007298111915588, 0.8758280277252197, 0.9509262442588806, 1.0260244607925415, 1.1011227369308472, 1.1762208938598633, 1.251319169998169, 1.3264174461364746, 1.4015157222747803, 1.4766138792037964, 1.551712155342102, 1.6268103122711182, 1.7019085884094238, 1.7770068645477295, 1.8521050214767456, 1.9272032976150513, 2.0023014545440674, 2.077399730682373]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 9.0, 3.0, 6.0, 5.0, 12.0, 15.0, 23.0, 15.0, 37.0, 52.0, 71.0, 127.0, 220.0, 435.0, 987.0, 2172.0, 5498.0, 13835.0, 38853.0, 131461.0, 453994.0, 286014.0, 74897.0, 24231.0, 8951.0, 3555.0, 1566.0, 667.0, 315.0, 157.0, 112.0, 74.0, 56.0, 25.0, 28.0, 18.0, 15.0, 9.0, 9.0, 5.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 4.0, 0.0, 2.0], "bins": [-1.2412109375, -1.2065200805664062, -1.1718292236328125, -1.1371383666992188, -1.102447509765625, -1.0677566528320312, -1.0330657958984375, -0.9983749389648438, -0.96368408203125, -0.9289932250976562, -0.8943023681640625, -0.8596115112304688, -0.824920654296875, -0.7902297973632812, -0.7555389404296875, -0.7208480834960938, -0.6861572265625, -0.6514663696289062, -0.6167755126953125, -0.5820846557617188, -0.547393798828125, -0.5127029418945312, -0.4780120849609375, -0.44332122802734375, -0.40863037109375, -0.37393951416015625, -0.3392486572265625, -0.30455780029296875, -0.269866943359375, -0.23517608642578125, -0.2004852294921875, -0.16579437255859375, -0.131103515625, -0.09641265869140625, -0.0617218017578125, -0.02703094482421875, 0.007659912109375, 0.04235076904296875, 0.0770416259765625, 0.11173248291015625, 0.14642333984375, 0.18111419677734375, 0.2158050537109375, 0.25049591064453125, 0.285186767578125, 0.31987762451171875, 0.3545684814453125, 0.38925933837890625, 0.4239501953125, 0.45864105224609375, 0.4933319091796875, 0.5280227661132812, 0.562713623046875, 0.5974044799804688, 0.6320953369140625, 0.6667861938476562, 0.70147705078125, 0.7361679077148438, 0.7708587646484375, 0.8055496215820312, 0.840240478515625, 0.8749313354492188, 0.9096221923828125, 0.9443130493164062, 0.97900390625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 4.0, 7.0, 13.0, 18.0, 16.0, 25.0, 25.0, 43.0, 38.0, 36.0, 58.0, 54.0, 63.0, 63.0, 79.0, 59.0, 73.0, 72.0, 61.0, 40.0, 32.0, 30.0, 29.0, 19.0, 8.0, 10.0, 8.0, 8.0, 4.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.233642578125, -0.22358322143554688, -0.21352386474609375, -0.20346450805664062, -0.1934051513671875, -0.18334579467773438, -0.17328643798828125, -0.16322708129882812, -0.153167724609375, -0.14310836791992188, -0.13304901123046875, -0.12298965454101562, -0.1129302978515625, -0.10287094116210938, -0.09281158447265625, -0.08275222778320312, -0.07269287109375, -0.06263351440429688, -0.05257415771484375, -0.042514801025390625, -0.0324554443359375, -0.022396087646484375, -0.01233673095703125, -0.002277374267578125, 0.007781982421875, 0.017841339111328125, 0.02790069580078125, 0.037960052490234375, 0.0480194091796875, 0.058078765869140625, 0.06813812255859375, 0.07819747924804688, 0.0882568359375, 0.09831619262695312, 0.10837554931640625, 0.11843490600585938, 0.1284942626953125, 0.13855361938476562, 0.14861297607421875, 0.15867233276367188, 0.168731689453125, 0.17879104614257812, 0.18885040283203125, 0.19890975952148438, 0.2089691162109375, 0.21902847290039062, 0.22908782958984375, 0.23914718627929688, 0.24920654296875, 0.2592658996582031, 0.26932525634765625, 0.2793846130371094, 0.2894439697265625, 0.2995033264160156, 0.30956268310546875, 0.3196220397949219, 0.329681396484375, 0.3397407531738281, 0.34980010986328125, 0.3598594665527344, 0.3699188232421875, 0.3799781799316406, 0.39003753662109375, 0.4000968933105469, 0.41015625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 8.0, 5.0, 14.0, 35.0, 34.0, 63.0, 98.0, 187.0, 366.0, 676.0, 1466.0, 3392.0, 9236.0, 28074.0, 100728.0, 439525.0, 350020.0, 78989.0, 22492.0, 7691.0, 2879.0, 1227.0, 613.0, 315.0, 170.0, 102.0, 56.0, 32.0, 26.0, 16.0, 5.0, 8.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.177734375, -1.1396331787109375, -1.101531982421875, -1.0634307861328125, -1.02532958984375, -0.9872283935546875, -0.949127197265625, -0.9110260009765625, -0.8729248046875, -0.8348236083984375, -0.796722412109375, -0.7586212158203125, -0.72052001953125, -0.6824188232421875, -0.644317626953125, -0.6062164306640625, -0.568115234375, -0.5300140380859375, -0.491912841796875, -0.4538116455078125, -0.41571044921875, -0.3776092529296875, -0.339508056640625, -0.3014068603515625, -0.2633056640625, -0.2252044677734375, -0.187103271484375, -0.1490020751953125, -0.11090087890625, -0.0727996826171875, -0.034698486328125, 0.0034027099609375, 0.04150390625, 0.0796051025390625, 0.117706298828125, 0.1558074951171875, 0.19390869140625, 0.2320098876953125, 0.270111083984375, 0.3082122802734375, 0.3463134765625, 0.3844146728515625, 0.422515869140625, 0.4606170654296875, 0.49871826171875, 0.5368194580078125, 0.574920654296875, 0.6130218505859375, 0.651123046875, 0.6892242431640625, 0.727325439453125, 0.7654266357421875, 0.80352783203125, 0.8416290283203125, 0.879730224609375, 0.9178314208984375, 0.9559326171875, 0.9940338134765625, 1.032135009765625, 1.0702362060546875, 1.10833740234375, 1.1464385986328125, 1.184539794921875, 1.2226409912109375, 1.2607421875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 8.0, 10.0, 12.0, 19.0, 13.0, 26.0, 29.0, 33.0, 24.0, 28.0, 56.0, 49.0, 60.0, 63.0, 45.0, 64.0, 49.0, 45.0, 56.0, 41.0, 48.0, 35.0, 34.0, 27.0, 26.0, 25.0, 18.0, 13.0, 8.0, 9.0, 4.0, 7.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.86474609375, -0.8402099609375, -0.815673828125, -0.7911376953125, -0.7666015625, -0.7420654296875, -0.717529296875, -0.6929931640625, -0.66845703125, -0.6439208984375, -0.619384765625, -0.5948486328125, -0.5703125, -0.5457763671875, -0.521240234375, -0.4967041015625, -0.47216796875, -0.4476318359375, -0.423095703125, -0.3985595703125, -0.3740234375, -0.3494873046875, -0.324951171875, -0.3004150390625, -0.27587890625, -0.2513427734375, -0.226806640625, -0.2022705078125, -0.177734375, -0.1531982421875, -0.128662109375, -0.1041259765625, -0.07958984375, -0.0550537109375, -0.030517578125, -0.0059814453125, 0.0185546875, 0.0430908203125, 0.067626953125, 0.0921630859375, 0.11669921875, 0.1412353515625, 0.165771484375, 0.1903076171875, 0.21484375, 0.2393798828125, 0.263916015625, 0.2884521484375, 0.31298828125, 0.3375244140625, 0.362060546875, 0.3865966796875, 0.4111328125, 0.4356689453125, 0.460205078125, 0.4847412109375, 0.50927734375, 0.5338134765625, 0.558349609375, 0.5828857421875, 0.607421875, 0.6319580078125, 0.656494140625, 0.6810302734375, 0.70556640625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 8.0, 10.0, 12.0, 17.0, 30.0, 48.0, 54.0, 80.0, 122.0, 222.0, 297.0, 550.0, 920.0, 1714.0, 3075.0, 5845.0, 12512.0, 30430.0, 100029.0, 612173.0, 200546.0, 45631.0, 17325.0, 7936.0, 3926.0, 2111.0, 1153.0, 647.0, 420.0, 264.0, 170.0, 107.0, 49.0, 36.0, 30.0, 17.0, 12.0, 11.0, 5.0, 6.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62109375, -0.5994491577148438, -0.5778045654296875, -0.5561599731445312, -0.534515380859375, -0.5128707885742188, -0.4912261962890625, -0.46958160400390625, -0.44793701171875, -0.42629241943359375, -0.4046478271484375, -0.38300323486328125, -0.361358642578125, -0.33971405029296875, -0.3180694580078125, -0.29642486572265625, -0.2747802734375, -0.25313568115234375, -0.2314910888671875, -0.20984649658203125, -0.188201904296875, -0.16655731201171875, -0.1449127197265625, -0.12326812744140625, -0.10162353515625, -0.07997894287109375, -0.0583343505859375, -0.03668975830078125, -0.015045166015625, 0.00659942626953125, 0.0282440185546875, 0.04988861083984375, 0.071533203125, 0.09317779541015625, 0.1148223876953125, 0.13646697998046875, 0.158111572265625, 0.17975616455078125, 0.2014007568359375, 0.22304534912109375, 0.24468994140625, 0.26633453369140625, 0.2879791259765625, 0.30962371826171875, 0.331268310546875, 0.35291290283203125, 0.3745574951171875, 0.39620208740234375, 0.4178466796875, 0.43949127197265625, 0.4611358642578125, 0.48278045654296875, 0.504425048828125, 0.5260696411132812, 0.5477142333984375, 0.5693588256835938, 0.59100341796875, 0.6126480102539062, 0.6342926025390625, 0.6559371948242188, 0.677581787109375, 0.6992263793945312, 0.7208709716796875, 0.7425155639648438, 0.76416015625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 4.0, 8.0, 15.0, 13.0, 18.0, 31.0, 28.0, 50.0, 114.0, 196.0, 205.0, 115.0, 73.0, 33.0, 21.0, 23.0, 9.0, 8.0, 4.0, 2.0, 1.0, 3.0, 4.0, 3.0, 2.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0002181529998779297, -0.00021308381110429764, -0.0002080146223306656, -0.00020294543355703354, -0.0001978762447834015, -0.00019280705600976944, -0.0001877378672361374, -0.00018266867846250534, -0.0001775994896888733, -0.00017253030091524124, -0.0001674611121416092, -0.00016239192336797714, -0.0001573227345943451, -0.00015225354582071304, -0.000147184357047081, -0.00014211516827344894, -0.0001370459794998169, -0.00013197679072618484, -0.0001269076019525528, -0.00012183841317892075, -0.0001167692244052887, -0.00011170003563165665, -0.0001066308468580246, -0.00010156165808439255, -9.64924693107605e-05, -9.142328053712845e-05, -8.63540917634964e-05, -8.128490298986435e-05, -7.62157142162323e-05, -7.114652544260025e-05, -6.60773366689682e-05, -6.100814789533615e-05, -5.59389591217041e-05, -5.086977034807205e-05, -4.580058157444e-05, -4.073139280080795e-05, -3.56622040271759e-05, -3.0593015253543854e-05, -2.5523826479911804e-05, -2.0454637706279755e-05, -1.5385448932647705e-05, -1.0316260159015656e-05, -5.247071385383606e-06, -1.778826117515564e-07, 4.891306161880493e-06, 9.960494935512543e-06, 1.5029683709144592e-05, 2.0098872482776642e-05, 2.516806125640869e-05, 3.023725003004074e-05, 3.530643880367279e-05, 4.037562757730484e-05, 4.544481635093689e-05, 5.051400512456894e-05, 5.558319389820099e-05, 6.065238267183304e-05, 6.572157144546509e-05, 7.079076021909714e-05, 7.585994899272919e-05, 8.092913776636124e-05, 8.599832653999329e-05, 9.106751531362534e-05, 9.613670408725739e-05, 0.00010120589286088943, 0.00010627508163452148]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 4.0, 3.0, 9.0, 9.0, 6.0, 14.0, 13.0, 23.0, 43.0, 61.0, 99.0, 162.0, 291.0, 549.0, 1146.0, 2178.0, 4400.0, 9810.0, 27230.0, 131531.0, 746587.0, 86604.0, 21730.0, 8214.0, 3811.0, 1927.0, 930.0, 487.0, 289.0, 142.0, 96.0, 50.0, 23.0, 27.0, 15.0, 17.0, 5.0, 3.0, 10.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.076171875, -1.0395660400390625, -1.002960205078125, -0.9663543701171875, -0.92974853515625, -0.8931427001953125, -0.856536865234375, -0.8199310302734375, -0.7833251953125, -0.7467193603515625, -0.710113525390625, -0.6735076904296875, -0.63690185546875, -0.6002960205078125, -0.563690185546875, -0.5270843505859375, -0.490478515625, -0.4538726806640625, -0.417266845703125, -0.3806610107421875, -0.34405517578125, -0.3074493408203125, -0.270843505859375, -0.2342376708984375, -0.1976318359375, -0.1610260009765625, -0.124420166015625, -0.0878143310546875, -0.05120849609375, -0.0146026611328125, 0.022003173828125, 0.0586090087890625, 0.09521484375, 0.1318206787109375, 0.168426513671875, 0.2050323486328125, 0.24163818359375, 0.2782440185546875, 0.314849853515625, 0.3514556884765625, 0.3880615234375, 0.4246673583984375, 0.461273193359375, 0.4978790283203125, 0.53448486328125, 0.5710906982421875, 0.607696533203125, 0.6443023681640625, 0.680908203125, 0.7175140380859375, 0.754119873046875, 0.7907257080078125, 0.82733154296875, 0.8639373779296875, 0.900543212890625, 0.9371490478515625, 0.9737548828125, 1.0103607177734375, 1.046966552734375, 1.0835723876953125, 1.12017822265625, 1.1567840576171875, 1.193389892578125, 1.2299957275390625, 1.2666015625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 4.0, 3.0, 4.0, 6.0, 8.0, 8.0, 8.0, 8.0, 8.0, 13.0, 10.0, 24.0, 27.0, 40.0, 35.0, 91.0, 106.0, 129.0, 112.0, 84.0, 51.0, 46.0, 37.0, 22.0, 23.0, 12.0, 12.0, 14.0, 9.0, 7.0, 5.0, 8.0, 5.0, 5.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.59326171875, -0.5746078491210938, -0.5559539794921875, -0.5373001098632812, -0.518646240234375, -0.49999237060546875, -0.4813385009765625, -0.46268463134765625, -0.44403076171875, -0.42537689208984375, -0.4067230224609375, -0.38806915283203125, -0.369415283203125, -0.35076141357421875, -0.3321075439453125, -0.31345367431640625, -0.2947998046875, -0.27614593505859375, -0.2574920654296875, -0.23883819580078125, -0.220184326171875, -0.20153045654296875, -0.1828765869140625, -0.16422271728515625, -0.14556884765625, -0.12691497802734375, -0.1082611083984375, -0.08960723876953125, -0.070953369140625, -0.05229949951171875, -0.0336456298828125, -0.01499176025390625, 0.003662109375, 0.02231597900390625, 0.0409698486328125, 0.05962371826171875, 0.078277587890625, 0.09693145751953125, 0.1155853271484375, 0.13423919677734375, 0.15289306640625, 0.17154693603515625, 0.1902008056640625, 0.20885467529296875, 0.227508544921875, 0.24616241455078125, 0.2648162841796875, 0.28347015380859375, 0.3021240234375, 0.32077789306640625, 0.3394317626953125, 0.35808563232421875, 0.376739501953125, 0.39539337158203125, 0.4140472412109375, 0.43270111083984375, 0.45135498046875, 0.47000885009765625, 0.4886627197265625, 0.5073165893554688, 0.525970458984375, 0.5446243286132812, 0.5632781982421875, 0.5819320678710938, 0.6005859375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 8.0, 21.0, 46.0, 122.0, 264.0, 269.0, 143.0, 75.0, 27.0, 13.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.469182014465332, -13.116656303405762, -12.764130592346191, -12.411604881286621, -12.05907917022705, -11.70655345916748, -11.35402774810791, -11.00150203704834, -10.64897632598877, -10.2964506149292, -9.943924903869629, -9.591399192810059, -9.238873481750488, -8.886347770690918, -8.533822059631348, -8.181296348571777, -7.828771114349365, -7.476245403289795, -7.123719692230225, -6.771193981170654, -6.418668270111084, -6.066142559051514, -5.713617324829102, -5.361091613769531, -5.008565902709961, -4.656040191650391, -4.30351448059082, -3.95098876953125, -3.5984630584716797, -3.2459373474121094, -2.893411874771118, -2.540886163711548, -2.1883602142333984, -1.8358345031738281, -1.4833087921142578, -1.130783200263977, -0.7782574892044067, -0.4257317781448364, -0.07320618629455566, 0.27931952476501465, 0.631845235824585, 0.9843709468841553, 1.3368966579437256, 1.6894222497940063, 2.041947841644287, 2.3944735527038574, 2.7469992637634277, 3.099524974822998, 3.4520506858825684, 3.8045763969421387, 4.157102108001709, 4.509627819061279, 4.86215353012085, 5.21467924118042, 5.567204475402832, 5.919730186462402, 6.272255897521973, 6.624781608581543, 6.977307319641113, 7.329833030700684, 7.682358741760254, 8.034884452819824, 8.387410163879395, 8.739935874938965, 9.092461585998535]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 9.0, 12.0, 12.0, 15.0, 11.0, 14.0, 13.0, 18.0, 20.0, 32.0, 27.0, 37.0, 30.0, 46.0, 50.0, 42.0, 40.0, 36.0, 50.0, 46.0, 50.0, 46.0, 37.0, 28.0, 37.0, 30.0, 28.0, 31.0, 27.0, 18.0, 24.0, 13.0, 10.0, 17.0, 14.0, 4.0, 4.0, 5.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2.562933921813965, -2.492095947265625, -2.4212582111358643, -2.3504202365875244, -2.2795822620391846, -2.208744525909424, -2.137906551361084, -2.067068576812744, -1.9962307214736938, -1.9253928661346436, -1.8545548915863037, -1.7837170362472534, -1.7128791809082031, -1.6420412063598633, -1.571203351020813, -1.5003654956817627, -1.4295275211334229, -1.3586896657943726, -1.2878516912460327, -1.2170138359069824, -1.1461758613586426, -1.0753380060195923, -1.004500150680542, -0.9336622357368469, -0.8628243207931519, -0.7919864058494568, -0.7211484909057617, -0.6503106355667114, -0.5794727206230164, -0.5086348056793213, -0.4377969205379486, -0.3669590353965759, -0.2961210012435913, -0.22528310120105743, -0.15444520115852356, -0.08360730111598969, -0.01276940107345581, 0.05806851387023926, 0.12890639901161194, 0.19974428415298462, 0.2705821990966797, 0.34142011404037476, 0.41225799918174744, 0.4830958843231201, 0.5539337992668152, 0.6247717142105103, 0.6956095695495605, 0.7664474844932556, 0.8372853994369507, 0.9081233143806458, 0.9789612293243408, 1.0497990846633911, 1.1206369400024414, 1.1914749145507812, 1.2623127698898315, 1.3331506252288818, 1.4039885997772217, 1.474826455116272, 1.5456644296646118, 1.616502285003662, 1.687340259552002, 1.7581781148910522, 1.8290159702301025, 1.8998539447784424, 1.9706918001174927]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 4.0, 11.0, 8.0, 17.0, 27.0, 30.0, 61.0, 69.0, 121.0, 161.0, 260.0, 446.0, 826.0, 1469.0, 2879.0, 5946.0, 15972.0, 58107.0, 938644.0, 2984359.0, 143703.0, 24647.0, 8595.0, 3729.0, 1827.0, 899.0, 568.0, 336.0, 203.0, 116.0, 71.0, 49.0, 34.0, 17.0, 16.0, 15.0, 15.0, 6.0, 3.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.763671875, -0.733367919921875, -0.70306396484375, -0.672760009765625, -0.6424560546875, -0.612152099609375, -0.58184814453125, -0.551544189453125, -0.521240234375, -0.490936279296875, -0.46063232421875, -0.430328369140625, -0.4000244140625, -0.369720458984375, -0.33941650390625, -0.309112548828125, -0.27880859375, -0.248504638671875, -0.21820068359375, -0.187896728515625, -0.1575927734375, -0.127288818359375, -0.09698486328125, -0.066680908203125, -0.036376953125, -0.006072998046875, 0.02423095703125, 0.054534912109375, 0.0848388671875, 0.115142822265625, 0.14544677734375, 0.175750732421875, 0.2060546875, 0.236358642578125, 0.26666259765625, 0.296966552734375, 0.3272705078125, 0.357574462890625, 0.38787841796875, 0.418182373046875, 0.448486328125, 0.478790283203125, 0.50909423828125, 0.539398193359375, 0.5697021484375, 0.600006103515625, 0.63031005859375, 0.660614013671875, 0.69091796875, 0.721221923828125, 0.75152587890625, 0.781829833984375, 0.8121337890625, 0.842437744140625, 0.87274169921875, 0.903045654296875, 0.933349609375, 0.963653564453125, 0.99395751953125, 1.024261474609375, 1.0545654296875, 1.084869384765625, 1.11517333984375, 1.145477294921875, 1.17578125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 9.0, 9.0, 8.0, 7.0, 9.0, 11.0, 20.0, 15.0, 30.0, 32.0, 39.0, 34.0, 38.0, 65.0, 48.0, 48.0, 57.0, 52.0, 52.0, 65.0, 54.0, 42.0, 41.0, 50.0, 29.0, 27.0, 20.0, 22.0, 18.0, 14.0, 10.0, 8.0, 2.0, 5.0, 6.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2890625, -0.2791595458984375, -0.269256591796875, -0.2593536376953125, -0.24945068359375, -0.2395477294921875, -0.229644775390625, -0.2197418212890625, -0.2098388671875, -0.1999359130859375, -0.190032958984375, -0.1801300048828125, -0.17022705078125, -0.1603240966796875, -0.150421142578125, -0.1405181884765625, -0.130615234375, -0.1207122802734375, -0.110809326171875, -0.1009063720703125, -0.09100341796875, -0.0811004638671875, -0.071197509765625, -0.0612945556640625, -0.0513916015625, -0.0414886474609375, -0.031585693359375, -0.0216827392578125, -0.01177978515625, -0.0018768310546875, 0.008026123046875, 0.0179290771484375, 0.02783203125, 0.0377349853515625, 0.047637939453125, 0.0575408935546875, 0.06744384765625, 0.0773468017578125, 0.087249755859375, 0.0971527099609375, 0.1070556640625, 0.1169586181640625, 0.126861572265625, 0.1367645263671875, 0.14666748046875, 0.1565704345703125, 0.166473388671875, 0.1763763427734375, 0.186279296875, 0.1961822509765625, 0.206085205078125, 0.2159881591796875, 0.22589111328125, 0.2357940673828125, 0.245697021484375, 0.2555999755859375, 0.2655029296875, 0.2754058837890625, 0.285308837890625, 0.2952117919921875, 0.30511474609375, 0.3150177001953125, 0.324920654296875, 0.3348236083984375, 0.3447265625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 5.0, 11.0, 10.0, 19.0, 13.0, 32.0, 41.0, 55.0, 73.0, 113.0, 157.0, 261.0, 408.0, 678.0, 1081.0, 2004.0, 3613.0, 6657.0, 14606.0, 38029.0, 151257.0, 2797649.0, 1025975.0, 97626.0, 29003.0, 11859.0, 5653.0, 3088.0, 1694.0, 1002.0, 564.0, 353.0, 199.0, 151.0, 96.0, 66.0, 57.0, 39.0, 32.0, 11.0, 14.0, 11.0, 9.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.92236328125, -0.8951263427734375, -0.867889404296875, -0.8406524658203125, -0.81341552734375, -0.7861785888671875, -0.758941650390625, -0.7317047119140625, -0.7044677734375, -0.6772308349609375, -0.649993896484375, -0.6227569580078125, -0.59552001953125, -0.5682830810546875, -0.541046142578125, -0.5138092041015625, -0.486572265625, -0.4593353271484375, -0.432098388671875, -0.4048614501953125, -0.37762451171875, -0.3503875732421875, -0.323150634765625, -0.2959136962890625, -0.2686767578125, -0.2414398193359375, -0.214202880859375, -0.1869659423828125, -0.15972900390625, -0.1324920654296875, -0.105255126953125, -0.0780181884765625, -0.05078125, -0.0235443115234375, 0.003692626953125, 0.0309295654296875, 0.05816650390625, 0.0854034423828125, 0.112640380859375, 0.1398773193359375, 0.1671142578125, 0.1943511962890625, 0.221588134765625, 0.2488250732421875, 0.27606201171875, 0.3032989501953125, 0.330535888671875, 0.3577728271484375, 0.385009765625, 0.4122467041015625, 0.439483642578125, 0.4667205810546875, 0.49395751953125, 0.5211944580078125, 0.548431396484375, 0.5756683349609375, 0.6029052734375, 0.6301422119140625, 0.657379150390625, 0.6846160888671875, 0.71185302734375, 0.7390899658203125, 0.766326904296875, 0.7935638427734375, 0.82080078125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 3.0, 2.0, 7.0, 8.0, 10.0, 14.0, 19.0, 30.0, 51.0, 85.0, 136.0, 335.0, 867.0, 1365.0, 587.0, 201.0, 125.0, 68.0, 44.0, 33.0, 14.0, 18.0, 10.0, 15.0, 5.0, 6.0, 3.0, 6.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.126953125, -1.0958633422851562, -1.0647735595703125, -1.0336837768554688, -1.002593994140625, -0.9715042114257812, -0.9404144287109375, -0.9093246459960938, -0.87823486328125, -0.8471450805664062, -0.8160552978515625, -0.7849655151367188, -0.753875732421875, -0.7227859497070312, -0.6916961669921875, -0.6606063842773438, -0.6295166015625, -0.5984268188476562, -0.5673370361328125, -0.5362472534179688, -0.505157470703125, -0.47406768798828125, -0.4429779052734375, -0.41188812255859375, -0.38079833984375, -0.34970855712890625, -0.3186187744140625, -0.28752899169921875, -0.256439208984375, -0.22534942626953125, -0.1942596435546875, -0.16316986083984375, -0.132080078125, -0.10099029541015625, -0.0699005126953125, -0.03881072998046875, -0.007720947265625, 0.02336883544921875, 0.0544586181640625, 0.08554840087890625, 0.11663818359375, 0.14772796630859375, 0.1788177490234375, 0.20990753173828125, 0.240997314453125, 0.27208709716796875, 0.3031768798828125, 0.33426666259765625, 0.3653564453125, 0.39644622802734375, 0.4275360107421875, 0.45862579345703125, 0.489715576171875, 0.5208053588867188, 0.5518951416015625, 0.5829849243164062, 0.61407470703125, 0.6451644897460938, 0.6762542724609375, 0.7073440551757812, 0.738433837890625, 0.7695236206054688, 0.8006134033203125, 0.8317031860351562, 0.86279296875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 12.0, 17.0, 40.0, 63.0, 134.0, 196.0, 205.0, 138.0, 83.0, 42.0, 21.0, 18.0, 8.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.343784332275391, -4.162109851837158, -3.980435371398926, -3.7987606525421143, -3.617086172103882, -3.4354116916656494, -3.253736972808838, -3.0720624923706055, -2.890388011932373, -2.7087135314941406, -2.527039051055908, -2.3453643321990967, -2.1636898517608643, -1.9820153713226318, -1.8003407716751099, -1.618666172027588, -1.4369916915893555, -1.255317211151123, -1.073642611503601, -0.8919680714607239, -0.7102935314178467, -0.5286189913749695, -0.3469444513320923, -0.1652698516845703, 0.01640462875366211, 0.1980791687965393, 0.3797537088394165, 0.5614282488822937, 0.7431027889251709, 0.9247773289680481, 1.1064518690109253, 1.2881264686584473, 1.4698009490966797, 1.651475429534912, 1.833150029182434, 2.014824628829956, 2.1964991092681885, 2.378173589706421, 2.5598483085632324, 2.741522789001465, 2.9231972694396973, 3.1048717498779297, 3.286546230316162, 3.4682209491729736, 3.649895429611206, 3.8315699100494385, 4.01324462890625, 4.194919109344482, 4.376593589782715, 4.558268070220947, 4.73994255065918, 4.921617031097412, 5.1032915115356445, 5.284966468811035, 5.466640949249268, 5.6483154296875, 5.829989910125732, 6.011664390563965, 6.193338871002197, 6.37501335144043, 6.55668830871582, 6.738362789154053, 6.920037269592285, 7.101711750030518, 7.28338623046875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 1.0, 10.0, 6.0, 14.0, 11.0, 12.0, 17.0, 11.0, 13.0, 10.0, 33.0, 36.0, 31.0, 24.0, 43.0, 43.0, 49.0, 34.0, 53.0, 47.0, 46.0, 40.0, 43.0, 33.0, 46.0, 40.0, 31.0, 35.0, 24.0, 25.0, 30.0, 14.0, 25.0, 19.0, 13.0, 6.0, 9.0, 11.0, 5.0, 8.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-2.435999870300293, -2.3716447353363037, -2.3072896003723145, -2.242934465408325, -2.178579330444336, -2.114224433898926, -2.0498690605163574, -1.9855140447616577, -1.921159029006958, -1.8568038940429688, -1.7924487590789795, -1.7280936241149902, -1.6637386083602905, -1.5993834733963013, -1.535028338432312, -1.4706732034683228, -1.4063180685043335, -1.3419629335403442, -1.277607798576355, -1.2132527828216553, -1.148897647857666, -1.0845425128936768, -1.0201873779296875, -0.9558322429656982, -0.8914771676063538, -0.8271220326423645, -0.76276695728302, -0.6984118223190308, -0.6340566873550415, -0.569701611995697, -0.5053464770317078, -0.4409913718700409, -0.376636266708374, -0.31228116154670715, -0.2479260414838791, -0.18357092142105103, -0.11921581625938416, -0.054860711097717285, 0.009494423866271973, 0.07384952902793884, 0.1382046341896057, 0.20255973935127258, 0.26691484451293945, 0.3312699794769287, 0.3956250846385956, 0.45998018980026245, 0.5243353247642517, 0.5886904001235962, 0.6530455350875854, 0.7174006700515747, 0.7817557454109192, 0.8461108803749084, 0.9104659557342529, 0.9748210906982422, 1.0391762256622314, 1.1035313606262207, 1.16788649559021, 1.2322416305541992, 1.2965967655181885, 1.3609519004821777, 1.4253069162368774, 1.4896620512008667, 1.554017186164856, 1.6183723211288452, 1.682727336883545]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 8.0, 10.0, 7.0, 17.0, 23.0, 37.0, 40.0, 63.0, 87.0, 164.0, 264.0, 470.0, 821.0, 1615.0, 3315.0, 7247.0, 16636.0, 41849.0, 111671.0, 296436.0, 343697.0, 136857.0, 50890.0, 19823.0, 8536.0, 3848.0, 1832.0, 964.0, 530.0, 277.0, 175.0, 113.0, 65.0, 45.0, 25.0, 19.0, 18.0, 15.0, 11.0, 13.0, 6.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.171875, -1.13848876953125, -1.1051025390625, -1.07171630859375, -1.038330078125, -1.00494384765625, -0.9715576171875, -0.93817138671875, -0.90478515625, -0.87139892578125, -0.8380126953125, -0.80462646484375, -0.771240234375, -0.73785400390625, -0.7044677734375, -0.67108154296875, -0.6376953125, -0.60430908203125, -0.5709228515625, -0.53753662109375, -0.504150390625, -0.47076416015625, -0.4373779296875, -0.40399169921875, -0.37060546875, -0.33721923828125, -0.3038330078125, -0.27044677734375, -0.237060546875, -0.20367431640625, -0.1702880859375, -0.13690185546875, -0.103515625, -0.07012939453125, -0.0367431640625, -0.00335693359375, 0.030029296875, 0.06341552734375, 0.0968017578125, 0.13018798828125, 0.16357421875, 0.19696044921875, 0.2303466796875, 0.26373291015625, 0.297119140625, 0.33050537109375, 0.3638916015625, 0.39727783203125, 0.4306640625, 0.46405029296875, 0.4974365234375, 0.53082275390625, 0.564208984375, 0.59759521484375, 0.6309814453125, 0.66436767578125, 0.69775390625, 0.73114013671875, 0.7645263671875, 0.79791259765625, 0.831298828125, 0.86468505859375, 0.8980712890625, 0.93145751953125, 0.96484375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 3.0, 7.0, 7.0, 9.0, 15.0, 14.0, 10.0, 19.0, 32.0, 31.0, 43.0, 38.0, 46.0, 52.0, 49.0, 50.0, 57.0, 57.0, 56.0, 63.0, 46.0, 45.0, 42.0, 51.0, 42.0, 25.0, 18.0, 19.0, 13.0, 11.0, 9.0, 10.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3134765625, -0.3026771545410156, -0.29187774658203125, -0.2810783386230469, -0.2702789306640625, -0.2594795227050781, -0.24868011474609375, -0.23788070678710938, -0.227081298828125, -0.21628189086914062, -0.20548248291015625, -0.19468307495117188, -0.1838836669921875, -0.17308425903320312, -0.16228485107421875, -0.15148544311523438, -0.14068603515625, -0.12988662719726562, -0.11908721923828125, -0.10828781127929688, -0.0974884033203125, -0.08668899536132812, -0.07588958740234375, -0.06509017944335938, -0.054290771484375, -0.043491363525390625, -0.03269195556640625, -0.021892547607421875, -0.0110931396484375, -0.000293731689453125, 0.01050567626953125, 0.021305084228515625, 0.0321044921875, 0.042903900146484375, 0.05370330810546875, 0.06450271606445312, 0.0753021240234375, 0.08610153198242188, 0.09690093994140625, 0.10770034790039062, 0.118499755859375, 0.12929916381835938, 0.14009857177734375, 0.15089797973632812, 0.1616973876953125, 0.17249679565429688, 0.18329620361328125, 0.19409561157226562, 0.20489501953125, 0.21569442749023438, 0.22649383544921875, 0.23729324340820312, 0.2480926513671875, 0.2588920593261719, 0.26969146728515625, 0.2804908752441406, 0.291290283203125, 0.3020896911621094, 0.31288909912109375, 0.3236885070800781, 0.3344879150390625, 0.3452873229980469, 0.35608673095703125, 0.3668861389160156, 0.377685546875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 8.0, 13.0, 14.0, 7.0, 21.0, 37.0, 39.0, 89.0, 107.0, 157.0, 276.0, 422.0, 730.0, 1228.0, 2202.0, 4199.0, 8603.0, 19307.0, 50311.0, 152510.0, 437414.0, 244325.0, 75338.0, 27453.0, 11593.0, 5498.0, 2802.0, 1515.0, 915.0, 507.0, 348.0, 204.0, 113.0, 66.0, 56.0, 40.0, 29.0, 18.0, 12.0, 9.0, 10.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1123046875, -1.0760650634765625, -1.039825439453125, -1.0035858154296875, -0.96734619140625, -0.9311065673828125, -0.894866943359375, -0.8586273193359375, -0.8223876953125, -0.7861480712890625, -0.749908447265625, -0.7136688232421875, -0.67742919921875, -0.6411895751953125, -0.604949951171875, -0.5687103271484375, -0.532470703125, -0.4962310791015625, -0.459991455078125, -0.4237518310546875, -0.38751220703125, -0.3512725830078125, -0.315032958984375, -0.2787933349609375, -0.2425537109375, -0.2063140869140625, -0.170074462890625, -0.1338348388671875, -0.09759521484375, -0.0613555908203125, -0.025115966796875, 0.0111236572265625, 0.04736328125, 0.0836029052734375, 0.119842529296875, 0.1560821533203125, 0.19232177734375, 0.2285614013671875, 0.264801025390625, 0.3010406494140625, 0.3372802734375, 0.3735198974609375, 0.409759521484375, 0.4459991455078125, 0.48223876953125, 0.5184783935546875, 0.554718017578125, 0.5909576416015625, 0.627197265625, 0.6634368896484375, 0.699676513671875, 0.7359161376953125, 0.77215576171875, 0.8083953857421875, 0.844635009765625, 0.8808746337890625, 0.9171142578125, 0.9533538818359375, 0.989593505859375, 1.0258331298828125, 1.06207275390625, 1.0983123779296875, 1.134552001953125, 1.1707916259765625, 1.20703125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 6.0, 2.0, 9.0, 8.0, 11.0, 18.0, 17.0, 17.0, 19.0, 25.0, 37.0, 45.0, 40.0, 37.0, 50.0, 54.0, 51.0, 58.0, 68.0, 54.0, 52.0, 53.0, 40.0, 49.0, 31.0, 31.0, 29.0, 14.0, 16.0, 11.0, 13.0, 7.0, 9.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.1416015625, -1.1106033325195312, -1.0796051025390625, -1.0486068725585938, -1.017608642578125, -0.9866104125976562, -0.9556121826171875, -0.9246139526367188, -0.89361572265625, -0.8626174926757812, -0.8316192626953125, -0.8006210327148438, -0.769622802734375, -0.7386245727539062, -0.7076263427734375, -0.6766281127929688, -0.6456298828125, -0.6146316528320312, -0.5836334228515625, -0.5526351928710938, -0.521636962890625, -0.49063873291015625, -0.4596405029296875, -0.42864227294921875, -0.39764404296875, -0.36664581298828125, -0.3356475830078125, -0.30464935302734375, -0.273651123046875, -0.24265289306640625, -0.2116546630859375, -0.18065643310546875, -0.149658203125, -0.11865997314453125, -0.0876617431640625, -0.05666351318359375, -0.025665283203125, 0.00533294677734375, 0.0363311767578125, 0.06732940673828125, 0.09832763671875, 0.12932586669921875, 0.1603240966796875, 0.19132232666015625, 0.222320556640625, 0.25331878662109375, 0.2843170166015625, 0.31531524658203125, 0.3463134765625, 0.37731170654296875, 0.4083099365234375, 0.43930816650390625, 0.470306396484375, 0.5013046264648438, 0.5323028564453125, 0.5633010864257812, 0.59429931640625, 0.6252975463867188, 0.6562957763671875, 0.6872940063476562, 0.718292236328125, 0.7492904663085938, 0.7802886962890625, 0.8112869262695312, 0.84228515625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 9.0, 13.0, 13.0, 20.0, 23.0, 29.0, 48.0, 69.0, 95.0, 111.0, 179.0, 301.0, 501.0, 760.0, 1208.0, 2473.0, 5529.0, 15932.0, 78688.0, 709910.0, 190549.0, 26727.0, 8002.0, 3250.0, 1572.0, 873.0, 570.0, 382.0, 201.0, 152.0, 100.0, 66.0, 57.0, 37.0, 28.0, 25.0, 16.0, 12.0, 4.0, 8.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.74755859375, -0.723968505859375, -0.70037841796875, -0.676788330078125, -0.6531982421875, -0.629608154296875, -0.60601806640625, -0.582427978515625, -0.558837890625, -0.535247802734375, -0.51165771484375, -0.488067626953125, -0.4644775390625, -0.440887451171875, -0.41729736328125, -0.393707275390625, -0.3701171875, -0.346527099609375, -0.32293701171875, -0.299346923828125, -0.2757568359375, -0.252166748046875, -0.22857666015625, -0.204986572265625, -0.181396484375, -0.157806396484375, -0.13421630859375, -0.110626220703125, -0.0870361328125, -0.063446044921875, -0.03985595703125, -0.016265869140625, 0.00732421875, 0.030914306640625, 0.05450439453125, 0.078094482421875, 0.1016845703125, 0.125274658203125, 0.14886474609375, 0.172454833984375, 0.196044921875, 0.219635009765625, 0.24322509765625, 0.266815185546875, 0.2904052734375, 0.313995361328125, 0.33758544921875, 0.361175537109375, 0.384765625, 0.408355712890625, 0.43194580078125, 0.455535888671875, 0.4791259765625, 0.502716064453125, 0.52630615234375, 0.549896240234375, 0.573486328125, 0.597076416015625, 0.62066650390625, 0.644256591796875, 0.6678466796875, 0.691436767578125, 0.71502685546875, 0.738616943359375, 0.76220703125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 2.0, 8.0, 6.0, 11.0, 13.0, 23.0, 39.0, 62.0, 96.0, 171.0, 245.0, 134.0, 74.0, 36.0, 17.0, 12.0, 7.0, 8.0, 5.0, 7.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017559528350830078, -0.00017061270773410797, -0.00016563013195991516, -0.00016064755618572235, -0.00015566498041152954, -0.00015068240463733673, -0.00014569982886314392, -0.0001407172530889511, -0.0001357346773147583, -0.0001307521015405655, -0.00012576952576637268, -0.00012078694999217987, -0.00011580437421798706, -0.00011082179844379425, -0.00010583922266960144, -0.00010085664689540863, -9.587407112121582e-05, -9.089149534702301e-05, -8.59089195728302e-05, -8.092634379863739e-05, -7.594376802444458e-05, -7.096119225025177e-05, -6.597861647605896e-05, -6.099604070186615e-05, -5.601346492767334e-05, -5.103088915348053e-05, -4.604831337928772e-05, -4.106573760509491e-05, -3.60831618309021e-05, -3.110058605670929e-05, -2.611801028251648e-05, -2.113543450832367e-05, -1.615285873413086e-05, -1.117028295993805e-05, -6.187707185745239e-06, -1.2051314115524292e-06, 3.777444362640381e-06, 8.760020136833191e-06, 1.3742595911026001e-05, 1.872517168521881e-05, 2.370774745941162e-05, 2.869032323360443e-05, 3.367289900779724e-05, 3.865547478199005e-05, 4.363805055618286e-05, 4.862062633037567e-05, 5.360320210456848e-05, 5.858577787876129e-05, 6.35683536529541e-05, 6.855092942714691e-05, 7.353350520133972e-05, 7.851608097553253e-05, 8.349865674972534e-05, 8.848123252391815e-05, 9.346380829811096e-05, 9.844638407230377e-05, 0.00010342895984649658, 0.00010841153562068939, 0.0001133941113948822, 0.00011837668716907501, 0.00012335926294326782, 0.00012834183871746063, 0.00013332441449165344, 0.00013830699026584625, 0.00014328956604003906]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 6.0, 8.0, 13.0, 16.0, 32.0, 42.0, 61.0, 112.0, 136.0, 270.0, 400.0, 736.0, 1415.0, 2825.0, 7141.0, 26492.0, 327289.0, 628708.0, 37176.0, 8726.0, 3372.0, 1556.0, 810.0, 464.0, 264.0, 171.0, 100.0, 63.0, 50.0, 36.0, 18.0, 17.0, 12.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94189453125, -0.9057998657226562, -0.8697052001953125, -0.8336105346679688, -0.797515869140625, -0.7614212036132812, -0.7253265380859375, -0.6892318725585938, -0.65313720703125, -0.6170425415039062, -0.5809478759765625, -0.5448532104492188, -0.508758544921875, -0.47266387939453125, -0.4365692138671875, -0.40047454833984375, -0.3643798828125, -0.32828521728515625, -0.2921905517578125, -0.25609588623046875, -0.220001220703125, -0.18390655517578125, -0.1478118896484375, -0.11171722412109375, -0.07562255859375, -0.03952789306640625, -0.0034332275390625, 0.03266143798828125, 0.068756103515625, 0.10485076904296875, 0.1409454345703125, 0.17704010009765625, 0.213134765625, 0.24922943115234375, 0.2853240966796875, 0.32141876220703125, 0.357513427734375, 0.39360809326171875, 0.4297027587890625, 0.46579742431640625, 0.50189208984375, 0.5379867553710938, 0.5740814208984375, 0.6101760864257812, 0.646270751953125, 0.6823654174804688, 0.7184600830078125, 0.7545547485351562, 0.7906494140625, 0.8267440795898438, 0.8628387451171875, 0.8989334106445312, 0.935028076171875, 0.9711227416992188, 1.0072174072265625, 1.0433120727539062, 1.07940673828125, 1.1155014038085938, 1.1515960693359375, 1.1876907348632812, 1.223785400390625, 1.2598800659179688, 1.2959747314453125, 1.3320693969726562, 1.3681640625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 3.0, 3.0, 1.0, 2.0, 6.0, 7.0, 11.0, 14.0, 22.0, 22.0, 62.0, 101.0, 188.0, 205.0, 150.0, 79.0, 35.0, 25.0, 20.0, 12.0, 10.0, 7.0, 3.0, 5.0, 5.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9892578125, -0.9626846313476562, -0.9361114501953125, -0.9095382690429688, -0.882965087890625, -0.8563919067382812, -0.8298187255859375, -0.8032455444335938, -0.77667236328125, -0.7500991821289062, -0.7235260009765625, -0.6969528198242188, -0.670379638671875, -0.6438064575195312, -0.6172332763671875, -0.5906600952148438, -0.5640869140625, -0.5375137329101562, -0.5109405517578125, -0.48436737060546875, -0.457794189453125, -0.43122100830078125, -0.4046478271484375, -0.37807464599609375, -0.35150146484375, -0.32492828369140625, -0.2983551025390625, -0.27178192138671875, -0.245208740234375, -0.21863555908203125, -0.1920623779296875, -0.16548919677734375, -0.138916015625, -0.11234283447265625, -0.0857696533203125, -0.05919647216796875, -0.032623291015625, -0.00605010986328125, 0.0205230712890625, 0.04709625244140625, 0.07366943359375, 0.10024261474609375, 0.1268157958984375, 0.15338897705078125, 0.179962158203125, 0.20653533935546875, 0.2331085205078125, 0.25968170166015625, 0.2862548828125, 0.31282806396484375, 0.3394012451171875, 0.36597442626953125, 0.392547607421875, 0.41912078857421875, 0.4456939697265625, 0.47226715087890625, 0.49884033203125, 0.5254135131835938, 0.5519866943359375, 0.5785598754882812, 0.605133056640625, 0.6317062377929688, 0.6582794189453125, 0.6848526000976562, 0.71142578125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 10.0, 20.0, 31.0, 79.0, 186.0, 260.0, 226.0, 104.0, 39.0, 23.0, 9.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.947851181030273, -5.645381450653076, -5.342912197113037, -5.04044246673584, -4.737973213195801, -4.4355034828186035, -4.133033752441406, -3.830564260482788, -3.52809476852417, -3.2256252765655518, -2.9231557846069336, -2.6206860542297363, -2.318216562271118, -2.0157470703125, -1.7132774591445923, -1.4108078479766846, -1.1083383560180664, -0.8058688044548035, -0.5033992528915405, -0.2009297013282776, 0.10153985023498535, 0.4040093421936035, 0.7064789533615112, 1.008948564529419, 1.311418056488037, 1.6138875484466553, 1.916357159614563, 2.2188267707824707, 2.521296262741089, 2.823765754699707, 3.1262354850769043, 3.4287049770355225, 3.731175422668457, 4.033645153045654, 4.336114406585693, 4.638584136962891, 4.94105339050293, 5.243523120880127, 5.545992851257324, 5.848462104797363, 6.1509318351745605, 6.453401565551758, 6.755870819091797, 7.058340549468994, 7.360810279846191, 7.6632795333862305, 7.965749263763428, 8.268218994140625, 8.570688247680664, 8.873157501220703, 9.175627708435059, 9.478096961975098, 9.780566215515137, 10.083036422729492, 10.385505676269531, 10.68797492980957, 10.99044418334961, 11.292913436889648, 11.595383644104004, 11.897852897644043, 12.200322151184082, 12.502792358398438, 12.805261611938477, 13.107730865478516, 13.410201072692871]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 3.0, 7.0, 5.0, 10.0, 5.0, 6.0, 11.0, 16.0, 23.0, 23.0, 17.0, 24.0, 19.0, 36.0, 39.0, 30.0, 40.0, 46.0, 42.0, 47.0, 41.0, 42.0, 35.0, 38.0, 40.0, 40.0, 30.0, 34.0, 30.0, 25.0, 27.0, 18.0, 15.0, 24.0, 20.0, 21.0, 12.0, 9.0, 11.0, 11.0, 12.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.243656635284424, -2.1755335330963135, -2.1074106693267822, -2.039287567138672, -1.971164584159851, -1.9030416011810303, -1.83491849899292, -1.7667955160140991, -1.6986725330352783, -1.6305495500564575, -1.5624265670776367, -1.4943034648895264, -1.4261804819107056, -1.3580574989318848, -1.2899343967437744, -1.2218114137649536, -1.1536884307861328, -1.085565447807312, -1.0174424648284912, -0.9493193626403809, -0.8811963796615601, -0.8130733966827393, -0.7449503540992737, -0.6768273115158081, -0.6087043285369873, -0.5405813455581665, -0.4724583029747009, -0.40433529019355774, -0.33621227741241455, -0.26808926463127136, -0.19996625185012817, -0.13184323906898499, -0.0637204647064209, 0.00440254807472229, 0.07252556085586548, 0.14064857363700867, 0.20877158641815186, 0.27689459919929504, 0.34501761198043823, 0.4131406247615814, 0.4812636375427246, 0.5493866205215454, 0.617509663105011, 0.6856327056884766, 0.7537556886672974, 0.8218786716461182, 0.8900017142295837, 0.9581247568130493, 1.0262477397918701, 1.094370722770691, 1.1624937057495117, 1.230616807937622, 1.2987397909164429, 1.3668627738952637, 1.434985876083374, 1.5031088590621948, 1.5712318420410156, 1.6393548250198364, 1.7074778079986572, 1.7756009101867676, 1.8437238931655884, 1.9118468761444092, 1.9799699783325195, 2.048092842102051, 2.116215944290161]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 8.0, 6.0, 12.0, 33.0, 27.0, 44.0, 59.0, 98.0, 186.0, 237.0, 481.0, 827.0, 1510.0, 3310.0, 8380.0, 27488.0, 231518.0, 3415225.0, 453968.0, 33589.0, 9638.0, 3810.0, 1611.0, 856.0, 501.0, 304.0, 171.0, 117.0, 84.0, 47.0, 34.0, 23.0, 23.0, 14.0, 10.0, 11.0, 5.0, 8.0, 1.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92431640625, -0.8867263793945312, -0.8491363525390625, -0.8115463256835938, -0.773956298828125, -0.7363662719726562, -0.6987762451171875, -0.6611862182617188, -0.62359619140625, -0.5860061645507812, -0.5484161376953125, -0.5108261108398438, -0.473236083984375, -0.43564605712890625, -0.3980560302734375, -0.36046600341796875, -0.3228759765625, -0.28528594970703125, -0.2476959228515625, -0.21010589599609375, -0.172515869140625, -0.13492584228515625, -0.0973358154296875, -0.05974578857421875, -0.02215576171875, 0.01543426513671875, 0.0530242919921875, 0.09061431884765625, 0.128204345703125, 0.16579437255859375, 0.2033843994140625, 0.24097442626953125, 0.278564453125, 0.31615447998046875, 0.3537445068359375, 0.39133453369140625, 0.428924560546875, 0.46651458740234375, 0.5041046142578125, 0.5416946411132812, 0.57928466796875, 0.6168746948242188, 0.6544647216796875, 0.6920547485351562, 0.729644775390625, 0.7672348022460938, 0.8048248291015625, 0.8424148559570312, 0.8800048828125, 0.9175949096679688, 0.9551849365234375, 0.9927749633789062, 1.030364990234375, 1.0679550170898438, 1.1055450439453125, 1.1431350708007812, 1.18072509765625, 1.2183151245117188, 1.2559051513671875, 1.2934951782226562, 1.331085205078125, 1.3686752319335938, 1.4062652587890625, 1.4438552856445312, 1.4814453125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 9.0, 1.0, 5.0, 8.0, 15.0, 17.0, 10.0, 16.0, 16.0, 30.0, 33.0, 35.0, 34.0, 51.0, 41.0, 54.0, 34.0, 60.0, 50.0, 55.0, 53.0, 58.0, 45.0, 29.0, 63.0, 36.0, 24.0, 21.0, 19.0, 17.0, 14.0, 10.0, 6.0, 9.0, 2.0, 9.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.253173828125, -0.24277114868164062, -0.23236846923828125, -0.22196578979492188, -0.2115631103515625, -0.20116043090820312, -0.19075775146484375, -0.18035507202148438, -0.169952392578125, -0.15954971313476562, -0.14914703369140625, -0.13874435424804688, -0.1283416748046875, -0.11793899536132812, -0.10753631591796875, -0.09713363647460938, -0.08673095703125, -0.07632827758789062, -0.06592559814453125, -0.055522918701171875, -0.0451202392578125, -0.034717559814453125, -0.02431488037109375, -0.013912200927734375, -0.003509521484375, 0.006893157958984375, 0.01729583740234375, 0.027698516845703125, 0.0381011962890625, 0.048503875732421875, 0.05890655517578125, 0.06930923461914062, 0.0797119140625, 0.09011459350585938, 0.10051727294921875, 0.11091995239257812, 0.1213226318359375, 0.13172531127929688, 0.14212799072265625, 0.15253067016601562, 0.162933349609375, 0.17333602905273438, 0.18373870849609375, 0.19414138793945312, 0.2045440673828125, 0.21494674682617188, 0.22534942626953125, 0.23575210571289062, 0.24615478515625, 0.2565574645996094, 0.26696014404296875, 0.2773628234863281, 0.2877655029296875, 0.2981681823730469, 0.30857086181640625, 0.3189735412597656, 0.329376220703125, 0.3397789001464844, 0.35018157958984375, 0.3605842590332031, 0.3709869384765625, 0.3813896179199219, 0.39179229736328125, 0.4021949768066406, 0.41259765625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 8.0, 14.0, 18.0, 18.0, 19.0, 23.0, 25.0, 22.0, 38.0, 55.0, 80.0, 100.0, 150.0, 227.0, 301.0, 530.0, 1032.0, 2116.0, 4729.0, 12219.0, 42935.0, 300777.0, 3545183.0, 227053.0, 37028.0, 10971.0, 4256.0, 1880.0, 949.0, 507.0, 306.0, 181.0, 136.0, 92.0, 61.0, 62.0, 31.0, 23.0, 29.0, 32.0, 10.0, 14.0, 10.0, 10.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-1.2919921875, -1.2495574951171875, -1.207122802734375, -1.1646881103515625, -1.12225341796875, -1.0798187255859375, -1.037384033203125, -0.9949493408203125, -0.9525146484375, -0.9100799560546875, -0.867645263671875, -0.8252105712890625, -0.78277587890625, -0.7403411865234375, -0.697906494140625, -0.6554718017578125, -0.613037109375, -0.5706024169921875, -0.528167724609375, -0.4857330322265625, -0.44329833984375, -0.4008636474609375, -0.358428955078125, -0.3159942626953125, -0.2735595703125, -0.2311248779296875, -0.188690185546875, -0.1462554931640625, -0.10382080078125, -0.0613861083984375, -0.018951416015625, 0.0234832763671875, 0.06591796875, 0.1083526611328125, 0.150787353515625, 0.1932220458984375, 0.23565673828125, 0.2780914306640625, 0.320526123046875, 0.3629608154296875, 0.4053955078125, 0.4478302001953125, 0.490264892578125, 0.5326995849609375, 0.57513427734375, 0.6175689697265625, 0.660003662109375, 0.7024383544921875, 0.744873046875, 0.7873077392578125, 0.829742431640625, 0.8721771240234375, 0.91461181640625, 0.9570465087890625, 0.999481201171875, 1.0419158935546875, 1.0843505859375, 1.1267852783203125, 1.169219970703125, 1.2116546630859375, 1.25408935546875, 1.2965240478515625, 1.338958740234375, 1.3813934326171875, 1.423828125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 2.0, 9.0, 4.0, 12.0, 10.0, 24.0, 24.0, 47.0, 93.0, 141.0, 383.0, 1151.0, 1260.0, 442.0, 208.0, 88.0, 61.0, 38.0, 27.0, 17.0, 10.0, 7.0, 4.0, 8.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.931640625, -1.8867874145507812, -1.8419342041015625, -1.7970809936523438, -1.752227783203125, -1.7073745727539062, -1.6625213623046875, -1.6176681518554688, -1.57281494140625, -1.5279617309570312, -1.4831085205078125, -1.4382553100585938, -1.393402099609375, -1.3485488891601562, -1.3036956787109375, -1.2588424682617188, -1.2139892578125, -1.1691360473632812, -1.1242828369140625, -1.0794296264648438, -1.034576416015625, -0.9897232055664062, -0.9448699951171875, -0.9000167846679688, -0.85516357421875, -0.8103103637695312, -0.7654571533203125, -0.7206039428710938, -0.675750732421875, -0.6308975219726562, -0.5860443115234375, -0.5411911010742188, -0.496337890625, -0.45148468017578125, -0.4066314697265625, -0.36177825927734375, -0.316925048828125, -0.27207183837890625, -0.2272186279296875, -0.18236541748046875, -0.13751220703125, -0.09265899658203125, -0.0478057861328125, -0.00295257568359375, 0.041900634765625, 0.08675384521484375, 0.1316070556640625, 0.17646026611328125, 0.2213134765625, 0.26616668701171875, 0.3110198974609375, 0.35587310791015625, 0.400726318359375, 0.44557952880859375, 0.4904327392578125, 0.5352859497070312, 0.58013916015625, 0.6249923706054688, 0.6698455810546875, 0.7146987915039062, 0.759552001953125, 0.8044052124023438, 0.8492584228515625, 0.8941116333007812, 0.93896484375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 4.0, 7.0, 6.0, 11.0, 19.0, 19.0, 31.0, 49.0, 91.0, 152.0, 184.0, 156.0, 99.0, 63.0, 50.0, 22.0, 16.0, 9.0, 3.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.995985507965088, -7.765048503875732, -7.534111499786377, -7.30317497253418, -7.072237968444824, -6.841300964355469, -6.610363960266113, -6.379426956176758, -6.148489952087402, -5.917552947998047, -5.686615943908691, -5.455678939819336, -5.224742412567139, -4.993805408477783, -4.762868404388428, -4.531931400299072, -4.300994873046875, -4.0700578689575195, -3.839121103286743, -3.6081840991973877, -3.3772473335266113, -3.146310329437256, -2.9153733253479004, -2.684436321258545, -2.4534995555877686, -2.222562551498413, -1.9916257858276367, -1.7606887817382812, -1.5297518968582153, -1.2988150119781494, -1.067878007888794, -0.836941123008728, -0.6060042381286621, -0.3750673234462738, -0.1441304087638855, 0.0868065357208252, 0.3177434206008911, 0.548680305480957, 0.7796173095703125, 1.0105541944503784, 1.2414910793304443, 1.4724279642105103, 1.7033648490905762, 1.9343018531799316, 2.165238857269287, 2.3961756229400635, 2.627112627029419, 2.8580493927001953, 3.088986396789551, 3.3199234008789062, 3.5508601665496826, 3.781797170639038, 4.0127339363098145, 4.24367094039917, 4.474607944488525, 4.705544948577881, 4.936481475830078, 5.167418479919434, 5.398355484008789, 5.6292924880981445, 5.860229015350342, 6.091166019439697, 6.322103023529053, 6.553040027618408, 6.783977031707764]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 5.0, 3.0, 3.0, 6.0, 4.0, 9.0, 9.0, 9.0, 12.0, 14.0, 12.0, 18.0, 22.0, 20.0, 32.0, 27.0, 32.0, 31.0, 39.0, 41.0, 34.0, 45.0, 38.0, 35.0, 41.0, 36.0, 40.0, 29.0, 36.0, 23.0, 32.0, 29.0, 29.0, 36.0, 23.0, 18.0, 28.0, 19.0, 21.0, 19.0, 11.0, 6.0, 8.0, 8.0, 7.0, 6.0, 3.0, 5.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.7918624877929688, -2.7075257301330566, -2.6231889724731445, -2.5388522148132324, -2.454515218734741, -2.370178461074829, -2.285841703414917, -2.201504945755005, -2.1171679496765137, -2.0328311920166016, -1.9484943151474, -1.8641575574874878, -1.7798206806182861, -1.695483922958374, -1.611147165298462, -1.5268104076385498, -1.4424736499786377, -1.3581368923187256, -1.273800015449524, -1.1894632577896118, -1.1051263809204102, -1.020789623260498, -0.9364528656005859, -0.852116048336029, -0.7677792310714722, -0.6834424138069153, -0.5991055965423584, -0.5147688388824463, -0.4304320216178894, -0.3460952043533325, -0.2617584466934204, -0.17742162942886353, -0.09308481216430664, -0.00874800980091095, 0.07558879256248474, 0.15992558002471924, 0.24426239728927612, 0.328599214553833, 0.4129359722137451, 0.497272789478302, 0.5816096067428589, 0.6659464240074158, 0.7502832412719727, 0.8346199989318848, 0.9189568161964417, 1.0032936334609985, 1.0876303911209106, 1.1719672679901123, 1.2563040256500244, 1.3406407833099365, 1.4249776601791382, 1.5093144178390503, 1.593651294708252, 1.677988052368164, 1.7623248100280762, 1.8466615676879883, 1.93099844455719, 2.0153353214263916, 2.0996720790863037, 2.184008836746216, 2.268345594406128, 2.352682590484619, 2.4370193481445312, 2.5213561058044434, 2.6056928634643555]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 6.0, 12.0, 20.0, 21.0, 34.0, 92.0, 181.0, 346.0, 668.0, 1563.0, 3690.0, 9028.0, 25206.0, 81449.0, 325436.0, 435956.0, 112177.0, 32908.0, 11585.0, 4556.0, 1995.0, 837.0, 398.0, 170.0, 89.0, 42.0, 34.0, 22.0, 11.0, 6.0, 9.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7646484375, -1.70794677734375, -1.6512451171875, -1.59454345703125, -1.537841796875, -1.48114013671875, -1.4244384765625, -1.36773681640625, -1.31103515625, -1.25433349609375, -1.1976318359375, -1.14093017578125, -1.084228515625, -1.02752685546875, -0.9708251953125, -0.91412353515625, -0.857421875, -0.80072021484375, -0.7440185546875, -0.68731689453125, -0.630615234375, -0.57391357421875, -0.5172119140625, -0.46051025390625, -0.40380859375, -0.34710693359375, -0.2904052734375, -0.23370361328125, -0.177001953125, -0.12030029296875, -0.0635986328125, -0.00689697265625, 0.0498046875, 0.10650634765625, 0.1632080078125, 0.21990966796875, 0.276611328125, 0.33331298828125, 0.3900146484375, 0.44671630859375, 0.50341796875, 0.56011962890625, 0.6168212890625, 0.67352294921875, 0.730224609375, 0.78692626953125, 0.8436279296875, 0.90032958984375, 0.95703125, 1.01373291015625, 1.0704345703125, 1.12713623046875, 1.183837890625, 1.24053955078125, 1.2972412109375, 1.35394287109375, 1.41064453125, 1.46734619140625, 1.5240478515625, 1.58074951171875, 1.637451171875, 1.69415283203125, 1.7508544921875, 1.80755615234375, 1.8642578125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 8.0, 9.0, 7.0, 10.0, 11.0, 13.0, 16.0, 15.0, 12.0, 22.0, 23.0, 32.0, 28.0, 44.0, 39.0, 35.0, 40.0, 29.0, 30.0, 40.0, 40.0, 49.0, 49.0, 35.0, 39.0, 37.0, 41.0, 30.0, 27.0, 31.0, 35.0, 17.0, 20.0, 19.0, 9.0, 20.0, 13.0, 3.0, 5.0, 3.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.306884765625, -0.2961311340332031, -0.28537750244140625, -0.2746238708496094, -0.2638702392578125, -0.2531166076660156, -0.24236297607421875, -0.23160934448242188, -0.220855712890625, -0.21010208129882812, -0.19934844970703125, -0.18859481811523438, -0.1778411865234375, -0.16708755493164062, -0.15633392333984375, -0.14558029174804688, -0.13482666015625, -0.12407302856445312, -0.11331939697265625, -0.10256576538085938, -0.0918121337890625, -0.08105850219726562, -0.07030487060546875, -0.059551239013671875, -0.048797607421875, -0.038043975830078125, -0.02729034423828125, -0.016536712646484375, -0.0057830810546875, 0.004970550537109375, 0.01572418212890625, 0.026477813720703125, 0.0372314453125, 0.047985076904296875, 0.05873870849609375, 0.06949234008789062, 0.0802459716796875, 0.09099960327148438, 0.10175323486328125, 0.11250686645507812, 0.123260498046875, 0.13401412963867188, 0.14476776123046875, 0.15552139282226562, 0.1662750244140625, 0.17702865600585938, 0.18778228759765625, 0.19853591918945312, 0.20928955078125, 0.22004318237304688, 0.23079681396484375, 0.24155044555664062, 0.2523040771484375, 0.2630577087402344, 0.27381134033203125, 0.2845649719238281, 0.295318603515625, 0.3060722351074219, 0.31682586669921875, 0.3275794982910156, 0.3383331298828125, 0.3490867614746094, 0.35984039306640625, 0.3705940246582031, 0.38134765625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 6.0, 3.0, 7.0, 14.0, 12.0, 31.0, 42.0, 80.0, 113.0, 193.0, 346.0, 517.0, 951.0, 1735.0, 3593.0, 7380.0, 17236.0, 44657.0, 134587.0, 454053.0, 258937.0, 74986.0, 27106.0, 11227.0, 5131.0, 2569.0, 1278.0, 716.0, 397.0, 256.0, 142.0, 98.0, 53.0, 30.0, 19.0, 16.0, 10.0, 8.0, 7.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.79296875, -1.7428131103515625, -1.692657470703125, -1.6425018310546875, -1.59234619140625, -1.5421905517578125, -1.492034912109375, -1.4418792724609375, -1.3917236328125, -1.3415679931640625, -1.291412353515625, -1.2412567138671875, -1.19110107421875, -1.1409454345703125, -1.090789794921875, -1.0406341552734375, -0.990478515625, -0.9403228759765625, -0.890167236328125, -0.8400115966796875, -0.78985595703125, -0.7397003173828125, -0.689544677734375, -0.6393890380859375, -0.5892333984375, -0.5390777587890625, -0.488922119140625, -0.4387664794921875, -0.38861083984375, -0.3384552001953125, -0.288299560546875, -0.2381439208984375, -0.18798828125, -0.1378326416015625, -0.087677001953125, -0.0375213623046875, 0.01263427734375, 0.0627899169921875, 0.112945556640625, 0.1631011962890625, 0.2132568359375, 0.2634124755859375, 0.313568115234375, 0.3637237548828125, 0.41387939453125, 0.4640350341796875, 0.514190673828125, 0.5643463134765625, 0.614501953125, 0.6646575927734375, 0.714813232421875, 0.7649688720703125, 0.81512451171875, 0.8652801513671875, 0.915435791015625, 0.9655914306640625, 1.0157470703125, 1.0659027099609375, 1.116058349609375, 1.1662139892578125, 1.21636962890625, 1.2665252685546875, 1.316680908203125, 1.3668365478515625, 1.4169921875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 3.0, 2.0, 9.0, 10.0, 9.0, 11.0, 5.0, 14.0, 20.0, 18.0, 17.0, 25.0, 35.0, 36.0, 31.0, 33.0, 40.0, 37.0, 51.0, 47.0, 43.0, 67.0, 54.0, 46.0, 51.0, 44.0, 37.0, 22.0, 29.0, 28.0, 21.0, 32.0, 15.0, 16.0, 9.0, 8.0, 10.0, 4.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3125, -1.2727508544921875, -1.233001708984375, -1.1932525634765625, -1.15350341796875, -1.1137542724609375, -1.074005126953125, -1.0342559814453125, -0.9945068359375, -0.9547576904296875, -0.915008544921875, -0.8752593994140625, -0.83551025390625, -0.7957611083984375, -0.756011962890625, -0.7162628173828125, -0.676513671875, -0.6367645263671875, -0.597015380859375, -0.5572662353515625, -0.51751708984375, -0.4777679443359375, -0.438018798828125, -0.3982696533203125, -0.3585205078125, -0.3187713623046875, -0.279022216796875, -0.2392730712890625, -0.19952392578125, -0.1597747802734375, -0.120025634765625, -0.0802764892578125, -0.04052734375, -0.0007781982421875, 0.038970947265625, 0.0787200927734375, 0.11846923828125, 0.1582183837890625, 0.197967529296875, 0.2377166748046875, 0.2774658203125, 0.3172149658203125, 0.356964111328125, 0.3967132568359375, 0.43646240234375, 0.4762115478515625, 0.515960693359375, 0.5557098388671875, 0.595458984375, 0.6352081298828125, 0.674957275390625, 0.7147064208984375, 0.75445556640625, 0.7942047119140625, 0.833953857421875, 0.8737030029296875, 0.9134521484375, 0.9532012939453125, 0.992950439453125, 1.0326995849609375, 1.07244873046875, 1.1121978759765625, 1.151947021484375, 1.1916961669921875, 1.2314453125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 3.0, 6.0, 20.0, 16.0, 40.0, 41.0, 68.0, 88.0, 193.0, 314.0, 507.0, 814.0, 1477.0, 2924.0, 6863.0, 18198.0, 94000.0, 828936.0, 66614.0, 15310.0, 6029.0, 2773.0, 1427.0, 745.0, 448.0, 265.0, 148.0, 89.0, 60.0, 45.0, 38.0, 13.0, 13.0, 8.0, 5.0, 1.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.294921875, -1.25091552734375, -1.2069091796875, -1.16290283203125, -1.118896484375, -1.07489013671875, -1.0308837890625, -0.98687744140625, -0.94287109375, -0.89886474609375, -0.8548583984375, -0.81085205078125, -0.766845703125, -0.72283935546875, -0.6788330078125, -0.63482666015625, -0.5908203125, -0.54681396484375, -0.5028076171875, -0.45880126953125, -0.414794921875, -0.37078857421875, -0.3267822265625, -0.28277587890625, -0.23876953125, -0.19476318359375, -0.1507568359375, -0.10675048828125, -0.062744140625, -0.01873779296875, 0.0252685546875, 0.06927490234375, 0.11328125, 0.15728759765625, 0.2012939453125, 0.24530029296875, 0.289306640625, 0.33331298828125, 0.3773193359375, 0.42132568359375, 0.46533203125, 0.50933837890625, 0.5533447265625, 0.59735107421875, 0.641357421875, 0.68536376953125, 0.7293701171875, 0.77337646484375, 0.8173828125, 0.86138916015625, 0.9053955078125, 0.94940185546875, 0.993408203125, 1.03741455078125, 1.0814208984375, 1.12542724609375, 1.16943359375, 1.21343994140625, 1.2574462890625, 1.30145263671875, 1.345458984375, 1.38946533203125, 1.4334716796875, 1.47747802734375, 1.521484375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 2.0, 9.0, 5.0, 8.0, 15.0, 36.0, 156.0, 582.0, 102.0, 30.0, 17.0, 8.0, 7.0, 5.0, 6.0, 0.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007238388061523438, -0.0006992220878601074, -0.0006746053695678711, -0.0006499886512756348, -0.0006253719329833984, -0.0006007552146911621, -0.0005761384963989258, -0.0005515217781066895, -0.0005269050598144531, -0.0005022883415222168, -0.00047767162322998047, -0.00045305490493774414, -0.0004284381866455078, -0.0004038214683532715, -0.00037920475006103516, -0.00035458803176879883, -0.0003299713134765625, -0.00030535459518432617, -0.00028073787689208984, -0.0002561211585998535, -0.0002315044403076172, -0.00020688772201538086, -0.00018227100372314453, -0.0001576542854309082, -0.00013303756713867188, -0.00010842084884643555, -8.380413055419922e-05, -5.918741226196289e-05, -3.457069396972656e-05, -9.953975677490234e-06, 1.4662742614746094e-05, 3.927946090698242e-05, 6.389617919921875e-05, 8.851289749145508e-05, 0.0001131296157836914, 0.00013774633407592773, 0.00016236305236816406, 0.0001869797706604004, 0.00021159648895263672, 0.00023621320724487305, 0.0002608299255371094, 0.0002854466438293457, 0.00031006336212158203, 0.00033468008041381836, 0.0003592967987060547, 0.000383913516998291, 0.00040853023529052734, 0.00043314695358276367, 0.000457763671875, 0.00048238039016723633, 0.0005069971084594727, 0.000531613826751709, 0.0005562305450439453, 0.0005808472633361816, 0.000605463981628418, 0.0006300806999206543, 0.0006546974182128906, 0.000679314136505127, 0.0007039308547973633, 0.0007285475730895996, 0.0007531642913818359, 0.0007777810096740723, 0.0008023977279663086, 0.0008270144462585449, 0.0008516311645507812]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 5.0, 8.0, 9.0, 9.0, 17.0, 25.0, 37.0, 68.0, 103.0, 195.0, 291.0, 481.0, 837.0, 1569.0, 3064.0, 6121.0, 13283.0, 34251.0, 263330.0, 644375.0, 48550.0, 16504.0, 7451.0, 3604.0, 1928.0, 1054.0, 561.0, 317.0, 185.0, 113.0, 69.0, 42.0, 26.0, 17.0, 16.0, 8.0, 13.0, 4.0, 6.0, 6.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.4775390625, -1.4366455078125, -1.395751953125, -1.3548583984375, -1.31396484375, -1.2730712890625, -1.232177734375, -1.1912841796875, -1.150390625, -1.1094970703125, -1.068603515625, -1.0277099609375, -0.98681640625, -0.9459228515625, -0.905029296875, -0.8641357421875, -0.8232421875, -0.7823486328125, -0.741455078125, -0.7005615234375, -0.65966796875, -0.6187744140625, -0.577880859375, -0.5369873046875, -0.49609375, -0.4552001953125, -0.414306640625, -0.3734130859375, -0.33251953125, -0.2916259765625, -0.250732421875, -0.2098388671875, -0.1689453125, -0.1280517578125, -0.087158203125, -0.0462646484375, -0.00537109375, 0.0355224609375, 0.076416015625, 0.1173095703125, 0.158203125, 0.1990966796875, 0.239990234375, 0.2808837890625, 0.32177734375, 0.3626708984375, 0.403564453125, 0.4444580078125, 0.4853515625, 0.5262451171875, 0.567138671875, 0.6080322265625, 0.64892578125, 0.6898193359375, 0.730712890625, 0.7716064453125, 0.8125, 0.8533935546875, 0.894287109375, 0.9351806640625, 0.97607421875, 1.0169677734375, 1.057861328125, 1.0987548828125, 1.1396484375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 8.0, 4.0, 6.0, 10.0, 10.0, 12.0, 8.0, 11.0, 25.0, 34.0, 64.0, 93.0, 179.0, 194.0, 111.0, 60.0, 34.0, 27.0, 17.0, 13.0, 12.0, 9.0, 8.0, 5.0, 7.0, 9.0, 5.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7177734375, -0.6902618408203125, -0.662750244140625, -0.6352386474609375, -0.60772705078125, -0.5802154541015625, -0.552703857421875, -0.5251922607421875, -0.4976806640625, -0.4701690673828125, -0.442657470703125, -0.4151458740234375, -0.38763427734375, -0.3601226806640625, -0.332611083984375, -0.3050994873046875, -0.277587890625, -0.2500762939453125, -0.222564697265625, -0.1950531005859375, -0.16754150390625, -0.1400299072265625, -0.112518310546875, -0.0850067138671875, -0.0574951171875, -0.0299835205078125, -0.002471923828125, 0.0250396728515625, 0.05255126953125, 0.0800628662109375, 0.107574462890625, 0.1350860595703125, 0.16259765625, 0.1901092529296875, 0.217620849609375, 0.2451324462890625, 0.27264404296875, 0.3001556396484375, 0.327667236328125, 0.3551788330078125, 0.3826904296875, 0.4102020263671875, 0.437713623046875, 0.4652252197265625, 0.49273681640625, 0.5202484130859375, 0.547760009765625, 0.5752716064453125, 0.602783203125, 0.6302947998046875, 0.657806396484375, 0.6853179931640625, 0.71282958984375, 0.7403411865234375, 0.767852783203125, 0.7953643798828125, 0.8228759765625, 0.8503875732421875, 0.877899169921875, 0.9054107666015625, 0.93292236328125, 0.9604339599609375, 0.987945556640625, 1.0154571533203125, 1.04296875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 15.0, 17.0, 33.0, 73.0, 178.0, 290.0, 212.0, 88.0, 56.0, 16.0, 11.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.276638984680176, -9.728499412536621, -9.18035888671875, -8.632219314575195, -8.08407974243164, -7.5359392166137695, -6.987799644470215, -6.439659595489502, -5.891519546508789, -5.343379497528076, -4.795239448547363, -4.247099876403809, -3.6989598274230957, -3.150819778442383, -2.602679967880249, -2.0545401573181152, -1.5064001083374023, -0.958260178565979, -0.41012024879455566, 0.13801968097686768, 0.686159610748291, 1.234299659729004, 1.7824394702911377, 2.3305792808532715, 2.8787193298339844, 3.4268593788146973, 3.974999189376831, 4.523138999938965, 5.071279048919678, 5.619419097900391, 6.167558670043945, 6.715698719024658, 7.263837814331055, 7.811977863311768, 8.36011791229248, 8.908257484436035, 9.456398010253906, 10.004537582397461, 10.552677154541016, 11.10081672668457, 11.648957252502441, 12.197096824645996, 12.745237350463867, 13.293376922607422, 13.841516494750977, 14.389657020568848, 14.937796592712402, 15.485937118530273, 16.034076690673828, 16.582216262817383, 17.130355834960938, 17.678497314453125, 18.22663688659668, 18.774776458740234, 19.32291603088379, 19.871055603027344, 20.41919708251953, 20.967336654663086, 21.51547622680664, 22.063617706298828, 22.611757278442383, 23.159896850585938, 23.708036422729492, 24.256175994873047, 24.8043155670166]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 9.0, 6.0, 8.0, 10.0, 12.0, 24.0, 21.0, 18.0, 37.0, 35.0, 26.0, 28.0, 38.0, 57.0, 31.0, 41.0, 68.0, 41.0, 53.0, 50.0, 46.0, 47.0, 49.0, 46.0, 39.0, 20.0, 21.0, 25.0, 13.0, 18.0, 5.0, 10.0, 15.0, 8.0, 6.0, 6.0, 1.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.18975567817688, -3.063262462615967, -2.9367692470550537, -2.8102760314941406, -2.6837830543518066, -2.5572898387908936, -2.4307966232299805, -2.3043034076690674, -2.1778101921081543, -2.051316976547241, -1.9248238801956177, -1.7983306646347046, -1.671837568283081, -1.545344352722168, -1.4188511371612549, -1.2923579216003418, -1.1658649444580078, -1.0393717288970947, -0.9128786325454712, -0.7863854169845581, -0.6598922610282898, -0.5333991050720215, -0.4069058895111084, -0.2804127335548401, -0.15391957759857178, -0.027426406741142273, 0.09906676411628723, 0.22555994987487793, 0.35205310583114624, 0.47854626178741455, 0.6050394773483276, 0.731532633304596, 0.8580260276794434, 0.9845191836357117, 1.11101233959198, 1.237505555152893, 1.3639986515045166, 1.4904918670654297, 1.6169850826263428, 1.7434782981872559, 1.8699713945388794, 1.9964646100997925, 2.122957706451416, 2.249450922012329, 2.375944137573242, 2.502437114715576, 2.6289305686950684, 2.7554235458374023, 2.8819167613983154, 3.0084099769592285, 3.1349031925201416, 3.2613964080810547, 3.3878893852233887, 3.5143826007843018, 3.640875816345215, 3.767369031906128, 3.893862247467041, 4.020355224609375, 4.146848678588867, 4.273341655731201, 4.399835109710693, 4.526328086853027, 4.6528215408325195, 4.7793145179748535, 4.9058074951171875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 8.0, 5.0, 4.0, 10.0, 9.0, 19.0, 24.0, 33.0, 69.0, 125.0, 213.0, 587.0, 1772.0, 8065.0, 85353.0, 3916523.0, 167746.0, 9976.0, 2259.0, 786.0, 333.0, 154.0, 83.0, 55.0, 26.0, 23.0, 12.0, 5.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.025390625, -2.929595947265625, -2.83380126953125, -2.738006591796875, -2.6422119140625, -2.546417236328125, -2.45062255859375, -2.354827880859375, -2.259033203125, -2.163238525390625, -2.06744384765625, -1.971649169921875, -1.8758544921875, -1.780059814453125, -1.68426513671875, -1.588470458984375, -1.49267578125, -1.396881103515625, -1.30108642578125, -1.205291748046875, -1.1094970703125, -1.013702392578125, -0.91790771484375, -0.822113037109375, -0.726318359375, -0.630523681640625, -0.53472900390625, -0.438934326171875, -0.3431396484375, -0.247344970703125, -0.15155029296875, -0.055755615234375, 0.0400390625, 0.135833740234375, 0.23162841796875, 0.327423095703125, 0.4232177734375, 0.519012451171875, 0.61480712890625, 0.710601806640625, 0.806396484375, 0.902191162109375, 0.99798583984375, 1.093780517578125, 1.1895751953125, 1.285369873046875, 1.38116455078125, 1.476959228515625, 1.57275390625, 1.668548583984375, 1.76434326171875, 1.860137939453125, 1.9559326171875, 2.051727294921875, 2.14752197265625, 2.243316650390625, 2.339111328125, 2.434906005859375, 2.53070068359375, 2.626495361328125, 2.7222900390625, 2.818084716796875, 2.91387939453125, 3.009674072265625, 3.10546875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 7.0, 5.0, 4.0, 9.0, 12.0, 23.0, 29.0, 26.0, 37.0, 56.0, 64.0, 62.0, 78.0, 71.0, 86.0, 77.0, 85.0, 59.0, 53.0, 61.0, 25.0, 26.0, 16.0, 10.0, 15.0, 8.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65478515625, -0.6306228637695312, -0.6064605712890625, -0.5822982788085938, -0.558135986328125, -0.5339736938476562, -0.5098114013671875, -0.48564910888671875, -0.46148681640625, -0.43732452392578125, -0.4131622314453125, -0.38899993896484375, -0.364837646484375, -0.34067535400390625, -0.3165130615234375, -0.29235076904296875, -0.2681884765625, -0.24402618408203125, -0.2198638916015625, -0.19570159912109375, -0.171539306640625, -0.14737701416015625, -0.1232147216796875, -0.09905242919921875, -0.07489013671875, -0.05072784423828125, -0.0265655517578125, -0.00240325927734375, 0.021759033203125, 0.04592132568359375, 0.0700836181640625, 0.09424591064453125, 0.118408203125, 0.14257049560546875, 0.1667327880859375, 0.19089508056640625, 0.215057373046875, 0.23921966552734375, 0.2633819580078125, 0.28754425048828125, 0.31170654296875, 0.33586883544921875, 0.3600311279296875, 0.38419342041015625, 0.408355712890625, 0.43251800537109375, 0.4566802978515625, 0.48084259033203125, 0.5050048828125, 0.5291671752929688, 0.5533294677734375, 0.5774917602539062, 0.601654052734375, 0.6258163452148438, 0.6499786376953125, 0.6741409301757812, 0.69830322265625, 0.7224655151367188, 0.7466278076171875, 0.7707901000976562, 0.794952392578125, 0.8191146850585938, 0.8432769775390625, 0.8674392700195312, 0.8916015625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 11.0, 7.0, 16.0, 15.0, 22.0, 33.0, 50.0, 82.0, 92.0, 129.0, 180.0, 298.0, 562.0, 1268.0, 3464.0, 16984.0, 727584.0, 3409406.0, 26272.0, 4581.0, 1489.0, 685.0, 340.0, 209.0, 146.0, 111.0, 77.0, 43.0, 45.0, 17.0, 26.0, 10.0, 19.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.33203125, -3.217529296875, -3.10302734375, -2.988525390625, -2.8740234375, -2.759521484375, -2.64501953125, -2.530517578125, -2.416015625, -2.301513671875, -2.18701171875, -2.072509765625, -1.9580078125, -1.843505859375, -1.72900390625, -1.614501953125, -1.5, -1.385498046875, -1.27099609375, -1.156494140625, -1.0419921875, -0.927490234375, -0.81298828125, -0.698486328125, -0.583984375, -0.469482421875, -0.35498046875, -0.240478515625, -0.1259765625, -0.011474609375, 0.10302734375, 0.217529296875, 0.33203125, 0.446533203125, 0.56103515625, 0.675537109375, 0.7900390625, 0.904541015625, 1.01904296875, 1.133544921875, 1.248046875, 1.362548828125, 1.47705078125, 1.591552734375, 1.7060546875, 1.820556640625, 1.93505859375, 2.049560546875, 2.1640625, 2.278564453125, 2.39306640625, 2.507568359375, 2.6220703125, 2.736572265625, 2.85107421875, 2.965576171875, 3.080078125, 3.194580078125, 3.30908203125, 3.423583984375, 3.5380859375, 3.652587890625, 3.76708984375, 3.881591796875, 3.99609375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 8.0, 5.0, 9.0, 22.0, 57.0, 154.0, 376.0, 1898.0, 1130.0, 231.0, 98.0, 44.0, 20.0, 10.0, 8.0, 4.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.044921875, -1.955291748046875, -1.86566162109375, -1.776031494140625, -1.6864013671875, -1.596771240234375, -1.50714111328125, -1.417510986328125, -1.327880859375, -1.238250732421875, -1.14862060546875, -1.058990478515625, -0.9693603515625, -0.879730224609375, -0.79010009765625, -0.700469970703125, -0.61083984375, -0.521209716796875, -0.43157958984375, -0.341949462890625, -0.2523193359375, -0.162689208984375, -0.07305908203125, 0.016571044921875, 0.106201171875, 0.195831298828125, 0.28546142578125, 0.375091552734375, 0.4647216796875, 0.554351806640625, 0.64398193359375, 0.733612060546875, 0.8232421875, 0.912872314453125, 1.00250244140625, 1.092132568359375, 1.1817626953125, 1.271392822265625, 1.36102294921875, 1.450653076171875, 1.540283203125, 1.629913330078125, 1.71954345703125, 1.809173583984375, 1.8988037109375, 1.988433837890625, 2.07806396484375, 2.167694091796875, 2.25732421875, 2.346954345703125, 2.43658447265625, 2.526214599609375, 2.6158447265625, 2.705474853515625, 2.79510498046875, 2.884735107421875, 2.974365234375, 3.063995361328125, 3.15362548828125, 3.243255615234375, 3.3328857421875, 3.422515869140625, 3.51214599609375, 3.601776123046875, 3.69140625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 13.0, 28.0, 81.0, 255.0, 377.0, 160.0, 54.0, 23.0, 8.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.51102638244629, -21.920936584472656, -21.33084487915039, -20.740755081176758, -20.150665283203125, -19.56057357788086, -18.970483779907227, -18.380393981933594, -17.790302276611328, -17.200212478637695, -16.61012077331543, -16.020030975341797, -15.429941177368164, -14.839850425720215, -14.249759674072266, -13.659669876098633, -13.069580078125, -12.47948932647705, -11.889399528503418, -11.299308776855469, -10.709218978881836, -10.119128227233887, -9.529037475585938, -8.938947677612305, -8.348856925964355, -7.7587666511535645, -7.168676376342773, -6.578585624694824, -5.988495349884033, -5.398405075073242, -4.808314323425293, -4.218224048614502, -3.628131866455078, -3.038041591644287, -2.447951078414917, -1.8578606843948364, -1.2677702903747559, -0.6776800155639648, -0.08758950233459473, 0.5025010108947754, 1.0925912857055664, 1.682681679725647, 2.2727720737457275, 2.8628625869750977, 3.4529528617858887, 4.04304313659668, 4.633133888244629, 5.22322416305542, 5.813314437866211, 6.403404712677002, 6.993494987487793, 7.583585739135742, 8.173675537109375, 8.763766288757324, 9.353857040405273, 9.943946838378906, 10.534037590026855, 11.124128341674805, 11.714218139648438, 12.304308891296387, 12.894399642944336, 13.484489440917969, 14.074580192565918, 14.664670944213867, 15.2547607421875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 8.0, 4.0, 4.0, 13.0, 9.0, 7.0, 16.0, 16.0, 21.0, 30.0, 31.0, 47.0, 48.0, 37.0, 59.0, 58.0, 66.0, 53.0, 52.0, 59.0, 51.0, 51.0, 36.0, 44.0, 36.0, 31.0, 26.0, 20.0, 14.0, 16.0, 14.0, 7.0, 8.0, 7.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.273016452789307, -4.156552791595459, -4.040088653564453, -3.9236247539520264, -3.8071608543395996, -3.690696954727173, -3.574233055114746, -3.4577693939208984, -3.3413052558898926, -3.224841356277466, -3.108377456665039, -2.9919135570526123, -2.8754496574401855, -2.758985757827759, -2.642521858215332, -2.5260581970214844, -2.4095942974090576, -2.293130397796631, -2.176666498184204, -2.0602025985717773, -1.9437386989593506, -1.8272747993469238, -1.7108110189437866, -1.5943471193313599, -1.477883219718933, -1.3614193201065063, -1.2449554204940796, -1.1284916400909424, -1.0120277404785156, -0.8955637812614441, -0.7790999412536621, -0.6626360416412354, -0.5461723804473877, -0.42970848083496094, -0.31324461102485657, -0.1967807412147522, -0.08031684160232544, 0.03614705801010132, 0.1526108980178833, 0.26907479763031006, 0.3855386972427368, 0.5020025968551636, 0.6184664964675903, 0.7349303364753723, 0.8513942360877991, 0.9678581357002258, 1.0843219757080078, 1.2007858753204346, 1.3172497749328613, 1.433713674545288, 1.5501775741577148, 1.6666414737701416, 1.7831053733825684, 1.8995692729949951, 2.016033172607422, 2.1324968338012695, 2.2489609718322754, 2.365424871444702, 2.481888771057129, 2.5983526706695557, 2.7148165702819824, 2.831280469894409, 2.947744369506836, 3.0642080307006836, 3.1806719303131104]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 14.0, 15.0, 32.0, 29.0, 55.0, 105.0, 167.0, 296.0, 555.0, 1155.0, 2906.0, 8690.0, 31325.0, 144862.0, 575912.0, 219709.0, 44372.0, 11668.0, 3805.0, 1393.0, 667.0, 325.0, 170.0, 119.0, 73.0, 50.0, 22.0, 16.0, 14.0, 12.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.908203125, -2.830902099609375, -2.75360107421875, -2.676300048828125, -2.5989990234375, -2.521697998046875, -2.44439697265625, -2.367095947265625, -2.289794921875, -2.212493896484375, -2.13519287109375, -2.057891845703125, -1.9805908203125, -1.903289794921875, -1.82598876953125, -1.748687744140625, -1.67138671875, -1.594085693359375, -1.51678466796875, -1.439483642578125, -1.3621826171875, -1.284881591796875, -1.20758056640625, -1.130279541015625, -1.052978515625, -0.975677490234375, -0.89837646484375, -0.821075439453125, -0.7437744140625, -0.666473388671875, -0.58917236328125, -0.511871337890625, -0.4345703125, -0.357269287109375, -0.27996826171875, -0.202667236328125, -0.1253662109375, -0.048065185546875, 0.02923583984375, 0.106536865234375, 0.183837890625, 0.261138916015625, 0.33843994140625, 0.415740966796875, 0.4930419921875, 0.570343017578125, 0.64764404296875, 0.724945068359375, 0.80224609375, 0.879547119140625, 0.95684814453125, 1.034149169921875, 1.1114501953125, 1.188751220703125, 1.26605224609375, 1.343353271484375, 1.420654296875, 1.497955322265625, 1.57525634765625, 1.652557373046875, 1.7298583984375, 1.807159423828125, 1.88446044921875, 1.961761474609375, 2.0390625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 9.0, 10.0, 13.0, 21.0, 23.0, 42.0, 63.0, 47.0, 57.0, 66.0, 91.0, 79.0, 71.0, 74.0, 72.0, 67.0, 50.0, 51.0, 24.0, 23.0, 16.0, 17.0, 8.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8017578125, -0.7738723754882812, -0.7459869384765625, -0.7181015014648438, -0.690216064453125, -0.6623306274414062, -0.6344451904296875, -0.6065597534179688, -0.57867431640625, -0.5507888793945312, -0.5229034423828125, -0.49501800537109375, -0.467132568359375, -0.43924713134765625, -0.4113616943359375, -0.38347625732421875, -0.3555908203125, -0.32770538330078125, -0.2998199462890625, -0.27193450927734375, -0.244049072265625, -0.21616363525390625, -0.1882781982421875, -0.16039276123046875, -0.13250732421875, -0.10462188720703125, -0.0767364501953125, -0.04885101318359375, -0.020965576171875, 0.00691986083984375, 0.0348052978515625, 0.06269073486328125, 0.090576171875, 0.11846160888671875, 0.1463470458984375, 0.17423248291015625, 0.202117919921875, 0.23000335693359375, 0.2578887939453125, 0.28577423095703125, 0.31365966796875, 0.34154510498046875, 0.3694305419921875, 0.39731597900390625, 0.425201416015625, 0.45308685302734375, 0.4809722900390625, 0.5088577270507812, 0.5367431640625, 0.5646286010742188, 0.5925140380859375, 0.6203994750976562, 0.648284912109375, 0.6761703491210938, 0.7040557861328125, 0.7319412231445312, 0.75982666015625, 0.7877120971679688, 0.8155975341796875, 0.8434829711914062, 0.871368408203125, 0.8992538452148438, 0.9271392822265625, 0.9550247192382812, 0.98291015625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 8.0, 7.0, 7.0, 18.0, 19.0, 22.0, 34.0, 40.0, 47.0, 63.0, 109.0, 142.0, 202.0, 326.0, 499.0, 767.0, 1414.0, 2720.0, 5815.0, 12791.0, 32042.0, 88579.0, 270901.0, 405095.0, 142006.0, 49492.0, 19112.0, 7883.0, 3725.0, 1865.0, 1009.0, 584.0, 387.0, 241.0, 155.0, 128.0, 75.0, 53.0, 43.0, 32.0, 21.0, 21.0, 13.0, 14.0, 9.0, 4.0, 5.0, 5.0, 1.0, 6.0, 3.0, 1.0, 1.0], "bins": [-1.5068359375, -1.462799072265625, -1.41876220703125, -1.374725341796875, -1.3306884765625, -1.286651611328125, -1.24261474609375, -1.198577880859375, -1.154541015625, -1.110504150390625, -1.06646728515625, -1.022430419921875, -0.9783935546875, -0.934356689453125, -0.89031982421875, -0.846282958984375, -0.80224609375, -0.758209228515625, -0.71417236328125, -0.670135498046875, -0.6260986328125, -0.582061767578125, -0.53802490234375, -0.493988037109375, -0.449951171875, -0.405914306640625, -0.36187744140625, -0.317840576171875, -0.2738037109375, -0.229766845703125, -0.18572998046875, -0.141693115234375, -0.09765625, -0.053619384765625, -0.00958251953125, 0.034454345703125, 0.0784912109375, 0.122528076171875, 0.16656494140625, 0.210601806640625, 0.254638671875, 0.298675537109375, 0.34271240234375, 0.386749267578125, 0.4307861328125, 0.474822998046875, 0.51885986328125, 0.562896728515625, 0.60693359375, 0.650970458984375, 0.69500732421875, 0.739044189453125, 0.7830810546875, 0.827117919921875, 0.87115478515625, 0.915191650390625, 0.959228515625, 1.003265380859375, 1.04730224609375, 1.091339111328125, 1.1353759765625, 1.179412841796875, 1.22344970703125, 1.267486572265625, 1.3115234375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 3.0, 8.0, 7.0, 10.0, 9.0, 16.0, 16.0, 30.0, 44.0, 54.0, 42.0, 48.0, 52.0, 57.0, 71.0, 62.0, 61.0, 60.0, 56.0, 48.0, 49.0, 55.0, 31.0, 23.0, 23.0, 16.0, 16.0, 12.0, 8.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.84765625, -1.784912109375, -1.72216796875, -1.659423828125, -1.5966796875, -1.533935546875, -1.47119140625, -1.408447265625, -1.345703125, -1.282958984375, -1.22021484375, -1.157470703125, -1.0947265625, -1.031982421875, -0.96923828125, -0.906494140625, -0.84375, -0.781005859375, -0.71826171875, -0.655517578125, -0.5927734375, -0.530029296875, -0.46728515625, -0.404541015625, -0.341796875, -0.279052734375, -0.21630859375, -0.153564453125, -0.0908203125, -0.028076171875, 0.03466796875, 0.097412109375, 0.16015625, 0.222900390625, 0.28564453125, 0.348388671875, 0.4111328125, 0.473876953125, 0.53662109375, 0.599365234375, 0.662109375, 0.724853515625, 0.78759765625, 0.850341796875, 0.9130859375, 0.975830078125, 1.03857421875, 1.101318359375, 1.1640625, 1.226806640625, 1.28955078125, 1.352294921875, 1.4150390625, 1.477783203125, 1.54052734375, 1.603271484375, 1.666015625, 1.728759765625, 1.79150390625, 1.854248046875, 1.9169921875, 1.979736328125, 2.04248046875, 2.105224609375, 2.16796875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 9.0, 6.0, 17.0, 22.0, 26.0, 31.0, 66.0, 99.0, 123.0, 189.0, 301.0, 465.0, 686.0, 1023.0, 1559.0, 2493.0, 3952.0, 7101.0, 14338.0, 38297.0, 250244.0, 607441.0, 75591.0, 21148.0, 9669.0, 5141.0, 3076.0, 1839.0, 1189.0, 802.0, 491.0, 364.0, 242.0, 166.0, 109.0, 74.0, 46.0, 33.0, 27.0, 19.0, 10.0, 11.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.638671875, -0.6182174682617188, -0.5977630615234375, -0.5773086547851562, -0.556854248046875, -0.5363998413085938, -0.5159454345703125, -0.49549102783203125, -0.47503662109375, -0.45458221435546875, -0.4341278076171875, -0.41367340087890625, -0.393218994140625, -0.37276458740234375, -0.3523101806640625, -0.33185577392578125, -0.3114013671875, -0.29094696044921875, -0.2704925537109375, -0.25003814697265625, -0.229583740234375, -0.20912933349609375, -0.1886749267578125, -0.16822052001953125, -0.14776611328125, -0.12731170654296875, -0.1068572998046875, -0.08640289306640625, -0.065948486328125, -0.04549407958984375, -0.0250396728515625, -0.00458526611328125, 0.015869140625, 0.03632354736328125, 0.0567779541015625, 0.07723236083984375, 0.097686767578125, 0.11814117431640625, 0.1385955810546875, 0.15904998779296875, 0.17950439453125, 0.19995880126953125, 0.2204132080078125, 0.24086761474609375, 0.261322021484375, 0.28177642822265625, 0.3022308349609375, 0.32268524169921875, 0.3431396484375, 0.36359405517578125, 0.3840484619140625, 0.40450286865234375, 0.424957275390625, 0.44541168212890625, 0.4658660888671875, 0.48632049560546875, 0.50677490234375, 0.5272293090820312, 0.5476837158203125, 0.5681381225585938, 0.588592529296875, 0.6090469360351562, 0.6295013427734375, 0.6499557495117188, 0.67041015625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 7.0, 12.0, 16.0, 33.0, 59.0, 180.0, 347.0, 181.0, 58.0, 23.0, 18.0, 12.0, 14.0, 9.0, 5.0, 3.0, 6.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00036334991455078125, -0.0003501586616039276, -0.000336967408657074, -0.00032377615571022034, -0.0003105849027633667, -0.00029739364981651306, -0.0002842023968696594, -0.0002710111439228058, -0.00025781989097595215, -0.0002446286380290985, -0.00023143738508224487, -0.00021824613213539124, -0.0002050548791885376, -0.00019186362624168396, -0.00017867237329483032, -0.00016548112034797668, -0.00015228986740112305, -0.0001390986144542694, -0.00012590736150741577, -0.00011271610856056213, -9.95248556137085e-05, -8.633360266685486e-05, -7.314234972000122e-05, -5.995109677314758e-05, -4.6759843826293945e-05, -3.356859087944031e-05, -2.037733793258667e-05, -7.186084985733032e-06, 6.0051679611206055e-06, 1.9196420907974243e-05, 3.238767385482788e-05, 4.557892680168152e-05, 5.8770179748535156e-05, 7.19614326953888e-05, 8.515268564224243e-05, 9.834393858909607e-05, 0.00011153519153594971, 0.00012472644448280334, 0.00013791769742965698, 0.00015110895037651062, 0.00016430020332336426, 0.0001774914562702179, 0.00019068270921707153, 0.00020387396216392517, 0.0002170652151107788, 0.00023025646805763245, 0.00024344772100448608, 0.0002566389739513397, 0.00026983022689819336, 0.000283021479845047, 0.00029621273279190063, 0.00030940398573875427, 0.0003225952386856079, 0.00033578649163246155, 0.0003489777445793152, 0.0003621689975261688, 0.00037536025047302246, 0.0003885515034198761, 0.00040174275636672974, 0.0004149340093135834, 0.000428125262260437, 0.00044131651520729065, 0.0004545077681541443, 0.0004676990211009979, 0.00048089027404785156]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 9.0, 12.0, 11.0, 13.0, 24.0, 30.0, 53.0, 51.0, 76.0, 138.0, 175.0, 272.0, 377.0, 618.0, 970.0, 1523.0, 2647.0, 4643.0, 8915.0, 19342.0, 53765.0, 291412.0, 520029.0, 90759.0, 27056.0, 11382.0, 5938.0, 3204.0, 1899.0, 1129.0, 680.0, 434.0, 292.0, 220.0, 134.0, 99.0, 64.0, 38.0, 32.0, 32.0, 11.0, 16.0, 15.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.6806640625, -0.6607513427734375, -0.640838623046875, -0.6209259033203125, -0.60101318359375, -0.5811004638671875, -0.561187744140625, -0.5412750244140625, -0.5213623046875, -0.5014495849609375, -0.481536865234375, -0.4616241455078125, -0.44171142578125, -0.4217987060546875, -0.401885986328125, -0.3819732666015625, -0.362060546875, -0.3421478271484375, -0.322235107421875, -0.3023223876953125, -0.28240966796875, -0.2624969482421875, -0.242584228515625, -0.2226715087890625, -0.2027587890625, -0.1828460693359375, -0.162933349609375, -0.1430206298828125, -0.12310791015625, -0.1031951904296875, -0.083282470703125, -0.0633697509765625, -0.04345703125, -0.0235443115234375, -0.003631591796875, 0.0162811279296875, 0.03619384765625, 0.0561065673828125, 0.076019287109375, 0.0959320068359375, 0.1158447265625, 0.1357574462890625, 0.155670166015625, 0.1755828857421875, 0.19549560546875, 0.2154083251953125, 0.235321044921875, 0.2552337646484375, 0.275146484375, 0.2950592041015625, 0.314971923828125, 0.3348846435546875, 0.35479736328125, 0.3747100830078125, 0.394622802734375, 0.4145355224609375, 0.4344482421875, 0.4543609619140625, 0.474273681640625, 0.4941864013671875, 0.51409912109375, 0.5340118408203125, 0.553924560546875, 0.5738372802734375, 0.59375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 6.0, 8.0, 12.0, 12.0, 24.0, 26.0, 49.0, 62.0, 114.0, 127.0, 139.0, 125.0, 102.0, 52.0, 38.0, 28.0, 14.0, 10.0, 8.0, 7.0, 11.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60791015625, -0.5857467651367188, -0.5635833740234375, -0.5414199829101562, -0.519256591796875, -0.49709320068359375, -0.4749298095703125, -0.45276641845703125, -0.43060302734375, -0.40843963623046875, -0.3862762451171875, -0.36411285400390625, -0.341949462890625, -0.31978607177734375, -0.2976226806640625, -0.27545928955078125, -0.2532958984375, -0.23113250732421875, -0.2089691162109375, -0.18680572509765625, -0.164642333984375, -0.14247894287109375, -0.1203155517578125, -0.09815216064453125, -0.07598876953125, -0.05382537841796875, -0.0316619873046875, -0.00949859619140625, 0.012664794921875, 0.03482818603515625, 0.0569915771484375, 0.07915496826171875, 0.101318359375, 0.12348175048828125, 0.1456451416015625, 0.16780853271484375, 0.189971923828125, 0.21213531494140625, 0.2342987060546875, 0.25646209716796875, 0.27862548828125, 0.30078887939453125, 0.3229522705078125, 0.34511566162109375, 0.367279052734375, 0.38944244384765625, 0.4116058349609375, 0.43376922607421875, 0.4559326171875, 0.47809600830078125, 0.5002593994140625, 0.5224227905273438, 0.544586181640625, 0.5667495727539062, 0.5889129638671875, 0.6110763549804688, 0.63323974609375, 0.6554031372070312, 0.6775665283203125, 0.6997299194335938, 0.721893310546875, 0.7440567016601562, 0.7662200927734375, 0.7883834838867188, 0.810546875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 12.0, 49.0, 105.0, 252.0, 293.0, 181.0, 59.0, 28.0, 10.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.694486618041992, -10.139517784118652, -9.584548950195312, -9.029580116271973, -8.474611282348633, -7.919642448425293, -7.364673614501953, -6.809704780578613, -6.254735946655273, -5.699767112731934, -5.144798278808594, -4.589829444885254, -4.034860610961914, -3.479891777038574, -2.9249229431152344, -2.3699541091918945, -1.8149852752685547, -1.2600164413452148, -0.705047607421875, -0.15007877349853516, 0.4048900604248047, 0.9598588943481445, 1.5148277282714844, 2.069796562194824, 2.624765396118164, 3.179734230041504, 3.7347030639648438, 4.289671897888184, 4.844640731811523, 5.399609565734863, 5.954578399658203, 6.509547233581543, 7.064516067504883, 7.619484901428223, 8.174453735351562, 8.729422569274902, 9.284391403198242, 9.839360237121582, 10.394329071044922, 10.949297904968262, 11.504266738891602, 12.059235572814941, 12.614204406738281, 13.169173240661621, 13.724142074584961, 14.2791109085083, 14.83407974243164, 15.38904857635498, 15.94401741027832, 16.498985290527344, 17.053955078125, 17.608924865722656, 18.16389274597168, 18.718860626220703, 19.27383041381836, 19.828800201416016, 20.38376808166504, 20.938735961914062, 21.49370574951172, 22.048675537109375, 22.6036434173584, 23.158611297607422, 23.713581085205078, 24.268550872802734, 24.823518753051758]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 5.0, 3.0, 5.0, 7.0, 11.0, 13.0, 5.0, 18.0, 15.0, 16.0, 17.0, 21.0, 24.0, 34.0, 36.0, 41.0, 42.0, 34.0, 39.0, 40.0, 47.0, 56.0, 45.0, 38.0, 42.0, 37.0, 31.0, 42.0, 24.0, 30.0, 39.0, 28.0, 22.0, 24.0, 13.0, 11.0, 15.0, 9.0, 6.0, 5.0, 5.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4646596908569336, -3.354400634765625, -3.2441413402557373, -3.1338822841644287, -3.023622989654541, -2.9133639335632324, -2.803104877471924, -2.6928458213806152, -2.5825865268707275, -2.472327470779419, -2.3620681762695312, -2.2518091201782227, -2.141550064086914, -2.0312907695770264, -1.9210317134857178, -1.8107725381851196, -1.7005133628845215, -1.5902541875839233, -1.4799950122833252, -1.3697359561920166, -1.2594767808914185, -1.1492176055908203, -1.0389585494995117, -0.9286993741989136, -0.8184401988983154, -0.7081810235977173, -0.5979219079017639, -0.48766276240348816, -0.3774036169052124, -0.26714444160461426, -0.1568853259086609, -0.04662621021270752, 0.06363296508789062, 0.17389211058616638, 0.28415125608444214, 0.3944104015827179, 0.5046695470809937, 0.6149287223815918, 0.7251878380775452, 0.8354469537734985, 0.9457061290740967, 1.0559653043746948, 1.166224479675293, 1.2764835357666016, 1.3867427110671997, 1.4970018863677979, 1.6072609424591064, 1.7175201177597046, 1.8277792930603027, 1.9380384683609009, 2.048297643661499, 2.1585566997528076, 2.2688159942626953, 2.379075050354004, 2.4893341064453125, 2.599593162536621, 2.709852457046509, 2.8201115131378174, 2.930370807647705, 3.0406298637390137, 3.1508889198303223, 3.26114821434021, 3.3714072704315186, 3.4816665649414062, 3.591925621032715]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 7.0, 4.0, 4.0, 9.0, 10.0, 16.0, 18.0, 30.0, 51.0, 63.0, 103.0, 175.0, 302.0, 617.0, 1209.0, 2440.0, 5892.0, 19214.0, 168594.0, 3451813.0, 496840.0, 32747.0, 7953.0, 3130.0, 1408.0, 709.0, 362.0, 214.0, 134.0, 66.0, 52.0, 29.0, 22.0, 15.0, 11.0, 6.0, 6.0, 2.0, 5.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.27734375, -2.20965576171875, -2.1419677734375, -2.07427978515625, -2.006591796875, -1.93890380859375, -1.8712158203125, -1.80352783203125, -1.73583984375, -1.66815185546875, -1.6004638671875, -1.53277587890625, -1.465087890625, -1.39739990234375, -1.3297119140625, -1.26202392578125, -1.1943359375, -1.12664794921875, -1.0589599609375, -0.99127197265625, -0.923583984375, -0.85589599609375, -0.7882080078125, -0.72052001953125, -0.65283203125, -0.58514404296875, -0.5174560546875, -0.44976806640625, -0.382080078125, -0.31439208984375, -0.2467041015625, -0.17901611328125, -0.111328125, -0.04364013671875, 0.0240478515625, 0.09173583984375, 0.159423828125, 0.22711181640625, 0.2947998046875, 0.36248779296875, 0.43017578125, 0.49786376953125, 0.5655517578125, 0.63323974609375, 0.700927734375, 0.76861572265625, 0.8363037109375, 0.90399169921875, 0.9716796875, 1.03936767578125, 1.1070556640625, 1.17474365234375, 1.242431640625, 1.31011962890625, 1.3778076171875, 1.44549560546875, 1.51318359375, 1.58087158203125, 1.6485595703125, 1.71624755859375, 1.783935546875, 1.85162353515625, 1.9193115234375, 1.98699951171875, 2.0546875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 6.0, 6.0, 17.0, 17.0, 15.0, 20.0, 25.0, 30.0, 38.0, 39.0, 48.0, 54.0, 49.0, 64.0, 61.0, 68.0, 72.0, 50.0, 55.0, 53.0, 39.0, 44.0, 36.0, 20.0, 21.0, 13.0, 10.0, 10.0, 10.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.66943359375, -0.6476058959960938, -0.6257781982421875, -0.6039505004882812, -0.582122802734375, -0.5602951049804688, -0.5384674072265625, -0.5166397094726562, -0.49481201171875, -0.47298431396484375, -0.4511566162109375, -0.42932891845703125, -0.407501220703125, -0.38567352294921875, -0.3638458251953125, -0.34201812744140625, -0.3201904296875, -0.29836273193359375, -0.2765350341796875, -0.25470733642578125, -0.232879638671875, -0.21105194091796875, -0.1892242431640625, -0.16739654541015625, -0.14556884765625, -0.12374114990234375, -0.1019134521484375, -0.08008575439453125, -0.058258056640625, -0.03643035888671875, -0.0146026611328125, 0.00722503662109375, 0.029052734375, 0.05088043212890625, 0.0727081298828125, 0.09453582763671875, 0.116363525390625, 0.13819122314453125, 0.1600189208984375, 0.18184661865234375, 0.20367431640625, 0.22550201416015625, 0.2473297119140625, 0.26915740966796875, 0.290985107421875, 0.31281280517578125, 0.3346405029296875, 0.35646820068359375, 0.3782958984375, 0.40012359619140625, 0.4219512939453125, 0.44377899169921875, 0.465606689453125, 0.48743438720703125, 0.5092620849609375, 0.5310897827148438, 0.55291748046875, 0.5747451782226562, 0.5965728759765625, 0.6184005737304688, 0.640228271484375, 0.6620559692382812, 0.6838836669921875, 0.7057113647460938, 0.7275390625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 5.0, 4.0, 6.0, 9.0, 11.0, 16.0, 22.0, 19.0, 30.0, 64.0, 67.0, 91.0, 152.0, 175.0, 295.0, 483.0, 999.0, 2389.0, 7920.0, 53808.0, 3906847.0, 199558.0, 14646.0, 3635.0, 1278.0, 608.0, 338.0, 261.0, 152.0, 121.0, 76.0, 44.0, 36.0, 32.0, 16.0, 15.0, 9.0, 10.0, 14.0, 5.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.18359375, -3.0726318359375, -2.961669921875, -2.8507080078125, -2.73974609375, -2.6287841796875, -2.517822265625, -2.4068603515625, -2.2958984375, -2.1849365234375, -2.073974609375, -1.9630126953125, -1.85205078125, -1.7410888671875, -1.630126953125, -1.5191650390625, -1.408203125, -1.2972412109375, -1.186279296875, -1.0753173828125, -0.96435546875, -0.8533935546875, -0.742431640625, -0.6314697265625, -0.5205078125, -0.4095458984375, -0.298583984375, -0.1876220703125, -0.07666015625, 0.0343017578125, 0.145263671875, 0.2562255859375, 0.3671875, 0.4781494140625, 0.589111328125, 0.7000732421875, 0.81103515625, 0.9219970703125, 1.032958984375, 1.1439208984375, 1.2548828125, 1.3658447265625, 1.476806640625, 1.5877685546875, 1.69873046875, 1.8096923828125, 1.920654296875, 2.0316162109375, 2.142578125, 2.2535400390625, 2.364501953125, 2.4754638671875, 2.58642578125, 2.6973876953125, 2.808349609375, 2.9193115234375, 3.0302734375, 3.1412353515625, 3.252197265625, 3.3631591796875, 3.47412109375, 3.5850830078125, 3.696044921875, 3.8070068359375, 3.91796875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 5.0, 11.0, 16.0, 24.0, 59.0, 117.0, 406.0, 2034.0, 1068.0, 183.0, 85.0, 29.0, 18.0, 11.0, 8.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.419921875, -2.308746337890625, -2.19757080078125, -2.086395263671875, -1.9752197265625, -1.864044189453125, -1.75286865234375, -1.641693115234375, -1.530517578125, -1.419342041015625, -1.30816650390625, -1.196990966796875, -1.0858154296875, -0.974639892578125, -0.86346435546875, -0.752288818359375, -0.64111328125, -0.529937744140625, -0.41876220703125, -0.307586669921875, -0.1964111328125, -0.085235595703125, 0.02593994140625, 0.137115478515625, 0.248291015625, 0.359466552734375, 0.47064208984375, 0.581817626953125, 0.6929931640625, 0.804168701171875, 0.91534423828125, 1.026519775390625, 1.1376953125, 1.248870849609375, 1.36004638671875, 1.471221923828125, 1.5823974609375, 1.693572998046875, 1.80474853515625, 1.915924072265625, 2.027099609375, 2.138275146484375, 2.24945068359375, 2.360626220703125, 2.4718017578125, 2.582977294921875, 2.69415283203125, 2.805328369140625, 2.91650390625, 3.027679443359375, 3.13885498046875, 3.250030517578125, 3.3612060546875, 3.472381591796875, 3.58355712890625, 3.694732666015625, 3.805908203125, 3.917083740234375, 4.02825927734375, 4.139434814453125, 4.2506103515625, 4.361785888671875, 4.47296142578125, 4.584136962890625, 4.6953125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 5.0, 18.0, 57.0, 147.0, 354.0, 265.0, 95.0, 28.0, 12.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.45159912109375, -13.785301208496094, -13.119003295898438, -12.452705383300781, -11.786407470703125, -11.120109558105469, -10.453812599182129, -9.787514686584473, -9.121216773986816, -8.45491886138916, -7.788620948791504, -7.122323513031006, -6.45602560043335, -5.789727687835693, -5.123430252075195, -4.457132339477539, -3.790834426879883, -3.1245365142822266, -2.4582388401031494, -1.7919410467147827, -1.125643253326416, -0.45934534072875977, 0.20695233345031738, 0.8732500076293945, 1.5395479202270508, 2.205845832824707, 2.872143507003784, 3.5384411811828613, 4.204739093780518, 4.871037006378174, 5.537334442138672, 6.203632354736328, 6.869932174682617, 7.536230087280273, 8.20252799987793, 8.868825912475586, 9.535123825073242, 10.201421737670898, 10.867718696594238, 11.534016609191895, 12.20031452178955, 12.866612434387207, 13.532910346984863, 14.19920825958252, 14.86550521850586, 15.531803131103516, 16.198101043701172, 16.864398956298828, 17.530696868896484, 18.19699478149414, 18.863292694091797, 19.529590606689453, 20.19588851928711, 20.862186431884766, 21.528484344482422, 22.194782257080078, 22.861080169677734, 23.52737808227539, 24.193675994873047, 24.859973907470703, 25.52627182006836, 26.192569732666016, 26.858867645263672, 27.525165557861328, 28.19146156311035]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 10.0, 14.0, 19.0, 20.0, 26.0, 62.0, 58.0, 61.0, 77.0, 71.0, 91.0, 92.0, 62.0, 80.0, 60.0, 39.0, 44.0, 40.0, 26.0, 10.0, 9.0, 5.0, 8.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.151947498321533, -4.938779830932617, -4.725612163543701, -4.512444496154785, -4.299277305603027, -4.086109638214111, -3.8729419708251953, -3.6597743034362793, -3.4466068744659424, -3.2334392070770264, -3.0202717781066895, -2.8071041107177734, -2.5939364433288574, -2.3807690143585205, -2.1676013469696045, -1.954433798789978, -1.7412662506103516, -1.528098702430725, -1.3149311542510986, -1.1017634868621826, -0.8885959386825562, -0.6754283905029297, -0.46226072311401367, -0.2490931749343872, -0.03592562675476074, 0.1772419512271881, 0.39040952920913696, 0.6035771369934082, 0.8167446851730347, 1.0299122333526611, 1.2430799007415771, 1.4562474489212036, 1.6694145202636719, 1.8825820684432983, 2.095749616622925, 2.308917284011841, 2.5220847129821777, 2.7352523803710938, 2.9484200477600098, 3.161587715148926, 3.3747551441192627, 3.5879228115081787, 3.8010902404785156, 4.014257907867432, 4.227425575256348, 4.4405927658081055, 4.65376091003418, 4.8669281005859375, 5.0800957679748535, 5.2932634353637695, 5.5064311027526855, 5.719598770141602, 5.932765960693359, 6.145933628082275, 6.359101295471191, 6.572268962860107, 6.785436630249023, 6.9986042976379395, 7.2117719650268555, 7.424939155578613, 7.638106822967529, 7.851274490356445, 8.064441680908203, 8.277609825134277, 8.490777015686035]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 8.0, 15.0, 27.0, 33.0, 78.0, 105.0, 191.0, 384.0, 861.0, 2197.0, 7454.0, 31293.0, 200636.0, 660264.0, 116049.0, 20496.0, 5282.0, 1691.0, 715.0, 344.0, 191.0, 96.0, 47.0, 29.0, 25.0, 13.0, 8.0, 4.0, 4.0, 4.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.74609375, -2.652587890625, -2.55908203125, -2.465576171875, -2.3720703125, -2.278564453125, -2.18505859375, -2.091552734375, -1.998046875, -1.904541015625, -1.81103515625, -1.717529296875, -1.6240234375, -1.530517578125, -1.43701171875, -1.343505859375, -1.25, -1.156494140625, -1.06298828125, -0.969482421875, -0.8759765625, -0.782470703125, -0.68896484375, -0.595458984375, -0.501953125, -0.408447265625, -0.31494140625, -0.221435546875, -0.1279296875, -0.034423828125, 0.05908203125, 0.152587890625, 0.24609375, 0.339599609375, 0.43310546875, 0.526611328125, 0.6201171875, 0.713623046875, 0.80712890625, 0.900634765625, 0.994140625, 1.087646484375, 1.18115234375, 1.274658203125, 1.3681640625, 1.461669921875, 1.55517578125, 1.648681640625, 1.7421875, 1.835693359375, 1.92919921875, 2.022705078125, 2.1162109375, 2.209716796875, 2.30322265625, 2.396728515625, 2.490234375, 2.583740234375, 2.67724609375, 2.770751953125, 2.8642578125, 2.957763671875, 3.05126953125, 3.144775390625, 3.23828125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 7.0, 14.0, 7.0, 20.0, 18.0, 30.0, 27.0, 40.0, 60.0, 55.0, 72.0, 64.0, 62.0, 69.0, 78.0, 53.0, 67.0, 40.0, 45.0, 39.0, 35.0, 22.0, 16.0, 19.0, 20.0, 6.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.05078125, -1.0198745727539062, -0.9889678955078125, -0.9580612182617188, -0.927154541015625, -0.8962478637695312, -0.8653411865234375, -0.8344345092773438, -0.80352783203125, -0.7726211547851562, -0.7417144775390625, -0.7108078002929688, -0.679901123046875, -0.6489944458007812, -0.6180877685546875, -0.5871810913085938, -0.5562744140625, -0.5253677368164062, -0.4944610595703125, -0.46355438232421875, -0.432647705078125, -0.40174102783203125, -0.3708343505859375, -0.33992767333984375, -0.30902099609375, -0.27811431884765625, -0.2472076416015625, -0.21630096435546875, -0.185394287109375, -0.15448760986328125, -0.1235809326171875, -0.09267425537109375, -0.061767578125, -0.03086090087890625, 4.57763671875e-05, 0.03095245361328125, 0.061859130859375, 0.09276580810546875, 0.1236724853515625, 0.15457916259765625, 0.18548583984375, 0.21639251708984375, 0.2472991943359375, 0.27820587158203125, 0.309112548828125, 0.34001922607421875, 0.3709259033203125, 0.40183258056640625, 0.4327392578125, 0.46364593505859375, 0.4945526123046875, 0.5254592895507812, 0.556365966796875, 0.5872726440429688, 0.6181793212890625, 0.6490859985351562, 0.67999267578125, 0.7108993530273438, 0.7418060302734375, 0.7727127075195312, 0.803619384765625, 0.8345260620117188, 0.8654327392578125, 0.8963394165039062, 0.92724609375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 9.0, 14.0, 16.0, 30.0, 29.0, 46.0, 62.0, 100.0, 114.0, 171.0, 300.0, 517.0, 1059.0, 2752.0, 9959.0, 49026.0, 409842.0, 501170.0, 56585.0, 11019.0, 3138.0, 1172.0, 533.0, 273.0, 179.0, 122.0, 76.0, 59.0, 60.0, 32.0, 23.0, 17.0, 15.0, 9.0, 7.0, 7.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.24609375, -2.16302490234375, -2.0799560546875, -1.99688720703125, -1.913818359375, -1.83074951171875, -1.7476806640625, -1.66461181640625, -1.58154296875, -1.49847412109375, -1.4154052734375, -1.33233642578125, -1.249267578125, -1.16619873046875, -1.0831298828125, -1.00006103515625, -0.9169921875, -0.83392333984375, -0.7508544921875, -0.66778564453125, -0.584716796875, -0.50164794921875, -0.4185791015625, -0.33551025390625, -0.25244140625, -0.16937255859375, -0.0863037109375, -0.00323486328125, 0.079833984375, 0.16290283203125, 0.2459716796875, 0.32904052734375, 0.412109375, 0.49517822265625, 0.5782470703125, 0.66131591796875, 0.744384765625, 0.82745361328125, 0.9105224609375, 0.99359130859375, 1.07666015625, 1.15972900390625, 1.2427978515625, 1.32586669921875, 1.408935546875, 1.49200439453125, 1.5750732421875, 1.65814208984375, 1.7412109375, 1.82427978515625, 1.9073486328125, 1.99041748046875, 2.073486328125, 2.15655517578125, 2.2396240234375, 2.32269287109375, 2.40576171875, 2.48883056640625, 2.5718994140625, 2.65496826171875, 2.738037109375, 2.82110595703125, 2.9041748046875, 2.98724365234375, 3.0703125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 10.0, 19.0, 18.0, 46.0, 51.0, 88.0, 97.0, 103.0, 136.0, 109.0, 106.0, 85.0, 58.0, 30.0, 22.0, 12.0, 7.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.953125, -4.809326171875, -4.66552734375, -4.521728515625, -4.3779296875, -4.234130859375, -4.09033203125, -3.946533203125, -3.802734375, -3.658935546875, -3.51513671875, -3.371337890625, -3.2275390625, -3.083740234375, -2.93994140625, -2.796142578125, -2.65234375, -2.508544921875, -2.36474609375, -2.220947265625, -2.0771484375, -1.933349609375, -1.78955078125, -1.645751953125, -1.501953125, -1.358154296875, -1.21435546875, -1.070556640625, -0.9267578125, -0.782958984375, -0.63916015625, -0.495361328125, -0.3515625, -0.207763671875, -0.06396484375, 0.079833984375, 0.2236328125, 0.367431640625, 0.51123046875, 0.655029296875, 0.798828125, 0.942626953125, 1.08642578125, 1.230224609375, 1.3740234375, 1.517822265625, 1.66162109375, 1.805419921875, 1.94921875, 2.093017578125, 2.23681640625, 2.380615234375, 2.5244140625, 2.668212890625, 2.81201171875, 2.955810546875, 3.099609375, 3.243408203125, 3.38720703125, 3.531005859375, 3.6748046875, 3.818603515625, 3.96240234375, 4.106201171875, 4.25]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 7.0, 17.0, 18.0, 28.0, 47.0, 69.0, 118.0, 202.0, 343.0, 621.0, 1119.0, 2084.0, 4445.0, 11107.0, 36431.0, 201008.0, 630648.0, 118889.0, 25211.0, 8611.0, 3597.0, 1745.0, 893.0, 505.0, 329.0, 181.0, 115.0, 68.0, 42.0, 21.0, 8.0, 12.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.464111328125, -0.4483070373535156, -0.43250274658203125, -0.4166984558105469, -0.4008941650390625, -0.3850898742675781, -0.36928558349609375, -0.3534812927246094, -0.337677001953125, -0.3218727111816406, -0.30606842041015625, -0.2902641296386719, -0.2744598388671875, -0.2586555480957031, -0.24285125732421875, -0.22704696655273438, -0.21124267578125, -0.19543838500976562, -0.17963409423828125, -0.16382980346679688, -0.1480255126953125, -0.13222122192382812, -0.11641693115234375, -0.10061264038085938, -0.084808349609375, -0.06900405883789062, -0.05319976806640625, -0.037395477294921875, -0.0215911865234375, -0.005786895751953125, 0.01001739501953125, 0.025821685791015625, 0.0416259765625, 0.057430267333984375, 0.07323455810546875, 0.08903884887695312, 0.1048431396484375, 0.12064743041992188, 0.13645172119140625, 0.15225601196289062, 0.168060302734375, 0.18386459350585938, 0.19966888427734375, 0.21547317504882812, 0.2312774658203125, 0.24708175659179688, 0.26288604736328125, 0.2786903381347656, 0.29449462890625, 0.3102989196777344, 0.32610321044921875, 0.3419075012207031, 0.3577117919921875, 0.3735160827636719, 0.38932037353515625, 0.4051246643066406, 0.420928955078125, 0.4367332458496094, 0.45253753662109375, 0.4683418273925781, 0.4841461181640625, 0.4999504089355469, 0.5157546997070312, 0.5315589904785156, 0.54736328125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 2.0, 5.0, 8.0, 17.0, 20.0, 28.0, 34.0, 50.0, 91.0, 108.0, 146.0, 164.0, 97.0, 68.0, 43.0, 32.0, 21.0, 13.0, 9.0, 12.0, 2.0, 3.0, 8.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012755393981933594, -0.0001221913844347, -0.00011682882905006409, -0.00011146627366542816, -0.00010610371828079224, -0.00010074116289615631, -9.537860751152039e-05, -9.001605212688446e-05, -8.465349674224854e-05, -7.929094135761261e-05, -7.392838597297668e-05, -6.856583058834076e-05, -6.320327520370483e-05, -5.784071981906891e-05, -5.2478164434432983e-05, -4.711560904979706e-05, -4.175305366516113e-05, -3.639049828052521e-05, -3.102794289588928e-05, -2.5665387511253357e-05, -2.030283212661743e-05, -1.4940276741981506e-05, -9.577721357345581e-06, -4.215165972709656e-06, 1.1473894119262695e-06, 6.509944796562195e-06, 1.187250018119812e-05, 1.7235055565834045e-05, 2.259761095046997e-05, 2.7960166335105896e-05, 3.332272171974182e-05, 3.8685277104377747e-05, 4.404783248901367e-05, 4.94103878736496e-05, 5.477294325828552e-05, 6.013549864292145e-05, 6.549805402755737e-05, 7.08606094121933e-05, 7.622316479682922e-05, 8.158572018146515e-05, 8.694827556610107e-05, 9.2310830950737e-05, 9.767338633537292e-05, 0.00010303594172000885, 0.00010839849710464478, 0.0001137610524892807, 0.00011912360787391663, 0.00012448616325855255, 0.00012984871864318848, 0.0001352112740278244, 0.00014057382941246033, 0.00014593638479709625, 0.00015129894018173218, 0.0001566614955663681, 0.00016202405095100403, 0.00016738660633563995, 0.00017274916172027588, 0.0001781117171049118, 0.00018347427248954773, 0.00018883682787418365, 0.00019419938325881958, 0.0001995619386434555, 0.00020492449402809143, 0.00021028704941272736, 0.00021564960479736328]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 8.0, 12.0, 11.0, 19.0, 35.0, 46.0, 56.0, 112.0, 147.0, 243.0, 419.0, 669.0, 1219.0, 2086.0, 3927.0, 8386.0, 21326.0, 87995.0, 571241.0, 276986.0, 46325.0, 14152.0, 6018.0, 2988.0, 1677.0, 953.0, 580.0, 319.0, 228.0, 142.0, 81.0, 48.0, 24.0, 16.0, 24.0, 14.0, 10.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.439697265625, -0.4238777160644531, -0.40805816650390625, -0.3922386169433594, -0.3764190673828125, -0.3605995178222656, -0.34477996826171875, -0.3289604187011719, -0.313140869140625, -0.2973213195800781, -0.28150177001953125, -0.2656822204589844, -0.2498626708984375, -0.23404312133789062, -0.21822357177734375, -0.20240402221679688, -0.18658447265625, -0.17076492309570312, -0.15494537353515625, -0.13912582397460938, -0.1233062744140625, -0.10748672485351562, -0.09166717529296875, -0.07584762573242188, -0.060028076171875, -0.044208526611328125, -0.02838897705078125, -0.012569427490234375, 0.0032501220703125, 0.019069671630859375, 0.03488922119140625, 0.050708770751953125, 0.0665283203125, 0.08234786987304688, 0.09816741943359375, 0.11398696899414062, 0.1298065185546875, 0.14562606811523438, 0.16144561767578125, 0.17726516723632812, 0.193084716796875, 0.20890426635742188, 0.22472381591796875, 0.24054336547851562, 0.2563629150390625, 0.2721824645996094, 0.28800201416015625, 0.3038215637207031, 0.31964111328125, 0.3354606628417969, 0.35128021240234375, 0.3670997619628906, 0.3829193115234375, 0.3987388610839844, 0.41455841064453125, 0.4303779602050781, 0.446197509765625, 0.4620170593261719, 0.47783660888671875, 0.4936561584472656, 0.5094757080078125, 0.5252952575683594, 0.5411148071289062, 0.5569343566894531, 0.57275390625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 3.0, 3.0, 6.0, 2.0, 6.0, 11.0, 8.0, 21.0, 29.0, 26.0, 47.0, 84.0, 76.0, 102.0, 111.0, 101.0, 84.0, 78.0, 43.0, 41.0, 24.0, 22.0, 18.0, 12.0, 15.0, 8.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.451171875, -0.4363441467285156, -0.42151641845703125, -0.4066886901855469, -0.3918609619140625, -0.3770332336425781, -0.36220550537109375, -0.3473777770996094, -0.332550048828125, -0.3177223205566406, -0.30289459228515625, -0.2880668640136719, -0.2732391357421875, -0.2584114074707031, -0.24358367919921875, -0.22875595092773438, -0.21392822265625, -0.19910049438476562, -0.18427276611328125, -0.16944503784179688, -0.1546173095703125, -0.13978958129882812, -0.12496185302734375, -0.11013412475585938, -0.095306396484375, -0.08047866821289062, -0.06565093994140625, -0.050823211669921875, -0.0359954833984375, -0.021167755126953125, -0.00634002685546875, 0.008487701416015625, 0.0233154296875, 0.038143157958984375, 0.05297088623046875, 0.06779861450195312, 0.0826263427734375, 0.09745407104492188, 0.11228179931640625, 0.12710952758789062, 0.141937255859375, 0.15676498413085938, 0.17159271240234375, 0.18642044067382812, 0.2012481689453125, 0.21607589721679688, 0.23090362548828125, 0.24573135375976562, 0.26055908203125, 0.2753868103027344, 0.29021453857421875, 0.3050422668457031, 0.3198699951171875, 0.3346977233886719, 0.34952545166015625, 0.3643531799316406, 0.379180908203125, 0.3940086364746094, 0.40883636474609375, 0.4236640930175781, 0.4384918212890625, 0.4533195495605469, 0.46814727783203125, 0.4829750061035156, 0.497802734375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 8.0, 7.0, 20.0, 43.0, 87.0, 158.0, 254.0, 211.0, 108.0, 48.0, 30.0, 10.0, 5.0, 6.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-14.735250473022461, -14.3345308303833, -13.933810234069824, -13.533090591430664, -13.132369995117188, -12.731650352478027, -12.330930709838867, -11.93021011352539, -11.529489517211914, -11.128769874572754, -10.728049278259277, -10.327329635620117, -9.92660903930664, -9.52588939666748, -9.12516975402832, -8.724449157714844, -8.323729515075684, -7.923009395599365, -7.522289276123047, -7.121569633483887, -6.72084903717041, -6.32012939453125, -5.919409275054932, -5.518689155578613, -5.117969036102295, -4.717248916625977, -4.316528797149658, -3.915808916091919, -3.5150887966156006, -3.1143686771392822, -2.713648796081543, -2.3129286766052246, -1.9122076034545898, -1.5114874839782715, -1.1107674837112427, -0.7100474834442139, -0.3093273639678955, 0.09139275550842285, 0.4921126365661621, 0.8928327560424805, 1.2935528755187988, 1.6942729949951172, 2.0949931144714355, 2.495712995529175, 2.896433115005493, 3.2971532344818115, 3.697873115539551, 4.098593235015869, 4.4993133544921875, 4.900033473968506, 5.300753593444824, 5.701473236083984, 6.102193832397461, 6.502913475036621, 6.9036335945129395, 7.304353713989258, 7.705073833465576, 8.105793952941895, 8.506513595581055, 8.907234191894531, 9.307953834533691, 9.708674430847168, 10.109394073486328, 10.510114669799805, 10.910834312438965]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 10.0, 10.0, 13.0, 17.0, 14.0, 28.0, 26.0, 30.0, 28.0, 46.0, 51.0, 51.0, 65.0, 60.0, 59.0, 72.0, 57.0, 58.0, 46.0, 37.0, 42.0, 30.0, 27.0, 25.0, 30.0, 18.0, 16.0, 12.0, 8.0, 10.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.826101779937744, -4.634154319763184, -4.442207336425781, -4.250260353088379, -4.058312892913818, -3.866365671157837, -3.6744184494018555, -3.482471227645874, -3.2905240058898926, -3.098576784133911, -2.9066295623779297, -2.7146823406219482, -2.522735118865967, -2.3307878971099854, -2.138840675354004, -1.9468934535980225, -1.754946231842041, -1.5629990100860596, -1.3710517883300781, -1.1791045665740967, -0.9871573448181152, -0.7952101230621338, -0.6032629013061523, -0.4113156795501709, -0.21936845779418945, -0.027421236038208008, 0.16452598571777344, 0.3564732074737549, 0.5484204292297363, 0.7403676509857178, 0.9323148727416992, 1.1242620944976807, 1.3162097930908203, 1.5081570148468018, 1.7001042366027832, 1.8920514583587646, 2.083998680114746, 2.2759459018707275, 2.467893123626709, 2.6598403453826904, 2.851787567138672, 3.0437347888946533, 3.2356820106506348, 3.427629232406616, 3.6195764541625977, 3.811523675918579, 4.0034708976745605, 4.195418357849121, 4.387365341186523, 4.579312324523926, 4.771259784698486, 4.963207244873047, 5.155154228210449, 5.347101211547852, 5.539048671722412, 5.730996131896973, 5.922943115234375, 6.114890098571777, 6.306837558746338, 6.498785018920898, 6.690732002258301, 6.882678985595703, 7.074626445770264, 7.266573905944824, 7.458520889282227]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 5.0, 3.0, 3.0, 4.0, 7.0, 9.0, 17.0, 31.0, 60.0, 71.0, 113.0, 206.0, 358.0, 753.0, 2028.0, 6464.0, 43219.0, 3118298.0, 992334.0, 22926.0, 4480.0, 1441.0, 604.0, 344.0, 195.0, 124.0, 60.0, 43.0, 26.0, 10.0, 15.0, 10.0, 8.0, 6.0, 6.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.634765625, -3.488616943359375, -3.34246826171875, -3.196319580078125, -3.0501708984375, -2.904022216796875, -2.75787353515625, -2.611724853515625, -2.465576171875, -2.319427490234375, -2.17327880859375, -2.027130126953125, -1.8809814453125, -1.734832763671875, -1.58868408203125, -1.442535400390625, -1.29638671875, -1.150238037109375, -1.00408935546875, -0.857940673828125, -0.7117919921875, -0.565643310546875, -0.41949462890625, -0.273345947265625, -0.127197265625, 0.018951416015625, 0.16510009765625, 0.311248779296875, 0.4573974609375, 0.603546142578125, 0.74969482421875, 0.895843505859375, 1.0419921875, 1.188140869140625, 1.33428955078125, 1.480438232421875, 1.6265869140625, 1.772735595703125, 1.91888427734375, 2.065032958984375, 2.211181640625, 2.357330322265625, 2.50347900390625, 2.649627685546875, 2.7957763671875, 2.941925048828125, 3.08807373046875, 3.234222412109375, 3.38037109375, 3.526519775390625, 3.67266845703125, 3.818817138671875, 3.9649658203125, 4.111114501953125, 4.25726318359375, 4.403411865234375, 4.549560546875, 4.695709228515625, 4.84185791015625, 4.988006591796875, 5.1341552734375, 5.280303955078125, 5.42645263671875, 5.572601318359375, 5.71875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 4.0, 2.0, 6.0, 7.0, 8.0, 13.0, 17.0, 20.0, 18.0, 25.0, 40.0, 43.0, 52.0, 52.0, 45.0, 47.0, 49.0, 44.0, 54.0, 52.0, 55.0, 52.0, 53.0, 42.0, 41.0, 31.0, 20.0, 17.0, 22.0, 17.0, 11.0, 10.0, 11.0, 5.0, 3.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5693359375, -0.55029296875, -0.53125, -0.51220703125, -0.4931640625, -0.47412109375, -0.455078125, -0.43603515625, -0.4169921875, -0.39794921875, -0.37890625, -0.35986328125, -0.3408203125, -0.32177734375, -0.302734375, -0.28369140625, -0.2646484375, -0.24560546875, -0.2265625, -0.20751953125, -0.1884765625, -0.16943359375, -0.150390625, -0.13134765625, -0.1123046875, -0.09326171875, -0.07421875, -0.05517578125, -0.0361328125, -0.01708984375, 0.001953125, 0.02099609375, 0.0400390625, 0.05908203125, 0.078125, 0.09716796875, 0.1162109375, 0.13525390625, 0.154296875, 0.17333984375, 0.1923828125, 0.21142578125, 0.23046875, 0.24951171875, 0.2685546875, 0.28759765625, 0.306640625, 0.32568359375, 0.3447265625, 0.36376953125, 0.3828125, 0.40185546875, 0.4208984375, 0.43994140625, 0.458984375, 0.47802734375, 0.4970703125, 0.51611328125, 0.53515625, 0.55419921875, 0.5732421875, 0.59228515625, 0.611328125, 0.63037109375, 0.6494140625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 3.0, 8.0, 14.0, 23.0, 31.0, 50.0, 73.0, 135.0, 273.0, 546.0, 1621.0, 6104.0, 64673.0, 4027634.0, 83485.0, 6507.0, 1711.0, 637.0, 296.0, 169.0, 90.0, 65.0, 40.0, 19.0, 19.0, 14.0, 11.0, 7.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.578125, -4.411865234375, -4.24560546875, -4.079345703125, -3.9130859375, -3.746826171875, -3.58056640625, -3.414306640625, -3.248046875, -3.081787109375, -2.91552734375, -2.749267578125, -2.5830078125, -2.416748046875, -2.25048828125, -2.084228515625, -1.91796875, -1.751708984375, -1.58544921875, -1.419189453125, -1.2529296875, -1.086669921875, -0.92041015625, -0.754150390625, -0.587890625, -0.421630859375, -0.25537109375, -0.089111328125, 0.0771484375, 0.243408203125, 0.40966796875, 0.575927734375, 0.7421875, 0.908447265625, 1.07470703125, 1.240966796875, 1.4072265625, 1.573486328125, 1.73974609375, 1.906005859375, 2.072265625, 2.238525390625, 2.40478515625, 2.571044921875, 2.7373046875, 2.903564453125, 3.06982421875, 3.236083984375, 3.40234375, 3.568603515625, 3.73486328125, 3.901123046875, 4.0673828125, 4.233642578125, 4.39990234375, 4.566162109375, 4.732421875, 4.898681640625, 5.06494140625, 5.231201171875, 5.3974609375, 5.563720703125, 5.72998046875, 5.896240234375, 6.0625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 12.0, 19.0, 33.0, 72.0, 125.0, 220.0, 454.0, 811.0, 979.0, 633.0, 340.0, 164.0, 81.0, 48.0, 19.0, 21.0, 5.0, 10.0, 9.0, 1.0, 1.0, 4.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.728515625, -3.628326416015625, -3.52813720703125, -3.427947998046875, -3.3277587890625, -3.227569580078125, -3.12738037109375, -3.027191162109375, -2.927001953125, -2.826812744140625, -2.72662353515625, -2.626434326171875, -2.5262451171875, -2.426055908203125, -2.32586669921875, -2.225677490234375, -2.12548828125, -2.025299072265625, -1.92510986328125, -1.824920654296875, -1.7247314453125, -1.624542236328125, -1.52435302734375, -1.424163818359375, -1.323974609375, -1.223785400390625, -1.12359619140625, -1.023406982421875, -0.9232177734375, -0.823028564453125, -0.72283935546875, -0.622650146484375, -0.5224609375, -0.422271728515625, -0.32208251953125, -0.221893310546875, -0.1217041015625, -0.021514892578125, 0.07867431640625, 0.178863525390625, 0.279052734375, 0.379241943359375, 0.47943115234375, 0.579620361328125, 0.6798095703125, 0.779998779296875, 0.88018798828125, 0.980377197265625, 1.08056640625, 1.180755615234375, 1.28094482421875, 1.381134033203125, 1.4813232421875, 1.581512451171875, 1.68170166015625, 1.781890869140625, 1.882080078125, 1.982269287109375, 2.08245849609375, 2.182647705078125, 2.2828369140625, 2.383026123046875, 2.48321533203125, 2.583404541015625, 2.68359375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 7.0, 37.0, 67.0, 221.0, 398.0, 156.0, 55.0, 17.0, 15.0, 12.0, 5.0, 4.0, 4.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.287017822265625, -57.77751159667969, -56.26800537109375, -54.75849914550781, -53.248992919921875, -51.73948287963867, -50.229976654052734, -48.7204704284668, -47.21096420288086, -45.70145797729492, -44.191951751708984, -42.68244552612305, -41.172935485839844, -39.663429260253906, -38.15392303466797, -36.64441680908203, -35.134910583496094, -33.625404357910156, -32.11589813232422, -30.60638999938965, -29.09688377380371, -27.587377548217773, -26.077869415283203, -24.568363189697266, -23.058856964111328, -21.54935073852539, -20.039844512939453, -18.530336380004883, -17.020830154418945, -15.511323928833008, -14.001816749572754, -12.4923095703125, -10.982807159423828, -9.47330093383789, -7.963793754577637, -6.454287052154541, -4.944780349731445, -3.4352736473083496, -1.925766944885254, -0.416259765625, 1.0932464599609375, 2.602753162384033, 4.112259864807129, 5.621766567230225, 7.13127326965332, 8.640779495239258, 10.150286674499512, 11.659793853759766, 13.169300079345703, 14.67880630493164, 16.188312530517578, 17.69782066345215, 19.207326889038086, 20.716833114624023, 22.226341247558594, 23.73584747314453, 25.24535369873047, 26.754859924316406, 28.264366149902344, 29.773874282836914, 31.28338050842285, 32.79288864135742, 34.30239486694336, 35.8119010925293, 37.321407318115234]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 2.0, 2.0, 7.0, 11.0, 12.0, 22.0, 26.0, 25.0, 36.0, 41.0, 41.0, 59.0, 54.0, 73.0, 69.0, 72.0, 61.0, 50.0, 75.0, 51.0, 41.0, 43.0, 25.0, 32.0, 18.0, 14.0, 8.0, 9.0, 7.0, 8.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.759865760803223, -9.417132377624512, -9.0743989944458, -8.73166561126709, -8.388932228088379, -8.046198844909668, -7.703465461730957, -7.360732078552246, -7.017998695373535, -6.675265312194824, -6.332531929016113, -5.989798545837402, -5.647065162658691, -5.3043317794799805, -4.9615983963012695, -4.618865013122559, -4.2761311531066895, -3.9333977699279785, -3.5906643867492676, -3.2479310035705566, -2.9051976203918457, -2.5624642372131348, -2.2197306156158447, -1.8769972324371338, -1.5342638492584229, -1.191530466079712, -0.8487970232963562, -0.5060635805130005, -0.16333019733428955, 0.1794031858444214, 0.5221366882324219, 0.8648700714111328, 1.2076034545898438, 1.5503368377685547, 1.8930702209472656, 2.2358036041259766, 2.5785369873046875, 2.9212703704833984, 3.2640039920806885, 3.6067373752593994, 3.9494707584381104, 4.2922043800354, 4.634937763214111, 4.977671146392822, 5.320404529571533, 5.663137912750244, 6.005871295928955, 6.348604679107666, 6.691338062286377, 7.034071445465088, 7.376804828643799, 7.71953821182251, 8.062272071838379, 8.40500545501709, 8.7477388381958, 9.090472221374512, 9.433205604553223, 9.775938987731934, 10.118672370910645, 10.461405754089355, 10.804139137268066, 11.146872520446777, 11.489605903625488, 11.8323392868042, 12.17507266998291]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 10.0, 16.0, 19.0, 17.0, 37.0, 40.0, 67.0, 112.0, 170.0, 290.0, 515.0, 982.0, 2159.0, 5814.0, 23366.0, 221431.0, 715118.0, 61117.0, 10727.0, 3417.0, 1385.0, 737.0, 381.0, 222.0, 120.0, 89.0, 60.0, 29.0, 25.0, 26.0, 15.0, 7.0, 10.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.994140625, -2.904083251953125, -2.81402587890625, -2.723968505859375, -2.6339111328125, -2.543853759765625, -2.45379638671875, -2.363739013671875, -2.273681640625, -2.183624267578125, -2.09356689453125, -2.003509521484375, -1.9134521484375, -1.823394775390625, -1.73333740234375, -1.643280029296875, -1.55322265625, -1.463165283203125, -1.37310791015625, -1.283050537109375, -1.1929931640625, -1.102935791015625, -1.01287841796875, -0.922821044921875, -0.832763671875, -0.742706298828125, -0.65264892578125, -0.562591552734375, -0.4725341796875, -0.382476806640625, -0.29241943359375, -0.202362060546875, -0.1123046875, -0.022247314453125, 0.06781005859375, 0.157867431640625, 0.2479248046875, 0.337982177734375, 0.42803955078125, 0.518096923828125, 0.608154296875, 0.698211669921875, 0.78826904296875, 0.878326416015625, 0.9683837890625, 1.058441162109375, 1.14849853515625, 1.238555908203125, 1.32861328125, 1.418670654296875, 1.50872802734375, 1.598785400390625, 1.6888427734375, 1.778900146484375, 1.86895751953125, 1.959014892578125, 2.049072265625, 2.139129638671875, 2.22918701171875, 2.319244384765625, 2.4093017578125, 2.499359130859375, 2.58941650390625, 2.679473876953125, 2.76953125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 9.0, 10.0, 7.0, 14.0, 15.0, 23.0, 25.0, 47.0, 45.0, 58.0, 78.0, 88.0, 67.0, 100.0, 81.0, 79.0, 59.0, 62.0, 45.0, 15.0, 21.0, 17.0, 10.0, 8.0, 3.0, 5.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.21875, -2.15863037109375, -2.0985107421875, -2.03839111328125, -1.978271484375, -1.91815185546875, -1.8580322265625, -1.79791259765625, -1.73779296875, -1.67767333984375, -1.6175537109375, -1.55743408203125, -1.497314453125, -1.43719482421875, -1.3770751953125, -1.31695556640625, -1.2568359375, -1.19671630859375, -1.1365966796875, -1.07647705078125, -1.016357421875, -0.95623779296875, -0.8961181640625, -0.83599853515625, -0.77587890625, -0.71575927734375, -0.6556396484375, -0.59552001953125, -0.535400390625, -0.47528076171875, -0.4151611328125, -0.35504150390625, -0.294921875, -0.23480224609375, -0.1746826171875, -0.11456298828125, -0.054443359375, 0.00567626953125, 0.0657958984375, 0.12591552734375, 0.18603515625, 0.24615478515625, 0.3062744140625, 0.36639404296875, 0.426513671875, 0.48663330078125, 0.5467529296875, 0.60687255859375, 0.6669921875, 0.72711181640625, 0.7872314453125, 0.84735107421875, 0.907470703125, 0.96759033203125, 1.0277099609375, 1.08782958984375, 1.14794921875, 1.20806884765625, 1.2681884765625, 1.32830810546875, 1.388427734375, 1.44854736328125, 1.5086669921875, 1.56878662109375, 1.62890625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 0.0, 6.0, 5.0, 10.0, 6.0, 9.0, 23.0, 25.0, 37.0, 57.0, 76.0, 169.0, 375.0, 1157.0, 8150.0, 885424.0, 147458.0, 4077.0, 838.0, 278.0, 132.0, 76.0, 49.0, 37.0, 22.0, 16.0, 7.0, 4.0, 6.0, 6.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0078125, -4.8641357421875, -4.720458984375, -4.5767822265625, -4.43310546875, -4.2894287109375, -4.145751953125, -4.0020751953125, -3.8583984375, -3.7147216796875, -3.571044921875, -3.4273681640625, -3.28369140625, -3.1400146484375, -2.996337890625, -2.8526611328125, -2.708984375, -2.5653076171875, -2.421630859375, -2.2779541015625, -2.13427734375, -1.9906005859375, -1.846923828125, -1.7032470703125, -1.5595703125, -1.4158935546875, -1.272216796875, -1.1285400390625, -0.98486328125, -0.8411865234375, -0.697509765625, -0.5538330078125, -0.41015625, -0.2664794921875, -0.122802734375, 0.0208740234375, 0.16455078125, 0.3082275390625, 0.451904296875, 0.5955810546875, 0.7392578125, 0.8829345703125, 1.026611328125, 1.1702880859375, 1.31396484375, 1.4576416015625, 1.601318359375, 1.7449951171875, 1.888671875, 2.0323486328125, 2.176025390625, 2.3197021484375, 2.46337890625, 2.6070556640625, 2.750732421875, 2.8944091796875, 3.0380859375, 3.1817626953125, 3.325439453125, 3.4691162109375, 3.61279296875, 3.7564697265625, 3.900146484375, 4.0438232421875, 4.1875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 7.0, 11.0, 21.0, 17.0, 25.0, 29.0, 50.0, 78.0, 83.0, 86.0, 89.0, 100.0, 72.0, 81.0, 60.0, 58.0, 35.0, 24.0, 23.0, 7.0, 6.0, 9.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.28125, -5.1451416015625, -5.009033203125, -4.8729248046875, -4.73681640625, -4.6007080078125, -4.464599609375, -4.3284912109375, -4.1923828125, -4.0562744140625, -3.920166015625, -3.7840576171875, -3.64794921875, -3.5118408203125, -3.375732421875, -3.2396240234375, -3.103515625, -2.9674072265625, -2.831298828125, -2.6951904296875, -2.55908203125, -2.4229736328125, -2.286865234375, -2.1507568359375, -2.0146484375, -1.8785400390625, -1.742431640625, -1.6063232421875, -1.47021484375, -1.3341064453125, -1.197998046875, -1.0618896484375, -0.92578125, -0.7896728515625, -0.653564453125, -0.5174560546875, -0.38134765625, -0.2452392578125, -0.109130859375, 0.0269775390625, 0.1630859375, 0.2991943359375, 0.435302734375, 0.5714111328125, 0.70751953125, 0.8436279296875, 0.979736328125, 1.1158447265625, 1.251953125, 1.3880615234375, 1.524169921875, 1.6602783203125, 1.79638671875, 1.9324951171875, 2.068603515625, 2.2047119140625, 2.3408203125, 2.4769287109375, 2.613037109375, 2.7491455078125, 2.88525390625, 3.0213623046875, 3.157470703125, 3.2935791015625, 3.4296875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 8.0, 8.0, 17.0, 32.0, 41.0, 105.0, 198.0, 449.0, 1055.0, 3570.0, 17943.0, 580100.0, 423119.0, 16321.0, 3520.0, 1090.0, 489.0, 229.0, 114.0, 64.0, 28.0, 17.0, 9.0, 7.0, 8.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.65625, -0.6357269287109375, -0.615203857421875, -0.5946807861328125, -0.57415771484375, -0.5536346435546875, -0.533111572265625, -0.5125885009765625, -0.4920654296875, -0.4715423583984375, -0.451019287109375, -0.4304962158203125, -0.40997314453125, -0.3894500732421875, -0.368927001953125, -0.3484039306640625, -0.327880859375, -0.3073577880859375, -0.286834716796875, -0.2663116455078125, -0.24578857421875, -0.2252655029296875, -0.204742431640625, -0.1842193603515625, -0.1636962890625, -0.1431732177734375, -0.122650146484375, -0.1021270751953125, -0.08160400390625, -0.0610809326171875, -0.040557861328125, -0.0200347900390625, 0.00048828125, 0.0210113525390625, 0.041534423828125, 0.0620574951171875, 0.08258056640625, 0.1031036376953125, 0.123626708984375, 0.1441497802734375, 0.1646728515625, 0.1851959228515625, 0.205718994140625, 0.2262420654296875, 0.24676513671875, 0.2672882080078125, 0.287811279296875, 0.3083343505859375, 0.328857421875, 0.3493804931640625, 0.369903564453125, 0.3904266357421875, 0.41094970703125, 0.4314727783203125, 0.451995849609375, 0.4725189208984375, 0.4930419921875, 0.5135650634765625, 0.534088134765625, 0.5546112060546875, 0.57513427734375, 0.5956573486328125, 0.616180419921875, 0.6367034912109375, 0.6572265625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 5.0, 1.0, 4.0, 2.0, 7.0, 7.0, 9.0, 16.0, 18.0, 36.0, 42.0, 53.0, 113.0, 149.0, 174.0, 122.0, 71.0, 55.0, 34.0, 16.0, 14.0, 8.0, 10.0, 8.0, 12.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001304149627685547, -0.000125933438539505, -0.00012145191431045532, -0.00011697039008140564, -0.00011248886585235596, -0.00010800734162330627, -0.00010352581739425659, -9.904429316520691e-05, -9.456276893615723e-05, -9.008124470710754e-05, -8.559972047805786e-05, -8.111819624900818e-05, -7.66366720199585e-05, -7.215514779090881e-05, -6.767362356185913e-05, -6.319209933280945e-05, -5.8710575103759766e-05, -5.422905087471008e-05, -4.97475266456604e-05, -4.526600241661072e-05, -4.0784478187561035e-05, -3.630295395851135e-05, -3.182142972946167e-05, -2.7339905500411987e-05, -2.2858381271362305e-05, -1.8376857042312622e-05, -1.389533281326294e-05, -9.413808584213257e-06, -4.932284355163574e-06, -4.507601261138916e-07, 4.030764102935791e-06, 8.512288331985474e-06, 1.2993812561035156e-05, 1.747533679008484e-05, 2.195686101913452e-05, 2.6438385248184204e-05, 3.091990947723389e-05, 3.540143370628357e-05, 3.988295793533325e-05, 4.4364482164382935e-05, 4.884600639343262e-05, 5.33275306224823e-05, 5.780905485153198e-05, 6.229057908058167e-05, 6.677210330963135e-05, 7.125362753868103e-05, 7.573515176773071e-05, 8.02166759967804e-05, 8.469820022583008e-05, 8.917972445487976e-05, 9.366124868392944e-05, 9.814277291297913e-05, 0.00010262429714202881, 0.00010710582137107849, 0.00011158734560012817, 0.00011606886982917786, 0.00012055039405822754, 0.00012503191828727722, 0.0001295134425163269, 0.0001339949667453766, 0.00013847649097442627, 0.00014295801520347595, 0.00014743953943252563, 0.00015192106366157532, 0.000156402587890625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 10.0, 13.0, 8.0, 9.0, 7.0, 16.0, 26.0, 43.0, 67.0, 76.0, 167.0, 274.0, 527.0, 1550.0, 5524.0, 72318.0, 948767.0, 14745.0, 2634.0, 901.0, 376.0, 196.0, 91.0, 70.0, 53.0, 25.0, 12.0, 14.0, 13.0, 3.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3544921875, -1.31494140625, -1.275390625, -1.23583984375, -1.1962890625, -1.15673828125, -1.1171875, -1.07763671875, -1.0380859375, -0.99853515625, -0.958984375, -0.91943359375, -0.8798828125, -0.84033203125, -0.80078125, -0.76123046875, -0.7216796875, -0.68212890625, -0.642578125, -0.60302734375, -0.5634765625, -0.52392578125, -0.484375, -0.44482421875, -0.4052734375, -0.36572265625, -0.326171875, -0.28662109375, -0.2470703125, -0.20751953125, -0.16796875, -0.12841796875, -0.0888671875, -0.04931640625, -0.009765625, 0.02978515625, 0.0693359375, 0.10888671875, 0.1484375, 0.18798828125, 0.2275390625, 0.26708984375, 0.306640625, 0.34619140625, 0.3857421875, 0.42529296875, 0.46484375, 0.50439453125, 0.5439453125, 0.58349609375, 0.623046875, 0.66259765625, 0.7021484375, 0.74169921875, 0.78125, 0.82080078125, 0.8603515625, 0.89990234375, 0.939453125, 0.97900390625, 1.0185546875, 1.05810546875, 1.09765625, 1.13720703125, 1.1767578125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 8.0, 4.0, 5.0, 4.0, 8.0, 3.0, 8.0, 12.0, 11.0, 14.0, 15.0, 20.0, 28.0, 38.0, 46.0, 91.0, 151.0, 138.0, 95.0, 82.0, 57.0, 41.0, 29.0, 20.0, 19.0, 10.0, 10.0, 11.0, 6.0, 5.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.428466796875, -0.4122200012207031, -0.39597320556640625, -0.3797264099121094, -0.3634796142578125, -0.3472328186035156, -0.33098602294921875, -0.3147392272949219, -0.298492431640625, -0.2822456359863281, -0.26599884033203125, -0.24975204467773438, -0.2335052490234375, -0.21725845336914062, -0.20101165771484375, -0.18476486206054688, -0.16851806640625, -0.15227127075195312, -0.13602447509765625, -0.11977767944335938, -0.1035308837890625, -0.08728408813476562, -0.07103729248046875, -0.054790496826171875, -0.038543701171875, -0.022296905517578125, -0.00605010986328125, 0.010196685791015625, 0.0264434814453125, 0.042690277099609375, 0.05893707275390625, 0.07518386840820312, 0.0914306640625, 0.10767745971679688, 0.12392425537109375, 0.14017105102539062, 0.1564178466796875, 0.17266464233398438, 0.18891143798828125, 0.20515823364257812, 0.221405029296875, 0.23765182495117188, 0.25389862060546875, 0.2701454162597656, 0.2863922119140625, 0.3026390075683594, 0.31888580322265625, 0.3351325988769531, 0.35137939453125, 0.3676261901855469, 0.38387298583984375, 0.4001197814941406, 0.4163665771484375, 0.4326133728027344, 0.44886016845703125, 0.4651069641113281, 0.481353759765625, 0.4976005554199219, 0.5138473510742188, 0.5300941467285156, 0.5463409423828125, 0.5625877380371094, 0.5788345336914062, 0.5950813293457031, 0.611328125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 10.0, 18.0, 21.0, 38.0, 78.0, 161.0, 236.0, 176.0, 114.0, 46.0, 40.0, 18.0, 18.0, 6.0, 7.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.27452278137207, -15.87252426147461, -15.470525741577148, -15.068527221679688, -14.666528701782227, -14.264530181884766, -13.862530708312988, -13.460532188415527, -13.058533668518066, -12.656535148620605, -12.254536628723145, -11.852538108825684, -11.450538635253906, -11.048540115356445, -10.646541595458984, -10.244543075561523, -9.842544555664062, -9.440546035766602, -9.03854751586914, -8.63654899597168, -8.234550476074219, -7.8325514793396, -7.4305524826049805, -7.0285539627075195, -6.626555442810059, -6.224556922912598, -5.822558403015137, -5.420559406280518, -5.018560886383057, -4.616562366485596, -4.214563369750977, -3.8125648498535156, -3.410567283630371, -3.00856876373291, -2.60657000541687, -2.20457124710083, -1.8025727272033691, -1.4005742073059082, -0.9985754489898682, -0.5965766906738281, -0.1945781707763672, 0.2074204683303833, 0.6094191074371338, 1.0114177465438843, 1.4134163856506348, 1.8154149055480957, 2.2174136638641357, 2.619412422180176, 3.0214109420776367, 3.4234094619750977, 3.8254082202911377, 4.227406978607178, 4.629405498504639, 5.0314040184021, 5.433403015136719, 5.83540153503418, 6.237400054931641, 6.639398574829102, 7.0413970947265625, 7.443396091461182, 7.845394611358643, 8.247392654418945, 8.649392127990723, 9.051390647888184, 9.453389167785645]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 2.0, 2.0, 10.0, 7.0, 10.0, 11.0, 22.0, 21.0, 23.0, 32.0, 44.0, 43.0, 56.0, 61.0, 87.0, 96.0, 63.0, 63.0, 62.0, 53.0, 44.0, 41.0, 24.0, 33.0, 22.0, 25.0, 11.0, 8.0, 5.0, 5.0, 6.0, 2.0, 6.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-8.914539337158203, -8.626532554626465, -8.338525772094727, -8.050518989562988, -7.76251220703125, -7.474505424499512, -7.186498641967773, -6.898491859436035, -6.610485076904297, -6.322478294372559, -6.03447151184082, -5.746464729309082, -5.458457946777344, -5.1704511642456055, -4.882444381713867, -4.594437599182129, -4.306430816650391, -4.018424034118652, -3.730417251586914, -3.442410469055176, -3.1544036865234375, -2.866396903991699, -2.578390121459961, -2.2903833389282227, -2.0023765563964844, -1.714369773864746, -1.4263629913330078, -1.1383562088012695, -0.8503494262695312, -0.562342643737793, -0.2743358612060547, 0.013670921325683594, 0.30167675018310547, 0.5896835327148438, 0.877690315246582, 1.1656970977783203, 1.4537038803100586, 1.7417106628417969, 2.029717445373535, 2.3177242279052734, 2.6057310104370117, 2.89373779296875, 3.1817445755004883, 3.4697513580322266, 3.757758140563965, 4.045764923095703, 4.333771705627441, 4.62177848815918, 4.909785270690918, 5.197792053222656, 5.4857988357543945, 5.773805618286133, 6.061812400817871, 6.349819183349609, 6.637825965881348, 6.925832748413086, 7.213839530944824, 7.5018463134765625, 7.789853096008301, 8.077859878540039, 8.365866661071777, 8.653873443603516, 8.941880226135254, 9.229887008666992, 9.51789379119873]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 0.0, 4.0, 3.0, 6.0, 7.0, 11.0, 15.0, 25.0, 31.0, 41.0, 55.0, 140.0, 391.0, 68.0, 47.0, 41.0, 27.0, 20.0, 21.0, 17.0, 9.0, 4.0, 4.0, 9.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.470703125, -3.386810302734375, -3.30291748046875, -3.219024658203125, -3.1351318359375, -3.051239013671875, -2.96734619140625, -2.883453369140625, -2.799560546875, -2.715667724609375, -2.63177490234375, -2.547882080078125, -2.4639892578125, -2.380096435546875, -2.29620361328125, -2.212310791015625, -2.12841796875, -2.044525146484375, -1.96063232421875, -1.876739501953125, -1.7928466796875, -1.708953857421875, -1.62506103515625, -1.541168212890625, -1.457275390625, -1.373382568359375, -1.28948974609375, -1.205596923828125, -1.1217041015625, -1.037811279296875, -0.95391845703125, -0.870025634765625, -0.7861328125, -0.702239990234375, -0.61834716796875, -0.534454345703125, -0.4505615234375, -0.366668701171875, -0.28277587890625, -0.198883056640625, -0.114990234375, -0.031097412109375, 0.05279541015625, 0.136688232421875, 0.2205810546875, 0.304473876953125, 0.38836669921875, 0.472259521484375, 0.55615234375, 0.640045166015625, 0.72393798828125, 0.807830810546875, 0.8917236328125, 0.975616455078125, 1.05950927734375, 1.143402099609375, 1.227294921875, 1.311187744140625, 1.39508056640625, 1.478973388671875, 1.5628662109375, 1.646759033203125, 1.73065185546875, 1.814544677734375, 1.8984375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 7.0, 17.0, 10.0, 17.0, 18.0, 13.0, 20.0, 34.0, 48.0, 74.0, 120.0, 189.0, 295.0, 482.0, 969.0, 2382.0, 9559.0, 7736259.0, 625474.0, 8536.0, 2171.0, 859.0, 410.0, 224.0, 134.0, 87.0, 44.0, 32.0, 22.0, 23.0, 16.0, 7.0, 9.0, 6.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.168179512023926, -6.98426628112793, -6.800353050231934, -6.6164398193359375, -6.432526588439941, -6.248613357543945, -6.064700126647949, -5.880786895751953, -5.696873664855957, -5.512960433959961, -5.329047203063965, -5.145133972167969, -4.961220741271973, -4.777307510375977, -4.5933942794799805, -4.409481048583984, -4.2255682945251465, -4.04165506362915, -3.8577418327331543, -3.673828601837158, -3.489915370941162, -3.306002140045166, -3.122089147567749, -2.938175916671753, -2.754262685775757, -2.5703494548797607, -2.3864362239837646, -2.2025232315063477, -2.0186100006103516, -1.834696650505066, -1.6507835388183594, -1.4668703079223633, -1.282956600189209, -1.099043369293213, -0.9151301980018616, -0.7312170267105103, -0.5473037958145142, -0.36339056491851807, -0.17947745323181152, 0.00443577766418457, 0.18834900856018066, 0.37226220965385437, 0.5561754107475281, 0.7400885820388794, 0.9240018129348755, 1.1079150438308716, 1.2918281555175781, 1.4757413864135742, 1.6596546173095703, 1.8435678482055664, 2.0274810791015625, 2.2113943099975586, 2.3953075408935547, 2.579220771789551, 2.7631337642669678, 2.947046995162964, 3.13096022605896, 3.314873456954956, 3.498786687850952, 3.682699680328369, 3.8666129112243652, 4.050526142120361, 4.234439373016357, 4.4183526039123535, 4.60226583480835]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 3.0, 4.0, 3.0, 7.0, 2.0, 5.0, 37.0, 25.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.15488624572754, -16.547809600830078, -15.9407320022583, -15.33365535736084, -14.726578712463379, -14.119501113891602, -13.51242446899414, -12.90534782409668, -12.298271179199219, -11.691194534301758, -11.08411693572998, -10.47704029083252, -9.869963645935059, -9.262886047363281, -8.65580940246582, -8.04873275756836, -7.441655158996582, -6.834578037261963, -6.227501392364502, -5.620424270629883, -5.013347625732422, -4.406270503997803, -3.7991933822631836, -3.1921167373657227, -2.5850396156311035, -1.9779627323150635, -1.3708857297897339, -0.7638087272644043, -0.15673184394836426, 0.4503450393676758, 1.057422161102295, 1.6644988059997559, 2.271575927734375, 2.878652811050415, 3.485729694366455, 4.092806816101074, 4.699883460998535, 5.306960582733154, 5.914037704467773, 6.521114349365234, 7.1281914710998535, 7.735268592834473, 8.342345237731934, 8.949422836303711, 9.556499481201172, 10.163576126098633, 10.770652770996094, 11.377729415893555, 11.984807014465332, 12.591883659362793, 13.19896125793457, 13.806037902832031, 14.413114547729492, 15.020191192626953, 15.62726879119873, 16.234344482421875, 16.84142303466797, 17.44849967956543, 18.05557632446289, 18.662654876708984, 19.269731521606445, 19.876808166503906, 20.483884811401367, 21.090961456298828, 21.69803810119629]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 4.0, 7.0, 7.0, 13.0, 17.0, 24.0, 26.0, 25.0, 47.0, 47.0, 70.0, 59.0, 69.0, 77.0, 62.0, 79.0, 74.0, 53.0, 51.0, 47.0, 25.0, 38.0, 26.0, 22.0, 13.0, 8.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.244140625, -2.182159423828125, -2.12017822265625, -2.058197021484375, -1.9962158203125, -1.934234619140625, -1.87225341796875, -1.810272216796875, -1.748291015625, -1.686309814453125, -1.62432861328125, -1.562347412109375, -1.5003662109375, -1.438385009765625, -1.37640380859375, -1.314422607421875, -1.25244140625, -1.190460205078125, -1.12847900390625, -1.066497802734375, -1.0045166015625, -0.942535400390625, -0.88055419921875, -0.818572998046875, -0.756591796875, -0.694610595703125, -0.63262939453125, -0.570648193359375, -0.5086669921875, -0.446685791015625, -0.38470458984375, -0.322723388671875, -0.2607421875, -0.198760986328125, -0.13677978515625, -0.074798583984375, -0.0128173828125, 0.049163818359375, 0.11114501953125, 0.173126220703125, 0.235107421875, 0.297088623046875, 0.35906982421875, 0.421051025390625, 0.4830322265625, 0.545013427734375, 0.60699462890625, 0.668975830078125, 0.73095703125, 0.792938232421875, 0.85491943359375, 0.916900634765625, 0.9788818359375, 1.040863037109375, 1.10284423828125, 1.164825439453125, 1.226806640625, 1.288787841796875, 1.35076904296875, 1.412750244140625, 1.4747314453125, 1.536712646484375, 1.59869384765625, 1.660675048828125, 1.72265625]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 6.0, 10.0, 12.0, 16.0, 13.0, 23.0, 33.0, 60.0, 73.0, 125.0, 231.0, 438.0, 924.0, 1963.0, 5110.0, 15018.0, 62647.0, 294995.0, 106690.0, 22940.0, 7513.0, 2902.0, 1222.0, 558.0, 276.0, 176.0, 104.0, 70.0, 34.0, 33.0, 18.0, 6.0, 13.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.25, -8.966796875, -8.68359375, -8.400390625, -8.1171875, -7.833984375, -7.55078125, -7.267578125, -6.984375, -6.701171875, -6.41796875, -6.134765625, -5.8515625, -5.568359375, -5.28515625, -5.001953125, -4.71875, -4.435546875, -4.15234375, -3.869140625, -3.5859375, -3.302734375, -3.01953125, -2.736328125, -2.453125, -2.169921875, -1.88671875, -1.603515625, -1.3203125, -1.037109375, -0.75390625, -0.470703125, -0.1875, 0.095703125, 0.37890625, 0.662109375, 0.9453125, 1.228515625, 1.51171875, 1.794921875, 2.078125, 2.361328125, 2.64453125, 2.927734375, 3.2109375, 3.494140625, 3.77734375, 4.060546875, 4.34375, 4.626953125, 4.91015625, 5.193359375, 5.4765625, 5.759765625, 6.04296875, 6.326171875, 6.609375, 6.892578125, 7.17578125, 7.458984375, 7.7421875, 8.025390625, 8.30859375, 8.591796875, 8.875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 6.0, 10.0, 7.0, 14.0, 20.0, 30.0, 49.0, 41.0, 67.0, 78.0, 75.0, 67.0, 92.0, 88.0, 92.0, 74.0, 63.0, 46.0, 22.0, 19.0, 12.0, 10.0, 6.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.287109375, -1.2474822998046875, -1.207855224609375, -1.1682281494140625, -1.12860107421875, -1.0889739990234375, -1.049346923828125, -1.0097198486328125, -0.9700927734375, -0.9304656982421875, -0.890838623046875, -0.8512115478515625, -0.81158447265625, -0.7719573974609375, -0.732330322265625, -0.6927032470703125, -0.653076171875, -0.6134490966796875, -0.573822021484375, -0.5341949462890625, -0.49456787109375, -0.4549407958984375, -0.415313720703125, -0.3756866455078125, -0.3360595703125, -0.2964324951171875, -0.256805419921875, -0.2171783447265625, -0.17755126953125, -0.1379241943359375, -0.098297119140625, -0.0586700439453125, -0.01904296875, 0.0205841064453125, 0.060211181640625, 0.0998382568359375, 0.13946533203125, 0.1790924072265625, 0.218719482421875, 0.2583465576171875, 0.2979736328125, 0.3376007080078125, 0.377227783203125, 0.4168548583984375, 0.45648193359375, 0.4961090087890625, 0.535736083984375, 0.5753631591796875, 0.614990234375, 0.6546173095703125, 0.694244384765625, 0.7338714599609375, 0.77349853515625, 0.8131256103515625, 0.852752685546875, 0.8923797607421875, 0.9320068359375, 0.9716339111328125, 1.011260986328125, 1.0508880615234375, 1.09051513671875, 1.1301422119140625, 1.169769287109375, 1.2093963623046875, 1.2490234375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 11.0, 16.0, 46.0, 120.0, 165.0, 64.0, 36.0, 15.0, 7.0, 10.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4994351863861084, -2.3093364238739014, -2.1192376613616943, -1.9291387796401978, -1.7390400171279907, -1.5489412546157837, -1.358842372894287, -1.16874361038208, -0.978644847869873, -0.788546085357666, -0.5984472632408142, -0.4083484411239624, -0.21824967861175537, -0.02815091609954834, 0.16194796562194824, 0.3520467281341553, 0.5421454906463623, 0.7322442531585693, 0.9223430752754211, 1.112441897392273, 1.30254065990448, 1.492639422416687, 1.6827383041381836, 1.8728370666503906, 2.0629358291625977, 2.2530345916748047, 2.4431333541870117, 2.6332321166992188, 2.823330879211426, 3.013429641723633, 3.203528642654419, 3.393627405166626, 3.583725929260254, 3.773824691772461, 3.963923454284668, 4.154022216796875, 4.344120979309082, 4.534219741821289, 4.724318504333496, 4.914417266845703, 5.10451602935791, 5.294614791870117, 5.484713554382324, 5.674812316894531, 5.864911079406738, 6.055009841918945, 6.245108604431152, 6.435207366943359, 6.625306606292725, 6.815405368804932, 7.005504131317139, 7.195602893829346, 7.385701656341553, 7.57580041885376, 7.765899658203125, 7.955998420715332, 8.146097183227539, 8.336195945739746, 8.526294708251953, 8.71639347076416, 8.906492233276367, 9.096590995788574, 9.286689758300781, 9.476788520812988, 9.666887283325195]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 4.0, 6.0, 9.0, 7.0, 5.0, 6.0, 7.0, 6.0, 15.0, 19.0, 23.0, 45.0, 52.0, 78.0, 65.0, 32.0, 22.0, 18.0, 6.0, 4.0, 4.0, 13.0, 9.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.536627769470215, -2.4501874446868896, -2.3637471199035645, -2.27730655670166, -2.190866231918335, -2.1044259071350098, -2.0179855823516846, -1.9315451383590698, -1.845104694366455, -1.7586643695831299, -1.6722239255905151, -1.58578360080719, -1.4993431568145752, -1.41290283203125, -1.3264625072479248, -1.24002206325531, -1.1535817384719849, -1.0671414136886597, -0.9807009696960449, -0.8942606449127197, -0.807820200920105, -0.7213798761367798, -0.6349394917488098, -0.5484991073608398, -0.4620587229728699, -0.3756183385848999, -0.28917795419692993, -0.20273759961128235, -0.11629721522331238, -0.029856830835342407, 0.056583523750305176, 0.14302390813827515, 0.22946429252624512, 0.3159046769142151, 0.40234506130218506, 0.48878541588783264, 0.575225830078125, 0.6616661548614502, 0.7481065392494202, 0.8345469236373901, 0.9209873080253601, 1.00742769241333, 1.0938680171966553, 1.18030846118927, 1.2667487859725952, 1.35318922996521, 1.4396295547485352, 1.5260698795318604, 1.612510323524475, 1.6989506483078003, 1.785391092300415, 1.8718314170837402, 1.958271861076355, 2.0447123050689697, 2.131152629852295, 2.21759295463562, 2.3040332794189453, 2.3904736042022705, 2.4769139289855957, 2.5633544921875, 2.649794816970825, 2.7362351417541504, 2.8226754665374756, 2.909115791320801, 2.995556354522705]}, "eval/loss": 5.527187824249268, "eval/bleu": 0.0, "eval/runtime": 1371.8331, "eval/samples_per_second": 10.759, "eval/steps_per_second": 1.345} \ No newline at end of file