diff --git "a/wandb/run-20220310_212039-1nikmzrh/files/wandb-summary.json" "b/wandb/run-20220310_212039-1nikmzrh/files/wandb-summary.json" --- "a/wandb/run-20220310_212039-1nikmzrh/files/wandb-summary.json" +++ "b/wandb/run-20220310_212039-1nikmzrh/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.1412, "train/learning_rate": 2.377019002375297e-05, "train/epoch": 5.04, "train/global_step": 4500, "_runtime": 26336, "_timestamp": 1646973575, "_step": 4502, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 7.0, 10.0, 8.0, 16.0, 19.0, 16.0, 25.0, 26.0, 23.0, 31.0, 30.0, 27.0, 35.0, 43.0, 48.0, 44.0, 37.0, 37.0, 44.0, 41.0, 40.0, 62.0, 32.0, 43.0, 42.0, 20.0, 22.0, 22.0, 20.0, 21.0, 15.0, 9.0, 8.0, 19.0, 13.0, 3.0, 12.0, 5.0, 4.0, 7.0, 5.0, 2.0, 0.0, 1.0], "bins": [-42.2806282043457, -41.339698791503906, -40.39876937866211, -39.45783996582031, -38.516910552978516, -37.57598114013672, -36.63505172729492, -35.694122314453125, -34.75318908691406, -33.812259674072266, -32.87133026123047, -31.930400848388672, -30.989471435546875, -30.048542022705078, -29.10761070251465, -28.16668128967285, -27.225753784179688, -26.28482437133789, -25.343894958496094, -24.402965545654297, -23.4620361328125, -22.521106719970703, -21.580175399780273, -20.639245986938477, -19.69831657409668, -18.757387161254883, -17.816457748413086, -16.87552833557129, -15.934597969055176, -14.993668556213379, -14.052738189697266, -13.111808776855469, -12.170879364013672, -11.229949951171875, -10.289020538330078, -9.348090171813965, -8.407160758972168, -7.466231346130371, -6.525301456451416, -5.584371566772461, -4.643442153930664, -3.702512502670288, -2.761582851409912, -1.8206532001495361, -0.8797235488891602, 0.06120586395263672, 1.0021357536315918, 1.9430656433105469, 2.8839950561523438, 3.8249247074127197, 4.765854358673096, 5.706784248352051, 6.647713661193848, 7.5886430740356445, 8.529573440551758, 9.470502853393555, 10.411432266235352, 11.352361679077148, 12.293291091918945, 13.234221458435059, 14.175150871276855, 15.116080284118652, 16.057010650634766, 16.997940063476562, 17.93886947631836]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 1.0, 8.0, 4.0, 4.0, 11.0, 11.0, 16.0, 14.0, 17.0, 19.0, 28.0, 15.0, 24.0, 36.0, 22.0, 28.0, 33.0, 37.0, 48.0, 33.0, 50.0, 43.0, 40.0, 33.0, 42.0, 30.0, 37.0, 29.0, 36.0, 35.0, 29.0, 26.0, 20.0, 20.0, 18.0, 15.0, 15.0, 14.0, 8.0, 8.0, 10.0, 9.0, 15.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-29.311256408691406, -28.399648666381836, -27.488040924072266, -26.576435089111328, -25.664827346801758, -24.753219604492188, -23.84161376953125, -22.93000602722168, -22.01839828491211, -21.10679054260254, -20.19518280029297, -19.28357696533203, -18.37196922302246, -17.46036148071289, -16.548755645751953, -15.637147903442383, -14.725540161132812, -13.813932418823242, -12.902325630187988, -11.990718841552734, -11.079111099243164, -10.167503356933594, -9.25589656829834, -8.344289779663086, -7.432682037353516, -6.5210747718811035, -5.609467506408691, -4.697860240936279, -3.786252975463867, -2.874645709991455, -1.963038444519043, -1.0514311790466309, -0.13982391357421875, 0.7717833518981934, 1.6833906173706055, 2.5949978828430176, 3.5066051483154297, 4.418212413787842, 5.329819679260254, 6.241426944732666, 7.153034210205078, 8.064641952514648, 8.976248741149902, 9.887855529785156, 10.799463272094727, 11.711071014404297, 12.62267780303955, 13.534284591674805, 14.445892333984375, 15.357500076293945, 16.269107818603516, 17.180713653564453, 18.092321395874023, 19.003929138183594, 19.91553497314453, 20.8271427154541, 21.738750457763672, 22.650358200073242, 23.561965942382812, 24.47357177734375, 25.38517951965332, 26.29678726196289, 27.208393096923828, 28.1200008392334, 29.03160858154297]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 15.0, 24.0, 40.0, 62.0, 114.0, 172.0, 290.0, 473.0, 764.0, 1333.0, 2112.0, 3487.0, 5759.0, 9340.0, 15651.0, 25496.0, 41852.0, 67260.0, 107386.0, 165906.0, 246856.0, 346236.0, 451914.0, 523195.0, 534264.0, 476618.0, 378867.0, 275181.0, 187836.0, 122050.0, 78364.0, 48769.0, 29970.0, 18265.0, 11198.0, 6773.0, 4091.0, 2444.0, 1536.0, 933.0, 565.0, 314.0, 198.0, 122.0, 72.0, 41.0, 30.0, 20.0, 11.0, 9.0, 5.0, 3.0, 1.0, 2.0], "bins": [-25.78125, -25.0263671875, -24.271484375, -23.5166015625, -22.76171875, -22.0068359375, -21.251953125, -20.4970703125, -19.7421875, -18.9873046875, -18.232421875, -17.4775390625, -16.72265625, -15.9677734375, -15.212890625, -14.4580078125, -13.703125, -12.9482421875, -12.193359375, -11.4384765625, -10.68359375, -9.9287109375, -9.173828125, -8.4189453125, -7.6640625, -6.9091796875, -6.154296875, -5.3994140625, -4.64453125, -3.8896484375, -3.134765625, -2.3798828125, -1.625, -0.8701171875, -0.115234375, 0.6396484375, 1.39453125, 2.1494140625, 2.904296875, 3.6591796875, 4.4140625, 5.1689453125, 5.923828125, 6.6787109375, 7.43359375, 8.1884765625, 8.943359375, 9.6982421875, 10.453125, 11.2080078125, 11.962890625, 12.7177734375, 13.47265625, 14.2275390625, 14.982421875, 15.7373046875, 16.4921875, 17.2470703125, 18.001953125, 18.7568359375, 19.51171875, 20.2666015625, 21.021484375, 21.7763671875, 22.53125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 2.0, 6.0, 5.0, 11.0, 12.0, 13.0, 22.0, 24.0, 21.0, 24.0, 20.0, 23.0, 36.0, 31.0, 33.0, 42.0, 55.0, 51.0, 50.0, 40.0, 51.0, 36.0, 46.0, 39.0, 40.0, 36.0, 29.0, 29.0, 31.0, 20.0, 21.0, 17.0, 19.0, 16.0, 9.0, 9.0, 12.0, 8.0, 8.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.328125, -27.482421875, -26.63671875, -25.791015625, -24.9453125, -24.099609375, -23.25390625, -22.408203125, -21.5625, -20.716796875, -19.87109375, -19.025390625, -18.1796875, -17.333984375, -16.48828125, -15.642578125, -14.796875, -13.951171875, -13.10546875, -12.259765625, -11.4140625, -10.568359375, -9.72265625, -8.876953125, -8.03125, -7.185546875, -6.33984375, -5.494140625, -4.6484375, -3.802734375, -2.95703125, -2.111328125, -1.265625, -0.419921875, 0.42578125, 1.271484375, 2.1171875, 2.962890625, 3.80859375, 4.654296875, 5.5, 6.345703125, 7.19140625, 8.037109375, 8.8828125, 9.728515625, 10.57421875, 11.419921875, 12.265625, 13.111328125, 13.95703125, 14.802734375, 15.6484375, 16.494140625, 17.33984375, 18.185546875, 19.03125, 19.876953125, 20.72265625, 21.568359375, 22.4140625, 23.259765625, 24.10546875, 24.951171875, 25.796875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 6.0, 5.0, 9.0, 20.0, 37.0, 59.0, 113.0, 226.0, 379.0, 584.0, 992.0, 1585.0, 2686.0, 4576.0, 7191.0, 11699.0, 18647.0, 29025.0, 44407.0, 66810.0, 98627.0, 139641.0, 191471.0, 250466.0, 314180.0, 370967.0, 409960.0, 419632.0, 396815.0, 350473.0, 292866.0, 228847.0, 171265.0, 123068.0, 85538.0, 57256.0, 38031.0, 24893.0, 15760.0, 9962.0, 6111.0, 3782.0, 2303.0, 1395.0, 802.0, 464.0, 274.0, 156.0, 108.0, 58.0, 37.0, 9.0, 14.0, 3.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0], "bins": [-20.046875, -19.40673828125, -18.7666015625, -18.12646484375, -17.486328125, -16.84619140625, -16.2060546875, -15.56591796875, -14.92578125, -14.28564453125, -13.6455078125, -13.00537109375, -12.365234375, -11.72509765625, -11.0849609375, -10.44482421875, -9.8046875, -9.16455078125, -8.5244140625, -7.88427734375, -7.244140625, -6.60400390625, -5.9638671875, -5.32373046875, -4.68359375, -4.04345703125, -3.4033203125, -2.76318359375, -2.123046875, -1.48291015625, -0.8427734375, -0.20263671875, 0.4375, 1.07763671875, 1.7177734375, 2.35791015625, 2.998046875, 3.63818359375, 4.2783203125, 4.91845703125, 5.55859375, 6.19873046875, 6.8388671875, 7.47900390625, 8.119140625, 8.75927734375, 9.3994140625, 10.03955078125, 10.6796875, 11.31982421875, 11.9599609375, 12.60009765625, 13.240234375, 13.88037109375, 14.5205078125, 15.16064453125, 15.80078125, 16.44091796875, 17.0810546875, 17.72119140625, 18.361328125, 19.00146484375, 19.6416015625, 20.28173828125, 20.921875]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 10.0, 12.0, 20.0, 19.0, 29.0, 33.0, 29.0, 38.0, 59.0, 81.0, 93.0, 92.0, 114.0, 117.0, 145.0, 144.0, 150.0, 213.0, 182.0, 200.0, 192.0, 187.0, 189.0, 200.0, 193.0, 137.0, 150.0, 148.0, 126.0, 119.0, 108.0, 80.0, 82.0, 63.0, 56.0, 39.0, 34.0, 41.0, 34.0, 19.0, 17.0, 21.0, 11.0, 8.0, 11.0, 3.0, 2.0, 4.0, 1.0, 1.0, 5.0, 2.0, 0.0, 2.0, 4.0], "bins": [-9.9140625, -9.5814208984375, -9.248779296875, -8.9161376953125, -8.58349609375, -8.2508544921875, -7.918212890625, -7.5855712890625, -7.2529296875, -6.9202880859375, -6.587646484375, -6.2550048828125, -5.92236328125, -5.5897216796875, -5.257080078125, -4.9244384765625, -4.591796875, -4.2591552734375, -3.926513671875, -3.5938720703125, -3.26123046875, -2.9285888671875, -2.595947265625, -2.2633056640625, -1.9306640625, -1.5980224609375, -1.265380859375, -0.9327392578125, -0.60009765625, -0.2674560546875, 0.065185546875, 0.3978271484375, 0.73046875, 1.0631103515625, 1.395751953125, 1.7283935546875, 2.06103515625, 2.3936767578125, 2.726318359375, 3.0589599609375, 3.3916015625, 3.7242431640625, 4.056884765625, 4.3895263671875, 4.72216796875, 5.0548095703125, 5.387451171875, 5.7200927734375, 6.052734375, 6.3853759765625, 6.718017578125, 7.0506591796875, 7.38330078125, 7.7159423828125, 8.048583984375, 8.3812255859375, 8.7138671875, 9.0465087890625, 9.379150390625, 9.7117919921875, 10.04443359375, 10.3770751953125, 10.709716796875, 11.0423583984375, 11.375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 6.0, 7.0, 11.0, 13.0, 11.0, 16.0, 22.0, 31.0, 29.0, 31.0, 34.0, 41.0, 38.0, 35.0, 49.0, 42.0, 61.0, 43.0, 34.0, 60.0, 44.0, 41.0, 45.0, 44.0, 41.0, 22.0, 29.0, 28.0, 15.0, 14.0, 20.0, 13.0, 15.0, 6.0, 4.0, 2.0, 1.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.362350463867188, -30.337923049926758, -29.313495635986328, -28.28907012939453, -27.2646427154541, -26.240215301513672, -25.215787887573242, -24.191360473632812, -23.166934967041016, -22.142507553100586, -21.118080139160156, -20.09365463256836, -19.06922721862793, -18.0447998046875, -17.02037239074707, -15.99594497680664, -14.971517562866211, -13.947090148925781, -12.922663688659668, -11.898236274719238, -10.873809814453125, -9.849382400512695, -8.824954986572266, -7.800528049468994, -6.776101112365723, -5.751674175262451, -4.72724723815918, -3.70281982421875, -2.6783928871154785, -1.653965950012207, -0.6295385360717773, 0.39488840103149414, 1.4193153381347656, 2.443742275238037, 3.4681694507598877, 4.492596626281738, 5.51702356338501, 6.541450500488281, 7.565877914428711, 8.59030532836914, 9.614731788635254, 10.639159202575684, 11.663585662841797, 12.688013076782227, 13.712440490722656, 14.73686695098877, 15.7612943649292, 16.785720825195312, 17.810148239135742, 18.834575653076172, 19.8590030670166, 20.88343048095703, 21.907855987548828, 22.932283401489258, 23.956710815429688, 24.981138229370117, 26.005565643310547, 27.029993057250977, 28.054420471191406, 29.078845977783203, 30.103273391723633, 31.127700805664062, 32.152130126953125, 33.17655563354492, 34.20098114013672]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 7.0, 7.0, 5.0, 3.0, 11.0, 10.0, 16.0, 8.0, 16.0, 23.0, 25.0, 22.0, 23.0, 28.0, 25.0, 31.0, 38.0, 49.0, 27.0, 47.0, 39.0, 36.0, 43.0, 41.0, 41.0, 41.0, 28.0, 30.0, 40.0, 40.0, 26.0, 29.0, 25.0, 17.0, 20.0, 8.0, 12.0, 16.0, 12.0, 4.0, 12.0, 7.0, 2.0, 7.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-32.368343353271484, -31.437801361083984, -30.507261276245117, -29.57672119140625, -28.64617919921875, -27.71563720703125, -26.785097122192383, -25.854557037353516, -24.924015045166016, -23.993473052978516, -23.06293296813965, -22.13239288330078, -21.20185089111328, -20.27130889892578, -19.340768814086914, -18.410228729248047, -17.479686737060547, -16.549144744873047, -15.61860466003418, -14.688063621520996, -13.757522583007812, -12.826981544494629, -11.896440505981445, -10.965899467468262, -10.035358428955078, -9.104817390441895, -8.174276351928711, -7.243735313415527, -6.313194274902344, -5.38265323638916, -4.452112197875977, -3.521571159362793, -2.5910301208496094, -1.6604890823364258, -0.7299480438232422, 0.2005929946899414, 1.131134033203125, 2.0616750717163086, 2.992216110229492, 3.922757148742676, 4.853298187255859, 5.783839225769043, 6.714380264282227, 7.64492130279541, 8.575462341308594, 9.506003379821777, 10.436544418334961, 11.367085456848145, 12.297626495361328, 13.228167533874512, 14.158708572387695, 15.089249610900879, 16.019790649414062, 16.950332641601562, 17.88087272644043, 18.811412811279297, 19.741954803466797, 20.672496795654297, 21.603036880493164, 22.53357696533203, 23.46411895751953, 24.39466094970703, 25.3252010345459, 26.255741119384766, 27.186283111572266]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 8.0, 4.0, 7.0, 9.0, 13.0, 17.0, 38.0, 42.0, 46.0, 67.0, 104.0, 104.0, 157.0, 261.0, 365.0, 512.0, 816.0, 1129.0, 1839.0, 2883.0, 4514.0, 7381.0, 12738.0, 23542.0, 46088.0, 99954.0, 230889.0, 317081.0, 153661.0, 68052.0, 32768.0, 17429.0, 9788.0, 5814.0, 3557.0, 2298.0, 1473.0, 1021.0, 695.0, 404.0, 272.0, 190.0, 153.0, 102.0, 66.0, 56.0, 38.0, 38.0, 24.0, 16.0, 17.0, 5.0, 10.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.0, -18.3720703125, -17.744140625, -17.1162109375, -16.48828125, -15.8603515625, -15.232421875, -14.6044921875, -13.9765625, -13.3486328125, -12.720703125, -12.0927734375, -11.46484375, -10.8369140625, -10.208984375, -9.5810546875, -8.953125, -8.3251953125, -7.697265625, -7.0693359375, -6.44140625, -5.8134765625, -5.185546875, -4.5576171875, -3.9296875, -3.3017578125, -2.673828125, -2.0458984375, -1.41796875, -0.7900390625, -0.162109375, 0.4658203125, 1.09375, 1.7216796875, 2.349609375, 2.9775390625, 3.60546875, 4.2333984375, 4.861328125, 5.4892578125, 6.1171875, 6.7451171875, 7.373046875, 8.0009765625, 8.62890625, 9.2568359375, 9.884765625, 10.5126953125, 11.140625, 11.7685546875, 12.396484375, 13.0244140625, 13.65234375, 14.2802734375, 14.908203125, 15.5361328125, 16.1640625, 16.7919921875, 17.419921875, 18.0478515625, 18.67578125, 19.3037109375, 19.931640625, 20.5595703125, 21.1875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 9.0, 5.0, 6.0, 4.0, 12.0, 8.0, 15.0, 8.0, 18.0, 21.0, 26.0, 23.0, 22.0, 29.0, 26.0, 29.0, 38.0, 48.0, 26.0, 50.0, 42.0, 37.0, 39.0, 40.0, 45.0, 39.0, 27.0, 31.0, 37.0, 42.0, 30.0, 28.0, 22.0, 19.0, 18.0, 9.0, 11.0, 15.0, 13.0, 6.0, 9.0, 7.0, 3.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-32.1875, -31.26416015625, -30.3408203125, -29.41748046875, -28.494140625, -27.57080078125, -26.6474609375, -25.72412109375, -24.80078125, -23.87744140625, -22.9541015625, -22.03076171875, -21.107421875, -20.18408203125, -19.2607421875, -18.33740234375, -17.4140625, -16.49072265625, -15.5673828125, -14.64404296875, -13.720703125, -12.79736328125, -11.8740234375, -10.95068359375, -10.02734375, -9.10400390625, -8.1806640625, -7.25732421875, -6.333984375, -5.41064453125, -4.4873046875, -3.56396484375, -2.640625, -1.71728515625, -0.7939453125, 0.12939453125, 1.052734375, 1.97607421875, 2.8994140625, 3.82275390625, 4.74609375, 5.66943359375, 6.5927734375, 7.51611328125, 8.439453125, 9.36279296875, 10.2861328125, 11.20947265625, 12.1328125, 13.05615234375, 13.9794921875, 14.90283203125, 15.826171875, 16.74951171875, 17.6728515625, 18.59619140625, 19.51953125, 20.44287109375, 21.3662109375, 22.28955078125, 23.212890625, 24.13623046875, 25.0595703125, 25.98291015625, 26.90625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 6.0, 8.0, 8.0, 13.0, 16.0, 19.0, 26.0, 31.0, 40.0, 57.0, 61.0, 107.0, 147.0, 238.0, 293.0, 459.0, 737.0, 1280.0, 2222.0, 4199.0, 9109.0, 24001.0, 96661.0, 623176.0, 220860.0, 38998.0, 12852.0, 5719.0, 2842.0, 1596.0, 953.0, 582.0, 391.0, 231.0, 176.0, 115.0, 92.0, 58.0, 48.0, 39.0, 26.0, 30.0, 9.0, 12.0, 6.0, 4.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.984375, -31.00634765625, -30.0283203125, -29.05029296875, -28.072265625, -27.09423828125, -26.1162109375, -25.13818359375, -24.16015625, -23.18212890625, -22.2041015625, -21.22607421875, -20.248046875, -19.27001953125, -18.2919921875, -17.31396484375, -16.3359375, -15.35791015625, -14.3798828125, -13.40185546875, -12.423828125, -11.44580078125, -10.4677734375, -9.48974609375, -8.51171875, -7.53369140625, -6.5556640625, -5.57763671875, -4.599609375, -3.62158203125, -2.6435546875, -1.66552734375, -0.6875, 0.29052734375, 1.2685546875, 2.24658203125, 3.224609375, 4.20263671875, 5.1806640625, 6.15869140625, 7.13671875, 8.11474609375, 9.0927734375, 10.07080078125, 11.048828125, 12.02685546875, 13.0048828125, 13.98291015625, 14.9609375, 15.93896484375, 16.9169921875, 17.89501953125, 18.873046875, 19.85107421875, 20.8291015625, 21.80712890625, 22.78515625, 23.76318359375, 24.7412109375, 25.71923828125, 26.697265625, 27.67529296875, 28.6533203125, 29.63134765625, 30.609375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 6.0, 5.0, 11.0, 8.0, 6.0, 9.0, 17.0, 10.0, 16.0, 22.0, 18.0, 30.0, 22.0, 28.0, 30.0, 38.0, 28.0, 33.0, 28.0, 37.0, 39.0, 36.0, 34.0, 41.0, 41.0, 41.0, 40.0, 35.0, 30.0, 34.0, 40.0, 27.0, 24.0, 23.0, 18.0, 21.0, 8.0, 14.0, 9.0, 14.0, 6.0, 6.0, 10.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0], "bins": [-23.4375, -22.77880859375, -22.1201171875, -21.46142578125, -20.802734375, -20.14404296875, -19.4853515625, -18.82666015625, -18.16796875, -17.50927734375, -16.8505859375, -16.19189453125, -15.533203125, -14.87451171875, -14.2158203125, -13.55712890625, -12.8984375, -12.23974609375, -11.5810546875, -10.92236328125, -10.263671875, -9.60498046875, -8.9462890625, -8.28759765625, -7.62890625, -6.97021484375, -6.3115234375, -5.65283203125, -4.994140625, -4.33544921875, -3.6767578125, -3.01806640625, -2.359375, -1.70068359375, -1.0419921875, -0.38330078125, 0.275390625, 0.93408203125, 1.5927734375, 2.25146484375, 2.91015625, 3.56884765625, 4.2275390625, 4.88623046875, 5.544921875, 6.20361328125, 6.8623046875, 7.52099609375, 8.1796875, 8.83837890625, 9.4970703125, 10.15576171875, 10.814453125, 11.47314453125, 12.1318359375, 12.79052734375, 13.44921875, 14.10791015625, 14.7666015625, 15.42529296875, 16.083984375, 16.74267578125, 17.4013671875, 18.06005859375, 18.71875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 2.0, 4.0, 2.0, 7.0, 6.0, 9.0, 6.0, 12.0, 25.0, 31.0, 44.0, 90.0, 135.0, 206.0, 338.0, 661.0, 1342.0, 2769.0, 6786.0, 21086.0, 121588.0, 761989.0, 100739.0, 18908.0, 6286.0, 2629.0, 1182.0, 699.0, 356.0, 213.0, 125.0, 75.0, 59.0, 46.0, 29.0, 18.0, 18.0, 9.0, 12.0, 2.0, 7.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.703125, -19.1142578125, -18.525390625, -17.9365234375, -17.34765625, -16.7587890625, -16.169921875, -15.5810546875, -14.9921875, -14.4033203125, -13.814453125, -13.2255859375, -12.63671875, -12.0478515625, -11.458984375, -10.8701171875, -10.28125, -9.6923828125, -9.103515625, -8.5146484375, -7.92578125, -7.3369140625, -6.748046875, -6.1591796875, -5.5703125, -4.9814453125, -4.392578125, -3.8037109375, -3.21484375, -2.6259765625, -2.037109375, -1.4482421875, -0.859375, -0.2705078125, 0.318359375, 0.9072265625, 1.49609375, 2.0849609375, 2.673828125, 3.2626953125, 3.8515625, 4.4404296875, 5.029296875, 5.6181640625, 6.20703125, 6.7958984375, 7.384765625, 7.9736328125, 8.5625, 9.1513671875, 9.740234375, 10.3291015625, 10.91796875, 11.5068359375, 12.095703125, 12.6845703125, 13.2734375, 13.8623046875, 14.451171875, 15.0400390625, 15.62890625, 16.2177734375, 16.806640625, 17.3955078125, 17.984375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 8.0, 8.0, 8.0, 8.0, 5.0, 8.0, 10.0, 19.0, 17.0, 18.0, 21.0, 19.0, 34.0, 49.0, 56.0, 55.0, 87.0, 93.0, 80.0, 67.0, 56.0, 51.0, 39.0, 26.0, 45.0, 20.0, 17.0, 8.0, 7.0, 7.0, 10.0, 6.0, 5.0, 7.0, 5.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0009813308715820312, -0.0009532496333122253, -0.0009251683950424194, -0.0008970871567726135, -0.0008690059185028076, -0.0008409246802330017, -0.0008128434419631958, -0.0007847622036933899, -0.000756680965423584, -0.0007285997271537781, -0.0007005184888839722, -0.0006724372506141663, -0.0006443560123443604, -0.0006162747740745544, -0.0005881935358047485, -0.0005601122975349426, -0.0005320310592651367, -0.0005039498209953308, -0.0004758685827255249, -0.000447787344455719, -0.0004197061061859131, -0.0003916248679161072, -0.00036354362964630127, -0.00033546239137649536, -0.00030738115310668945, -0.00027929991483688354, -0.00025121867656707764, -0.00022313743829727173, -0.00019505620002746582, -0.0001669749617576599, -0.000138893723487854, -0.0001108124852180481, -8.273124694824219e-05, -5.465000867843628e-05, -2.656877040863037e-05, 1.5124678611755371e-06, 2.9593706130981445e-05, 5.7674944400787354e-05, 8.575618267059326e-05, 0.00011383742094039917, 0.00014191865921020508, 0.00016999989748001099, 0.0001980811357498169, 0.0002261623740196228, 0.0002542436122894287, 0.0002823248505592346, 0.00031040608882904053, 0.00033848732709884644, 0.00036656856536865234, 0.00039464980363845825, 0.00042273104190826416, 0.00045081228017807007, 0.000478893518447876, 0.0005069747567176819, 0.0005350559949874878, 0.0005631372332572937, 0.0005912184715270996, 0.0006192997097969055, 0.0006473809480667114, 0.0006754621863365173, 0.0007035434246063232, 0.0007316246628761292, 0.0007597059011459351, 0.000787787139415741, 0.0008158683776855469]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 3.0, 9.0, 12.0, 11.0, 15.0, 20.0, 24.0, 36.0, 63.0, 115.0, 201.0, 336.0, 595.0, 1147.0, 2180.0, 4291.0, 9007.0, 19823.0, 50064.0, 184376.0, 511050.0, 179172.0, 48586.0, 19533.0, 8955.0, 4227.0, 2139.0, 1154.0, 564.0, 354.0, 175.0, 104.0, 69.0, 37.0, 30.0, 15.0, 19.0, 9.0, 15.0, 9.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.390625, -15.8701171875, -15.349609375, -14.8291015625, -14.30859375, -13.7880859375, -13.267578125, -12.7470703125, -12.2265625, -11.7060546875, -11.185546875, -10.6650390625, -10.14453125, -9.6240234375, -9.103515625, -8.5830078125, -8.0625, -7.5419921875, -7.021484375, -6.5009765625, -5.98046875, -5.4599609375, -4.939453125, -4.4189453125, -3.8984375, -3.3779296875, -2.857421875, -2.3369140625, -1.81640625, -1.2958984375, -0.775390625, -0.2548828125, 0.265625, 0.7861328125, 1.306640625, 1.8271484375, 2.34765625, 2.8681640625, 3.388671875, 3.9091796875, 4.4296875, 4.9501953125, 5.470703125, 5.9912109375, 6.51171875, 7.0322265625, 7.552734375, 8.0732421875, 8.59375, 9.1142578125, 9.634765625, 10.1552734375, 10.67578125, 11.1962890625, 11.716796875, 12.2373046875, 12.7578125, 13.2783203125, 13.798828125, 14.3193359375, 14.83984375, 15.3603515625, 15.880859375, 16.4013671875, 16.921875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 8.0, 12.0, 17.0, 25.0, 48.0, 82.0, 124.0, 163.0, 150.0, 116.0, 95.0, 64.0, 43.0, 19.0, 13.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.015625, -7.81634521484375, -7.6170654296875, -7.41778564453125, -7.218505859375, -7.01922607421875, -6.8199462890625, -6.62066650390625, -6.42138671875, -6.22210693359375, -6.0228271484375, -5.82354736328125, -5.624267578125, -5.42498779296875, -5.2257080078125, -5.02642822265625, -4.8271484375, -4.62786865234375, -4.4285888671875, -4.22930908203125, -4.030029296875, -3.83074951171875, -3.6314697265625, -3.43218994140625, -3.23291015625, -3.03363037109375, -2.8343505859375, -2.63507080078125, -2.435791015625, -2.23651123046875, -2.0372314453125, -1.83795166015625, -1.638671875, -1.43939208984375, -1.2401123046875, -1.04083251953125, -0.841552734375, -0.64227294921875, -0.4429931640625, -0.24371337890625, -0.04443359375, 0.15484619140625, 0.3541259765625, 0.55340576171875, 0.752685546875, 0.95196533203125, 1.1512451171875, 1.35052490234375, 1.5498046875, 1.74908447265625, 1.9483642578125, 2.14764404296875, 2.346923828125, 2.54620361328125, 2.7454833984375, 2.94476318359375, 3.14404296875, 3.34332275390625, 3.5426025390625, 3.74188232421875, 3.941162109375, 4.14044189453125, 4.3397216796875, 4.53900146484375, 4.73828125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 0.0, 4.0, 3.0, 5.0, 3.0, 10.0, 21.0, 15.0, 15.0, 21.0, 30.0, 30.0, 31.0, 29.0, 39.0, 44.0, 56.0, 37.0, 47.0, 41.0, 41.0, 60.0, 45.0, 41.0, 47.0, 41.0, 38.0, 37.0, 27.0, 32.0, 18.0, 21.0, 10.0, 15.0, 15.0, 10.0, 12.0, 6.0, 1.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.02405548095703, -30.0318546295166, -29.039653778076172, -28.047454833984375, -27.055253982543945, -26.063053131103516, -25.07085418701172, -24.07865333557129, -23.08645248413086, -22.09425163269043, -21.10205078125, -20.109851837158203, -19.117650985717773, -18.125450134277344, -17.133251190185547, -16.141050338745117, -15.148849487304688, -14.156648635864258, -13.164448738098145, -12.172248840332031, -11.180047988891602, -10.187847137451172, -9.195647239685059, -8.203447341918945, -7.211246490478516, -6.219046115875244, -5.226845741271973, -4.234645366668701, -3.2424449920654297, -2.250244617462158, -1.2580442428588867, -0.26584386825561523, 0.7263565063476562, 1.7185568809509277, 2.710757255554199, 3.7029576301574707, 4.695158004760742, 5.687358379364014, 6.679558753967285, 7.671759128570557, 8.663959503173828, 9.656160354614258, 10.648360252380371, 11.640560150146484, 12.632761001586914, 13.624961853027344, 14.617161750793457, 15.60936164855957, 16.6015625, 17.59376335144043, 18.58596420288086, 19.578163146972656, 20.570363998413086, 21.562564849853516, 22.554763793945312, 23.546964645385742, 24.539165496826172, 25.5313663482666, 26.52356719970703, 27.515766143798828, 28.507966995239258, 29.500167846679688, 30.492366790771484, 31.484567642211914, 32.476768493652344]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 7.0, 4.0, 7.0, 4.0, 11.0, 14.0, 13.0, 13.0, 16.0, 32.0, 18.0, 22.0, 22.0, 26.0, 29.0, 32.0, 45.0, 42.0, 43.0, 44.0, 31.0, 40.0, 39.0, 44.0, 44.0, 37.0, 29.0, 36.0, 46.0, 23.0, 33.0, 25.0, 18.0, 18.0, 14.0, 11.0, 15.0, 10.0, 9.0, 9.0, 5.0, 4.0, 8.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-32.05927276611328, -31.126136779785156, -30.193002700805664, -29.25986671447754, -28.326732635498047, -27.393596649169922, -26.460460662841797, -25.527326583862305, -24.594192504882812, -23.661056518554688, -22.727922439575195, -21.79478645324707, -20.861652374267578, -19.928516387939453, -18.995380401611328, -18.062246322631836, -17.12911033630371, -16.195974349975586, -15.262840270996094, -14.329704284667969, -13.396570205688477, -12.463434219360352, -11.530299186706543, -10.597164154052734, -9.664029121398926, -8.730894088745117, -7.797759056091309, -6.864623546600342, -5.931488513946533, -4.998353481292725, -4.065217971801758, -3.132082939147949, -2.1989479064941406, -1.2658127546310425, -0.33267760276794434, 0.6004576683044434, 1.533592700958252, 2.4667277336120605, 3.3998632431030273, 4.332998275756836, 5.2661333084106445, 6.199268341064453, 7.132403373718262, 8.06553840637207, 8.998674392700195, 9.931808471679688, 10.864944458007812, 11.798079490661621, 12.73121452331543, 13.664349555969238, 14.597484588623047, 15.530620574951172, 16.463754653930664, 17.39689064025879, 18.33002471923828, 19.263160705566406, 20.19629669189453, 21.129432678222656, 22.06256675720215, 22.995702743530273, 23.928836822509766, 24.86197280883789, 25.795108795166016, 26.728242874145508, 27.661376953125]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 12.0, 19.0, 22.0, 35.0, 64.0, 86.0, 133.0, 211.0, 333.0, 494.0, 886.0, 1379.0, 2119.0, 3444.0, 5245.0, 7960.0, 11976.0, 17436.0, 25465.0, 35153.0, 47023.0, 60169.0, 73561.0, 85950.0, 94194.0, 96629.0, 94190.0, 86228.0, 74175.0, 61007.0, 47767.0, 35878.0, 25623.0, 18297.0, 12277.0, 8304.0, 5297.0, 3444.0, 2217.0, 1424.0, 900.0, 572.0, 359.0, 218.0, 154.0, 74.0, 67.0, 27.0, 23.0, 14.0, 13.0, 3.0, 2.0, 2.0, 2.0], "bins": [-19.40625, -18.84423828125, -18.2822265625, -17.72021484375, -17.158203125, -16.59619140625, -16.0341796875, -15.47216796875, -14.91015625, -14.34814453125, -13.7861328125, -13.22412109375, -12.662109375, -12.10009765625, -11.5380859375, -10.97607421875, -10.4140625, -9.85205078125, -9.2900390625, -8.72802734375, -8.166015625, -7.60400390625, -7.0419921875, -6.47998046875, -5.91796875, -5.35595703125, -4.7939453125, -4.23193359375, -3.669921875, -3.10791015625, -2.5458984375, -1.98388671875, -1.421875, -0.85986328125, -0.2978515625, 0.26416015625, 0.826171875, 1.38818359375, 1.9501953125, 2.51220703125, 3.07421875, 3.63623046875, 4.1982421875, 4.76025390625, 5.322265625, 5.88427734375, 6.4462890625, 7.00830078125, 7.5703125, 8.13232421875, 8.6943359375, 9.25634765625, 9.818359375, 10.38037109375, 10.9423828125, 11.50439453125, 12.06640625, 12.62841796875, 13.1904296875, 13.75244140625, 14.314453125, 14.87646484375, 15.4384765625, 16.00048828125, 16.5625]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 7.0, 4.0, 6.0, 6.0, 10.0, 15.0, 13.0, 12.0, 20.0, 30.0, 16.0, 25.0, 20.0, 26.0, 32.0, 32.0, 46.0, 37.0, 42.0, 43.0, 35.0, 41.0, 38.0, 39.0, 43.0, 43.0, 28.0, 38.0, 38.0, 27.0, 33.0, 23.0, 24.0, 18.0, 10.0, 15.0, 14.0, 9.0, 10.0, 8.0, 4.0, 5.0, 8.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-31.140625, -30.2333984375, -29.326171875, -28.4189453125, -27.51171875, -26.6044921875, -25.697265625, -24.7900390625, -23.8828125, -22.9755859375, -22.068359375, -21.1611328125, -20.25390625, -19.3466796875, -18.439453125, -17.5322265625, -16.625, -15.7177734375, -14.810546875, -13.9033203125, -12.99609375, -12.0888671875, -11.181640625, -10.2744140625, -9.3671875, -8.4599609375, -7.552734375, -6.6455078125, -5.73828125, -4.8310546875, -3.923828125, -3.0166015625, -2.109375, -1.2021484375, -0.294921875, 0.6123046875, 1.51953125, 2.4267578125, 3.333984375, 4.2412109375, 5.1484375, 6.0556640625, 6.962890625, 7.8701171875, 8.77734375, 9.6845703125, 10.591796875, 11.4990234375, 12.40625, 13.3134765625, 14.220703125, 15.1279296875, 16.03515625, 16.9423828125, 17.849609375, 18.7568359375, 19.6640625, 20.5712890625, 21.478515625, 22.3857421875, 23.29296875, 24.2001953125, 25.107421875, 26.0146484375, 26.921875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 9.0, 7.0, 9.0, 11.0, 34.0, 41.0, 85.0, 107.0, 175.0, 261.0, 464.0, 676.0, 1224.0, 1888.0, 3096.0, 5073.0, 8119.0, 12829.0, 19772.0, 29826.0, 43772.0, 60545.0, 80324.0, 97941.0, 110806.0, 114377.0, 109277.0, 95053.0, 76410.0, 57757.0, 40983.0, 27832.0, 18386.0, 11972.0, 7440.0, 4528.0, 2884.0, 1724.0, 1052.0, 677.0, 385.0, 262.0, 165.0, 103.0, 66.0, 45.0, 27.0, 24.0, 13.0, 7.0, 10.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.515625, -21.798828125, -21.08203125, -20.365234375, -19.6484375, -18.931640625, -18.21484375, -17.498046875, -16.78125, -16.064453125, -15.34765625, -14.630859375, -13.9140625, -13.197265625, -12.48046875, -11.763671875, -11.046875, -10.330078125, -9.61328125, -8.896484375, -8.1796875, -7.462890625, -6.74609375, -6.029296875, -5.3125, -4.595703125, -3.87890625, -3.162109375, -2.4453125, -1.728515625, -1.01171875, -0.294921875, 0.421875, 1.138671875, 1.85546875, 2.572265625, 3.2890625, 4.005859375, 4.72265625, 5.439453125, 6.15625, 6.873046875, 7.58984375, 8.306640625, 9.0234375, 9.740234375, 10.45703125, 11.173828125, 11.890625, 12.607421875, 13.32421875, 14.041015625, 14.7578125, 15.474609375, 16.19140625, 16.908203125, 17.625, 18.341796875, 19.05859375, 19.775390625, 20.4921875, 21.208984375, 21.92578125, 22.642578125, 23.359375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 1.0, 4.0, 4.0, 7.0, 3.0, 10.0, 12.0, 14.0, 8.0, 15.0, 9.0, 19.0, 16.0, 23.0, 20.0, 29.0, 32.0, 31.0, 32.0, 31.0, 27.0, 35.0, 46.0, 42.0, 46.0, 34.0, 53.0, 33.0, 49.0, 41.0, 31.0, 29.0, 33.0, 32.0, 19.0, 20.0, 22.0, 19.0, 15.0, 7.0, 8.0, 8.0, 7.0, 7.0, 5.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0], "bins": [-19.796875, -19.2080078125, -18.619140625, -18.0302734375, -17.44140625, -16.8525390625, -16.263671875, -15.6748046875, -15.0859375, -14.4970703125, -13.908203125, -13.3193359375, -12.73046875, -12.1416015625, -11.552734375, -10.9638671875, -10.375, -9.7861328125, -9.197265625, -8.6083984375, -8.01953125, -7.4306640625, -6.841796875, -6.2529296875, -5.6640625, -5.0751953125, -4.486328125, -3.8974609375, -3.30859375, -2.7197265625, -2.130859375, -1.5419921875, -0.953125, -0.3642578125, 0.224609375, 0.8134765625, 1.40234375, 1.9912109375, 2.580078125, 3.1689453125, 3.7578125, 4.3466796875, 4.935546875, 5.5244140625, 6.11328125, 6.7021484375, 7.291015625, 7.8798828125, 8.46875, 9.0576171875, 9.646484375, 10.2353515625, 10.82421875, 11.4130859375, 12.001953125, 12.5908203125, 13.1796875, 13.7685546875, 14.357421875, 14.9462890625, 15.53515625, 16.1240234375, 16.712890625, 17.3017578125, 17.890625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 3.0, 7.0, 11.0, 20.0, 28.0, 45.0, 55.0, 89.0, 131.0, 171.0, 269.0, 396.0, 655.0, 1007.0, 1557.0, 2368.0, 3517.0, 5201.0, 7879.0, 11564.0, 16819.0, 23806.0, 33451.0, 44492.0, 57865.0, 71588.0, 83015.0, 92657.0, 96831.0, 94337.0, 87673.0, 76162.0, 62197.0, 49281.0, 37058.0, 27111.0, 19159.0, 13198.0, 8956.0, 6118.0, 4121.0, 2633.0, 1749.0, 1173.0, 722.0, 499.0, 329.0, 190.0, 142.0, 95.0, 51.0, 52.0, 28.0, 9.0, 15.0, 6.0, 3.0, 3.0, 2.0, 1.0], "bins": [-6.125, -5.93756103515625, -5.7501220703125, -5.56268310546875, -5.375244140625, -5.18780517578125, -5.0003662109375, -4.81292724609375, -4.62548828125, -4.43804931640625, -4.2506103515625, -4.06317138671875, -3.875732421875, -3.68829345703125, -3.5008544921875, -3.31341552734375, -3.1259765625, -2.93853759765625, -2.7510986328125, -2.56365966796875, -2.376220703125, -2.18878173828125, -2.0013427734375, -1.81390380859375, -1.62646484375, -1.43902587890625, -1.2515869140625, -1.06414794921875, -0.876708984375, -0.68927001953125, -0.5018310546875, -0.31439208984375, -0.126953125, 0.06048583984375, 0.2479248046875, 0.43536376953125, 0.622802734375, 0.81024169921875, 0.9976806640625, 1.18511962890625, 1.37255859375, 1.55999755859375, 1.7474365234375, 1.93487548828125, 2.122314453125, 2.30975341796875, 2.4971923828125, 2.68463134765625, 2.8720703125, 3.05950927734375, 3.2469482421875, 3.43438720703125, 3.621826171875, 3.80926513671875, 3.9967041015625, 4.18414306640625, 4.37158203125, 4.55902099609375, 4.7464599609375, 4.93389892578125, 5.121337890625, 5.30877685546875, 5.4962158203125, 5.68365478515625, 5.87109375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 5.0, 3.0, 2.0, 6.0, 14.0, 5.0, 11.0, 14.0, 16.0, 23.0, 27.0, 27.0, 21.0, 30.0, 34.0, 42.0, 36.0, 44.0, 49.0, 42.0, 53.0, 50.0, 53.0, 36.0, 36.0, 36.0, 30.0, 31.0, 36.0, 31.0, 20.0, 21.0, 17.0, 14.0, 18.0, 12.0, 11.0, 9.0, 6.0, 7.0, 11.0, 5.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0007643699645996094, -0.0007395818829536438, -0.0007147938013076782, -0.0006900057196617126, -0.0006652176380157471, -0.0006404295563697815, -0.0006156414747238159, -0.0005908533930778503, -0.0005660653114318848, -0.0005412772297859192, -0.0005164891481399536, -0.000491701066493988, -0.00046691298484802246, -0.0004421249032020569, -0.0004173368215560913, -0.00039254873991012573, -0.00036776065826416016, -0.0003429725766181946, -0.000318184494972229, -0.00029339641332626343, -0.00026860833168029785, -0.00024382025003433228, -0.0002190321683883667, -0.00019424408674240112, -0.00016945600509643555, -0.00014466792345046997, -0.0001198798418045044, -9.509176015853882e-05, -7.030367851257324e-05, -4.5515596866607666e-05, -2.072751522064209e-05, 4.060566425323486e-06, 2.8848648071289062e-05, 5.363672971725464e-05, 7.842481136322021e-05, 0.00010321289300918579, 0.00012800097465515137, 0.00015278905630111694, 0.00017757713794708252, 0.0002023652195930481, 0.00022715330123901367, 0.00025194138288497925, 0.0002767294645309448, 0.0003015175461769104, 0.000326305627822876, 0.00035109370946884155, 0.00037588179111480713, 0.0004006698727607727, 0.0004254579544067383, 0.00045024603605270386, 0.00047503411769866943, 0.000499822199344635, 0.0005246102809906006, 0.0005493983626365662, 0.0005741864442825317, 0.0005989745259284973, 0.0006237626075744629, 0.0006485506892204285, 0.000673338770866394, 0.0006981268525123596, 0.0007229149341583252, 0.0007477030158042908, 0.0007724910974502563, 0.0007972791790962219, 0.0008220672607421875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 6.0, 8.0, 9.0, 19.0, 20.0, 31.0, 56.0, 87.0, 170.0, 242.0, 379.0, 656.0, 1043.0, 1690.0, 2578.0, 4326.0, 6763.0, 10494.0, 15962.0, 23950.0, 34718.0, 48289.0, 64183.0, 80696.0, 94946.0, 104122.0, 106168.0, 100359.0, 88745.0, 73026.0, 57045.0, 41802.0, 29389.0, 20129.0, 13182.0, 8662.0, 5481.0, 3406.0, 2198.0, 1299.0, 868.0, 515.0, 309.0, 209.0, 119.0, 86.0, 41.0, 28.0, 22.0, 12.0, 11.0, 4.0, 0.0, 4.0, 0.0, 2.0], "bins": [-6.8046875, -6.60614013671875, -6.4075927734375, -6.20904541015625, -6.010498046875, -5.81195068359375, -5.6134033203125, -5.41485595703125, -5.21630859375, -5.01776123046875, -4.8192138671875, -4.62066650390625, -4.422119140625, -4.22357177734375, -4.0250244140625, -3.82647705078125, -3.6279296875, -3.42938232421875, -3.2308349609375, -3.03228759765625, -2.833740234375, -2.63519287109375, -2.4366455078125, -2.23809814453125, -2.03955078125, -1.84100341796875, -1.6424560546875, -1.44390869140625, -1.245361328125, -1.04681396484375, -0.8482666015625, -0.64971923828125, -0.451171875, -0.25262451171875, -0.0540771484375, 0.14447021484375, 0.343017578125, 0.54156494140625, 0.7401123046875, 0.93865966796875, 1.13720703125, 1.33575439453125, 1.5343017578125, 1.73284912109375, 1.931396484375, 2.12994384765625, 2.3284912109375, 2.52703857421875, 2.7255859375, 2.92413330078125, 3.1226806640625, 3.32122802734375, 3.519775390625, 3.71832275390625, 3.9168701171875, 4.11541748046875, 4.31396484375, 4.51251220703125, 4.7110595703125, 4.90960693359375, 5.108154296875, 5.30670166015625, 5.5052490234375, 5.70379638671875, 5.90234375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 7.0, 8.0, 4.0, 7.0, 7.0, 9.0, 14.0, 15.0, 22.0, 17.0, 13.0, 19.0, 19.0, 20.0, 26.0, 28.0, 36.0, 33.0, 45.0, 50.0, 41.0, 46.0, 65.0, 36.0, 46.0, 33.0, 38.0, 32.0, 29.0, 37.0, 25.0, 26.0, 11.0, 21.0, 20.0, 10.0, 15.0, 16.0, 16.0, 10.0, 12.0, 6.0, 2.0, 7.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.77734375, -2.6912841796875, -2.605224609375, -2.5191650390625, -2.43310546875, -2.3470458984375, -2.260986328125, -2.1749267578125, -2.0888671875, -2.0028076171875, -1.916748046875, -1.8306884765625, -1.74462890625, -1.6585693359375, -1.572509765625, -1.4864501953125, -1.400390625, -1.3143310546875, -1.228271484375, -1.1422119140625, -1.05615234375, -0.9700927734375, -0.884033203125, -0.7979736328125, -0.7119140625, -0.6258544921875, -0.539794921875, -0.4537353515625, -0.36767578125, -0.2816162109375, -0.195556640625, -0.1094970703125, -0.0234375, 0.0626220703125, 0.148681640625, 0.2347412109375, 0.32080078125, 0.4068603515625, 0.492919921875, 0.5789794921875, 0.6650390625, 0.7510986328125, 0.837158203125, 0.9232177734375, 1.00927734375, 1.0953369140625, 1.181396484375, 1.2674560546875, 1.353515625, 1.4395751953125, 1.525634765625, 1.6116943359375, 1.69775390625, 1.7838134765625, 1.869873046875, 1.9559326171875, 2.0419921875, 2.1280517578125, 2.214111328125, 2.3001708984375, 2.38623046875, 2.4722900390625, 2.558349609375, 2.6444091796875, 2.73046875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 7.0, 4.0, 6.0, 6.0, 8.0, 21.0, 27.0, 21.0, 26.0, 25.0, 31.0, 38.0, 26.0, 37.0, 40.0, 43.0, 53.0, 49.0, 48.0, 36.0, 53.0, 48.0, 50.0, 46.0, 40.0, 40.0, 30.0, 21.0, 22.0, 17.0, 19.0, 18.0, 13.0, 10.0, 6.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.00973892211914, -33.00271987915039, -31.99570083618164, -30.98868179321289, -29.98166275024414, -28.97464370727539, -27.96762466430664, -26.96060562133789, -25.95358657836914, -24.94656753540039, -23.93954849243164, -22.93252944946289, -21.92551040649414, -20.91849136352539, -19.91147232055664, -18.90445327758789, -17.89743423461914, -16.89041519165039, -15.88339614868164, -14.87637710571289, -13.86935806274414, -12.86233901977539, -11.85531997680664, -10.84830093383789, -9.84128189086914, -8.83426284790039, -7.827243804931641, -6.820224761962891, -5.813205718994141, -4.806186676025391, -3.7991676330566406, -2.7921485900878906, -1.7851276397705078, -0.7781085968017578, 0.2289104461669922, 1.2359294891357422, 2.242948532104492, 3.249967575073242, 4.256986618041992, 5.264005661010742, 6.271024703979492, 7.278043746948242, 8.285062789916992, 9.292081832885742, 10.299100875854492, 11.306119918823242, 12.313138961791992, 13.320158004760742, 14.327177047729492, 15.334196090698242, 16.341215133666992, 17.348234176635742, 18.355253219604492, 19.362272262573242, 20.369291305541992, 21.376310348510742, 22.383329391479492, 23.390348434448242, 24.397367477416992, 25.404386520385742, 26.411405563354492, 27.418424606323242, 28.425443649291992, 29.432462692260742, 30.439481735229492]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 5.0, 9.0, 3.0, 12.0, 5.0, 15.0, 15.0, 13.0, 19.0, 20.0, 27.0, 27.0, 29.0, 26.0, 36.0, 38.0, 38.0, 44.0, 47.0, 36.0, 49.0, 41.0, 49.0, 51.0, 42.0, 38.0, 38.0, 31.0, 33.0, 25.0, 27.0, 18.0, 15.0, 14.0, 15.0, 12.0, 16.0, 7.0, 5.0, 4.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-35.078758239746094, -33.99924087524414, -32.91972351074219, -31.84020233154297, -30.760684967041016, -29.681167602539062, -28.601648330688477, -27.52212905883789, -26.442611694335938, -25.363094329833984, -24.2835750579834, -23.204055786132812, -22.12453842163086, -21.045021057128906, -19.96550178527832, -18.885982513427734, -17.80646514892578, -16.726947784423828, -15.647428512573242, -14.567910194396973, -13.488391876220703, -12.408873558044434, -11.329355239868164, -10.249836921691895, -9.170318603515625, -8.090800285339355, -7.011281967163086, -5.931763648986816, -4.852245330810547, -3.7727270126342773, -2.693208694458008, -1.6136903762817383, -0.5341758728027344, 0.5453424453735352, 1.6248607635498047, 2.704379081726074, 3.7838973999023438, 4.863415718078613, 5.942934036254883, 7.022452354431152, 8.101970672607422, 9.181488990783691, 10.261007308959961, 11.34052562713623, 12.4200439453125, 13.49956226348877, 14.579080581665039, 15.658598899841309, 16.738117218017578, 17.81763458251953, 18.897153854370117, 19.976673126220703, 21.056190490722656, 22.13570785522461, 23.215227127075195, 24.29474639892578, 25.374263763427734, 26.453781127929688, 27.533300399780273, 28.61281967163086, 29.692337036132812, 30.771854400634766, 31.85137367248535, 32.93089294433594, 34.01041030883789]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [4.0, 4.0, 4.0, 6.0, 9.0, 13.0, 32.0, 54.0, 60.0, 110.0, 174.0, 307.0, 497.0, 725.0, 1202.0, 1936.0, 3138.0, 4779.0, 7441.0, 11435.0, 17490.0, 27008.0, 40591.0, 60231.0, 88018.0, 125173.0, 172733.0, 229529.0, 291424.0, 348141.0, 393263.0, 412416.0, 403051.0, 365763.0, 310372.0, 248143.0, 189923.0, 139491.0, 98387.0, 68084.0, 46121.0, 30528.0, 20287.0, 13202.0, 8476.0, 5397.0, 3470.0, 2126.0, 1303.0, 852.0, 517.0, 337.0, 201.0, 119.0, 82.0, 47.0, 31.0, 16.0, 15.0, 3.0, 5.0, 1.0, 4.0, 3.0], "bins": [-18.6875, -18.09716796875, -17.5068359375, -16.91650390625, -16.326171875, -15.73583984375, -15.1455078125, -14.55517578125, -13.96484375, -13.37451171875, -12.7841796875, -12.19384765625, -11.603515625, -11.01318359375, -10.4228515625, -9.83251953125, -9.2421875, -8.65185546875, -8.0615234375, -7.47119140625, -6.880859375, -6.29052734375, -5.7001953125, -5.10986328125, -4.51953125, -3.92919921875, -3.3388671875, -2.74853515625, -2.158203125, -1.56787109375, -0.9775390625, -0.38720703125, 0.203125, 0.79345703125, 1.3837890625, 1.97412109375, 2.564453125, 3.15478515625, 3.7451171875, 4.33544921875, 4.92578125, 5.51611328125, 6.1064453125, 6.69677734375, 7.287109375, 7.87744140625, 8.4677734375, 9.05810546875, 9.6484375, 10.23876953125, 10.8291015625, 11.41943359375, 12.009765625, 12.60009765625, 13.1904296875, 13.78076171875, 14.37109375, 14.96142578125, 15.5517578125, 16.14208984375, 16.732421875, 17.32275390625, 17.9130859375, 18.50341796875, 19.09375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 8.0, 2.0, 11.0, 7.0, 14.0, 16.0, 14.0, 17.0, 19.0, 26.0, 29.0, 26.0, 30.0, 32.0, 40.0, 35.0, 48.0, 38.0, 46.0, 40.0, 43.0, 50.0, 57.0, 37.0, 33.0, 40.0, 35.0, 33.0, 29.0, 29.0, 13.0, 16.0, 17.0, 12.0, 15.0, 11.0, 8.0, 7.0, 3.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.96875, -28.0791015625, -27.189453125, -26.2998046875, -25.41015625, -24.5205078125, -23.630859375, -22.7412109375, -21.8515625, -20.9619140625, -20.072265625, -19.1826171875, -18.29296875, -17.4033203125, -16.513671875, -15.6240234375, -14.734375, -13.8447265625, -12.955078125, -12.0654296875, -11.17578125, -10.2861328125, -9.396484375, -8.5068359375, -7.6171875, -6.7275390625, -5.837890625, -4.9482421875, -4.05859375, -3.1689453125, -2.279296875, -1.3896484375, -0.5, 0.3896484375, 1.279296875, 2.1689453125, 3.05859375, 3.9482421875, 4.837890625, 5.7275390625, 6.6171875, 7.5068359375, 8.396484375, 9.2861328125, 10.17578125, 11.0654296875, 11.955078125, 12.8447265625, 13.734375, 14.6240234375, 15.513671875, 16.4033203125, 17.29296875, 18.1826171875, 19.072265625, 19.9619140625, 20.8515625, 21.7412109375, 22.630859375, 23.5205078125, 24.41015625, 25.2998046875, 26.189453125, 27.0791015625, 27.96875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 7.0, 12.0, 11.0, 20.0, 38.0, 59.0, 106.0, 187.0, 284.0, 441.0, 785.0, 1274.0, 2100.0, 3513.0, 5644.0, 9132.0, 14367.0, 22137.0, 33526.0, 50264.0, 73135.0, 103312.0, 140963.0, 184990.0, 234650.0, 283578.0, 328631.0, 358362.0, 371410.0, 364286.0, 339574.0, 299538.0, 250954.0, 201603.0, 154409.0, 113955.0, 81890.0, 57109.0, 38622.0, 25347.0, 16558.0, 10502.0, 6654.0, 4069.0, 2478.0, 1467.0, 912.0, 576.0, 333.0, 200.0, 135.0, 70.0, 51.0, 27.0, 22.0, 7.0, 3.0, 4.0, 0.0, 3.0], "bins": [-18.890625, -18.312255859375, -17.73388671875, -17.155517578125, -16.5771484375, -15.998779296875, -15.42041015625, -14.842041015625, -14.263671875, -13.685302734375, -13.10693359375, -12.528564453125, -11.9501953125, -11.371826171875, -10.79345703125, -10.215087890625, -9.63671875, -9.058349609375, -8.47998046875, -7.901611328125, -7.3232421875, -6.744873046875, -6.16650390625, -5.588134765625, -5.009765625, -4.431396484375, -3.85302734375, -3.274658203125, -2.6962890625, -2.117919921875, -1.53955078125, -0.961181640625, -0.3828125, 0.195556640625, 0.77392578125, 1.352294921875, 1.9306640625, 2.509033203125, 3.08740234375, 3.665771484375, 4.244140625, 4.822509765625, 5.40087890625, 5.979248046875, 6.5576171875, 7.135986328125, 7.71435546875, 8.292724609375, 8.87109375, 9.449462890625, 10.02783203125, 10.606201171875, 11.1845703125, 11.762939453125, 12.34130859375, 12.919677734375, 13.498046875, 14.076416015625, 14.65478515625, 15.233154296875, 15.8115234375, 16.389892578125, 16.96826171875, 17.546630859375, 18.125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 8.0, 5.0, 11.0, 8.0, 12.0, 15.0, 20.0, 27.0, 30.0, 47.0, 52.0, 71.0, 65.0, 85.0, 95.0, 103.0, 122.0, 139.0, 162.0, 170.0, 183.0, 188.0, 189.0, 186.0, 203.0, 222.0, 201.0, 174.0, 169.0, 162.0, 127.0, 129.0, 118.0, 95.0, 86.0, 70.0, 75.0, 49.0, 44.0, 40.0, 20.0, 25.0, 17.0, 14.0, 11.0, 4.0, 7.0, 11.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-11.21875, -10.8544921875, -10.490234375, -10.1259765625, -9.76171875, -9.3974609375, -9.033203125, -8.6689453125, -8.3046875, -7.9404296875, -7.576171875, -7.2119140625, -6.84765625, -6.4833984375, -6.119140625, -5.7548828125, -5.390625, -5.0263671875, -4.662109375, -4.2978515625, -3.93359375, -3.5693359375, -3.205078125, -2.8408203125, -2.4765625, -2.1123046875, -1.748046875, -1.3837890625, -1.01953125, -0.6552734375, -0.291015625, 0.0732421875, 0.4375, 0.8017578125, 1.166015625, 1.5302734375, 1.89453125, 2.2587890625, 2.623046875, 2.9873046875, 3.3515625, 3.7158203125, 4.080078125, 4.4443359375, 4.80859375, 5.1728515625, 5.537109375, 5.9013671875, 6.265625, 6.6298828125, 6.994140625, 7.3583984375, 7.72265625, 8.0869140625, 8.451171875, 8.8154296875, 9.1796875, 9.5439453125, 9.908203125, 10.2724609375, 10.63671875, 11.0009765625, 11.365234375, 11.7294921875, 12.09375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 6.0, 3.0, 9.0, 11.0, 10.0, 9.0, 14.0, 21.0, 21.0, 33.0, 22.0, 28.0, 20.0, 42.0, 36.0, 35.0, 45.0, 49.0, 45.0, 53.0, 52.0, 45.0, 51.0, 33.0, 46.0, 45.0, 33.0, 31.0, 35.0, 13.0, 20.0, 13.0, 19.0, 14.0, 13.0, 6.0, 7.0, 3.0, 2.0, 8.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.720937728881836, -26.782974243164062, -25.845012664794922, -24.90704917907715, -23.969085693359375, -23.031124114990234, -22.09316062927246, -21.155197143554688, -20.217235565185547, -19.279272079467773, -18.341310501098633, -17.40334701538086, -16.465383529663086, -15.527420997619629, -14.589458465576172, -13.651494979858398, -12.713531494140625, -11.775568962097168, -10.837605476379395, -9.899642944335938, -8.961679458618164, -8.023716926574707, -7.08575439453125, -6.147791385650635, -5.2098283767700195, -4.271865367889404, -3.333902597427368, -2.395939826965332, -1.4579768180847168, -0.5200138092041016, 0.41794872283935547, 1.3559117317199707, 2.293872833251953, 3.2318358421325684, 4.169798851013184, 5.107761383056641, 6.045724391937256, 6.983687400817871, 7.921649932861328, 8.859613418579102, 9.797575950622559, 10.735538482666016, 11.673501968383789, 12.611464500427246, 13.549427032470703, 14.487390518188477, 15.425353050231934, 16.36331558227539, 17.301279067993164, 18.239242553710938, 19.177204132080078, 20.11516761779785, 21.053131103515625, 21.991092681884766, 22.92905616760254, 23.867019653320312, 24.804981231689453, 25.742944717407227, 26.680906295776367, 27.61886978149414, 28.556833267211914, 29.494796752929688, 30.432758331298828, 31.3707218170166, 32.308685302734375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 8.0, 3.0, 7.0, 6.0, 12.0, 20.0, 14.0, 16.0, 21.0, 18.0, 23.0, 21.0, 25.0, 18.0, 36.0, 50.0, 35.0, 37.0, 39.0, 40.0, 35.0, 50.0, 60.0, 45.0, 40.0, 39.0, 30.0, 29.0, 35.0, 33.0, 28.0, 23.0, 15.0, 15.0, 16.0, 18.0, 9.0, 9.0, 7.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-35.87775802612305, -34.811649322509766, -33.74553680419922, -32.67942810058594, -31.613317489624023, -30.54720687866211, -29.481098175048828, -28.414987564086914, -27.348876953125, -26.282766342163086, -25.216655731201172, -24.15054702758789, -23.084436416625977, -22.018325805664062, -20.95221710205078, -19.886106491088867, -18.819995880126953, -17.75388526916504, -16.687774658203125, -15.621665954589844, -14.55555534362793, -13.489444732666016, -12.423335075378418, -11.35722541809082, -10.291114807128906, -9.225004196166992, -8.158894538879395, -7.092784404754639, -6.026674270629883, -4.960564136505127, -3.894454002380371, -2.8283438682556152, -1.762237548828125, -0.6961274147033691, 0.3699827194213867, 1.4360928535461426, 2.5022029876708984, 3.5683131217956543, 4.63442325592041, 5.700533390045166, 6.766643524169922, 7.832753658294678, 8.898863792419434, 9.964973449707031, 11.031084060668945, 12.09719467163086, 13.163304328918457, 14.229413986206055, 15.295524597167969, 16.361635208129883, 17.427745819091797, 18.493854522705078, 19.559965133666992, 20.626075744628906, 21.692184448242188, 22.7582950592041, 23.824405670166016, 24.89051628112793, 25.956626892089844, 27.022735595703125, 28.08884620666504, 29.154956817626953, 30.221065521240234, 31.28717613220215, 32.35328674316406]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 8.0, 18.0, 23.0, 29.0, 49.0, 71.0, 117.0, 130.0, 152.0, 247.0, 345.0, 485.0, 743.0, 1067.0, 1503.0, 2293.0, 3380.0, 5297.0, 8345.0, 13388.0, 22767.0, 40809.0, 73486.0, 134892.0, 218203.0, 216293.0, 133081.0, 72052.0, 39352.0, 22818.0, 13222.0, 8186.0, 5216.0, 3399.0, 2174.0, 1507.0, 1023.0, 700.0, 489.0, 347.0, 230.0, 206.0, 125.0, 86.0, 61.0, 60.0, 31.0, 15.0, 17.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.71875, -15.227294921875, -14.73583984375, -14.244384765625, -13.7529296875, -13.261474609375, -12.77001953125, -12.278564453125, -11.787109375, -11.295654296875, -10.80419921875, -10.312744140625, -9.8212890625, -9.329833984375, -8.83837890625, -8.346923828125, -7.85546875, -7.364013671875, -6.87255859375, -6.381103515625, -5.8896484375, -5.398193359375, -4.90673828125, -4.415283203125, -3.923828125, -3.432373046875, -2.94091796875, -2.449462890625, -1.9580078125, -1.466552734375, -0.97509765625, -0.483642578125, 0.0078125, 0.499267578125, 0.99072265625, 1.482177734375, 1.9736328125, 2.465087890625, 2.95654296875, 3.447998046875, 3.939453125, 4.430908203125, 4.92236328125, 5.413818359375, 5.9052734375, 6.396728515625, 6.88818359375, 7.379638671875, 7.87109375, 8.362548828125, 8.85400390625, 9.345458984375, 9.8369140625, 10.328369140625, 10.81982421875, 11.311279296875, 11.802734375, 12.294189453125, 12.78564453125, 13.277099609375, 13.7685546875, 14.260009765625, 14.75146484375, 15.242919921875, 15.734375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 8.0, 3.0, 5.0, 9.0, 13.0, 16.0, 13.0, 19.0, 20.0, 18.0, 25.0, 19.0, 26.0, 17.0, 38.0, 48.0, 37.0, 33.0, 44.0, 38.0, 33.0, 49.0, 64.0, 42.0, 41.0, 39.0, 28.0, 34.0, 33.0, 29.0, 32.0, 23.0, 13.0, 18.0, 16.0, 16.0, 9.0, 10.0, 7.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.90625, -34.84375, -33.78125, -32.71875, -31.65625, -30.59375, -29.53125, -28.46875, -27.40625, -26.34375, -25.28125, -24.21875, -23.15625, -22.09375, -21.03125, -19.96875, -18.90625, -17.84375, -16.78125, -15.71875, -14.65625, -13.59375, -12.53125, -11.46875, -10.40625, -9.34375, -8.28125, -7.21875, -6.15625, -5.09375, -4.03125, -2.96875, -1.90625, -0.84375, 0.21875, 1.28125, 2.34375, 3.40625, 4.46875, 5.53125, 6.59375, 7.65625, 8.71875, 9.78125, 10.84375, 11.90625, 12.96875, 14.03125, 15.09375, 16.15625, 17.21875, 18.28125, 19.34375, 20.40625, 21.46875, 22.53125, 23.59375, 24.65625, 25.71875, 26.78125, 27.84375, 28.90625, 29.96875, 31.03125, 32.09375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 6.0, 10.0, 17.0, 21.0, 36.0, 48.0, 63.0, 94.0, 88.0, 155.0, 210.0, 267.0, 410.0, 566.0, 925.0, 1494.0, 2458.0, 4293.0, 7998.0, 16067.0, 37714.0, 109062.0, 357736.0, 337165.0, 101517.0, 35869.0, 15605.0, 7679.0, 4109.0, 2366.0, 1459.0, 899.0, 632.0, 422.0, 319.0, 233.0, 155.0, 104.0, 86.0, 57.0, 44.0, 25.0, 26.0, 13.0, 10.0, 5.0, 5.0, 2.0, 8.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-19.65625, -19.06005859375, -18.4638671875, -17.86767578125, -17.271484375, -16.67529296875, -16.0791015625, -15.48291015625, -14.88671875, -14.29052734375, -13.6943359375, -13.09814453125, -12.501953125, -11.90576171875, -11.3095703125, -10.71337890625, -10.1171875, -9.52099609375, -8.9248046875, -8.32861328125, -7.732421875, -7.13623046875, -6.5400390625, -5.94384765625, -5.34765625, -4.75146484375, -4.1552734375, -3.55908203125, -2.962890625, -2.36669921875, -1.7705078125, -1.17431640625, -0.578125, 0.01806640625, 0.6142578125, 1.21044921875, 1.806640625, 2.40283203125, 2.9990234375, 3.59521484375, 4.19140625, 4.78759765625, 5.3837890625, 5.97998046875, 6.576171875, 7.17236328125, 7.7685546875, 8.36474609375, 8.9609375, 9.55712890625, 10.1533203125, 10.74951171875, 11.345703125, 11.94189453125, 12.5380859375, 13.13427734375, 13.73046875, 14.32666015625, 14.9228515625, 15.51904296875, 16.115234375, 16.71142578125, 17.3076171875, 17.90380859375, 18.5]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 2.0, 3.0, 4.0, 3.0, 6.0, 9.0, 10.0, 17.0, 19.0, 11.0, 15.0, 22.0, 22.0, 28.0, 26.0, 30.0, 36.0, 30.0, 39.0, 31.0, 27.0, 45.0, 56.0, 44.0, 36.0, 33.0, 33.0, 28.0, 44.0, 33.0, 27.0, 25.0, 25.0, 18.0, 24.0, 22.0, 22.0, 15.0, 14.0, 10.0, 9.0, 9.0, 5.0, 4.0, 3.0, 7.0, 11.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-21.109375, -20.427001953125, -19.74462890625, -19.062255859375, -18.3798828125, -17.697509765625, -17.01513671875, -16.332763671875, -15.650390625, -14.968017578125, -14.28564453125, -13.603271484375, -12.9208984375, -12.238525390625, -11.55615234375, -10.873779296875, -10.19140625, -9.509033203125, -8.82666015625, -8.144287109375, -7.4619140625, -6.779541015625, -6.09716796875, -5.414794921875, -4.732421875, -4.050048828125, -3.36767578125, -2.685302734375, -2.0029296875, -1.320556640625, -0.63818359375, 0.044189453125, 0.7265625, 1.408935546875, 2.09130859375, 2.773681640625, 3.4560546875, 4.138427734375, 4.82080078125, 5.503173828125, 6.185546875, 6.867919921875, 7.55029296875, 8.232666015625, 8.9150390625, 9.597412109375, 10.27978515625, 10.962158203125, 11.64453125, 12.326904296875, 13.00927734375, 13.691650390625, 14.3740234375, 15.056396484375, 15.73876953125, 16.421142578125, 17.103515625, 17.785888671875, 18.46826171875, 19.150634765625, 19.8330078125, 20.515380859375, 21.19775390625, 21.880126953125, 22.5625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 4.0, 2.0, 4.0, 3.0, 11.0, 13.0, 9.0, 29.0, 37.0, 58.0, 92.0, 125.0, 181.0, 328.0, 555.0, 1099.0, 2369.0, 5645.0, 17061.0, 81225.0, 774723.0, 129503.0, 22472.0, 7021.0, 2911.0, 1395.0, 710.0, 359.0, 196.0, 124.0, 91.0, 56.0, 39.0, 31.0, 14.0, 12.0, 14.0, 11.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-27.34375, -26.420166015625, -25.49658203125, -24.572998046875, -23.6494140625, -22.725830078125, -21.80224609375, -20.878662109375, -19.955078125, -19.031494140625, -18.10791015625, -17.184326171875, -16.2607421875, -15.337158203125, -14.41357421875, -13.489990234375, -12.56640625, -11.642822265625, -10.71923828125, -9.795654296875, -8.8720703125, -7.948486328125, -7.02490234375, -6.101318359375, -5.177734375, -4.254150390625, -3.33056640625, -2.406982421875, -1.4833984375, -0.559814453125, 0.36376953125, 1.287353515625, 2.2109375, 3.134521484375, 4.05810546875, 4.981689453125, 5.9052734375, 6.828857421875, 7.75244140625, 8.676025390625, 9.599609375, 10.523193359375, 11.44677734375, 12.370361328125, 13.2939453125, 14.217529296875, 15.14111328125, 16.064697265625, 16.98828125, 17.911865234375, 18.83544921875, 19.759033203125, 20.6826171875, 21.606201171875, 22.52978515625, 23.453369140625, 24.376953125, 25.300537109375, 26.22412109375, 27.147705078125, 28.0712890625, 28.994873046875, 29.91845703125, 30.842041015625, 31.765625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 5.0, 7.0, 2.0, 7.0, 3.0, 8.0, 10.0, 19.0, 13.0, 20.0, 21.0, 37.0, 44.0, 84.0, 89.0, 114.0, 106.0, 79.0, 78.0, 54.0, 31.0, 32.0, 27.0, 16.0, 7.0, 9.0, 14.0, 13.0, 12.0, 8.0, 4.0, 4.0, 8.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014438629150390625, -0.0013903379440307617, -0.001336812973022461, -0.0012832880020141602, -0.0012297630310058594, -0.0011762380599975586, -0.0011227130889892578, -0.001069188117980957, -0.0010156631469726562, -0.0009621381759643555, -0.0009086132049560547, -0.0008550882339477539, -0.0008015632629394531, -0.0007480382919311523, -0.0006945133209228516, -0.0006409883499145508, -0.00058746337890625, -0.0005339384078979492, -0.00048041343688964844, -0.00042688846588134766, -0.0003733634948730469, -0.0003198385238647461, -0.0002663135528564453, -0.00021278858184814453, -0.00015926361083984375, -0.00010573863983154297, -5.221366882324219e-05, 1.3113021850585938e-06, 5.4836273193359375e-05, 0.00010836124420166016, 0.00016188621520996094, 0.00021541118621826172, 0.0002689361572265625, 0.0003224611282348633, 0.00037598609924316406, 0.00042951107025146484, 0.0004830360412597656, 0.0005365610122680664, 0.0005900859832763672, 0.000643610954284668, 0.0006971359252929688, 0.0007506608963012695, 0.0008041858673095703, 0.0008577108383178711, 0.0009112358093261719, 0.0009647607803344727, 0.0010182857513427734, 0.0010718107223510742, 0.001125335693359375, 0.0011788606643676758, 0.0012323856353759766, 0.0012859106063842773, 0.0013394355773925781, 0.001392960548400879, 0.0014464855194091797, 0.0015000104904174805, 0.0015535354614257812, 0.001607060432434082, 0.0016605854034423828, 0.0017141103744506836, 0.0017676353454589844, 0.0018211603164672852, 0.001874685287475586, 0.0019282102584838867, 0.0019817352294921875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 3.0, 7.0, 7.0, 9.0, 8.0, 12.0, 14.0, 14.0, 14.0, 31.0, 36.0, 52.0, 74.0, 97.0, 144.0, 202.0, 258.0, 384.0, 583.0, 836.0, 1296.0, 1825.0, 2645.0, 4300.0, 6866.0, 11932.0, 21765.0, 45192.0, 111620.0, 307512.0, 314733.0, 115521.0, 45858.0, 22455.0, 12209.0, 7032.0, 4282.0, 2744.0, 1879.0, 1218.0, 855.0, 586.0, 422.0, 306.0, 181.0, 169.0, 102.0, 76.0, 60.0, 43.0, 38.0, 16.0, 12.0, 13.0, 2.0, 8.0, 5.0, 4.0, 0.0, 2.0], "bins": [-16.28125, -15.8026123046875, -15.323974609375, -14.8453369140625, -14.36669921875, -13.8880615234375, -13.409423828125, -12.9307861328125, -12.4521484375, -11.9735107421875, -11.494873046875, -11.0162353515625, -10.53759765625, -10.0589599609375, -9.580322265625, -9.1016845703125, -8.623046875, -8.1444091796875, -7.665771484375, -7.1871337890625, -6.70849609375, -6.2298583984375, -5.751220703125, -5.2725830078125, -4.7939453125, -4.3153076171875, -3.836669921875, -3.3580322265625, -2.87939453125, -2.4007568359375, -1.922119140625, -1.4434814453125, -0.96484375, -0.4862060546875, -0.007568359375, 0.4710693359375, 0.94970703125, 1.4283447265625, 1.906982421875, 2.3856201171875, 2.8642578125, 3.3428955078125, 3.821533203125, 4.3001708984375, 4.77880859375, 5.2574462890625, 5.736083984375, 6.2147216796875, 6.693359375, 7.1719970703125, 7.650634765625, 8.1292724609375, 8.60791015625, 9.0865478515625, 9.565185546875, 10.0438232421875, 10.5224609375, 11.0010986328125, 11.479736328125, 11.9583740234375, 12.43701171875, 12.9156494140625, 13.394287109375, 13.8729248046875, 14.3515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 1.0, 8.0, 5.0, 13.0, 8.0, 11.0, 17.0, 44.0, 39.0, 84.0, 94.0, 116.0, 117.0, 115.0, 104.0, 60.0, 44.0, 38.0, 25.0, 17.0, 8.0, 4.0, 10.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.04296875, -4.82904052734375, -4.6151123046875, -4.40118408203125, -4.187255859375, -3.97332763671875, -3.7593994140625, -3.54547119140625, -3.33154296875, -3.11761474609375, -2.9036865234375, -2.68975830078125, -2.475830078125, -2.26190185546875, -2.0479736328125, -1.83404541015625, -1.6201171875, -1.40618896484375, -1.1922607421875, -0.97833251953125, -0.764404296875, -0.55047607421875, -0.3365478515625, -0.12261962890625, 0.09130859375, 0.30523681640625, 0.5191650390625, 0.73309326171875, 0.947021484375, 1.16094970703125, 1.3748779296875, 1.58880615234375, 1.802734375, 2.01666259765625, 2.2305908203125, 2.44451904296875, 2.658447265625, 2.87237548828125, 3.0863037109375, 3.30023193359375, 3.51416015625, 3.72808837890625, 3.9420166015625, 4.15594482421875, 4.369873046875, 4.58380126953125, 4.7977294921875, 5.01165771484375, 5.2255859375, 5.43951416015625, 5.6534423828125, 5.86737060546875, 6.081298828125, 6.29522705078125, 6.5091552734375, 6.72308349609375, 6.93701171875, 7.15093994140625, 7.3648681640625, 7.57879638671875, 7.792724609375, 8.00665283203125, 8.2205810546875, 8.43450927734375, 8.6484375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 11.0, 3.0, 9.0, 7.0, 16.0, 10.0, 19.0, 19.0, 18.0, 26.0, 28.0, 29.0, 29.0, 33.0, 32.0, 39.0, 46.0, 51.0, 51.0, 51.0, 48.0, 36.0, 51.0, 44.0, 48.0, 44.0, 28.0, 30.0, 21.0, 14.0, 23.0, 19.0, 10.0, 13.0, 15.0, 2.0, 12.0, 6.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.0669002532959, -25.13973617553711, -24.21257209777832, -23.28540802001953, -22.358243942260742, -21.431079864501953, -20.503915786743164, -19.576751708984375, -18.649587631225586, -17.722423553466797, -16.795259475708008, -15.868095397949219, -14.94093132019043, -14.01376724243164, -13.086603164672852, -12.159439086914062, -11.232275009155273, -10.305110931396484, -9.377946853637695, -8.450782775878906, -7.523618698120117, -6.596454620361328, -5.669290542602539, -4.74212646484375, -3.814962387084961, -2.887798309326172, -1.9606342315673828, -1.0334701538085938, -0.10630607604980469, 0.8208580017089844, 1.7480220794677734, 2.6751861572265625, 3.6023483276367188, 4.529512405395508, 5.456676483154297, 6.383840560913086, 7.311004638671875, 8.238168716430664, 9.165332794189453, 10.092496871948242, 11.019660949707031, 11.94682502746582, 12.87398910522461, 13.801153182983398, 14.728317260742188, 15.655481338500977, 16.582645416259766, 17.509809494018555, 18.436973571777344, 19.364137649536133, 20.291301727294922, 21.21846580505371, 22.1456298828125, 23.07279396057129, 23.999958038330078, 24.927122116088867, 25.854286193847656, 26.781450271606445, 27.708614349365234, 28.635778427124023, 29.562942504882812, 30.4901065826416, 31.41727066040039, 32.34443664550781, 33.27159881591797]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 7.0, 6.0, 3.0, 10.0, 16.0, 17.0, 18.0, 15.0, 16.0, 25.0, 21.0, 19.0, 31.0, 21.0, 37.0, 48.0, 40.0, 40.0, 39.0, 32.0, 35.0, 54.0, 58.0, 41.0, 39.0, 39.0, 39.0, 22.0, 32.0, 31.0, 21.0, 22.0, 19.0, 13.0, 17.0, 15.0, 9.0, 10.0, 4.0, 5.0, 10.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-35.96949005126953, -34.92582321166992, -33.88215637207031, -32.8384895324707, -31.794822692871094, -30.751155853271484, -29.707489013671875, -28.663822174072266, -27.620155334472656, -26.576488494873047, -25.532821655273438, -24.489154815673828, -23.44548797607422, -22.40182113647461, -21.358154296875, -20.31448745727539, -19.27082061767578, -18.227153778076172, -17.183486938476562, -16.139820098876953, -15.096153259277344, -14.052486419677734, -13.008819580078125, -11.965152740478516, -10.921485900878906, -9.877819061279297, -8.834152221679688, -7.790485382080078, -6.746818542480469, -5.703151702880859, -4.65948486328125, -3.6158180236816406, -2.572154998779297, -1.5284881591796875, -0.4848213195800781, 0.5588455200195312, 1.6025123596191406, 2.64617919921875, 3.6898460388183594, 4.733512878417969, 5.777179718017578, 6.8208465576171875, 7.864513397216797, 8.908180236816406, 9.951847076416016, 10.995513916015625, 12.039180755615234, 13.082847595214844, 14.126514434814453, 15.170181274414062, 16.213848114013672, 17.25751495361328, 18.30118179321289, 19.3448486328125, 20.38851547241211, 21.43218231201172, 22.475849151611328, 23.519515991210938, 24.563182830810547, 25.606849670410156, 26.650516510009766, 27.694183349609375, 28.737850189208984, 29.781517028808594, 30.825183868408203]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 16.0, 9.0, 32.0, 36.0, 84.0, 125.0, 213.0, 360.0, 547.0, 822.0, 1378.0, 2191.0, 3355.0, 5320.0, 8102.0, 12024.0, 18077.0, 25895.0, 35914.0, 48836.0, 62687.0, 77572.0, 89858.0, 98392.0, 99691.0, 95926.0, 85968.0, 72783.0, 57897.0, 43957.0, 32266.0, 22760.0, 15821.0, 10293.0, 7033.0, 4512.0, 2895.0, 1787.0, 1176.0, 712.0, 482.0, 302.0, 176.0, 122.0, 68.0, 40.0, 21.0, 11.0, 9.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.515625, -17.905029296875, -17.29443359375, -16.683837890625, -16.0732421875, -15.462646484375, -14.85205078125, -14.241455078125, -13.630859375, -13.020263671875, -12.40966796875, -11.799072265625, -11.1884765625, -10.577880859375, -9.96728515625, -9.356689453125, -8.74609375, -8.135498046875, -7.52490234375, -6.914306640625, -6.3037109375, -5.693115234375, -5.08251953125, -4.471923828125, -3.861328125, -3.250732421875, -2.64013671875, -2.029541015625, -1.4189453125, -0.808349609375, -0.19775390625, 0.412841796875, 1.0234375, 1.634033203125, 2.24462890625, 2.855224609375, 3.4658203125, 4.076416015625, 4.68701171875, 5.297607421875, 5.908203125, 6.518798828125, 7.12939453125, 7.739990234375, 8.3505859375, 8.961181640625, 9.57177734375, 10.182373046875, 10.79296875, 11.403564453125, 12.01416015625, 12.624755859375, 13.2353515625, 13.845947265625, 14.45654296875, 15.067138671875, 15.677734375, 16.288330078125, 16.89892578125, 17.509521484375, 18.1201171875, 18.730712890625, 19.34130859375, 19.951904296875, 20.5625]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 5.0, 11.0, 17.0, 18.0, 15.0, 15.0, 16.0, 27.0, 20.0, 23.0, 28.0, 26.0, 38.0, 45.0, 37.0, 43.0, 39.0, 29.0, 44.0, 53.0, 54.0, 40.0, 37.0, 41.0, 38.0, 14.0, 39.0, 28.0, 23.0, 23.0, 15.0, 13.0, 18.0, 12.0, 11.0, 8.0, 5.0, 5.0, 9.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-34.4375, -33.4296875, -32.421875, -31.4140625, -30.40625, -29.3984375, -28.390625, -27.3828125, -26.375, -25.3671875, -24.359375, -23.3515625, -22.34375, -21.3359375, -20.328125, -19.3203125, -18.3125, -17.3046875, -16.296875, -15.2890625, -14.28125, -13.2734375, -12.265625, -11.2578125, -10.25, -9.2421875, -8.234375, -7.2265625, -6.21875, -5.2109375, -4.203125, -3.1953125, -2.1875, -1.1796875, -0.171875, 0.8359375, 1.84375, 2.8515625, 3.859375, 4.8671875, 5.875, 6.8828125, 7.890625, 8.8984375, 9.90625, 10.9140625, 11.921875, 12.9296875, 13.9375, 14.9453125, 15.953125, 16.9609375, 17.96875, 18.9765625, 19.984375, 20.9921875, 22.0, 23.0078125, 24.015625, 25.0234375, 26.03125, 27.0390625, 28.046875, 29.0546875, 30.0625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 3.0, 7.0, 10.0, 10.0, 14.0, 21.0, 31.0, 54.0, 77.0, 137.0, 217.0, 328.0, 489.0, 804.0, 1284.0, 1916.0, 3066.0, 4594.0, 7357.0, 10789.0, 16323.0, 24186.0, 34338.0, 47484.0, 63155.0, 79886.0, 94340.0, 104237.0, 106012.0, 100631.0, 88551.0, 72129.0, 56391.0, 41399.0, 29089.0, 20339.0, 13477.0, 8972.0, 5836.0, 3771.0, 2443.0, 1598.0, 997.0, 650.0, 417.0, 273.0, 163.0, 98.0, 65.0, 35.0, 29.0, 13.0, 9.0, 10.0, 8.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.078125, -21.3720703125, -20.666015625, -19.9599609375, -19.25390625, -18.5478515625, -17.841796875, -17.1357421875, -16.4296875, -15.7236328125, -15.017578125, -14.3115234375, -13.60546875, -12.8994140625, -12.193359375, -11.4873046875, -10.78125, -10.0751953125, -9.369140625, -8.6630859375, -7.95703125, -7.2509765625, -6.544921875, -5.8388671875, -5.1328125, -4.4267578125, -3.720703125, -3.0146484375, -2.30859375, -1.6025390625, -0.896484375, -0.1904296875, 0.515625, 1.2216796875, 1.927734375, 2.6337890625, 3.33984375, 4.0458984375, 4.751953125, 5.4580078125, 6.1640625, 6.8701171875, 7.576171875, 8.2822265625, 8.98828125, 9.6943359375, 10.400390625, 11.1064453125, 11.8125, 12.5185546875, 13.224609375, 13.9306640625, 14.63671875, 15.3427734375, 16.048828125, 16.7548828125, 17.4609375, 18.1669921875, 18.873046875, 19.5791015625, 20.28515625, 20.9912109375, 21.697265625, 22.4033203125, 23.109375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 5.0, 9.0, 6.0, 9.0, 7.0, 12.0, 16.0, 14.0, 20.0, 21.0, 23.0, 28.0, 27.0, 41.0, 39.0, 30.0, 35.0, 41.0, 39.0, 43.0, 47.0, 37.0, 40.0, 41.0, 34.0, 38.0, 50.0, 27.0, 31.0, 32.0, 21.0, 17.0, 22.0, 16.0, 10.0, 15.0, 15.0, 5.0, 7.0, 9.0, 8.0, 3.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-23.71875, -23.041748046875, -22.36474609375, -21.687744140625, -21.0107421875, -20.333740234375, -19.65673828125, -18.979736328125, -18.302734375, -17.625732421875, -16.94873046875, -16.271728515625, -15.5947265625, -14.917724609375, -14.24072265625, -13.563720703125, -12.88671875, -12.209716796875, -11.53271484375, -10.855712890625, -10.1787109375, -9.501708984375, -8.82470703125, -8.147705078125, -7.470703125, -6.793701171875, -6.11669921875, -5.439697265625, -4.7626953125, -4.085693359375, -3.40869140625, -2.731689453125, -2.0546875, -1.377685546875, -0.70068359375, -0.023681640625, 0.6533203125, 1.330322265625, 2.00732421875, 2.684326171875, 3.361328125, 4.038330078125, 4.71533203125, 5.392333984375, 6.0693359375, 6.746337890625, 7.42333984375, 8.100341796875, 8.77734375, 9.454345703125, 10.13134765625, 10.808349609375, 11.4853515625, 12.162353515625, 12.83935546875, 13.516357421875, 14.193359375, 14.870361328125, 15.54736328125, 16.224365234375, 16.9013671875, 17.578369140625, 18.25537109375, 18.932373046875, 19.609375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 15.0, 14.0, 20.0, 30.0, 34.0, 78.0, 102.0, 167.0, 220.0, 355.0, 527.0, 882.0, 1517.0, 2416.0, 4035.0, 6786.0, 12517.0, 22800.0, 43154.0, 81357.0, 136573.0, 186757.0, 192970.0, 150532.0, 92975.0, 50793.0, 26834.0, 14409.0, 7917.0, 4769.0, 2649.0, 1602.0, 1004.0, 598.0, 411.0, 254.0, 163.0, 109.0, 67.0, 37.0, 39.0, 21.0, 12.0, 7.0, 11.0, 1.0, 2.0, 6.0, 2.0, 3.0, 1.0], "bins": [-16.703125, -16.2275390625, -15.751953125, -15.2763671875, -14.80078125, -14.3251953125, -13.849609375, -13.3740234375, -12.8984375, -12.4228515625, -11.947265625, -11.4716796875, -10.99609375, -10.5205078125, -10.044921875, -9.5693359375, -9.09375, -8.6181640625, -8.142578125, -7.6669921875, -7.19140625, -6.7158203125, -6.240234375, -5.7646484375, -5.2890625, -4.8134765625, -4.337890625, -3.8623046875, -3.38671875, -2.9111328125, -2.435546875, -1.9599609375, -1.484375, -1.0087890625, -0.533203125, -0.0576171875, 0.41796875, 0.8935546875, 1.369140625, 1.8447265625, 2.3203125, 2.7958984375, 3.271484375, 3.7470703125, 4.22265625, 4.6982421875, 5.173828125, 5.6494140625, 6.125, 6.6005859375, 7.076171875, 7.5517578125, 8.02734375, 8.5029296875, 8.978515625, 9.4541015625, 9.9296875, 10.4052734375, 10.880859375, 11.3564453125, 11.83203125, 12.3076171875, 12.783203125, 13.2587890625, 13.734375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 5.0, 3.0, 2.0, 9.0, 11.0, 11.0, 21.0, 40.0, 40.0, 53.0, 47.0, 75.0, 84.0, 75.0, 83.0, 86.0, 61.0, 63.0, 44.0, 50.0, 26.0, 32.0, 12.0, 20.0, 12.0, 8.0, 4.0, 7.0, 6.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0018835067749023438, -0.0018233805894851685, -0.0017632544040679932, -0.0017031282186508179, -0.0016430020332336426, -0.0015828758478164673, -0.001522749662399292, -0.0014626234769821167, -0.0014024972915649414, -0.0013423711061477661, -0.0012822449207305908, -0.0012221187353134155, -0.0011619925498962402, -0.001101866364479065, -0.0010417401790618896, -0.0009816139936447144, -0.0009214878082275391, -0.0008613616228103638, -0.0008012354373931885, -0.0007411092519760132, -0.0006809830665588379, -0.0006208568811416626, -0.0005607306957244873, -0.000500604510307312, -0.0004404783248901367, -0.0003803521394729614, -0.00032022595405578613, -0.00026009976863861084, -0.00019997358322143555, -0.00013984739780426025, -7.972121238708496e-05, -1.9595026969909668e-05, 4.0531158447265625e-05, 0.00010065734386444092, 0.0001607835292816162, 0.0002209097146987915, 0.0002810359001159668, 0.0003411620855331421, 0.0004012882709503174, 0.0004614144563674927, 0.000521540641784668, 0.0005816668272018433, 0.0006417930126190186, 0.0007019191980361938, 0.0007620453834533691, 0.0008221715688705444, 0.0008822977542877197, 0.000942423939704895, 0.0010025501251220703, 0.0010626763105392456, 0.001122802495956421, 0.0011829286813735962, 0.0012430548667907715, 0.0013031810522079468, 0.001363307237625122, 0.0014234334230422974, 0.0014835596084594727, 0.001543685793876648, 0.0016038119792938232, 0.0016639381647109985, 0.0017240643501281738, 0.0017841905355453491, 0.0018443167209625244, 0.0019044429063796997, 0.001964569091796875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 2.0, 4.0, 2.0, 8.0, 8.0, 10.0, 25.0, 29.0, 38.0, 48.0, 54.0, 100.0, 108.0, 138.0, 240.0, 318.0, 447.0, 625.0, 1007.0, 1615.0, 2629.0, 4664.0, 8482.0, 15914.0, 30758.0, 59860.0, 105678.0, 161799.0, 193671.0, 177134.0, 125069.0, 73883.0, 39259.0, 19915.0, 10539.0, 5703.0, 3205.0, 1917.0, 1163.0, 780.0, 497.0, 352.0, 203.0, 168.0, 118.0, 97.0, 71.0, 55.0, 44.0, 28.0, 30.0, 15.0, 8.0, 7.0, 12.0, 3.0, 4.0, 0.0, 4.0, 1.0, 2.0], "bins": [-14.421875, -13.966552734375, -13.51123046875, -13.055908203125, -12.6005859375, -12.145263671875, -11.68994140625, -11.234619140625, -10.779296875, -10.323974609375, -9.86865234375, -9.413330078125, -8.9580078125, -8.502685546875, -8.04736328125, -7.592041015625, -7.13671875, -6.681396484375, -6.22607421875, -5.770751953125, -5.3154296875, -4.860107421875, -4.40478515625, -3.949462890625, -3.494140625, -3.038818359375, -2.58349609375, -2.128173828125, -1.6728515625, -1.217529296875, -0.76220703125, -0.306884765625, 0.1484375, 0.603759765625, 1.05908203125, 1.514404296875, 1.9697265625, 2.425048828125, 2.88037109375, 3.335693359375, 3.791015625, 4.246337890625, 4.70166015625, 5.156982421875, 5.6123046875, 6.067626953125, 6.52294921875, 6.978271484375, 7.43359375, 7.888916015625, 8.34423828125, 8.799560546875, 9.2548828125, 9.710205078125, 10.16552734375, 10.620849609375, 11.076171875, 11.531494140625, 11.98681640625, 12.442138671875, 12.8974609375, 13.352783203125, 13.80810546875, 14.263427734375, 14.71875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 5.0, 10.0, 15.0, 20.0, 26.0, 25.0, 33.0, 37.0, 50.0, 48.0, 57.0, 58.0, 66.0, 66.0, 69.0, 51.0, 59.0, 61.0, 41.0, 35.0, 41.0, 23.0, 30.0, 25.0, 6.0, 7.0, 13.0, 2.0, 5.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.35546875, -5.19158935546875, -5.0277099609375, -4.86383056640625, -4.699951171875, -4.53607177734375, -4.3721923828125, -4.20831298828125, -4.04443359375, -3.88055419921875, -3.7166748046875, -3.55279541015625, -3.388916015625, -3.22503662109375, -3.0611572265625, -2.89727783203125, -2.7333984375, -2.56951904296875, -2.4056396484375, -2.24176025390625, -2.077880859375, -1.91400146484375, -1.7501220703125, -1.58624267578125, -1.42236328125, -1.25848388671875, -1.0946044921875, -0.93072509765625, -0.766845703125, -0.60296630859375, -0.4390869140625, -0.27520751953125, -0.111328125, 0.05255126953125, 0.2164306640625, 0.38031005859375, 0.544189453125, 0.70806884765625, 0.8719482421875, 1.03582763671875, 1.19970703125, 1.36358642578125, 1.5274658203125, 1.69134521484375, 1.855224609375, 2.01910400390625, 2.1829833984375, 2.34686279296875, 2.5107421875, 2.67462158203125, 2.8385009765625, 3.00238037109375, 3.166259765625, 3.33013916015625, 3.4940185546875, 3.65789794921875, 3.82177734375, 3.98565673828125, 4.1495361328125, 4.31341552734375, 4.477294921875, 4.64117431640625, 4.8050537109375, 4.96893310546875, 5.1328125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 5.0, 8.0, 5.0, 9.0, 11.0, 10.0, 23.0, 27.0, 17.0, 18.0, 21.0, 21.0, 34.0, 31.0, 34.0, 35.0, 55.0, 40.0, 50.0, 33.0, 44.0, 49.0, 46.0, 44.0, 41.0, 41.0, 30.0, 27.0, 33.0, 27.0, 22.0, 19.0, 21.0, 15.0, 7.0, 13.0, 11.0, 8.0, 7.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.40153694152832, -25.504350662231445, -24.607166290283203, -23.709980010986328, -22.812793731689453, -21.91560935974121, -21.018423080444336, -20.121238708496094, -19.22405242919922, -18.326866149902344, -17.4296817779541, -16.532495498657227, -15.635310173034668, -14.73812484741211, -13.840938568115234, -12.943753242492676, -12.0465669631958, -11.149381637573242, -10.252195358276367, -9.355010032653809, -8.45782470703125, -7.560638904571533, -6.663453102111816, -5.766267776489258, -4.869081974029541, -3.9718964099884033, -3.0747108459472656, -2.177525043487549, -1.2803394794464111, -0.38315391540527344, 0.5140318870544434, 1.411217212677002, 2.3084030151367188, 3.2055885791778564, 4.102774143218994, 4.999959945678711, 5.8971452713012695, 6.794331073760986, 7.691516876220703, 8.588702201843262, 9.48588752746582, 10.383072853088379, 11.280259132385254, 12.177444458007812, 13.074629783630371, 13.97181510925293, 14.869001388549805, 15.766186714172363, 16.663372039794922, 17.560558319091797, 18.45774269104004, 19.354928970336914, 20.25211524963379, 21.14929962158203, 22.046485900878906, 22.94367218017578, 23.840858459472656, 24.73804473876953, 25.635229110717773, 26.53241539001465, 27.429601669311523, 28.326786041259766, 29.22397232055664, 30.121158599853516, 31.018342971801758]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 7.0, 4.0, 5.0, 6.0, 13.0, 10.0, 11.0, 11.0, 14.0, 22.0, 21.0, 21.0, 17.0, 22.0, 36.0, 25.0, 39.0, 25.0, 28.0, 39.0, 44.0, 34.0, 32.0, 33.0, 39.0, 41.0, 44.0, 40.0, 30.0, 24.0, 37.0, 17.0, 26.0, 28.0, 25.0, 17.0, 15.0, 19.0, 18.0, 11.0, 11.0, 13.0, 4.0, 6.0, 3.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-34.50358963012695, -33.491119384765625, -32.47864532470703, -31.466175079345703, -30.453704833984375, -29.441232681274414, -28.428760528564453, -27.416290283203125, -26.403818130493164, -25.391345977783203, -24.378875732421875, -23.366403579711914, -22.353931427001953, -21.341461181640625, -20.328989028930664, -19.316516876220703, -18.304046630859375, -17.291574478149414, -16.279104232788086, -15.266632080078125, -14.25416088104248, -13.241689682006836, -12.229217529296875, -11.21674633026123, -10.204275131225586, -9.191803932189941, -8.179332733154297, -7.166860580444336, -6.154389381408691, -5.141918182373047, -4.129446506500244, -3.1169748306274414, -2.1045055389404297, -1.092034101486206, -0.07956266403198242, 0.9329087734222412, 1.9453802108764648, 2.9578514099121094, 3.970323085784912, 4.982794761657715, 5.995265960693359, 7.007737159729004, 8.020208358764648, 9.03268051147461, 10.045151710510254, 11.057622909545898, 12.07009506225586, 13.082566261291504, 14.095037460327148, 15.107508659362793, 16.119979858398438, 17.1324520111084, 18.14492416381836, 19.157394409179688, 20.16986656188965, 21.18233871459961, 22.194808959960938, 23.2072811126709, 24.219751358032227, 25.232223510742188, 26.244693756103516, 27.257165908813477, 28.269638061523438, 29.282108306884766, 30.294580459594727]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 6.0, 5.0, 14.0, 16.0, 38.0, 57.0, 84.0, 166.0, 294.0, 484.0, 815.0, 1371.0, 2323.0, 3772.0, 6365.0, 10268.0, 17325.0, 27574.0, 44424.0, 69763.0, 105849.0, 156601.0, 220681.0, 294707.0, 369235.0, 430508.0, 457799.0, 447563.0, 400792.0, 330665.0, 254637.0, 183811.0, 127947.0, 84498.0, 54695.0, 34708.0, 21475.0, 13036.0, 8079.0, 4806.0, 2891.0, 1657.0, 1013.0, 618.0, 354.0, 206.0, 118.0, 62.0, 48.0, 38.0, 12.0, 9.0, 9.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-22.03125, -21.358154296875, -20.68505859375, -20.011962890625, -19.3388671875, -18.665771484375, -17.99267578125, -17.319580078125, -16.646484375, -15.973388671875, -15.30029296875, -14.627197265625, -13.9541015625, -13.281005859375, -12.60791015625, -11.934814453125, -11.26171875, -10.588623046875, -9.91552734375, -9.242431640625, -8.5693359375, -7.896240234375, -7.22314453125, -6.550048828125, -5.876953125, -5.203857421875, -4.53076171875, -3.857666015625, -3.1845703125, -2.511474609375, -1.83837890625, -1.165283203125, -0.4921875, 0.180908203125, 0.85400390625, 1.527099609375, 2.2001953125, 2.873291015625, 3.54638671875, 4.219482421875, 4.892578125, 5.565673828125, 6.23876953125, 6.911865234375, 7.5849609375, 8.258056640625, 8.93115234375, 9.604248046875, 10.27734375, 10.950439453125, 11.62353515625, 12.296630859375, 12.9697265625, 13.642822265625, 14.31591796875, 14.989013671875, 15.662109375, 16.335205078125, 17.00830078125, 17.681396484375, 18.3544921875, 19.027587890625, 19.70068359375, 20.373779296875, 21.046875]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 6.0, 2.0, 8.0, 10.0, 9.0, 14.0, 7.0, 13.0, 20.0, 22.0, 16.0, 26.0, 15.0, 33.0, 31.0, 33.0, 35.0, 24.0, 37.0, 43.0, 41.0, 33.0, 27.0, 32.0, 45.0, 48.0, 47.0, 25.0, 26.0, 34.0, 25.0, 21.0, 29.0, 27.0, 16.0, 19.0, 16.0, 10.0, 19.0, 13.0, 13.0, 7.0, 4.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0], "bins": [-29.703125, -28.838134765625, -27.97314453125, -27.108154296875, -26.2431640625, -25.378173828125, -24.51318359375, -23.648193359375, -22.783203125, -21.918212890625, -21.05322265625, -20.188232421875, -19.3232421875, -18.458251953125, -17.59326171875, -16.728271484375, -15.86328125, -14.998291015625, -14.13330078125, -13.268310546875, -12.4033203125, -11.538330078125, -10.67333984375, -9.808349609375, -8.943359375, -8.078369140625, -7.21337890625, -6.348388671875, -5.4833984375, -4.618408203125, -3.75341796875, -2.888427734375, -2.0234375, -1.158447265625, -0.29345703125, 0.571533203125, 1.4365234375, 2.301513671875, 3.16650390625, 4.031494140625, 4.896484375, 5.761474609375, 6.62646484375, 7.491455078125, 8.3564453125, 9.221435546875, 10.08642578125, 10.951416015625, 11.81640625, 12.681396484375, 13.54638671875, 14.411376953125, 15.2763671875, 16.141357421875, 17.00634765625, 17.871337890625, 18.736328125, 19.601318359375, 20.46630859375, 21.331298828125, 22.1962890625, 23.061279296875, 23.92626953125, 24.791259765625, 25.65625]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 9.0, 12.0, 20.0, 40.0, 77.0, 108.0, 190.0, 354.0, 609.0, 953.0, 1747.0, 2809.0, 4515.0, 7413.0, 11748.0, 18302.0, 27792.0, 42135.0, 61085.0, 88167.0, 121028.0, 162091.0, 207877.0, 256047.0, 301280.0, 338585.0, 361547.0, 364416.0, 351017.0, 319259.0, 276569.0, 229001.0, 181822.0, 138182.0, 102507.0, 72033.0, 49436.0, 33386.0, 22457.0, 14278.0, 8973.0, 5711.0, 3501.0, 2085.0, 1275.0, 773.0, 456.0, 266.0, 150.0, 82.0, 54.0, 24.0, 13.0, 13.0, 7.0, 7.0, 1.0, 1.0], "bins": [-19.34375, -18.761474609375, -18.17919921875, -17.596923828125, -17.0146484375, -16.432373046875, -15.85009765625, -15.267822265625, -14.685546875, -14.103271484375, -13.52099609375, -12.938720703125, -12.3564453125, -11.774169921875, -11.19189453125, -10.609619140625, -10.02734375, -9.445068359375, -8.86279296875, -8.280517578125, -7.6982421875, -7.115966796875, -6.53369140625, -5.951416015625, -5.369140625, -4.786865234375, -4.20458984375, -3.622314453125, -3.0400390625, -2.457763671875, -1.87548828125, -1.293212890625, -0.7109375, -0.128662109375, 0.45361328125, 1.035888671875, 1.6181640625, 2.200439453125, 2.78271484375, 3.364990234375, 3.947265625, 4.529541015625, 5.11181640625, 5.694091796875, 6.2763671875, 6.858642578125, 7.44091796875, 8.023193359375, 8.60546875, 9.187744140625, 9.77001953125, 10.352294921875, 10.9345703125, 11.516845703125, 12.09912109375, 12.681396484375, 13.263671875, 13.845947265625, 14.42822265625, 15.010498046875, 15.5927734375, 16.175048828125, 16.75732421875, 17.339599609375, 17.921875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 7.0, 6.0, 10.0, 9.0, 17.0, 16.0, 26.0, 25.0, 37.0, 55.0, 61.0, 57.0, 72.0, 120.0, 116.0, 139.0, 138.0, 153.0, 160.0, 185.0, 203.0, 183.0, 180.0, 197.0, 170.0, 218.0, 184.0, 190.0, 172.0, 157.0, 113.0, 114.0, 100.0, 89.0, 76.0, 68.0, 58.0, 44.0, 31.0, 36.0, 21.0, 17.0, 10.0, 12.0, 8.0, 8.0, 10.0, 3.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.09375, -10.6961669921875, -10.298583984375, -9.9010009765625, -9.50341796875, -9.1058349609375, -8.708251953125, -8.3106689453125, -7.9130859375, -7.5155029296875, -7.117919921875, -6.7203369140625, -6.32275390625, -5.9251708984375, -5.527587890625, -5.1300048828125, -4.732421875, -4.3348388671875, -3.937255859375, -3.5396728515625, -3.14208984375, -2.7445068359375, -2.346923828125, -1.9493408203125, -1.5517578125, -1.1541748046875, -0.756591796875, -0.3590087890625, 0.03857421875, 0.4361572265625, 0.833740234375, 1.2313232421875, 1.62890625, 2.0264892578125, 2.424072265625, 2.8216552734375, 3.21923828125, 3.6168212890625, 4.014404296875, 4.4119873046875, 4.8095703125, 5.2071533203125, 5.604736328125, 6.0023193359375, 6.39990234375, 6.7974853515625, 7.195068359375, 7.5926513671875, 7.990234375, 8.3878173828125, 8.785400390625, 9.1829833984375, 9.58056640625, 9.9781494140625, 10.375732421875, 10.7733154296875, 11.1708984375, 11.5684814453125, 11.966064453125, 12.3636474609375, 12.76123046875, 13.1588134765625, 13.556396484375, 13.9539794921875, 14.3515625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 3.0, 10.0, 11.0, 14.0, 13.0, 18.0, 27.0, 23.0, 29.0, 24.0, 30.0, 31.0, 43.0, 35.0, 36.0, 39.0, 44.0, 41.0, 41.0, 46.0, 47.0, 42.0, 37.0, 36.0, 35.0, 30.0, 25.0, 31.0, 24.0, 20.0, 14.0, 25.0, 10.0, 15.0, 10.0, 6.0, 9.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.26859474182129, -26.371686935424805, -25.474777221679688, -24.577869415283203, -23.680959701538086, -22.7840518951416, -21.887142181396484, -20.990234375, -20.093326568603516, -19.19641876220703, -18.299509048461914, -17.40260124206543, -16.505691528320312, -15.608783721923828, -14.711874961853027, -13.814966201782227, -12.918057441711426, -12.021148681640625, -11.124239921569824, -10.227331161499023, -9.330423355102539, -8.433514595031738, -7.5366058349609375, -6.639697551727295, -5.742788791656494, -4.845880031585693, -3.948971748352051, -3.05206298828125, -2.1551544666290283, -1.2582459449768066, -0.36133718490600586, 0.5355710983276367, 1.4324798583984375, 2.329388380050659, 3.226296901702881, 4.123205661773682, 5.020113945007324, 5.917022705078125, 6.813931465148926, 7.710839748382568, 8.607748031616211, 9.504656791687012, 10.401565551757812, 11.298473358154297, 12.195382118225098, 13.092290878295898, 13.9891996383667, 14.8861083984375, 15.7830171585083, 16.6799259185791, 17.576833724975586, 18.473743438720703, 19.370651245117188, 20.267559051513672, 21.16446876525879, 22.061376571655273, 22.95828628540039, 23.855194091796875, 24.752103805541992, 25.649011611938477, 26.545921325683594, 27.442829132080078, 28.339736938476562, 29.23664665222168, 30.133554458618164]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 5.0, 5.0, 6.0, 2.0, 3.0, 1.0, 12.0, 15.0, 21.0, 15.0, 20.0, 31.0, 27.0, 35.0, 33.0, 29.0, 37.0, 35.0, 42.0, 37.0, 50.0, 50.0, 29.0, 41.0, 46.0, 41.0, 45.0, 34.0, 24.0, 36.0, 37.0, 23.0, 25.0, 19.0, 15.0, 13.0, 12.0, 18.0, 14.0, 5.0, 6.0, 5.0, 1.0, 2.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.478355407714844, -36.3380241394043, -35.197696685791016, -34.05736541748047, -32.91703414916992, -31.77670669555664, -30.636375427246094, -29.49604606628418, -28.355716705322266, -27.21538734436035, -26.075056076049805, -24.93472671508789, -23.794397354125977, -22.654067993164062, -21.513736724853516, -20.3734073638916, -19.233076095581055, -18.09274673461914, -16.952415466308594, -15.81208610534668, -14.671756744384766, -13.531426429748535, -12.391096115112305, -11.25076675415039, -10.11043643951416, -8.97010612487793, -7.829776763916016, -6.689446449279785, -5.549116611480713, -4.408786773681641, -3.26845645904541, -2.128126621246338, -0.9877967834472656, 0.1525331735610962, 1.292863130569458, 2.4331932067871094, 3.5735230445861816, 4.713852882385254, 5.854183197021484, 6.994513034820557, 8.134842872619629, 9.27517318725586, 10.415502548217773, 11.555832862854004, 12.696163177490234, 13.836492538452148, 14.976822853088379, 16.11715316772461, 17.257482528686523, 18.397811889648438, 19.538143157958984, 20.6784725189209, 21.818801879882812, 22.95913314819336, 24.099462509155273, 25.239791870117188, 26.380123138427734, 27.52045249938965, 28.660783767700195, 29.80111312866211, 30.941442489624023, 32.08177185058594, 33.222103118896484, 34.36243438720703, 35.50276184082031]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 4.0, 9.0, 11.0, 18.0, 18.0, 22.0, 45.0, 58.0, 80.0, 120.0, 152.0, 257.0, 337.0, 479.0, 757.0, 1222.0, 2213.0, 4052.0, 9352.0, 27548.0, 93404.0, 311827.0, 397540.0, 135087.0, 39462.0, 12887.0, 5011.0, 2444.0, 1385.0, 890.0, 605.0, 374.0, 276.0, 181.0, 125.0, 86.0, 75.0, 43.0, 29.0, 24.0, 16.0, 11.0, 9.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.296875, -26.473388671875, -25.64990234375, -24.826416015625, -24.0029296875, -23.179443359375, -22.35595703125, -21.532470703125, -20.708984375, -19.885498046875, -19.06201171875, -18.238525390625, -17.4150390625, -16.591552734375, -15.76806640625, -14.944580078125, -14.12109375, -13.297607421875, -12.47412109375, -11.650634765625, -10.8271484375, -10.003662109375, -9.18017578125, -8.356689453125, -7.533203125, -6.709716796875, -5.88623046875, -5.062744140625, -4.2392578125, -3.415771484375, -2.59228515625, -1.768798828125, -0.9453125, -0.121826171875, 0.70166015625, 1.525146484375, 2.3486328125, 3.172119140625, 3.99560546875, 4.819091796875, 5.642578125, 6.466064453125, 7.28955078125, 8.113037109375, 8.9365234375, 9.760009765625, 10.58349609375, 11.406982421875, 12.23046875, 13.053955078125, 13.87744140625, 14.700927734375, 15.5244140625, 16.347900390625, 17.17138671875, 17.994873046875, 18.818359375, 19.641845703125, 20.46533203125, 21.288818359375, 22.1123046875, 22.935791015625, 23.75927734375, 24.582763671875, 25.40625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 5.0, 5.0, 4.0, 2.0, 1.0, 12.0, 13.0, 20.0, 17.0, 19.0, 31.0, 24.0, 37.0, 35.0, 26.0, 34.0, 36.0, 40.0, 41.0, 46.0, 52.0, 32.0, 37.0, 46.0, 44.0, 40.0, 37.0, 30.0, 31.0, 39.0, 25.0, 24.0, 19.0, 15.0, 14.0, 13.0, 18.0, 12.0, 7.0, 7.0, 5.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.5, -36.36572265625, -35.2314453125, -34.09716796875, -32.962890625, -31.82861328125, -30.6943359375, -29.56005859375, -28.42578125, -27.29150390625, -26.1572265625, -25.02294921875, -23.888671875, -22.75439453125, -21.6201171875, -20.48583984375, -19.3515625, -18.21728515625, -17.0830078125, -15.94873046875, -14.814453125, -13.68017578125, -12.5458984375, -11.41162109375, -10.27734375, -9.14306640625, -8.0087890625, -6.87451171875, -5.740234375, -4.60595703125, -3.4716796875, -2.33740234375, -1.203125, -0.06884765625, 1.0654296875, 2.19970703125, 3.333984375, 4.46826171875, 5.6025390625, 6.73681640625, 7.87109375, 9.00537109375, 10.1396484375, 11.27392578125, 12.408203125, 13.54248046875, 14.6767578125, 15.81103515625, 16.9453125, 18.07958984375, 19.2138671875, 20.34814453125, 21.482421875, 22.61669921875, 23.7509765625, 24.88525390625, 26.01953125, 27.15380859375, 28.2880859375, 29.42236328125, 30.556640625, 31.69091796875, 32.8251953125, 33.95947265625, 35.09375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 7.0, 4.0, 8.0, 6.0, 24.0, 26.0, 35.0, 36.0, 53.0, 76.0, 119.0, 152.0, 226.0, 321.0, 446.0, 581.0, 779.0, 1160.0, 1826.0, 2818.0, 4257.0, 6973.0, 12240.0, 23768.0, 51487.0, 128793.0, 319255.0, 286491.0, 110467.0, 45567.0, 21159.0, 11078.0, 6461.0, 3876.0, 2470.0, 1608.0, 1154.0, 822.0, 542.0, 425.0, 273.0, 183.0, 177.0, 101.0, 51.0, 48.0, 33.0, 24.0, 25.0, 10.0, 13.0, 5.0, 8.0, 6.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0], "bins": [-11.7109375, -11.319580078125, -10.92822265625, -10.536865234375, -10.1455078125, -9.754150390625, -9.36279296875, -8.971435546875, -8.580078125, -8.188720703125, -7.79736328125, -7.406005859375, -7.0146484375, -6.623291015625, -6.23193359375, -5.840576171875, -5.44921875, -5.057861328125, -4.66650390625, -4.275146484375, -3.8837890625, -3.492431640625, -3.10107421875, -2.709716796875, -2.318359375, -1.927001953125, -1.53564453125, -1.144287109375, -0.7529296875, -0.361572265625, 0.02978515625, 0.421142578125, 0.8125, 1.203857421875, 1.59521484375, 1.986572265625, 2.3779296875, 2.769287109375, 3.16064453125, 3.552001953125, 3.943359375, 4.334716796875, 4.72607421875, 5.117431640625, 5.5087890625, 5.900146484375, 6.29150390625, 6.682861328125, 7.07421875, 7.465576171875, 7.85693359375, 8.248291015625, 8.6396484375, 9.031005859375, 9.42236328125, 9.813720703125, 10.205078125, 10.596435546875, 10.98779296875, 11.379150390625, 11.7705078125, 12.161865234375, 12.55322265625, 12.944580078125, 13.3359375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 1.0, 2.0, 7.0, 6.0, 8.0, 11.0, 6.0, 5.0, 9.0, 16.0, 21.0, 17.0, 18.0, 27.0, 21.0, 26.0, 38.0, 28.0, 29.0, 31.0, 37.0, 39.0, 35.0, 50.0, 34.0, 37.0, 37.0, 37.0, 30.0, 32.0, 37.0, 38.0, 36.0, 29.0, 18.0, 25.0, 17.0, 17.0, 15.0, 9.0, 15.0, 15.0, 1.0, 7.0, 6.0, 9.0, 2.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-25.234375, -24.44873046875, -23.6630859375, -22.87744140625, -22.091796875, -21.30615234375, -20.5205078125, -19.73486328125, -18.94921875, -18.16357421875, -17.3779296875, -16.59228515625, -15.806640625, -15.02099609375, -14.2353515625, -13.44970703125, -12.6640625, -11.87841796875, -11.0927734375, -10.30712890625, -9.521484375, -8.73583984375, -7.9501953125, -7.16455078125, -6.37890625, -5.59326171875, -4.8076171875, -4.02197265625, -3.236328125, -2.45068359375, -1.6650390625, -0.87939453125, -0.09375, 0.69189453125, 1.4775390625, 2.26318359375, 3.048828125, 3.83447265625, 4.6201171875, 5.40576171875, 6.19140625, 6.97705078125, 7.7626953125, 8.54833984375, 9.333984375, 10.11962890625, 10.9052734375, 11.69091796875, 12.4765625, 13.26220703125, 14.0478515625, 14.83349609375, 15.619140625, 16.40478515625, 17.1904296875, 17.97607421875, 18.76171875, 19.54736328125, 20.3330078125, 21.11865234375, 21.904296875, 22.68994140625, 23.4755859375, 24.26123046875, 25.046875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 5.0, 5.0, 11.0, 7.0, 14.0, 13.0, 28.0, 42.0, 43.0, 49.0, 86.0, 93.0, 111.0, 165.0, 204.0, 239.0, 365.0, 462.0, 735.0, 1140.0, 1992.0, 3970.0, 11529.0, 75847.0, 859214.0, 71268.0, 11195.0, 4052.0, 1937.0, 1107.0, 705.0, 497.0, 328.0, 232.0, 223.0, 155.0, 117.0, 72.0, 59.0, 65.0, 38.0, 33.0, 33.0, 26.0, 14.0, 10.0, 11.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-34.5625, -33.46484375, -32.3671875, -31.26953125, -30.171875, -29.07421875, -27.9765625, -26.87890625, -25.78125, -24.68359375, -23.5859375, -22.48828125, -21.390625, -20.29296875, -19.1953125, -18.09765625, -17.0, -15.90234375, -14.8046875, -13.70703125, -12.609375, -11.51171875, -10.4140625, -9.31640625, -8.21875, -7.12109375, -6.0234375, -4.92578125, -3.828125, -2.73046875, -1.6328125, -0.53515625, 0.5625, 1.66015625, 2.7578125, 3.85546875, 4.953125, 6.05078125, 7.1484375, 8.24609375, 9.34375, 10.44140625, 11.5390625, 12.63671875, 13.734375, 14.83203125, 15.9296875, 17.02734375, 18.125, 19.22265625, 20.3203125, 21.41796875, 22.515625, 23.61328125, 24.7109375, 25.80859375, 26.90625, 28.00390625, 29.1015625, 30.19921875, 31.296875, 32.39453125, 33.4921875, 34.58984375, 35.6875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 10.0, 8.0, 16.0, 14.0, 40.0, 55.0, 105.0, 132.0, 175.0, 148.0, 108.0, 75.0, 45.0, 19.0, 11.0, 8.0, 4.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00211334228515625, -0.0020556747913360596, -0.001998007297515869, -0.0019403398036956787, -0.0018826723098754883, -0.0018250048160552979, -0.0017673373222351074, -0.001709669828414917, -0.0016520023345947266, -0.0015943348407745361, -0.0015366673469543457, -0.0014789998531341553, -0.0014213323593139648, -0.0013636648654937744, -0.001305997371673584, -0.0012483298778533936, -0.0011906623840332031, -0.0011329948902130127, -0.0010753273963928223, -0.0010176599025726318, -0.0009599924087524414, -0.000902324914932251, -0.0008446574211120605, -0.0007869899272918701, -0.0007293224334716797, -0.0006716549396514893, -0.0006139874458312988, -0.0005563199520111084, -0.000498652458190918, -0.00044098496437072754, -0.0003833174705505371, -0.0003256499767303467, -0.00026798248291015625, -0.00021031498908996582, -0.0001526474952697754, -9.498000144958496e-05, -3.731250762939453e-05, 2.03549861907959e-05, 7.802248001098633e-05, 0.00013568997383117676, 0.0001933574676513672, 0.0002510249614715576, 0.00030869245529174805, 0.0003663599491119385, 0.0004240274429321289, 0.00048169493675231934, 0.0005393624305725098, 0.0005970299243927002, 0.0006546974182128906, 0.0007123649120330811, 0.0007700324058532715, 0.0008276998996734619, 0.0008853673934936523, 0.0009430348873138428, 0.0010007023811340332, 0.0010583698749542236, 0.001116037368774414, 0.0011737048625946045, 0.001231372356414795, 0.0012890398502349854, 0.0013467073440551758, 0.0014043748378753662, 0.0014620423316955566, 0.001519709825515747, 0.0015773773193359375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 5.0, 9.0, 5.0, 9.0, 5.0, 11.0, 27.0, 34.0, 47.0, 62.0, 89.0, 122.0, 174.0, 275.0, 434.0, 698.0, 1046.0, 1768.0, 3225.0, 6769.0, 18212.0, 75054.0, 504355.0, 356931.0, 52204.0, 14060.0, 5725.0, 2786.0, 1618.0, 950.0, 613.0, 370.0, 272.0, 201.0, 120.0, 62.0, 56.0, 47.0, 23.0, 24.0, 13.0, 20.0, 10.0, 6.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.125, -25.279296875, -24.43359375, -23.587890625, -22.7421875, -21.896484375, -21.05078125, -20.205078125, -19.359375, -18.513671875, -17.66796875, -16.822265625, -15.9765625, -15.130859375, -14.28515625, -13.439453125, -12.59375, -11.748046875, -10.90234375, -10.056640625, -9.2109375, -8.365234375, -7.51953125, -6.673828125, -5.828125, -4.982421875, -4.13671875, -3.291015625, -2.4453125, -1.599609375, -0.75390625, 0.091796875, 0.9375, 1.783203125, 2.62890625, 3.474609375, 4.3203125, 5.166015625, 6.01171875, 6.857421875, 7.703125, 8.548828125, 9.39453125, 10.240234375, 11.0859375, 11.931640625, 12.77734375, 13.623046875, 14.46875, 15.314453125, 16.16015625, 17.005859375, 17.8515625, 18.697265625, 19.54296875, 20.388671875, 21.234375, 22.080078125, 22.92578125, 23.771484375, 24.6171875, 25.462890625, 26.30859375, 27.154296875, 28.0]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 5.0, 7.0, 10.0, 12.0, 21.0, 16.0, 25.0, 62.0, 146.0, 219.0, 200.0, 116.0, 45.0, 27.0, 31.0, 12.0, 11.0, 6.0, 7.0, 4.0, 8.0, 3.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.4453125, -13.0802001953125, -12.715087890625, -12.3499755859375, -11.98486328125, -11.6197509765625, -11.254638671875, -10.8895263671875, -10.5244140625, -10.1593017578125, -9.794189453125, -9.4290771484375, -9.06396484375, -8.6988525390625, -8.333740234375, -7.9686279296875, -7.603515625, -7.2384033203125, -6.873291015625, -6.5081787109375, -6.14306640625, -5.7779541015625, -5.412841796875, -5.0477294921875, -4.6826171875, -4.3175048828125, -3.952392578125, -3.5872802734375, -3.22216796875, -2.8570556640625, -2.491943359375, -2.1268310546875, -1.76171875, -1.3966064453125, -1.031494140625, -0.6663818359375, -0.30126953125, 0.0638427734375, 0.428955078125, 0.7940673828125, 1.1591796875, 1.5242919921875, 1.889404296875, 2.2545166015625, 2.61962890625, 2.9847412109375, 3.349853515625, 3.7149658203125, 4.080078125, 4.4451904296875, 4.810302734375, 5.1754150390625, 5.54052734375, 5.9056396484375, 6.270751953125, 6.6358642578125, 7.0009765625, 7.3660888671875, 7.731201171875, 8.0963134765625, 8.46142578125, 8.8265380859375, 9.191650390625, 9.5567626953125, 9.921875]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 10.0, 7.0, 16.0, 9.0, 16.0, 17.0, 27.0, 30.0, 26.0, 31.0, 37.0, 33.0, 38.0, 39.0, 35.0, 40.0, 36.0, 42.0, 45.0, 45.0, 49.0, 47.0, 31.0, 39.0, 30.0, 26.0, 29.0, 28.0, 21.0, 14.0, 21.0, 15.0, 14.0, 10.0, 7.0, 5.0, 7.0, 6.0, 5.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.927095413208008, -26.02306365966797, -25.11903190612793, -24.21500015258789, -23.31096839904785, -22.406936645507812, -21.502906799316406, -20.598873138427734, -19.694843292236328, -18.79081153869629, -17.88677978515625, -16.98274803161621, -16.078716278076172, -15.174684524536133, -14.27065372467041, -13.366621971130371, -12.462589263916016, -11.558557510375977, -10.654525756835938, -9.750494003295898, -8.84646224975586, -7.9424309730529785, -7.038399696350098, -6.134367942810059, -5.2303361892700195, -4.3263044357299805, -3.4222729206085205, -2.5182414054870605, -1.6142096519470215, -0.7101778984069824, 0.19385337829589844, 1.0978851318359375, 2.0019149780273438, 2.905946731567383, 3.8099782466888428, 4.714009761810303, 5.618041515350342, 6.522073268890381, 7.426104545593262, 8.3301362991333, 9.23416805267334, 10.138199806213379, 11.042231559753418, 11.94626235961914, 12.85029411315918, 13.754325866699219, 14.658357620239258, 15.562389373779297, 16.466421127319336, 17.370452880859375, 18.274484634399414, 19.178516387939453, 20.082548141479492, 20.98657989501953, 21.890609741210938, 22.79464340209961, 23.698673248291016, 24.602705001831055, 25.506736755371094, 26.410768508911133, 27.314800262451172, 28.21883201599121, 29.12286376953125, 30.026893615722656, 30.930927276611328]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 7.0, 3.0, 2.0, 6.0, 5.0, 6.0, 12.0, 16.0, 16.0, 22.0, 27.0, 22.0, 32.0, 35.0, 31.0, 42.0, 26.0, 34.0, 44.0, 41.0, 42.0, 48.0, 35.0, 37.0, 43.0, 42.0, 29.0, 44.0, 36.0, 37.0, 28.0, 23.0, 23.0, 12.0, 20.0, 14.0, 14.0, 11.0, 11.0, 6.0, 5.0, 6.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-37.615440368652344, -36.495338439941406, -35.37523651123047, -34.25513458251953, -33.135032653808594, -32.014930725097656, -30.89483070373535, -29.774728775024414, -28.654626846313477, -27.53452491760254, -26.4144229888916, -25.294321060180664, -24.17422103881836, -23.054119110107422, -21.934017181396484, -20.813915252685547, -19.69381332397461, -18.573711395263672, -17.453609466552734, -16.333507537841797, -15.213406562805176, -14.093304634094238, -12.973203659057617, -11.85310173034668, -10.732999801635742, -9.612897872924805, -8.492795944213867, -7.372694969177246, -6.252593040466309, -5.132491111755371, -4.012389659881592, -2.8922882080078125, -1.772186279296875, -0.6520845890045166, 0.4680171012878418, 1.5881187915802002, 2.7082204818725586, 3.828322410583496, 4.948423862457275, 6.068525314331055, 7.188627243041992, 8.30872917175293, 9.428831100463867, 10.548932075500488, 11.669034004211426, 12.789135932922363, 13.909236907958984, 15.029338836669922, 16.14944076538086, 17.269542694091797, 18.389644622802734, 19.509746551513672, 20.62984848022461, 21.749950408935547, 22.87005043029785, 23.99015235900879, 25.110254287719727, 26.230356216430664, 27.3504581451416, 28.47056007385254, 29.590660095214844, 30.71076202392578, 31.83086395263672, 32.950965881347656, 34.071067810058594]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 9.0, 17.0, 24.0, 30.0, 75.0, 96.0, 123.0, 223.0, 330.0, 530.0, 806.0, 1346.0, 2075.0, 3259.0, 5140.0, 7590.0, 11785.0, 17591.0, 25611.0, 35728.0, 48575.0, 62859.0, 77701.0, 90715.0, 99134.0, 101318.0, 95822.0, 86704.0, 73027.0, 57656.0, 44023.0, 32056.0, 22375.0, 15305.0, 10136.0, 6808.0, 4381.0, 2775.0, 1757.0, 1131.0, 743.0, 454.0, 224.0, 158.0, 121.0, 81.0, 52.0, 33.0, 16.0, 12.0, 7.0, 3.0, 7.0, 2.0, 3.0, 1.0], "bins": [-20.8125, -20.18798828125, -19.5634765625, -18.93896484375, -18.314453125, -17.68994140625, -17.0654296875, -16.44091796875, -15.81640625, -15.19189453125, -14.5673828125, -13.94287109375, -13.318359375, -12.69384765625, -12.0693359375, -11.44482421875, -10.8203125, -10.19580078125, -9.5712890625, -8.94677734375, -8.322265625, -7.69775390625, -7.0732421875, -6.44873046875, -5.82421875, -5.19970703125, -4.5751953125, -3.95068359375, -3.326171875, -2.70166015625, -2.0771484375, -1.45263671875, -0.828125, -0.20361328125, 0.4208984375, 1.04541015625, 1.669921875, 2.29443359375, 2.9189453125, 3.54345703125, 4.16796875, 4.79248046875, 5.4169921875, 6.04150390625, 6.666015625, 7.29052734375, 7.9150390625, 8.53955078125, 9.1640625, 9.78857421875, 10.4130859375, 11.03759765625, 11.662109375, 12.28662109375, 12.9111328125, 13.53564453125, 14.16015625, 14.78466796875, 15.4091796875, 16.03369140625, 16.658203125, 17.28271484375, 17.9072265625, 18.53173828125, 19.15625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 5.0, 2.0, 5.0, 6.0, 5.0, 12.0, 13.0, 20.0, 19.0, 28.0, 22.0, 29.0, 36.0, 29.0, 43.0, 30.0, 31.0, 43.0, 38.0, 47.0, 48.0, 37.0, 33.0, 45.0, 38.0, 41.0, 32.0, 43.0, 37.0, 26.0, 24.0, 21.0, 15.0, 19.0, 12.0, 17.0, 11.0, 10.0, 7.0, 3.0, 8.0, 3.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-36.78125, -35.68896484375, -34.5966796875, -33.50439453125, -32.412109375, -31.31982421875, -30.2275390625, -29.13525390625, -28.04296875, -26.95068359375, -25.8583984375, -24.76611328125, -23.673828125, -22.58154296875, -21.4892578125, -20.39697265625, -19.3046875, -18.21240234375, -17.1201171875, -16.02783203125, -14.935546875, -13.84326171875, -12.7509765625, -11.65869140625, -10.56640625, -9.47412109375, -8.3818359375, -7.28955078125, -6.197265625, -5.10498046875, -4.0126953125, -2.92041015625, -1.828125, -0.73583984375, 0.3564453125, 1.44873046875, 2.541015625, 3.63330078125, 4.7255859375, 5.81787109375, 6.91015625, 8.00244140625, 9.0947265625, 10.18701171875, 11.279296875, 12.37158203125, 13.4638671875, 14.55615234375, 15.6484375, 16.74072265625, 17.8330078125, 18.92529296875, 20.017578125, 21.10986328125, 22.2021484375, 23.29443359375, 24.38671875, 25.47900390625, 26.5712890625, 27.66357421875, 28.755859375, 29.84814453125, 30.9404296875, 32.03271484375, 33.125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 3.0, 4.0, 6.0, 6.0, 12.0, 16.0, 30.0, 61.0, 82.0, 122.0, 182.0, 259.0, 407.0, 601.0, 910.0, 1312.0, 2069.0, 3164.0, 4642.0, 7025.0, 10514.0, 15387.0, 22772.0, 32191.0, 44423.0, 58744.0, 74013.0, 88219.0, 98326.0, 102356.0, 99225.0, 89657.0, 76025.0, 61103.0, 46437.0, 33920.0, 23937.0, 16589.0, 11363.0, 7607.0, 5058.0, 3281.0, 2232.0, 1433.0, 997.0, 632.0, 400.0, 265.0, 171.0, 130.0, 84.0, 55.0, 43.0, 22.0, 19.0, 15.0, 2.0, 1.0, 5.0, 3.0, 1.0], "bins": [-21.109375, -20.46142578125, -19.8134765625, -19.16552734375, -18.517578125, -17.86962890625, -17.2216796875, -16.57373046875, -15.92578125, -15.27783203125, -14.6298828125, -13.98193359375, -13.333984375, -12.68603515625, -12.0380859375, -11.39013671875, -10.7421875, -10.09423828125, -9.4462890625, -8.79833984375, -8.150390625, -7.50244140625, -6.8544921875, -6.20654296875, -5.55859375, -4.91064453125, -4.2626953125, -3.61474609375, -2.966796875, -2.31884765625, -1.6708984375, -1.02294921875, -0.375, 0.27294921875, 0.9208984375, 1.56884765625, 2.216796875, 2.86474609375, 3.5126953125, 4.16064453125, 4.80859375, 5.45654296875, 6.1044921875, 6.75244140625, 7.400390625, 8.04833984375, 8.6962890625, 9.34423828125, 9.9921875, 10.64013671875, 11.2880859375, 11.93603515625, 12.583984375, 13.23193359375, 13.8798828125, 14.52783203125, 15.17578125, 15.82373046875, 16.4716796875, 17.11962890625, 17.767578125, 18.41552734375, 19.0634765625, 19.71142578125, 20.359375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 7.0, 4.0, 3.0, 3.0, 7.0, 10.0, 8.0, 14.0, 15.0, 15.0, 19.0, 27.0, 11.0, 24.0, 28.0, 27.0, 24.0, 27.0, 33.0, 30.0, 30.0, 38.0, 44.0, 48.0, 37.0, 36.0, 39.0, 36.0, 30.0, 35.0, 37.0, 25.0, 35.0, 14.0, 23.0, 24.0, 25.0, 16.0, 14.0, 13.0, 12.0, 10.0, 8.0, 6.0, 1.0, 4.0, 3.0, 4.0, 5.0, 3.0, 5.0, 7.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-20.21875, -19.5732421875, -18.927734375, -18.2822265625, -17.63671875, -16.9912109375, -16.345703125, -15.7001953125, -15.0546875, -14.4091796875, -13.763671875, -13.1181640625, -12.47265625, -11.8271484375, -11.181640625, -10.5361328125, -9.890625, -9.2451171875, -8.599609375, -7.9541015625, -7.30859375, -6.6630859375, -6.017578125, -5.3720703125, -4.7265625, -4.0810546875, -3.435546875, -2.7900390625, -2.14453125, -1.4990234375, -0.853515625, -0.2080078125, 0.4375, 1.0830078125, 1.728515625, 2.3740234375, 3.01953125, 3.6650390625, 4.310546875, 4.9560546875, 5.6015625, 6.2470703125, 6.892578125, 7.5380859375, 8.18359375, 8.8291015625, 9.474609375, 10.1201171875, 10.765625, 11.4111328125, 12.056640625, 12.7021484375, 13.34765625, 13.9931640625, 14.638671875, 15.2841796875, 15.9296875, 16.5751953125, 17.220703125, 17.8662109375, 18.51171875, 19.1572265625, 19.802734375, 20.4482421875, 21.09375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 9.0, 11.0, 15.0, 28.0, 42.0, 72.0, 110.0, 165.0, 244.0, 425.0, 660.0, 983.0, 1653.0, 2815.0, 4910.0, 8827.0, 15688.0, 29387.0, 52817.0, 88610.0, 131027.0, 164372.0, 168520.0, 141725.0, 98716.0, 60383.0, 33857.0, 18505.0, 10111.0, 5592.0, 3191.0, 1926.0, 1182.0, 722.0, 425.0, 257.0, 192.0, 133.0, 83.0, 64.0, 45.0, 20.0, 8.0, 12.0, 10.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.625, -12.2193603515625, -11.813720703125, -11.4080810546875, -11.00244140625, -10.5968017578125, -10.191162109375, -9.7855224609375, -9.3798828125, -8.9742431640625, -8.568603515625, -8.1629638671875, -7.75732421875, -7.3516845703125, -6.946044921875, -6.5404052734375, -6.134765625, -5.7291259765625, -5.323486328125, -4.9178466796875, -4.51220703125, -4.1065673828125, -3.700927734375, -3.2952880859375, -2.8896484375, -2.4840087890625, -2.078369140625, -1.6727294921875, -1.26708984375, -0.8614501953125, -0.455810546875, -0.0501708984375, 0.35546875, 0.7611083984375, 1.166748046875, 1.5723876953125, 1.97802734375, 2.3836669921875, 2.789306640625, 3.1949462890625, 3.6005859375, 4.0062255859375, 4.411865234375, 4.8175048828125, 5.22314453125, 5.6287841796875, 6.034423828125, 6.4400634765625, 6.845703125, 7.2513427734375, 7.656982421875, 8.0626220703125, 8.46826171875, 8.8739013671875, 9.279541015625, 9.6851806640625, 10.0908203125, 10.4964599609375, 10.902099609375, 11.3077392578125, 11.71337890625, 12.1190185546875, 12.524658203125, 12.9302978515625, 13.3359375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 3.0, 5.0, 8.0, 11.0, 16.0, 16.0, 18.0, 26.0, 33.0, 38.0, 37.0, 41.0, 49.0, 43.0, 64.0, 55.0, 61.0, 50.0, 58.0, 58.0, 44.0, 36.0, 45.0, 36.0, 32.0, 26.0, 20.0, 15.0, 17.0, 8.0, 5.0, 9.0, 3.0, 7.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011653900146484375, -0.0011249035596847534, -0.0010844171047210693, -0.0010439306497573853, -0.0010034441947937012, -0.0009629577398300171, -0.000922471284866333, -0.0008819848299026489, -0.0008414983749389648, -0.0008010119199752808, -0.0007605254650115967, -0.0007200390100479126, -0.0006795525550842285, -0.0006390661001205444, -0.0005985796451568604, -0.0005580931901931763, -0.0005176067352294922, -0.0004771202802658081, -0.000436633825302124, -0.00039614737033843994, -0.00035566091537475586, -0.0003151744604110718, -0.0002746880054473877, -0.0002342015504837036, -0.00019371509552001953, -0.00015322864055633545, -0.00011274218559265137, -7.225573062896729e-05, -3.17692756652832e-05, 8.717179298400879e-06, 4.920363426208496e-05, 8.969008922576904e-05, 0.00013017654418945312, 0.0001706629991531372, 0.0002111494541168213, 0.00025163590908050537, 0.00029212236404418945, 0.00033260881900787354, 0.0003730952739715576, 0.0004135817289352417, 0.0004540681838989258, 0.0004945546388626099, 0.0005350410938262939, 0.000575527548789978, 0.0006160140037536621, 0.0006565004587173462, 0.0006969869136810303, 0.0007374733686447144, 0.0007779598236083984, 0.0008184462785720825, 0.0008589327335357666, 0.0008994191884994507, 0.0009399056434631348, 0.0009803920984268188, 0.001020878553390503, 0.001061365008354187, 0.001101851463317871, 0.0011423379182815552, 0.0011828243732452393, 0.0012233108282089233, 0.0012637972831726074, 0.0013042837381362915, 0.0013447701930999756, 0.0013852566480636597, 0.0014257431030273438]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 5.0, 14.0, 16.0, 27.0, 38.0, 66.0, 112.0, 173.0, 312.0, 480.0, 904.0, 1668.0, 2903.0, 5780.0, 11264.0, 22708.0, 45325.0, 85753.0, 140835.0, 187699.0, 192769.0, 150685.0, 95055.0, 51478.0, 25789.0, 12674.0, 6450.0, 3370.0, 1800.0, 984.0, 571.0, 352.0, 200.0, 109.0, 72.0, 42.0, 26.0, 21.0, 11.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.4921875, -13.9940185546875, -13.495849609375, -12.9976806640625, -12.49951171875, -12.0013427734375, -11.503173828125, -11.0050048828125, -10.5068359375, -10.0086669921875, -9.510498046875, -9.0123291015625, -8.51416015625, -8.0159912109375, -7.517822265625, -7.0196533203125, -6.521484375, -6.0233154296875, -5.525146484375, -5.0269775390625, -4.52880859375, -4.0306396484375, -3.532470703125, -3.0343017578125, -2.5361328125, -2.0379638671875, -1.539794921875, -1.0416259765625, -0.54345703125, -0.0452880859375, 0.452880859375, 0.9510498046875, 1.44921875, 1.9473876953125, 2.445556640625, 2.9437255859375, 3.44189453125, 3.9400634765625, 4.438232421875, 4.9364013671875, 5.4345703125, 5.9327392578125, 6.430908203125, 6.9290771484375, 7.42724609375, 7.9254150390625, 8.423583984375, 8.9217529296875, 9.419921875, 9.9180908203125, 10.416259765625, 10.9144287109375, 11.41259765625, 11.9107666015625, 12.408935546875, 12.9071044921875, 13.4052734375, 13.9034423828125, 14.401611328125, 14.8997802734375, 15.39794921875, 15.8961181640625, 16.394287109375, 16.8924560546875, 17.390625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 3.0, 2.0, 5.0, 8.0, 10.0, 14.0, 14.0, 26.0, 30.0, 40.0, 50.0, 64.0, 50.0, 53.0, 68.0, 62.0, 57.0, 53.0, 58.0, 60.0, 54.0, 47.0, 37.0, 33.0, 24.0, 17.0, 17.0, 10.0, 9.0, 9.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.59765625, -7.38006591796875, -7.1624755859375, -6.94488525390625, -6.727294921875, -6.50970458984375, -6.2921142578125, -6.07452392578125, -5.85693359375, -5.63934326171875, -5.4217529296875, -5.20416259765625, -4.986572265625, -4.76898193359375, -4.5513916015625, -4.33380126953125, -4.1162109375, -3.89862060546875, -3.6810302734375, -3.46343994140625, -3.245849609375, -3.02825927734375, -2.8106689453125, -2.59307861328125, -2.37548828125, -2.15789794921875, -1.9403076171875, -1.72271728515625, -1.505126953125, -1.28753662109375, -1.0699462890625, -0.85235595703125, -0.634765625, -0.41717529296875, -0.1995849609375, 0.01800537109375, 0.235595703125, 0.45318603515625, 0.6707763671875, 0.88836669921875, 1.10595703125, 1.32354736328125, 1.5411376953125, 1.75872802734375, 1.976318359375, 2.19390869140625, 2.4114990234375, 2.62908935546875, 2.8466796875, 3.06427001953125, 3.2818603515625, 3.49945068359375, 3.717041015625, 3.93463134765625, 4.1522216796875, 4.36981201171875, 4.58740234375, 4.80499267578125, 5.0225830078125, 5.24017333984375, 5.457763671875, 5.67535400390625, 5.8929443359375, 6.11053466796875, 6.328125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 4.0, 3.0, 11.0, 11.0, 10.0, 28.0, 10.0, 23.0, 23.0, 28.0, 33.0, 41.0, 33.0, 44.0, 45.0, 46.0, 26.0, 46.0, 56.0, 50.0, 37.0, 55.0, 32.0, 36.0, 37.0, 40.0, 34.0, 27.0, 21.0, 17.0, 20.0, 13.0, 14.0, 8.0, 11.0, 6.0, 6.0, 3.0, 8.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.083648681640625, -32.109161376953125, -31.134672164916992, -30.160184860229492, -29.18569564819336, -28.21120834350586, -27.236719131469727, -26.262231826782227, -25.287742614746094, -24.313255310058594, -23.33876609802246, -22.36427879333496, -21.389789581298828, -20.415302276611328, -19.440813064575195, -18.466325759887695, -17.491836547851562, -16.517349243164062, -15.54286003112793, -14.568371772766113, -13.593883514404297, -12.619396209716797, -11.644906997680664, -10.670419692993164, -9.695932388305664, -8.721444129943848, -7.746955871582031, -6.772467613220215, -5.797979354858398, -4.82349157333374, -3.849003314971924, -2.8745150566101074, -1.9000263214111328, -0.9255381226539612, 0.04895007610321045, 1.0234382152557373, 1.9979264736175537, 2.972414493560791, 3.9469027519226074, 4.921391010284424, 5.89587926864624, 6.870367527008057, 7.844855785369873, 8.819343566894531, 9.793831825256348, 10.768320083618164, 11.74280834197998, 12.717296600341797, 13.691784858703613, 14.66627311706543, 15.640761375427246, 16.615249633789062, 17.589736938476562, 18.564226150512695, 19.538713455200195, 20.513202667236328, 21.487689971923828, 22.462177276611328, 23.43666648864746, 24.41115379333496, 25.385643005371094, 26.360130310058594, 27.334619522094727, 28.309106826782227, 29.28359603881836]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 4.0, 5.0, 10.0, 12.0, 9.0, 7.0, 15.0, 13.0, 13.0, 26.0, 25.0, 23.0, 30.0, 49.0, 39.0, 35.0, 31.0, 31.0, 40.0, 43.0, 44.0, 32.0, 40.0, 44.0, 34.0, 28.0, 32.0, 41.0, 38.0, 39.0, 24.0, 31.0, 17.0, 16.0, 15.0, 10.0, 12.0, 5.0, 8.0, 8.0, 5.0, 2.0, 5.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-36.82529830932617, -35.695011138916016, -34.564727783203125, -33.43444061279297, -32.30415344238281, -31.173870086669922, -30.043582916259766, -28.913297653198242, -27.78301239013672, -26.652727127075195, -25.522441864013672, -24.392154693603516, -23.261869430541992, -22.13158416748047, -21.001296997070312, -19.87101173400879, -18.740726470947266, -17.610441207885742, -16.48015594482422, -15.349868774414062, -14.219583511352539, -13.089298248291016, -11.959012031555176, -10.828725814819336, -9.698440551757812, -8.568155288696289, -7.437869071960449, -6.307583332061768, -5.177297592163086, -4.047011852264404, -2.9167261123657227, -1.786440372467041, -0.6561546325683594, 0.47413110733032227, 1.604416847229004, 2.7347025871276855, 3.864988327026367, 4.995274066925049, 6.1255598068237305, 7.255845546722412, 8.386131286621094, 9.516416549682617, 10.646702766418457, 11.776988983154297, 12.90727424621582, 14.037559509277344, 15.167845726013184, 16.298131942749023, 17.428417205810547, 18.55870246887207, 19.688987731933594, 20.81927490234375, 21.949560165405273, 23.079845428466797, 24.210132598876953, 25.340417861938477, 26.470703125, 27.600988388061523, 28.731273651123047, 29.861560821533203, 30.991846084594727, 32.12213134765625, 33.252418518066406, 34.3827018737793, 35.51298904418945]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 8.0, 5.0, 12.0, 16.0, 22.0, 36.0, 43.0, 107.0, 172.0, 355.0, 612.0, 1062.0, 1757.0, 3091.0, 5539.0, 9377.0, 16494.0, 28035.0, 47841.0, 78189.0, 124351.0, 190645.0, 275610.0, 371133.0, 455695.0, 506640.0, 504622.0, 450610.0, 364149.0, 269062.0, 185320.0, 120468.0, 75379.0, 45134.0, 26889.0, 15575.0, 8916.0, 4951.0, 2829.0, 1573.0, 820.0, 509.0, 296.0, 132.0, 84.0, 65.0, 30.0, 22.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.234375, -21.466552734375, -20.69873046875, -19.930908203125, -19.1630859375, -18.395263671875, -17.62744140625, -16.859619140625, -16.091796875, -15.323974609375, -14.55615234375, -13.788330078125, -13.0205078125, -12.252685546875, -11.48486328125, -10.717041015625, -9.94921875, -9.181396484375, -8.41357421875, -7.645751953125, -6.8779296875, -6.110107421875, -5.34228515625, -4.574462890625, -3.806640625, -3.038818359375, -2.27099609375, -1.503173828125, -0.7353515625, 0.032470703125, 0.80029296875, 1.568115234375, 2.3359375, 3.103759765625, 3.87158203125, 4.639404296875, 5.4072265625, 6.175048828125, 6.94287109375, 7.710693359375, 8.478515625, 9.246337890625, 10.01416015625, 10.781982421875, 11.5498046875, 12.317626953125, 13.08544921875, 13.853271484375, 14.62109375, 15.388916015625, 16.15673828125, 16.924560546875, 17.6923828125, 18.460205078125, 19.22802734375, 19.995849609375, 20.763671875, 21.531494140625, 22.29931640625, 23.067138671875, 23.8349609375, 24.602783203125, 25.37060546875, 26.138427734375, 26.90625]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 7.0, 5.0, 5.0, 12.0, 11.0, 9.0, 14.0, 15.0, 18.0, 18.0, 28.0, 18.0, 34.0, 46.0, 38.0, 38.0, 31.0, 31.0, 46.0, 36.0, 47.0, 37.0, 37.0, 30.0, 41.0, 31.0, 40.0, 29.0, 45.0, 32.0, 36.0, 21.0, 14.0, 19.0, 14.0, 17.0, 6.0, 7.0, 8.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-31.34375, -30.385009765625, -29.42626953125, -28.467529296875, -27.5087890625, -26.550048828125, -25.59130859375, -24.632568359375, -23.673828125, -22.715087890625, -21.75634765625, -20.797607421875, -19.8388671875, -18.880126953125, -17.92138671875, -16.962646484375, -16.00390625, -15.045166015625, -14.08642578125, -13.127685546875, -12.1689453125, -11.210205078125, -10.25146484375, -9.292724609375, -8.333984375, -7.375244140625, -6.41650390625, -5.457763671875, -4.4990234375, -3.540283203125, -2.58154296875, -1.622802734375, -0.6640625, 0.294677734375, 1.25341796875, 2.212158203125, 3.1708984375, 4.129638671875, 5.08837890625, 6.047119140625, 7.005859375, 7.964599609375, 8.92333984375, 9.882080078125, 10.8408203125, 11.799560546875, 12.75830078125, 13.717041015625, 14.67578125, 15.634521484375, 16.59326171875, 17.552001953125, 18.5107421875, 19.469482421875, 20.42822265625, 21.386962890625, 22.345703125, 23.304443359375, 24.26318359375, 25.221923828125, 26.1806640625, 27.139404296875, 28.09814453125, 29.056884765625, 30.015625]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [4.0, 5.0, 9.0, 13.0, 37.0, 33.0, 80.0, 154.0, 279.0, 482.0, 731.0, 1324.0, 2271.0, 3698.0, 6199.0, 10062.0, 16244.0, 25517.0, 39172.0, 58853.0, 85721.0, 120739.0, 163878.0, 212740.0, 266808.0, 314424.0, 354816.0, 375865.0, 379042.0, 359747.0, 323099.0, 274926.0, 224171.0, 173185.0, 128319.0, 91366.0, 63554.0, 42844.0, 27811.0, 17636.0, 11336.0, 6895.0, 4205.0, 2553.0, 1430.0, 878.0, 489.0, 278.0, 162.0, 88.0, 52.0, 33.0, 16.0, 12.0, 6.0, 3.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.4375, -16.81689453125, -16.1962890625, -15.57568359375, -14.955078125, -14.33447265625, -13.7138671875, -13.09326171875, -12.47265625, -11.85205078125, -11.2314453125, -10.61083984375, -9.990234375, -9.36962890625, -8.7490234375, -8.12841796875, -7.5078125, -6.88720703125, -6.2666015625, -5.64599609375, -5.025390625, -4.40478515625, -3.7841796875, -3.16357421875, -2.54296875, -1.92236328125, -1.3017578125, -0.68115234375, -0.060546875, 0.56005859375, 1.1806640625, 1.80126953125, 2.421875, 3.04248046875, 3.6630859375, 4.28369140625, 4.904296875, 5.52490234375, 6.1455078125, 6.76611328125, 7.38671875, 8.00732421875, 8.6279296875, 9.24853515625, 9.869140625, 10.48974609375, 11.1103515625, 11.73095703125, 12.3515625, 12.97216796875, 13.5927734375, 14.21337890625, 14.833984375, 15.45458984375, 16.0751953125, 16.69580078125, 17.31640625, 17.93701171875, 18.5576171875, 19.17822265625, 19.798828125, 20.41943359375, 21.0400390625, 21.66064453125, 22.28125]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 8.0, 8.0, 6.0, 17.0, 22.0, 24.0, 50.0, 38.0, 51.0, 81.0, 61.0, 94.0, 117.0, 119.0, 137.0, 151.0, 195.0, 191.0, 183.0, 208.0, 208.0, 219.0, 210.0, 187.0, 181.0, 186.0, 186.0, 154.0, 144.0, 123.0, 88.0, 100.0, 63.0, 61.0, 39.0, 34.0, 28.0, 24.0, 24.0, 16.0, 4.0, 12.0, 10.0, 6.0, 7.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9453125, -11.52099609375, -11.0966796875, -10.67236328125, -10.248046875, -9.82373046875, -9.3994140625, -8.97509765625, -8.55078125, -8.12646484375, -7.7021484375, -7.27783203125, -6.853515625, -6.42919921875, -6.0048828125, -5.58056640625, -5.15625, -4.73193359375, -4.3076171875, -3.88330078125, -3.458984375, -3.03466796875, -2.6103515625, -2.18603515625, -1.76171875, -1.33740234375, -0.9130859375, -0.48876953125, -0.064453125, 0.35986328125, 0.7841796875, 1.20849609375, 1.6328125, 2.05712890625, 2.4814453125, 2.90576171875, 3.330078125, 3.75439453125, 4.1787109375, 4.60302734375, 5.02734375, 5.45166015625, 5.8759765625, 6.30029296875, 6.724609375, 7.14892578125, 7.5732421875, 7.99755859375, 8.421875, 8.84619140625, 9.2705078125, 9.69482421875, 10.119140625, 10.54345703125, 10.9677734375, 11.39208984375, 11.81640625, 12.24072265625, 12.6650390625, 13.08935546875, 13.513671875, 13.93798828125, 14.3623046875, 14.78662109375, 15.2109375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 12.0, 3.0, 14.0, 4.0, 17.0, 17.0, 16.0, 21.0, 21.0, 19.0, 34.0, 35.0, 48.0, 33.0, 38.0, 40.0, 35.0, 37.0, 42.0, 47.0, 45.0, 40.0, 37.0, 31.0, 33.0, 43.0, 32.0, 33.0, 26.0, 27.0, 18.0, 23.0, 14.0, 14.0, 13.0, 7.0, 7.0, 6.0, 5.0, 1.0, 2.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.96746826171875, -27.012842178344727, -26.058218002319336, -25.103591918945312, -24.148967742919922, -23.1943416595459, -22.239717483520508, -21.285091400146484, -20.330467224121094, -19.37584114074707, -18.42121696472168, -17.466590881347656, -16.511966705322266, -15.557340621948242, -14.602716445922852, -13.648090362548828, -12.693465232849121, -11.738840103149414, -10.784214973449707, -9.82958984375, -8.874964714050293, -7.920339107513428, -6.965713977813721, -6.011088848114014, -5.056463718414307, -4.1018385887146, -3.1472134590148926, -2.1925880908966064, -1.2379629611968994, -0.2833375930786133, 0.6712875366210938, 1.6259126663208008, 2.580537796020508, 3.535162925720215, 4.489788055419922, 5.444413185119629, 6.399038314819336, 7.353663921356201, 8.30828857421875, 9.262914657592773, 10.217538833618164, 11.172163963317871, 12.126789093017578, 13.081414222717285, 14.036039352416992, 14.990665435791016, 15.945289611816406, 16.89991569519043, 17.854541778564453, 18.809167861938477, 19.763792037963867, 20.71841812133789, 21.67304229736328, 22.627668380737305, 23.582292556762695, 24.53691864013672, 25.49154281616211, 26.446168899536133, 27.400793075561523, 28.355419158935547, 29.310043334960938, 30.26466941833496, 31.21929359436035, 32.173919677734375, 33.128543853759766]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 7.0, 5.0, 7.0, 14.0, 7.0, 20.0, 19.0, 13.0, 19.0, 23.0, 23.0, 26.0, 26.0, 37.0, 38.0, 40.0, 43.0, 43.0, 45.0, 43.0, 42.0, 33.0, 34.0, 32.0, 32.0, 43.0, 40.0, 33.0, 41.0, 25.0, 25.0, 20.0, 18.0, 12.0, 19.0, 7.0, 8.0, 5.0, 6.0, 9.0, 4.0, 5.0, 3.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-37.99674606323242, -36.858551025390625, -35.72035598754883, -34.58216094970703, -33.443965911865234, -32.30577087402344, -31.16757583618164, -30.029380798339844, -28.891185760498047, -27.75299072265625, -26.614795684814453, -25.476600646972656, -24.33840560913086, -23.200210571289062, -22.062015533447266, -20.92382049560547, -19.785627365112305, -18.647432327270508, -17.50923728942871, -16.371042251586914, -15.232847213745117, -14.09465217590332, -12.95645809173584, -11.818263053894043, -10.680068016052246, -9.54187297821045, -8.403677940368652, -7.265483379364014, -6.127288341522217, -4.98909330368042, -3.8508987426757812, -2.7127037048339844, -1.5745086669921875, -0.4363137483596802, 0.7018811702728271, 1.840075969696045, 2.978271007537842, 4.116466045379639, 5.254660606384277, 6.392855644226074, 7.531050682067871, 8.669245719909668, 9.807440757751465, 10.945634841918945, 12.083829879760742, 13.222024917602539, 14.360219955444336, 15.498414993286133, 16.63661003112793, 17.774805068969727, 18.913000106811523, 20.05119514465332, 21.189390182495117, 22.327585220336914, 23.465778350830078, 24.603973388671875, 25.742168426513672, 26.88036346435547, 28.018558502197266, 29.156753540039062, 30.29494857788086, 31.433143615722656, 32.57133865356445, 33.70953369140625, 34.84772872924805]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 8.0, 6.0, 12.0, 26.0, 39.0, 50.0, 82.0, 125.0, 218.0, 338.0, 521.0, 859.0, 1345.0, 2173.0, 3668.0, 6016.0, 10159.0, 17201.0, 28650.0, 49011.0, 80373.0, 127891.0, 178169.0, 184597.0, 137051.0, 88002.0, 53504.0, 31725.0, 18555.0, 10991.0, 6662.0, 4056.0, 2441.0, 1540.0, 939.0, 582.0, 381.0, 225.0, 142.0, 83.0, 71.0, 27.0, 19.0, 10.0, 7.0, 5.0, 9.0, 1.0, 2.0, 0.0, 1.0], "bins": [-12.4453125, -12.1004638671875, -11.755615234375, -11.4107666015625, -11.06591796875, -10.7210693359375, -10.376220703125, -10.0313720703125, -9.6865234375, -9.3416748046875, -8.996826171875, -8.6519775390625, -8.30712890625, -7.9622802734375, -7.617431640625, -7.2725830078125, -6.927734375, -6.5828857421875, -6.238037109375, -5.8931884765625, -5.54833984375, -5.2034912109375, -4.858642578125, -4.5137939453125, -4.1689453125, -3.8240966796875, -3.479248046875, -3.1343994140625, -2.78955078125, -2.4447021484375, -2.099853515625, -1.7550048828125, -1.41015625, -1.0653076171875, -0.720458984375, -0.3756103515625, -0.03076171875, 0.3140869140625, 0.658935546875, 1.0037841796875, 1.3486328125, 1.6934814453125, 2.038330078125, 2.3831787109375, 2.72802734375, 3.0728759765625, 3.417724609375, 3.7625732421875, 4.107421875, 4.4522705078125, 4.797119140625, 5.1419677734375, 5.48681640625, 5.8316650390625, 6.176513671875, 6.5213623046875, 6.8662109375, 7.2110595703125, 7.555908203125, 7.9007568359375, 8.24560546875, 8.5904541015625, 8.935302734375, 9.2801513671875, 9.625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 7.0, 5.0, 7.0, 14.0, 10.0, 18.0, 19.0, 12.0, 19.0, 23.0, 24.0, 26.0, 27.0, 37.0, 38.0, 44.0, 38.0, 43.0, 46.0, 45.0, 39.0, 33.0, 33.0, 33.0, 35.0, 41.0, 40.0, 31.0, 42.0, 25.0, 24.0, 20.0, 20.0, 14.0, 15.0, 6.0, 9.0, 5.0, 6.0, 9.0, 5.0, 4.0, 3.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-37.71875, -36.5830078125, -35.447265625, -34.3115234375, -33.17578125, -32.0400390625, -30.904296875, -29.7685546875, -28.6328125, -27.4970703125, -26.361328125, -25.2255859375, -24.08984375, -22.9541015625, -21.818359375, -20.6826171875, -19.546875, -18.4111328125, -17.275390625, -16.1396484375, -15.00390625, -13.8681640625, -12.732421875, -11.5966796875, -10.4609375, -9.3251953125, -8.189453125, -7.0537109375, -5.91796875, -4.7822265625, -3.646484375, -2.5107421875, -1.375, -0.2392578125, 0.896484375, 2.0322265625, 3.16796875, 4.3037109375, 5.439453125, 6.5751953125, 7.7109375, 8.8466796875, 9.982421875, 11.1181640625, 12.25390625, 13.3896484375, 14.525390625, 15.6611328125, 16.796875, 17.9326171875, 19.068359375, 20.2041015625, 21.33984375, 22.4755859375, 23.611328125, 24.7470703125, 25.8828125, 27.0185546875, 28.154296875, 29.2900390625, 30.42578125, 31.5615234375, 32.697265625, 33.8330078125, 34.96875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 5.0, 3.0, 10.0, 10.0, 13.0, 24.0, 24.0, 55.0, 55.0, 79.0, 155.0, 202.0, 270.0, 402.0, 608.0, 916.0, 1355.0, 2095.0, 3314.0, 5433.0, 9402.0, 17747.0, 37571.0, 93795.0, 260952.0, 356733.0, 147267.0, 55339.0, 24336.0, 12281.0, 6751.0, 3952.0, 2457.0, 1585.0, 1094.0, 712.0, 489.0, 356.0, 219.0, 148.0, 105.0, 77.0, 56.0, 30.0, 25.0, 13.0, 12.0, 18.0, 7.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.796875, -13.36865234375, -12.9404296875, -12.51220703125, -12.083984375, -11.65576171875, -11.2275390625, -10.79931640625, -10.37109375, -9.94287109375, -9.5146484375, -9.08642578125, -8.658203125, -8.22998046875, -7.8017578125, -7.37353515625, -6.9453125, -6.51708984375, -6.0888671875, -5.66064453125, -5.232421875, -4.80419921875, -4.3759765625, -3.94775390625, -3.51953125, -3.09130859375, -2.6630859375, -2.23486328125, -1.806640625, -1.37841796875, -0.9501953125, -0.52197265625, -0.09375, 0.33447265625, 0.7626953125, 1.19091796875, 1.619140625, 2.04736328125, 2.4755859375, 2.90380859375, 3.33203125, 3.76025390625, 4.1884765625, 4.61669921875, 5.044921875, 5.47314453125, 5.9013671875, 6.32958984375, 6.7578125, 7.18603515625, 7.6142578125, 8.04248046875, 8.470703125, 8.89892578125, 9.3271484375, 9.75537109375, 10.18359375, 10.61181640625, 11.0400390625, 11.46826171875, 11.896484375, 12.32470703125, 12.7529296875, 13.18115234375, 13.609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 8.0, 9.0, 11.0, 17.0, 17.0, 17.0, 21.0, 15.0, 19.0, 32.0, 33.0, 27.0, 17.0, 55.0, 35.0, 46.0, 54.0, 43.0, 45.0, 54.0, 44.0, 31.0, 43.0, 59.0, 40.0, 28.0, 26.0, 31.0, 26.0, 18.0, 10.0, 16.0, 11.0, 8.0, 12.0, 9.0, 4.0, 3.0, 5.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.8125, -28.83056640625, -27.8486328125, -26.86669921875, -25.884765625, -24.90283203125, -23.9208984375, -22.93896484375, -21.95703125, -20.97509765625, -19.9931640625, -19.01123046875, -18.029296875, -17.04736328125, -16.0654296875, -15.08349609375, -14.1015625, -13.11962890625, -12.1376953125, -11.15576171875, -10.173828125, -9.19189453125, -8.2099609375, -7.22802734375, -6.24609375, -5.26416015625, -4.2822265625, -3.30029296875, -2.318359375, -1.33642578125, -0.3544921875, 0.62744140625, 1.609375, 2.59130859375, 3.5732421875, 4.55517578125, 5.537109375, 6.51904296875, 7.5009765625, 8.48291015625, 9.46484375, 10.44677734375, 11.4287109375, 12.41064453125, 13.392578125, 14.37451171875, 15.3564453125, 16.33837890625, 17.3203125, 18.30224609375, 19.2841796875, 20.26611328125, 21.248046875, 22.22998046875, 23.2119140625, 24.19384765625, 25.17578125, 26.15771484375, 27.1396484375, 28.12158203125, 29.103515625, 30.08544921875, 31.0673828125, 32.04931640625, 33.03125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 6.0, 3.0, 11.0, 7.0, 12.0, 14.0, 29.0, 29.0, 44.0, 54.0, 67.0, 116.0, 172.0, 218.0, 354.0, 518.0, 889.0, 1415.0, 2447.0, 4769.0, 9889.0, 24461.0, 82446.0, 525674.0, 304192.0, 54565.0, 18298.0, 7878.0, 3973.0, 2210.0, 1344.0, 758.0, 504.0, 351.0, 241.0, 156.0, 119.0, 91.0, 53.0, 47.0, 35.0, 32.0, 21.0, 14.0, 9.0, 6.0, 10.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5546875, -14.0828857421875, -13.611083984375, -13.1392822265625, -12.66748046875, -12.1956787109375, -11.723876953125, -11.2520751953125, -10.7802734375, -10.3084716796875, -9.836669921875, -9.3648681640625, -8.89306640625, -8.4212646484375, -7.949462890625, -7.4776611328125, -7.005859375, -6.5340576171875, -6.062255859375, -5.5904541015625, -5.11865234375, -4.6468505859375, -4.175048828125, -3.7032470703125, -3.2314453125, -2.7596435546875, -2.287841796875, -1.8160400390625, -1.34423828125, -0.8724365234375, -0.400634765625, 0.0711669921875, 0.54296875, 1.0147705078125, 1.486572265625, 1.9583740234375, 2.43017578125, 2.9019775390625, 3.373779296875, 3.8455810546875, 4.3173828125, 4.7891845703125, 5.260986328125, 5.7327880859375, 6.20458984375, 6.6763916015625, 7.148193359375, 7.6199951171875, 8.091796875, 8.5635986328125, 9.035400390625, 9.5072021484375, 9.97900390625, 10.4508056640625, 10.922607421875, 11.3944091796875, 11.8662109375, 12.3380126953125, 12.809814453125, 13.2816162109375, 13.75341796875, 14.2252197265625, 14.697021484375, 15.1688232421875, 15.640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 4.0, 2.0, 7.0, 9.0, 9.0, 10.0, 18.0, 27.0, 27.0, 25.0, 36.0, 42.0, 58.0, 55.0, 78.0, 85.0, 70.0, 78.0, 67.0, 57.0, 44.0, 40.0, 24.0, 28.0, 18.0, 17.0, 12.0, 12.0, 3.0, 9.0, 2.0, 4.0, 8.0, 7.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007748603820800781, -0.0007491409778594971, -0.000723421573638916, -0.000697702169418335, -0.0006719827651977539, -0.0006462633609771729, -0.0006205439567565918, -0.0005948245525360107, -0.0005691051483154297, -0.0005433857440948486, -0.0005176663398742676, -0.0004919469356536865, -0.00046622753143310547, -0.0004405081272125244, -0.00041478872299194336, -0.0003890693187713623, -0.00036334991455078125, -0.0003376305103302002, -0.00031191110610961914, -0.0002861917018890381, -0.00026047229766845703, -0.00023475289344787598, -0.00020903348922729492, -0.00018331408500671387, -0.0001575946807861328, -0.00013187527656555176, -0.0001061558723449707, -8.043646812438965e-05, -5.4717063903808594e-05, -2.899765968322754e-05, -3.2782554626464844e-06, 2.244114875793457e-05, 4.8160552978515625e-05, 7.387995719909668e-05, 9.959936141967773e-05, 0.0001253187656402588, 0.00015103816986083984, 0.0001767575740814209, 0.00020247697830200195, 0.000228196382522583, 0.00025391578674316406, 0.0002796351909637451, 0.00030535459518432617, 0.0003310739994049072, 0.0003567934036254883, 0.00038251280784606934, 0.0004082322120666504, 0.00043395161628723145, 0.0004596710205078125, 0.00048539042472839355, 0.0005111098289489746, 0.0005368292331695557, 0.0005625486373901367, 0.0005882680416107178, 0.0006139874458312988, 0.0006397068500518799, 0.0006654262542724609, 0.000691145658493042, 0.000716865062713623, 0.0007425844669342041, 0.0007683038711547852, 0.0007940232753753662, 0.0008197426795959473, 0.0008454620838165283, 0.0008711814880371094]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 5.0, 6.0, 13.0, 21.0, 30.0, 32.0, 52.0, 78.0, 114.0, 160.0, 240.0, 442.0, 672.0, 1086.0, 1753.0, 2801.0, 4976.0, 8596.0, 15882.0, 31029.0, 63160.0, 136204.0, 263089.0, 258200.0, 132286.0, 61273.0, 30226.0, 15510.0, 8464.0, 4799.0, 2767.0, 1702.0, 1023.0, 640.0, 441.0, 235.0, 205.0, 112.0, 75.0, 57.0, 27.0, 24.0, 17.0, 15.0, 8.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.6484375, -10.3255615234375, -10.002685546875, -9.6798095703125, -9.35693359375, -9.0340576171875, -8.711181640625, -8.3883056640625, -8.0654296875, -7.7425537109375, -7.419677734375, -7.0968017578125, -6.77392578125, -6.4510498046875, -6.128173828125, -5.8052978515625, -5.482421875, -5.1595458984375, -4.836669921875, -4.5137939453125, -4.19091796875, -3.8680419921875, -3.545166015625, -3.2222900390625, -2.8994140625, -2.5765380859375, -2.253662109375, -1.9307861328125, -1.60791015625, -1.2850341796875, -0.962158203125, -0.6392822265625, -0.31640625, 0.0064697265625, 0.329345703125, 0.6522216796875, 0.97509765625, 1.2979736328125, 1.620849609375, 1.9437255859375, 2.2666015625, 2.5894775390625, 2.912353515625, 3.2352294921875, 3.55810546875, 3.8809814453125, 4.203857421875, 4.5267333984375, 4.849609375, 5.1724853515625, 5.495361328125, 5.8182373046875, 6.14111328125, 6.4639892578125, 6.786865234375, 7.1097412109375, 7.4326171875, 7.7554931640625, 8.078369140625, 8.4012451171875, 8.72412109375, 9.0469970703125, 9.369873046875, 9.6927490234375, 10.015625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 9.0, 8.0, 11.0, 9.0, 15.0, 12.0, 17.0, 25.0, 25.0, 28.0, 48.0, 44.0, 52.0, 64.0, 70.0, 66.0, 69.0, 65.0, 73.0, 44.0, 25.0, 27.0, 26.0, 38.0, 22.0, 15.0, 5.0, 9.0, 11.0, 8.0, 9.0, 10.0, 9.0, 7.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0], "bins": [-5.35546875, -5.1971435546875, -5.038818359375, -4.8804931640625, -4.72216796875, -4.5638427734375, -4.405517578125, -4.2471923828125, -4.0888671875, -3.9305419921875, -3.772216796875, -3.6138916015625, -3.45556640625, -3.2972412109375, -3.138916015625, -2.9805908203125, -2.822265625, -2.6639404296875, -2.505615234375, -2.3472900390625, -2.18896484375, -2.0306396484375, -1.872314453125, -1.7139892578125, -1.5556640625, -1.3973388671875, -1.239013671875, -1.0806884765625, -0.92236328125, -0.7640380859375, -0.605712890625, -0.4473876953125, -0.2890625, -0.1307373046875, 0.027587890625, 0.1859130859375, 0.34423828125, 0.5025634765625, 0.660888671875, 0.8192138671875, 0.9775390625, 1.1358642578125, 1.294189453125, 1.4525146484375, 1.61083984375, 1.7691650390625, 1.927490234375, 2.0858154296875, 2.244140625, 2.4024658203125, 2.560791015625, 2.7191162109375, 2.87744140625, 3.0357666015625, 3.194091796875, 3.3524169921875, 3.5107421875, 3.6690673828125, 3.827392578125, 3.9857177734375, 4.14404296875, 4.3023681640625, 4.460693359375, 4.6190185546875, 4.77734375]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 12.0, 5.0, 5.0, 9.0, 10.0, 14.0, 22.0, 20.0, 16.0, 16.0, 39.0, 25.0, 34.0, 38.0, 39.0, 42.0, 36.0, 39.0, 36.0, 41.0, 40.0, 46.0, 43.0, 35.0, 27.0, 34.0, 29.0, 39.0, 36.0, 31.0, 19.0, 26.0, 12.0, 19.0, 15.0, 9.0, 12.0, 7.0, 4.0, 3.0, 7.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.130355834960938, -26.19639015197754, -25.262422561645508, -24.32845687866211, -23.394489288330078, -22.46052360534668, -21.52655601501465, -20.59259033203125, -19.65862274169922, -18.72465705871582, -17.79068946838379, -16.85672378540039, -15.92275619506836, -14.988790512084961, -14.05482292175293, -13.120857238769531, -12.186890602111816, -11.252923965454102, -10.318957328796387, -9.384990692138672, -8.451024055480957, -7.5170578956604, -6.5830912590026855, -5.649124622344971, -4.715157985687256, -3.781191349029541, -2.847224712371826, -1.9132583141326904, -0.9792916774749756, -0.045325279235839844, 0.888641357421875, 1.8226079940795898, 2.7565746307373047, 3.6905412673950195, 4.624507904052734, 5.558474540710449, 6.492441177368164, 7.426407337188721, 8.360374450683594, 9.294340133666992, 10.228307723999023, 11.162274360656738, 12.096240997314453, 13.030207633972168, 13.964174270629883, 14.898139953613281, 15.832107543945312, 16.76607322692871, 17.70003890991211, 18.634004592895508, 19.56797218322754, 20.501937866210938, 21.43590545654297, 22.369871139526367, 23.3038387298584, 24.237804412841797, 25.171772003173828, 26.105737686157227, 27.039705276489258, 27.973670959472656, 28.907638549804688, 29.841604232788086, 30.775571823120117, 31.709537506103516, 32.64350509643555]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 7.0, 5.0, 7.0, 13.0, 8.0, 18.0, 21.0, 17.0, 19.0, 16.0, 24.0, 22.0, 31.0, 35.0, 43.0, 42.0, 33.0, 52.0, 45.0, 41.0, 35.0, 39.0, 36.0, 35.0, 33.0, 41.0, 34.0, 36.0, 34.0, 25.0, 25.0, 20.0, 17.0, 24.0, 11.0, 8.0, 12.0, 4.0, 5.0, 8.0, 5.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-37.621097564697266, -36.49016189575195, -35.359222412109375, -34.22828674316406, -33.097347259521484, -31.966411590576172, -30.835474014282227, -29.70453643798828, -28.573598861694336, -27.44266128540039, -26.311723709106445, -25.1807861328125, -24.049850463867188, -22.91891098022461, -21.787975311279297, -20.65703773498535, -19.526100158691406, -18.39516258239746, -17.264225006103516, -16.13328742980957, -15.002350807189941, -13.871413230895996, -12.740476608276367, -11.609539031982422, -10.478601455688477, -9.347663879394531, -8.216726303100586, -7.085789680480957, -5.954852104187012, -4.823914527893066, -3.6929774284362793, -2.562040328979492, -1.4310989379882812, -0.30016160011291504, 0.8307757377624512, 1.9617130756378174, 3.0926504135131836, 4.223587989807129, 5.354525089263916, 6.485462188720703, 7.616399765014648, 8.747337341308594, 9.878274917602539, 11.009211540222168, 12.140149116516113, 13.271086692810059, 14.402023315429688, 15.532960891723633, 16.663898468017578, 17.794836044311523, 18.92577362060547, 20.056711196899414, 21.18764877319336, 22.318584442138672, 23.449522018432617, 24.580459594726562, 25.711397171020508, 26.842334747314453, 27.9732723236084, 29.104209899902344, 30.235145568847656, 31.366085052490234, 32.49702072143555, 33.627960205078125, 34.75889587402344]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 12.0, 15.0, 45.0, 68.0, 104.0, 169.0, 282.0, 490.0, 766.0, 1211.0, 1967.0, 2961.0, 4677.0, 7216.0, 10561.0, 15787.0, 22565.0, 31629.0, 42777.0, 55448.0, 68776.0, 81891.0, 91611.0, 96003.0, 94813.0, 88911.0, 78452.0, 65461.0, 52493.0, 39785.0, 29020.0, 20952.0, 14106.0, 9667.0, 6571.0, 4179.0, 2573.0, 1740.0, 1074.0, 733.0, 411.0, 232.0, 163.0, 87.0, 42.0, 27.0, 20.0, 15.0, 2.0, 3.0, 0.0, 2.0], "bins": [-21.78125, -21.174072265625, -20.56689453125, -19.959716796875, -19.3525390625, -18.745361328125, -18.13818359375, -17.531005859375, -16.923828125, -16.316650390625, -15.70947265625, -15.102294921875, -14.4951171875, -13.887939453125, -13.28076171875, -12.673583984375, -12.06640625, -11.459228515625, -10.85205078125, -10.244873046875, -9.6376953125, -9.030517578125, -8.42333984375, -7.816162109375, -7.208984375, -6.601806640625, -5.99462890625, -5.387451171875, -4.7802734375, -4.173095703125, -3.56591796875, -2.958740234375, -2.3515625, -1.744384765625, -1.13720703125, -0.530029296875, 0.0771484375, 0.684326171875, 1.29150390625, 1.898681640625, 2.505859375, 3.113037109375, 3.72021484375, 4.327392578125, 4.9345703125, 5.541748046875, 6.14892578125, 6.756103515625, 7.36328125, 7.970458984375, 8.57763671875, 9.184814453125, 9.7919921875, 10.399169921875, 11.00634765625, 11.613525390625, 12.220703125, 12.827880859375, 13.43505859375, 14.042236328125, 14.6494140625, 15.256591796875, 15.86376953125, 16.470947265625, 17.078125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 7.0, 8.0, 12.0, 7.0, 18.0, 20.0, 16.0, 20.0, 15.0, 24.0, 23.0, 32.0, 34.0, 34.0, 47.0, 33.0, 54.0, 45.0, 36.0, 42.0, 36.0, 36.0, 30.0, 38.0, 39.0, 36.0, 37.0, 33.0, 27.0, 28.0, 18.0, 18.0, 19.0, 14.0, 9.0, 11.0, 6.0, 5.0, 8.0, 6.0, 5.0, 6.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-36.625, -35.52783203125, -34.4306640625, -33.33349609375, -32.236328125, -31.13916015625, -30.0419921875, -28.94482421875, -27.84765625, -26.75048828125, -25.6533203125, -24.55615234375, -23.458984375, -22.36181640625, -21.2646484375, -20.16748046875, -19.0703125, -17.97314453125, -16.8759765625, -15.77880859375, -14.681640625, -13.58447265625, -12.4873046875, -11.39013671875, -10.29296875, -9.19580078125, -8.0986328125, -7.00146484375, -5.904296875, -4.80712890625, -3.7099609375, -2.61279296875, -1.515625, -0.41845703125, 0.6787109375, 1.77587890625, 2.873046875, 3.97021484375, 5.0673828125, 6.16455078125, 7.26171875, 8.35888671875, 9.4560546875, 10.55322265625, 11.650390625, 12.74755859375, 13.8447265625, 14.94189453125, 16.0390625, 17.13623046875, 18.2333984375, 19.33056640625, 20.427734375, 21.52490234375, 22.6220703125, 23.71923828125, 24.81640625, 25.91357421875, 27.0107421875, 28.10791015625, 29.205078125, 30.30224609375, 31.3994140625, 32.49658203125, 33.59375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 10.0, 10.0, 23.0, 23.0, 50.0, 75.0, 102.0, 218.0, 360.0, 537.0, 904.0, 1571.0, 2699.0, 4302.0, 7323.0, 11502.0, 18747.0, 28823.0, 42824.0, 60643.0, 81537.0, 100675.0, 114781.0, 119316.0, 112369.0, 97198.0, 76498.0, 56670.0, 38830.0, 26300.0, 16699.0, 10392.0, 6581.0, 3950.0, 2461.0, 1373.0, 834.0, 565.0, 278.0, 200.0, 112.0, 64.0, 51.0, 38.0, 17.0, 8.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-26.46875, -25.676025390625, -24.88330078125, -24.090576171875, -23.2978515625, -22.505126953125, -21.71240234375, -20.919677734375, -20.126953125, -19.334228515625, -18.54150390625, -17.748779296875, -16.9560546875, -16.163330078125, -15.37060546875, -14.577880859375, -13.78515625, -12.992431640625, -12.19970703125, -11.406982421875, -10.6142578125, -9.821533203125, -9.02880859375, -8.236083984375, -7.443359375, -6.650634765625, -5.85791015625, -5.065185546875, -4.2724609375, -3.479736328125, -2.68701171875, -1.894287109375, -1.1015625, -0.308837890625, 0.48388671875, 1.276611328125, 2.0693359375, 2.862060546875, 3.65478515625, 4.447509765625, 5.240234375, 6.032958984375, 6.82568359375, 7.618408203125, 8.4111328125, 9.203857421875, 9.99658203125, 10.789306640625, 11.58203125, 12.374755859375, 13.16748046875, 13.960205078125, 14.7529296875, 15.545654296875, 16.33837890625, 17.131103515625, 17.923828125, 18.716552734375, 19.50927734375, 20.302001953125, 21.0947265625, 21.887451171875, 22.68017578125, 23.472900390625, 24.265625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 7.0, 8.0, 8.0, 13.0, 14.0, 26.0, 28.0, 24.0, 32.0, 23.0, 36.0, 33.0, 48.0, 36.0, 48.0, 50.0, 44.0, 37.0, 51.0, 50.0, 41.0, 36.0, 44.0, 30.0, 27.0, 32.0, 24.0, 22.0, 21.0, 28.0, 17.0, 10.0, 10.0, 10.0, 2.0, 4.0, 1.0, 4.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-29.03125, -28.238525390625, -27.44580078125, -26.653076171875, -25.8603515625, -25.067626953125, -24.27490234375, -23.482177734375, -22.689453125, -21.896728515625, -21.10400390625, -20.311279296875, -19.5185546875, -18.725830078125, -17.93310546875, -17.140380859375, -16.34765625, -15.554931640625, -14.76220703125, -13.969482421875, -13.1767578125, -12.384033203125, -11.59130859375, -10.798583984375, -10.005859375, -9.213134765625, -8.42041015625, -7.627685546875, -6.8349609375, -6.042236328125, -5.24951171875, -4.456787109375, -3.6640625, -2.871337890625, -2.07861328125, -1.285888671875, -0.4931640625, 0.299560546875, 1.09228515625, 1.885009765625, 2.677734375, 3.470458984375, 4.26318359375, 5.055908203125, 5.8486328125, 6.641357421875, 7.43408203125, 8.226806640625, 9.01953125, 9.812255859375, 10.60498046875, 11.397705078125, 12.1904296875, 12.983154296875, 13.77587890625, 14.568603515625, 15.361328125, 16.154052734375, 16.94677734375, 17.739501953125, 18.5322265625, 19.324951171875, 20.11767578125, 20.910400390625, 21.703125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 9.0, 11.0, 22.0, 13.0, 36.0, 44.0, 84.0, 109.0, 171.0, 244.0, 361.0, 515.0, 816.0, 1320.0, 2136.0, 3462.0, 5980.0, 10384.0, 18234.0, 33083.0, 58975.0, 96333.0, 141214.0, 171696.0, 167459.0, 130541.0, 86635.0, 50928.0, 28631.0, 16064.0, 9121.0, 5304.0, 3255.0, 1960.0, 1184.0, 755.0, 457.0, 336.0, 204.0, 143.0, 107.0, 57.0, 60.0, 36.0, 29.0, 13.0, 9.0, 7.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.546875, -14.06005859375, -13.5732421875, -13.08642578125, -12.599609375, -12.11279296875, -11.6259765625, -11.13916015625, -10.65234375, -10.16552734375, -9.6787109375, -9.19189453125, -8.705078125, -8.21826171875, -7.7314453125, -7.24462890625, -6.7578125, -6.27099609375, -5.7841796875, -5.29736328125, -4.810546875, -4.32373046875, -3.8369140625, -3.35009765625, -2.86328125, -2.37646484375, -1.8896484375, -1.40283203125, -0.916015625, -0.42919921875, 0.0576171875, 0.54443359375, 1.03125, 1.51806640625, 2.0048828125, 2.49169921875, 2.978515625, 3.46533203125, 3.9521484375, 4.43896484375, 4.92578125, 5.41259765625, 5.8994140625, 6.38623046875, 6.873046875, 7.35986328125, 7.8466796875, 8.33349609375, 8.8203125, 9.30712890625, 9.7939453125, 10.28076171875, 10.767578125, 11.25439453125, 11.7412109375, 12.22802734375, 12.71484375, 13.20166015625, 13.6884765625, 14.17529296875, 14.662109375, 15.14892578125, 15.6357421875, 16.12255859375, 16.609375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 4.0, 6.0, 6.0, 4.0, 6.0, 9.0, 10.0, 10.0, 9.0, 16.0, 24.0, 18.0, 16.0, 30.0, 21.0, 26.0, 45.0, 45.0, 50.0, 49.0, 45.0, 64.0, 60.0, 45.0, 48.0, 40.0, 25.0, 43.0, 34.0, 40.0, 32.0, 21.0, 19.0, 10.0, 11.0, 14.0, 12.0, 5.0, 11.0, 6.0, 4.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0014524459838867188, -0.0014096498489379883, -0.0013668537139892578, -0.0013240575790405273, -0.0012812614440917969, -0.0012384653091430664, -0.001195669174194336, -0.0011528730392456055, -0.001110076904296875, -0.0010672807693481445, -0.001024484634399414, -0.0009816884994506836, -0.0009388923645019531, -0.0008960962295532227, -0.0008533000946044922, -0.0008105039596557617, -0.0007677078247070312, -0.0007249116897583008, -0.0006821155548095703, -0.0006393194198608398, -0.0005965232849121094, -0.0005537271499633789, -0.0005109310150146484, -0.00046813488006591797, -0.0004253387451171875, -0.00038254261016845703, -0.00033974647521972656, -0.0002969503402709961, -0.0002541542053222656, -0.00021135807037353516, -0.0001685619354248047, -0.00012576580047607422, -8.296966552734375e-05, -4.017353057861328e-05, 2.6226043701171875e-06, 4.5418739318847656e-05, 8.821487426757812e-05, 0.0001310110092163086, 0.00017380714416503906, 0.00021660327911376953, 0.0002593994140625, 0.00030219554901123047, 0.00034499168395996094, 0.0003877878189086914, 0.0004305839538574219, 0.00047338008880615234, 0.0005161762237548828, 0.0005589723587036133, 0.0006017684936523438, 0.0006445646286010742, 0.0006873607635498047, 0.0007301568984985352, 0.0007729530334472656, 0.0008157491683959961, 0.0008585453033447266, 0.000901341438293457, 0.0009441375732421875, 0.000986933708190918, 0.0010297298431396484, 0.001072525978088379, 0.0011153221130371094, 0.0011581182479858398, 0.0012009143829345703, 0.0012437105178833008, 0.0012865066528320312]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 4.0, 7.0, 13.0, 13.0, 15.0, 28.0, 24.0, 41.0, 62.0, 100.0, 135.0, 233.0, 312.0, 466.0, 623.0, 1031.0, 1562.0, 2306.0, 3626.0, 5578.0, 9188.0, 14809.0, 23734.0, 38470.0, 59242.0, 86932.0, 116532.0, 138118.0, 140970.0, 123994.0, 96179.0, 66774.0, 43836.0, 27454.0, 17083.0, 10433.0, 6614.0, 4223.0, 2653.0, 1692.0, 1186.0, 727.0, 490.0, 345.0, 219.0, 175.0, 102.0, 75.0, 41.0, 27.0, 19.0, 22.0, 9.0, 7.0, 7.0, 2.0, 4.0, 3.0, 0.0, 2.0], "bins": [-13.6015625, -13.178466796875, -12.75537109375, -12.332275390625, -11.9091796875, -11.486083984375, -11.06298828125, -10.639892578125, -10.216796875, -9.793701171875, -9.37060546875, -8.947509765625, -8.5244140625, -8.101318359375, -7.67822265625, -7.255126953125, -6.83203125, -6.408935546875, -5.98583984375, -5.562744140625, -5.1396484375, -4.716552734375, -4.29345703125, -3.870361328125, -3.447265625, -3.024169921875, -2.60107421875, -2.177978515625, -1.7548828125, -1.331787109375, -0.90869140625, -0.485595703125, -0.0625, 0.360595703125, 0.78369140625, 1.206787109375, 1.6298828125, 2.052978515625, 2.47607421875, 2.899169921875, 3.322265625, 3.745361328125, 4.16845703125, 4.591552734375, 5.0146484375, 5.437744140625, 5.86083984375, 6.283935546875, 6.70703125, 7.130126953125, 7.55322265625, 7.976318359375, 8.3994140625, 8.822509765625, 9.24560546875, 9.668701171875, 10.091796875, 10.514892578125, 10.93798828125, 11.361083984375, 11.7841796875, 12.207275390625, 12.63037109375, 13.053466796875, 13.4765625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 6.0, 4.0, 13.0, 15.0, 13.0, 12.0, 18.0, 28.0, 22.0, 48.0, 42.0, 56.0, 64.0, 53.0, 69.0, 74.0, 85.0, 63.0, 61.0, 49.0, 46.0, 29.0, 30.0, 31.0, 15.0, 12.0, 10.0, 10.0, 5.0, 5.0, 3.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.48828125, -5.25311279296875, -5.0179443359375, -4.78277587890625, -4.547607421875, -4.31243896484375, -4.0772705078125, -3.84210205078125, -3.60693359375, -3.37176513671875, -3.1365966796875, -2.90142822265625, -2.666259765625, -2.43109130859375, -2.1959228515625, -1.96075439453125, -1.7255859375, -1.49041748046875, -1.2552490234375, -1.02008056640625, -0.784912109375, -0.54974365234375, -0.3145751953125, -0.07940673828125, 0.15576171875, 0.39093017578125, 0.6260986328125, 0.86126708984375, 1.096435546875, 1.33160400390625, 1.5667724609375, 1.80194091796875, 2.037109375, 2.27227783203125, 2.5074462890625, 2.74261474609375, 2.977783203125, 3.21295166015625, 3.4481201171875, 3.68328857421875, 3.91845703125, 4.15362548828125, 4.3887939453125, 4.62396240234375, 4.859130859375, 5.09429931640625, 5.3294677734375, 5.56463623046875, 5.7998046875, 6.03497314453125, 6.2701416015625, 6.50531005859375, 6.740478515625, 6.97564697265625, 7.2108154296875, 7.44598388671875, 7.68115234375, 7.91632080078125, 8.1514892578125, 8.38665771484375, 8.621826171875, 8.85699462890625, 9.0921630859375, 9.32733154296875, 9.5625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 7.0, 2.0, 4.0, 3.0, 7.0, 6.0, 10.0, 9.0, 13.0, 17.0, 17.0, 19.0, 28.0, 30.0, 30.0, 47.0, 28.0, 45.0, 29.0, 33.0, 40.0, 41.0, 41.0, 49.0, 42.0, 39.0, 41.0, 39.0, 34.0, 42.0, 34.0, 30.0, 20.0, 22.0, 17.0, 15.0, 11.0, 15.0, 7.0, 10.0, 8.0, 11.0, 2.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.053030014038086, -30.091337203979492, -29.1296443939209, -28.167949676513672, -27.206256866455078, -26.244564056396484, -25.28287124633789, -24.321178436279297, -23.359485626220703, -22.39779281616211, -21.436100006103516, -20.474407196044922, -19.512712478637695, -18.5510196685791, -17.589326858520508, -16.627634048461914, -15.665939331054688, -14.704246520996094, -13.742552757263184, -12.78085994720459, -11.81916618347168, -10.857473373413086, -9.895780563354492, -8.934087753295898, -7.972393989562988, -7.010700702667236, -6.049007415771484, -5.087314605712891, -4.125621318817139, -3.1639280319213867, -2.202235221862793, -1.240541934967041, -0.27884674072265625, 0.6828464269638062, 1.6445395946502686, 2.6062326431274414, 3.5679259300231934, 4.529619216918945, 5.491312026977539, 6.453005313873291, 7.414698600769043, 8.376391410827637, 9.338085174560547, 10.29977798461914, 11.261470794677734, 12.223164558410645, 13.184857368469238, 14.146551132202148, 15.108243942260742, 16.069936752319336, 17.03162956237793, 17.993324279785156, 18.95501708984375, 19.916709899902344, 20.878402709960938, 21.84009552001953, 22.801788330078125, 23.76348114013672, 24.725173950195312, 25.686866760253906, 26.648561477661133, 27.610254287719727, 28.57194709777832, 29.533639907836914, 30.49533462524414]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 4.0, 3.0, 18.0, 10.0, 15.0, 15.0, 21.0, 32.0, 27.0, 30.0, 30.0, 29.0, 37.0, 34.0, 43.0, 43.0, 43.0, 43.0, 31.0, 44.0, 47.0, 29.0, 46.0, 36.0, 34.0, 24.0, 31.0, 27.0, 31.0, 26.0, 18.0, 20.0, 14.0, 13.0, 4.0, 18.0, 5.0, 9.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-43.26028823852539, -42.05245590209961, -40.844627380371094, -39.63679504394531, -38.4289665222168, -37.221134185791016, -36.0133056640625, -34.80547332763672, -33.59764099121094, -32.389808654785156, -31.18198013305664, -29.974149703979492, -28.766319274902344, -27.558486938476562, -26.350656509399414, -25.142826080322266, -23.93499755859375, -22.7271671295166, -21.519336700439453, -20.311506271362305, -19.103675842285156, -17.895843505859375, -16.688013076782227, -15.480182647705078, -14.27235221862793, -13.064521789550781, -11.856691360473633, -10.648859977722168, -9.44102954864502, -8.233199119567871, -7.0253682136535645, -5.817537307739258, -4.609703063964844, -3.401872396469116, -2.1940417289733887, -0.9862110614776611, 0.2216196060180664, 1.4294500350952148, 2.6372809410095215, 3.845111846923828, 5.052942276000977, 6.260772705078125, 7.468603610992432, 8.676434516906738, 9.884264945983887, 11.092095375061035, 12.2999267578125, 13.507757186889648, 14.715587615966797, 15.923418045043945, 17.131248474121094, 18.339078903198242, 19.54690933227539, 20.754741668701172, 21.96257209777832, 23.17040252685547, 24.378232955932617, 25.586063385009766, 26.793893814086914, 28.001724243164062, 29.209556579589844, 30.41738510131836, 31.62521743774414, 32.833045959472656, 34.04087829589844]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 4.0, 11.0, 17.0, 28.0, 63.0, 95.0, 140.0, 276.0, 443.0, 752.0, 1280.0, 2092.0, 3471.0, 5726.0, 9546.0, 15471.0, 25116.0, 39791.0, 61101.0, 93259.0, 136488.0, 192828.0, 259412.0, 328742.0, 390402.0, 428681.0, 437050.0, 409938.0, 358612.0, 292087.0, 222666.0, 160705.0, 112356.0, 75213.0, 48748.0, 31253.0, 19797.0, 11964.0, 7562.0, 4512.0, 2683.0, 1632.0, 929.0, 555.0, 339.0, 201.0, 106.0, 62.0, 38.0, 15.0, 15.0, 9.0, 4.0, 3.0, 2.0, 2.0], "bins": [-23.21875, -22.54052734375, -21.8623046875, -21.18408203125, -20.505859375, -19.82763671875, -19.1494140625, -18.47119140625, -17.79296875, -17.11474609375, -16.4365234375, -15.75830078125, -15.080078125, -14.40185546875, -13.7236328125, -13.04541015625, -12.3671875, -11.68896484375, -11.0107421875, -10.33251953125, -9.654296875, -8.97607421875, -8.2978515625, -7.61962890625, -6.94140625, -6.26318359375, -5.5849609375, -4.90673828125, -4.228515625, -3.55029296875, -2.8720703125, -2.19384765625, -1.515625, -0.83740234375, -0.1591796875, 0.51904296875, 1.197265625, 1.87548828125, 2.5537109375, 3.23193359375, 3.91015625, 4.58837890625, 5.2666015625, 5.94482421875, 6.623046875, 7.30126953125, 7.9794921875, 8.65771484375, 9.3359375, 10.01416015625, 10.6923828125, 11.37060546875, 12.048828125, 12.72705078125, 13.4052734375, 14.08349609375, 14.76171875, 15.43994140625, 16.1181640625, 16.79638671875, 17.474609375, 18.15283203125, 18.8310546875, 19.50927734375, 20.1875]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 3.0, 7.0, 8.0, 16.0, 10.0, 15.0, 20.0, 24.0, 32.0, 25.0, 31.0, 29.0, 38.0, 29.0, 45.0, 40.0, 41.0, 43.0, 39.0, 39.0, 41.0, 39.0, 34.0, 50.0, 36.0, 22.0, 26.0, 36.0, 26.0, 28.0, 25.0, 16.0, 18.0, 14.0, 5.0, 9.0, 14.0, 10.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-37.0, -35.9765625, -34.953125, -33.9296875, -32.90625, -31.8828125, -30.859375, -29.8359375, -28.8125, -27.7890625, -26.765625, -25.7421875, -24.71875, -23.6953125, -22.671875, -21.6484375, -20.625, -19.6015625, -18.578125, -17.5546875, -16.53125, -15.5078125, -14.484375, -13.4609375, -12.4375, -11.4140625, -10.390625, -9.3671875, -8.34375, -7.3203125, -6.296875, -5.2734375, -4.25, -3.2265625, -2.203125, -1.1796875, -0.15625, 0.8671875, 1.890625, 2.9140625, 3.9375, 4.9609375, 5.984375, 7.0078125, 8.03125, 9.0546875, 10.078125, 11.1015625, 12.125, 13.1484375, 14.171875, 15.1953125, 16.21875, 17.2421875, 18.265625, 19.2890625, 20.3125, 21.3359375, 22.359375, 23.3828125, 24.40625, 25.4296875, 26.453125, 27.4765625, 28.5]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 5.0, 13.0, 22.0, 24.0, 60.0, 67.0, 144.0, 224.0, 351.0, 624.0, 1253.0, 1968.0, 3274.0, 5392.0, 8858.0, 14000.0, 21752.0, 33935.0, 50841.0, 74152.0, 104245.0, 143658.0, 188994.0, 239821.0, 287337.0, 332175.0, 362686.0, 374090.0, 366841.0, 338533.0, 296597.0, 248793.0, 197517.0, 151720.0, 111183.0, 79250.0, 54125.0, 36791.0, 23662.0, 15162.0, 9607.0, 5834.0, 3652.0, 2087.0, 1250.0, 734.0, 450.0, 247.0, 128.0, 59.0, 40.0, 30.0, 16.0, 11.0, 9.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.328125, -18.6962890625, -18.064453125, -17.4326171875, -16.80078125, -16.1689453125, -15.537109375, -14.9052734375, -14.2734375, -13.6416015625, -13.009765625, -12.3779296875, -11.74609375, -11.1142578125, -10.482421875, -9.8505859375, -9.21875, -8.5869140625, -7.955078125, -7.3232421875, -6.69140625, -6.0595703125, -5.427734375, -4.7958984375, -4.1640625, -3.5322265625, -2.900390625, -2.2685546875, -1.63671875, -1.0048828125, -0.373046875, 0.2587890625, 0.890625, 1.5224609375, 2.154296875, 2.7861328125, 3.41796875, 4.0498046875, 4.681640625, 5.3134765625, 5.9453125, 6.5771484375, 7.208984375, 7.8408203125, 8.47265625, 9.1044921875, 9.736328125, 10.3681640625, 11.0, 11.6318359375, 12.263671875, 12.8955078125, 13.52734375, 14.1591796875, 14.791015625, 15.4228515625, 16.0546875, 16.6865234375, 17.318359375, 17.9501953125, 18.58203125, 19.2138671875, 19.845703125, 20.4775390625, 21.109375]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 8.0, 8.0, 15.0, 14.0, 23.0, 18.0, 38.0, 42.0, 58.0, 55.0, 69.0, 95.0, 119.0, 109.0, 141.0, 159.0, 200.0, 207.0, 227.0, 210.0, 185.0, 235.0, 217.0, 199.0, 189.0, 193.0, 148.0, 135.0, 128.0, 120.0, 98.0, 86.0, 57.0, 58.0, 62.0, 35.0, 29.0, 22.0, 22.0, 9.0, 5.0, 4.0, 7.0, 4.0, 3.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-12.5703125, -12.1209716796875, -11.671630859375, -11.2222900390625, -10.77294921875, -10.3236083984375, -9.874267578125, -9.4249267578125, -8.9755859375, -8.5262451171875, -8.076904296875, -7.6275634765625, -7.17822265625, -6.7288818359375, -6.279541015625, -5.8302001953125, -5.380859375, -4.9315185546875, -4.482177734375, -4.0328369140625, -3.58349609375, -3.1341552734375, -2.684814453125, -2.2354736328125, -1.7861328125, -1.3367919921875, -0.887451171875, -0.4381103515625, 0.01123046875, 0.4605712890625, 0.909912109375, 1.3592529296875, 1.80859375, 2.2579345703125, 2.707275390625, 3.1566162109375, 3.60595703125, 4.0552978515625, 4.504638671875, 4.9539794921875, 5.4033203125, 5.8526611328125, 6.302001953125, 6.7513427734375, 7.20068359375, 7.6500244140625, 8.099365234375, 8.5487060546875, 8.998046875, 9.4473876953125, 9.896728515625, 10.3460693359375, 10.79541015625, 11.2447509765625, 11.694091796875, 12.1434326171875, 12.5927734375, 13.0421142578125, 13.491455078125, 13.9407958984375, 14.39013671875, 14.8394775390625, 15.288818359375, 15.7381591796875, 16.1875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 9.0, 9.0, 7.0, 24.0, 17.0, 22.0, 24.0, 27.0, 27.0, 26.0, 37.0, 39.0, 39.0, 44.0, 47.0, 42.0, 49.0, 47.0, 53.0, 46.0, 34.0, 36.0, 33.0, 39.0, 33.0, 28.0, 34.0, 17.0, 26.0, 19.0, 15.0, 9.0, 11.0, 13.0, 7.0, 2.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.84752655029297, -29.82241439819336, -28.79730224609375, -27.77219009399414, -26.74707794189453, -25.721965789794922, -24.696855545043945, -23.671743392944336, -22.646631240844727, -21.621519088745117, -20.596406936645508, -19.5712947845459, -18.546184539794922, -17.521072387695312, -16.495960235595703, -15.470848083496094, -14.445735931396484, -13.420623779296875, -12.395511627197266, -11.370400428771973, -10.345288276672363, -9.320176124572754, -8.295064926147461, -7.269952774047852, -6.244840621948242, -5.219728469848633, -4.194616794586182, -3.1695048809051514, -2.144392967224121, -1.1192808151245117, -0.09416913986206055, 0.9309425354003906, 1.9560508728027344, 2.9811627864837646, 4.006274700164795, 5.031386375427246, 6.0564985275268555, 7.081610679626465, 8.106721878051758, 9.131834030151367, 10.156946182250977, 11.182058334350586, 12.207170486450195, 13.232281684875488, 14.257393836975098, 15.282505989074707, 16.3076171875, 17.33272933959961, 18.35784149169922, 19.382953643798828, 20.408065795898438, 21.433177947998047, 22.458290100097656, 23.483402252197266, 24.508512496948242, 25.53362464904785, 26.55873680114746, 27.58384895324707, 28.60896110534668, 29.63407325744629, 30.659183502197266, 31.684295654296875, 32.709407806396484, 33.734519958496094, 34.7596321105957]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 2.0, 7.0, 6.0, 10.0, 15.0, 14.0, 23.0, 14.0, 22.0, 30.0, 19.0, 34.0, 40.0, 30.0, 32.0, 29.0, 40.0, 57.0, 34.0, 42.0, 26.0, 35.0, 46.0, 37.0, 37.0, 37.0, 43.0, 22.0, 32.0, 27.0, 22.0, 26.0, 18.0, 13.0, 19.0, 13.0, 8.0, 11.0, 4.0, 5.0, 8.0, 6.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-37.08695983886719, -35.967811584472656, -34.84865951538086, -33.72951126098633, -32.61035919189453, -31.4912109375, -30.372060775756836, -29.252910614013672, -28.133760452270508, -27.014610290527344, -25.89546012878418, -24.776309967041016, -23.657161712646484, -22.538009643554688, -21.418861389160156, -20.299711227416992, -19.180561065673828, -18.061410903930664, -16.9422607421875, -15.823111534118652, -14.703961372375488, -13.584811210632324, -12.465662002563477, -11.346511840820312, -10.227361679077148, -9.108211517333984, -7.9890618324279785, -6.869912147521973, -5.750761985778809, -4.6316118240356445, -3.5124621391296387, -2.393312454223633, -1.2741661071777344, -0.15501618385314941, 0.9641337394714355, 2.0832836627960205, 3.2024335861206055, 4.3215837478637695, 5.440733432769775, 6.559883117675781, 7.679033279418945, 8.79818344116211, 9.917333602905273, 11.036482810974121, 12.155632972717285, 13.27478313446045, 14.393932342529297, 15.513082504272461, 16.632232666015625, 17.75138282775879, 18.870532989501953, 19.989683151245117, 21.10883331298828, 22.227981567382812, 23.347131729125977, 24.46628189086914, 25.585432052612305, 26.70458221435547, 27.823732376098633, 28.942882537841797, 30.062030792236328, 31.181182861328125, 32.300331115722656, 33.41947937011719, 34.538631439208984]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 8.0, 7.0, 15.0, 27.0, 38.0, 53.0, 67.0, 111.0, 168.0, 227.0, 405.0, 581.0, 908.0, 1382.0, 2196.0, 3347.0, 5167.0, 8252.0, 12689.0, 20254.0, 32196.0, 51602.0, 83330.0, 132750.0, 183088.0, 177026.0, 125193.0, 77510.0, 47668.0, 30017.0, 18817.0, 12029.0, 7764.0, 4792.0, 3127.0, 1996.0, 1312.0, 854.0, 552.0, 352.0, 227.0, 133.0, 94.0, 86.0, 38.0, 36.0, 26.0, 21.0, 10.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-7.6328125, -7.385986328125, -7.13916015625, -6.892333984375, -6.6455078125, -6.398681640625, -6.15185546875, -5.905029296875, -5.658203125, -5.411376953125, -5.16455078125, -4.917724609375, -4.6708984375, -4.424072265625, -4.17724609375, -3.930419921875, -3.68359375, -3.436767578125, -3.18994140625, -2.943115234375, -2.6962890625, -2.449462890625, -2.20263671875, -1.955810546875, -1.708984375, -1.462158203125, -1.21533203125, -0.968505859375, -0.7216796875, -0.474853515625, -0.22802734375, 0.018798828125, 0.265625, 0.512451171875, 0.75927734375, 1.006103515625, 1.2529296875, 1.499755859375, 1.74658203125, 1.993408203125, 2.240234375, 2.487060546875, 2.73388671875, 2.980712890625, 3.2275390625, 3.474365234375, 3.72119140625, 3.968017578125, 4.21484375, 4.461669921875, 4.70849609375, 4.955322265625, 5.2021484375, 5.448974609375, 5.69580078125, 5.942626953125, 6.189453125, 6.436279296875, 6.68310546875, 6.929931640625, 7.1767578125, 7.423583984375, 7.67041015625, 7.917236328125, 8.1640625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 7.0, 6.0, 11.0, 16.0, 13.0, 22.0, 17.0, 22.0, 30.0, 20.0, 31.0, 41.0, 32.0, 32.0, 33.0, 38.0, 56.0, 31.0, 42.0, 25.0, 39.0, 41.0, 40.0, 37.0, 37.0, 39.0, 28.0, 28.0, 28.0, 23.0, 24.0, 18.0, 13.0, 18.0, 12.0, 9.0, 10.0, 5.0, 5.0, 8.0, 6.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-36.90625, -35.79150390625, -34.6767578125, -33.56201171875, -32.447265625, -31.33251953125, -30.2177734375, -29.10302734375, -27.98828125, -26.87353515625, -25.7587890625, -24.64404296875, -23.529296875, -22.41455078125, -21.2998046875, -20.18505859375, -19.0703125, -17.95556640625, -16.8408203125, -15.72607421875, -14.611328125, -13.49658203125, -12.3818359375, -11.26708984375, -10.15234375, -9.03759765625, -7.9228515625, -6.80810546875, -5.693359375, -4.57861328125, -3.4638671875, -2.34912109375, -1.234375, -0.11962890625, 0.9951171875, 2.10986328125, 3.224609375, 4.33935546875, 5.4541015625, 6.56884765625, 7.68359375, 8.79833984375, 9.9130859375, 11.02783203125, 12.142578125, 13.25732421875, 14.3720703125, 15.48681640625, 16.6015625, 17.71630859375, 18.8310546875, 19.94580078125, 21.060546875, 22.17529296875, 23.2900390625, 24.40478515625, 25.51953125, 26.63427734375, 27.7490234375, 28.86376953125, 29.978515625, 31.09326171875, 32.2080078125, 33.32275390625, 34.4375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 5.0, 7.0, 8.0, 14.0, 10.0, 18.0, 27.0, 37.0, 52.0, 67.0, 81.0, 103.0, 178.0, 266.0, 290.0, 414.0, 631.0, 957.0, 1435.0, 2320.0, 3738.0, 6822.0, 13898.0, 35092.0, 118197.0, 437367.0, 300933.0, 75140.0, 25047.0, 10697.0, 5361.0, 3200.0, 1974.0, 1289.0, 831.0, 599.0, 429.0, 271.0, 209.0, 133.0, 113.0, 65.0, 52.0, 51.0, 34.0, 31.0, 15.0, 16.0, 11.0, 11.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0], "bins": [-15.65625, -15.1793212890625, -14.702392578125, -14.2254638671875, -13.74853515625, -13.2716064453125, -12.794677734375, -12.3177490234375, -11.8408203125, -11.3638916015625, -10.886962890625, -10.4100341796875, -9.93310546875, -9.4561767578125, -8.979248046875, -8.5023193359375, -8.025390625, -7.5484619140625, -7.071533203125, -6.5946044921875, -6.11767578125, -5.6407470703125, -5.163818359375, -4.6868896484375, -4.2099609375, -3.7330322265625, -3.256103515625, -2.7791748046875, -2.30224609375, -1.8253173828125, -1.348388671875, -0.8714599609375, -0.39453125, 0.0823974609375, 0.559326171875, 1.0362548828125, 1.51318359375, 1.9901123046875, 2.467041015625, 2.9439697265625, 3.4208984375, 3.8978271484375, 4.374755859375, 4.8516845703125, 5.32861328125, 5.8055419921875, 6.282470703125, 6.7593994140625, 7.236328125, 7.7132568359375, 8.190185546875, 8.6671142578125, 9.14404296875, 9.6209716796875, 10.097900390625, 10.5748291015625, 11.0517578125, 11.5286865234375, 12.005615234375, 12.4825439453125, 12.95947265625, 13.4364013671875, 13.913330078125, 14.3902587890625, 14.8671875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 1.0, 2.0, 1.0, 7.0, 7.0, 9.0, 13.0, 15.0, 15.0, 23.0, 17.0, 27.0, 31.0, 29.0, 30.0, 40.0, 32.0, 41.0, 35.0, 30.0, 32.0, 43.0, 44.0, 55.0, 40.0, 40.0, 24.0, 41.0, 36.0, 34.0, 32.0, 16.0, 24.0, 16.0, 23.0, 22.0, 12.0, 9.0, 8.0, 8.0, 9.0, 6.0, 4.0, 5.0, 5.0, 7.0, 5.0, 2.0, 1.0, 1.0, 4.0], "bins": [-29.109375, -28.2900390625, -27.470703125, -26.6513671875, -25.83203125, -25.0126953125, -24.193359375, -23.3740234375, -22.5546875, -21.7353515625, -20.916015625, -20.0966796875, -19.27734375, -18.4580078125, -17.638671875, -16.8193359375, -16.0, -15.1806640625, -14.361328125, -13.5419921875, -12.72265625, -11.9033203125, -11.083984375, -10.2646484375, -9.4453125, -8.6259765625, -7.806640625, -6.9873046875, -6.16796875, -5.3486328125, -4.529296875, -3.7099609375, -2.890625, -2.0712890625, -1.251953125, -0.4326171875, 0.38671875, 1.2060546875, 2.025390625, 2.8447265625, 3.6640625, 4.4833984375, 5.302734375, 6.1220703125, 6.94140625, 7.7607421875, 8.580078125, 9.3994140625, 10.21875, 11.0380859375, 11.857421875, 12.6767578125, 13.49609375, 14.3154296875, 15.134765625, 15.9541015625, 16.7734375, 17.5927734375, 18.412109375, 19.2314453125, 20.05078125, 20.8701171875, 21.689453125, 22.5087890625, 23.328125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 9.0, 7.0, 8.0, 8.0, 17.0, 28.0, 40.0, 61.0, 91.0, 118.0, 227.0, 323.0, 527.0, 841.0, 1546.0, 2912.0, 5967.0, 14515.0, 40272.0, 214013.0, 640836.0, 83112.0, 23817.0, 9547.0, 4316.0, 2255.0, 1172.0, 689.0, 434.0, 277.0, 182.0, 138.0, 84.0, 52.0, 38.0, 26.0, 19.0, 12.0, 12.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9296875, -13.5108642578125, -13.092041015625, -12.6732177734375, -12.25439453125, -11.8355712890625, -11.416748046875, -10.9979248046875, -10.5791015625, -10.1602783203125, -9.741455078125, -9.3226318359375, -8.90380859375, -8.4849853515625, -8.066162109375, -7.6473388671875, -7.228515625, -6.8096923828125, -6.390869140625, -5.9720458984375, -5.55322265625, -5.1343994140625, -4.715576171875, -4.2967529296875, -3.8779296875, -3.4591064453125, -3.040283203125, -2.6214599609375, -2.20263671875, -1.7838134765625, -1.364990234375, -0.9461669921875, -0.52734375, -0.1085205078125, 0.310302734375, 0.7291259765625, 1.14794921875, 1.5667724609375, 1.985595703125, 2.4044189453125, 2.8232421875, 3.2420654296875, 3.660888671875, 4.0797119140625, 4.49853515625, 4.9173583984375, 5.336181640625, 5.7550048828125, 6.173828125, 6.5926513671875, 7.011474609375, 7.4302978515625, 7.84912109375, 8.2679443359375, 8.686767578125, 9.1055908203125, 9.5244140625, 9.9432373046875, 10.362060546875, 10.7808837890625, 11.19970703125, 11.6185302734375, 12.037353515625, 12.4561767578125, 12.875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 4.0, 1.0, 2.0, 5.0, 5.0, 5.0, 11.0, 8.0, 14.0, 28.0, 33.0, 60.0, 127.0, 195.0, 161.0, 134.0, 65.0, 37.0, 23.0, 11.0, 15.0, 8.0, 11.0, 6.0, 2.0, 8.0, 4.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0014047622680664062, -0.00136469304561615, -0.0013246238231658936, -0.0012845546007156372, -0.0012444853782653809, -0.0012044161558151245, -0.0011643469333648682, -0.0011242777109146118, -0.0010842084884643555, -0.0010441392660140991, -0.0010040700435638428, -0.0009640008211135864, -0.0009239315986633301, -0.0008838623762130737, -0.0008437931537628174, -0.000803723931312561, -0.0007636547088623047, -0.0007235854864120483, -0.000683516263961792, -0.0006434470415115356, -0.0006033778190612793, -0.000563308596611023, -0.0005232393741607666, -0.00048317015171051025, -0.0004431009292602539, -0.00040303170680999756, -0.0003629624843597412, -0.00032289326190948486, -0.0002828240394592285, -0.00024275481700897217, -0.00020268559455871582, -0.00016261637210845947, -0.00012254714965820312, -8.247792720794678e-05, -4.240870475769043e-05, -2.339482307434082e-06, 3.7729740142822266e-05, 7.779896259307861e-05, 0.00011786818504333496, 0.0001579374074935913, 0.00019800662994384766, 0.000238075852394104, 0.00027814507484436035, 0.0003182142972946167, 0.00035828351974487305, 0.0003983527421951294, 0.00043842196464538574, 0.0004784911870956421, 0.0005185604095458984, 0.0005586296319961548, 0.0005986988544464111, 0.0006387680768966675, 0.0006788372993469238, 0.0007189065217971802, 0.0007589757442474365, 0.0007990449666976929, 0.0008391141891479492, 0.0008791834115982056, 0.0009192526340484619, 0.0009593218564987183, 0.0009993910789489746, 0.001039460301399231, 0.0010795295238494873, 0.0011195987462997437, 0.00115966796875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 8.0, 18.0, 12.0, 26.0, 41.0, 50.0, 61.0, 121.0, 165.0, 250.0, 399.0, 693.0, 1170.0, 2149.0, 4031.0, 7431.0, 14124.0, 29954.0, 66507.0, 155203.0, 306899.0, 251208.0, 112386.0, 49093.0, 22376.0, 11016.0, 5742.0, 3030.0, 1775.0, 985.0, 586.0, 398.0, 231.0, 126.0, 74.0, 78.0, 37.0, 29.0, 23.0, 18.0, 12.0, 8.0, 9.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1953125, -8.90625, -8.6171875, -8.328125, -8.0390625, -7.75, -7.4609375, -7.171875, -6.8828125, -6.59375, -6.3046875, -6.015625, -5.7265625, -5.4375, -5.1484375, -4.859375, -4.5703125, -4.28125, -3.9921875, -3.703125, -3.4140625, -3.125, -2.8359375, -2.546875, -2.2578125, -1.96875, -1.6796875, -1.390625, -1.1015625, -0.8125, -0.5234375, -0.234375, 0.0546875, 0.34375, 0.6328125, 0.921875, 1.2109375, 1.5, 1.7890625, 2.078125, 2.3671875, 2.65625, 2.9453125, 3.234375, 3.5234375, 3.8125, 4.1015625, 4.390625, 4.6796875, 4.96875, 5.2578125, 5.546875, 5.8359375, 6.125, 6.4140625, 6.703125, 6.9921875, 7.28125, 7.5703125, 7.859375, 8.1484375, 8.4375, 8.7265625, 9.015625, 9.3046875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 7.0, 8.0, 10.0, 10.0, 8.0, 11.0, 15.0, 17.0, 28.0, 25.0, 37.0, 50.0, 45.0, 49.0, 68.0, 75.0, 73.0, 64.0, 71.0, 47.0, 54.0, 42.0, 30.0, 22.0, 13.0, 21.0, 20.0, 13.0, 13.0, 8.0, 4.0, 8.0, 4.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.681640625, -3.57159423828125, -3.4615478515625, -3.35150146484375, -3.241455078125, -3.13140869140625, -3.0213623046875, -2.91131591796875, -2.80126953125, -2.69122314453125, -2.5811767578125, -2.47113037109375, -2.361083984375, -2.25103759765625, -2.1409912109375, -2.03094482421875, -1.9208984375, -1.81085205078125, -1.7008056640625, -1.59075927734375, -1.480712890625, -1.37066650390625, -1.2606201171875, -1.15057373046875, -1.04052734375, -0.93048095703125, -0.8204345703125, -0.71038818359375, -0.600341796875, -0.49029541015625, -0.3802490234375, -0.27020263671875, -0.16015625, -0.05010986328125, 0.0599365234375, 0.16998291015625, 0.280029296875, 0.39007568359375, 0.5001220703125, 0.61016845703125, 0.72021484375, 0.83026123046875, 0.9403076171875, 1.05035400390625, 1.160400390625, 1.27044677734375, 1.3804931640625, 1.49053955078125, 1.6005859375, 1.71063232421875, 1.8206787109375, 1.93072509765625, 2.040771484375, 2.15081787109375, 2.2608642578125, 2.37091064453125, 2.48095703125, 2.59100341796875, 2.7010498046875, 2.81109619140625, 2.921142578125, 3.03118896484375, 3.1412353515625, 3.25128173828125, 3.361328125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 0.0, 3.0, 7.0, 6.0, 9.0, 14.0, 12.0, 21.0, 25.0, 29.0, 23.0, 34.0, 25.0, 34.0, 43.0, 43.0, 45.0, 39.0, 47.0, 50.0, 38.0, 58.0, 42.0, 34.0, 43.0, 42.0, 34.0, 31.0, 30.0, 26.0, 26.0, 19.0, 20.0, 13.0, 11.0, 8.0, 11.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.220537185668945, -30.17650032043457, -29.132461547851562, -28.088424682617188, -27.044387817382812, -26.000350952148438, -24.95631217956543, -23.912275314331055, -22.868236541748047, -21.824199676513672, -20.780160903930664, -19.73612403869629, -18.692087173461914, -17.648048400878906, -16.60401153564453, -15.559974670410156, -14.515937805175781, -13.47189998626709, -12.427863121032715, -11.383825302124023, -10.339788436889648, -9.295750617980957, -8.251712799072266, -7.207675457000732, -6.163638114929199, -5.119600772857666, -4.075563430786133, -3.0315256118774414, -1.9874882698059082, -0.943450927734375, 0.1005868911743164, 1.1446242332458496, 2.18865966796875, 3.232697010040283, 4.276734352111816, 5.320772171020508, 6.364809513092041, 7.408846855163574, 8.452884674072266, 9.49692153930664, 10.540959358215332, 11.584997177124023, 12.629034042358398, 13.67307186126709, 14.717109680175781, 15.761146545410156, 16.80518341064453, 17.84922218322754, 18.893259048461914, 19.93729591369629, 20.981334686279297, 22.025371551513672, 23.069408416748047, 24.113445281982422, 25.15748405456543, 26.201520919799805, 27.245559692382812, 28.289596557617188, 29.333635330200195, 30.37767219543457, 31.421709060668945, 32.46574783325195, 33.50978469848633, 34.5538215637207, 35.59785842895508]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 3.0, 5.0, 5.0, 14.0, 11.0, 18.0, 27.0, 20.0, 21.0, 30.0, 26.0, 41.0, 20.0, 42.0, 43.0, 38.0, 45.0, 40.0, 33.0, 38.0, 34.0, 47.0, 39.0, 32.0, 31.0, 41.0, 24.0, 38.0, 23.0, 28.0, 21.0, 22.0, 23.0, 14.0, 11.0, 9.0, 6.0, 6.0, 7.0, 8.0, 3.0, 6.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-36.48810577392578, -35.36256790161133, -34.237030029296875, -33.111488342285156, -31.985950469970703, -30.86041259765625, -29.734872817993164, -28.609333038330078, -27.483795166015625, -26.358257293701172, -25.232717514038086, -24.107177734375, -22.981639862060547, -21.856101989746094, -20.730562210083008, -19.605022430419922, -18.47948455810547, -17.353946685791016, -16.22840690612793, -15.10286808013916, -13.97732925415039, -12.851790428161621, -11.726251602172852, -10.600712776184082, -9.475173950195312, -8.349635124206543, -7.224096298217773, -6.098557472229004, -4.973018646240234, -3.847479820251465, -2.7219409942626953, -1.5964021682739258, -0.4708671569824219, 0.6546716690063477, 1.7802104949951172, 2.9057493209838867, 4.031288146972656, 5.156826972961426, 6.282365798950195, 7.407904624938965, 8.533443450927734, 9.658982276916504, 10.784521102905273, 11.910059928894043, 13.035598754882812, 14.161137580871582, 15.286676406860352, 16.412216186523438, 17.53775405883789, 18.663291931152344, 19.78883171081543, 20.914371490478516, 22.03990936279297, 23.165447235107422, 24.290987014770508, 25.416526794433594, 26.542064666748047, 27.6676025390625, 28.793142318725586, 29.918682098388672, 31.044219970703125, 32.16975784301758, 33.29529571533203, 34.42083740234375, 35.5463752746582]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 1.0, 4.0, 9.0, 14.0, 36.0, 51.0, 73.0, 144.0, 197.0, 286.0, 513.0, 804.0, 1275.0, 1976.0, 3022.0, 4779.0, 7312.0, 10481.0, 16014.0, 22710.0, 31626.0, 42832.0, 55120.0, 67682.0, 79661.0, 89057.0, 94130.0, 93701.0, 88241.0, 78430.0, 66441.0, 53199.0, 41284.0, 30523.0, 21824.0, 15456.0, 10212.0, 6826.0, 4515.0, 3042.0, 1855.0, 1221.0, 735.0, 489.0, 261.0, 162.0, 120.0, 95.0, 44.0, 30.0, 19.0, 10.0, 12.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.078125, -17.474365234375, -16.87060546875, -16.266845703125, -15.6630859375, -15.059326171875, -14.45556640625, -13.851806640625, -13.248046875, -12.644287109375, -12.04052734375, -11.436767578125, -10.8330078125, -10.229248046875, -9.62548828125, -9.021728515625, -8.41796875, -7.814208984375, -7.21044921875, -6.606689453125, -6.0029296875, -5.399169921875, -4.79541015625, -4.191650390625, -3.587890625, -2.984130859375, -2.38037109375, -1.776611328125, -1.1728515625, -0.569091796875, 0.03466796875, 0.638427734375, 1.2421875, 1.845947265625, 2.44970703125, 3.053466796875, 3.6572265625, 4.260986328125, 4.86474609375, 5.468505859375, 6.072265625, 6.676025390625, 7.27978515625, 7.883544921875, 8.4873046875, 9.091064453125, 9.69482421875, 10.298583984375, 10.90234375, 11.506103515625, 12.10986328125, 12.713623046875, 13.3173828125, 13.921142578125, 14.52490234375, 15.128662109375, 15.732421875, 16.336181640625, 16.93994140625, 17.543701171875, 18.1474609375, 18.751220703125, 19.35498046875, 19.958740234375, 20.5625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 3.0, 5.0, 5.0, 13.0, 13.0, 19.0, 23.0, 22.0, 20.0, 26.0, 29.0, 38.0, 21.0, 40.0, 42.0, 38.0, 45.0, 41.0, 34.0, 36.0, 39.0, 41.0, 42.0, 34.0, 30.0, 41.0, 25.0, 37.0, 26.0, 27.0, 23.0, 18.0, 26.0, 13.0, 12.0, 8.0, 8.0, 6.0, 8.0, 7.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-35.6875, -34.591796875, -33.49609375, -32.400390625, -31.3046875, -30.208984375, -29.11328125, -28.017578125, -26.921875, -25.826171875, -24.73046875, -23.634765625, -22.5390625, -21.443359375, -20.34765625, -19.251953125, -18.15625, -17.060546875, -15.96484375, -14.869140625, -13.7734375, -12.677734375, -11.58203125, -10.486328125, -9.390625, -8.294921875, -7.19921875, -6.103515625, -5.0078125, -3.912109375, -2.81640625, -1.720703125, -0.625, 0.470703125, 1.56640625, 2.662109375, 3.7578125, 4.853515625, 5.94921875, 7.044921875, 8.140625, 9.236328125, 10.33203125, 11.427734375, 12.5234375, 13.619140625, 14.71484375, 15.810546875, 16.90625, 18.001953125, 19.09765625, 20.193359375, 21.2890625, 22.384765625, 23.48046875, 24.576171875, 25.671875, 26.767578125, 27.86328125, 28.958984375, 30.0546875, 31.150390625, 32.24609375, 33.341796875, 34.4375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 8.0, 10.0, 14.0, 40.0, 53.0, 65.0, 107.0, 189.0, 287.0, 466.0, 658.0, 1106.0, 1807.0, 2886.0, 4513.0, 7057.0, 10865.0, 16319.0, 24354.0, 35061.0, 48256.0, 64067.0, 80390.0, 94310.0, 103721.0, 105999.0, 99785.0, 88039.0, 72357.0, 56515.0, 41511.0, 29723.0, 20149.0, 13506.0, 8979.0, 5556.0, 3595.0, 2310.0, 1456.0, 893.0, 622.0, 340.0, 219.0, 147.0, 101.0, 47.0, 37.0, 25.0, 15.0, 8.0, 7.0, 6.0, 5.0, 2.0, 0.0, 0.0, 1.0], "bins": [-22.234375, -21.545166015625, -20.85595703125, -20.166748046875, -19.4775390625, -18.788330078125, -18.09912109375, -17.409912109375, -16.720703125, -16.031494140625, -15.34228515625, -14.653076171875, -13.9638671875, -13.274658203125, -12.58544921875, -11.896240234375, -11.20703125, -10.517822265625, -9.82861328125, -9.139404296875, -8.4501953125, -7.760986328125, -7.07177734375, -6.382568359375, -5.693359375, -5.004150390625, -4.31494140625, -3.625732421875, -2.9365234375, -2.247314453125, -1.55810546875, -0.868896484375, -0.1796875, 0.509521484375, 1.19873046875, 1.887939453125, 2.5771484375, 3.266357421875, 3.95556640625, 4.644775390625, 5.333984375, 6.023193359375, 6.71240234375, 7.401611328125, 8.0908203125, 8.780029296875, 9.46923828125, 10.158447265625, 10.84765625, 11.536865234375, 12.22607421875, 12.915283203125, 13.6044921875, 14.293701171875, 14.98291015625, 15.672119140625, 16.361328125, 17.050537109375, 17.73974609375, 18.428955078125, 19.1181640625, 19.807373046875, 20.49658203125, 21.185791015625, 21.875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 5.0, 9.0, 8.0, 13.0, 6.0, 19.0, 13.0, 24.0, 18.0, 31.0, 21.0, 26.0, 39.0, 26.0, 36.0, 46.0, 34.0, 42.0, 44.0, 48.0, 44.0, 48.0, 45.0, 34.0, 43.0, 35.0, 30.0, 38.0, 24.0, 22.0, 22.0, 14.0, 19.0, 15.0, 11.0, 14.0, 6.0, 8.0, 3.0, 6.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-27.0625, -26.297119140625, -25.53173828125, -24.766357421875, -24.0009765625, -23.235595703125, -22.47021484375, -21.704833984375, -20.939453125, -20.174072265625, -19.40869140625, -18.643310546875, -17.8779296875, -17.112548828125, -16.34716796875, -15.581787109375, -14.81640625, -14.051025390625, -13.28564453125, -12.520263671875, -11.7548828125, -10.989501953125, -10.22412109375, -9.458740234375, -8.693359375, -7.927978515625, -7.16259765625, -6.397216796875, -5.6318359375, -4.866455078125, -4.10107421875, -3.335693359375, -2.5703125, -1.804931640625, -1.03955078125, -0.274169921875, 0.4912109375, 1.256591796875, 2.02197265625, 2.787353515625, 3.552734375, 4.318115234375, 5.08349609375, 5.848876953125, 6.6142578125, 7.379638671875, 8.14501953125, 8.910400390625, 9.67578125, 10.441162109375, 11.20654296875, 11.971923828125, 12.7373046875, 13.502685546875, 14.26806640625, 15.033447265625, 15.798828125, 16.564208984375, 17.32958984375, 18.094970703125, 18.8603515625, 19.625732421875, 20.39111328125, 21.156494140625, 21.921875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 7.0, 2.0, 5.0, 9.0, 11.0, 14.0, 41.0, 53.0, 69.0, 110.0, 194.0, 283.0, 464.0, 736.0, 1174.0, 1859.0, 3009.0, 5106.0, 8229.0, 13662.0, 22752.0, 36735.0, 56916.0, 82765.0, 109868.0, 130962.0, 137229.0, 126021.0, 102838.0, 75287.0, 50223.0, 31783.0, 19766.0, 11842.0, 7087.0, 4318.0, 2641.0, 1657.0, 1071.0, 633.0, 391.0, 257.0, 171.0, 103.0, 64.0, 43.0, 31.0, 24.0, 18.0, 11.0, 10.0, 8.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.5859375, -10.225341796875, -9.86474609375, -9.504150390625, -9.1435546875, -8.782958984375, -8.42236328125, -8.061767578125, -7.701171875, -7.340576171875, -6.97998046875, -6.619384765625, -6.2587890625, -5.898193359375, -5.53759765625, -5.177001953125, -4.81640625, -4.455810546875, -4.09521484375, -3.734619140625, -3.3740234375, -3.013427734375, -2.65283203125, -2.292236328125, -1.931640625, -1.571044921875, -1.21044921875, -0.849853515625, -0.4892578125, -0.128662109375, 0.23193359375, 0.592529296875, 0.953125, 1.313720703125, 1.67431640625, 2.034912109375, 2.3955078125, 2.756103515625, 3.11669921875, 3.477294921875, 3.837890625, 4.198486328125, 4.55908203125, 4.919677734375, 5.2802734375, 5.640869140625, 6.00146484375, 6.362060546875, 6.72265625, 7.083251953125, 7.44384765625, 7.804443359375, 8.1650390625, 8.525634765625, 8.88623046875, 9.246826171875, 9.607421875, 9.968017578125, 10.32861328125, 10.689208984375, 11.0498046875, 11.410400390625, 11.77099609375, 12.131591796875, 12.4921875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 5.0, 7.0, 7.0, 15.0, 12.0, 15.0, 24.0, 15.0, 18.0, 27.0, 30.0, 22.0, 30.0, 33.0, 42.0, 38.0, 52.0, 45.0, 41.0, 46.0, 38.0, 37.0, 31.0, 38.0, 44.0, 37.0, 29.0, 28.0, 19.0, 31.0, 16.0, 19.0, 21.0, 11.0, 9.0, 14.0, 16.0, 5.0, 5.0, 7.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00106048583984375, -0.0010278522968292236, -0.0009952187538146973, -0.0009625852108001709, -0.0009299516677856445, -0.0008973181247711182, -0.0008646845817565918, -0.0008320510387420654, -0.0007994174957275391, -0.0007667839527130127, -0.0007341504096984863, -0.00070151686668396, -0.0006688833236694336, -0.0006362497806549072, -0.0006036162376403809, -0.0005709826946258545, -0.0005383491516113281, -0.0005057156085968018, -0.0004730820655822754, -0.000440448522567749, -0.00040781497955322266, -0.0003751814365386963, -0.0003425478935241699, -0.00030991435050964355, -0.0002772808074951172, -0.0002446472644805908, -0.00021201372146606445, -0.00017938017845153809, -0.00014674663543701172, -0.00011411309242248535, -8.147954940795898e-05, -4.884600639343262e-05, -1.621246337890625e-05, 1.6421079635620117e-05, 4.9054622650146484e-05, 8.168816566467285e-05, 0.00011432170867919922, 0.00014695525169372559, 0.00017958879470825195, 0.00021222233772277832, 0.0002448558807373047, 0.00027748942375183105, 0.0003101229667663574, 0.0003427565097808838, 0.00037539005279541016, 0.0004080235958099365, 0.0004406571388244629, 0.00047329068183898926, 0.0005059242248535156, 0.000538557767868042, 0.0005711913108825684, 0.0006038248538970947, 0.0006364583969116211, 0.0006690919399261475, 0.0007017254829406738, 0.0007343590259552002, 0.0007669925689697266, 0.0007996261119842529, 0.0008322596549987793, 0.0008648931980133057, 0.000897526741027832, 0.0009301602840423584, 0.0009627938270568848, 0.0009954273700714111, 0.0010280609130859375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 6.0, 9.0, 10.0, 16.0, 22.0, 30.0, 43.0, 63.0, 80.0, 169.0, 239.0, 407.0, 723.0, 1217.0, 2258.0, 3994.0, 7449.0, 14008.0, 26347.0, 46875.0, 79317.0, 119245.0, 154922.0, 167833.0, 148694.0, 110735.0, 71652.0, 41930.0, 23056.0, 12308.0, 6555.0, 3594.0, 1979.0, 1125.0, 632.0, 365.0, 208.0, 162.0, 98.0, 48.0, 30.0, 26.0, 24.0, 21.0, 12.0, 6.0, 7.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.8984375, -13.4256591796875, -12.952880859375, -12.4801025390625, -12.00732421875, -11.5345458984375, -11.061767578125, -10.5889892578125, -10.1162109375, -9.6434326171875, -9.170654296875, -8.6978759765625, -8.22509765625, -7.7523193359375, -7.279541015625, -6.8067626953125, -6.333984375, -5.8612060546875, -5.388427734375, -4.9156494140625, -4.44287109375, -3.9700927734375, -3.497314453125, -3.0245361328125, -2.5517578125, -2.0789794921875, -1.606201171875, -1.1334228515625, -0.66064453125, -0.1878662109375, 0.284912109375, 0.7576904296875, 1.23046875, 1.7032470703125, 2.176025390625, 2.6488037109375, 3.12158203125, 3.5943603515625, 4.067138671875, 4.5399169921875, 5.0126953125, 5.4854736328125, 5.958251953125, 6.4310302734375, 6.90380859375, 7.3765869140625, 7.849365234375, 8.3221435546875, 8.794921875, 9.2677001953125, 9.740478515625, 10.2132568359375, 10.68603515625, 11.1588134765625, 11.631591796875, 12.1043701171875, 12.5771484375, 13.0499267578125, 13.522705078125, 13.9954833984375, 14.46826171875, 14.9410400390625, 15.413818359375, 15.8865966796875, 16.359375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 9.0, 3.0, 8.0, 3.0, 4.0, 7.0, 16.0, 10.0, 19.0, 24.0, 31.0, 29.0, 25.0, 43.0, 46.0, 48.0, 47.0, 41.0, 53.0, 45.0, 74.0, 57.0, 49.0, 48.0, 44.0, 28.0, 30.0, 36.0, 26.0, 18.0, 19.0, 13.0, 8.0, 9.0, 10.0, 6.0, 7.0, 3.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.40625, -6.21484375, -6.0234375, -5.83203125, -5.640625, -5.44921875, -5.2578125, -5.06640625, -4.875, -4.68359375, -4.4921875, -4.30078125, -4.109375, -3.91796875, -3.7265625, -3.53515625, -3.34375, -3.15234375, -2.9609375, -2.76953125, -2.578125, -2.38671875, -2.1953125, -2.00390625, -1.8125, -1.62109375, -1.4296875, -1.23828125, -1.046875, -0.85546875, -0.6640625, -0.47265625, -0.28125, -0.08984375, 0.1015625, 0.29296875, 0.484375, 0.67578125, 0.8671875, 1.05859375, 1.25, 1.44140625, 1.6328125, 1.82421875, 2.015625, 2.20703125, 2.3984375, 2.58984375, 2.78125, 2.97265625, 3.1640625, 3.35546875, 3.546875, 3.73828125, 3.9296875, 4.12109375, 4.3125, 4.50390625, 4.6953125, 4.88671875, 5.078125, 5.26953125, 5.4609375, 5.65234375, 5.84375]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 6.0, 11.0, 14.0, 12.0, 19.0, 17.0, 24.0, 28.0, 29.0, 32.0, 37.0, 44.0, 62.0, 41.0, 39.0, 47.0, 46.0, 44.0, 47.0, 48.0, 44.0, 32.0, 30.0, 41.0, 43.0, 32.0, 23.0, 19.0, 19.0, 15.0, 11.0, 11.0, 13.0, 6.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.589250564575195, -28.527496337890625, -27.465742111206055, -26.403987884521484, -25.342233657836914, -24.280479431152344, -23.218727111816406, -22.156970977783203, -21.095218658447266, -20.033464431762695, -18.971710205078125, -17.909955978393555, -16.848201751708984, -15.786447525024414, -14.72469425201416, -13.66294002532959, -12.601184844970703, -11.539430618286133, -10.477676391601562, -9.415922164916992, -8.354167938232422, -7.29241418838501, -6.230660438537598, -5.168906211853027, -4.107151985168457, -3.0453977584838867, -1.9836437702178955, -0.9218897819519043, 0.13986444473266602, 1.2016186714172363, 2.2633724212646484, 3.3251266479492188, 4.386878967285156, 5.448633193969727, 6.510387420654297, 7.572141170501709, 8.633895874023438, 9.695650100708008, 10.757403373718262, 11.819157600402832, 12.880911827087402, 13.942666053771973, 15.004420280456543, 16.066173553466797, 17.127927780151367, 18.189682006835938, 19.251436233520508, 20.313190460205078, 21.37494468688965, 22.43669891357422, 23.49845314025879, 24.56020736694336, 25.62196159362793, 26.6837158203125, 27.745468139648438, 28.80722427368164, 29.868976593017578, 30.93073081970215, 31.99248504638672, 33.054237365722656, 34.11599349975586, 35.1777458190918, 36.239501953125, 37.30125427246094, 38.36301040649414]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 4.0, 9.0, 10.0, 13.0, 16.0, 22.0, 18.0, 21.0, 35.0, 43.0, 35.0, 42.0, 38.0, 34.0, 36.0, 44.0, 53.0, 49.0, 51.0, 51.0, 43.0, 48.0, 39.0, 36.0, 29.0, 28.0, 20.0, 24.0, 23.0, 16.0, 11.0, 11.0, 14.0, 9.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-47.754581451416016, -46.424312591552734, -45.09404373168945, -43.76377487182617, -42.433502197265625, -41.103233337402344, -39.77296447753906, -38.44269561767578, -37.1124267578125, -35.78215789794922, -34.45188903808594, -33.121620178222656, -31.791349411010742, -30.46108055114746, -29.130809783935547, -27.800540924072266, -26.470272064208984, -25.140003204345703, -23.809734344482422, -22.479463577270508, -21.149194717407227, -19.818925857543945, -18.48865509033203, -17.15838623046875, -15.828117370605469, -14.497848510742188, -13.16757869720459, -11.837308883666992, -10.507040023803711, -9.17677116394043, -7.846501350402832, -6.516231536865234, -5.1859588623046875, -3.855689525604248, -2.5254201889038086, -1.1951508522033691, 0.1351184844970703, 1.4653878211975098, 2.795657157897949, 4.125926971435547, 5.456195831298828, 6.786465167999268, 8.116734504699707, 9.447004318237305, 10.777273178100586, 12.107542037963867, 13.437811851501465, 14.768081665039062, 16.098350524902344, 17.428619384765625, 18.758888244628906, 20.08915901184082, 21.4194278717041, 22.749696731567383, 24.079967498779297, 25.410236358642578, 26.74050521850586, 28.07077407836914, 29.401042938232422, 30.731313705444336, 32.06158447265625, 33.39185333251953, 34.72212219238281, 36.052391052246094, 37.382659912109375]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 11.0, 16.0, 22.0, 36.0, 60.0, 108.0, 176.0, 288.0, 495.0, 838.0, 1225.0, 2135.0, 3420.0, 5597.0, 9207.0, 14734.0, 23686.0, 37308.0, 57882.0, 87196.0, 127264.0, 179276.0, 241164.0, 307986.0, 368958.0, 413128.0, 428317.0, 412362.0, 368871.0, 307473.0, 241890.0, 179876.0, 128276.0, 87265.0, 57948.0, 37517.0, 24051.0, 14866.0, 9250.0, 5550.0, 3423.0, 2094.0, 1294.0, 705.0, 431.0, 264.0, 148.0, 89.0, 52.0, 28.0, 13.0, 7.0, 6.0, 3.0, 4.0, 2.0], "bins": [-23.265625, -22.59130859375, -21.9169921875, -21.24267578125, -20.568359375, -19.89404296875, -19.2197265625, -18.54541015625, -17.87109375, -17.19677734375, -16.5224609375, -15.84814453125, -15.173828125, -14.49951171875, -13.8251953125, -13.15087890625, -12.4765625, -11.80224609375, -11.1279296875, -10.45361328125, -9.779296875, -9.10498046875, -8.4306640625, -7.75634765625, -7.08203125, -6.40771484375, -5.7333984375, -5.05908203125, -4.384765625, -3.71044921875, -3.0361328125, -2.36181640625, -1.6875, -1.01318359375, -0.3388671875, 0.33544921875, 1.009765625, 1.68408203125, 2.3583984375, 3.03271484375, 3.70703125, 4.38134765625, 5.0556640625, 5.72998046875, 6.404296875, 7.07861328125, 7.7529296875, 8.42724609375, 9.1015625, 9.77587890625, 10.4501953125, 11.12451171875, 11.798828125, 12.47314453125, 13.1474609375, 13.82177734375, 14.49609375, 15.17041015625, 15.8447265625, 16.51904296875, 17.193359375, 17.86767578125, 18.5419921875, 19.21630859375, 19.890625]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 5.0, 4.0, 2.0, 8.0, 2.0, 11.0, 8.0, 14.0, 14.0, 17.0, 23.0, 22.0, 36.0, 39.0, 35.0, 38.0, 41.0, 30.0, 38.0, 42.0, 51.0, 50.0, 55.0, 48.0, 36.0, 55.0, 48.0, 34.0, 27.0, 27.0, 21.0, 28.0, 21.0, 16.0, 10.0, 14.0, 14.0, 9.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-41.21875, -40.083251953125, -38.94775390625, -37.812255859375, -36.6767578125, -35.541259765625, -34.40576171875, -33.270263671875, -32.134765625, -30.999267578125, -29.86376953125, -28.728271484375, -27.5927734375, -26.457275390625, -25.32177734375, -24.186279296875, -23.05078125, -21.915283203125, -20.77978515625, -19.644287109375, -18.5087890625, -17.373291015625, -16.23779296875, -15.102294921875, -13.966796875, -12.831298828125, -11.69580078125, -10.560302734375, -9.4248046875, -8.289306640625, -7.15380859375, -6.018310546875, -4.8828125, -3.747314453125, -2.61181640625, -1.476318359375, -0.3408203125, 0.794677734375, 1.93017578125, 3.065673828125, 4.201171875, 5.336669921875, 6.47216796875, 7.607666015625, 8.7431640625, 9.878662109375, 11.01416015625, 12.149658203125, 13.28515625, 14.420654296875, 15.55615234375, 16.691650390625, 17.8271484375, 18.962646484375, 20.09814453125, 21.233642578125, 22.369140625, 23.504638671875, 24.64013671875, 25.775634765625, 26.9111328125, 28.046630859375, 29.18212890625, 30.317626953125, 31.453125]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 5.0, 12.0, 16.0, 19.0, 51.0, 74.0, 139.0, 255.0, 361.0, 613.0, 1042.0, 1680.0, 2818.0, 4466.0, 7043.0, 11308.0, 17089.0, 26159.0, 38851.0, 56725.0, 80220.0, 109626.0, 145421.0, 187978.0, 232273.0, 274289.0, 310978.0, 337015.0, 347707.0, 344481.0, 324428.0, 290703.0, 251013.0, 206104.0, 163533.0, 125435.0, 92873.0, 66214.0, 46195.0, 31440.0, 21149.0, 13412.0, 8858.0, 5475.0, 3413.0, 2156.0, 1231.0, 782.0, 460.0, 274.0, 196.0, 99.0, 58.0, 38.0, 23.0, 10.0, 3.0, 3.0, 1.0, 2.0], "bins": [-19.828125, -19.22216796875, -18.6162109375, -18.01025390625, -17.404296875, -16.79833984375, -16.1923828125, -15.58642578125, -14.98046875, -14.37451171875, -13.7685546875, -13.16259765625, -12.556640625, -11.95068359375, -11.3447265625, -10.73876953125, -10.1328125, -9.52685546875, -8.9208984375, -8.31494140625, -7.708984375, -7.10302734375, -6.4970703125, -5.89111328125, -5.28515625, -4.67919921875, -4.0732421875, -3.46728515625, -2.861328125, -2.25537109375, -1.6494140625, -1.04345703125, -0.4375, 0.16845703125, 0.7744140625, 1.38037109375, 1.986328125, 2.59228515625, 3.1982421875, 3.80419921875, 4.41015625, 5.01611328125, 5.6220703125, 6.22802734375, 6.833984375, 7.43994140625, 8.0458984375, 8.65185546875, 9.2578125, 9.86376953125, 10.4697265625, 11.07568359375, 11.681640625, 12.28759765625, 12.8935546875, 13.49951171875, 14.10546875, 14.71142578125, 15.3173828125, 15.92333984375, 16.529296875, 17.13525390625, 17.7412109375, 18.34716796875, 18.953125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 8.0, 4.0, 6.0, 12.0, 13.0, 22.0, 37.0, 37.0, 48.0, 53.0, 61.0, 71.0, 85.0, 88.0, 119.0, 114.0, 145.0, 133.0, 158.0, 156.0, 186.0, 182.0, 192.0, 206.0, 184.0, 183.0, 195.0, 183.0, 167.0, 125.0, 122.0, 116.0, 109.0, 99.0, 80.0, 77.0, 59.0, 46.0, 45.0, 37.0, 28.0, 16.0, 21.0, 16.0, 8.0, 6.0, 6.0, 7.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-12.34375, -11.936767578125, -11.52978515625, -11.122802734375, -10.7158203125, -10.308837890625, -9.90185546875, -9.494873046875, -9.087890625, -8.680908203125, -8.27392578125, -7.866943359375, -7.4599609375, -7.052978515625, -6.64599609375, -6.239013671875, -5.83203125, -5.425048828125, -5.01806640625, -4.611083984375, -4.2041015625, -3.797119140625, -3.39013671875, -2.983154296875, -2.576171875, -2.169189453125, -1.76220703125, -1.355224609375, -0.9482421875, -0.541259765625, -0.13427734375, 0.272705078125, 0.6796875, 1.086669921875, 1.49365234375, 1.900634765625, 2.3076171875, 2.714599609375, 3.12158203125, 3.528564453125, 3.935546875, 4.342529296875, 4.74951171875, 5.156494140625, 5.5634765625, 5.970458984375, 6.37744140625, 6.784423828125, 7.19140625, 7.598388671875, 8.00537109375, 8.412353515625, 8.8193359375, 9.226318359375, 9.63330078125, 10.040283203125, 10.447265625, 10.854248046875, 11.26123046875, 11.668212890625, 12.0751953125, 12.482177734375, 12.88916015625, 13.296142578125, 13.703125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 10.0, 5.0, 9.0, 7.0, 12.0, 15.0, 19.0, 18.0, 22.0, 21.0, 33.0, 37.0, 39.0, 34.0, 55.0, 44.0, 58.0, 60.0, 43.0, 49.0, 51.0, 39.0, 44.0, 46.0, 30.0, 29.0, 31.0, 21.0, 27.0, 20.0, 13.0, 13.0, 7.0, 10.0, 7.0, 13.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-33.40149688720703, -32.34184646606445, -31.28219223022461, -30.2225399017334, -29.162887573242188, -28.103235244750977, -27.043582916259766, -25.983932495117188, -24.924278259277344, -23.864625930786133, -22.804973602294922, -21.74532127380371, -20.6856689453125, -19.62601661682129, -18.566364288330078, -17.5067138671875, -16.44706153869629, -15.387409210205078, -14.327756881713867, -13.268104553222656, -12.208452224731445, -11.148799896240234, -10.08914852142334, -9.029496192932129, -7.969843864440918, -6.910191535949707, -5.850539207458496, -4.790887355804443, -3.7312350273132324, -2.6715826988220215, -1.6119308471679688, -0.5522785186767578, 0.5073738098144531, 1.5670260190963745, 2.626678228378296, 3.6863303184509277, 4.745982646942139, 5.80563497543335, 6.865286827087402, 7.924939155578613, 8.984591484069824, 10.044243812561035, 11.103896141052246, 12.16354751586914, 13.223199844360352, 14.282852172851562, 15.342504501342773, 16.402156829833984, 17.461809158325195, 18.521461486816406, 19.581113815307617, 20.640766143798828, 21.70041847229004, 22.76007080078125, 23.819721221923828, 24.879375457763672, 25.93902587890625, 26.99867820739746, 28.058330535888672, 29.117982864379883, 30.177635192871094, 31.237287521362305, 32.296939849853516, 33.356590270996094, 34.41624450683594]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 8.0, 5.0, 12.0, 10.0, 12.0, 13.0, 22.0, 30.0, 15.0, 38.0, 45.0, 33.0, 42.0, 43.0, 40.0, 48.0, 39.0, 43.0, 46.0, 44.0, 44.0, 46.0, 49.0, 37.0, 36.0, 42.0, 22.0, 25.0, 14.0, 22.0, 15.0, 14.0, 12.0, 4.0, 7.0, 4.0, 9.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-43.51961898803711, -42.22698211669922, -40.93434143066406, -39.64170455932617, -38.349063873291016, -37.056427001953125, -35.76378631591797, -34.47114944458008, -33.17851257324219, -31.885873794555664, -30.59323501586914, -29.300596237182617, -28.007957458496094, -26.715320587158203, -25.42268180847168, -24.130043029785156, -22.83740234375, -21.544763565063477, -20.252124786376953, -18.95948600769043, -17.666847229003906, -16.374210357666016, -15.081571578979492, -13.788932800292969, -12.496294021606445, -11.203655242919922, -9.911016464233398, -8.618378639221191, -7.325739860534668, -6.0331010818481445, -4.740462779998779, -3.447824478149414, -2.155181884765625, -0.8625433444976807, 0.43009519577026367, 1.722733736038208, 3.0153722763061523, 4.308011054992676, 5.600649356842041, 6.893287658691406, 8.18592643737793, 9.478565216064453, 10.771203994750977, 12.063841819763184, 13.356480598449707, 14.64911937713623, 15.941757202148438, 17.23439598083496, 18.527034759521484, 19.819673538208008, 21.11231231689453, 22.404951095581055, 23.697589874267578, 24.99022674560547, 26.282865524291992, 27.575504302978516, 28.86814308166504, 30.160781860351562, 31.453420639038086, 32.74605941772461, 34.0386962890625, 35.331336975097656, 36.62397384643555, 37.91661071777344, 39.209251403808594]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 10.0, 8.0, 15.0, 19.0, 22.0, 36.0, 46.0, 64.0, 97.0, 144.0, 166.0, 240.0, 338.0, 489.0, 677.0, 1003.0, 1510.0, 2622.0, 4421.0, 8797.0, 21597.0, 63132.0, 219035.0, 445126.0, 186020.0, 54377.0, 19228.0, 8051.0, 4048.0, 2470.0, 1497.0, 976.0, 693.0, 435.0, 335.0, 189.0, 186.0, 130.0, 81.0, 68.0, 39.0, 31.0, 39.0, 13.0, 11.0, 4.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.46875, -18.8291015625, -18.189453125, -17.5498046875, -16.91015625, -16.2705078125, -15.630859375, -14.9912109375, -14.3515625, -13.7119140625, -13.072265625, -12.4326171875, -11.79296875, -11.1533203125, -10.513671875, -9.8740234375, -9.234375, -8.5947265625, -7.955078125, -7.3154296875, -6.67578125, -6.0361328125, -5.396484375, -4.7568359375, -4.1171875, -3.4775390625, -2.837890625, -2.1982421875, -1.55859375, -0.9189453125, -0.279296875, 0.3603515625, 1.0, 1.6396484375, 2.279296875, 2.9189453125, 3.55859375, 4.1982421875, 4.837890625, 5.4775390625, 6.1171875, 6.7568359375, 7.396484375, 8.0361328125, 8.67578125, 9.3154296875, 9.955078125, 10.5947265625, 11.234375, 11.8740234375, 12.513671875, 13.1533203125, 13.79296875, 14.4326171875, 15.072265625, 15.7119140625, 16.3515625, 16.9912109375, 17.630859375, 18.2705078125, 18.91015625, 19.5498046875, 20.189453125, 20.8291015625, 21.46875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 7.0, 5.0, 13.0, 10.0, 11.0, 13.0, 23.0, 30.0, 17.0, 35.0, 46.0, 35.0, 40.0, 43.0, 43.0, 45.0, 38.0, 48.0, 43.0, 43.0, 43.0, 46.0, 50.0, 38.0, 36.0, 40.0, 24.0, 24.0, 14.0, 21.0, 15.0, 14.0, 12.0, 4.0, 7.0, 6.0, 9.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-43.53125, -42.240234375, -40.94921875, -39.658203125, -38.3671875, -37.076171875, -35.78515625, -34.494140625, -33.203125, -31.912109375, -30.62109375, -29.330078125, -28.0390625, -26.748046875, -25.45703125, -24.166015625, -22.875, -21.583984375, -20.29296875, -19.001953125, -17.7109375, -16.419921875, -15.12890625, -13.837890625, -12.546875, -11.255859375, -9.96484375, -8.673828125, -7.3828125, -6.091796875, -4.80078125, -3.509765625, -2.21875, -0.927734375, 0.36328125, 1.654296875, 2.9453125, 4.236328125, 5.52734375, 6.818359375, 8.109375, 9.400390625, 10.69140625, 11.982421875, 13.2734375, 14.564453125, 15.85546875, 17.146484375, 18.4375, 19.728515625, 21.01953125, 22.310546875, 23.6015625, 24.892578125, 26.18359375, 27.474609375, 28.765625, 30.056640625, 31.34765625, 32.638671875, 33.9296875, 35.220703125, 36.51171875, 37.802734375, 39.09375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 7.0, 14.0, 15.0, 18.0, 31.0, 37.0, 39.0, 62.0, 89.0, 107.0, 151.0, 233.0, 348.0, 581.0, 935.0, 1702.0, 3449.0, 9174.0, 34371.0, 307696.0, 603326.0, 62802.0, 13496.0, 4556.0, 2164.0, 1116.0, 667.0, 425.0, 286.0, 187.0, 131.0, 93.0, 64.0, 59.0, 27.0, 21.0, 22.0, 17.0, 13.0, 5.0, 10.0, 5.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-27.890625, -27.0234375, -26.15625, -25.2890625, -24.421875, -23.5546875, -22.6875, -21.8203125, -20.953125, -20.0859375, -19.21875, -18.3515625, -17.484375, -16.6171875, -15.75, -14.8828125, -14.015625, -13.1484375, -12.28125, -11.4140625, -10.546875, -9.6796875, -8.8125, -7.9453125, -7.078125, -6.2109375, -5.34375, -4.4765625, -3.609375, -2.7421875, -1.875, -1.0078125, -0.140625, 0.7265625, 1.59375, 2.4609375, 3.328125, 4.1953125, 5.0625, 5.9296875, 6.796875, 7.6640625, 8.53125, 9.3984375, 10.265625, 11.1328125, 12.0, 12.8671875, 13.734375, 14.6015625, 15.46875, 16.3359375, 17.203125, 18.0703125, 18.9375, 19.8046875, 20.671875, 21.5390625, 22.40625, 23.2734375, 24.140625, 25.0078125, 25.875, 26.7421875, 27.609375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 5.0, 8.0, 10.0, 13.0, 4.0, 9.0, 18.0, 18.0, 19.0, 26.0, 22.0, 25.0, 29.0, 30.0, 32.0, 41.0, 48.0, 49.0, 43.0, 42.0, 49.0, 47.0, 50.0, 40.0, 38.0, 37.0, 28.0, 23.0, 32.0, 28.0, 25.0, 20.0, 18.0, 8.0, 18.0, 12.0, 4.0, 8.0, 4.0, 4.0, 2.0, 2.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.90625, -24.0078125, -23.109375, -22.2109375, -21.3125, -20.4140625, -19.515625, -18.6171875, -17.71875, -16.8203125, -15.921875, -15.0234375, -14.125, -13.2265625, -12.328125, -11.4296875, -10.53125, -9.6328125, -8.734375, -7.8359375, -6.9375, -6.0390625, -5.140625, -4.2421875, -3.34375, -2.4453125, -1.546875, -0.6484375, 0.25, 1.1484375, 2.046875, 2.9453125, 3.84375, 4.7421875, 5.640625, 6.5390625, 7.4375, 8.3359375, 9.234375, 10.1328125, 11.03125, 11.9296875, 12.828125, 13.7265625, 14.625, 15.5234375, 16.421875, 17.3203125, 18.21875, 19.1171875, 20.015625, 20.9140625, 21.8125, 22.7109375, 23.609375, 24.5078125, 25.40625, 26.3046875, 27.203125, 28.1015625, 29.0, 29.8984375, 30.796875, 31.6953125, 32.59375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 5.0, 3.0, 0.0, 4.0, 9.0, 10.0, 14.0, 9.0, 27.0, 40.0, 39.0, 56.0, 61.0, 82.0, 114.0, 126.0, 189.0, 265.0, 329.0, 497.0, 686.0, 1165.0, 1895.0, 4017.0, 10024.0, 40240.0, 558164.0, 379810.0, 32852.0, 8826.0, 3624.0, 1866.0, 1040.0, 645.0, 480.0, 314.0, 233.0, 189.0, 154.0, 104.0, 87.0, 59.0, 47.0, 37.0, 28.0, 28.0, 24.0, 13.0, 11.0, 4.0, 5.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8203125, -15.2918701171875, -14.763427734375, -14.2349853515625, -13.70654296875, -13.1781005859375, -12.649658203125, -12.1212158203125, -11.5927734375, -11.0643310546875, -10.535888671875, -10.0074462890625, -9.47900390625, -8.9505615234375, -8.422119140625, -7.8936767578125, -7.365234375, -6.8367919921875, -6.308349609375, -5.7799072265625, -5.25146484375, -4.7230224609375, -4.194580078125, -3.6661376953125, -3.1376953125, -2.6092529296875, -2.080810546875, -1.5523681640625, -1.02392578125, -0.4954833984375, 0.032958984375, 0.5614013671875, 1.08984375, 1.6182861328125, 2.146728515625, 2.6751708984375, 3.20361328125, 3.7320556640625, 4.260498046875, 4.7889404296875, 5.3173828125, 5.8458251953125, 6.374267578125, 6.9027099609375, 7.43115234375, 7.9595947265625, 8.488037109375, 9.0164794921875, 9.544921875, 10.0733642578125, 10.601806640625, 11.1302490234375, 11.65869140625, 12.1871337890625, 12.715576171875, 13.2440185546875, 13.7724609375, 14.3009033203125, 14.829345703125, 15.3577880859375, 15.88623046875, 16.4146728515625, 16.943115234375, 17.4715576171875, 18.0]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 7.0, 12.0, 20.0, 37.0, 51.0, 73.0, 105.0, 151.0, 134.0, 135.0, 90.0, 53.0, 39.0, 30.0, 21.0, 9.0, 6.0, 9.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008521080017089844, -0.0008221343159675598, -0.0007921606302261353, -0.0007621869444847107, -0.0007322132587432861, -0.0007022395730018616, -0.000672265887260437, -0.0006422922015190125, -0.0006123185157775879, -0.0005823448300361633, -0.0005523711442947388, -0.0005223974585533142, -0.0004924237728118896, -0.0004624500870704651, -0.00043247640132904053, -0.00040250271558761597, -0.0003725290298461914, -0.00034255534410476685, -0.0003125816583633423, -0.0002826079726219177, -0.00025263428688049316, -0.0002226606011390686, -0.00019268691539764404, -0.00016271322965621948, -0.00013273954391479492, -0.00010276585817337036, -7.27921724319458e-05, -4.281848669052124e-05, -1.284480094909668e-05, 1.712888479232788e-05, 4.710257053375244e-05, 7.7076256275177e-05, 0.00010704994201660156, 0.00013702362775802612, 0.00016699731349945068, 0.00019697099924087524, 0.0002269446849822998, 0.00025691837072372437, 0.0002868920564651489, 0.0003168657422065735, 0.00034683942794799805, 0.0003768131136894226, 0.00040678679943084717, 0.00043676048517227173, 0.0004667341709136963, 0.0004967078566551208, 0.0005266815423965454, 0.00055665522813797, 0.0005866289138793945, 0.0006166025996208191, 0.0006465762853622437, 0.0006765499711036682, 0.0007065236568450928, 0.0007364973425865173, 0.0007664710283279419, 0.0007964447140693665, 0.000826418399810791, 0.0008563920855522156, 0.0008863657712936401, 0.0009163394570350647, 0.0009463131427764893, 0.0009762868285179138, 0.0010062605142593384, 0.001036234200000763, 0.0010662078857421875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 10.0, 6.0, 11.0, 19.0, 21.0, 18.0, 39.0, 62.0, 79.0, 92.0, 151.0, 183.0, 256.0, 359.0, 476.0, 674.0, 841.0, 1193.0, 1773.0, 2612.0, 3942.0, 6594.0, 12129.0, 24370.0, 54769.0, 131246.0, 293908.0, 283574.0, 123946.0, 51831.0, 23147.0, 11498.0, 6431.0, 3730.0, 2474.0, 1660.0, 1168.0, 868.0, 603.0, 486.0, 343.0, 289.0, 195.0, 129.0, 110.0, 66.0, 61.0, 37.0, 30.0, 11.0, 14.0, 15.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-8.890625, -8.603515625, -8.31640625, -8.029296875, -7.7421875, -7.455078125, -7.16796875, -6.880859375, -6.59375, -6.306640625, -6.01953125, -5.732421875, -5.4453125, -5.158203125, -4.87109375, -4.583984375, -4.296875, -4.009765625, -3.72265625, -3.435546875, -3.1484375, -2.861328125, -2.57421875, -2.287109375, -2.0, -1.712890625, -1.42578125, -1.138671875, -0.8515625, -0.564453125, -0.27734375, 0.009765625, 0.296875, 0.583984375, 0.87109375, 1.158203125, 1.4453125, 1.732421875, 2.01953125, 2.306640625, 2.59375, 2.880859375, 3.16796875, 3.455078125, 3.7421875, 4.029296875, 4.31640625, 4.603515625, 4.890625, 5.177734375, 5.46484375, 5.751953125, 6.0390625, 6.326171875, 6.61328125, 6.900390625, 7.1875, 7.474609375, 7.76171875, 8.048828125, 8.3359375, 8.623046875, 8.91015625, 9.197265625, 9.484375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 0.0, 5.0, 8.0, 9.0, 11.0, 15.0, 27.0, 31.0, 48.0, 60.0, 59.0, 69.0, 153.0, 149.0, 85.0, 62.0, 56.0, 38.0, 37.0, 23.0, 15.0, 16.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.328125, -6.15692138671875, -5.9857177734375, -5.81451416015625, -5.643310546875, -5.47210693359375, -5.3009033203125, -5.12969970703125, -4.95849609375, -4.78729248046875, -4.6160888671875, -4.44488525390625, -4.273681640625, -4.10247802734375, -3.9312744140625, -3.76007080078125, -3.5888671875, -3.41766357421875, -3.2464599609375, -3.07525634765625, -2.904052734375, -2.73284912109375, -2.5616455078125, -2.39044189453125, -2.21923828125, -2.04803466796875, -1.8768310546875, -1.70562744140625, -1.534423828125, -1.36322021484375, -1.1920166015625, -1.02081298828125, -0.849609375, -0.67840576171875, -0.5072021484375, -0.33599853515625, -0.164794921875, 0.00640869140625, 0.1776123046875, 0.34881591796875, 0.52001953125, 0.69122314453125, 0.8624267578125, 1.03363037109375, 1.204833984375, 1.37603759765625, 1.5472412109375, 1.71844482421875, 1.8896484375, 2.06085205078125, 2.2320556640625, 2.40325927734375, 2.574462890625, 2.74566650390625, 2.9168701171875, 3.08807373046875, 3.25927734375, 3.43048095703125, 3.6016845703125, 3.77288818359375, 3.944091796875, 4.11529541015625, 4.2864990234375, 4.45770263671875, 4.62890625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 10.0, 5.0, 10.0, 14.0, 15.0, 20.0, 20.0, 23.0, 31.0, 30.0, 31.0, 52.0, 44.0, 43.0, 52.0, 49.0, 41.0, 60.0, 54.0, 55.0, 32.0, 36.0, 41.0, 32.0, 21.0, 37.0, 25.0, 17.0, 18.0, 15.0, 12.0, 10.0, 7.0, 6.0, 10.0, 5.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-33.68431854248047, -32.63035583496094, -31.57638931274414, -30.522424697875977, -29.468460083007812, -28.41449737548828, -27.360532760620117, -26.306568145751953, -25.25260353088379, -24.198638916015625, -23.14467430114746, -22.090709686279297, -21.036746978759766, -19.98278045654297, -18.928817749023438, -17.874853134155273, -16.82088851928711, -15.766923904418945, -14.712959289550781, -13.658995628356934, -12.60503101348877, -11.551066398620605, -10.497102737426758, -9.443138122558594, -8.38917350769043, -7.335208892822266, -6.28124475479126, -5.227280616760254, -4.17331600189209, -3.119351387023926, -2.06538724899292, -1.011423110961914, 0.042537689208984375, 1.0965020656585693, 2.1504664421081543, 3.2044308185577393, 4.258395195007324, 5.312359809875488, 6.366323947906494, 7.4202880859375, 8.474252700805664, 9.528217315673828, 10.582181930541992, 11.63614559173584, 12.690110206604004, 13.744074821472168, 14.798038482666016, 15.85200309753418, 16.905967712402344, 17.959932327270508, 19.013896942138672, 20.067861557006836, 21.121826171875, 22.17578887939453, 23.229753494262695, 24.28371810913086, 25.337682723999023, 26.391647338867188, 27.44561195373535, 28.499576568603516, 29.553539276123047, 30.607505798339844, 31.661468505859375, 32.715431213378906, 33.7693977355957]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 8.0, 6.0, 15.0, 9.0, 11.0, 23.0, 20.0, 32.0, 23.0, 33.0, 44.0, 43.0, 34.0, 48.0, 43.0, 45.0, 42.0, 59.0, 36.0, 45.0, 43.0, 43.0, 48.0, 32.0, 36.0, 40.0, 20.0, 24.0, 12.0, 16.0, 12.0, 13.0, 7.0, 7.0, 9.0, 5.0, 4.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-44.84357452392578, -43.52841567993164, -42.213253021240234, -40.898094177246094, -39.58293533325195, -38.26777648925781, -36.952613830566406, -35.637454986572266, -34.322296142578125, -33.007137298583984, -31.69197654724121, -30.376815795898438, -29.061656951904297, -27.746496200561523, -26.43133544921875, -25.11617660522461, -23.801015853881836, -22.485855102539062, -21.170696258544922, -19.85553550720215, -18.540376663208008, -17.225215911865234, -15.910056114196777, -14.59489631652832, -13.279736518859863, -11.964576721191406, -10.64941692352295, -9.334257125854492, -8.019096374511719, -6.70393705368042, -5.388776779174805, -4.073616981506348, -2.7584571838378906, -1.443297266960144, -0.12813735008239746, 1.1870226860046387, 2.5021824836730957, 3.8173422813415527, 5.132502555847168, 6.447662353515625, 7.762822151184082, 9.077981948852539, 10.393141746520996, 11.708301544189453, 13.023462295532227, 14.338621139526367, 15.65378189086914, 16.96894073486328, 18.284101486206055, 19.599262237548828, 20.91442108154297, 22.229581832885742, 23.544740676879883, 24.859901428222656, 26.175060272216797, 27.49022102355957, 28.805381774902344, 30.120542526245117, 31.435701370239258, 32.75086212158203, 34.06602096557617, 35.38117980957031, 36.69634246826172, 38.01150131225586, 39.32666015625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 6.0, 4.0, 5.0, 7.0, 19.0, 12.0, 44.0, 50.0, 98.0, 127.0, 186.0, 313.0, 565.0, 833.0, 1352.0, 2068.0, 3258.0, 4937.0, 7578.0, 11304.0, 16280.0, 23088.0, 32242.0, 42883.0, 54693.0, 67209.0, 79356.0, 88280.0, 92939.0, 92608.0, 87716.0, 78290.0, 66401.0, 53361.0, 41431.0, 30450.0, 22122.0, 15497.0, 10602.0, 7200.0, 4858.0, 3005.0, 1940.0, 1229.0, 848.0, 424.0, 315.0, 186.0, 141.0, 78.0, 57.0, 28.0, 20.0, 8.0, 8.0, 5.0, 7.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.265625, -16.70751953125, -16.1494140625, -15.59130859375, -15.033203125, -14.47509765625, -13.9169921875, -13.35888671875, -12.80078125, -12.24267578125, -11.6845703125, -11.12646484375, -10.568359375, -10.01025390625, -9.4521484375, -8.89404296875, -8.3359375, -7.77783203125, -7.2197265625, -6.66162109375, -6.103515625, -5.54541015625, -4.9873046875, -4.42919921875, -3.87109375, -3.31298828125, -2.7548828125, -2.19677734375, -1.638671875, -1.08056640625, -0.5224609375, 0.03564453125, 0.59375, 1.15185546875, 1.7099609375, 2.26806640625, 2.826171875, 3.38427734375, 3.9423828125, 4.50048828125, 5.05859375, 5.61669921875, 6.1748046875, 6.73291015625, 7.291015625, 7.84912109375, 8.4072265625, 8.96533203125, 9.5234375, 10.08154296875, 10.6396484375, 11.19775390625, 11.755859375, 12.31396484375, 12.8720703125, 13.43017578125, 13.98828125, 14.54638671875, 15.1044921875, 15.66259765625, 16.220703125, 16.77880859375, 17.3369140625, 17.89501953125, 18.453125]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 8.0, 5.0, 13.0, 11.0, 10.0, 20.0, 23.0, 31.0, 21.0, 34.0, 42.0, 41.0, 36.0, 46.0, 46.0, 41.0, 44.0, 55.0, 43.0, 43.0, 40.0, 43.0, 49.0, 30.0, 40.0, 38.0, 24.0, 23.0, 12.0, 17.0, 13.0, 13.0, 8.0, 7.0, 10.0, 3.0, 5.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-43.78125, -42.5029296875, -41.224609375, -39.9462890625, -38.66796875, -37.3896484375, -36.111328125, -34.8330078125, -33.5546875, -32.2763671875, -30.998046875, -29.7197265625, -28.44140625, -27.1630859375, -25.884765625, -24.6064453125, -23.328125, -22.0498046875, -20.771484375, -19.4931640625, -18.21484375, -16.9365234375, -15.658203125, -14.3798828125, -13.1015625, -11.8232421875, -10.544921875, -9.2666015625, -7.98828125, -6.7099609375, -5.431640625, -4.1533203125, -2.875, -1.5966796875, -0.318359375, 0.9599609375, 2.23828125, 3.5166015625, 4.794921875, 6.0732421875, 7.3515625, 8.6298828125, 9.908203125, 11.1865234375, 12.46484375, 13.7431640625, 15.021484375, 16.2998046875, 17.578125, 18.8564453125, 20.134765625, 21.4130859375, 22.69140625, 23.9697265625, 25.248046875, 26.5263671875, 27.8046875, 29.0830078125, 30.361328125, 31.6396484375, 32.91796875, 34.1962890625, 35.474609375, 36.7529296875, 38.03125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 2.0, 2.0, 7.0, 6.0, 9.0, 21.0, 33.0, 48.0, 81.0, 113.0, 195.0, 329.0, 486.0, 809.0, 1296.0, 2089.0, 3325.0, 5277.0, 8230.0, 12618.0, 18849.0, 27369.0, 38832.0, 52106.0, 66585.0, 81004.0, 93599.0, 100744.0, 101020.0, 95705.0, 83973.0, 69686.0, 54832.0, 41197.0, 29508.0, 20332.0, 13526.0, 9023.0, 5828.0, 3720.0, 2296.0, 1446.0, 904.0, 593.0, 328.0, 237.0, 142.0, 69.0, 46.0, 38.0, 25.0, 9.0, 5.0, 5.0, 8.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-18.703125, -18.081787109375, -17.46044921875, -16.839111328125, -16.2177734375, -15.596435546875, -14.97509765625, -14.353759765625, -13.732421875, -13.111083984375, -12.48974609375, -11.868408203125, -11.2470703125, -10.625732421875, -10.00439453125, -9.383056640625, -8.76171875, -8.140380859375, -7.51904296875, -6.897705078125, -6.2763671875, -5.655029296875, -5.03369140625, -4.412353515625, -3.791015625, -3.169677734375, -2.54833984375, -1.927001953125, -1.3056640625, -0.684326171875, -0.06298828125, 0.558349609375, 1.1796875, 1.801025390625, 2.42236328125, 3.043701171875, 3.6650390625, 4.286376953125, 4.90771484375, 5.529052734375, 6.150390625, 6.771728515625, 7.39306640625, 8.014404296875, 8.6357421875, 9.257080078125, 9.87841796875, 10.499755859375, 11.12109375, 11.742431640625, 12.36376953125, 12.985107421875, 13.6064453125, 14.227783203125, 14.84912109375, 15.470458984375, 16.091796875, 16.713134765625, 17.33447265625, 17.955810546875, 18.5771484375, 19.198486328125, 19.81982421875, 20.441162109375, 21.0625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 2.0, 1.0, 8.0, 6.0, 4.0, 6.0, 11.0, 15.0, 12.0, 19.0, 17.0, 23.0, 25.0, 31.0, 31.0, 28.0, 39.0, 31.0, 36.0, 34.0, 44.0, 35.0, 43.0, 38.0, 48.0, 41.0, 43.0, 38.0, 34.0, 22.0, 21.0, 28.0, 25.0, 32.0, 20.0, 24.0, 15.0, 12.0, 20.0, 13.0, 7.0, 3.0, 12.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.359375, -21.6533203125, -20.947265625, -20.2412109375, -19.53515625, -18.8291015625, -18.123046875, -17.4169921875, -16.7109375, -16.0048828125, -15.298828125, -14.5927734375, -13.88671875, -13.1806640625, -12.474609375, -11.7685546875, -11.0625, -10.3564453125, -9.650390625, -8.9443359375, -8.23828125, -7.5322265625, -6.826171875, -6.1201171875, -5.4140625, -4.7080078125, -4.001953125, -3.2958984375, -2.58984375, -1.8837890625, -1.177734375, -0.4716796875, 0.234375, 0.9404296875, 1.646484375, 2.3525390625, 3.05859375, 3.7646484375, 4.470703125, 5.1767578125, 5.8828125, 6.5888671875, 7.294921875, 8.0009765625, 8.70703125, 9.4130859375, 10.119140625, 10.8251953125, 11.53125, 12.2373046875, 12.943359375, 13.6494140625, 14.35546875, 15.0615234375, 15.767578125, 16.4736328125, 17.1796875, 17.8857421875, 18.591796875, 19.2978515625, 20.00390625, 20.7099609375, 21.416015625, 22.1220703125, 22.828125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 6.0, 13.0, 19.0, 27.0, 25.0, 55.0, 96.0, 124.0, 215.0, 378.0, 640.0, 1219.0, 2273.0, 4134.0, 7654.0, 13905.0, 24412.0, 41278.0, 65792.0, 95277.0, 124407.0, 142207.0, 142630.0, 124006.0, 95602.0, 65813.0, 41619.0, 24481.0, 13662.0, 7539.0, 4051.0, 2211.0, 1221.0, 641.0, 369.0, 214.0, 138.0, 72.0, 46.0, 30.0, 20.0, 9.0, 4.0, 6.0, 10.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-12.1796875, -11.8316650390625, -11.483642578125, -11.1356201171875, -10.78759765625, -10.4395751953125, -10.091552734375, -9.7435302734375, -9.3955078125, -9.0474853515625, -8.699462890625, -8.3514404296875, -8.00341796875, -7.6553955078125, -7.307373046875, -6.9593505859375, -6.611328125, -6.2633056640625, -5.915283203125, -5.5672607421875, -5.21923828125, -4.8712158203125, -4.523193359375, -4.1751708984375, -3.8271484375, -3.4791259765625, -3.131103515625, -2.7830810546875, -2.43505859375, -2.0870361328125, -1.739013671875, -1.3909912109375, -1.04296875, -0.6949462890625, -0.346923828125, 0.0010986328125, 0.34912109375, 0.6971435546875, 1.045166015625, 1.3931884765625, 1.7412109375, 2.0892333984375, 2.437255859375, 2.7852783203125, 3.13330078125, 3.4813232421875, 3.829345703125, 4.1773681640625, 4.525390625, 4.8734130859375, 5.221435546875, 5.5694580078125, 5.91748046875, 6.2655029296875, 6.613525390625, 6.9615478515625, 7.3095703125, 7.6575927734375, 8.005615234375, 8.3536376953125, 8.70166015625, 9.0496826171875, 9.397705078125, 9.7457275390625, 10.09375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 5.0, 6.0, 11.0, 11.0, 10.0, 19.0, 18.0, 19.0, 30.0, 24.0, 43.0, 44.0, 43.0, 44.0, 47.0, 69.0, 48.0, 69.0, 59.0, 66.0, 43.0, 37.0, 33.0, 35.0, 32.0, 26.0, 22.0, 21.0, 15.0, 17.0, 8.0, 7.0, 6.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00109100341796875, -0.0010508894920349121, -0.0010107755661010742, -0.0009706616401672363, -0.0009305477142333984, -0.0008904337882995605, -0.0008503198623657227, -0.0008102059364318848, -0.0007700920104980469, -0.000729978084564209, -0.0006898641586303711, -0.0006497502326965332, -0.0006096363067626953, -0.0005695223808288574, -0.0005294084548950195, -0.0004892945289611816, -0.00044918060302734375, -0.00040906667709350586, -0.00036895275115966797, -0.0003288388252258301, -0.0002887248992919922, -0.0002486109733581543, -0.0002084970474243164, -0.00016838312149047852, -0.00012826919555664062, -8.815526962280273e-05, -4.8041343688964844e-05, -7.927417755126953e-06, 3.218650817871094e-05, 7.230043411254883e-05, 0.00011241436004638672, 0.0001525282859802246, 0.0001926422119140625, 0.0002327561378479004, 0.0002728700637817383, 0.00031298398971557617, 0.00035309791564941406, 0.00039321184158325195, 0.00043332576751708984, 0.00047343969345092773, 0.0005135536193847656, 0.0005536675453186035, 0.0005937814712524414, 0.0006338953971862793, 0.0006740093231201172, 0.0007141232490539551, 0.000754237174987793, 0.0007943511009216309, 0.0008344650268554688, 0.0008745789527893066, 0.0009146928787231445, 0.0009548068046569824, 0.0009949207305908203, 0.0010350346565246582, 0.001075148582458496, 0.001115262508392334, 0.0011553764343261719, 0.0011954903602600098, 0.0012356042861938477, 0.0012757182121276855, 0.0013158321380615234, 0.0013559460639953613, 0.0013960599899291992, 0.0014361739158630371, 0.001476287841796875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 4.0, 4.0, 5.0, 18.0, 19.0, 37.0, 64.0, 97.0, 144.0, 214.0, 337.0, 542.0, 864.0, 1394.0, 2148.0, 3318.0, 5612.0, 8785.0, 14112.0, 21853.0, 33561.0, 49338.0, 69093.0, 91764.0, 110991.0, 121402.0, 120411.0, 107402.0, 87650.0, 66045.0, 46105.0, 31083.0, 20339.0, 12523.0, 7816.0, 5037.0, 3010.0, 1963.0, 1306.0, 788.0, 485.0, 325.0, 180.0, 118.0, 92.0, 67.0, 31.0, 20.0, 20.0, 9.0, 9.0, 3.0, 1.0, 2.0, 3.0, 1.0], "bins": [-11.265625, -10.933349609375, -10.60107421875, -10.268798828125, -9.9365234375, -9.604248046875, -9.27197265625, -8.939697265625, -8.607421875, -8.275146484375, -7.94287109375, -7.610595703125, -7.2783203125, -6.946044921875, -6.61376953125, -6.281494140625, -5.94921875, -5.616943359375, -5.28466796875, -4.952392578125, -4.6201171875, -4.287841796875, -3.95556640625, -3.623291015625, -3.291015625, -2.958740234375, -2.62646484375, -2.294189453125, -1.9619140625, -1.629638671875, -1.29736328125, -0.965087890625, -0.6328125, -0.300537109375, 0.03173828125, 0.364013671875, 0.6962890625, 1.028564453125, 1.36083984375, 1.693115234375, 2.025390625, 2.357666015625, 2.68994140625, 3.022216796875, 3.3544921875, 3.686767578125, 4.01904296875, 4.351318359375, 4.68359375, 5.015869140625, 5.34814453125, 5.680419921875, 6.0126953125, 6.344970703125, 6.67724609375, 7.009521484375, 7.341796875, 7.674072265625, 8.00634765625, 8.338623046875, 8.6708984375, 9.003173828125, 9.33544921875, 9.667724609375, 10.0]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 8.0, 4.0, 5.0, 14.0, 11.0, 19.0, 34.0, 29.0, 36.0, 45.0, 49.0, 43.0, 58.0, 76.0, 73.0, 63.0, 91.0, 56.0, 67.0, 46.0, 41.0, 29.0, 28.0, 24.0, 14.0, 6.0, 9.0, 6.0, 8.0, 5.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.9921875, -8.742919921875, -8.49365234375, -8.244384765625, -7.9951171875, -7.745849609375, -7.49658203125, -7.247314453125, -6.998046875, -6.748779296875, -6.49951171875, -6.250244140625, -6.0009765625, -5.751708984375, -5.50244140625, -5.253173828125, -5.00390625, -4.754638671875, -4.50537109375, -4.256103515625, -4.0068359375, -3.757568359375, -3.50830078125, -3.259033203125, -3.009765625, -2.760498046875, -2.51123046875, -2.261962890625, -2.0126953125, -1.763427734375, -1.51416015625, -1.264892578125, -1.015625, -0.766357421875, -0.51708984375, -0.267822265625, -0.0185546875, 0.230712890625, 0.47998046875, 0.729248046875, 0.978515625, 1.227783203125, 1.47705078125, 1.726318359375, 1.9755859375, 2.224853515625, 2.47412109375, 2.723388671875, 2.97265625, 3.221923828125, 3.47119140625, 3.720458984375, 3.9697265625, 4.218994140625, 4.46826171875, 4.717529296875, 4.966796875, 5.216064453125, 5.46533203125, 5.714599609375, 5.9638671875, 6.213134765625, 6.46240234375, 6.711669921875, 6.9609375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 7.0, 8.0, 5.0, 10.0, 13.0, 8.0, 9.0, 6.0, 23.0, 23.0, 22.0, 25.0, 36.0, 31.0, 41.0, 44.0, 44.0, 38.0, 49.0, 44.0, 40.0, 39.0, 44.0, 44.0, 27.0, 41.0, 30.0, 28.0, 29.0, 24.0, 28.0, 18.0, 15.0, 18.0, 15.0, 14.0, 13.0, 7.0, 10.0, 9.0, 5.0, 6.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-28.403156280517578, -27.485095977783203, -26.56703758239746, -25.648977279663086, -24.73091697692871, -23.81285858154297, -22.894798278808594, -21.97673797607422, -21.058677673339844, -20.14061737060547, -19.222558975219727, -18.30449867248535, -17.386438369750977, -16.468379974365234, -15.55031967163086, -14.632259368896484, -13.714200973510742, -12.796141624450684, -11.878081321716309, -10.96002197265625, -10.041961669921875, -9.123902320861816, -8.205842971801758, -7.287783145904541, -6.369723320007324, -5.451663494110107, -4.533603668212891, -3.615544319152832, -2.6974844932556152, -1.7794246673583984, -0.8613653182983398, 0.05669450759887695, 0.9747543334960938, 1.892814040184021, 2.8108737468719482, 3.728933334350586, 4.646993160247803, 5.5650529861450195, 6.483112335205078, 7.401172161102295, 8.319231986999512, 9.23729133605957, 10.155351638793945, 11.073410987854004, 11.991470336914062, 12.909530639648438, 13.827589988708496, 14.745649337768555, 15.66370964050293, 16.581769943237305, 17.499828338623047, 18.417888641357422, 19.335948944091797, 20.254009246826172, 21.172067642211914, 22.09012794494629, 23.00818634033203, 23.926246643066406, 24.84430503845215, 25.762365341186523, 26.6804256439209, 27.59848403930664, 28.516544342041016, 29.43460464477539, 30.352664947509766]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 11.0, 6.0, 7.0, 9.0, 9.0, 11.0, 17.0, 15.0, 20.0, 23.0, 27.0, 33.0, 37.0, 35.0, 40.0, 44.0, 55.0, 48.0, 34.0, 32.0, 46.0, 49.0, 50.0, 38.0, 44.0, 28.0, 40.0, 29.0, 29.0, 19.0, 25.0, 22.0, 13.0, 12.0, 8.0, 11.0, 9.0, 2.0, 4.0, 2.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-42.07172775268555, -40.781211853027344, -39.490692138671875, -38.20017623901367, -36.9096565246582, -35.619140625, -34.32862091064453, -33.03810501098633, -31.74758529663086, -30.457067489624023, -29.166549682617188, -27.87603187561035, -26.585514068603516, -25.29499626159668, -24.004478454589844, -22.71396255493164, -21.423444747924805, -20.13292694091797, -18.842409133911133, -17.551891326904297, -16.26137351989746, -14.970855712890625, -13.680338859558105, -12.38982105255127, -11.099303245544434, -9.808785438537598, -8.518267631530762, -7.227750301361084, -5.937232494354248, -4.646714687347412, -3.3561973571777344, -2.0656795501708984, -0.7751617431640625, 0.5153559446334839, 1.8058736324310303, 3.096391201019287, 4.386909008026123, 5.677426815032959, 6.967944145202637, 8.258461952209473, 9.548979759216309, 10.839497566223145, 12.13001537322998, 13.4205322265625, 14.711050033569336, 16.001567840576172, 17.292085647583008, 18.582603454589844, 19.87312126159668, 21.163639068603516, 22.45415687561035, 23.744674682617188, 25.035192489624023, 26.32571029663086, 27.616226196289062, 28.90674591064453, 30.197261810302734, 31.48777961730957, 32.778297424316406, 34.06881332397461, 35.35933303833008, 36.64984893798828, 37.94036865234375, 39.23088455200195, 40.52140426635742]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [3.0, 5.0, 9.0, 13.0, 13.0, 32.0, 50.0, 69.0, 133.0, 205.0, 292.0, 511.0, 839.0, 1286.0, 2013.0, 3226.0, 4913.0, 7773.0, 12079.0, 18168.0, 27549.0, 40901.0, 58639.0, 83686.0, 116639.0, 156798.0, 202917.0, 253096.0, 301598.0, 339240.0, 366454.0, 369805.0, 355875.0, 322935.0, 278637.0, 228143.0, 180990.0, 136861.0, 100285.0, 71694.0, 50035.0, 33865.0, 22780.0, 15298.0, 10012.0, 6429.0, 4264.0, 2592.0, 1714.0, 1078.0, 701.0, 434.0, 275.0, 173.0, 101.0, 79.0, 39.0, 26.0, 18.0, 6.0, 4.0, 2.0, 2.0, 3.0], "bins": [-19.0625, -18.452880859375, -17.84326171875, -17.233642578125, -16.6240234375, -16.014404296875, -15.40478515625, -14.795166015625, -14.185546875, -13.575927734375, -12.96630859375, -12.356689453125, -11.7470703125, -11.137451171875, -10.52783203125, -9.918212890625, -9.30859375, -8.698974609375, -8.08935546875, -7.479736328125, -6.8701171875, -6.260498046875, -5.65087890625, -5.041259765625, -4.431640625, -3.822021484375, -3.21240234375, -2.602783203125, -1.9931640625, -1.383544921875, -0.77392578125, -0.164306640625, 0.4453125, 1.054931640625, 1.66455078125, 2.274169921875, 2.8837890625, 3.493408203125, 4.10302734375, 4.712646484375, 5.322265625, 5.931884765625, 6.54150390625, 7.151123046875, 7.7607421875, 8.370361328125, 8.97998046875, 9.589599609375, 10.19921875, 10.808837890625, 11.41845703125, 12.028076171875, 12.6376953125, 13.247314453125, 13.85693359375, 14.466552734375, 15.076171875, 15.685791015625, 16.29541015625, 16.905029296875, 17.5146484375, 18.124267578125, 18.73388671875, 19.343505859375, 19.953125]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 9.0, 10.0, 3.0, 7.0, 11.0, 11.0, 15.0, 15.0, 14.0, 29.0, 25.0, 30.0, 33.0, 33.0, 39.0, 44.0, 45.0, 63.0, 33.0, 37.0, 40.0, 46.0, 48.0, 43.0, 47.0, 32.0, 34.0, 34.0, 32.0, 17.0, 26.0, 21.0, 14.0, 11.0, 14.0, 10.0, 9.0, 3.0, 5.0, 1.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-36.1875, -35.08203125, -33.9765625, -32.87109375, -31.765625, -30.66015625, -29.5546875, -28.44921875, -27.34375, -26.23828125, -25.1328125, -24.02734375, -22.921875, -21.81640625, -20.7109375, -19.60546875, -18.5, -17.39453125, -16.2890625, -15.18359375, -14.078125, -12.97265625, -11.8671875, -10.76171875, -9.65625, -8.55078125, -7.4453125, -6.33984375, -5.234375, -4.12890625, -3.0234375, -1.91796875, -0.8125, 0.29296875, 1.3984375, 2.50390625, 3.609375, 4.71484375, 5.8203125, 6.92578125, 8.03125, 9.13671875, 10.2421875, 11.34765625, 12.453125, 13.55859375, 14.6640625, 15.76953125, 16.875, 17.98046875, 19.0859375, 20.19140625, 21.296875, 22.40234375, 23.5078125, 24.61328125, 25.71875, 26.82421875, 27.9296875, 29.03515625, 30.140625, 31.24609375, 32.3515625, 33.45703125, 34.5625]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 12.0, 32.0, 52.0, 84.0, 160.0, 287.0, 402.0, 742.0, 1218.0, 1960.0, 3408.0, 5388.0, 8652.0, 13812.0, 21024.0, 31629.0, 46764.0, 66718.0, 92468.0, 126909.0, 165007.0, 207605.0, 251455.0, 292381.0, 325079.0, 343351.0, 347051.0, 336543.0, 309448.0, 273915.0, 230992.0, 186526.0, 145621.0, 109536.0, 80242.0, 56607.0, 38386.0, 26118.0, 17512.0, 11146.0, 7106.0, 4392.0, 2672.0, 1556.0, 982.0, 534.0, 352.0, 216.0, 95.0, 63.0, 35.0, 13.0, 11.0, 8.0, 0.0, 2.0], "bins": [-21.546875, -20.91796875, -20.2890625, -19.66015625, -19.03125, -18.40234375, -17.7734375, -17.14453125, -16.515625, -15.88671875, -15.2578125, -14.62890625, -14.0, -13.37109375, -12.7421875, -12.11328125, -11.484375, -10.85546875, -10.2265625, -9.59765625, -8.96875, -8.33984375, -7.7109375, -7.08203125, -6.453125, -5.82421875, -5.1953125, -4.56640625, -3.9375, -3.30859375, -2.6796875, -2.05078125, -1.421875, -0.79296875, -0.1640625, 0.46484375, 1.09375, 1.72265625, 2.3515625, 2.98046875, 3.609375, 4.23828125, 4.8671875, 5.49609375, 6.125, 6.75390625, 7.3828125, 8.01171875, 8.640625, 9.26953125, 9.8984375, 10.52734375, 11.15625, 11.78515625, 12.4140625, 13.04296875, 13.671875, 14.30078125, 14.9296875, 15.55859375, 16.1875, 16.81640625, 17.4453125, 18.07421875, 18.703125]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 4.0, 4.0, 4.0, 6.0, 16.0, 16.0, 27.0, 27.0, 32.0, 48.0, 54.0, 84.0, 103.0, 110.0, 137.0, 144.0, 153.0, 190.0, 162.0, 190.0, 188.0, 202.0, 203.0, 199.0, 196.0, 194.0, 194.0, 162.0, 171.0, 148.0, 114.0, 110.0, 104.0, 89.0, 70.0, 36.0, 36.0, 42.0, 31.0, 17.0, 19.0, 15.0, 9.0, 7.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.125, -15.6556396484375, -15.186279296875, -14.7169189453125, -14.24755859375, -13.7781982421875, -13.308837890625, -12.8394775390625, -12.3701171875, -11.9007568359375, -11.431396484375, -10.9620361328125, -10.49267578125, -10.0233154296875, -9.553955078125, -9.0845947265625, -8.615234375, -8.1458740234375, -7.676513671875, -7.2071533203125, -6.73779296875, -6.2684326171875, -5.799072265625, -5.3297119140625, -4.8603515625, -4.3909912109375, -3.921630859375, -3.4522705078125, -2.98291015625, -2.5135498046875, -2.044189453125, -1.5748291015625, -1.10546875, -0.6361083984375, -0.166748046875, 0.3026123046875, 0.77197265625, 1.2413330078125, 1.710693359375, 2.1800537109375, 2.6494140625, 3.1187744140625, 3.588134765625, 4.0574951171875, 4.52685546875, 4.9962158203125, 5.465576171875, 5.9349365234375, 6.404296875, 6.8736572265625, 7.343017578125, 7.8123779296875, 8.28173828125, 8.7510986328125, 9.220458984375, 9.6898193359375, 10.1591796875, 10.6285400390625, 11.097900390625, 11.5672607421875, 12.03662109375, 12.5059814453125, 12.975341796875, 13.4447021484375, 13.9140625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 3.0, 5.0, 3.0, 6.0, 11.0, 15.0, 14.0, 17.0, 23.0, 18.0, 26.0, 35.0, 30.0, 39.0, 39.0, 41.0, 50.0, 37.0, 53.0, 38.0, 46.0, 44.0, 46.0, 42.0, 41.0, 36.0, 32.0, 25.0, 33.0, 26.0, 24.0, 14.0, 27.0, 18.0, 10.0, 9.0, 4.0, 5.0, 9.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.505916595458984, -31.42090606689453, -30.335895538330078, -29.250885009765625, -28.165874481201172, -27.08086395263672, -25.995853424072266, -24.910842895507812, -23.82583236694336, -22.740821838378906, -21.655811309814453, -20.57080078125, -19.485790252685547, -18.400779724121094, -17.31576919555664, -16.230758666992188, -15.145748138427734, -14.060737609863281, -12.975727081298828, -11.890716552734375, -10.805706024169922, -9.720695495605469, -8.635684967041016, -7.5506744384765625, -6.465663909912109, -5.380653381347656, -4.295642852783203, -3.21063232421875, -2.125621795654297, -1.0406112670898438, 0.044399261474609375, 1.1294097900390625, 2.2144203186035156, 3.2994308471679688, 4.384441375732422, 5.469451904296875, 6.554462432861328, 7.639472961425781, 8.724483489990234, 9.809494018554688, 10.89450454711914, 11.979515075683594, 13.064525604248047, 14.1495361328125, 15.234546661376953, 16.319557189941406, 17.40456771850586, 18.489578247070312, 19.574588775634766, 20.65959930419922, 21.744609832763672, 22.829620361328125, 23.914630889892578, 24.99964141845703, 26.084651947021484, 27.169662475585938, 28.25467300415039, 29.339683532714844, 30.424694061279297, 31.50970458984375, 32.5947151184082, 33.679725646972656, 34.76473617553711, 35.84974670410156, 36.934757232666016]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 3.0, 3.0, 8.0, 6.0, 11.0, 7.0, 9.0, 18.0, 13.0, 21.0, 22.0, 30.0, 36.0, 42.0, 28.0, 35.0, 34.0, 44.0, 45.0, 53.0, 39.0, 40.0, 48.0, 45.0, 37.0, 39.0, 26.0, 35.0, 35.0, 26.0, 29.0, 21.0, 19.0, 14.0, 17.0, 16.0, 14.0, 9.0, 7.0, 4.0, 3.0, 4.0, 0.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.774681091308594, -34.55237579345703, -33.33007049560547, -32.10776138305664, -30.885456085205078, -29.663150787353516, -28.440845489501953, -27.21854019165039, -25.996232986450195, -24.773927688598633, -23.551620483398438, -22.329315185546875, -21.107009887695312, -19.884702682495117, -18.662397384643555, -17.44009017944336, -16.217784881591797, -14.995478630065918, -13.773172378540039, -12.550867080688477, -11.328560829162598, -10.106254577636719, -8.883949279785156, -7.661643028259277, -6.439336776733398, -5.2170305252075195, -3.994724750518799, -2.772418737411499, -1.5501127243041992, -0.3278064727783203, 0.8944993019104004, 2.116805076599121, 3.339111328125, 4.561417579650879, 5.7837233543396, 7.00602912902832, 8.2283353805542, 9.450641632080078, 10.67294692993164, 11.89525318145752, 13.117559432983398, 14.339865684509277, 15.562171936035156, 16.78447723388672, 18.00678253173828, 19.229089736938477, 20.45139503479004, 21.673702239990234, 22.896007537841797, 24.11831283569336, 25.340620040893555, 26.562925338745117, 27.785232543945312, 29.007537841796875, 30.229843139648438, 31.4521484375, 32.67445373535156, 33.896759033203125, 35.11906433105469, 36.341373443603516, 37.56367874145508, 38.78598403930664, 40.0082893371582, 41.230594635009766, 42.452903747558594]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 2.0, 10.0, 13.0, 13.0, 8.0, 13.0, 30.0, 33.0, 37.0, 61.0, 79.0, 133.0, 188.0, 283.0, 431.0, 676.0, 1040.0, 1711.0, 2672.0, 4333.0, 7597.0, 13029.0, 23644.0, 44662.0, 87832.0, 165323.0, 244312.0, 205304.0, 114685.0, 58790.0, 30922.0, 16558.0, 9418.0, 5579.0, 3400.0, 2066.0, 1239.0, 815.0, 506.0, 327.0, 239.0, 159.0, 111.0, 73.0, 53.0, 47.0, 29.0, 21.0, 15.0, 5.0, 15.0, 5.0, 5.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-7.66796875, -7.41827392578125, -7.1685791015625, -6.91888427734375, -6.669189453125, -6.41949462890625, -6.1697998046875, -5.92010498046875, -5.67041015625, -5.42071533203125, -5.1710205078125, -4.92132568359375, -4.671630859375, -4.42193603515625, -4.1722412109375, -3.92254638671875, -3.6728515625, -3.42315673828125, -3.1734619140625, -2.92376708984375, -2.674072265625, -2.42437744140625, -2.1746826171875, -1.92498779296875, -1.67529296875, -1.42559814453125, -1.1759033203125, -0.92620849609375, -0.676513671875, -0.42681884765625, -0.1771240234375, 0.07257080078125, 0.322265625, 0.57196044921875, 0.8216552734375, 1.07135009765625, 1.321044921875, 1.57073974609375, 1.8204345703125, 2.07012939453125, 2.31982421875, 2.56951904296875, 2.8192138671875, 3.06890869140625, 3.318603515625, 3.56829833984375, 3.8179931640625, 4.06768798828125, 4.3173828125, 4.56707763671875, 4.8167724609375, 5.06646728515625, 5.316162109375, 5.56585693359375, 5.8155517578125, 6.06524658203125, 6.31494140625, 6.56463623046875, 6.8143310546875, 7.06402587890625, 7.313720703125, 7.56341552734375, 7.8131103515625, 8.06280517578125, 8.3125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 3.0, 8.0, 6.0, 11.0, 7.0, 8.0, 19.0, 12.0, 23.0, 22.0, 29.0, 35.0, 41.0, 32.0, 33.0, 34.0, 43.0, 46.0, 53.0, 40.0, 39.0, 51.0, 44.0, 34.0, 38.0, 26.0, 37.0, 35.0, 27.0, 28.0, 21.0, 18.0, 14.0, 18.0, 15.0, 15.0, 9.0, 7.0, 4.0, 3.0, 3.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.375, -34.15380859375, -32.9326171875, -31.71142578125, -30.490234375, -29.26904296875, -28.0478515625, -26.82666015625, -25.60546875, -24.38427734375, -23.1630859375, -21.94189453125, -20.720703125, -19.49951171875, -18.2783203125, -17.05712890625, -15.8359375, -14.61474609375, -13.3935546875, -12.17236328125, -10.951171875, -9.72998046875, -8.5087890625, -7.28759765625, -6.06640625, -4.84521484375, -3.6240234375, -2.40283203125, -1.181640625, 0.03955078125, 1.2607421875, 2.48193359375, 3.703125, 4.92431640625, 6.1455078125, 7.36669921875, 8.587890625, 9.80908203125, 11.0302734375, 12.25146484375, 13.47265625, 14.69384765625, 15.9150390625, 17.13623046875, 18.357421875, 19.57861328125, 20.7998046875, 22.02099609375, 23.2421875, 24.46337890625, 25.6845703125, 26.90576171875, 28.126953125, 29.34814453125, 30.5693359375, 31.79052734375, 33.01171875, 34.23291015625, 35.4541015625, 36.67529296875, 37.896484375, 39.11767578125, 40.3388671875, 41.56005859375, 42.78125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 12.0, 9.0, 13.0, 17.0, 28.0, 37.0, 43.0, 44.0, 63.0, 96.0, 113.0, 191.0, 256.0, 371.0, 564.0, 866.0, 1319.0, 2125.0, 3665.0, 7087.0, 13411.0, 30087.0, 76375.0, 221729.0, 387583.0, 184646.0, 64363.0, 26092.0, 12067.0, 6179.0, 3396.0, 1957.0, 1252.0, 761.0, 500.0, 345.0, 228.0, 185.0, 124.0, 90.0, 69.0, 52.0, 40.0, 20.0, 24.0, 15.0, 12.0, 7.0, 12.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0], "bins": [-9.4140625, -9.13232421875, -8.8505859375, -8.56884765625, -8.287109375, -8.00537109375, -7.7236328125, -7.44189453125, -7.16015625, -6.87841796875, -6.5966796875, -6.31494140625, -6.033203125, -5.75146484375, -5.4697265625, -5.18798828125, -4.90625, -4.62451171875, -4.3427734375, -4.06103515625, -3.779296875, -3.49755859375, -3.2158203125, -2.93408203125, -2.65234375, -2.37060546875, -2.0888671875, -1.80712890625, -1.525390625, -1.24365234375, -0.9619140625, -0.68017578125, -0.3984375, -0.11669921875, 0.1650390625, 0.44677734375, 0.728515625, 1.01025390625, 1.2919921875, 1.57373046875, 1.85546875, 2.13720703125, 2.4189453125, 2.70068359375, 2.982421875, 3.26416015625, 3.5458984375, 3.82763671875, 4.109375, 4.39111328125, 4.6728515625, 4.95458984375, 5.236328125, 5.51806640625, 5.7998046875, 6.08154296875, 6.36328125, 6.64501953125, 6.9267578125, 7.20849609375, 7.490234375, 7.77197265625, 8.0537109375, 8.33544921875, 8.6171875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 6.0, 2.0, 8.0, 6.0, 8.0, 8.0, 8.0, 9.0, 3.0, 11.0, 15.0, 21.0, 13.0, 25.0, 32.0, 32.0, 28.0, 25.0, 42.0, 42.0, 38.0, 41.0, 27.0, 30.0, 40.0, 50.0, 36.0, 35.0, 34.0, 37.0, 33.0, 29.0, 25.0, 35.0, 34.0, 17.0, 10.0, 20.0, 14.0, 14.0, 10.0, 9.0, 9.0, 7.0, 4.0, 6.0, 2.0, 4.0, 1.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.890625, -24.103515625, -23.31640625, -22.529296875, -21.7421875, -20.955078125, -20.16796875, -19.380859375, -18.59375, -17.806640625, -17.01953125, -16.232421875, -15.4453125, -14.658203125, -13.87109375, -13.083984375, -12.296875, -11.509765625, -10.72265625, -9.935546875, -9.1484375, -8.361328125, -7.57421875, -6.787109375, -6.0, -5.212890625, -4.42578125, -3.638671875, -2.8515625, -2.064453125, -1.27734375, -0.490234375, 0.296875, 1.083984375, 1.87109375, 2.658203125, 3.4453125, 4.232421875, 5.01953125, 5.806640625, 6.59375, 7.380859375, 8.16796875, 8.955078125, 9.7421875, 10.529296875, 11.31640625, 12.103515625, 12.890625, 13.677734375, 14.46484375, 15.251953125, 16.0390625, 16.826171875, 17.61328125, 18.400390625, 19.1875, 19.974609375, 20.76171875, 21.548828125, 22.3359375, 23.123046875, 23.91015625, 24.697265625, 25.484375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 4.0, 2.0, 7.0, 4.0, 10.0, 13.0, 29.0, 30.0, 45.0, 58.0, 77.0, 133.0, 204.0, 317.0, 482.0, 879.0, 1342.0, 2316.0, 4201.0, 7676.0, 15686.0, 36758.0, 112861.0, 458673.0, 285796.0, 69220.0, 25972.0, 11670.0, 5937.0, 3276.0, 1856.0, 1088.0, 750.0, 392.0, 305.0, 177.0, 102.0, 64.0, 54.0, 29.0, 18.0, 18.0, 13.0, 6.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.47265625, -5.3154296875, -5.158203125, -5.0009765625, -4.84375, -4.6865234375, -4.529296875, -4.3720703125, -4.21484375, -4.0576171875, -3.900390625, -3.7431640625, -3.5859375, -3.4287109375, -3.271484375, -3.1142578125, -2.95703125, -2.7998046875, -2.642578125, -2.4853515625, -2.328125, -2.1708984375, -2.013671875, -1.8564453125, -1.69921875, -1.5419921875, -1.384765625, -1.2275390625, -1.0703125, -0.9130859375, -0.755859375, -0.5986328125, -0.44140625, -0.2841796875, -0.126953125, 0.0302734375, 0.1875, 0.3447265625, 0.501953125, 0.6591796875, 0.81640625, 0.9736328125, 1.130859375, 1.2880859375, 1.4453125, 1.6025390625, 1.759765625, 1.9169921875, 2.07421875, 2.2314453125, 2.388671875, 2.5458984375, 2.703125, 2.8603515625, 3.017578125, 3.1748046875, 3.33203125, 3.4892578125, 3.646484375, 3.8037109375, 3.9609375, 4.1181640625, 4.275390625, 4.4326171875, 4.58984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 4.0, 8.0, 9.0, 12.0, 16.0, 17.0, 25.0, 31.0, 46.0, 68.0, 78.0, 105.0, 109.0, 81.0, 89.0, 72.0, 55.0, 48.0, 44.0, 30.0, 20.0, 9.0, 8.0, 7.0, 0.0, 5.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003669261932373047, -0.0003542117774486542, -0.00034149736166000366, -0.00032878294587135315, -0.00031606853008270264, -0.0003033541142940521, -0.0002906396985054016, -0.0002779252827167511, -0.0002652108669281006, -0.0002524964511394501, -0.00023978203535079956, -0.00022706761956214905, -0.00021435320377349854, -0.00020163878798484802, -0.0001889243721961975, -0.000176209956407547, -0.00016349554061889648, -0.00015078112483024597, -0.00013806670904159546, -0.00012535229325294495, -0.00011263787746429443, -9.992346167564392e-05, -8.720904588699341e-05, -7.44946300983429e-05, -6.178021430969238e-05, -4.906579852104187e-05, -3.635138273239136e-05, -2.3636966943740845e-05, -1.0922551155090332e-05, 1.7918646335601807e-06, 1.4506280422210693e-05, 2.7220696210861206e-05, 3.993511199951172e-05, 5.264952778816223e-05, 6.536394357681274e-05, 7.807835936546326e-05, 9.079277515411377e-05, 0.00010350719094276428, 0.0001162216067314148, 0.0001289360225200653, 0.00014165043830871582, 0.00015436485409736633, 0.00016707926988601685, 0.00017979368567466736, 0.00019250810146331787, 0.00020522251725196838, 0.0002179369330406189, 0.0002306513488292694, 0.00024336576461791992, 0.00025608018040657043, 0.00026879459619522095, 0.00028150901198387146, 0.00029422342777252197, 0.0003069378435611725, 0.000319652259349823, 0.0003323666751384735, 0.000345081090927124, 0.00035779550671577454, 0.00037050992250442505, 0.00038322433829307556, 0.0003959387540817261, 0.0004086531698703766, 0.0004213675856590271, 0.0004340820014476776, 0.0004467964172363281]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 8.0, 16.0, 19.0, 33.0, 40.0, 57.0, 86.0, 117.0, 205.0, 279.0, 392.0, 627.0, 895.0, 1413.0, 2214.0, 3612.0, 5797.0, 9671.0, 17162.0, 30538.0, 57162.0, 106394.0, 186672.0, 236809.0, 173223.0, 96055.0, 51455.0, 28235.0, 15717.0, 9057.0, 5376.0, 3330.0, 1990.0, 1246.0, 861.0, 556.0, 388.0, 245.0, 185.0, 138.0, 78.0, 64.0, 47.0, 28.0, 18.0, 18.0, 7.0, 9.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.35546875, -4.21685791015625, -4.0782470703125, -3.93963623046875, -3.801025390625, -3.66241455078125, -3.5238037109375, -3.38519287109375, -3.24658203125, -3.10797119140625, -2.9693603515625, -2.83074951171875, -2.692138671875, -2.55352783203125, -2.4149169921875, -2.27630615234375, -2.1376953125, -1.99908447265625, -1.8604736328125, -1.72186279296875, -1.583251953125, -1.44464111328125, -1.3060302734375, -1.16741943359375, -1.02880859375, -0.89019775390625, -0.7515869140625, -0.61297607421875, -0.474365234375, -0.33575439453125, -0.1971435546875, -0.05853271484375, 0.080078125, 0.21868896484375, 0.3572998046875, 0.49591064453125, 0.634521484375, 0.77313232421875, 0.9117431640625, 1.05035400390625, 1.18896484375, 1.32757568359375, 1.4661865234375, 1.60479736328125, 1.743408203125, 1.88201904296875, 2.0206298828125, 2.15924072265625, 2.2978515625, 2.43646240234375, 2.5750732421875, 2.71368408203125, 2.852294921875, 2.99090576171875, 3.1295166015625, 3.26812744140625, 3.40673828125, 3.54534912109375, 3.6839599609375, 3.82257080078125, 3.961181640625, 4.09979248046875, 4.2384033203125, 4.37701416015625, 4.515625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 8.0, 4.0, 12.0, 6.0, 21.0, 32.0, 36.0, 67.0, 76.0, 104.0, 113.0, 111.0, 121.0, 83.0, 67.0, 40.0, 28.0, 14.0, 9.0, 9.0, 6.0, 4.0, 5.0, 5.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.46484375, -4.34332275390625, -4.2218017578125, -4.10028076171875, -3.978759765625, -3.85723876953125, -3.7357177734375, -3.61419677734375, -3.49267578125, -3.37115478515625, -3.2496337890625, -3.12811279296875, -3.006591796875, -2.88507080078125, -2.7635498046875, -2.64202880859375, -2.5205078125, -2.39898681640625, -2.2774658203125, -2.15594482421875, -2.034423828125, -1.91290283203125, -1.7913818359375, -1.66986083984375, -1.54833984375, -1.42681884765625, -1.3052978515625, -1.18377685546875, -1.062255859375, -0.94073486328125, -0.8192138671875, -0.69769287109375, -0.576171875, -0.45465087890625, -0.3331298828125, -0.21160888671875, -0.090087890625, 0.03143310546875, 0.1529541015625, 0.27447509765625, 0.39599609375, 0.51751708984375, 0.6390380859375, 0.76055908203125, 0.882080078125, 1.00360107421875, 1.1251220703125, 1.24664306640625, 1.3681640625, 1.48968505859375, 1.6112060546875, 1.73272705078125, 1.854248046875, 1.97576904296875, 2.0972900390625, 2.21881103515625, 2.34033203125, 2.46185302734375, 2.5833740234375, 2.70489501953125, 2.826416015625, 2.94793701171875, 3.0694580078125, 3.19097900390625, 3.3125]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 3.0, 8.0, 10.0, 17.0, 8.0, 17.0, 20.0, 22.0, 23.0, 33.0, 25.0, 43.0, 34.0, 39.0, 47.0, 45.0, 47.0, 44.0, 47.0, 42.0, 39.0, 50.0, 41.0, 42.0, 31.0, 27.0, 30.0, 30.0, 22.0, 16.0, 19.0, 19.0, 17.0, 9.0, 8.0, 6.0, 5.0, 3.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-32.85098648071289, -31.76666831970215, -30.682350158691406, -29.598033905029297, -28.513715744018555, -27.429397583007812, -26.345081329345703, -25.26076316833496, -24.17644500732422, -23.092126846313477, -22.007808685302734, -20.923492431640625, -19.839174270629883, -18.75485610961914, -17.67053985595703, -16.58622169494629, -15.501903533935547, -14.417585372924805, -13.333268165588379, -12.248950958251953, -11.164632797241211, -10.080314636230469, -8.995997428894043, -7.911679744720459, -6.827362060546875, -5.743044376373291, -4.658726692199707, -3.574409008026123, -2.490091323852539, -1.405773639678955, -0.3214559555053711, 0.7628617286682129, 1.8471832275390625, 2.9315009117126465, 4.0158185958862305, 5.1001362800598145, 6.184453964233398, 7.268771648406982, 8.353089332580566, 9.437406539916992, 10.521724700927734, 11.606042861938477, 12.690360069274902, 13.774677276611328, 14.85899543762207, 15.943313598632812, 17.027629852294922, 18.111948013305664, 19.196266174316406, 20.28058433532715, 21.36490249633789, 22.44921875, 23.533536911010742, 24.617855072021484, 25.702171325683594, 26.786489486694336, 27.870807647705078, 28.95512580871582, 30.039443969726562, 31.123760223388672, 32.20807647705078, 33.292396545410156, 34.376712799072266, 35.46103286743164, 36.54534912109375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 2.0, 6.0, 5.0, 9.0, 10.0, 9.0, 14.0, 7.0, 21.0, 21.0, 16.0, 37.0, 29.0, 38.0, 36.0, 36.0, 32.0, 40.0, 50.0, 45.0, 46.0, 46.0, 55.0, 38.0, 30.0, 36.0, 30.0, 40.0, 31.0, 24.0, 26.0, 25.0, 16.0, 17.0, 15.0, 19.0, 11.0, 8.0, 8.0, 5.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.312740325927734, -34.09036636352539, -32.86799240112305, -31.645618438720703, -30.42324447631836, -29.200870513916016, -27.97849464416504, -26.756120681762695, -25.53374671936035, -24.311372756958008, -23.088998794555664, -21.86662483215332, -20.644248962402344, -19.421875, -18.199501037597656, -16.977127075195312, -15.754753112792969, -14.532379150390625, -13.310005187988281, -12.087630271911621, -10.865256309509277, -9.642882347106934, -8.420507431030273, -7.19813346862793, -5.975759506225586, -4.753385543823242, -3.5310111045837402, -2.3086369037628174, -1.0862627029418945, 0.13611125946044922, 1.3584856986999512, 2.580860137939453, 3.8032379150390625, 5.025611877441406, 6.247986316680908, 7.47036075592041, 8.692734718322754, 9.915108680725098, 11.137483596801758, 12.359857559204102, 13.582231521606445, 14.804605484008789, 16.026979446411133, 17.249353408813477, 18.471729278564453, 19.694103240966797, 20.91647720336914, 22.138851165771484, 23.361225128173828, 24.583599090576172, 25.805973052978516, 27.02834701538086, 28.250720977783203, 29.473094940185547, 30.695470809936523, 31.917844772338867, 33.140220642089844, 34.36259460449219, 35.58496856689453, 36.807342529296875, 38.02971649169922, 39.25209045410156, 40.474464416503906, 41.69683837890625, 42.919212341308594]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 9.0, 16.0, 29.0, 58.0, 77.0, 130.0, 215.0, 395.0, 718.0, 1194.0, 1936.0, 3254.0, 5225.0, 8345.0, 12990.0, 19723.0, 29126.0, 41113.0, 55488.0, 71864.0, 87088.0, 98582.0, 105277.0, 103636.0, 95274.0, 81107.0, 66249.0, 50761.0, 36723.0, 25546.0, 16953.0, 11070.0, 7075.0, 4352.0, 2823.0, 1727.0, 1023.0, 550.0, 344.0, 205.0, 134.0, 59.0, 40.0, 27.0, 15.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.0, -19.37158203125, -18.7431640625, -18.11474609375, -17.486328125, -16.85791015625, -16.2294921875, -15.60107421875, -14.97265625, -14.34423828125, -13.7158203125, -13.08740234375, -12.458984375, -11.83056640625, -11.2021484375, -10.57373046875, -9.9453125, -9.31689453125, -8.6884765625, -8.06005859375, -7.431640625, -6.80322265625, -6.1748046875, -5.54638671875, -4.91796875, -4.28955078125, -3.6611328125, -3.03271484375, -2.404296875, -1.77587890625, -1.1474609375, -0.51904296875, 0.109375, 0.73779296875, 1.3662109375, 1.99462890625, 2.623046875, 3.25146484375, 3.8798828125, 4.50830078125, 5.13671875, 5.76513671875, 6.3935546875, 7.02197265625, 7.650390625, 8.27880859375, 8.9072265625, 9.53564453125, 10.1640625, 10.79248046875, 11.4208984375, 12.04931640625, 12.677734375, 13.30615234375, 13.9345703125, 14.56298828125, 15.19140625, 15.81982421875, 16.4482421875, 17.07666015625, 17.705078125, 18.33349609375, 18.9619140625, 19.59033203125, 20.21875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 5.0, 7.0, 8.0, 10.0, 8.0, 13.0, 9.0, 19.0, 20.0, 17.0, 37.0, 26.0, 42.0, 31.0, 37.0, 36.0, 38.0, 43.0, 49.0, 50.0, 39.0, 53.0, 47.0, 28.0, 33.0, 33.0, 40.0, 31.0, 27.0, 27.0, 24.0, 16.0, 17.0, 14.0, 18.0, 13.0, 9.0, 8.0, 4.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.6875, -33.49169921875, -32.2958984375, -31.10009765625, -29.904296875, -28.70849609375, -27.5126953125, -26.31689453125, -25.12109375, -23.92529296875, -22.7294921875, -21.53369140625, -20.337890625, -19.14208984375, -17.9462890625, -16.75048828125, -15.5546875, -14.35888671875, -13.1630859375, -11.96728515625, -10.771484375, -9.57568359375, -8.3798828125, -7.18408203125, -5.98828125, -4.79248046875, -3.5966796875, -2.40087890625, -1.205078125, -0.00927734375, 1.1865234375, 2.38232421875, 3.578125, 4.77392578125, 5.9697265625, 7.16552734375, 8.361328125, 9.55712890625, 10.7529296875, 11.94873046875, 13.14453125, 14.34033203125, 15.5361328125, 16.73193359375, 17.927734375, 19.12353515625, 20.3193359375, 21.51513671875, 22.7109375, 23.90673828125, 25.1025390625, 26.29833984375, 27.494140625, 28.68994140625, 29.8857421875, 31.08154296875, 32.27734375, 33.47314453125, 34.6689453125, 35.86474609375, 37.060546875, 38.25634765625, 39.4521484375, 40.64794921875, 41.84375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [5.0, 2.0, 2.0, 4.0, 8.0, 15.0, 11.0, 27.0, 38.0, 56.0, 101.0, 140.0, 225.0, 415.0, 605.0, 1029.0, 1623.0, 2488.0, 3845.0, 5853.0, 8942.0, 13063.0, 18855.0, 27033.0, 37216.0, 48593.0, 61975.0, 74414.0, 86059.0, 93178.0, 95561.0, 91898.0, 83861.0, 72438.0, 59426.0, 45933.0, 34901.0, 25354.0, 17469.0, 12196.0, 8347.0, 5481.0, 3677.0, 2299.0, 1439.0, 952.0, 540.0, 359.0, 238.0, 161.0, 81.0, 51.0, 31.0, 25.0, 12.0, 8.0, 5.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.015625, -17.423095703125, -16.83056640625, -16.238037109375, -15.6455078125, -15.052978515625, -14.46044921875, -13.867919921875, -13.275390625, -12.682861328125, -12.09033203125, -11.497802734375, -10.9052734375, -10.312744140625, -9.72021484375, -9.127685546875, -8.53515625, -7.942626953125, -7.35009765625, -6.757568359375, -6.1650390625, -5.572509765625, -4.97998046875, -4.387451171875, -3.794921875, -3.202392578125, -2.60986328125, -2.017333984375, -1.4248046875, -0.832275390625, -0.23974609375, 0.352783203125, 0.9453125, 1.537841796875, 2.13037109375, 2.722900390625, 3.3154296875, 3.907958984375, 4.50048828125, 5.093017578125, 5.685546875, 6.278076171875, 6.87060546875, 7.463134765625, 8.0556640625, 8.648193359375, 9.24072265625, 9.833251953125, 10.42578125, 11.018310546875, 11.61083984375, 12.203369140625, 12.7958984375, 13.388427734375, 13.98095703125, 14.573486328125, 15.166015625, 15.758544921875, 16.35107421875, 16.943603515625, 17.5361328125, 18.128662109375, 18.72119140625, 19.313720703125, 19.90625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 3.0, 4.0, 8.0, 6.0, 12.0, 11.0, 8.0, 17.0, 8.0, 21.0, 22.0, 18.0, 19.0, 33.0, 41.0, 40.0, 42.0, 36.0, 52.0, 38.0, 31.0, 29.0, 40.0, 45.0, 33.0, 34.0, 32.0, 32.0, 38.0, 35.0, 32.0, 32.0, 14.0, 16.0, 20.0, 13.0, 9.0, 9.0, 14.0, 7.0, 5.0, 5.0, 13.0, 4.0, 7.0, 6.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-23.34375, -22.607666015625, -21.87158203125, -21.135498046875, -20.3994140625, -19.663330078125, -18.92724609375, -18.191162109375, -17.455078125, -16.718994140625, -15.98291015625, -15.246826171875, -14.5107421875, -13.774658203125, -13.03857421875, -12.302490234375, -11.56640625, -10.830322265625, -10.09423828125, -9.358154296875, -8.6220703125, -7.885986328125, -7.14990234375, -6.413818359375, -5.677734375, -4.941650390625, -4.20556640625, -3.469482421875, -2.7333984375, -1.997314453125, -1.26123046875, -0.525146484375, 0.2109375, 0.947021484375, 1.68310546875, 2.419189453125, 3.1552734375, 3.891357421875, 4.62744140625, 5.363525390625, 6.099609375, 6.835693359375, 7.57177734375, 8.307861328125, 9.0439453125, 9.780029296875, 10.51611328125, 11.252197265625, 11.98828125, 12.724365234375, 13.46044921875, 14.196533203125, 14.9326171875, 15.668701171875, 16.40478515625, 17.140869140625, 17.876953125, 18.613037109375, 19.34912109375, 20.085205078125, 20.8212890625, 21.557373046875, 22.29345703125, 23.029541015625, 23.765625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 8.0, 17.0, 23.0, 26.0, 30.0, 48.0, 93.0, 145.0, 248.0, 416.0, 617.0, 997.0, 1752.0, 3072.0, 5255.0, 9261.0, 16449.0, 28090.0, 45833.0, 71199.0, 100095.0, 126463.0, 141678.0, 136715.0, 117626.0, 89198.0, 60648.0, 38358.0, 23120.0, 13199.0, 7612.0, 4275.0, 2374.0, 1404.0, 849.0, 515.0, 330.0, 191.0, 120.0, 71.0, 52.0, 37.0, 17.0, 11.0, 11.0, 6.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0078125, -10.6385498046875, -10.269287109375, -9.9000244140625, -9.53076171875, -9.1614990234375, -8.792236328125, -8.4229736328125, -8.0537109375, -7.6844482421875, -7.315185546875, -6.9459228515625, -6.57666015625, -6.2073974609375, -5.838134765625, -5.4688720703125, -5.099609375, -4.7303466796875, -4.361083984375, -3.9918212890625, -3.62255859375, -3.2532958984375, -2.884033203125, -2.5147705078125, -2.1455078125, -1.7762451171875, -1.406982421875, -1.0377197265625, -0.66845703125, -0.2991943359375, 0.070068359375, 0.4393310546875, 0.80859375, 1.1778564453125, 1.547119140625, 1.9163818359375, 2.28564453125, 2.6549072265625, 3.024169921875, 3.3934326171875, 3.7626953125, 4.1319580078125, 4.501220703125, 4.8704833984375, 5.23974609375, 5.6090087890625, 5.978271484375, 6.3475341796875, 6.716796875, 7.0860595703125, 7.455322265625, 7.8245849609375, 8.19384765625, 8.5631103515625, 8.932373046875, 9.3016357421875, 9.6708984375, 10.0401611328125, 10.409423828125, 10.7786865234375, 11.14794921875, 11.5172119140625, 11.886474609375, 12.2557373046875, 12.625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 6.0, 2.0, 6.0, 7.0, 10.0, 16.0, 14.0, 19.0, 24.0, 19.0, 34.0, 40.0, 39.0, 43.0, 45.0, 59.0, 44.0, 54.0, 60.0, 52.0, 42.0, 45.0, 39.0, 50.0, 33.0, 36.0, 28.0, 33.0, 14.0, 14.0, 22.0, 6.0, 15.0, 7.0, 8.0, 4.0, 7.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011301040649414062, -0.0010917186737060547, -0.0010533332824707031, -0.0010149478912353516, -0.0009765625, -0.0009381771087646484, -0.0008997917175292969, -0.0008614063262939453, -0.0008230209350585938, -0.0007846355438232422, -0.0007462501525878906, -0.0007078647613525391, -0.0006694793701171875, -0.0006310939788818359, -0.0005927085876464844, -0.0005543231964111328, -0.0005159378051757812, -0.0004775524139404297, -0.0004391670227050781, -0.00040078163146972656, -0.000362396240234375, -0.00032401084899902344, -0.0002856254577636719, -0.0002472400665283203, -0.00020885467529296875, -0.0001704692840576172, -0.00013208389282226562, -9.369850158691406e-05, -5.53131103515625e-05, -1.6927719116210938e-05, 2.1457672119140625e-05, 5.984306335449219e-05, 9.822845458984375e-05, 0.0001366138458251953, 0.00017499923706054688, 0.00021338462829589844, 0.00025177001953125, 0.00029015541076660156, 0.0003285408020019531, 0.0003669261932373047, 0.00040531158447265625, 0.0004436969757080078, 0.0004820823669433594, 0.0005204677581787109, 0.0005588531494140625, 0.0005972385406494141, 0.0006356239318847656, 0.0006740093231201172, 0.0007123947143554688, 0.0007507801055908203, 0.0007891654968261719, 0.0008275508880615234, 0.000865936279296875, 0.0009043216705322266, 0.0009427070617675781, 0.0009810924530029297, 0.0010194778442382812, 0.0010578632354736328, 0.0010962486267089844, 0.001134634017944336, 0.0011730194091796875, 0.001211404800415039, 0.0012497901916503906, 0.0012881755828857422, 0.0013265609741210938]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 15.0, 17.0, 33.0, 39.0, 76.0, 135.0, 241.0, 425.0, 750.0, 1237.0, 2035.0, 3837.0, 6648.0, 11768.0, 20382.0, 34062.0, 55290.0, 82551.0, 112912.0, 137015.0, 144715.0, 132141.0, 105487.0, 75643.0, 49764.0, 29803.0, 17692.0, 10210.0, 5909.0, 3252.0, 1889.0, 1058.0, 612.0, 351.0, 230.0, 119.0, 77.0, 53.0, 30.0, 21.0, 13.0, 8.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1171875, -11.690185546875, -11.26318359375, -10.836181640625, -10.4091796875, -9.982177734375, -9.55517578125, -9.128173828125, -8.701171875, -8.274169921875, -7.84716796875, -7.420166015625, -6.9931640625, -6.566162109375, -6.13916015625, -5.712158203125, -5.28515625, -4.858154296875, -4.43115234375, -4.004150390625, -3.5771484375, -3.150146484375, -2.72314453125, -2.296142578125, -1.869140625, -1.442138671875, -1.01513671875, -0.588134765625, -0.1611328125, 0.265869140625, 0.69287109375, 1.119873046875, 1.546875, 1.973876953125, 2.40087890625, 2.827880859375, 3.2548828125, 3.681884765625, 4.10888671875, 4.535888671875, 4.962890625, 5.389892578125, 5.81689453125, 6.243896484375, 6.6708984375, 7.097900390625, 7.52490234375, 7.951904296875, 8.37890625, 8.805908203125, 9.23291015625, 9.659912109375, 10.0869140625, 10.513916015625, 10.94091796875, 11.367919921875, 11.794921875, 12.221923828125, 12.64892578125, 13.075927734375, 13.5029296875, 13.929931640625, 14.35693359375, 14.783935546875, 15.2109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 2.0, 1.0, 2.0, 4.0, 8.0, 9.0, 10.0, 11.0, 12.0, 22.0, 26.0, 19.0, 36.0, 41.0, 39.0, 39.0, 46.0, 45.0, 49.0, 53.0, 44.0, 58.0, 46.0, 47.0, 40.0, 35.0, 34.0, 27.0, 31.0, 28.0, 20.0, 18.0, 22.0, 11.0, 16.0, 10.0, 10.0, 10.0, 7.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.83984375, -4.68084716796875, -4.5218505859375, -4.36285400390625, -4.203857421875, -4.04486083984375, -3.8858642578125, -3.72686767578125, -3.56787109375, -3.40887451171875, -3.2498779296875, -3.09088134765625, -2.931884765625, -2.77288818359375, -2.6138916015625, -2.45489501953125, -2.2958984375, -2.13690185546875, -1.9779052734375, -1.81890869140625, -1.659912109375, -1.50091552734375, -1.3419189453125, -1.18292236328125, -1.02392578125, -0.86492919921875, -0.7059326171875, -0.54693603515625, -0.387939453125, -0.22894287109375, -0.0699462890625, 0.08905029296875, 0.248046875, 0.40704345703125, 0.5660400390625, 0.72503662109375, 0.884033203125, 1.04302978515625, 1.2020263671875, 1.36102294921875, 1.52001953125, 1.67901611328125, 1.8380126953125, 1.99700927734375, 2.156005859375, 2.31500244140625, 2.4739990234375, 2.63299560546875, 2.7919921875, 2.95098876953125, 3.1099853515625, 3.26898193359375, 3.427978515625, 3.58697509765625, 3.7459716796875, 3.90496826171875, 4.06396484375, 4.22296142578125, 4.3819580078125, 4.54095458984375, 4.699951171875, 4.85894775390625, 5.0179443359375, 5.17694091796875, 5.3359375]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 11.0, 7.0, 7.0, 12.0, 16.0, 21.0, 27.0, 22.0, 26.0, 25.0, 34.0, 38.0, 29.0, 41.0, 48.0, 30.0, 41.0, 32.0, 44.0, 53.0, 36.0, 36.0, 49.0, 30.0, 35.0, 39.0, 37.0, 22.0, 20.0, 23.0, 18.0, 16.0, 17.0, 12.0, 10.0, 6.0, 14.0, 3.0, 2.0, 4.0, 1.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.44992446899414, -30.42497444152832, -29.4000244140625, -28.375076293945312, -27.350126266479492, -26.325176239013672, -25.300228118896484, -24.275278091430664, -23.250328063964844, -22.225378036499023, -21.200428009033203, -20.175479888916016, -19.150529861450195, -18.125579833984375, -17.100631713867188, -16.075681686401367, -15.050731658935547, -14.025781631469727, -13.000832557678223, -11.975883483886719, -10.950933456420898, -9.925983428955078, -8.901034355163574, -7.876084804534912, -6.85113525390625, -5.826185703277588, -4.801236152648926, -3.7762866020202637, -2.7513370513916016, -1.7263875007629395, -0.7014379501342773, 0.32351160049438477, 1.3484573364257812, 2.3734068870544434, 3.3983564376831055, 4.423305988311768, 5.44825553894043, 6.473205089569092, 7.498154640197754, 8.523103713989258, 9.548053741455078, 10.573003768920898, 11.597952842712402, 12.622901916503906, 13.647851943969727, 14.672801971435547, 15.69775104522705, 16.722700119018555, 17.747650146484375, 18.772600173950195, 19.797550201416016, 20.822498321533203, 21.847448348999023, 22.872398376464844, 23.89734649658203, 24.92229652404785, 25.947246551513672, 26.972196578979492, 27.997146606445312, 29.0220947265625, 30.04704475402832, 31.07199478149414, 32.09694290161133, 33.12189483642578, 34.14684295654297]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 6.0, 9.0, 3.0, 9.0, 7.0, 16.0, 11.0, 16.0, 23.0, 22.0, 18.0, 26.0, 37.0, 37.0, 31.0, 44.0, 36.0, 61.0, 46.0, 47.0, 38.0, 38.0, 58.0, 43.0, 39.0, 35.0, 25.0, 33.0, 20.0, 28.0, 27.0, 21.0, 12.0, 21.0, 10.0, 13.0, 11.0, 5.0, 7.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-41.10544204711914, -39.828407287597656, -38.55137252807617, -37.27433776855469, -35.99729919433594, -34.72026443481445, -33.44322967529297, -32.166194915771484, -30.88916015625, -29.612125396728516, -28.33509063720703, -27.058053970336914, -25.78101921081543, -24.503984451293945, -23.226947784423828, -21.949913024902344, -20.67287826538086, -19.395843505859375, -18.11880874633789, -16.841772079467773, -15.564737319946289, -14.287702560424805, -13.010666847229004, -11.733631134033203, -10.456596374511719, -9.179561614990234, -7.902525901794434, -6.625490665435791, -5.348455429077148, -4.071420192718506, -2.7943849563598633, -1.5173492431640625, -0.24031448364257812, 1.0367207527160645, 2.313755989074707, 3.5907912254333496, 4.867826461791992, 6.144861698150635, 7.421896934509277, 8.698932647705078, 9.975967407226562, 11.253002166748047, 12.530037879943848, 13.807073593139648, 15.084108352661133, 16.361143112182617, 17.638179779052734, 18.91521453857422, 20.192249298095703, 21.469284057617188, 22.746318817138672, 24.02335548400879, 25.300390243530273, 26.577425003051758, 27.854461669921875, 29.13149642944336, 30.408531188964844, 31.685565948486328, 32.96260070800781, 34.2396354675293, 35.51667022705078, 36.79370880126953, 38.070743560791016, 39.3477783203125, 40.624813079833984]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 2.0, 17.0, 12.0, 36.0, 69.0, 118.0, 166.0, 276.0, 442.0, 778.0, 1303.0, 2118.0, 3505.0, 5898.0, 9485.0, 15094.0, 24214.0, 37566.0, 57042.0, 84602.0, 121108.0, 167796.0, 222199.0, 281202.0, 336058.0, 377050.0, 400262.0, 395700.0, 369383.0, 322616.0, 265260.0, 207831.0, 154935.0, 111310.0, 76718.0, 51433.0, 33826.0, 21632.0, 13523.0, 8424.0, 5238.0, 3144.0, 1879.0, 1204.0, 699.0, 452.0, 255.0, 168.0, 97.0, 57.0, 43.0, 19.0, 12.0, 5.0, 7.0, 0.0, 0.0, 4.0], "bins": [-22.609375, -21.921630859375, -21.23388671875, -20.546142578125, -19.8583984375, -19.170654296875, -18.48291015625, -17.795166015625, -17.107421875, -16.419677734375, -15.73193359375, -15.044189453125, -14.3564453125, -13.668701171875, -12.98095703125, -12.293212890625, -11.60546875, -10.917724609375, -10.22998046875, -9.542236328125, -8.8544921875, -8.166748046875, -7.47900390625, -6.791259765625, -6.103515625, -5.415771484375, -4.72802734375, -4.040283203125, -3.3525390625, -2.664794921875, -1.97705078125, -1.289306640625, -0.6015625, 0.086181640625, 0.77392578125, 1.461669921875, 2.1494140625, 2.837158203125, 3.52490234375, 4.212646484375, 4.900390625, 5.588134765625, 6.27587890625, 6.963623046875, 7.6513671875, 8.339111328125, 9.02685546875, 9.714599609375, 10.40234375, 11.090087890625, 11.77783203125, 12.465576171875, 13.1533203125, 13.841064453125, 14.52880859375, 15.216552734375, 15.904296875, 16.592041015625, 17.27978515625, 17.967529296875, 18.6552734375, 19.343017578125, 20.03076171875, 20.718505859375, 21.40625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 9.0, 5.0, 9.0, 6.0, 10.0, 14.0, 13.0, 16.0, 27.0, 18.0, 18.0, 28.0, 41.0, 32.0, 35.0, 47.0, 36.0, 53.0, 48.0, 49.0, 39.0, 47.0, 46.0, 43.0, 40.0, 36.0, 28.0, 27.0, 21.0, 34.0, 25.0, 18.0, 10.0, 22.0, 10.0, 8.0, 10.0, 8.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-35.375, -34.265625, -33.15625, -32.046875, -30.9375, -29.828125, -28.71875, -27.609375, -26.5, -25.390625, -24.28125, -23.171875, -22.0625, -20.953125, -19.84375, -18.734375, -17.625, -16.515625, -15.40625, -14.296875, -13.1875, -12.078125, -10.96875, -9.859375, -8.75, -7.640625, -6.53125, -5.421875, -4.3125, -3.203125, -2.09375, -0.984375, 0.125, 1.234375, 2.34375, 3.453125, 4.5625, 5.671875, 6.78125, 7.890625, 9.0, 10.109375, 11.21875, 12.328125, 13.4375, 14.546875, 15.65625, 16.765625, 17.875, 18.984375, 20.09375, 21.203125, 22.3125, 23.421875, 24.53125, 25.640625, 26.75, 27.859375, 28.96875, 30.078125, 31.1875, 32.296875, 33.40625, 34.515625, 35.625]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 9.0, 11.0, 21.0, 34.0, 63.0, 135.0, 193.0, 415.0, 615.0, 1060.0, 1825.0, 3015.0, 4924.0, 7924.0, 12586.0, 19397.0, 29208.0, 43266.0, 62432.0, 86634.0, 118172.0, 154967.0, 195800.0, 236989.0, 278605.0, 310917.0, 334444.0, 341762.0, 336893.0, 316276.0, 283259.0, 242114.0, 201504.0, 159945.0, 122037.0, 90153.0, 65161.0, 45308.0, 30901.0, 20548.0, 13309.0, 8347.0, 5196.0, 3211.0, 1969.0, 1152.0, 682.0, 398.0, 239.0, 119.0, 56.0, 51.0, 21.0, 4.0, 11.0, 3.0, 4.0, 2.0, 0.0, 1.0], "bins": [-20.328125, -19.68408203125, -19.0400390625, -18.39599609375, -17.751953125, -17.10791015625, -16.4638671875, -15.81982421875, -15.17578125, -14.53173828125, -13.8876953125, -13.24365234375, -12.599609375, -11.95556640625, -11.3115234375, -10.66748046875, -10.0234375, -9.37939453125, -8.7353515625, -8.09130859375, -7.447265625, -6.80322265625, -6.1591796875, -5.51513671875, -4.87109375, -4.22705078125, -3.5830078125, -2.93896484375, -2.294921875, -1.65087890625, -1.0068359375, -0.36279296875, 0.28125, 0.92529296875, 1.5693359375, 2.21337890625, 2.857421875, 3.50146484375, 4.1455078125, 4.78955078125, 5.43359375, 6.07763671875, 6.7216796875, 7.36572265625, 8.009765625, 8.65380859375, 9.2978515625, 9.94189453125, 10.5859375, 11.22998046875, 11.8740234375, 12.51806640625, 13.162109375, 13.80615234375, 14.4501953125, 15.09423828125, 15.73828125, 16.38232421875, 17.0263671875, 17.67041015625, 18.314453125, 18.95849609375, 19.6025390625, 20.24658203125, 20.890625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 6.0, 12.0, 10.0, 19.0, 21.0, 15.0, 36.0, 28.0, 40.0, 35.0, 64.0, 76.0, 72.0, 86.0, 107.0, 109.0, 136.0, 129.0, 138.0, 138.0, 172.0, 171.0, 180.0, 157.0, 162.0, 187.0, 179.0, 175.0, 165.0, 153.0, 158.0, 133.0, 111.0, 99.0, 90.0, 71.0, 82.0, 56.0, 47.0, 51.0, 34.0, 46.0, 19.0, 25.0, 17.0, 12.0, 6.0, 10.0, 15.0, 6.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0], "bins": [-12.546875, -12.15478515625, -11.7626953125, -11.37060546875, -10.978515625, -10.58642578125, -10.1943359375, -9.80224609375, -9.41015625, -9.01806640625, -8.6259765625, -8.23388671875, -7.841796875, -7.44970703125, -7.0576171875, -6.66552734375, -6.2734375, -5.88134765625, -5.4892578125, -5.09716796875, -4.705078125, -4.31298828125, -3.9208984375, -3.52880859375, -3.13671875, -2.74462890625, -2.3525390625, -1.96044921875, -1.568359375, -1.17626953125, -0.7841796875, -0.39208984375, 0.0, 0.39208984375, 0.7841796875, 1.17626953125, 1.568359375, 1.96044921875, 2.3525390625, 2.74462890625, 3.13671875, 3.52880859375, 3.9208984375, 4.31298828125, 4.705078125, 5.09716796875, 5.4892578125, 5.88134765625, 6.2734375, 6.66552734375, 7.0576171875, 7.44970703125, 7.841796875, 8.23388671875, 8.6259765625, 9.01806640625, 9.41015625, 9.80224609375, 10.1943359375, 10.58642578125, 10.978515625, 11.37060546875, 11.7626953125, 12.15478515625, 12.546875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 7.0, 8.0, 8.0, 14.0, 12.0, 19.0, 20.0, 16.0, 26.0, 21.0, 25.0, 38.0, 34.0, 29.0, 39.0, 42.0, 49.0, 42.0, 41.0, 43.0, 43.0, 53.0, 35.0, 45.0, 30.0, 32.0, 26.0, 22.0, 25.0, 33.0, 22.0, 17.0, 14.0, 11.0, 16.0, 11.0, 3.0, 12.0, 4.0, 1.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.25745391845703, -29.222204208374023, -28.186954498291016, -27.15170669555664, -26.116456985473633, -25.081207275390625, -24.045957565307617, -23.01070785522461, -21.975460052490234, -20.940210342407227, -19.90496063232422, -18.869712829589844, -17.834463119506836, -16.799213409423828, -15.76396369934082, -14.728713989257812, -13.693464279174805, -12.658214569091797, -11.622965812683105, -10.587716102600098, -9.552467346191406, -8.517217636108398, -7.481967926025391, -6.446718692779541, -5.411469459533691, -4.376220226287842, -3.340970754623413, -2.3057212829589844, -1.2704720497131348, -0.23522281646728516, 0.8000268936157227, 1.8352761268615723, 2.870525360107422, 3.9057745933532715, 4.941023826599121, 5.976273536682129, 7.0115227699279785, 8.046772003173828, 9.082021713256836, 10.117271423339844, 11.152520179748535, 12.187769889831543, 13.223018646240234, 14.258268356323242, 15.29351806640625, 16.328765869140625, 17.364017486572266, 18.39926528930664, 19.43451499938965, 20.469764709472656, 21.505014419555664, 22.540264129638672, 23.575511932373047, 24.610761642456055, 25.646011352539062, 26.68126106262207, 27.716510772705078, 28.751760482788086, 29.787010192871094, 30.82225799560547, 31.857507705688477, 32.892757415771484, 33.928009033203125, 34.9632568359375, 35.998504638671875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 13.0, 7.0, 5.0, 6.0, 11.0, 13.0, 16.0, 17.0, 20.0, 35.0, 27.0, 31.0, 24.0, 34.0, 32.0, 38.0, 40.0, 57.0, 42.0, 36.0, 47.0, 44.0, 44.0, 50.0, 40.0, 33.0, 31.0, 26.0, 29.0, 17.0, 31.0, 22.0, 18.0, 14.0, 10.0, 10.0, 8.0, 1.0, 5.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.57291030883789, -38.352291107177734, -37.13167190551758, -35.91105270385742, -34.690433502197266, -33.469810485839844, -32.24919128417969, -31.02857208251953, -29.807952880859375, -28.58733367919922, -27.366714477539062, -26.146095275878906, -24.925474166870117, -23.70485496520996, -22.484235763549805, -21.263614654541016, -20.042997360229492, -18.822378158569336, -17.60175895690918, -16.38113784790039, -15.160518646240234, -13.939899444580078, -12.719280242919922, -11.49866008758545, -10.278040885925293, -9.057421684265137, -7.836801528930664, -6.616182327270508, -5.395562648773193, -4.174942970275879, -2.9543237686157227, -1.73370361328125, -0.5130844116210938, 0.7075351476669312, 1.928154706954956, 3.1487741470336914, 4.369393825531006, 5.59001350402832, 6.810632705688477, 8.03125286102295, 9.251872062683105, 10.472491264343262, 11.693111419677734, 12.91373062133789, 14.134349822998047, 15.35496997833252, 16.57558822631836, 17.79620933532715, 19.016828536987305, 20.23744773864746, 21.458066940307617, 22.678688049316406, 23.899307250976562, 25.11992645263672, 26.340545654296875, 27.56116485595703, 28.781784057617188, 30.002403259277344, 31.2230224609375, 32.443641662597656, 33.66426086425781, 34.88488006591797, 36.105499267578125, 37.32612228393555, 38.5467414855957]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 9.0, 13.0, 21.0, 26.0, 53.0, 72.0, 102.0, 137.0, 233.0, 327.0, 524.0, 792.0, 1161.0, 1765.0, 2832.0, 4303.0, 6671.0, 10496.0, 16467.0, 26794.0, 42150.0, 67276.0, 103924.0, 145338.0, 168493.0, 149633.0, 107922.0, 70503.0, 44285.0, 27893.0, 17476.0, 10886.0, 6995.0, 4529.0, 2897.0, 1921.0, 1190.0, 831.0, 562.0, 362.0, 258.0, 147.0, 104.0, 72.0, 48.0, 32.0, 18.0, 10.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0], "bins": [-5.421875, -5.26495361328125, -5.1080322265625, -4.95111083984375, -4.794189453125, -4.63726806640625, -4.4803466796875, -4.32342529296875, -4.16650390625, -4.00958251953125, -3.8526611328125, -3.69573974609375, -3.538818359375, -3.38189697265625, -3.2249755859375, -3.06805419921875, -2.9111328125, -2.75421142578125, -2.5972900390625, -2.44036865234375, -2.283447265625, -2.12652587890625, -1.9696044921875, -1.81268310546875, -1.65576171875, -1.49884033203125, -1.3419189453125, -1.18499755859375, -1.028076171875, -0.87115478515625, -0.7142333984375, -0.55731201171875, -0.400390625, -0.24346923828125, -0.0865478515625, 0.07037353515625, 0.227294921875, 0.38421630859375, 0.5411376953125, 0.69805908203125, 0.85498046875, 1.01190185546875, 1.1688232421875, 1.32574462890625, 1.482666015625, 1.63958740234375, 1.7965087890625, 1.95343017578125, 2.1103515625, 2.26727294921875, 2.4241943359375, 2.58111572265625, 2.738037109375, 2.89495849609375, 3.0518798828125, 3.20880126953125, 3.36572265625, 3.52264404296875, 3.6795654296875, 3.83648681640625, 3.993408203125, 4.15032958984375, 4.3072509765625, 4.46417236328125, 4.62109375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 13.0, 9.0, 3.0, 7.0, 10.0, 13.0, 17.0, 16.0, 20.0, 36.0, 26.0, 30.0, 25.0, 36.0, 30.0, 38.0, 41.0, 53.0, 44.0, 37.0, 47.0, 43.0, 42.0, 52.0, 39.0, 35.0, 28.0, 28.0, 29.0, 17.0, 30.0, 23.0, 18.0, 15.0, 10.0, 10.0, 8.0, 1.0, 5.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.59375, -38.37548828125, -37.1572265625, -35.93896484375, -34.720703125, -33.50244140625, -32.2841796875, -31.06591796875, -29.84765625, -28.62939453125, -27.4111328125, -26.19287109375, -24.974609375, -23.75634765625, -22.5380859375, -21.31982421875, -20.1015625, -18.88330078125, -17.6650390625, -16.44677734375, -15.228515625, -14.01025390625, -12.7919921875, -11.57373046875, -10.35546875, -9.13720703125, -7.9189453125, -6.70068359375, -5.482421875, -4.26416015625, -3.0458984375, -1.82763671875, -0.609375, 0.60888671875, 1.8271484375, 3.04541015625, 4.263671875, 5.48193359375, 6.7001953125, 7.91845703125, 9.13671875, 10.35498046875, 11.5732421875, 12.79150390625, 14.009765625, 15.22802734375, 16.4462890625, 17.66455078125, 18.8828125, 20.10107421875, 21.3193359375, 22.53759765625, 23.755859375, 24.97412109375, 26.1923828125, 27.41064453125, 28.62890625, 29.84716796875, 31.0654296875, 32.28369140625, 33.501953125, 34.72021484375, 35.9384765625, 37.15673828125, 38.375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 5.0, 12.0, 12.0, 26.0, 34.0, 46.0, 67.0, 82.0, 125.0, 185.0, 279.0, 420.0, 618.0, 869.0, 1353.0, 2065.0, 3389.0, 5630.0, 10170.0, 19154.0, 39443.0, 89468.0, 206194.0, 310075.0, 194007.0, 84118.0, 37551.0, 18335.0, 9831.0, 5546.0, 3331.0, 2046.0, 1302.0, 900.0, 576.0, 389.0, 270.0, 183.0, 130.0, 95.0, 63.0, 46.0, 46.0, 12.0, 20.0, 6.0, 13.0, 5.0, 6.0, 5.0, 2.0, 0.0, 1.0, 2.0, 3.0], "bins": [-6.83984375, -6.629150390625, -6.41845703125, -6.207763671875, -5.9970703125, -5.786376953125, -5.57568359375, -5.364990234375, -5.154296875, -4.943603515625, -4.73291015625, -4.522216796875, -4.3115234375, -4.100830078125, -3.89013671875, -3.679443359375, -3.46875, -3.258056640625, -3.04736328125, -2.836669921875, -2.6259765625, -2.415283203125, -2.20458984375, -1.993896484375, -1.783203125, -1.572509765625, -1.36181640625, -1.151123046875, -0.9404296875, -0.729736328125, -0.51904296875, -0.308349609375, -0.09765625, 0.113037109375, 0.32373046875, 0.534423828125, 0.7451171875, 0.955810546875, 1.16650390625, 1.377197265625, 1.587890625, 1.798583984375, 2.00927734375, 2.219970703125, 2.4306640625, 2.641357421875, 2.85205078125, 3.062744140625, 3.2734375, 3.484130859375, 3.69482421875, 3.905517578125, 4.1162109375, 4.326904296875, 4.53759765625, 4.748291015625, 4.958984375, 5.169677734375, 5.38037109375, 5.591064453125, 5.8017578125, 6.012451171875, 6.22314453125, 6.433837890625, 6.64453125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 3.0, 9.0, 11.0, 8.0, 12.0, 13.0, 13.0, 20.0, 35.0, 21.0, 23.0, 36.0, 29.0, 43.0, 39.0, 46.0, 43.0, 40.0, 47.0, 43.0, 42.0, 42.0, 43.0, 28.0, 32.0, 27.0, 38.0, 25.0, 39.0, 24.0, 24.0, 21.0, 16.0, 17.0, 8.0, 10.0, 10.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.328125, -22.47314453125, -21.6181640625, -20.76318359375, -19.908203125, -19.05322265625, -18.1982421875, -17.34326171875, -16.48828125, -15.63330078125, -14.7783203125, -13.92333984375, -13.068359375, -12.21337890625, -11.3583984375, -10.50341796875, -9.6484375, -8.79345703125, -7.9384765625, -7.08349609375, -6.228515625, -5.37353515625, -4.5185546875, -3.66357421875, -2.80859375, -1.95361328125, -1.0986328125, -0.24365234375, 0.611328125, 1.46630859375, 2.3212890625, 3.17626953125, 4.03125, 4.88623046875, 5.7412109375, 6.59619140625, 7.451171875, 8.30615234375, 9.1611328125, 10.01611328125, 10.87109375, 11.72607421875, 12.5810546875, 13.43603515625, 14.291015625, 15.14599609375, 16.0009765625, 16.85595703125, 17.7109375, 18.56591796875, 19.4208984375, 20.27587890625, 21.130859375, 21.98583984375, 22.8408203125, 23.69580078125, 24.55078125, 25.40576171875, 26.2607421875, 27.11572265625, 27.970703125, 28.82568359375, 29.6806640625, 30.53564453125, 31.390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 6.0, 12.0, 10.0, 18.0, 20.0, 35.0, 44.0, 53.0, 96.0, 127.0, 200.0, 306.0, 494.0, 875.0, 1531.0, 3016.0, 5983.0, 13776.0, 39264.0, 166379.0, 605795.0, 149510.0, 36182.0, 12921.0, 5577.0, 2732.0, 1419.0, 803.0, 456.0, 306.0, 186.0, 138.0, 62.0, 69.0, 40.0, 28.0, 20.0, 20.0, 14.0, 13.0, 6.0, 3.0, 4.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.52734375, -6.34332275390625, -6.1593017578125, -5.97528076171875, -5.791259765625, -5.60723876953125, -5.4232177734375, -5.23919677734375, -5.05517578125, -4.87115478515625, -4.6871337890625, -4.50311279296875, -4.319091796875, -4.13507080078125, -3.9510498046875, -3.76702880859375, -3.5830078125, -3.39898681640625, -3.2149658203125, -3.03094482421875, -2.846923828125, -2.66290283203125, -2.4788818359375, -2.29486083984375, -2.11083984375, -1.92681884765625, -1.7427978515625, -1.55877685546875, -1.374755859375, -1.19073486328125, -1.0067138671875, -0.82269287109375, -0.638671875, -0.45465087890625, -0.2706298828125, -0.08660888671875, 0.097412109375, 0.28143310546875, 0.4654541015625, 0.64947509765625, 0.83349609375, 1.01751708984375, 1.2015380859375, 1.38555908203125, 1.569580078125, 1.75360107421875, 1.9376220703125, 2.12164306640625, 2.3056640625, 2.48968505859375, 2.6737060546875, 2.85772705078125, 3.041748046875, 3.22576904296875, 3.4097900390625, 3.59381103515625, 3.77783203125, 3.96185302734375, 4.1458740234375, 4.32989501953125, 4.513916015625, 4.69793701171875, 4.8819580078125, 5.06597900390625, 5.25]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 10.0, 12.0, 6.0, 15.0, 21.0, 18.0, 37.0, 32.0, 43.0, 48.0, 56.0, 62.0, 54.0, 71.0, 68.0, 77.0, 59.0, 50.0, 55.0, 39.0, 29.0, 32.0, 29.0, 11.0, 16.0, 15.0, 8.0, 9.0, 8.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0003352165222167969, -0.0003263428807258606, -0.0003174692392349243, -0.00030859559774398804, -0.00029972195625305176, -0.0002908483147621155, -0.0002819746732711792, -0.0002731010317802429, -0.00026422739028930664, -0.00025535374879837036, -0.0002464801073074341, -0.0002376064658164978, -0.00022873282432556152, -0.00021985918283462524, -0.00021098554134368896, -0.00020211189985275269, -0.0001932382583618164, -0.00018436461687088013, -0.00017549097537994385, -0.00016661733388900757, -0.0001577436923980713, -0.000148870050907135, -0.00013999640941619873, -0.00013112276792526245, -0.00012224912643432617, -0.00011337548494338989, -0.00010450184345245361, -9.562820196151733e-05, -8.675456047058105e-05, -7.788091897964478e-05, -6.90072774887085e-05, -6.013363599777222e-05, -5.125999450683594e-05, -4.238635301589966e-05, -3.351271152496338e-05, -2.46390700340271e-05, -1.576542854309082e-05, -6.891787052154541e-06, 1.9818544387817383e-06, 1.0855495929718018e-05, 1.9729137420654297e-05, 2.8602778911590576e-05, 3.7476420402526855e-05, 4.6350061893463135e-05, 5.5223703384399414e-05, 6.40973448753357e-05, 7.297098636627197e-05, 8.184462785720825e-05, 9.071826934814453e-05, 9.959191083908081e-05, 0.00010846555233001709, 0.00011733919382095337, 0.00012621283531188965, 0.00013508647680282593, 0.0001439601182937622, 0.00015283375978469849, 0.00016170740127563477, 0.00017058104276657104, 0.00017945468425750732, 0.0001883283257484436, 0.00019720196723937988, 0.00020607560873031616, 0.00021494925022125244, 0.00022382289171218872, 0.000232696533203125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 5.0, 10.0, 12.0, 16.0, 31.0, 43.0, 71.0, 103.0, 135.0, 219.0, 275.0, 434.0, 617.0, 931.0, 1449.0, 2111.0, 3176.0, 4973.0, 7540.0, 11719.0, 18724.0, 29830.0, 49912.0, 83122.0, 134215.0, 188560.0, 183075.0, 126139.0, 76817.0, 46474.0, 28477.0, 17639.0, 10824.0, 7119.0, 4644.0, 3067.0, 1985.0, 1298.0, 918.0, 582.0, 412.0, 266.0, 184.0, 130.0, 97.0, 60.0, 33.0, 27.0, 27.0, 16.0, 4.0, 9.0, 4.0, 2.0, 3.0, 1.0], "bins": [-3.896484375, -3.781646728515625, -3.66680908203125, -3.551971435546875, -3.4371337890625, -3.322296142578125, -3.20745849609375, -3.092620849609375, -2.977783203125, -2.862945556640625, -2.74810791015625, -2.633270263671875, -2.5184326171875, -2.403594970703125, -2.28875732421875, -2.173919677734375, -2.05908203125, -1.944244384765625, -1.82940673828125, -1.714569091796875, -1.5997314453125, -1.484893798828125, -1.37005615234375, -1.255218505859375, -1.140380859375, -1.025543212890625, -0.91070556640625, -0.795867919921875, -0.6810302734375, -0.566192626953125, -0.45135498046875, -0.336517333984375, -0.2216796875, -0.106842041015625, 0.00799560546875, 0.122833251953125, 0.2376708984375, 0.352508544921875, 0.46734619140625, 0.582183837890625, 0.697021484375, 0.811859130859375, 0.92669677734375, 1.041534423828125, 1.1563720703125, 1.271209716796875, 1.38604736328125, 1.500885009765625, 1.61572265625, 1.730560302734375, 1.84539794921875, 1.960235595703125, 2.0750732421875, 2.189910888671875, 2.30474853515625, 2.419586181640625, 2.534423828125, 2.649261474609375, 2.76409912109375, 2.878936767578125, 2.9937744140625, 3.108612060546875, 3.22344970703125, 3.338287353515625, 3.453125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 10.0, 7.0, 12.0, 11.0, 19.0, 19.0, 23.0, 33.0, 36.0, 35.0, 51.0, 45.0, 61.0, 72.0, 68.0, 73.0, 64.0, 57.0, 51.0, 38.0, 42.0, 35.0, 15.0, 21.0, 13.0, 16.0, 13.0, 8.0, 6.0, 6.0, 7.0, 5.0, 2.0, 3.0, 0.0, 7.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.287109375, -2.217559814453125, -2.14801025390625, -2.078460693359375, -2.0089111328125, -1.939361572265625, -1.86981201171875, -1.800262451171875, -1.730712890625, -1.661163330078125, -1.59161376953125, -1.522064208984375, -1.4525146484375, -1.382965087890625, -1.31341552734375, -1.243865966796875, -1.17431640625, -1.104766845703125, -1.03521728515625, -0.965667724609375, -0.8961181640625, -0.826568603515625, -0.75701904296875, -0.687469482421875, -0.617919921875, -0.548370361328125, -0.47882080078125, -0.409271240234375, -0.3397216796875, -0.270172119140625, -0.20062255859375, -0.131072998046875, -0.0615234375, 0.008026123046875, 0.07757568359375, 0.147125244140625, 0.2166748046875, 0.286224365234375, 0.35577392578125, 0.425323486328125, 0.494873046875, 0.564422607421875, 0.63397216796875, 0.703521728515625, 0.7730712890625, 0.842620849609375, 0.91217041015625, 0.981719970703125, 1.05126953125, 1.120819091796875, 1.19036865234375, 1.259918212890625, 1.3294677734375, 1.399017333984375, 1.46856689453125, 1.538116455078125, 1.607666015625, 1.677215576171875, 1.74676513671875, 1.816314697265625, 1.8858642578125, 1.955413818359375, 2.02496337890625, 2.094512939453125, 2.1640625]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 7.0, 3.0, 10.0, 16.0, 11.0, 22.0, 15.0, 20.0, 23.0, 19.0, 30.0, 34.0, 28.0, 32.0, 44.0, 39.0, 48.0, 40.0, 50.0, 41.0, 47.0, 36.0, 39.0, 48.0, 34.0, 25.0, 32.0, 16.0, 30.0, 31.0, 26.0, 17.0, 13.0, 14.0, 11.0, 14.0, 7.0, 5.0, 7.0, 5.0, 1.0, 6.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.098224639892578, -29.06899642944336, -28.039766311645508, -27.01053810119629, -25.981307983398438, -24.95207977294922, -23.9228515625, -22.89362335205078, -21.86439323425293, -20.83516502380371, -19.80593490600586, -18.77670669555664, -17.747478485107422, -16.71824836730957, -15.689020156860352, -14.659790992736816, -13.630561828613281, -12.601332664489746, -11.572103500366211, -10.542875289916992, -9.513646125793457, -8.484416961669922, -7.455188274383545, -6.425959587097168, -5.396730422973633, -4.367501258850098, -3.3382725715637207, -2.3090436458587646, -1.2798147201538086, -0.25058555603027344, 0.7786431312561035, 1.8078718185424805, 2.8371009826660156, 3.8663299083709717, 4.895558834075928, 5.924787521362305, 6.95401668548584, 7.983245849609375, 9.012474060058594, 10.041703224182129, 11.070932388305664, 12.1001615524292, 13.129390716552734, 14.158618927001953, 15.187848091125488, 16.217077255249023, 17.246305465698242, 18.275535583496094, 19.304763793945312, 20.33399200439453, 21.363222122192383, 22.3924503326416, 23.421680450439453, 24.450908660888672, 25.48013687133789, 26.50936508178711, 27.53859519958496, 28.56782341003418, 29.59705352783203, 30.62628173828125, 31.65550994873047, 32.68473815917969, 33.71397018432617, 34.74319839477539, 35.77242660522461]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 10.0, 8.0, 7.0, 6.0, 11.0, 15.0, 14.0, 13.0, 25.0, 33.0, 25.0, 30.0, 27.0, 34.0, 39.0, 30.0, 46.0, 42.0, 49.0, 39.0, 43.0, 50.0, 42.0, 57.0, 32.0, 35.0, 32.0, 22.0, 27.0, 23.0, 28.0, 26.0, 14.0, 15.0, 13.0, 5.0, 10.0, 3.0, 1.0, 6.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.76948928833008, -38.54486846923828, -37.32024383544922, -36.09562301635742, -34.87099838256836, -33.64637756347656, -32.4217529296875, -31.197132110595703, -29.97250747680664, -28.74788475036621, -27.52326202392578, -26.29863929748535, -25.074016571044922, -23.849393844604492, -22.624771118164062, -21.400150299072266, -20.175527572631836, -18.950904846191406, -17.726282119750977, -16.501659393310547, -15.277036666870117, -14.052413940429688, -12.827792167663574, -11.603169441223145, -10.378546714782715, -9.153923988342285, -7.9293012619018555, -6.704679012298584, -5.480056285858154, -4.255433559417725, -3.030811309814453, -1.8061885833740234, -0.5815658569335938, 0.6430567502975464, 1.8676793575286865, 3.092301845550537, 4.316924571990967, 5.5415472984313965, 6.766169548034668, 7.990792274475098, 9.215415000915527, 10.440037727355957, 11.664660453796387, 12.8892822265625, 14.11390495300293, 15.33852767944336, 16.56315040588379, 17.78777313232422, 19.01239585876465, 20.237018585205078, 21.461641311645508, 22.686264038085938, 23.910886764526367, 25.135509490966797, 26.360130310058594, 27.584754943847656, 28.809375762939453, 30.033998489379883, 31.258621215820312, 32.48324203491211, 33.70786666870117, 34.93248748779297, 36.15711212158203, 37.38173294067383, 38.60635757446289]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 4.0, 9.0, 10.0, 31.0, 33.0, 44.0, 87.0, 130.0, 235.0, 409.0, 545.0, 866.0, 1347.0, 2044.0, 3231.0, 4827.0, 6937.0, 10294.0, 14626.0, 21096.0, 28091.0, 37632.0, 47749.0, 59750.0, 70403.0, 79783.0, 86043.0, 88503.0, 86132.0, 80505.0, 71218.0, 60017.0, 48829.0, 38709.0, 29120.0, 21477.0, 15392.0, 10786.0, 7216.0, 5098.0, 3283.0, 2153.0, 1393.0, 875.0, 611.0, 383.0, 219.0, 133.0, 101.0, 56.0, 31.0, 21.0, 23.0, 13.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0], "bins": [-16.265625, -15.75, -15.234375, -14.71875, -14.203125, -13.6875, -13.171875, -12.65625, -12.140625, -11.625, -11.109375, -10.59375, -10.078125, -9.5625, -9.046875, -8.53125, -8.015625, -7.5, -6.984375, -6.46875, -5.953125, -5.4375, -4.921875, -4.40625, -3.890625, -3.375, -2.859375, -2.34375, -1.828125, -1.3125, -0.796875, -0.28125, 0.234375, 0.75, 1.265625, 1.78125, 2.296875, 2.8125, 3.328125, 3.84375, 4.359375, 4.875, 5.390625, 5.90625, 6.421875, 6.9375, 7.453125, 7.96875, 8.484375, 9.0, 9.515625, 10.03125, 10.546875, 11.0625, 11.578125, 12.09375, 12.609375, 13.125, 13.640625, 14.15625, 14.671875, 15.1875, 15.703125, 16.21875, 16.734375]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 9.0, 11.0, 4.0, 6.0, 10.0, 14.0, 17.0, 14.0, 21.0, 38.0, 26.0, 27.0, 28.0, 36.0, 34.0, 33.0, 44.0, 42.0, 47.0, 41.0, 41.0, 51.0, 41.0, 57.0, 32.0, 36.0, 27.0, 25.0, 30.0, 21.0, 25.0, 29.0, 13.0, 17.0, 12.0, 6.0, 10.0, 3.0, 2.0, 6.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-38.75, -37.55810546875, -36.3662109375, -35.17431640625, -33.982421875, -32.79052734375, -31.5986328125, -30.40673828125, -29.21484375, -28.02294921875, -26.8310546875, -25.63916015625, -24.447265625, -23.25537109375, -22.0634765625, -20.87158203125, -19.6796875, -18.48779296875, -17.2958984375, -16.10400390625, -14.912109375, -13.72021484375, -12.5283203125, -11.33642578125, -10.14453125, -8.95263671875, -7.7607421875, -6.56884765625, -5.376953125, -4.18505859375, -2.9931640625, -1.80126953125, -0.609375, 0.58251953125, 1.7744140625, 2.96630859375, 4.158203125, 5.35009765625, 6.5419921875, 7.73388671875, 8.92578125, 10.11767578125, 11.3095703125, 12.50146484375, 13.693359375, 14.88525390625, 16.0771484375, 17.26904296875, 18.4609375, 19.65283203125, 20.8447265625, 22.03662109375, 23.228515625, 24.42041015625, 25.6123046875, 26.80419921875, 27.99609375, 29.18798828125, 30.3798828125, 31.57177734375, 32.763671875, 33.95556640625, 35.1474609375, 36.33935546875, 37.53125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 6.0, 5.0, 8.0, 15.0, 34.0, 53.0, 78.0, 124.0, 224.0, 311.0, 641.0, 870.0, 1411.0, 2076.0, 3164.0, 4857.0, 7163.0, 10425.0, 14941.0, 21042.0, 28782.0, 38204.0, 48965.0, 59787.0, 71117.0, 81015.0, 86629.0, 88805.0, 86452.0, 80180.0, 70874.0, 59567.0, 48120.0, 37639.0, 28420.0, 20714.0, 14666.0, 10366.0, 7136.0, 4789.0, 3180.0, 2086.0, 1294.0, 826.0, 570.0, 319.0, 237.0, 151.0, 83.0, 53.0, 33.0, 23.0, 14.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0], "bins": [-16.5, -15.975830078125, -15.45166015625, -14.927490234375, -14.4033203125, -13.879150390625, -13.35498046875, -12.830810546875, -12.306640625, -11.782470703125, -11.25830078125, -10.734130859375, -10.2099609375, -9.685791015625, -9.16162109375, -8.637451171875, -8.11328125, -7.589111328125, -7.06494140625, -6.540771484375, -6.0166015625, -5.492431640625, -4.96826171875, -4.444091796875, -3.919921875, -3.395751953125, -2.87158203125, -2.347412109375, -1.8232421875, -1.299072265625, -0.77490234375, -0.250732421875, 0.2734375, 0.797607421875, 1.32177734375, 1.845947265625, 2.3701171875, 2.894287109375, 3.41845703125, 3.942626953125, 4.466796875, 4.990966796875, 5.51513671875, 6.039306640625, 6.5634765625, 7.087646484375, 7.61181640625, 8.135986328125, 8.66015625, 9.184326171875, 9.70849609375, 10.232666015625, 10.7568359375, 11.281005859375, 11.80517578125, 12.329345703125, 12.853515625, 13.377685546875, 13.90185546875, 14.426025390625, 14.9501953125, 15.474365234375, 15.99853515625, 16.522705078125, 17.046875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 4.0, 7.0, 14.0, 10.0, 9.0, 14.0, 13.0, 10.0, 27.0, 16.0, 18.0, 25.0, 21.0, 31.0, 29.0, 46.0, 33.0, 39.0, 28.0, 27.0, 34.0, 41.0, 39.0, 38.0, 49.0, 42.0, 36.0, 27.0, 38.0, 27.0, 27.0, 21.0, 15.0, 26.0, 21.0, 20.0, 10.0, 9.0, 14.0, 11.0, 8.0, 5.0, 7.0, 1.0, 7.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.140625, -21.4345703125, -20.728515625, -20.0224609375, -19.31640625, -18.6103515625, -17.904296875, -17.1982421875, -16.4921875, -15.7861328125, -15.080078125, -14.3740234375, -13.66796875, -12.9619140625, -12.255859375, -11.5498046875, -10.84375, -10.1376953125, -9.431640625, -8.7255859375, -8.01953125, -7.3134765625, -6.607421875, -5.9013671875, -5.1953125, -4.4892578125, -3.783203125, -3.0771484375, -2.37109375, -1.6650390625, -0.958984375, -0.2529296875, 0.453125, 1.1591796875, 1.865234375, 2.5712890625, 3.27734375, 3.9833984375, 4.689453125, 5.3955078125, 6.1015625, 6.8076171875, 7.513671875, 8.2197265625, 8.92578125, 9.6318359375, 10.337890625, 11.0439453125, 11.75, 12.4560546875, 13.162109375, 13.8681640625, 14.57421875, 15.2802734375, 15.986328125, 16.6923828125, 17.3984375, 18.1044921875, 18.810546875, 19.5166015625, 20.22265625, 20.9287109375, 21.634765625, 22.3408203125, 23.046875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 8.0, 8.0, 13.0, 16.0, 36.0, 52.0, 83.0, 121.0, 176.0, 300.0, 419.0, 678.0, 1158.0, 1738.0, 2732.0, 4284.0, 6489.0, 9930.0, 14869.0, 21193.0, 30163.0, 41211.0, 53412.0, 67100.0, 79719.0, 89975.0, 94945.0, 95641.0, 90527.0, 80396.0, 68480.0, 54235.0, 41678.0, 30780.0, 21677.0, 15071.0, 10176.0, 6762.0, 4452.0, 2822.0, 1801.0, 1187.0, 789.0, 475.0, 273.0, 179.0, 117.0, 74.0, 52.0, 33.0, 26.0, 10.0, 8.0, 7.0, 5.0, 2.0, 2.0, 2.0], "bins": [-7.8671875, -7.6290283203125, -7.390869140625, -7.1527099609375, -6.91455078125, -6.6763916015625, -6.438232421875, -6.2000732421875, -5.9619140625, -5.7237548828125, -5.485595703125, -5.2474365234375, -5.00927734375, -4.7711181640625, -4.532958984375, -4.2947998046875, -4.056640625, -3.8184814453125, -3.580322265625, -3.3421630859375, -3.10400390625, -2.8658447265625, -2.627685546875, -2.3895263671875, -2.1513671875, -1.9132080078125, -1.675048828125, -1.4368896484375, -1.19873046875, -0.9605712890625, -0.722412109375, -0.4842529296875, -0.24609375, -0.0079345703125, 0.230224609375, 0.4683837890625, 0.70654296875, 0.9447021484375, 1.182861328125, 1.4210205078125, 1.6591796875, 1.8973388671875, 2.135498046875, 2.3736572265625, 2.61181640625, 2.8499755859375, 3.088134765625, 3.3262939453125, 3.564453125, 3.8026123046875, 4.040771484375, 4.2789306640625, 4.51708984375, 4.7552490234375, 4.993408203125, 5.2315673828125, 5.4697265625, 5.7078857421875, 5.946044921875, 6.1842041015625, 6.42236328125, 6.6605224609375, 6.898681640625, 7.1368408203125, 7.375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 6.0, 7.0, 5.0, 19.0, 12.0, 13.0, 20.0, 22.0, 25.0, 24.0, 22.0, 32.0, 33.0, 40.0, 45.0, 44.0, 31.0, 27.0, 33.0, 54.0, 42.0, 40.0, 47.0, 51.0, 29.0, 32.0, 35.0, 25.0, 26.0, 24.0, 23.0, 23.0, 14.0, 13.0, 13.0, 8.0, 7.0, 9.0, 10.0, 5.0, 6.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0010309219360351562, -0.0009992718696594238, -0.0009676218032836914, -0.000935971736907959, -0.0009043216705322266, -0.0008726716041564941, -0.0008410215377807617, -0.0008093714714050293, -0.0007777214050292969, -0.0007460713386535645, -0.000714421272277832, -0.0006827712059020996, -0.0006511211395263672, -0.0006194710731506348, -0.0005878210067749023, -0.0005561709403991699, -0.0005245208740234375, -0.0004928708076477051, -0.00046122074127197266, -0.00042957067489624023, -0.0003979206085205078, -0.0003662705421447754, -0.00033462047576904297, -0.00030297040939331055, -0.0002713203430175781, -0.0002396702766418457, -0.00020802021026611328, -0.00017637014389038086, -0.00014472007751464844, -0.00011307001113891602, -8.14199447631836e-05, -4.976987838745117e-05, -1.811981201171875e-05, 1.3530254364013672e-05, 4.5180320739746094e-05, 7.683038711547852e-05, 0.00010848045349121094, 0.00014013051986694336, 0.00017178058624267578, 0.0002034306526184082, 0.00023508071899414062, 0.00026673078536987305, 0.00029838085174560547, 0.0003300309181213379, 0.0003616809844970703, 0.00039333105087280273, 0.00042498111724853516, 0.0004566311836242676, 0.00048828125, 0.0005199313163757324, 0.0005515813827514648, 0.0005832314491271973, 0.0006148815155029297, 0.0006465315818786621, 0.0006781816482543945, 0.000709831714630127, 0.0007414817810058594, 0.0007731318473815918, 0.0008047819137573242, 0.0008364319801330566, 0.0008680820465087891, 0.0008997321128845215, 0.0009313821792602539, 0.0009630322456359863, 0.0009946823120117188]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 7.0, 18.0, 16.0, 37.0, 50.0, 70.0, 140.0, 231.0, 308.0, 512.0, 778.0, 1203.0, 1913.0, 2943.0, 4739.0, 7386.0, 11228.0, 17307.0, 26324.0, 37684.0, 53014.0, 70226.0, 88401.0, 102814.0, 110810.0, 108970.0, 99849.0, 84162.0, 65702.0, 48871.0, 34847.0, 23832.0, 15581.0, 10282.0, 6540.0, 4215.0, 2725.0, 1731.0, 1103.0, 709.0, 447.0, 283.0, 177.0, 128.0, 97.0, 57.0, 42.0, 27.0, 11.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.015625, -9.6912841796875, -9.366943359375, -9.0426025390625, -8.71826171875, -8.3939208984375, -8.069580078125, -7.7452392578125, -7.4208984375, -7.0965576171875, -6.772216796875, -6.4478759765625, -6.12353515625, -5.7991943359375, -5.474853515625, -5.1505126953125, -4.826171875, -4.5018310546875, -4.177490234375, -3.8531494140625, -3.52880859375, -3.2044677734375, -2.880126953125, -2.5557861328125, -2.2314453125, -1.9071044921875, -1.582763671875, -1.2584228515625, -0.93408203125, -0.6097412109375, -0.285400390625, 0.0389404296875, 0.36328125, 0.6876220703125, 1.011962890625, 1.3363037109375, 1.66064453125, 1.9849853515625, 2.309326171875, 2.6336669921875, 2.9580078125, 3.2823486328125, 3.606689453125, 3.9310302734375, 4.25537109375, 4.5797119140625, 4.904052734375, 5.2283935546875, 5.552734375, 5.8770751953125, 6.201416015625, 6.5257568359375, 6.85009765625, 7.1744384765625, 7.498779296875, 7.8231201171875, 8.1474609375, 8.4718017578125, 8.796142578125, 9.1204833984375, 9.44482421875, 9.7691650390625, 10.093505859375, 10.4178466796875, 10.7421875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 5.0, 3.0, 11.0, 9.0, 17.0, 18.0, 21.0, 14.0, 35.0, 30.0, 39.0, 44.0, 49.0, 48.0, 59.0, 58.0, 56.0, 69.0, 59.0, 54.0, 42.0, 47.0, 45.0, 35.0, 38.0, 16.0, 17.0, 16.0, 8.0, 11.0, 4.0, 4.0, 9.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.109375, -5.90814208984375, -5.7069091796875, -5.50567626953125, -5.304443359375, -5.10321044921875, -4.9019775390625, -4.70074462890625, -4.49951171875, -4.29827880859375, -4.0970458984375, -3.89581298828125, -3.694580078125, -3.49334716796875, -3.2921142578125, -3.09088134765625, -2.8896484375, -2.68841552734375, -2.4871826171875, -2.28594970703125, -2.084716796875, -1.88348388671875, -1.6822509765625, -1.48101806640625, -1.27978515625, -1.07855224609375, -0.8773193359375, -0.67608642578125, -0.474853515625, -0.27362060546875, -0.0723876953125, 0.12884521484375, 0.330078125, 0.53131103515625, 0.7325439453125, 0.93377685546875, 1.135009765625, 1.33624267578125, 1.5374755859375, 1.73870849609375, 1.93994140625, 2.14117431640625, 2.3424072265625, 2.54364013671875, 2.744873046875, 2.94610595703125, 3.1473388671875, 3.34857177734375, 3.5498046875, 3.75103759765625, 3.9522705078125, 4.15350341796875, 4.354736328125, 4.55596923828125, 4.7572021484375, 4.95843505859375, 5.15966796875, 5.36090087890625, 5.5621337890625, 5.76336669921875, 5.964599609375, 6.16583251953125, 6.3670654296875, 6.56829833984375, 6.76953125]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 4.0, 6.0, 8.0, 12.0, 7.0, 17.0, 14.0, 15.0, 16.0, 17.0, 31.0, 20.0, 38.0, 32.0, 43.0, 40.0, 31.0, 57.0, 40.0, 45.0, 49.0, 52.0, 43.0, 38.0, 43.0, 24.0, 22.0, 31.0, 24.0, 29.0, 26.0, 23.0, 17.0, 23.0, 13.0, 13.0, 11.0, 5.0, 7.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.32360076904297, -30.26119613647461, -29.19879150390625, -28.136384963989258, -27.0739803314209, -26.01157569885254, -24.949169158935547, -23.886764526367188, -22.824359893798828, -21.76195526123047, -20.69955062866211, -19.637144088745117, -18.574739456176758, -17.5123348236084, -16.449928283691406, -15.387523651123047, -14.325119018554688, -13.262714385986328, -12.200308799743652, -11.137903213500977, -10.075498580932617, -9.013093948364258, -7.950688362121582, -6.8882832527160645, -5.825878143310547, -4.763473033905029, -3.7010679244995117, -2.638662815093994, -1.5762577056884766, -0.513852596282959, 0.5485525131225586, 1.6109576225280762, 2.6733627319335938, 3.7357678413391113, 4.798172950744629, 5.8605780601501465, 6.922983169555664, 7.985388278961182, 9.0477933883667, 10.110198974609375, 11.172603607177734, 12.235008239746094, 13.29741382598877, 14.359819412231445, 15.422224044799805, 16.484628677368164, 17.547035217285156, 18.609439849853516, 19.671844482421875, 20.734249114990234, 21.796653747558594, 22.859060287475586, 23.921464920043945, 24.983869552612305, 26.046276092529297, 27.108680725097656, 28.171085357666016, 29.233489990234375, 30.295894622802734, 31.358301162719727, 32.42070770263672, 33.48311233520508, 34.54551696777344, 35.6079216003418, 36.670326232910156]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 7.0, 5.0, 8.0, 17.0, 10.0, 14.0, 17.0, 17.0, 13.0, 24.0, 40.0, 21.0, 41.0, 39.0, 26.0, 47.0, 45.0, 47.0, 40.0, 30.0, 49.0, 35.0, 42.0, 44.0, 39.0, 41.0, 34.0, 31.0, 18.0, 24.0, 17.0, 21.0, 18.0, 16.0, 11.0, 12.0, 7.0, 9.0, 8.0, 2.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-43.800445556640625, -42.559967041015625, -41.319488525390625, -40.079010009765625, -38.838531494140625, -37.598052978515625, -36.357574462890625, -35.117095947265625, -33.876617431640625, -32.636138916015625, -31.395660400390625, -30.155181884765625, -28.914703369140625, -27.674224853515625, -26.433748245239258, -25.193269729614258, -23.95279312133789, -22.71231460571289, -21.47183609008789, -20.23135757446289, -18.99087905883789, -17.75040054321289, -16.509923934936523, -15.269445419311523, -14.028966903686523, -12.788488388061523, -11.548009872436523, -10.30753231048584, -9.06705379486084, -7.82657527923584, -6.586097240447998, -5.345619201660156, -4.105140686035156, -2.8646624088287354, -1.6241841316223145, -0.38370585441589355, 0.8567724227905273, 2.0972509384155273, 3.337728977203369, 4.578207015991211, 5.818685531616211, 7.059164047241211, 8.299642562866211, 9.540120124816895, 10.780598640441895, 12.021077156066895, 13.261554718017578, 14.502033233642578, 15.742511749267578, 16.982990264892578, 18.223468780517578, 19.463947296142578, 20.704425811767578, 21.944904327392578, 23.185380935668945, 24.425859451293945, 25.666337966918945, 26.906816482543945, 28.147294998168945, 29.387773513793945, 30.628250122070312, 31.868728637695312, 33.10920715332031, 34.34968566894531, 35.59016418457031]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 5.0, 13.0, 12.0, 25.0, 32.0, 51.0, 111.0, 151.0, 289.0, 434.0, 778.0, 1265.0, 1974.0, 3366.0, 5265.0, 8420.0, 13238.0, 20618.0, 31371.0, 47979.0, 69343.0, 97788.0, 135348.0, 178086.0, 229624.0, 278767.0, 323072.0, 357010.0, 373244.0, 369504.0, 345760.0, 305699.0, 258341.0, 207236.0, 158982.0, 118180.0, 84629.0, 58540.0, 39492.0, 25818.0, 16791.0, 10769.0, 6663.0, 4045.0, 2487.0, 1512.0, 935.0, 536.0, 300.0, 188.0, 84.0, 50.0, 32.0, 13.0, 14.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0], "bins": [-21.078125, -20.414794921875, -19.75146484375, -19.088134765625, -18.4248046875, -17.761474609375, -17.09814453125, -16.434814453125, -15.771484375, -15.108154296875, -14.44482421875, -13.781494140625, -13.1181640625, -12.454833984375, -11.79150390625, -11.128173828125, -10.46484375, -9.801513671875, -9.13818359375, -8.474853515625, -7.8115234375, -7.148193359375, -6.48486328125, -5.821533203125, -5.158203125, -4.494873046875, -3.83154296875, -3.168212890625, -2.5048828125, -1.841552734375, -1.17822265625, -0.514892578125, 0.1484375, 0.811767578125, 1.47509765625, 2.138427734375, 2.8017578125, 3.465087890625, 4.12841796875, 4.791748046875, 5.455078125, 6.118408203125, 6.78173828125, 7.445068359375, 8.1083984375, 8.771728515625, 9.43505859375, 10.098388671875, 10.76171875, 11.425048828125, 12.08837890625, 12.751708984375, 13.4150390625, 14.078369140625, 14.74169921875, 15.405029296875, 16.068359375, 16.731689453125, 17.39501953125, 18.058349609375, 18.7216796875, 19.385009765625, 20.04833984375, 20.711669921875, 21.375]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 5.0, 5.0, 10.0, 6.0, 12.0, 12.0, 16.0, 14.0, 18.0, 16.0, 17.0, 33.0, 31.0, 38.0, 37.0, 30.0, 45.0, 39.0, 45.0, 45.0, 31.0, 43.0, 36.0, 48.0, 40.0, 43.0, 35.0, 34.0, 35.0, 26.0, 19.0, 18.0, 20.0, 19.0, 19.0, 10.0, 12.0, 10.0, 6.0, 8.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-38.28125, -37.205322265625, -36.12939453125, -35.053466796875, -33.9775390625, -32.901611328125, -31.82568359375, -30.749755859375, -29.673828125, -28.597900390625, -27.52197265625, -26.446044921875, -25.3701171875, -24.294189453125, -23.21826171875, -22.142333984375, -21.06640625, -19.990478515625, -18.91455078125, -17.838623046875, -16.7626953125, -15.686767578125, -14.61083984375, -13.534912109375, -12.458984375, -11.383056640625, -10.30712890625, -9.231201171875, -8.1552734375, -7.079345703125, -6.00341796875, -4.927490234375, -3.8515625, -2.775634765625, -1.69970703125, -0.623779296875, 0.4521484375, 1.528076171875, 2.60400390625, 3.679931640625, 4.755859375, 5.831787109375, 6.90771484375, 7.983642578125, 9.0595703125, 10.135498046875, 11.21142578125, 12.287353515625, 13.36328125, 14.439208984375, 15.51513671875, 16.591064453125, 17.6669921875, 18.742919921875, 19.81884765625, 20.894775390625, 21.970703125, 23.046630859375, 24.12255859375, 25.198486328125, 26.2744140625, 27.350341796875, 28.42626953125, 29.502197265625, 30.578125]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 6.0, 24.0, 34.0, 44.0, 77.0, 167.0, 286.0, 509.0, 851.0, 1447.0, 2416.0, 3860.0, 6199.0, 9867.0, 15076.0, 23595.0, 34799.0, 49971.0, 70414.0, 96981.0, 127712.0, 164477.0, 202910.0, 243498.0, 279920.0, 308627.0, 326733.0, 331818.0, 324422.0, 303976.0, 271296.0, 233913.0, 193321.0, 155416.0, 120227.0, 89512.0, 65183.0, 45498.0, 31727.0, 21149.0, 13566.0, 8658.0, 5518.0, 3410.0, 2143.0, 1264.0, 779.0, 469.0, 232.0, 139.0, 57.0, 46.0, 28.0, 13.0, 8.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-19.75, -19.099853515625, -18.44970703125, -17.799560546875, -17.1494140625, -16.499267578125, -15.84912109375, -15.198974609375, -14.548828125, -13.898681640625, -13.24853515625, -12.598388671875, -11.9482421875, -11.298095703125, -10.64794921875, -9.997802734375, -9.34765625, -8.697509765625, -8.04736328125, -7.397216796875, -6.7470703125, -6.096923828125, -5.44677734375, -4.796630859375, -4.146484375, -3.496337890625, -2.84619140625, -2.196044921875, -1.5458984375, -0.895751953125, -0.24560546875, 0.404541015625, 1.0546875, 1.704833984375, 2.35498046875, 3.005126953125, 3.6552734375, 4.305419921875, 4.95556640625, 5.605712890625, 6.255859375, 6.906005859375, 7.55615234375, 8.206298828125, 8.8564453125, 9.506591796875, 10.15673828125, 10.806884765625, 11.45703125, 12.107177734375, 12.75732421875, 13.407470703125, 14.0576171875, 14.707763671875, 15.35791015625, 16.008056640625, 16.658203125, 17.308349609375, 17.95849609375, 18.608642578125, 19.2587890625, 19.908935546875, 20.55908203125, 21.209228515625, 21.859375]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 5.0, 2.0, 3.0, 7.0, 12.0, 6.0, 13.0, 20.0, 22.0, 21.0, 35.0, 42.0, 44.0, 55.0, 83.0, 91.0, 107.0, 114.0, 137.0, 147.0, 151.0, 186.0, 204.0, 193.0, 214.0, 213.0, 184.0, 200.0, 177.0, 176.0, 173.0, 150.0, 145.0, 122.0, 107.0, 116.0, 75.0, 76.0, 55.0, 38.0, 49.0, 34.0, 18.0, 17.0, 16.0, 17.0, 6.0, 0.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0390625, -13.5797119140625, -13.120361328125, -12.6610107421875, -12.20166015625, -11.7423095703125, -11.282958984375, -10.8236083984375, -10.3642578125, -9.9049072265625, -9.445556640625, -8.9862060546875, -8.52685546875, -8.0675048828125, -7.608154296875, -7.1488037109375, -6.689453125, -6.2301025390625, -5.770751953125, -5.3114013671875, -4.85205078125, -4.3927001953125, -3.933349609375, -3.4739990234375, -3.0146484375, -2.5552978515625, -2.095947265625, -1.6365966796875, -1.17724609375, -0.7178955078125, -0.258544921875, 0.2008056640625, 0.66015625, 1.1195068359375, 1.578857421875, 2.0382080078125, 2.49755859375, 2.9569091796875, 3.416259765625, 3.8756103515625, 4.3349609375, 4.7943115234375, 5.253662109375, 5.7130126953125, 6.17236328125, 6.6317138671875, 7.091064453125, 7.5504150390625, 8.009765625, 8.4691162109375, 8.928466796875, 9.3878173828125, 9.84716796875, 10.3065185546875, 10.765869140625, 11.2252197265625, 11.6845703125, 12.1439208984375, 12.603271484375, 13.0626220703125, 13.52197265625, 13.9813232421875, 14.440673828125, 14.9000244140625, 15.359375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 4.0, 7.0, 3.0, 8.0, 6.0, 7.0, 8.0, 13.0, 10.0, 10.0, 18.0, 16.0, 17.0, 25.0, 34.0, 28.0, 24.0, 28.0, 41.0, 34.0, 43.0, 40.0, 44.0, 39.0, 41.0, 40.0, 40.0, 35.0, 41.0, 40.0, 26.0, 29.0, 21.0, 29.0, 24.0, 20.0, 17.0, 19.0, 13.0, 8.0, 11.0, 13.0, 8.0, 7.0, 2.0, 3.0, 5.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.375167846679688, -29.360464096069336, -28.345760345458984, -27.3310546875, -26.31635093688965, -25.301647186279297, -24.286941528320312, -23.27223777770996, -22.25753402709961, -21.242830276489258, -20.228126525878906, -19.213420867919922, -18.19871711730957, -17.18401336669922, -16.169307708740234, -15.154603958129883, -14.139900207519531, -13.12519645690918, -12.110491752624512, -11.095787048339844, -10.081083297729492, -9.06637954711914, -8.051674842834473, -7.036970615386963, -6.022266387939453, -5.007562160491943, -3.9928579330444336, -2.978153705596924, -1.963449478149414, -0.9487452507019043, 0.06595897674560547, 1.0806632041931152, 2.0953636169433594, 3.110067844390869, 4.124772071838379, 5.139476299285889, 6.154180526733398, 7.168884754180908, 8.183588981628418, 9.198293685913086, 10.212997436523438, 11.227701187133789, 12.242405891418457, 13.257110595703125, 14.271814346313477, 15.286518096923828, 16.301223754882812, 17.315927505493164, 18.330631256103516, 19.345335006713867, 20.36003875732422, 21.374744415283203, 22.389448165893555, 23.404151916503906, 24.41885757446289, 25.433561325073242, 26.448265075683594, 27.462968826293945, 28.477672576904297, 29.49237823486328, 30.507081985473633, 31.521785736083984, 32.53649139404297, 33.55119323730469, 34.56589889526367]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 8.0, 14.0, 9.0, 7.0, 12.0, 13.0, 17.0, 10.0, 20.0, 19.0, 23.0, 36.0, 38.0, 29.0, 37.0, 50.0, 34.0, 43.0, 30.0, 39.0, 41.0, 46.0, 27.0, 44.0, 32.0, 35.0, 34.0, 39.0, 21.0, 20.0, 22.0, 23.0, 19.0, 19.0, 19.0, 18.0, 8.0, 11.0, 8.0, 6.0, 4.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-39.163963317871094, -38.01884460449219, -36.87372970581055, -35.72861099243164, -34.583492279052734, -33.438377380371094, -32.29325866699219, -31.14813995361328, -30.003023147583008, -28.857906341552734, -27.712787628173828, -26.567670822143555, -25.42255401611328, -24.277435302734375, -23.1323184967041, -21.987201690673828, -20.842082977294922, -19.69696617126465, -18.551847457885742, -17.40673065185547, -16.261611938476562, -15.116495132446289, -13.971378326416016, -12.826260566711426, -11.681142807006836, -10.536025047302246, -9.390907287597656, -8.245790481567383, -7.100672721862793, -5.955554962158203, -4.8104376792907715, -3.66532039642334, -2.52020263671875, -1.3750851154327393, -0.22996759414672852, 0.9151499271392822, 2.060267448425293, 3.205385208129883, 4.3505024909973145, 5.495619773864746, 6.640737533569336, 7.785855293273926, 8.930973052978516, 10.076089859008789, 11.221207618713379, 12.366325378417969, 13.511442184448242, 14.656559944152832, 15.801677703857422, 16.946794509887695, 18.0919132232666, 19.237030029296875, 20.38214874267578, 21.527265548706055, 22.672382354736328, 23.817501068115234, 24.962617874145508, 26.10773468017578, 27.252853393554688, 28.39797019958496, 29.543087005615234, 30.68820571899414, 31.833322525024414, 32.97843933105469, 34.123558044433594]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 13.0, 10.0, 15.0, 15.0, 35.0, 37.0, 46.0, 77.0, 128.0, 220.0, 340.0, 538.0, 908.0, 1640.0, 3014.0, 5709.0, 12022.0, 27121.0, 68181.0, 173603.0, 326991.0, 248740.0, 104445.0, 40413.0, 17217.0, 7959.0, 4028.0, 2089.0, 1195.0, 694.0, 396.0, 246.0, 156.0, 114.0, 70.0, 34.0, 31.0, 24.0, 10.0, 14.0, 7.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-11.4296875, -11.1097412109375, -10.789794921875, -10.4698486328125, -10.14990234375, -9.8299560546875, -9.510009765625, -9.1900634765625, -8.8701171875, -8.5501708984375, -8.230224609375, -7.9102783203125, -7.59033203125, -7.2703857421875, -6.950439453125, -6.6304931640625, -6.310546875, -5.9906005859375, -5.670654296875, -5.3507080078125, -5.03076171875, -4.7108154296875, -4.390869140625, -4.0709228515625, -3.7509765625, -3.4310302734375, -3.111083984375, -2.7911376953125, -2.47119140625, -2.1512451171875, -1.831298828125, -1.5113525390625, -1.19140625, -0.8714599609375, -0.551513671875, -0.2315673828125, 0.08837890625, 0.4083251953125, 0.728271484375, 1.0482177734375, 1.3681640625, 1.6881103515625, 2.008056640625, 2.3280029296875, 2.64794921875, 2.9678955078125, 3.287841796875, 3.6077880859375, 3.927734375, 4.2476806640625, 4.567626953125, 4.8875732421875, 5.20751953125, 5.5274658203125, 5.847412109375, 6.1673583984375, 6.4873046875, 6.8072509765625, 7.127197265625, 7.4471435546875, 7.76708984375, 8.0870361328125, 8.406982421875, 8.7269287109375, 9.046875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 9.0, 12.0, 8.0, 9.0, 12.0, 12.0, 17.0, 11.0, 18.0, 19.0, 24.0, 35.0, 37.0, 27.0, 38.0, 53.0, 34.0, 40.0, 34.0, 37.0, 42.0, 46.0, 29.0, 40.0, 35.0, 34.0, 35.0, 39.0, 20.0, 21.0, 21.0, 22.0, 21.0, 19.0, 19.0, 17.0, 9.0, 9.0, 10.0, 6.0, 4.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-39.34375, -38.1982421875, -37.052734375, -35.9072265625, -34.76171875, -33.6162109375, -32.470703125, -31.3251953125, -30.1796875, -29.0341796875, -27.888671875, -26.7431640625, -25.59765625, -24.4521484375, -23.306640625, -22.1611328125, -21.015625, -19.8701171875, -18.724609375, -17.5791015625, -16.43359375, -15.2880859375, -14.142578125, -12.9970703125, -11.8515625, -10.7060546875, -9.560546875, -8.4150390625, -7.26953125, -6.1240234375, -4.978515625, -3.8330078125, -2.6875, -1.5419921875, -0.396484375, 0.7490234375, 1.89453125, 3.0400390625, 4.185546875, 5.3310546875, 6.4765625, 7.6220703125, 8.767578125, 9.9130859375, 11.05859375, 12.2041015625, 13.349609375, 14.4951171875, 15.640625, 16.7861328125, 17.931640625, 19.0771484375, 20.22265625, 21.3681640625, 22.513671875, 23.6591796875, 24.8046875, 25.9501953125, 27.095703125, 28.2412109375, 29.38671875, 30.5322265625, 31.677734375, 32.8232421875, 33.96875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 12.0, 11.0, 15.0, 20.0, 24.0, 32.0, 49.0, 71.0, 82.0, 108.0, 196.0, 279.0, 429.0, 622.0, 988.0, 1616.0, 2921.0, 5544.0, 11241.0, 25753.0, 69733.0, 216626.0, 409574.0, 193738.0, 62563.0, 23625.0, 10542.0, 5137.0, 2678.0, 1520.0, 925.0, 591.0, 359.0, 270.0, 195.0, 120.0, 79.0, 70.0, 42.0, 41.0, 25.0, 20.0, 20.0, 11.0, 6.0, 10.0, 2.0, 8.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.5234375, -8.2340087890625, -7.944580078125, -7.6551513671875, -7.36572265625, -7.0762939453125, -6.786865234375, -6.4974365234375, -6.2080078125, -5.9185791015625, -5.629150390625, -5.3397216796875, -5.05029296875, -4.7608642578125, -4.471435546875, -4.1820068359375, -3.892578125, -3.6031494140625, -3.313720703125, -3.0242919921875, -2.73486328125, -2.4454345703125, -2.156005859375, -1.8665771484375, -1.5771484375, -1.2877197265625, -0.998291015625, -0.7088623046875, -0.41943359375, -0.1300048828125, 0.159423828125, 0.4488525390625, 0.73828125, 1.0277099609375, 1.317138671875, 1.6065673828125, 1.89599609375, 2.1854248046875, 2.474853515625, 2.7642822265625, 3.0537109375, 3.3431396484375, 3.632568359375, 3.9219970703125, 4.21142578125, 4.5008544921875, 4.790283203125, 5.0797119140625, 5.369140625, 5.6585693359375, 5.947998046875, 6.2374267578125, 6.52685546875, 6.8162841796875, 7.105712890625, 7.3951416015625, 7.6845703125, 7.9739990234375, 8.263427734375, 8.5528564453125, 8.84228515625, 9.1317138671875, 9.421142578125, 9.7105712890625, 10.0]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 2.0, 6.0, 10.0, 12.0, 11.0, 8.0, 14.0, 23.0, 20.0, 24.0, 33.0, 24.0, 30.0, 34.0, 43.0, 32.0, 38.0, 48.0, 32.0, 38.0, 43.0, 43.0, 34.0, 38.0, 31.0, 34.0, 29.0, 41.0, 27.0, 24.0, 18.0, 25.0, 20.0, 19.0, 16.0, 16.0, 14.0, 11.0, 9.0, 6.0, 5.0, 4.0, 3.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.671875, -23.877197265625, -23.08251953125, -22.287841796875, -21.4931640625, -20.698486328125, -19.90380859375, -19.109130859375, -18.314453125, -17.519775390625, -16.72509765625, -15.930419921875, -15.1357421875, -14.341064453125, -13.54638671875, -12.751708984375, -11.95703125, -11.162353515625, -10.36767578125, -9.572998046875, -8.7783203125, -7.983642578125, -7.18896484375, -6.394287109375, -5.599609375, -4.804931640625, -4.01025390625, -3.215576171875, -2.4208984375, -1.626220703125, -0.83154296875, -0.036865234375, 0.7578125, 1.552490234375, 2.34716796875, 3.141845703125, 3.9365234375, 4.731201171875, 5.52587890625, 6.320556640625, 7.115234375, 7.909912109375, 8.70458984375, 9.499267578125, 10.2939453125, 11.088623046875, 11.88330078125, 12.677978515625, 13.47265625, 14.267333984375, 15.06201171875, 15.856689453125, 16.6513671875, 17.446044921875, 18.24072265625, 19.035400390625, 19.830078125, 20.624755859375, 21.41943359375, 22.214111328125, 23.0087890625, 23.803466796875, 24.59814453125, 25.392822265625, 26.1875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 8.0, 6.0, 0.0, 9.0, 11.0, 15.0, 18.0, 26.0, 34.0, 40.0, 57.0, 89.0, 140.0, 230.0, 394.0, 712.0, 1368.0, 2887.0, 7044.0, 22541.0, 127347.0, 748534.0, 105366.0, 19759.0, 6390.0, 2637.0, 1254.0, 667.0, 347.0, 216.0, 130.0, 86.0, 65.0, 34.0, 31.0, 15.0, 20.0, 10.0, 5.0, 6.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0], "bins": [-10.15625, -9.89886474609375, -9.6414794921875, -9.38409423828125, -9.126708984375, -8.86932373046875, -8.6119384765625, -8.35455322265625, -8.09716796875, -7.83978271484375, -7.5823974609375, -7.32501220703125, -7.067626953125, -6.81024169921875, -6.5528564453125, -6.29547119140625, -6.0380859375, -5.78070068359375, -5.5233154296875, -5.26593017578125, -5.008544921875, -4.75115966796875, -4.4937744140625, -4.23638916015625, -3.97900390625, -3.72161865234375, -3.4642333984375, -3.20684814453125, -2.949462890625, -2.69207763671875, -2.4346923828125, -2.17730712890625, -1.919921875, -1.66253662109375, -1.4051513671875, -1.14776611328125, -0.890380859375, -0.63299560546875, -0.3756103515625, -0.11822509765625, 0.13916015625, 0.39654541015625, 0.6539306640625, 0.91131591796875, 1.168701171875, 1.42608642578125, 1.6834716796875, 1.94085693359375, 2.1982421875, 2.45562744140625, 2.7130126953125, 2.97039794921875, 3.227783203125, 3.48516845703125, 3.7425537109375, 3.99993896484375, 4.25732421875, 4.51470947265625, 4.7720947265625, 5.02947998046875, 5.286865234375, 5.54425048828125, 5.8016357421875, 6.05902099609375, 6.31640625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 12.0, 15.0, 21.0, 23.0, 53.0, 70.0, 94.0, 131.0, 145.0, 110.0, 119.0, 72.0, 41.0, 28.0, 32.0, 15.0, 10.0, 6.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003485679626464844, -0.00033321231603622437, -0.00031785666942596436, -0.00030250102281570435, -0.00028714537620544434, -0.0002717897295951843, -0.0002564340829849243, -0.0002410784363746643, -0.0002257227897644043, -0.0002103671431541443, -0.00019501149654388428, -0.00017965584993362427, -0.00016430020332336426, -0.00014894455671310425, -0.00013358891010284424, -0.00011823326349258423, -0.00010287761688232422, -8.752197027206421e-05, -7.21663236618042e-05, -5.681067705154419e-05, -4.145503044128418e-05, -2.609938383102417e-05, -1.074373722076416e-05, 4.61190938949585e-06, 1.996755599975586e-05, 3.532320261001587e-05, 5.067884922027588e-05, 6.603449583053589e-05, 8.13901424407959e-05, 9.674578905105591e-05, 0.00011210143566131592, 0.00012745708227157593, 0.00014281272888183594, 0.00015816837549209595, 0.00017352402210235596, 0.00018887966871261597, 0.00020423531532287598, 0.00021959096193313599, 0.000234946608543396, 0.000250302255153656, 0.000265657901763916, 0.000281013548374176, 0.00029636919498443604, 0.00031172484159469604, 0.00032708048820495605, 0.00034243613481521606, 0.0003577917814254761, 0.0003731474280357361, 0.0003885030746459961, 0.0004038587212562561, 0.0004192143678665161, 0.0004345700144767761, 0.00044992566108703613, 0.00046528130769729614, 0.00048063695430755615, 0.0004959926009178162, 0.0005113482475280762, 0.0005267038941383362, 0.0005420595407485962, 0.0005574151873588562, 0.0005727708339691162, 0.0005881264805793762, 0.0006034821271896362, 0.0006188377737998962, 0.0006341934204101562]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 6.0, 15.0, 17.0, 20.0, 31.0, 39.0, 72.0, 99.0, 152.0, 212.0, 322.0, 474.0, 709.0, 1253.0, 2122.0, 4458.0, 11105.0, 35460.0, 139543.0, 494775.0, 265007.0, 61564.0, 17656.0, 6342.0, 2887.0, 1583.0, 893.0, 579.0, 393.0, 236.0, 180.0, 101.0, 87.0, 48.0, 26.0, 25.0, 17.0, 15.0, 10.0, 6.0, 8.0, 2.0, 2.0, 2.0, 3.0], "bins": [-12.4140625, -12.0933837890625, -11.772705078125, -11.4520263671875, -11.13134765625, -10.8106689453125, -10.489990234375, -10.1693115234375, -9.8486328125, -9.5279541015625, -9.207275390625, -8.8865966796875, -8.56591796875, -8.2452392578125, -7.924560546875, -7.6038818359375, -7.283203125, -6.9625244140625, -6.641845703125, -6.3211669921875, -6.00048828125, -5.6798095703125, -5.359130859375, -5.0384521484375, -4.7177734375, -4.3970947265625, -4.076416015625, -3.7557373046875, -3.43505859375, -3.1143798828125, -2.793701171875, -2.4730224609375, -2.15234375, -1.8316650390625, -1.510986328125, -1.1903076171875, -0.86962890625, -0.5489501953125, -0.228271484375, 0.0924072265625, 0.4130859375, 0.7337646484375, 1.054443359375, 1.3751220703125, 1.69580078125, 2.0164794921875, 2.337158203125, 2.6578369140625, 2.978515625, 3.2991943359375, 3.619873046875, 3.9405517578125, 4.26123046875, 4.5819091796875, 4.902587890625, 5.2232666015625, 5.5439453125, 5.8646240234375, 6.185302734375, 6.5059814453125, 6.82666015625, 7.1473388671875, 7.468017578125, 7.7886962890625, 8.109375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 7.0, 8.0, 9.0, 10.0, 9.0, 9.0, 9.0, 18.0, 13.0, 22.0, 18.0, 29.0, 43.0, 51.0, 68.0, 56.0, 69.0, 69.0, 81.0, 65.0, 51.0, 46.0, 42.0, 22.0, 35.0, 22.0, 13.0, 13.0, 14.0, 11.0, 13.0, 7.0, 7.0, 9.0, 7.0, 3.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.029296875, -1.9691619873046875, -1.909027099609375, -1.8488922119140625, -1.78875732421875, -1.7286224365234375, -1.668487548828125, -1.6083526611328125, -1.5482177734375, -1.4880828857421875, -1.427947998046875, -1.3678131103515625, -1.30767822265625, -1.2475433349609375, -1.187408447265625, -1.1272735595703125, -1.067138671875, -1.0070037841796875, -0.946868896484375, -0.8867340087890625, -0.82659912109375, -0.7664642333984375, -0.706329345703125, -0.6461944580078125, -0.5860595703125, -0.5259246826171875, -0.465789794921875, -0.4056549072265625, -0.34552001953125, -0.2853851318359375, -0.225250244140625, -0.1651153564453125, -0.10498046875, -0.0448455810546875, 0.015289306640625, 0.0754241943359375, 0.13555908203125, 0.1956939697265625, 0.255828857421875, 0.3159637451171875, 0.3760986328125, 0.4362335205078125, 0.496368408203125, 0.5565032958984375, 0.61663818359375, 0.6767730712890625, 0.736907958984375, 0.7970428466796875, 0.857177734375, 0.9173126220703125, 0.977447509765625, 1.0375823974609375, 1.09771728515625, 1.1578521728515625, 1.217987060546875, 1.2781219482421875, 1.3382568359375, 1.3983917236328125, 1.458526611328125, 1.5186614990234375, 1.57879638671875, 1.6389312744140625, 1.699066162109375, 1.7592010498046875, 1.8193359375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 1.0, 2.0, 0.0, 6.0, 3.0, 7.0, 5.0, 7.0, 5.0, 6.0, 12.0, 13.0, 11.0, 14.0, 15.0, 17.0, 25.0, 27.0, 31.0, 27.0, 26.0, 35.0, 35.0, 43.0, 46.0, 38.0, 44.0, 38.0, 45.0, 37.0, 37.0, 38.0, 45.0, 29.0, 23.0, 30.0, 25.0, 25.0, 19.0, 19.0, 13.0, 20.0, 13.0, 6.0, 13.0, 7.0, 9.0, 3.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.806119918823242, -29.78373908996582, -28.76136016845703, -27.73897933959961, -26.71660041809082, -25.6942195892334, -24.67184066772461, -23.649459838867188, -22.627079010009766, -21.604698181152344, -20.582319259643555, -19.559938430786133, -18.537559509277344, -17.515178680419922, -16.4927978515625, -15.470418930053711, -14.448040008544922, -13.425660133361816, -12.403280258178711, -11.380899429321289, -10.3585205078125, -9.336139678955078, -8.313759803771973, -7.291379928588867, -6.269000053405762, -5.246620178222656, -4.224240303039551, -3.201859951019287, -2.1794800758361816, -1.1571002006530762, -0.1347198486328125, 0.887660026550293, 1.9100379943847656, 2.932417869567871, 3.9547979831695557, 4.97717809677124, 5.999557971954346, 7.021937847137451, 8.044318199157715, 9.06669807434082, 10.089077949523926, 11.111457824707031, 12.133837699890137, 13.156217575073242, 14.178598403930664, 15.200977325439453, 16.223358154296875, 17.245738983154297, 18.268117904663086, 19.290498733520508, 20.312877655029297, 21.33525848388672, 22.357637405395508, 23.38001823425293, 24.40239715576172, 25.42477798461914, 26.447158813476562, 27.469539642333984, 28.491918563842773, 29.514299392700195, 30.536678314208984, 31.559059143066406, 32.58143997192383, 33.60382080078125, 34.626197814941406]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 9.0, 13.0, 6.0, 9.0, 14.0, 12.0, 14.0, 16.0, 16.0, 22.0, 26.0, 37.0, 36.0, 27.0, 39.0, 45.0, 36.0, 42.0, 32.0, 39.0, 34.0, 46.0, 36.0, 37.0, 37.0, 29.0, 40.0, 32.0, 22.0, 24.0, 19.0, 24.0, 20.0, 21.0, 17.0, 17.0, 11.0, 7.0, 8.0, 7.0, 5.0, 4.0, 6.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-39.06671905517578, -37.92647171020508, -36.786224365234375, -35.64597702026367, -34.50572967529297, -33.365482330322266, -32.22523498535156, -31.08498764038086, -29.944740295410156, -28.804492950439453, -27.66424560546875, -26.523998260498047, -25.383750915527344, -24.24350357055664, -23.103256225585938, -21.963008880615234, -20.82276153564453, -19.682514190673828, -18.542266845703125, -17.402019500732422, -16.26177215576172, -15.121524810791016, -13.981277465820312, -12.84103012084961, -11.700782775878906, -10.560535430908203, -9.4202880859375, -8.280040740966797, -7.139793395996094, -5.999546051025391, -4.8592987060546875, -3.7190513610839844, -2.5788002014160156, -1.4385528564453125, -0.2983055114746094, 0.8419418334960938, 1.9821891784667969, 3.1224365234375, 4.262683868408203, 5.402931213378906, 6.543178558349609, 7.6834259033203125, 8.823673248291016, 9.963920593261719, 11.104167938232422, 12.244415283203125, 13.384662628173828, 14.524909973144531, 15.665157318115234, 16.805404663085938, 17.94565200805664, 19.085899353027344, 20.226146697998047, 21.36639404296875, 22.506641387939453, 23.646888732910156, 24.78713607788086, 25.927383422851562, 27.067630767822266, 28.20787811279297, 29.348125457763672, 30.488372802734375, 31.628620147705078, 32.76886749267578, 33.909114837646484]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 6.0, 6.0, 16.0, 20.0, 34.0, 44.0, 79.0, 154.0, 257.0, 404.0, 744.0, 1202.0, 1957.0, 3132.0, 5036.0, 7757.0, 11770.0, 17597.0, 25373.0, 35253.0, 47551.0, 61684.0, 74922.0, 87285.0, 95393.0, 97914.0, 94915.0, 86706.0, 75014.0, 60598.0, 46979.0, 34839.0, 24812.0, 17365.0, 11525.0, 7431.0, 4808.0, 3121.0, 1864.0, 1198.0, 725.0, 441.0, 251.0, 163.0, 85.0, 46.0, 27.0, 25.0, 11.0, 12.0, 6.0, 0.0, 2.0, 1.0, 3.0, 2.0], "bins": [-18.796875, -18.2353515625, -17.673828125, -17.1123046875, -16.55078125, -15.9892578125, -15.427734375, -14.8662109375, -14.3046875, -13.7431640625, -13.181640625, -12.6201171875, -12.05859375, -11.4970703125, -10.935546875, -10.3740234375, -9.8125, -9.2509765625, -8.689453125, -8.1279296875, -7.56640625, -7.0048828125, -6.443359375, -5.8818359375, -5.3203125, -4.7587890625, -4.197265625, -3.6357421875, -3.07421875, -2.5126953125, -1.951171875, -1.3896484375, -0.828125, -0.2666015625, 0.294921875, 0.8564453125, 1.41796875, 1.9794921875, 2.541015625, 3.1025390625, 3.6640625, 4.2255859375, 4.787109375, 5.3486328125, 5.91015625, 6.4716796875, 7.033203125, 7.5947265625, 8.15625, 8.7177734375, 9.279296875, 9.8408203125, 10.40234375, 10.9638671875, 11.525390625, 12.0869140625, 12.6484375, 13.2099609375, 13.771484375, 14.3330078125, 14.89453125, 15.4560546875, 16.017578125, 16.5791015625, 17.140625]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 11.0, 10.0, 9.0, 11.0, 12.0, 12.0, 16.0, 16.0, 12.0, 26.0, 27.0, 35.0, 37.0, 32.0, 38.0, 41.0, 38.0, 43.0, 28.0, 39.0, 50.0, 36.0, 35.0, 40.0, 28.0, 38.0, 34.0, 31.0, 22.0, 24.0, 15.0, 27.0, 19.0, 21.0, 14.0, 22.0, 7.0, 8.0, 10.0, 5.0, 3.0, 5.0, 6.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-38.03125, -36.9140625, -35.796875, -34.6796875, -33.5625, -32.4453125, -31.328125, -30.2109375, -29.09375, -27.9765625, -26.859375, -25.7421875, -24.625, -23.5078125, -22.390625, -21.2734375, -20.15625, -19.0390625, -17.921875, -16.8046875, -15.6875, -14.5703125, -13.453125, -12.3359375, -11.21875, -10.1015625, -8.984375, -7.8671875, -6.75, -5.6328125, -4.515625, -3.3984375, -2.28125, -1.1640625, -0.046875, 1.0703125, 2.1875, 3.3046875, 4.421875, 5.5390625, 6.65625, 7.7734375, 8.890625, 10.0078125, 11.125, 12.2421875, 13.359375, 14.4765625, 15.59375, 16.7109375, 17.828125, 18.9453125, 20.0625, 21.1796875, 22.296875, 23.4140625, 24.53125, 25.6484375, 26.765625, 27.8828125, 29.0, 30.1171875, 31.234375, 32.3515625, 33.46875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 8.0, 15.0, 30.0, 34.0, 57.0, 85.0, 154.0, 257.0, 397.0, 592.0, 992.0, 1631.0, 2637.0, 4123.0, 6017.0, 9433.0, 13706.0, 19879.0, 28063.0, 37554.0, 48970.0, 61702.0, 73396.0, 83863.0, 90933.0, 92796.0, 89820.0, 82680.0, 71764.0, 60039.0, 47219.0, 36032.0, 26569.0, 19080.0, 13085.0, 8661.0, 5883.0, 3923.0, 2396.0, 1558.0, 941.0, 606.0, 371.0, 222.0, 151.0, 87.0, 50.0, 33.0, 37.0, 14.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.6875, -17.14208984375, -16.5966796875, -16.05126953125, -15.505859375, -14.96044921875, -14.4150390625, -13.86962890625, -13.32421875, -12.77880859375, -12.2333984375, -11.68798828125, -11.142578125, -10.59716796875, -10.0517578125, -9.50634765625, -8.9609375, -8.41552734375, -7.8701171875, -7.32470703125, -6.779296875, -6.23388671875, -5.6884765625, -5.14306640625, -4.59765625, -4.05224609375, -3.5068359375, -2.96142578125, -2.416015625, -1.87060546875, -1.3251953125, -0.77978515625, -0.234375, 0.31103515625, 0.8564453125, 1.40185546875, 1.947265625, 2.49267578125, 3.0380859375, 3.58349609375, 4.12890625, 4.67431640625, 5.2197265625, 5.76513671875, 6.310546875, 6.85595703125, 7.4013671875, 7.94677734375, 8.4921875, 9.03759765625, 9.5830078125, 10.12841796875, 10.673828125, 11.21923828125, 11.7646484375, 12.31005859375, 12.85546875, 13.40087890625, 13.9462890625, 14.49169921875, 15.037109375, 15.58251953125, 16.1279296875, 16.67333984375, 17.21875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [7.0, 3.0, 2.0, 3.0, 3.0, 6.0, 6.0, 9.0, 6.0, 8.0, 16.0, 10.0, 13.0, 15.0, 22.0, 28.0, 23.0, 29.0, 34.0, 41.0, 34.0, 53.0, 38.0, 35.0, 43.0, 55.0, 37.0, 44.0, 50.0, 28.0, 42.0, 33.0, 48.0, 23.0, 32.0, 20.0, 21.0, 20.0, 12.0, 9.0, 8.0, 8.0, 7.0, 8.0, 6.0, 5.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.484375, -18.7197265625, -17.955078125, -17.1904296875, -16.42578125, -15.6611328125, -14.896484375, -14.1318359375, -13.3671875, -12.6025390625, -11.837890625, -11.0732421875, -10.30859375, -9.5439453125, -8.779296875, -8.0146484375, -7.25, -6.4853515625, -5.720703125, -4.9560546875, -4.19140625, -3.4267578125, -2.662109375, -1.8974609375, -1.1328125, -0.3681640625, 0.396484375, 1.1611328125, 1.92578125, 2.6904296875, 3.455078125, 4.2197265625, 4.984375, 5.7490234375, 6.513671875, 7.2783203125, 8.04296875, 8.8076171875, 9.572265625, 10.3369140625, 11.1015625, 11.8662109375, 12.630859375, 13.3955078125, 14.16015625, 14.9248046875, 15.689453125, 16.4541015625, 17.21875, 17.9833984375, 18.748046875, 19.5126953125, 20.27734375, 21.0419921875, 21.806640625, 22.5712890625, 23.3359375, 24.1005859375, 24.865234375, 25.6298828125, 26.39453125, 27.1591796875, 27.923828125, 28.6884765625, 29.453125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 14.0, 20.0, 21.0, 35.0, 49.0, 65.0, 114.0, 147.0, 237.0, 395.0, 643.0, 1071.0, 1692.0, 2943.0, 4881.0, 8142.0, 13456.0, 22074.0, 34610.0, 51341.0, 72257.0, 93826.0, 112102.0, 122074.0, 119465.0, 107637.0, 87928.0, 65857.0, 46067.0, 30541.0, 19025.0, 11950.0, 7089.0, 4260.0, 2457.0, 1529.0, 952.0, 576.0, 357.0, 227.0, 145.0, 92.0, 59.0, 46.0, 31.0, 18.0, 10.0, 7.0, 13.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-9.7109375, -9.396240234375, -9.08154296875, -8.766845703125, -8.4521484375, -8.137451171875, -7.82275390625, -7.508056640625, -7.193359375, -6.878662109375, -6.56396484375, -6.249267578125, -5.9345703125, -5.619873046875, -5.30517578125, -4.990478515625, -4.67578125, -4.361083984375, -4.04638671875, -3.731689453125, -3.4169921875, -3.102294921875, -2.78759765625, -2.472900390625, -2.158203125, -1.843505859375, -1.52880859375, -1.214111328125, -0.8994140625, -0.584716796875, -0.27001953125, 0.044677734375, 0.359375, 0.674072265625, 0.98876953125, 1.303466796875, 1.6181640625, 1.932861328125, 2.24755859375, 2.562255859375, 2.876953125, 3.191650390625, 3.50634765625, 3.821044921875, 4.1357421875, 4.450439453125, 4.76513671875, 5.079833984375, 5.39453125, 5.709228515625, 6.02392578125, 6.338623046875, 6.6533203125, 6.968017578125, 7.28271484375, 7.597412109375, 7.912109375, 8.226806640625, 8.54150390625, 8.856201171875, 9.1708984375, 9.485595703125, 9.80029296875, 10.114990234375, 10.4296875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 5.0, 7.0, 14.0, 10.0, 9.0, 16.0, 22.0, 19.0, 22.0, 34.0, 29.0, 42.0, 39.0, 45.0, 53.0, 51.0, 51.0, 53.0, 51.0, 49.0, 64.0, 43.0, 50.0, 44.0, 39.0, 31.0, 22.0, 23.0, 9.0, 12.0, 8.0, 9.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0011548995971679688, -0.0011162906885147095, -0.0010776817798614502, -0.001039072871208191, -0.0010004639625549316, -0.0009618550539016724, -0.0009232461452484131, -0.0008846372365951538, -0.0008460283279418945, -0.0008074194192886353, -0.000768810510635376, -0.0007302016019821167, -0.0006915926933288574, -0.0006529837846755981, -0.0006143748760223389, -0.0005757659673690796, -0.0005371570587158203, -0.000498548150062561, -0.00045993924140930176, -0.0004213303327560425, -0.0003827214241027832, -0.0003441125154495239, -0.00030550360679626465, -0.00026689469814300537, -0.0002282857894897461, -0.00018967688083648682, -0.00015106797218322754, -0.00011245906352996826, -7.385015487670898e-05, -3.524124622344971e-05, 3.3676624298095703e-06, 4.197657108306885e-05, 8.058547973632812e-05, 0.0001191943883895874, 0.00015780329704284668, 0.00019641220569610596, 0.00023502111434936523, 0.0002736300230026245, 0.0003122389316558838, 0.00035084784030914307, 0.00038945674896240234, 0.0004280656576156616, 0.0004666745662689209, 0.0005052834749221802, 0.0005438923835754395, 0.0005825012922286987, 0.000621110200881958, 0.0006597191095352173, 0.0006983280181884766, 0.0007369369268417358, 0.0007755458354949951, 0.0008141547441482544, 0.0008527636528015137, 0.000891372561454773, 0.0009299814701080322, 0.0009685903787612915, 0.0010071992874145508, 0.00104580819606781, 0.0010844171047210693, 0.0011230260133743286, 0.0011616349220275879, 0.0012002438306808472, 0.0012388527393341064, 0.0012774616479873657, 0.001316070556640625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 7.0, 13.0, 20.0, 22.0, 44.0, 76.0, 118.0, 171.0, 274.0, 398.0, 694.0, 1038.0, 1777.0, 2911.0, 4866.0, 8262.0, 13889.0, 22717.0, 36385.0, 56057.0, 81092.0, 106928.0, 127563.0, 134117.0, 125130.0, 104265.0, 77941.0, 53871.0, 34500.0, 21050.0, 12722.0, 7737.0, 4636.0, 2795.0, 1667.0, 1056.0, 624.0, 407.0, 231.0, 185.0, 108.0, 71.0, 46.0, 29.0, 15.0, 13.0, 11.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1875, -11.787109375, -11.38671875, -10.986328125, -10.5859375, -10.185546875, -9.78515625, -9.384765625, -8.984375, -8.583984375, -8.18359375, -7.783203125, -7.3828125, -6.982421875, -6.58203125, -6.181640625, -5.78125, -5.380859375, -4.98046875, -4.580078125, -4.1796875, -3.779296875, -3.37890625, -2.978515625, -2.578125, -2.177734375, -1.77734375, -1.376953125, -0.9765625, -0.576171875, -0.17578125, 0.224609375, 0.625, 1.025390625, 1.42578125, 1.826171875, 2.2265625, 2.626953125, 3.02734375, 3.427734375, 3.828125, 4.228515625, 4.62890625, 5.029296875, 5.4296875, 5.830078125, 6.23046875, 6.630859375, 7.03125, 7.431640625, 7.83203125, 8.232421875, 8.6328125, 9.033203125, 9.43359375, 9.833984375, 10.234375, 10.634765625, 11.03515625, 11.435546875, 11.8359375, 12.236328125, 12.63671875, 13.037109375, 13.4375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 6.0, 9.0, 8.0, 4.0, 9.0, 9.0, 19.0, 15.0, 23.0, 29.0, 26.0, 32.0, 46.0, 44.0, 46.0, 35.0, 38.0, 53.0, 47.0, 49.0, 52.0, 46.0, 54.0, 40.0, 43.0, 24.0, 30.0, 27.0, 24.0, 17.0, 29.0, 19.0, 14.0, 9.0, 2.0, 8.0, 6.0, 5.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.60546875, -5.43853759765625, -5.2716064453125, -5.10467529296875, -4.937744140625, -4.77081298828125, -4.6038818359375, -4.43695068359375, -4.27001953125, -4.10308837890625, -3.9361572265625, -3.76922607421875, -3.602294921875, -3.43536376953125, -3.2684326171875, -3.10150146484375, -2.9345703125, -2.76763916015625, -2.6007080078125, -2.43377685546875, -2.266845703125, -2.09991455078125, -1.9329833984375, -1.76605224609375, -1.59912109375, -1.43218994140625, -1.2652587890625, -1.09832763671875, -0.931396484375, -0.76446533203125, -0.5975341796875, -0.43060302734375, -0.263671875, -0.09674072265625, 0.0701904296875, 0.23712158203125, 0.404052734375, 0.57098388671875, 0.7379150390625, 0.90484619140625, 1.07177734375, 1.23870849609375, 1.4056396484375, 1.57257080078125, 1.739501953125, 1.90643310546875, 2.0733642578125, 2.24029541015625, 2.4072265625, 2.57415771484375, 2.7410888671875, 2.90802001953125, 3.074951171875, 3.24188232421875, 3.4088134765625, 3.57574462890625, 3.74267578125, 3.90960693359375, 4.0765380859375, 4.24346923828125, 4.410400390625, 4.57733154296875, 4.7442626953125, 4.91119384765625, 5.078125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 4.0, 1.0, 4.0, 6.0, 8.0, 5.0, 3.0, 6.0, 10.0, 6.0, 9.0, 16.0, 7.0, 19.0, 19.0, 15.0, 17.0, 19.0, 23.0, 30.0, 33.0, 29.0, 40.0, 21.0, 39.0, 36.0, 36.0, 39.0, 39.0, 34.0, 29.0, 44.0, 38.0, 34.0, 27.0, 26.0, 29.0, 18.0, 25.0, 20.0, 22.0, 22.0, 19.0, 12.0, 19.0, 10.0, 11.0, 5.0, 4.0, 6.0, 2.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0], "bins": [-30.002649307250977, -29.071632385253906, -28.140615463256836, -27.209598541259766, -26.278581619262695, -25.347564697265625, -24.416547775268555, -23.485530853271484, -22.554513931274414, -21.623497009277344, -20.692480087280273, -19.761463165283203, -18.830446243286133, -17.899429321289062, -16.968412399291992, -16.037395477294922, -15.106378555297852, -14.175361633300781, -13.244344711303711, -12.31332778930664, -11.38231086730957, -10.4512939453125, -9.52027702331543, -8.58926010131836, -7.658243179321289, -6.727226257324219, -5.796209335327148, -4.865192413330078, -3.934175491333008, -3.0031585693359375, -2.072141647338867, -1.1411247253417969, -0.21010971069335938, 0.7209072113037109, 1.6519241333007812, 2.5829410552978516, 3.513957977294922, 4.444974899291992, 5.3759918212890625, 6.307008743286133, 7.238025665283203, 8.169042587280273, 9.100059509277344, 10.031076431274414, 10.962093353271484, 11.893110275268555, 12.824127197265625, 13.755144119262695, 14.686161041259766, 15.617177963256836, 16.548194885253906, 17.479211807250977, 18.410228729248047, 19.341245651245117, 20.272262573242188, 21.203279495239258, 22.134296417236328, 23.0653133392334, 23.99633026123047, 24.92734718322754, 25.85836410522461, 26.78938102722168, 27.72039794921875, 28.65141487121582, 29.58243179321289]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 6.0, 7.0, 3.0, 4.0, 10.0, 15.0, 16.0, 14.0, 14.0, 15.0, 23.0, 23.0, 23.0, 23.0, 24.0, 44.0, 40.0, 34.0, 40.0, 38.0, 52.0, 40.0, 37.0, 34.0, 41.0, 42.0, 32.0, 28.0, 36.0, 39.0, 34.0, 16.0, 22.0, 20.0, 19.0, 15.0, 15.0, 14.0, 17.0, 6.0, 11.0, 5.0, 8.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-42.03581619262695, -40.80253219604492, -39.56924819946289, -38.335960388183594, -37.10267639160156, -35.86939239501953, -34.6361083984375, -33.40282440185547, -32.16953659057617, -30.93625259399414, -29.702966690063477, -28.469682693481445, -27.23639678955078, -26.00311279296875, -24.76982879638672, -23.536542892456055, -22.303258895874023, -21.069974899291992, -19.836688995361328, -18.603404998779297, -17.370119094848633, -16.1368350982666, -14.903550148010254, -13.670265197753906, -12.436980247497559, -11.203695297241211, -9.970410346984863, -8.737125396728516, -7.503840923309326, -6.2705559730529785, -5.037271499633789, -3.8039865493774414, -2.5707015991210938, -1.3374167680740356, -0.10413193702697754, 1.129152774810791, 2.3624377250671387, 3.5957226753234863, 4.829007148742676, 6.062292098999023, 7.295577049255371, 8.528861999511719, 9.762146949768066, 10.995431900024414, 12.228715896606445, 13.46200180053711, 14.69528579711914, 15.928570747375488, 17.161855697631836, 18.395139694213867, 19.62842559814453, 20.861709594726562, 22.094995498657227, 23.328279495239258, 24.561565399169922, 25.794849395751953, 27.028133392333984, 28.261417388916016, 29.49470329284668, 30.72798728942871, 31.961273193359375, 33.194557189941406, 34.42784118652344, 35.66112518310547, 36.894412994384766]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [6.0, 4.0, 4.0, 4.0, 15.0, 22.0, 33.0, 65.0, 97.0, 179.0, 241.0, 466.0, 752.0, 1217.0, 1941.0, 3032.0, 4983.0, 7825.0, 12156.0, 18248.0, 27344.0, 40568.0, 57842.0, 81278.0, 111066.0, 145603.0, 186855.0, 229801.0, 271037.0, 306926.0, 332514.0, 344036.0, 340826.0, 321101.0, 290023.0, 249902.0, 207623.0, 164729.0, 127175.0, 94002.0, 68800.0, 48109.0, 32972.0, 22324.0, 14809.0, 9570.0, 6143.0, 3855.0, 2497.0, 1483.0, 890.0, 565.0, 305.0, 185.0, 113.0, 61.0, 41.0, 16.0, 8.0, 5.0, 4.0, 5.0, 2.0, 1.0], "bins": [-20.84375, -20.18701171875, -19.5302734375, -18.87353515625, -18.216796875, -17.56005859375, -16.9033203125, -16.24658203125, -15.58984375, -14.93310546875, -14.2763671875, -13.61962890625, -12.962890625, -12.30615234375, -11.6494140625, -10.99267578125, -10.3359375, -9.67919921875, -9.0224609375, -8.36572265625, -7.708984375, -7.05224609375, -6.3955078125, -5.73876953125, -5.08203125, -4.42529296875, -3.7685546875, -3.11181640625, -2.455078125, -1.79833984375, -1.1416015625, -0.48486328125, 0.171875, 0.82861328125, 1.4853515625, 2.14208984375, 2.798828125, 3.45556640625, 4.1123046875, 4.76904296875, 5.42578125, 6.08251953125, 6.7392578125, 7.39599609375, 8.052734375, 8.70947265625, 9.3662109375, 10.02294921875, 10.6796875, 11.33642578125, 11.9931640625, 12.64990234375, 13.306640625, 13.96337890625, 14.6201171875, 15.27685546875, 15.93359375, 16.59033203125, 17.2470703125, 17.90380859375, 18.560546875, 19.21728515625, 19.8740234375, 20.53076171875, 21.1875]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 9.0, 4.0, 5.0, 4.0, 9.0, 18.0, 17.0, 9.0, 18.0, 13.0, 24.0, 23.0, 23.0, 27.0, 23.0, 46.0, 38.0, 37.0, 37.0, 34.0, 54.0, 40.0, 38.0, 39.0, 32.0, 43.0, 34.0, 30.0, 39.0, 29.0, 32.0, 18.0, 23.0, 18.0, 20.0, 14.0, 18.0, 13.0, 15.0, 8.0, 9.0, 8.0, 4.0, 5.0, 1.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-36.875, -35.78955078125, -34.7041015625, -33.61865234375, -32.533203125, -31.44775390625, -30.3623046875, -29.27685546875, -28.19140625, -27.10595703125, -26.0205078125, -24.93505859375, -23.849609375, -22.76416015625, -21.6787109375, -20.59326171875, -19.5078125, -18.42236328125, -17.3369140625, -16.25146484375, -15.166015625, -14.08056640625, -12.9951171875, -11.90966796875, -10.82421875, -9.73876953125, -8.6533203125, -7.56787109375, -6.482421875, -5.39697265625, -4.3115234375, -3.22607421875, -2.140625, -1.05517578125, 0.0302734375, 1.11572265625, 2.201171875, 3.28662109375, 4.3720703125, 5.45751953125, 6.54296875, 7.62841796875, 8.7138671875, 9.79931640625, 10.884765625, 11.97021484375, 13.0556640625, 14.14111328125, 15.2265625, 16.31201171875, 17.3974609375, 18.48291015625, 19.568359375, 20.65380859375, 21.7392578125, 22.82470703125, 23.91015625, 24.99560546875, 26.0810546875, 27.16650390625, 28.251953125, 29.33740234375, 30.4228515625, 31.50830078125, 32.59375]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 14.0, 30.0, 51.0, 87.0, 142.0, 255.0, 461.0, 764.0, 1277.0, 2235.0, 3653.0, 5787.0, 9236.0, 14455.0, 22287.0, 32599.0, 47249.0, 67396.0, 91537.0, 122513.0, 156792.0, 195797.0, 234726.0, 271118.0, 300959.0, 321236.0, 329569.0, 323518.0, 304824.0, 276699.0, 242022.0, 202673.0, 163989.0, 128320.0, 97121.0, 71293.0, 50888.0, 35016.0, 23686.0, 15687.0, 9788.0, 6417.0, 4077.0, 2485.0, 1435.0, 908.0, 549.0, 304.0, 165.0, 75.0, 58.0, 37.0, 11.0, 12.0, 5.0, 3.0, 1.0], "bins": [-22.75, -22.07275390625, -21.3955078125, -20.71826171875, -20.041015625, -19.36376953125, -18.6865234375, -18.00927734375, -17.33203125, -16.65478515625, -15.9775390625, -15.30029296875, -14.623046875, -13.94580078125, -13.2685546875, -12.59130859375, -11.9140625, -11.23681640625, -10.5595703125, -9.88232421875, -9.205078125, -8.52783203125, -7.8505859375, -7.17333984375, -6.49609375, -5.81884765625, -5.1416015625, -4.46435546875, -3.787109375, -3.10986328125, -2.4326171875, -1.75537109375, -1.078125, -0.40087890625, 0.2763671875, 0.95361328125, 1.630859375, 2.30810546875, 2.9853515625, 3.66259765625, 4.33984375, 5.01708984375, 5.6943359375, 6.37158203125, 7.048828125, 7.72607421875, 8.4033203125, 9.08056640625, 9.7578125, 10.43505859375, 11.1123046875, 11.78955078125, 12.466796875, 13.14404296875, 13.8212890625, 14.49853515625, 15.17578125, 15.85302734375, 16.5302734375, 17.20751953125, 17.884765625, 18.56201171875, 19.2392578125, 19.91650390625, 20.59375]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 7.0, 8.0, 8.0, 11.0, 15.0, 29.0, 31.0, 43.0, 47.0, 67.0, 86.0, 69.0, 117.0, 132.0, 138.0, 161.0, 161.0, 200.0, 195.0, 215.0, 201.0, 202.0, 196.0, 214.0, 207.0, 188.0, 179.0, 144.0, 129.0, 113.0, 131.0, 93.0, 78.0, 69.0, 55.0, 36.0, 26.0, 23.0, 13.0, 13.0, 9.0, 7.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.3125, -14.78857421875, -14.2646484375, -13.74072265625, -13.216796875, -12.69287109375, -12.1689453125, -11.64501953125, -11.12109375, -10.59716796875, -10.0732421875, -9.54931640625, -9.025390625, -8.50146484375, -7.9775390625, -7.45361328125, -6.9296875, -6.40576171875, -5.8818359375, -5.35791015625, -4.833984375, -4.31005859375, -3.7861328125, -3.26220703125, -2.73828125, -2.21435546875, -1.6904296875, -1.16650390625, -0.642578125, -0.11865234375, 0.4052734375, 0.92919921875, 1.453125, 1.97705078125, 2.5009765625, 3.02490234375, 3.548828125, 4.07275390625, 4.5966796875, 5.12060546875, 5.64453125, 6.16845703125, 6.6923828125, 7.21630859375, 7.740234375, 8.26416015625, 8.7880859375, 9.31201171875, 9.8359375, 10.35986328125, 10.8837890625, 11.40771484375, 11.931640625, 12.45556640625, 12.9794921875, 13.50341796875, 14.02734375, 14.55126953125, 15.0751953125, 15.59912109375, 16.123046875, 16.64697265625, 17.1708984375, 17.69482421875, 18.21875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 9.0, 7.0, 3.0, 11.0, 13.0, 10.0, 18.0, 20.0, 23.0, 17.0, 34.0, 28.0, 22.0, 23.0, 31.0, 38.0, 37.0, 33.0, 34.0, 43.0, 48.0, 34.0, 38.0, 50.0, 35.0, 37.0, 34.0, 34.0, 28.0, 31.0, 28.0, 21.0, 22.0, 16.0, 21.0, 10.0, 10.0, 7.0, 10.0, 7.0, 9.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-37.81067657470703, -36.777008056640625, -35.74333953857422, -34.70967102050781, -33.676002502441406, -32.642333984375, -31.608667373657227, -30.57499885559082, -29.541330337524414, -28.507661819458008, -27.4739933013916, -26.440324783325195, -25.406658172607422, -24.372989654541016, -23.33932113647461, -22.305652618408203, -21.271984100341797, -20.23831558227539, -19.204647064208984, -18.170978546142578, -17.137310028076172, -16.103641510009766, -15.069974899291992, -14.036306381225586, -13.00263786315918, -11.968969345092773, -10.935300827026367, -9.901633262634277, -8.867964744567871, -7.834296226501465, -6.800628185272217, -5.766960144042969, -4.73328971862793, -3.6996214389801025, -2.6659531593322754, -1.6322848796844482, -0.5986166000366211, 0.43505191802978516, 1.4687199592590332, 2.5023880004882812, 3.5360565185546875, 4.569725036621094, 5.603393077850342, 6.63706111907959, 7.670729637145996, 8.704398155212402, 9.738065719604492, 10.771734237670898, 11.805402755737305, 12.839071273803711, 13.872739791870117, 14.906407356262207, 15.940075874328613, 16.973743438720703, 18.00741195678711, 19.041080474853516, 20.074748992919922, 21.108417510986328, 22.142086029052734, 23.17575454711914, 24.209423065185547, 25.243091583251953, 26.276758193969727, 27.310426712036133, 28.34409523010254]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 6.0, 7.0, 9.0, 7.0, 12.0, 16.0, 11.0, 25.0, 16.0, 21.0, 22.0, 34.0, 24.0, 31.0, 31.0, 40.0, 44.0, 39.0, 50.0, 49.0, 34.0, 33.0, 43.0, 48.0, 35.0, 32.0, 25.0, 39.0, 30.0, 26.0, 20.0, 23.0, 27.0, 14.0, 18.0, 12.0, 14.0, 7.0, 6.0, 10.0, 1.0, 3.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.48579788208008, -42.18503189086914, -40.8842658996582, -39.583499908447266, -38.28273391723633, -36.98196792602539, -35.68120193481445, -34.38043975830078, -33.079673767089844, -31.778907775878906, -30.47814178466797, -29.17737579345703, -27.876609802246094, -26.575843811035156, -25.27507972717285, -23.974313735961914, -22.673545837402344, -21.372779846191406, -20.07201385498047, -18.77124786376953, -17.470481872558594, -16.169715881347656, -14.868951797485352, -13.568185806274414, -12.267419815063477, -10.966653823852539, -9.665887832641602, -8.36512279510498, -7.064356803894043, -5.7635908126831055, -4.462825298309326, -3.162059783935547, -1.861297607421875, -0.5605318546295166, 0.7402338981628418, 2.0409996509552, 3.3417654037475586, 4.642531394958496, 5.943296909332275, 7.244062423706055, 8.544828414916992, 9.84559440612793, 11.146360397338867, 12.447125434875488, 13.747891426086426, 15.048657417297363, 16.349422454833984, 17.650188446044922, 18.95095443725586, 20.251720428466797, 21.552486419677734, 22.853252410888672, 24.15401840209961, 25.454784393310547, 26.75554847717285, 28.05631446838379, 29.357080459594727, 30.657846450805664, 31.9586124420166, 33.259376525878906, 34.560142517089844, 35.86090850830078, 37.16167449951172, 38.462440490722656, 39.763206481933594]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 12.0, 11.0, 28.0, 43.0, 49.0, 79.0, 104.0, 194.0, 287.0, 408.0, 682.0, 1074.0, 1724.0, 2888.0, 4816.0, 8357.0, 14417.0, 25695.0, 46702.0, 83420.0, 142023.0, 202804.0, 197634.0, 135307.0, 78491.0, 43646.0, 24407.0, 13547.0, 7770.0, 4598.0, 2896.0, 1676.0, 1026.0, 621.0, 368.0, 242.0, 166.0, 110.0, 56.0, 55.0, 40.0, 21.0, 18.0, 13.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0], "bins": [-6.20703125, -6.03436279296875, -5.8616943359375, -5.68902587890625, -5.516357421875, -5.34368896484375, -5.1710205078125, -4.99835205078125, -4.82568359375, -4.65301513671875, -4.4803466796875, -4.30767822265625, -4.135009765625, -3.96234130859375, -3.7896728515625, -3.61700439453125, -3.4443359375, -3.27166748046875, -3.0989990234375, -2.92633056640625, -2.753662109375, -2.58099365234375, -2.4083251953125, -2.23565673828125, -2.06298828125, -1.89031982421875, -1.7176513671875, -1.54498291015625, -1.372314453125, -1.19964599609375, -1.0269775390625, -0.85430908203125, -0.681640625, -0.50897216796875, -0.3363037109375, -0.16363525390625, 0.009033203125, 0.18170166015625, 0.3543701171875, 0.52703857421875, 0.69970703125, 0.87237548828125, 1.0450439453125, 1.21771240234375, 1.390380859375, 1.56304931640625, 1.7357177734375, 1.90838623046875, 2.0810546875, 2.25372314453125, 2.4263916015625, 2.59906005859375, 2.771728515625, 2.94439697265625, 3.1170654296875, 3.28973388671875, 3.46240234375, 3.63507080078125, 3.8077392578125, 3.98040771484375, 4.153076171875, 4.32574462890625, 4.4984130859375, 4.67108154296875, 4.84375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 6.0, 7.0, 8.0, 8.0, 12.0, 16.0, 10.0, 26.0, 16.0, 22.0, 22.0, 33.0, 23.0, 32.0, 31.0, 39.0, 45.0, 38.0, 50.0, 48.0, 36.0, 34.0, 41.0, 46.0, 39.0, 31.0, 25.0, 37.0, 31.0, 26.0, 22.0, 22.0, 28.0, 13.0, 17.0, 13.0, 14.0, 6.0, 7.0, 10.0, 1.0, 3.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.46875, -42.1669921875, -40.865234375, -39.5634765625, -38.26171875, -36.9599609375, -35.658203125, -34.3564453125, -33.0546875, -31.7529296875, -30.451171875, -29.1494140625, -27.84765625, -26.5458984375, -25.244140625, -23.9423828125, -22.640625, -21.3388671875, -20.037109375, -18.7353515625, -17.43359375, -16.1318359375, -14.830078125, -13.5283203125, -12.2265625, -10.9248046875, -9.623046875, -8.3212890625, -7.01953125, -5.7177734375, -4.416015625, -3.1142578125, -1.8125, -0.5107421875, 0.791015625, 2.0927734375, 3.39453125, 4.6962890625, 5.998046875, 7.2998046875, 8.6015625, 9.9033203125, 11.205078125, 12.5068359375, 13.80859375, 15.1103515625, 16.412109375, 17.7138671875, 19.015625, 20.3173828125, 21.619140625, 22.9208984375, 24.22265625, 25.5244140625, 26.826171875, 28.1279296875, 29.4296875, 30.7314453125, 32.033203125, 33.3349609375, 34.63671875, 35.9384765625, 37.240234375, 38.5419921875, 39.84375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 6.0, 3.0, 11.0, 5.0, 14.0, 28.0, 36.0, 57.0, 72.0, 81.0, 156.0, 195.0, 301.0, 424.0, 678.0, 973.0, 1576.0, 2420.0, 4175.0, 7203.0, 13074.0, 25238.0, 51475.0, 113474.0, 239548.0, 286308.0, 158441.0, 70524.0, 32797.0, 16616.0, 8929.0, 5189.0, 2991.0, 1849.0, 1207.0, 803.0, 547.0, 340.0, 214.0, 166.0, 126.0, 89.0, 60.0, 35.0, 36.0, 25.0, 11.0, 11.0, 13.0, 7.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9140625, -5.7115478515625, -5.509033203125, -5.3065185546875, -5.10400390625, -4.9014892578125, -4.698974609375, -4.4964599609375, -4.2939453125, -4.0914306640625, -3.888916015625, -3.6864013671875, -3.48388671875, -3.2813720703125, -3.078857421875, -2.8763427734375, -2.673828125, -2.4713134765625, -2.268798828125, -2.0662841796875, -1.86376953125, -1.6612548828125, -1.458740234375, -1.2562255859375, -1.0537109375, -0.8511962890625, -0.648681640625, -0.4461669921875, -0.24365234375, -0.0411376953125, 0.161376953125, 0.3638916015625, 0.56640625, 0.7689208984375, 0.971435546875, 1.1739501953125, 1.37646484375, 1.5789794921875, 1.781494140625, 1.9840087890625, 2.1865234375, 2.3890380859375, 2.591552734375, 2.7940673828125, 2.99658203125, 3.1990966796875, 3.401611328125, 3.6041259765625, 3.806640625, 4.0091552734375, 4.211669921875, 4.4141845703125, 4.61669921875, 4.8192138671875, 5.021728515625, 5.2242431640625, 5.4267578125, 5.6292724609375, 5.831787109375, 6.0343017578125, 6.23681640625, 6.4393310546875, 6.641845703125, 6.8443603515625, 7.046875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 7.0, 8.0, 15.0, 8.0, 14.0, 16.0, 15.0, 22.0, 29.0, 28.0, 34.0, 34.0, 45.0, 40.0, 49.0, 45.0, 50.0, 52.0, 49.0, 42.0, 53.0, 36.0, 39.0, 30.0, 41.0, 31.0, 26.0, 29.0, 17.0, 9.0, 14.0, 14.0, 16.0, 7.0, 6.0, 11.0, 5.0, 5.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.203125, -29.229736328125, -28.25634765625, -27.282958984375, -26.3095703125, -25.336181640625, -24.36279296875, -23.389404296875, -22.416015625, -21.442626953125, -20.46923828125, -19.495849609375, -18.5224609375, -17.549072265625, -16.57568359375, -15.602294921875, -14.62890625, -13.655517578125, -12.68212890625, -11.708740234375, -10.7353515625, -9.761962890625, -8.78857421875, -7.815185546875, -6.841796875, -5.868408203125, -4.89501953125, -3.921630859375, -2.9482421875, -1.974853515625, -1.00146484375, -0.028076171875, 0.9453125, 1.918701171875, 2.89208984375, 3.865478515625, 4.8388671875, 5.812255859375, 6.78564453125, 7.759033203125, 8.732421875, 9.705810546875, 10.67919921875, 11.652587890625, 12.6259765625, 13.599365234375, 14.57275390625, 15.546142578125, 16.51953125, 17.492919921875, 18.46630859375, 19.439697265625, 20.4130859375, 21.386474609375, 22.35986328125, 23.333251953125, 24.306640625, 25.280029296875, 26.25341796875, 27.226806640625, 28.2001953125, 29.173583984375, 30.14697265625, 31.120361328125, 32.09375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 6.0, 7.0, 13.0, 14.0, 15.0, 23.0, 35.0, 47.0, 57.0, 78.0, 95.0, 146.0, 211.0, 290.0, 435.0, 643.0, 954.0, 1470.0, 2460.0, 3978.0, 7013.0, 13525.0, 29265.0, 77235.0, 302064.0, 421448.0, 111044.0, 37916.0, 17129.0, 8429.0, 4739.0, 2849.0, 1700.0, 1063.0, 700.0, 424.0, 343.0, 211.0, 137.0, 99.0, 71.0, 50.0, 39.0, 27.0, 20.0, 15.0, 8.0, 11.0, 4.0, 1.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1640625, -3.055511474609375, -2.94696044921875, -2.838409423828125, -2.7298583984375, -2.621307373046875, -2.51275634765625, -2.404205322265625, -2.295654296875, -2.187103271484375, -2.07855224609375, -1.970001220703125, -1.8614501953125, -1.752899169921875, -1.64434814453125, -1.535797119140625, -1.42724609375, -1.318695068359375, -1.21014404296875, -1.101593017578125, -0.9930419921875, -0.884490966796875, -0.77593994140625, -0.667388916015625, -0.558837890625, -0.450286865234375, -0.34173583984375, -0.233184814453125, -0.1246337890625, -0.016082763671875, 0.09246826171875, 0.201019287109375, 0.3095703125, 0.418121337890625, 0.52667236328125, 0.635223388671875, 0.7437744140625, 0.852325439453125, 0.96087646484375, 1.069427490234375, 1.177978515625, 1.286529541015625, 1.39508056640625, 1.503631591796875, 1.6121826171875, 1.720733642578125, 1.82928466796875, 1.937835693359375, 2.04638671875, 2.154937744140625, 2.26348876953125, 2.372039794921875, 2.4805908203125, 2.589141845703125, 2.69769287109375, 2.806243896484375, 2.914794921875, 3.023345947265625, 3.13189697265625, 3.240447998046875, 3.3489990234375, 3.457550048828125, 3.56610107421875, 3.674652099609375, 3.783203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 6.0, 6.0, 8.0, 14.0, 7.0, 13.0, 9.0, 14.0, 19.0, 33.0, 29.0, 27.0, 40.0, 49.0, 45.0, 44.0, 47.0, 49.0, 48.0, 34.0, 62.0, 43.0, 34.0, 42.0, 37.0, 34.0, 26.0, 37.0, 27.0, 23.0, 20.0, 11.0, 18.0, 10.0, 3.0, 13.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.00015974044799804688, -0.00015488825738430023, -0.0001500360667705536, -0.00014518387615680695, -0.0001403316855430603, -0.00013547949492931366, -0.00013062730431556702, -0.00012577511370182037, -0.00012092292308807373, -0.00011607073247432709, -0.00011121854186058044, -0.0001063663512468338, -0.00010151416063308716, -9.666197001934052e-05, -9.180977940559387e-05, -8.695758879184723e-05, -8.210539817810059e-05, -7.725320756435394e-05, -7.24010169506073e-05, -6.754882633686066e-05, -6.269663572311401e-05, -5.784444510936737e-05, -5.299225449562073e-05, -4.8140063881874084e-05, -4.328787326812744e-05, -3.84356826543808e-05, -3.3583492040634155e-05, -2.8731301426887512e-05, -2.387911081314087e-05, -1.9026920199394226e-05, -1.4174729585647583e-05, -9.32253897190094e-06, -4.470348358154297e-06, 3.818422555923462e-07, 5.234032869338989e-06, 1.0086223483085632e-05, 1.4938414096832275e-05, 1.979060471057892e-05, 2.464279532432556e-05, 2.9494985938072205e-05, 3.434717655181885e-05, 3.919936716556549e-05, 4.4051557779312134e-05, 4.890374839305878e-05, 5.375593900680542e-05, 5.860812962055206e-05, 6.34603202342987e-05, 6.831251084804535e-05, 7.316470146179199e-05, 7.801689207553864e-05, 8.286908268928528e-05, 8.772127330303192e-05, 9.257346391677856e-05, 9.742565453052521e-05, 0.00010227784514427185, 0.0001071300357580185, 0.00011198222637176514, 0.00011683441698551178, 0.00012168660759925842, 0.00012653879821300507, 0.0001313909888267517, 0.00013624317944049835, 0.000141095370054245, 0.00014594756066799164, 0.00015079975128173828]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 9.0, 9.0, 12.0, 17.0, 30.0, 46.0, 68.0, 102.0, 138.0, 192.0, 301.0, 414.0, 660.0, 899.0, 1419.0, 2238.0, 3376.0, 5411.0, 8840.0, 14700.0, 25701.0, 46478.0, 86993.0, 161360.0, 237351.0, 198933.0, 112350.0, 59726.0, 32921.0, 18634.0, 10835.0, 6513.0, 4084.0, 2662.0, 1694.0, 1099.0, 778.0, 461.0, 363.0, 244.0, 152.0, 118.0, 77.0, 53.0, 35.0, 20.0, 14.0, 8.0, 10.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.703125, -3.58251953125, -3.4619140625, -3.34130859375, -3.220703125, -3.10009765625, -2.9794921875, -2.85888671875, -2.73828125, -2.61767578125, -2.4970703125, -2.37646484375, -2.255859375, -2.13525390625, -2.0146484375, -1.89404296875, -1.7734375, -1.65283203125, -1.5322265625, -1.41162109375, -1.291015625, -1.17041015625, -1.0498046875, -0.92919921875, -0.80859375, -0.68798828125, -0.5673828125, -0.44677734375, -0.326171875, -0.20556640625, -0.0849609375, 0.03564453125, 0.15625, 0.27685546875, 0.3974609375, 0.51806640625, 0.638671875, 0.75927734375, 0.8798828125, 1.00048828125, 1.12109375, 1.24169921875, 1.3623046875, 1.48291015625, 1.603515625, 1.72412109375, 1.8447265625, 1.96533203125, 2.0859375, 2.20654296875, 2.3271484375, 2.44775390625, 2.568359375, 2.68896484375, 2.8095703125, 2.93017578125, 3.05078125, 3.17138671875, 3.2919921875, 3.41259765625, 3.533203125, 3.65380859375, 3.7744140625, 3.89501953125, 4.015625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 0.0, 4.0, 3.0, 3.0, 8.0, 7.0, 17.0, 18.0, 17.0, 24.0, 43.0, 45.0, 35.0, 52.0, 60.0, 83.0, 67.0, 66.0, 85.0, 59.0, 42.0, 59.0, 44.0, 36.0, 25.0, 21.0, 16.0, 11.0, 10.0, 11.0, 9.0, 6.0, 6.0, 4.0, 0.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.037109375, -1.979034423828125, -1.92095947265625, -1.862884521484375, -1.8048095703125, -1.746734619140625, -1.68865966796875, -1.630584716796875, -1.572509765625, -1.514434814453125, -1.45635986328125, -1.398284912109375, -1.3402099609375, -1.282135009765625, -1.22406005859375, -1.165985107421875, -1.10791015625, -1.049835205078125, -0.99176025390625, -0.933685302734375, -0.8756103515625, -0.817535400390625, -0.75946044921875, -0.701385498046875, -0.643310546875, -0.585235595703125, -0.52716064453125, -0.469085693359375, -0.4110107421875, -0.352935791015625, -0.29486083984375, -0.236785888671875, -0.1787109375, -0.120635986328125, -0.06256103515625, -0.004486083984375, 0.0535888671875, 0.111663818359375, 0.16973876953125, 0.227813720703125, 0.285888671875, 0.343963623046875, 0.40203857421875, 0.460113525390625, 0.5181884765625, 0.576263427734375, 0.63433837890625, 0.692413330078125, 0.75048828125, 0.808563232421875, 0.86663818359375, 0.924713134765625, 0.9827880859375, 1.040863037109375, 1.09893798828125, 1.157012939453125, 1.215087890625, 1.273162841796875, 1.33123779296875, 1.389312744140625, 1.4473876953125, 1.505462646484375, 1.56353759765625, 1.621612548828125, 1.6796875]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 5.0, 0.0, 2.0, 2.0, 2.0, 4.0, 8.0, 5.0, 7.0, 11.0, 12.0, 6.0, 23.0, 20.0, 24.0, 20.0, 29.0, 26.0, 27.0, 22.0, 33.0, 42.0, 30.0, 33.0, 39.0, 36.0, 48.0, 39.0, 42.0, 36.0, 37.0, 41.0, 35.0, 33.0, 31.0, 33.0, 25.0, 23.0, 18.0, 17.0, 20.0, 11.0, 8.0, 7.0, 11.0, 9.0, 7.0, 4.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-37.677852630615234, -36.64337158203125, -35.608890533447266, -34.57440948486328, -33.53993225097656, -32.50545120239258, -31.470970153808594, -30.43648910522461, -29.402008056640625, -28.36752700805664, -27.33304786682129, -26.298566818237305, -25.26408576965332, -24.22960662841797, -23.195125579833984, -22.16064453125, -21.12616539001465, -20.091684341430664, -19.057205200195312, -18.022724151611328, -16.988243103027344, -15.953763008117676, -14.919282913208008, -13.884801864624023, -12.850321769714355, -11.815841674804688, -10.781360626220703, -9.746880531311035, -8.712400436401367, -7.677919387817383, -6.643439292907715, -5.608958721160889, -4.574480056762695, -3.539999485015869, -2.505519151687622, -1.471038818359375, -0.43655824661254883, 0.5979223251342773, 1.6324024200439453, 2.6668829917907715, 3.7013635635375977, 4.735844135284424, 5.77032470703125, 6.804804801940918, 7.839285373687744, 8.87376594543457, 9.908246040344238, 10.942726135253906, 11.97720718383789, 13.011687278747559, 14.046168327331543, 15.080648422241211, 16.115129470825195, 17.149608612060547, 18.18408966064453, 19.218570709228516, 20.2530517578125, 21.287532806396484, 22.322011947631836, 23.35649299621582, 24.390974044799805, 25.425453186035156, 26.45993423461914, 27.494415283203125, 28.528894424438477]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 5.0, 8.0, 9.0, 7.0, 14.0, 14.0, 12.0, 25.0, 16.0, 17.0, 22.0, 32.0, 25.0, 31.0, 36.0, 35.0, 44.0, 40.0, 42.0, 54.0, 38.0, 30.0, 44.0, 42.0, 41.0, 34.0, 24.0, 36.0, 31.0, 23.0, 25.0, 24.0, 25.0, 16.0, 20.0, 10.0, 16.0, 6.0, 6.0, 10.0, 2.0, 2.0, 5.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.422523498535156, -42.125492095947266, -40.828460693359375, -39.531429290771484, -38.234397888183594, -36.9373664855957, -35.64033508300781, -34.343299865722656, -33.04627227783203, -31.74924087524414, -30.45220947265625, -29.15517807006836, -27.85814666748047, -26.561115264892578, -25.264081954956055, -23.967050552368164, -22.67001724243164, -21.37298583984375, -20.07595443725586, -18.77892303466797, -17.481891632080078, -16.184860229492188, -14.887826919555664, -13.590795516967773, -12.293764114379883, -10.996732711791992, -9.699701309204102, -8.402668952941895, -7.105637550354004, -5.808606147766113, -4.5115742683410645, -3.2145423889160156, -1.917510986328125, -0.6204793453216553, 0.6765522956848145, 1.9735839366912842, 3.270615577697754, 4.5676469802856445, 5.864678859710693, 7.161710739135742, 8.458742141723633, 9.755773544311523, 11.052804946899414, 12.349837303161621, 13.646868705749512, 14.943900108337402, 16.24093246459961, 17.5379638671875, 18.83499526977539, 20.13202667236328, 21.429058074951172, 22.726089477539062, 24.023120880126953, 25.320152282714844, 26.617185592651367, 27.914216995239258, 29.21124839782715, 30.50827980041504, 31.80531120300293, 33.10234451293945, 34.399375915527344, 35.696407318115234, 36.993438720703125, 38.290470123291016, 39.587501525878906]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 8.0, 20.0, 23.0, 39.0, 84.0, 138.0, 231.0, 428.0, 666.0, 1172.0, 1942.0, 3214.0, 5016.0, 8059.0, 12325.0, 18579.0, 26757.0, 36966.0, 49436.0, 63003.0, 77017.0, 87527.0, 95372.0, 97365.0, 94319.0, 85626.0, 73027.0, 59780.0, 46068.0, 33873.0, 24596.0, 16520.0, 10967.0, 7011.0, 4565.0, 2788.0, 1636.0, 992.0, 580.0, 343.0, 208.0, 108.0, 71.0, 38.0, 23.0, 13.0, 7.0, 11.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.625, -18.049560546875, -17.47412109375, -16.898681640625, -16.3232421875, -15.747802734375, -15.17236328125, -14.596923828125, -14.021484375, -13.446044921875, -12.87060546875, -12.295166015625, -11.7197265625, -11.144287109375, -10.56884765625, -9.993408203125, -9.41796875, -8.842529296875, -8.26708984375, -7.691650390625, -7.1162109375, -6.540771484375, -5.96533203125, -5.389892578125, -4.814453125, -4.239013671875, -3.66357421875, -3.088134765625, -2.5126953125, -1.937255859375, -1.36181640625, -0.786376953125, -0.2109375, 0.364501953125, 0.93994140625, 1.515380859375, 2.0908203125, 2.666259765625, 3.24169921875, 3.817138671875, 4.392578125, 4.968017578125, 5.54345703125, 6.118896484375, 6.6943359375, 7.269775390625, 7.84521484375, 8.420654296875, 8.99609375, 9.571533203125, 10.14697265625, 10.722412109375, 11.2978515625, 11.873291015625, 12.44873046875, 13.024169921875, 13.599609375, 14.175048828125, 14.75048828125, 15.325927734375, 15.9013671875, 16.476806640625, 17.05224609375, 17.627685546875, 18.203125]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 9.0, 9.0, 6.0, 14.0, 14.0, 12.0, 25.0, 16.0, 16.0, 22.0, 35.0, 23.0, 29.0, 33.0, 39.0, 41.0, 43.0, 39.0, 55.0, 39.0, 31.0, 42.0, 43.0, 39.0, 34.0, 25.0, 36.0, 34.0, 22.0, 23.0, 26.0, 25.0, 18.0, 13.0, 14.0, 18.0, 6.0, 3.0, 13.0, 2.0, 3.0, 3.0, 6.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.71875, -41.44482421875, -40.1708984375, -38.89697265625, -37.623046875, -36.34912109375, -35.0751953125, -33.80126953125, -32.52734375, -31.25341796875, -29.9794921875, -28.70556640625, -27.431640625, -26.15771484375, -24.8837890625, -23.60986328125, -22.3359375, -21.06201171875, -19.7880859375, -18.51416015625, -17.240234375, -15.96630859375, -14.6923828125, -13.41845703125, -12.14453125, -10.87060546875, -9.5966796875, -8.32275390625, -7.048828125, -5.77490234375, -4.5009765625, -3.22705078125, -1.953125, -0.67919921875, 0.5947265625, 1.86865234375, 3.142578125, 4.41650390625, 5.6904296875, 6.96435546875, 8.23828125, 9.51220703125, 10.7861328125, 12.06005859375, 13.333984375, 14.60791015625, 15.8818359375, 17.15576171875, 18.4296875, 19.70361328125, 20.9775390625, 22.25146484375, 23.525390625, 24.79931640625, 26.0732421875, 27.34716796875, 28.62109375, 29.89501953125, 31.1689453125, 32.44287109375, 33.716796875, 34.99072265625, 36.2646484375, 37.53857421875, 38.8125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 8.0, 15.0, 12.0, 26.0, 33.0, 49.0, 94.0, 136.0, 215.0, 355.0, 527.0, 781.0, 1218.0, 1841.0, 2717.0, 3976.0, 5887.0, 8457.0, 11774.0, 16261.0, 21985.0, 29062.0, 37424.0, 46729.0, 55583.0, 64745.0, 71957.0, 78053.0, 80351.0, 79521.0, 76094.0, 69438.0, 61512.0, 51926.0, 42633.0, 33862.0, 26331.0, 19451.0, 14490.0, 10443.0, 7353.0, 4981.0, 3479.0, 2324.0, 1555.0, 1061.0, 674.0, 412.0, 263.0, 191.0, 87.0, 81.0, 46.0, 37.0, 22.0, 16.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0], "bins": [-15.265625, -14.77001953125, -14.2744140625, -13.77880859375, -13.283203125, -12.78759765625, -12.2919921875, -11.79638671875, -11.30078125, -10.80517578125, -10.3095703125, -9.81396484375, -9.318359375, -8.82275390625, -8.3271484375, -7.83154296875, -7.3359375, -6.84033203125, -6.3447265625, -5.84912109375, -5.353515625, -4.85791015625, -4.3623046875, -3.86669921875, -3.37109375, -2.87548828125, -2.3798828125, -1.88427734375, -1.388671875, -0.89306640625, -0.3974609375, 0.09814453125, 0.59375, 1.08935546875, 1.5849609375, 2.08056640625, 2.576171875, 3.07177734375, 3.5673828125, 4.06298828125, 4.55859375, 5.05419921875, 5.5498046875, 6.04541015625, 6.541015625, 7.03662109375, 7.5322265625, 8.02783203125, 8.5234375, 9.01904296875, 9.5146484375, 10.01025390625, 10.505859375, 11.00146484375, 11.4970703125, 11.99267578125, 12.48828125, 12.98388671875, 13.4794921875, 13.97509765625, 14.470703125, 14.96630859375, 15.4619140625, 15.95751953125, 16.453125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 9.0, 3.0, 6.0, 6.0, 14.0, 8.0, 18.0, 20.0, 21.0, 19.0, 19.0, 28.0, 29.0, 33.0, 33.0, 46.0, 42.0, 37.0, 37.0, 48.0, 45.0, 51.0, 40.0, 37.0, 30.0, 31.0, 42.0, 31.0, 43.0, 28.0, 26.0, 26.0, 13.0, 14.0, 16.0, 11.0, 13.0, 2.0, 8.0, 8.0, 5.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-33.53125, -32.6240234375, -31.716796875, -30.8095703125, -29.90234375, -28.9951171875, -28.087890625, -27.1806640625, -26.2734375, -25.3662109375, -24.458984375, -23.5517578125, -22.64453125, -21.7373046875, -20.830078125, -19.9228515625, -19.015625, -18.1083984375, -17.201171875, -16.2939453125, -15.38671875, -14.4794921875, -13.572265625, -12.6650390625, -11.7578125, -10.8505859375, -9.943359375, -9.0361328125, -8.12890625, -7.2216796875, -6.314453125, -5.4072265625, -4.5, -3.5927734375, -2.685546875, -1.7783203125, -0.87109375, 0.0361328125, 0.943359375, 1.8505859375, 2.7578125, 3.6650390625, 4.572265625, 5.4794921875, 6.38671875, 7.2939453125, 8.201171875, 9.1083984375, 10.015625, 10.9228515625, 11.830078125, 12.7373046875, 13.64453125, 14.5517578125, 15.458984375, 16.3662109375, 17.2734375, 18.1806640625, 19.087890625, 19.9951171875, 20.90234375, 21.8095703125, 22.716796875, 23.6240234375, 24.53125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 13.0, 22.0, 35.0, 69.0, 89.0, 157.0, 242.0, 421.0, 708.0, 1111.0, 1896.0, 3225.0, 5330.0, 8627.0, 13766.0, 21151.0, 31952.0, 46349.0, 63317.0, 81058.0, 97731.0, 107883.0, 111969.0, 106165.0, 92884.0, 75823.0, 57353.0, 41404.0, 28456.0, 18636.0, 11966.0, 7355.0, 4484.0, 2733.0, 1640.0, 1037.0, 593.0, 371.0, 203.0, 159.0, 72.0, 42.0, 25.0, 15.0, 7.0, 7.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-10.125, -9.8302001953125, -9.535400390625, -9.2406005859375, -8.94580078125, -8.6510009765625, -8.356201171875, -8.0614013671875, -7.7666015625, -7.4718017578125, -7.177001953125, -6.8822021484375, -6.58740234375, -6.2926025390625, -5.997802734375, -5.7030029296875, -5.408203125, -5.1134033203125, -4.818603515625, -4.5238037109375, -4.22900390625, -3.9342041015625, -3.639404296875, -3.3446044921875, -3.0498046875, -2.7550048828125, -2.460205078125, -2.1654052734375, -1.87060546875, -1.5758056640625, -1.281005859375, -0.9862060546875, -0.69140625, -0.3966064453125, -0.101806640625, 0.1929931640625, 0.48779296875, 0.7825927734375, 1.077392578125, 1.3721923828125, 1.6669921875, 1.9617919921875, 2.256591796875, 2.5513916015625, 2.84619140625, 3.1409912109375, 3.435791015625, 3.7305908203125, 4.025390625, 4.3201904296875, 4.614990234375, 4.9097900390625, 5.20458984375, 5.4993896484375, 5.794189453125, 6.0889892578125, 6.3837890625, 6.6785888671875, 6.973388671875, 7.2681884765625, 7.56298828125, 7.8577880859375, 8.152587890625, 8.4473876953125, 8.7421875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 1.0, 6.0, 4.0, 5.0, 6.0, 4.0, 3.0, 6.0, 5.0, 11.0, 10.0, 20.0, 14.0, 22.0, 23.0, 30.0, 21.0, 25.0, 28.0, 27.0, 28.0, 39.0, 39.0, 35.0, 44.0, 43.0, 35.0, 51.0, 36.0, 30.0, 37.0, 36.0, 31.0, 31.0, 24.0, 17.0, 28.0, 28.0, 14.0, 23.0, 14.0, 11.0, 11.0, 14.0, 5.0, 5.0, 2.0, 8.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.000881195068359375, -0.000851556658744812, -0.000821918249130249, -0.000792279839515686, -0.000762641429901123, -0.0007330030202865601, -0.0007033646106719971, -0.0006737262010574341, -0.0006440877914428711, -0.0006144493818283081, -0.0005848109722137451, -0.0005551725625991821, -0.0005255341529846191, -0.0004958957433700562, -0.00046625733375549316, -0.0004366189241409302, -0.0004069805145263672, -0.0003773421049118042, -0.0003477036952972412, -0.0003180652856826782, -0.00028842687606811523, -0.00025878846645355225, -0.00022915005683898926, -0.00019951164722442627, -0.00016987323760986328, -0.0001402348279953003, -0.0001105964183807373, -8.095800876617432e-05, -5.131959915161133e-05, -2.168118953704834e-05, 7.957220077514648e-06, 3.759562969207764e-05, 6.723403930664062e-05, 9.687244892120361e-05, 0.0001265108585357666, 0.0001561492681503296, 0.00018578767776489258, 0.00021542608737945557, 0.00024506449699401855, 0.00027470290660858154, 0.00030434131622314453, 0.0003339797258377075, 0.0003636181354522705, 0.0003932565450668335, 0.0004228949546813965, 0.00045253336429595947, 0.00048217177391052246, 0.0005118101835250854, 0.0005414485931396484, 0.0005710870027542114, 0.0006007254123687744, 0.0006303638219833374, 0.0006600022315979004, 0.0006896406412124634, 0.0007192790508270264, 0.0007489174604415894, 0.0007785558700561523, 0.0008081942796707153, 0.0008378326892852783, 0.0008674710988998413, 0.0008971095085144043, 0.0009267479181289673, 0.0009563863277435303, 0.0009860247373580933, 0.0010156631469726562]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 6.0, 7.0, 15.0, 25.0, 21.0, 42.0, 59.0, 95.0, 141.0, 234.0, 386.0, 566.0, 890.0, 1447.0, 2389.0, 3761.0, 6056.0, 9590.0, 15228.0, 23066.0, 34456.0, 49380.0, 66440.0, 84595.0, 100421.0, 110288.0, 111358.0, 103594.0, 89361.0, 71599.0, 53730.0, 37934.0, 25814.0, 16666.0, 10917.0, 6771.0, 4126.0, 2573.0, 1669.0, 1004.0, 691.0, 415.0, 274.0, 139.0, 115.0, 61.0, 52.0, 30.0, 21.0, 13.0, 12.0, 9.0, 7.0, 2.0, 1.0, 2.0], "bins": [-11.53125, -11.193359375, -10.85546875, -10.517578125, -10.1796875, -9.841796875, -9.50390625, -9.166015625, -8.828125, -8.490234375, -8.15234375, -7.814453125, -7.4765625, -7.138671875, -6.80078125, -6.462890625, -6.125, -5.787109375, -5.44921875, -5.111328125, -4.7734375, -4.435546875, -4.09765625, -3.759765625, -3.421875, -3.083984375, -2.74609375, -2.408203125, -2.0703125, -1.732421875, -1.39453125, -1.056640625, -0.71875, -0.380859375, -0.04296875, 0.294921875, 0.6328125, 0.970703125, 1.30859375, 1.646484375, 1.984375, 2.322265625, 2.66015625, 2.998046875, 3.3359375, 3.673828125, 4.01171875, 4.349609375, 4.6875, 5.025390625, 5.36328125, 5.701171875, 6.0390625, 6.376953125, 6.71484375, 7.052734375, 7.390625, 7.728515625, 8.06640625, 8.404296875, 8.7421875, 9.080078125, 9.41796875, 9.755859375, 10.09375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 6.0, 10.0, 10.0, 8.0, 13.0, 11.0, 17.0, 16.0, 22.0, 29.0, 33.0, 37.0, 38.0, 46.0, 49.0, 64.0, 52.0, 46.0, 57.0, 56.0, 46.0, 46.0, 30.0, 41.0, 33.0, 22.0, 30.0, 23.0, 22.0, 16.0, 15.0, 7.0, 4.0, 5.0, 7.0, 6.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.234375, -5.0631103515625, -4.891845703125, -4.7205810546875, -4.54931640625, -4.3780517578125, -4.206787109375, -4.0355224609375, -3.8642578125, -3.6929931640625, -3.521728515625, -3.3504638671875, -3.17919921875, -3.0079345703125, -2.836669921875, -2.6654052734375, -2.494140625, -2.3228759765625, -2.151611328125, -1.9803466796875, -1.80908203125, -1.6378173828125, -1.466552734375, -1.2952880859375, -1.1240234375, -0.9527587890625, -0.781494140625, -0.6102294921875, -0.43896484375, -0.2677001953125, -0.096435546875, 0.0748291015625, 0.24609375, 0.4173583984375, 0.588623046875, 0.7598876953125, 0.93115234375, 1.1024169921875, 1.273681640625, 1.4449462890625, 1.6162109375, 1.7874755859375, 1.958740234375, 2.1300048828125, 2.30126953125, 2.4725341796875, 2.643798828125, 2.8150634765625, 2.986328125, 3.1575927734375, 3.328857421875, 3.5001220703125, 3.67138671875, 3.8426513671875, 4.013916015625, 4.1851806640625, 4.3564453125, 4.5277099609375, 4.698974609375, 4.8702392578125, 5.04150390625, 5.2127685546875, 5.384033203125, 5.5552978515625, 5.7265625]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 3.0, 4.0, 1.0, 5.0, 3.0, 6.0, 8.0, 13.0, 13.0, 14.0, 16.0, 19.0, 30.0, 22.0, 26.0, 23.0, 32.0, 24.0, 28.0, 37.0, 38.0, 47.0, 43.0, 45.0, 50.0, 35.0, 37.0, 41.0, 35.0, 45.0, 25.0, 39.0, 38.0, 23.0, 14.0, 16.0, 21.0, 20.0, 14.0, 10.0, 7.0, 13.0, 3.0, 7.0, 5.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-37.35649490356445, -36.284942626953125, -35.21338653564453, -34.1418342590332, -33.070281982421875, -31.998727798461914, -30.927173614501953, -29.855621337890625, -28.784067153930664, -27.712512969970703, -26.640960693359375, -25.569406509399414, -24.497852325439453, -23.426300048828125, -22.354745864868164, -21.283191680908203, -20.211639404296875, -19.140085220336914, -18.068532943725586, -16.996978759765625, -15.92542552947998, -14.853872299194336, -13.782318115234375, -12.71076488494873, -11.639211654663086, -10.567658424377441, -9.496105194091797, -8.424551010131836, -7.352997779846191, -6.281444549560547, -5.209890842437744, -4.138337135314941, -3.0667800903320312, -1.9952266216278076, -0.923673152923584, 0.14788031578063965, 1.2194337844848633, 2.290987014770508, 3.3625407218933105, 4.434094429016113, 5.505647659301758, 6.577200889587402, 7.648754596710205, 8.720308303833008, 9.791861534118652, 10.863414764404297, 11.934968948364258, 13.006522178649902, 14.078075408935547, 15.149628639221191, 16.221181869506836, 17.292736053466797, 18.364288330078125, 19.435842514038086, 20.507396697998047, 21.578948974609375, 22.650503158569336, 23.722057342529297, 24.793609619140625, 25.865163803100586, 26.936717987060547, 28.008270263671875, 29.079824447631836, 30.151378631591797, 31.222930908203125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 6.0, 7.0, 6.0, 13.0, 11.0, 12.0, 17.0, 20.0, 16.0, 23.0, 27.0, 29.0, 23.0, 28.0, 42.0, 45.0, 27.0, 46.0, 42.0, 32.0, 51.0, 38.0, 39.0, 52.0, 45.0, 24.0, 36.0, 27.0, 38.0, 25.0, 32.0, 14.0, 18.0, 19.0, 12.0, 9.0, 14.0, 8.0, 9.0, 9.0, 5.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-46.5936164855957, -45.1582145690918, -43.72281265258789, -42.287410736083984, -40.85200881958008, -39.41660690307617, -37.981201171875, -36.545799255371094, -35.11039733886719, -33.67499542236328, -32.239593505859375, -30.80419158935547, -29.368789672851562, -27.933387756347656, -26.497983932495117, -25.06258201599121, -23.627182006835938, -22.19178009033203, -20.756378173828125, -19.32097625732422, -17.885574340820312, -16.450172424316406, -15.014768600463867, -13.579366683959961, -12.143964767456055, -10.708562850952148, -9.273160934448242, -7.8377580642700195, -6.402356147766113, -4.966954231262207, -3.5315513610839844, -2.096149444580078, -0.6607475280761719, 0.7746546268463135, 2.210056781768799, 3.6454591751098633, 5.0808610916137695, 6.516263008117676, 7.951665878295898, 9.387067794799805, 10.822469711303711, 12.257871627807617, 13.693273544311523, 15.128676414489746, 16.56407928466797, 17.999481201171875, 19.43488311767578, 20.870285034179688, 22.305686950683594, 23.7410888671875, 25.176490783691406, 26.611892700195312, 28.04729461669922, 29.482696533203125, 30.918100357055664, 32.35350036621094, 33.788902282714844, 35.22430419921875, 36.659706115722656, 38.09510803222656, 39.53050994873047, 40.965911865234375, 42.40131378173828, 43.83671569824219, 45.27212142944336]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 11.0, 22.0, 28.0, 58.0, 72.0, 151.0, 226.0, 398.0, 656.0, 1047.0, 1610.0, 2578.0, 4109.0, 6505.0, 9713.0, 14865.0, 22231.0, 32378.0, 46729.0, 64682.0, 88245.0, 118969.0, 152407.0, 192165.0, 231216.0, 270810.0, 302796.0, 323496.0, 333971.0, 328128.0, 308708.0, 279572.0, 241849.0, 203273.0, 163806.0, 126329.0, 95611.0, 70618.0, 50282.0, 35145.0, 23749.0, 16075.0, 10515.0, 6937.0, 4384.0, 2846.0, 1654.0, 1017.0, 692.0, 380.0, 231.0, 147.0, 94.0, 44.0, 32.0, 12.0, 7.0, 6.0, 4.0, 2.0, 2.0], "bins": [-22.03125, -21.33447265625, -20.6376953125, -19.94091796875, -19.244140625, -18.54736328125, -17.8505859375, -17.15380859375, -16.45703125, -15.76025390625, -15.0634765625, -14.36669921875, -13.669921875, -12.97314453125, -12.2763671875, -11.57958984375, -10.8828125, -10.18603515625, -9.4892578125, -8.79248046875, -8.095703125, -7.39892578125, -6.7021484375, -6.00537109375, -5.30859375, -4.61181640625, -3.9150390625, -3.21826171875, -2.521484375, -1.82470703125, -1.1279296875, -0.43115234375, 0.265625, 0.96240234375, 1.6591796875, 2.35595703125, 3.052734375, 3.74951171875, 4.4462890625, 5.14306640625, 5.83984375, 6.53662109375, 7.2333984375, 7.93017578125, 8.626953125, 9.32373046875, 10.0205078125, 10.71728515625, 11.4140625, 12.11083984375, 12.8076171875, 13.50439453125, 14.201171875, 14.89794921875, 15.5947265625, 16.29150390625, 16.98828125, 17.68505859375, 18.3818359375, 19.07861328125, 19.775390625, 20.47216796875, 21.1689453125, 21.86572265625, 22.5625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 9.0, 4.0, 15.0, 11.0, 13.0, 14.0, 21.0, 18.0, 20.0, 26.0, 26.0, 25.0, 31.0, 37.0, 44.0, 35.0, 31.0, 49.0, 36.0, 47.0, 38.0, 42.0, 44.0, 45.0, 25.0, 33.0, 34.0, 34.0, 27.0, 28.0, 22.0, 14.0, 22.0, 13.0, 10.0, 11.0, 15.0, 3.0, 11.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.875, -40.583984375, -39.29296875, -38.001953125, -36.7109375, -35.419921875, -34.12890625, -32.837890625, -31.546875, -30.255859375, -28.96484375, -27.673828125, -26.3828125, -25.091796875, -23.80078125, -22.509765625, -21.21875, -19.927734375, -18.63671875, -17.345703125, -16.0546875, -14.763671875, -13.47265625, -12.181640625, -10.890625, -9.599609375, -8.30859375, -7.017578125, -5.7265625, -4.435546875, -3.14453125, -1.853515625, -0.5625, 0.728515625, 2.01953125, 3.310546875, 4.6015625, 5.892578125, 7.18359375, 8.474609375, 9.765625, 11.056640625, 12.34765625, 13.638671875, 14.9296875, 16.220703125, 17.51171875, 18.802734375, 20.09375, 21.384765625, 22.67578125, 23.966796875, 25.2578125, 26.548828125, 27.83984375, 29.130859375, 30.421875, 31.712890625, 33.00390625, 34.294921875, 35.5859375, 36.876953125, 38.16796875, 39.458984375, 40.75]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 19.0, 35.0, 64.0, 169.0, 238.0, 505.0, 969.0, 1739.0, 3342.0, 5904.0, 10238.0, 17064.0, 28313.0, 44189.0, 67939.0, 99267.0, 140249.0, 188489.0, 241819.0, 295047.0, 340422.0, 372575.0, 385123.0, 375999.0, 350043.0, 306286.0, 254770.0, 200687.0, 152338.0, 108571.0, 74701.0, 49728.0, 31538.0, 19264.0, 11678.0, 6692.0, 3847.0, 2112.0, 1092.0, 593.0, 317.0, 155.0, 73.0, 44.0, 27.0, 12.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-30.734375, -29.87158203125, -29.0087890625, -28.14599609375, -27.283203125, -26.42041015625, -25.5576171875, -24.69482421875, -23.83203125, -22.96923828125, -22.1064453125, -21.24365234375, -20.380859375, -19.51806640625, -18.6552734375, -17.79248046875, -16.9296875, -16.06689453125, -15.2041015625, -14.34130859375, -13.478515625, -12.61572265625, -11.7529296875, -10.89013671875, -10.02734375, -9.16455078125, -8.3017578125, -7.43896484375, -6.576171875, -5.71337890625, -4.8505859375, -3.98779296875, -3.125, -2.26220703125, -1.3994140625, -0.53662109375, 0.326171875, 1.18896484375, 2.0517578125, 2.91455078125, 3.77734375, 4.64013671875, 5.5029296875, 6.36572265625, 7.228515625, 8.09130859375, 8.9541015625, 9.81689453125, 10.6796875, 11.54248046875, 12.4052734375, 13.26806640625, 14.130859375, 14.99365234375, 15.8564453125, 16.71923828125, 17.58203125, 18.44482421875, 19.3076171875, 20.17041015625, 21.033203125, 21.89599609375, 22.7587890625, 23.62158203125, 24.484375]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 7.0, 12.0, 9.0, 12.0, 13.0, 24.0, 31.0, 48.0, 47.0, 51.0, 63.0, 69.0, 95.0, 97.0, 115.0, 124.0, 136.0, 153.0, 154.0, 154.0, 197.0, 192.0, 174.0, 190.0, 184.0, 183.0, 153.0, 173.0, 163.0, 128.0, 134.0, 122.0, 100.0, 91.0, 95.0, 61.0, 58.0, 56.0, 40.0, 33.0, 35.0, 19.0, 22.0, 7.0, 25.0, 8.0, 6.0, 9.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-16.296875, -15.7744140625, -15.251953125, -14.7294921875, -14.20703125, -13.6845703125, -13.162109375, -12.6396484375, -12.1171875, -11.5947265625, -11.072265625, -10.5498046875, -10.02734375, -9.5048828125, -8.982421875, -8.4599609375, -7.9375, -7.4150390625, -6.892578125, -6.3701171875, -5.84765625, -5.3251953125, -4.802734375, -4.2802734375, -3.7578125, -3.2353515625, -2.712890625, -2.1904296875, -1.66796875, -1.1455078125, -0.623046875, -0.1005859375, 0.421875, 0.9443359375, 1.466796875, 1.9892578125, 2.51171875, 3.0341796875, 3.556640625, 4.0791015625, 4.6015625, 5.1240234375, 5.646484375, 6.1689453125, 6.69140625, 7.2138671875, 7.736328125, 8.2587890625, 8.78125, 9.3037109375, 9.826171875, 10.3486328125, 10.87109375, 11.3935546875, 11.916015625, 12.4384765625, 12.9609375, 13.4833984375, 14.005859375, 14.5283203125, 15.05078125, 15.5732421875, 16.095703125, 16.6181640625, 17.140625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 7.0, 7.0, 3.0, 8.0, 6.0, 6.0, 16.0, 11.0, 13.0, 25.0, 17.0, 29.0, 33.0, 33.0, 27.0, 50.0, 45.0, 30.0, 40.0, 40.0, 43.0, 43.0, 44.0, 40.0, 37.0, 33.0, 39.0, 43.0, 37.0, 30.0, 21.0, 35.0, 19.0, 26.0, 14.0, 7.0, 9.0, 12.0, 7.0, 6.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.42011260986328, -38.20119857788086, -36.98228454589844, -35.76336669921875, -34.54445266723633, -33.325538635253906, -32.10662078857422, -30.887706756591797, -29.668792724609375, -28.449878692626953, -27.2309627532959, -26.012046813964844, -24.793132781982422, -23.57421875, -22.355302810668945, -21.13638687133789, -19.91747283935547, -18.698558807373047, -17.479642868041992, -16.260726928710938, -15.041812896728516, -13.822897911071777, -12.603982925415039, -11.3850679397583, -10.166152954101562, -8.947237968444824, -7.728322982788086, -6.509407997131348, -5.290493011474609, -4.071578025817871, -2.852663040161133, -1.6337480545043945, -0.4148292541503906, 0.8040857315063477, 2.023000717163086, 3.241915702819824, 4.4608306884765625, 5.679745674133301, 6.898660659790039, 8.117575645446777, 9.336490631103516, 10.555405616760254, 11.774320602416992, 12.99323558807373, 14.212150573730469, 15.431065559387207, 16.649980545043945, 17.868896484375, 19.087810516357422, 20.306724548339844, 21.5256404876709, 22.744556427001953, 23.963470458984375, 25.182384490966797, 26.40130043029785, 27.620216369628906, 28.839130401611328, 30.05804443359375, 31.276960372924805, 32.49587631225586, 33.71479034423828, 34.9337043762207, 36.152618408203125, 37.37153625488281, 38.590450286865234]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 1.0, 6.0, 6.0, 6.0, 5.0, 9.0, 11.0, 15.0, 17.0, 20.0, 26.0, 21.0, 22.0, 30.0, 28.0, 28.0, 25.0, 32.0, 34.0, 41.0, 47.0, 43.0, 34.0, 25.0, 39.0, 43.0, 39.0, 32.0, 34.0, 33.0, 26.0, 33.0, 31.0, 25.0, 12.0, 26.0, 16.0, 16.0, 7.0, 11.0, 11.0, 11.0, 12.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.32664108276367, -41.88127136230469, -40.4359016418457, -38.99053192138672, -37.545162200927734, -36.09979248046875, -34.6544189453125, -33.20905303955078, -31.763681411743164, -30.31831169128418, -28.872941970825195, -27.427570343017578, -25.982200622558594, -24.53683090209961, -23.091461181640625, -21.64609146118164, -20.200721740722656, -18.755352020263672, -17.309982299804688, -15.864611625671387, -14.419241905212402, -12.973872184753418, -11.528501510620117, -10.083131790161133, -8.637762069702148, -7.192392349243164, -5.7470221519470215, -4.301651954650879, -2.8562822341918945, -1.4109125137329102, 0.034458160400390625, 1.479827880859375, 2.9251976013183594, 4.370567321777344, 5.815937519073486, 7.261307716369629, 8.706677436828613, 10.152047157287598, 11.597417831420898, 13.042787551879883, 14.488157272338867, 15.933526992797852, 17.378896713256836, 18.824268341064453, 20.269638061523438, 21.715007781982422, 23.160377502441406, 24.60574722290039, 26.051116943359375, 27.49648666381836, 28.941856384277344, 30.387226104736328, 31.832595825195312, 33.2779655456543, 34.72333526611328, 36.16870880126953, 37.61407470703125, 39.059444427490234, 40.50481414794922, 41.9501838684082, 43.39555358886719, 44.84092330932617, 46.286293029785156, 47.731666564941406, 49.17703628540039]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 5.0, 8.0, 9.0, 18.0, 24.0, 47.0, 57.0, 114.0, 168.0, 311.0, 537.0, 1051.0, 2122.0, 4280.0, 9227.0, 20371.0, 47150.0, 111903.0, 241089.0, 300873.0, 175065.0, 75460.0, 32060.0, 13934.0, 6348.0, 2998.0, 1510.0, 788.0, 428.0, 224.0, 153.0, 84.0, 50.0, 34.0, 16.0, 9.0, 17.0, 9.0, 0.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.8046875, -9.5008544921875, -9.197021484375, -8.8931884765625, -8.58935546875, -8.2855224609375, -7.981689453125, -7.6778564453125, -7.3740234375, -7.0701904296875, -6.766357421875, -6.4625244140625, -6.15869140625, -5.8548583984375, -5.551025390625, -5.2471923828125, -4.943359375, -4.6395263671875, -4.335693359375, -4.0318603515625, -3.72802734375, -3.4241943359375, -3.120361328125, -2.8165283203125, -2.5126953125, -2.2088623046875, -1.905029296875, -1.6011962890625, -1.29736328125, -0.9935302734375, -0.689697265625, -0.3858642578125, -0.08203125, 0.2218017578125, 0.525634765625, 0.8294677734375, 1.13330078125, 1.4371337890625, 1.740966796875, 2.0447998046875, 2.3486328125, 2.6524658203125, 2.956298828125, 3.2601318359375, 3.56396484375, 3.8677978515625, 4.171630859375, 4.4754638671875, 4.779296875, 5.0831298828125, 5.386962890625, 5.6907958984375, 5.99462890625, 6.2984619140625, 6.602294921875, 6.9061279296875, 7.2099609375, 7.5137939453125, 7.817626953125, 8.1214599609375, 8.42529296875, 8.7291259765625, 9.032958984375, 9.3367919921875, 9.640625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 7.0, 5.0, 8.0, 10.0, 14.0, 20.0, 17.0, 27.0, 22.0, 20.0, 29.0, 31.0, 28.0, 25.0, 27.0, 36.0, 41.0, 48.0, 42.0, 34.0, 27.0, 38.0, 44.0, 36.0, 30.0, 40.0, 31.0, 27.0, 33.0, 31.0, 25.0, 12.0, 27.0, 16.0, 16.0, 8.0, 11.0, 11.0, 10.0, 12.0, 6.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.34375, -41.89501953125, -40.4462890625, -38.99755859375, -37.548828125, -36.10009765625, -34.6513671875, -33.20263671875, -31.75390625, -30.30517578125, -28.8564453125, -27.40771484375, -25.958984375, -24.51025390625, -23.0615234375, -21.61279296875, -20.1640625, -18.71533203125, -17.2666015625, -15.81787109375, -14.369140625, -12.92041015625, -11.4716796875, -10.02294921875, -8.57421875, -7.12548828125, -5.6767578125, -4.22802734375, -2.779296875, -1.33056640625, 0.1181640625, 1.56689453125, 3.015625, 4.46435546875, 5.9130859375, 7.36181640625, 8.810546875, 10.25927734375, 11.7080078125, 13.15673828125, 14.60546875, 16.05419921875, 17.5029296875, 18.95166015625, 20.400390625, 21.84912109375, 23.2978515625, 24.74658203125, 26.1953125, 27.64404296875, 29.0927734375, 30.54150390625, 31.990234375, 33.43896484375, 34.8876953125, 36.33642578125, 37.78515625, 39.23388671875, 40.6826171875, 42.13134765625, 43.580078125, 45.02880859375, 46.4775390625, 47.92626953125, 49.375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 7.0, 5.0, 8.0, 13.0, 23.0, 35.0, 53.0, 57.0, 93.0, 152.0, 241.0, 384.0, 668.0, 1041.0, 1765.0, 3315.0, 6194.0, 13326.0, 30415.0, 78767.0, 221955.0, 376292.0, 194117.0, 68285.0, 26672.0, 11802.0, 5729.0, 2987.0, 1621.0, 1015.0, 544.0, 335.0, 238.0, 132.0, 82.0, 47.0, 35.0, 34.0, 17.0, 19.0, 14.0, 7.0, 4.0, 6.0, 3.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.1328125, -9.8297119140625, -9.526611328125, -9.2235107421875, -8.92041015625, -8.6173095703125, -8.314208984375, -8.0111083984375, -7.7080078125, -7.4049072265625, -7.101806640625, -6.7987060546875, -6.49560546875, -6.1925048828125, -5.889404296875, -5.5863037109375, -5.283203125, -4.9801025390625, -4.677001953125, -4.3739013671875, -4.07080078125, -3.7677001953125, -3.464599609375, -3.1614990234375, -2.8583984375, -2.5552978515625, -2.252197265625, -1.9490966796875, -1.64599609375, -1.3428955078125, -1.039794921875, -0.7366943359375, -0.43359375, -0.1304931640625, 0.172607421875, 0.4757080078125, 0.77880859375, 1.0819091796875, 1.385009765625, 1.6881103515625, 1.9912109375, 2.2943115234375, 2.597412109375, 2.9005126953125, 3.20361328125, 3.5067138671875, 3.809814453125, 4.1129150390625, 4.416015625, 4.7191162109375, 5.022216796875, 5.3253173828125, 5.62841796875, 5.9315185546875, 6.234619140625, 6.5377197265625, 6.8408203125, 7.1439208984375, 7.447021484375, 7.7501220703125, 8.05322265625, 8.3563232421875, 8.659423828125, 8.9625244140625, 9.265625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 4.0, 5.0, 11.0, 10.0, 6.0, 19.0, 17.0, 23.0, 15.0, 27.0, 30.0, 23.0, 24.0, 45.0, 49.0, 33.0, 55.0, 44.0, 49.0, 43.0, 47.0, 48.0, 41.0, 38.0, 40.0, 27.0, 35.0, 32.0, 28.0, 17.0, 16.0, 17.0, 12.0, 14.0, 12.0, 6.0, 10.0, 8.0, 11.0, 3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.03125, -36.92529296875, -35.8193359375, -34.71337890625, -33.607421875, -32.50146484375, -31.3955078125, -30.28955078125, -29.18359375, -28.07763671875, -26.9716796875, -25.86572265625, -24.759765625, -23.65380859375, -22.5478515625, -21.44189453125, -20.3359375, -19.22998046875, -18.1240234375, -17.01806640625, -15.912109375, -14.80615234375, -13.7001953125, -12.59423828125, -11.48828125, -10.38232421875, -9.2763671875, -8.17041015625, -7.064453125, -5.95849609375, -4.8525390625, -3.74658203125, -2.640625, -1.53466796875, -0.4287109375, 0.67724609375, 1.783203125, 2.88916015625, 3.9951171875, 5.10107421875, 6.20703125, 7.31298828125, 8.4189453125, 9.52490234375, 10.630859375, 11.73681640625, 12.8427734375, 13.94873046875, 15.0546875, 16.16064453125, 17.2666015625, 18.37255859375, 19.478515625, 20.58447265625, 21.6904296875, 22.79638671875, 23.90234375, 25.00830078125, 26.1142578125, 27.22021484375, 28.326171875, 29.43212890625, 30.5380859375, 31.64404296875, 32.75]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 7.0, 11.0, 21.0, 17.0, 32.0, 47.0, 67.0, 98.0, 142.0, 199.0, 350.0, 650.0, 1130.0, 1980.0, 3958.0, 8310.0, 19745.0, 57396.0, 278435.0, 517671.0, 103904.0, 30627.0, 12014.0, 5387.0, 2692.0, 1486.0, 861.0, 499.0, 276.0, 206.0, 120.0, 77.0, 53.0, 36.0, 23.0, 12.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5625, -4.4114990234375, -4.260498046875, -4.1094970703125, -3.95849609375, -3.8074951171875, -3.656494140625, -3.5054931640625, -3.3544921875, -3.2034912109375, -3.052490234375, -2.9014892578125, -2.75048828125, -2.5994873046875, -2.448486328125, -2.2974853515625, -2.146484375, -1.9954833984375, -1.844482421875, -1.6934814453125, -1.54248046875, -1.3914794921875, -1.240478515625, -1.0894775390625, -0.9384765625, -0.7874755859375, -0.636474609375, -0.4854736328125, -0.33447265625, -0.1834716796875, -0.032470703125, 0.1185302734375, 0.26953125, 0.4205322265625, 0.571533203125, 0.7225341796875, 0.87353515625, 1.0245361328125, 1.175537109375, 1.3265380859375, 1.4775390625, 1.6285400390625, 1.779541015625, 1.9305419921875, 2.08154296875, 2.2325439453125, 2.383544921875, 2.5345458984375, 2.685546875, 2.8365478515625, 2.987548828125, 3.1385498046875, 3.28955078125, 3.4405517578125, 3.591552734375, 3.7425537109375, 3.8935546875, 4.0445556640625, 4.195556640625, 4.3465576171875, 4.49755859375, 4.6485595703125, 4.799560546875, 4.9505615234375, 5.1015625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 2.0, 2.0, 4.0, 6.0, 8.0, 1.0, 13.0, 18.0, 18.0, 18.0, 23.0, 28.0, 43.0, 27.0, 35.0, 44.0, 31.0, 56.0, 43.0, 60.0, 61.0, 44.0, 41.0, 41.0, 55.0, 47.0, 33.0, 40.0, 30.0, 20.0, 18.0, 15.0, 16.0, 12.0, 13.0, 10.0, 7.0, 4.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00016450881958007812, -0.00015909597277641296, -0.0001536831259727478, -0.00014827027916908264, -0.00014285743236541748, -0.00013744458556175232, -0.00013203173875808716, -0.000126618891954422, -0.00012120604515075684, -0.00011579319834709167, -0.00011038035154342651, -0.00010496750473976135, -9.955465793609619e-05, -9.414181113243103e-05, -8.872896432876587e-05, -8.331611752510071e-05, -7.790327072143555e-05, -7.249042391777039e-05, -6.707757711410522e-05, -6.166473031044006e-05, -5.62518835067749e-05, -5.083903670310974e-05, -4.542618989944458e-05, -4.001334309577942e-05, -3.460049629211426e-05, -2.9187649488449097e-05, -2.3774802684783936e-05, -1.8361955881118774e-05, -1.2949109077453613e-05, -7.536262273788452e-06, -2.123415470123291e-06, 3.28943133354187e-06, 8.702278137207031e-06, 1.4115124940872192e-05, 1.9527971744537354e-05, 2.4940818548202515e-05, 3.0353665351867676e-05, 3.576651215553284e-05, 4.1179358959198e-05, 4.659220576286316e-05, 5.200505256652832e-05, 5.741789937019348e-05, 6.283074617385864e-05, 6.82435929775238e-05, 7.365643978118896e-05, 7.906928658485413e-05, 8.448213338851929e-05, 8.989498019218445e-05, 9.530782699584961e-05, 0.00010072067379951477, 0.00010613352060317993, 0.00011154636740684509, 0.00011695921421051025, 0.00012237206101417542, 0.00012778490781784058, 0.00013319775462150574, 0.0001386106014251709, 0.00014402344822883606, 0.00014943629503250122, 0.00015484914183616638, 0.00016026198863983154, 0.0001656748354434967, 0.00017108768224716187, 0.00017650052905082703, 0.0001819133758544922]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 7.0, 8.0, 9.0, 9.0, 20.0, 32.0, 55.0, 68.0, 103.0, 140.0, 217.0, 322.0, 505.0, 715.0, 1239.0, 1896.0, 3135.0, 5052.0, 8337.0, 14201.0, 24988.0, 45772.0, 83527.0, 148188.0, 219006.0, 203156.0, 127100.0, 70095.0, 38404.0, 21477.0, 12232.0, 7191.0, 4249.0, 2463.0, 1624.0, 1068.0, 653.0, 407.0, 292.0, 218.0, 112.0, 83.0, 54.0, 41.0, 29.0, 20.0, 13.0, 11.0, 8.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.716796875, -3.603668212890625, -3.49053955078125, -3.377410888671875, -3.2642822265625, -3.151153564453125, -3.03802490234375, -2.924896240234375, -2.811767578125, -2.698638916015625, -2.58551025390625, -2.472381591796875, -2.3592529296875, -2.246124267578125, -2.13299560546875, -2.019866943359375, -1.90673828125, -1.793609619140625, -1.68048095703125, -1.567352294921875, -1.4542236328125, -1.341094970703125, -1.22796630859375, -1.114837646484375, -1.001708984375, -0.888580322265625, -0.77545166015625, -0.662322998046875, -0.5491943359375, -0.436065673828125, -0.32293701171875, -0.209808349609375, -0.0966796875, 0.016448974609375, 0.12957763671875, 0.242706298828125, 0.3558349609375, 0.468963623046875, 0.58209228515625, 0.695220947265625, 0.808349609375, 0.921478271484375, 1.03460693359375, 1.147735595703125, 1.2608642578125, 1.373992919921875, 1.48712158203125, 1.600250244140625, 1.71337890625, 1.826507568359375, 1.93963623046875, 2.052764892578125, 2.1658935546875, 2.279022216796875, 2.39215087890625, 2.505279541015625, 2.618408203125, 2.731536865234375, 2.84466552734375, 2.957794189453125, 3.0709228515625, 3.184051513671875, 3.29718017578125, 3.410308837890625, 3.5234375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 6.0, 12.0, 14.0, 15.0, 17.0, 24.0, 32.0, 62.0, 48.0, 75.0, 89.0, 96.0, 86.0, 71.0, 63.0, 66.0, 44.0, 43.0, 29.0, 21.0, 14.0, 19.0, 10.0, 9.0, 3.0, 9.0, 7.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.013671875, -2.919097900390625, -2.82452392578125, -2.729949951171875, -2.6353759765625, -2.540802001953125, -2.44622802734375, -2.351654052734375, -2.257080078125, -2.162506103515625, -2.06793212890625, -1.973358154296875, -1.8787841796875, -1.784210205078125, -1.68963623046875, -1.595062255859375, -1.50048828125, -1.405914306640625, -1.31134033203125, -1.216766357421875, -1.1221923828125, -1.027618408203125, -0.93304443359375, -0.838470458984375, -0.743896484375, -0.649322509765625, -0.55474853515625, -0.460174560546875, -0.3656005859375, -0.271026611328125, -0.17645263671875, -0.081878662109375, 0.0126953125, 0.107269287109375, 0.20184326171875, 0.296417236328125, 0.3909912109375, 0.485565185546875, 0.58013916015625, 0.674713134765625, 0.769287109375, 0.863861083984375, 0.95843505859375, 1.053009033203125, 1.1475830078125, 1.242156982421875, 1.33673095703125, 1.431304931640625, 1.52587890625, 1.620452880859375, 1.71502685546875, 1.809600830078125, 1.9041748046875, 1.998748779296875, 2.09332275390625, 2.187896728515625, 2.282470703125, 2.377044677734375, 2.47161865234375, 2.566192626953125, 2.6607666015625, 2.755340576171875, 2.84991455078125, 2.944488525390625, 3.0390625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 6.0, 7.0, 4.0, 8.0, 9.0, 16.0, 13.0, 20.0, 21.0, 26.0, 28.0, 27.0, 35.0, 38.0, 50.0, 36.0, 35.0, 47.0, 36.0, 46.0, 38.0, 42.0, 41.0, 41.0, 34.0, 40.0, 42.0, 31.0, 24.0, 30.0, 24.0, 27.0, 13.0, 12.0, 12.0, 8.0, 8.0, 6.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.04429626464844, -37.81381607055664, -36.58333206176758, -35.35285186767578, -34.12236785888672, -32.89188766479492, -31.661407470703125, -30.430925369262695, -29.200443267822266, -27.969961166381836, -26.739479064941406, -25.50899887084961, -24.27851676940918, -23.04803466796875, -21.817554473876953, -20.587072372436523, -19.356590270996094, -18.126108169555664, -16.895626068115234, -15.665145874023438, -14.434663772583008, -13.204181671142578, -11.973700523376465, -10.743219375610352, -9.512737274169922, -8.282255172729492, -7.051774024963379, -5.821292400360107, -4.590810775756836, -3.3603291511535645, -2.129847526550293, -0.8993663787841797, 0.33111572265625, 1.5615973472595215, 2.792078971862793, 4.0225605964660645, 5.253042221069336, 6.483523845672607, 7.714005470275879, 8.944486618041992, 10.174968719482422, 11.405450820922852, 12.635931968688965, 13.866413116455078, 15.096895217895508, 16.327377319335938, 17.557857513427734, 18.788339614868164, 20.018821716308594, 21.249303817749023, 22.479785919189453, 23.71026611328125, 24.94074821472168, 26.17123031616211, 27.401710510253906, 28.632192611694336, 29.862674713134766, 31.093156814575195, 32.323638916015625, 33.55411911010742, 34.78459930419922, 36.01508331298828, 37.24556350708008, 38.476043701171875, 39.70652770996094]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 6.0, 8.0, 5.0, 11.0, 16.0, 8.0, 16.0, 26.0, 21.0, 22.0, 21.0, 30.0, 30.0, 28.0, 29.0, 31.0, 40.0, 35.0, 47.0, 39.0, 32.0, 31.0, 38.0, 45.0, 37.0, 29.0, 37.0, 29.0, 27.0, 34.0, 32.0, 19.0, 17.0, 22.0, 20.0, 12.0, 7.0, 17.0, 8.0, 9.0, 13.0, 7.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.920928955078125, -41.475074768066406, -40.02922058105469, -38.58336639404297, -37.13751220703125, -35.69165802001953, -34.24580383300781, -32.799949645996094, -31.354095458984375, -29.908241271972656, -28.462387084960938, -27.01653289794922, -25.5706787109375, -24.12482452392578, -22.678970336914062, -21.233116149902344, -19.787261962890625, -18.341407775878906, -16.895553588867188, -15.449699401855469, -14.00384521484375, -12.557991027832031, -11.112136840820312, -9.666282653808594, -8.220428466796875, -6.774574279785156, -5.3287200927734375, -3.8828659057617188, -2.43701171875, -0.9911575317382812, 0.4546966552734375, 1.9005508422851562, 3.3464088439941406, 4.792263031005859, 6.238117218017578, 7.683971405029297, 9.129825592041016, 10.575679779052734, 12.021533966064453, 13.467388153076172, 14.91324234008789, 16.35909652709961, 17.804950714111328, 19.250804901123047, 20.696659088134766, 22.142513275146484, 23.588367462158203, 25.034221649169922, 26.48007583618164, 27.92593002319336, 29.371784210205078, 30.817638397216797, 32.263492584228516, 33.709346771240234, 35.15520095825195, 36.60105514526367, 38.04690933227539, 39.49276351928711, 40.93861770629883, 42.38447189331055, 43.830326080322266, 45.276180267333984, 46.7220344543457, 48.16788864135742, 49.61374282836914]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 12.0, 26.0, 30.0, 49.0, 79.0, 143.0, 225.0, 288.0, 521.0, 851.0, 1391.0, 2059.0, 3032.0, 4602.0, 6928.0, 9554.0, 13800.0, 19112.0, 25466.0, 33232.0, 42391.0, 52059.0, 61534.0, 69525.0, 76654.0, 80678.0, 81547.0, 78863.0, 73172.0, 65872.0, 56845.0, 46548.0, 37966.0, 29328.0, 21940.0, 16489.0, 11482.0, 8064.0, 5439.0, 3685.0, 2539.0, 1607.0, 1073.0, 686.0, 429.0, 279.0, 177.0, 100.0, 69.0, 49.0, 27.0, 14.0, 11.0, 8.0, 5.0, 4.0], "bins": [-17.875, -17.35302734375, -16.8310546875, -16.30908203125, -15.787109375, -15.26513671875, -14.7431640625, -14.22119140625, -13.69921875, -13.17724609375, -12.6552734375, -12.13330078125, -11.611328125, -11.08935546875, -10.5673828125, -10.04541015625, -9.5234375, -9.00146484375, -8.4794921875, -7.95751953125, -7.435546875, -6.91357421875, -6.3916015625, -5.86962890625, -5.34765625, -4.82568359375, -4.3037109375, -3.78173828125, -3.259765625, -2.73779296875, -2.2158203125, -1.69384765625, -1.171875, -0.64990234375, -0.1279296875, 0.39404296875, 0.916015625, 1.43798828125, 1.9599609375, 2.48193359375, 3.00390625, 3.52587890625, 4.0478515625, 4.56982421875, 5.091796875, 5.61376953125, 6.1357421875, 6.65771484375, 7.1796875, 7.70166015625, 8.2236328125, 8.74560546875, 9.267578125, 9.78955078125, 10.3115234375, 10.83349609375, 11.35546875, 11.87744140625, 12.3994140625, 12.92138671875, 13.443359375, 13.96533203125, 14.4873046875, 15.00927734375, 15.53125]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 6.0, 8.0, 4.0, 12.0, 15.0, 8.0, 17.0, 25.0, 22.0, 21.0, 21.0, 30.0, 35.0, 19.0, 30.0, 35.0, 34.0, 39.0, 44.0, 38.0, 34.0, 32.0, 36.0, 42.0, 39.0, 31.0, 34.0, 28.0, 30.0, 32.0, 36.0, 21.0, 16.0, 22.0, 18.0, 15.0, 8.0, 15.0, 8.0, 9.0, 13.0, 7.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.3125, -40.89306640625, -39.4736328125, -38.05419921875, -36.634765625, -35.21533203125, -33.7958984375, -32.37646484375, -30.95703125, -29.53759765625, -28.1181640625, -26.69873046875, -25.279296875, -23.85986328125, -22.4404296875, -21.02099609375, -19.6015625, -18.18212890625, -16.7626953125, -15.34326171875, -13.923828125, -12.50439453125, -11.0849609375, -9.66552734375, -8.24609375, -6.82666015625, -5.4072265625, -3.98779296875, -2.568359375, -1.14892578125, 0.2705078125, 1.68994140625, 3.109375, 4.52880859375, 5.9482421875, 7.36767578125, 8.787109375, 10.20654296875, 11.6259765625, 13.04541015625, 14.46484375, 15.88427734375, 17.3037109375, 18.72314453125, 20.142578125, 21.56201171875, 22.9814453125, 24.40087890625, 25.8203125, 27.23974609375, 28.6591796875, 30.07861328125, 31.498046875, 32.91748046875, 34.3369140625, 35.75634765625, 37.17578125, 38.59521484375, 40.0146484375, 41.43408203125, 42.853515625, 44.27294921875, 45.6923828125, 47.11181640625, 48.53125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 8.0, 7.0, 14.0, 21.0, 46.0, 54.0, 100.0, 176.0, 291.0, 456.0, 686.0, 1098.0, 1767.0, 2858.0, 4389.0, 6461.0, 10108.0, 14835.0, 21234.0, 29230.0, 39456.0, 50852.0, 64505.0, 75369.0, 85104.0, 91091.0, 92774.0, 88927.0, 81032.0, 70068.0, 57701.0, 45375.0, 34440.0, 24840.0, 17771.0, 12501.0, 8217.0, 5445.0, 3537.0, 2088.0, 1341.0, 844.0, 519.0, 368.0, 231.0, 135.0, 67.0, 48.0, 33.0, 16.0, 8.0, 7.0, 8.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-18.953125, -18.32666015625, -17.7001953125, -17.07373046875, -16.447265625, -15.82080078125, -15.1943359375, -14.56787109375, -13.94140625, -13.31494140625, -12.6884765625, -12.06201171875, -11.435546875, -10.80908203125, -10.1826171875, -9.55615234375, -8.9296875, -8.30322265625, -7.6767578125, -7.05029296875, -6.423828125, -5.79736328125, -5.1708984375, -4.54443359375, -3.91796875, -3.29150390625, -2.6650390625, -2.03857421875, -1.412109375, -0.78564453125, -0.1591796875, 0.46728515625, 1.09375, 1.72021484375, 2.3466796875, 2.97314453125, 3.599609375, 4.22607421875, 4.8525390625, 5.47900390625, 6.10546875, 6.73193359375, 7.3583984375, 7.98486328125, 8.611328125, 9.23779296875, 9.8642578125, 10.49072265625, 11.1171875, 11.74365234375, 12.3701171875, 12.99658203125, 13.623046875, 14.24951171875, 14.8759765625, 15.50244140625, 16.12890625, 16.75537109375, 17.3818359375, 18.00830078125, 18.634765625, 19.26123046875, 19.8876953125, 20.51416015625, 21.140625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 2.0, 0.0, 4.0, 5.0, 4.0, 9.0, 6.0, 10.0, 13.0, 16.0, 18.0, 15.0, 26.0, 27.0, 33.0, 40.0, 36.0, 34.0, 32.0, 47.0, 34.0, 36.0, 52.0, 44.0, 40.0, 34.0, 37.0, 38.0, 35.0, 38.0, 29.0, 24.0, 30.0, 21.0, 21.0, 11.0, 21.0, 15.0, 14.0, 12.0, 11.0, 3.0, 9.0, 6.0, 6.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-35.28125, -34.263671875, -33.24609375, -32.228515625, -31.2109375, -30.193359375, -29.17578125, -28.158203125, -27.140625, -26.123046875, -25.10546875, -24.087890625, -23.0703125, -22.052734375, -21.03515625, -20.017578125, -19.0, -17.982421875, -16.96484375, -15.947265625, -14.9296875, -13.912109375, -12.89453125, -11.876953125, -10.859375, -9.841796875, -8.82421875, -7.806640625, -6.7890625, -5.771484375, -4.75390625, -3.736328125, -2.71875, -1.701171875, -0.68359375, 0.333984375, 1.3515625, 2.369140625, 3.38671875, 4.404296875, 5.421875, 6.439453125, 7.45703125, 8.474609375, 9.4921875, 10.509765625, 11.52734375, 12.544921875, 13.5625, 14.580078125, 15.59765625, 16.615234375, 17.6328125, 18.650390625, 19.66796875, 20.685546875, 21.703125, 22.720703125, 23.73828125, 24.755859375, 25.7734375, 26.791015625, 27.80859375, 28.826171875, 29.84375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 6.0, 12.0, 18.0, 29.0, 56.0, 95.0, 136.0, 230.0, 411.0, 647.0, 1078.0, 1613.0, 2626.0, 4174.0, 6570.0, 10379.0, 15607.0, 23118.0, 33079.0, 45240.0, 58953.0, 73975.0, 87072.0, 96361.0, 100385.0, 97813.0, 89386.0, 77659.0, 62686.0, 48516.0, 35947.0, 25535.0, 17453.0, 11516.0, 7468.0, 4737.0, 3026.0, 1885.0, 1177.0, 750.0, 447.0, 284.0, 161.0, 109.0, 46.0, 40.0, 16.0, 21.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0], "bins": [-10.390625, -10.090576171875, -9.79052734375, -9.490478515625, -9.1904296875, -8.890380859375, -8.59033203125, -8.290283203125, -7.990234375, -7.690185546875, -7.39013671875, -7.090087890625, -6.7900390625, -6.489990234375, -6.18994140625, -5.889892578125, -5.58984375, -5.289794921875, -4.98974609375, -4.689697265625, -4.3896484375, -4.089599609375, -3.78955078125, -3.489501953125, -3.189453125, -2.889404296875, -2.58935546875, -2.289306640625, -1.9892578125, -1.689208984375, -1.38916015625, -1.089111328125, -0.7890625, -0.489013671875, -0.18896484375, 0.111083984375, 0.4111328125, 0.711181640625, 1.01123046875, 1.311279296875, 1.611328125, 1.911376953125, 2.21142578125, 2.511474609375, 2.8115234375, 3.111572265625, 3.41162109375, 3.711669921875, 4.01171875, 4.311767578125, 4.61181640625, 4.911865234375, 5.2119140625, 5.511962890625, 5.81201171875, 6.112060546875, 6.412109375, 6.712158203125, 7.01220703125, 7.312255859375, 7.6123046875, 7.912353515625, 8.21240234375, 8.512451171875, 8.8125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 4.0, 4.0, 9.0, 10.0, 13.0, 15.0, 6.0, 12.0, 20.0, 25.0, 20.0, 28.0, 25.0, 36.0, 31.0, 33.0, 44.0, 42.0, 45.0, 29.0, 34.0, 41.0, 47.0, 31.0, 47.0, 36.0, 25.0, 42.0, 38.0, 28.0, 24.0, 26.0, 24.0, 17.0, 19.0, 14.0, 6.0, 11.0, 16.0, 7.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0010700225830078125, -0.0010326355695724487, -0.000995248556137085, -0.0009578615427017212, -0.0009204745292663574, -0.0008830875158309937, -0.0008457005023956299, -0.0008083134889602661, -0.0007709264755249023, -0.0007335394620895386, -0.0006961524486541748, -0.000658765435218811, -0.0006213784217834473, -0.0005839914083480835, -0.0005466043949127197, -0.000509217381477356, -0.0004718303680419922, -0.0004344433546066284, -0.00039705634117126465, -0.0003596693277359009, -0.0003222823143005371, -0.00028489530086517334, -0.00024750828742980957, -0.0002101212739944458, -0.00017273426055908203, -0.00013534724712371826, -9.796023368835449e-05, -6.057322025299072e-05, -2.3186206817626953e-05, 1.4200806617736816e-05, 5.1587820053100586e-05, 8.897483348846436e-05, 0.00012636184692382812, 0.0001637488603591919, 0.00020113587379455566, 0.00023852288722991943, 0.0002759099006652832, 0.00031329691410064697, 0.00035068392753601074, 0.0003880709409713745, 0.0004254579544067383, 0.00046284496784210205, 0.0005002319812774658, 0.0005376189947128296, 0.0005750060081481934, 0.0006123930215835571, 0.0006497800350189209, 0.0006871670484542847, 0.0007245540618896484, 0.0007619410753250122, 0.000799328088760376, 0.0008367151021957397, 0.0008741021156311035, 0.0009114891290664673, 0.0009488761425018311, 0.0009862631559371948, 0.0010236501693725586, 0.0010610371828079224, 0.0010984241962432861, 0.00113581120967865, 0.0011731982231140137, 0.0012105852365493774, 0.0012479722499847412, 0.001285359263420105, 0.0013227462768554688]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 9.0, 12.0, 27.0, 47.0, 43.0, 101.0, 165.0, 278.0, 406.0, 683.0, 1119.0, 1661.0, 2753.0, 4418.0, 6808.0, 10459.0, 16110.0, 23410.0, 33444.0, 46420.0, 60753.0, 75403.0, 89069.0, 98500.0, 102128.0, 98403.0, 89154.0, 75702.0, 61015.0, 46558.0, 33986.0, 23654.0, 16337.0, 10640.0, 6883.0, 4468.0, 2877.0, 1748.0, 1099.0, 696.0, 417.0, 275.0, 156.0, 94.0, 54.0, 45.0, 24.0, 18.0, 10.0, 6.0, 7.0, 2.0, 3.0, 2.0, 0.0, 3.0], "bins": [-10.8671875, -10.532958984375, -10.19873046875, -9.864501953125, -9.5302734375, -9.196044921875, -8.86181640625, -8.527587890625, -8.193359375, -7.859130859375, -7.52490234375, -7.190673828125, -6.8564453125, -6.522216796875, -6.18798828125, -5.853759765625, -5.51953125, -5.185302734375, -4.85107421875, -4.516845703125, -4.1826171875, -3.848388671875, -3.51416015625, -3.179931640625, -2.845703125, -2.511474609375, -2.17724609375, -1.843017578125, -1.5087890625, -1.174560546875, -0.84033203125, -0.506103515625, -0.171875, 0.162353515625, 0.49658203125, 0.830810546875, 1.1650390625, 1.499267578125, 1.83349609375, 2.167724609375, 2.501953125, 2.836181640625, 3.17041015625, 3.504638671875, 3.8388671875, 4.173095703125, 4.50732421875, 4.841552734375, 5.17578125, 5.510009765625, 5.84423828125, 6.178466796875, 6.5126953125, 6.846923828125, 7.18115234375, 7.515380859375, 7.849609375, 8.183837890625, 8.51806640625, 8.852294921875, 9.1865234375, 9.520751953125, 9.85498046875, 10.189208984375, 10.5234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 7.0, 8.0, 10.0, 14.0, 24.0, 20.0, 16.0, 26.0, 31.0, 41.0, 57.0, 49.0, 76.0, 74.0, 51.0, 58.0, 59.0, 68.0, 45.0, 44.0, 54.0, 30.0, 26.0, 27.0, 18.0, 10.0, 9.0, 13.0, 13.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3828125, -7.15142822265625, -6.9200439453125, -6.68865966796875, -6.457275390625, -6.22589111328125, -5.9945068359375, -5.76312255859375, -5.53173828125, -5.30035400390625, -5.0689697265625, -4.83758544921875, -4.606201171875, -4.37481689453125, -4.1434326171875, -3.91204833984375, -3.6806640625, -3.44927978515625, -3.2178955078125, -2.98651123046875, -2.755126953125, -2.52374267578125, -2.2923583984375, -2.06097412109375, -1.82958984375, -1.59820556640625, -1.3668212890625, -1.13543701171875, -0.904052734375, -0.67266845703125, -0.4412841796875, -0.20989990234375, 0.021484375, 0.25286865234375, 0.4842529296875, 0.71563720703125, 0.947021484375, 1.17840576171875, 1.4097900390625, 1.64117431640625, 1.87255859375, 2.10394287109375, 2.3353271484375, 2.56671142578125, 2.798095703125, 3.02947998046875, 3.2608642578125, 3.49224853515625, 3.7236328125, 3.95501708984375, 4.1864013671875, 4.41778564453125, 4.649169921875, 4.88055419921875, 5.1119384765625, 5.34332275390625, 5.57470703125, 5.80609130859375, 6.0374755859375, 6.26885986328125, 6.500244140625, 6.73162841796875, 6.9630126953125, 7.19439697265625, 7.42578125]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 9.0, 2.0, 8.0, 17.0, 12.0, 9.0, 11.0, 13.0, 23.0, 31.0, 15.0, 37.0, 41.0, 50.0, 37.0, 29.0, 59.0, 51.0, 38.0, 38.0, 50.0, 55.0, 43.0, 40.0, 33.0, 33.0, 36.0, 32.0, 26.0, 28.0, 22.0, 19.0, 12.0, 10.0, 3.0, 10.0, 5.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-44.491859436035156, -43.1541862487793, -41.81651306152344, -40.47883605957031, -39.14116287231445, -37.803489685058594, -36.465816497802734, -35.128143310546875, -33.79046630859375, -32.45279312133789, -31.1151180267334, -29.77744483947754, -28.439769744873047, -27.102096557617188, -25.764423370361328, -24.42675018310547, -23.08907699584961, -21.75140380859375, -20.413728713989258, -19.0760555267334, -17.738380432128906, -16.400707244873047, -15.063034057617188, -13.725359916687012, -12.387685775756836, -11.05001163482666, -9.712337493896484, -8.374664306640625, -7.036990165710449, -5.699316024780273, -4.361642837524414, -3.0239686965942383, -1.6862983703613281, -0.34862446784973145, 0.9890494346618652, 2.326723098754883, 3.6643972396850586, 5.002071380615234, 6.339744567871094, 7.6774187088012695, 9.015092849731445, 10.352766990661621, 11.690441131591797, 13.028114318847656, 14.365788459777832, 15.703462600708008, 17.041135787963867, 18.37881088256836, 19.71648406982422, 21.054157257080078, 22.39183235168457, 23.72950553894043, 25.067180633544922, 26.40485382080078, 27.74252700805664, 29.0802001953125, 30.417875289916992, 31.75554847717285, 33.093223571777344, 34.4308967590332, 35.76856994628906, 37.10624694824219, 38.44391632080078, 39.781593322753906, 41.119266510009766]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 4.0, 6.0, 5.0, 5.0, 9.0, 16.0, 16.0, 22.0, 23.0, 18.0, 23.0, 20.0, 29.0, 27.0, 35.0, 37.0, 38.0, 37.0, 30.0, 34.0, 40.0, 47.0, 42.0, 44.0, 38.0, 43.0, 35.0, 42.0, 39.0, 27.0, 30.0, 26.0, 24.0, 14.0, 11.0, 16.0, 8.0, 8.0, 6.0, 12.0, 9.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-63.33000564575195, -61.52952575683594, -59.72904586791992, -57.928565979003906, -56.12808609008789, -54.327606201171875, -52.527122497558594, -50.72664260864258, -48.92616271972656, -47.12568283081055, -45.32520294189453, -43.524723052978516, -41.7242431640625, -39.92375946044922, -38.12328338623047, -36.32279968261719, -34.52232360839844, -32.72184371948242, -30.921363830566406, -29.12088394165039, -27.320402145385742, -25.519922256469727, -23.71944236755371, -21.918960571289062, -20.118480682373047, -18.31800079345703, -16.517520904541016, -14.717040061950684, -12.916559219360352, -11.116079330444336, -9.31559944152832, -7.515118598937988, -5.714637756347656, -3.9141573905944824, -2.1136772632598877, -0.31319713592529297, 1.4872832298278809, 3.2877635955810547, 5.08824348449707, 6.888724327087402, 8.689204216003418, 10.489684104919434, 12.290164947509766, 14.090644836425781, 15.891124725341797, 17.691604614257812, 19.492084503173828, 21.292566299438477, 23.093046188354492, 24.893526077270508, 26.694005966186523, 28.494487762451172, 30.294967651367188, 32.0954475402832, 33.89592742919922, 35.696407318115234, 37.49688720703125, 39.297367095947266, 41.09784698486328, 42.8983268737793, 44.69880676269531, 46.499290466308594, 48.299766540527344, 50.100250244140625, 51.90073013305664]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 7.0, 14.0, 24.0, 36.0, 73.0, 102.0, 153.0, 262.0, 488.0, 728.0, 1275.0, 1975.0, 3350.0, 5334.0, 8301.0, 13318.0, 20516.0, 30692.0, 46394.0, 67492.0, 94655.0, 130536.0, 172230.0, 217775.0, 266889.0, 310391.0, 345147.0, 364210.0, 363898.0, 344646.0, 310806.0, 266175.0, 218414.0, 170987.0, 128293.0, 93994.0, 65214.0, 45311.0, 30591.0, 19935.0, 12681.0, 8064.0, 5037.0, 3050.0, 1959.0, 1175.0, 668.0, 411.0, 256.0, 129.0, 104.0, 57.0, 27.0, 20.0, 9.0, 4.0, 6.0, 2.0, 2.0, 0.0, 2.0], "bins": [-27.265625, -26.385498046875, -25.50537109375, -24.625244140625, -23.7451171875, -22.864990234375, -21.98486328125, -21.104736328125, -20.224609375, -19.344482421875, -18.46435546875, -17.584228515625, -16.7041015625, -15.823974609375, -14.94384765625, -14.063720703125, -13.18359375, -12.303466796875, -11.42333984375, -10.543212890625, -9.6630859375, -8.782958984375, -7.90283203125, -7.022705078125, -6.142578125, -5.262451171875, -4.38232421875, -3.502197265625, -2.6220703125, -1.741943359375, -0.86181640625, 0.018310546875, 0.8984375, 1.778564453125, 2.65869140625, 3.538818359375, 4.4189453125, 5.299072265625, 6.17919921875, 7.059326171875, 7.939453125, 8.819580078125, 9.69970703125, 10.579833984375, 11.4599609375, 12.340087890625, 13.22021484375, 14.100341796875, 14.98046875, 15.860595703125, 16.74072265625, 17.620849609375, 18.5009765625, 19.381103515625, 20.26123046875, 21.141357421875, 22.021484375, 22.901611328125, 23.78173828125, 24.661865234375, 25.5419921875, 26.422119140625, 27.30224609375, 28.182373046875, 29.0625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 9.0, 1.0, 6.0, 9.0, 18.0, 13.0, 25.0, 19.0, 18.0, 24.0, 26.0, 22.0, 31.0, 34.0, 38.0, 36.0, 37.0, 30.0, 40.0, 40.0, 44.0, 39.0, 41.0, 40.0, 42.0, 40.0, 41.0, 36.0, 27.0, 29.0, 24.0, 23.0, 16.0, 11.0, 16.0, 9.0, 6.0, 9.0, 10.0, 8.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-60.4375, -58.7158203125, -56.994140625, -55.2724609375, -53.55078125, -51.8291015625, -50.107421875, -48.3857421875, -46.6640625, -44.9423828125, -43.220703125, -41.4990234375, -39.77734375, -38.0556640625, -36.333984375, -34.6123046875, -32.890625, -31.1689453125, -29.447265625, -27.7255859375, -26.00390625, -24.2822265625, -22.560546875, -20.8388671875, -19.1171875, -17.3955078125, -15.673828125, -13.9521484375, -12.23046875, -10.5087890625, -8.787109375, -7.0654296875, -5.34375, -3.6220703125, -1.900390625, -0.1787109375, 1.54296875, 3.2646484375, 4.986328125, 6.7080078125, 8.4296875, 10.1513671875, 11.873046875, 13.5947265625, 15.31640625, 17.0380859375, 18.759765625, 20.4814453125, 22.203125, 23.9248046875, 25.646484375, 27.3681640625, 29.08984375, 30.8115234375, 32.533203125, 34.2548828125, 35.9765625, 37.6982421875, 39.419921875, 41.1416015625, 42.86328125, 44.5849609375, 46.306640625, 48.0283203125, 49.75]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [4.0, 5.0, 14.0, 16.0, 30.0, 45.0, 98.0, 192.0, 251.0, 412.0, 723.0, 1306.0, 1972.0, 3227.0, 4971.0, 7990.0, 12201.0, 18475.0, 27216.0, 38381.0, 54494.0, 74579.0, 99780.0, 129174.0, 162978.0, 198167.0, 233679.0, 264837.0, 290578.0, 306895.0, 313708.0, 307242.0, 293631.0, 266091.0, 234719.0, 199988.0, 163815.0, 130992.0, 100694.0, 75591.0, 55521.0, 39851.0, 27182.0, 18749.0, 12355.0, 7980.0, 5207.0, 3324.0, 1968.0, 1237.0, 697.0, 431.0, 270.0, 156.0, 87.0, 58.0, 31.0, 20.0, 9.0, 4.0, 1.0, 1.0, 2.0, 2.0], "bins": [-24.6875, -23.878662109375, -23.06982421875, -22.260986328125, -21.4521484375, -20.643310546875, -19.83447265625, -19.025634765625, -18.216796875, -17.407958984375, -16.59912109375, -15.790283203125, -14.9814453125, -14.172607421875, -13.36376953125, -12.554931640625, -11.74609375, -10.937255859375, -10.12841796875, -9.319580078125, -8.5107421875, -7.701904296875, -6.89306640625, -6.084228515625, -5.275390625, -4.466552734375, -3.65771484375, -2.848876953125, -2.0400390625, -1.231201171875, -0.42236328125, 0.386474609375, 1.1953125, 2.004150390625, 2.81298828125, 3.621826171875, 4.4306640625, 5.239501953125, 6.04833984375, 6.857177734375, 7.666015625, 8.474853515625, 9.28369140625, 10.092529296875, 10.9013671875, 11.710205078125, 12.51904296875, 13.327880859375, 14.13671875, 14.945556640625, 15.75439453125, 16.563232421875, 17.3720703125, 18.180908203125, 18.98974609375, 19.798583984375, 20.607421875, 21.416259765625, 22.22509765625, 23.033935546875, 23.8427734375, 24.651611328125, 25.46044921875, 26.269287109375, 27.078125]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 3.0, 7.0, 1.0, 3.0, 4.0, 11.0, 11.0, 16.0, 20.0, 16.0, 28.0, 32.0, 33.0, 52.0, 66.0, 81.0, 81.0, 88.0, 109.0, 86.0, 135.0, 124.0, 156.0, 152.0, 173.0, 195.0, 173.0, 164.0, 183.0, 187.0, 168.0, 170.0, 133.0, 175.0, 120.0, 124.0, 100.0, 126.0, 91.0, 88.0, 79.0, 64.0, 49.0, 44.0, 42.0, 27.0, 22.0, 17.0, 14.0, 16.0, 11.0, 4.0, 4.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.3125, -19.68017578125, -19.0478515625, -18.41552734375, -17.783203125, -17.15087890625, -16.5185546875, -15.88623046875, -15.25390625, -14.62158203125, -13.9892578125, -13.35693359375, -12.724609375, -12.09228515625, -11.4599609375, -10.82763671875, -10.1953125, -9.56298828125, -8.9306640625, -8.29833984375, -7.666015625, -7.03369140625, -6.4013671875, -5.76904296875, -5.13671875, -4.50439453125, -3.8720703125, -3.23974609375, -2.607421875, -1.97509765625, -1.3427734375, -0.71044921875, -0.078125, 0.55419921875, 1.1865234375, 1.81884765625, 2.451171875, 3.08349609375, 3.7158203125, 4.34814453125, 4.98046875, 5.61279296875, 6.2451171875, 6.87744140625, 7.509765625, 8.14208984375, 8.7744140625, 9.40673828125, 10.0390625, 10.67138671875, 11.3037109375, 11.93603515625, 12.568359375, 13.20068359375, 13.8330078125, 14.46533203125, 15.09765625, 15.72998046875, 16.3623046875, 16.99462890625, 17.626953125, 18.25927734375, 18.8916015625, 19.52392578125, 20.15625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 7.0, 3.0, 4.0, 6.0, 4.0, 10.0, 13.0, 12.0, 13.0, 17.0, 14.0, 34.0, 22.0, 25.0, 34.0, 40.0, 37.0, 30.0, 45.0, 35.0, 38.0, 51.0, 41.0, 35.0, 45.0, 46.0, 48.0, 42.0, 32.0, 28.0, 25.0, 31.0, 17.0, 27.0, 18.0, 13.0, 17.0, 15.0, 8.0, 8.0, 10.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-48.42487716674805, -46.97502899169922, -45.525184631347656, -44.07533645629883, -42.62548828125, -41.17564392089844, -39.72579574584961, -38.27594757080078, -36.82610321044922, -35.37625503540039, -33.92641067504883, -32.4765625, -31.026716232299805, -29.57686996459961, -28.12702178955078, -26.677175521850586, -25.227327346801758, -23.777481079101562, -22.327632904052734, -20.87778663635254, -19.427940368652344, -17.978092193603516, -16.52824592590332, -15.078399658203125, -13.628552436828613, -12.178705215454102, -10.728858947753906, -9.279011726379395, -7.829164981842041, -6.3793182373046875, -4.929471015930176, -3.4796247482299805, -2.0297775268554688, -0.5799306631088257, 0.8699162006378174, 2.31976318359375, 3.7696099281311035, 5.219456672668457, 6.669303894042969, 8.119150161743164, 9.568997383117676, 11.018844604492188, 12.468690872192383, 13.918538093566895, 15.368385314941406, 16.8182315826416, 18.268077850341797, 19.717926025390625, 21.16777229309082, 22.617618560791016, 24.067466735839844, 25.51731300354004, 26.967159271240234, 28.417007446289062, 29.866853713989258, 31.316699981689453, 32.76654815673828, 34.21639633178711, 35.66624069213867, 37.1160888671875, 38.56593704223633, 40.01578140258789, 41.46562957763672, 42.91547393798828, 44.36532211303711]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 7.0, 10.0, 13.0, 6.0, 12.0, 19.0, 13.0, 17.0, 25.0, 31.0, 31.0, 18.0, 23.0, 34.0, 43.0, 39.0, 53.0, 43.0, 43.0, 35.0, 44.0, 44.0, 47.0, 42.0, 46.0, 42.0, 35.0, 26.0, 25.0, 23.0, 15.0, 18.0, 20.0, 13.0, 12.0, 15.0, 7.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-70.95011901855469, -68.76985931396484, -66.589599609375, -64.40933990478516, -62.22907638549805, -60.0488166809082, -57.868553161621094, -55.68829345703125, -53.508033752441406, -51.32777404785156, -49.14751434326172, -46.96725082397461, -44.786991119384766, -42.60673141479492, -40.42646789550781, -38.24620819091797, -36.065948486328125, -33.88568878173828, -31.705427169799805, -29.525165557861328, -27.344905853271484, -25.16464614868164, -22.984384536743164, -20.804122924804688, -18.623863220214844, -16.443603515625, -14.263341903686523, -12.083081245422363, -9.902820587158203, -7.722559928894043, -5.542299270629883, -3.3620386123657227, -1.1817779541015625, 0.9984827041625977, 3.178743362426758, 5.359004020690918, 7.539264678955078, 9.719525337219238, 11.899785995483398, 14.080046653747559, 16.26030731201172, 18.440567016601562, 20.62082862854004, 22.801090240478516, 24.98134994506836, 27.161609649658203, 29.34187126159668, 31.522132873535156, 33.702392578125, 35.882652282714844, 38.06291198730469, 40.2431755065918, 42.42343521118164, 44.603694915771484, 46.783958435058594, 48.96421813964844, 51.14447784423828, 53.324737548828125, 55.50499725341797, 57.68526077270508, 59.86552047729492, 62.045780181884766, 64.22604370117188, 66.40630340576172, 68.58656311035156]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 5.0, 14.0, 17.0, 21.0, 39.0, 57.0, 114.0, 137.0, 204.0, 292.0, 476.0, 714.0, 1046.0, 1743.0, 2764.0, 4618.0, 7315.0, 12310.0, 20500.0, 34400.0, 57772.0, 95747.0, 146888.0, 186497.0, 170670.0, 119811.0, 74035.0, 44246.0, 26155.0, 15422.0, 9221.0, 5735.0, 3443.0, 2279.0, 1306.0, 904.0, 559.0, 345.0, 231.0, 148.0, 117.0, 70.0, 46.0, 32.0, 26.0, 26.0, 13.0, 8.0, 10.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-7.0390625, -6.81005859375, -6.5810546875, -6.35205078125, -6.123046875, -5.89404296875, -5.6650390625, -5.43603515625, -5.20703125, -4.97802734375, -4.7490234375, -4.52001953125, -4.291015625, -4.06201171875, -3.8330078125, -3.60400390625, -3.375, -3.14599609375, -2.9169921875, -2.68798828125, -2.458984375, -2.22998046875, -2.0009765625, -1.77197265625, -1.54296875, -1.31396484375, -1.0849609375, -0.85595703125, -0.626953125, -0.39794921875, -0.1689453125, 0.06005859375, 0.2890625, 0.51806640625, 0.7470703125, 0.97607421875, 1.205078125, 1.43408203125, 1.6630859375, 1.89208984375, 2.12109375, 2.35009765625, 2.5791015625, 2.80810546875, 3.037109375, 3.26611328125, 3.4951171875, 3.72412109375, 3.953125, 4.18212890625, 4.4111328125, 4.64013671875, 4.869140625, 5.09814453125, 5.3271484375, 5.55615234375, 5.78515625, 6.01416015625, 6.2431640625, 6.47216796875, 6.701171875, 6.93017578125, 7.1591796875, 7.38818359375, 7.6171875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 7.0, 10.0, 14.0, 6.0, 13.0, 18.0, 13.0, 16.0, 28.0, 29.0, 33.0, 19.0, 22.0, 32.0, 46.0, 39.0, 54.0, 43.0, 42.0, 34.0, 48.0, 42.0, 46.0, 44.0, 43.0, 40.0, 36.0, 26.0, 23.0, 24.0, 14.0, 19.0, 19.0, 14.0, 11.0, 15.0, 7.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-70.4375, -68.2568359375, -66.076171875, -63.8955078125, -61.71484375, -59.5341796875, -57.353515625, -55.1728515625, -52.9921875, -50.8115234375, -48.630859375, -46.4501953125, -44.26953125, -42.0888671875, -39.908203125, -37.7275390625, -35.546875, -33.3662109375, -31.185546875, -29.0048828125, -26.82421875, -24.6435546875, -22.462890625, -20.2822265625, -18.1015625, -15.9208984375, -13.740234375, -11.5595703125, -9.37890625, -7.1982421875, -5.017578125, -2.8369140625, -0.65625, 1.5244140625, 3.705078125, 5.8857421875, 8.06640625, 10.2470703125, 12.427734375, 14.6083984375, 16.7890625, 18.9697265625, 21.150390625, 23.3310546875, 25.51171875, 27.6923828125, 29.873046875, 32.0537109375, 34.234375, 36.4150390625, 38.595703125, 40.7763671875, 42.95703125, 45.1376953125, 47.318359375, 49.4990234375, 51.6796875, 53.8603515625, 56.041015625, 58.2216796875, 60.40234375, 62.5830078125, 64.763671875, 66.9443359375, 69.125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 3.0, 7.0, 10.0, 4.0, 19.0, 20.0, 23.0, 49.0, 62.0, 116.0, 120.0, 176.0, 237.0, 357.0, 552.0, 841.0, 1284.0, 1972.0, 3243.0, 5204.0, 8793.0, 15882.0, 28766.0, 55930.0, 111197.0, 212504.0, 260990.0, 163093.0, 82012.0, 41869.0, 22180.0, 12312.0, 7062.0, 4092.0, 2604.0, 1704.0, 1067.0, 689.0, 483.0, 323.0, 206.0, 166.0, 116.0, 80.0, 40.0, 38.0, 26.0, 12.0, 12.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4453125, -7.1910400390625, -6.936767578125, -6.6824951171875, -6.42822265625, -6.1739501953125, -5.919677734375, -5.6654052734375, -5.4111328125, -5.1568603515625, -4.902587890625, -4.6483154296875, -4.39404296875, -4.1397705078125, -3.885498046875, -3.6312255859375, -3.376953125, -3.1226806640625, -2.868408203125, -2.6141357421875, -2.35986328125, -2.1055908203125, -1.851318359375, -1.5970458984375, -1.3427734375, -1.0885009765625, -0.834228515625, -0.5799560546875, -0.32568359375, -0.0714111328125, 0.182861328125, 0.4371337890625, 0.69140625, 0.9456787109375, 1.199951171875, 1.4542236328125, 1.70849609375, 1.9627685546875, 2.217041015625, 2.4713134765625, 2.7255859375, 2.9798583984375, 3.234130859375, 3.4884033203125, 3.74267578125, 3.9969482421875, 4.251220703125, 4.5054931640625, 4.759765625, 5.0140380859375, 5.268310546875, 5.5225830078125, 5.77685546875, 6.0311279296875, 6.285400390625, 6.5396728515625, 6.7939453125, 7.0482177734375, 7.302490234375, 7.5567626953125, 7.81103515625, 8.0653076171875, 8.319580078125, 8.5738525390625, 8.828125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 6.0, 7.0, 12.0, 8.0, 12.0, 17.0, 20.0, 14.0, 21.0, 29.0, 28.0, 33.0, 25.0, 28.0, 45.0, 35.0, 36.0, 45.0, 35.0, 43.0, 38.0, 37.0, 38.0, 49.0, 34.0, 30.0, 36.0, 34.0, 31.0, 33.0, 23.0, 17.0, 18.0, 18.0, 13.0, 12.0, 9.0, 9.0, 2.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.25, -45.87353515625, -44.4970703125, -43.12060546875, -41.744140625, -40.36767578125, -38.9912109375, -37.61474609375, -36.23828125, -34.86181640625, -33.4853515625, -32.10888671875, -30.732421875, -29.35595703125, -27.9794921875, -26.60302734375, -25.2265625, -23.85009765625, -22.4736328125, -21.09716796875, -19.720703125, -18.34423828125, -16.9677734375, -15.59130859375, -14.21484375, -12.83837890625, -11.4619140625, -10.08544921875, -8.708984375, -7.33251953125, -5.9560546875, -4.57958984375, -3.203125, -1.82666015625, -0.4501953125, 0.92626953125, 2.302734375, 3.67919921875, 5.0556640625, 6.43212890625, 7.80859375, 9.18505859375, 10.5615234375, 11.93798828125, 13.314453125, 14.69091796875, 16.0673828125, 17.44384765625, 18.8203125, 20.19677734375, 21.5732421875, 22.94970703125, 24.326171875, 25.70263671875, 27.0791015625, 28.45556640625, 29.83203125, 31.20849609375, 32.5849609375, 33.96142578125, 35.337890625, 36.71435546875, 38.0908203125, 39.46728515625, 40.84375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 5.0, 4.0, 6.0, 7.0, 17.0, 14.0, 14.0, 13.0, 20.0, 34.0, 54.0, 75.0, 86.0, 107.0, 158.0, 217.0, 304.0, 470.0, 776.0, 1167.0, 2074.0, 3855.0, 7460.0, 16000.0, 41213.0, 151159.0, 546750.0, 192258.0, 48170.0, 17917.0, 8195.0, 4114.0, 2209.0, 1265.0, 767.0, 478.0, 339.0, 217.0, 156.0, 100.0, 82.0, 56.0, 48.0, 35.0, 20.0, 31.0, 15.0, 8.0, 4.0, 5.0, 6.0, 5.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-6.23046875, -6.0391845703125, -5.847900390625, -5.6566162109375, -5.46533203125, -5.2740478515625, -5.082763671875, -4.8914794921875, -4.7001953125, -4.5089111328125, -4.317626953125, -4.1263427734375, -3.93505859375, -3.7437744140625, -3.552490234375, -3.3612060546875, -3.169921875, -2.9786376953125, -2.787353515625, -2.5960693359375, -2.40478515625, -2.2135009765625, -2.022216796875, -1.8309326171875, -1.6396484375, -1.4483642578125, -1.257080078125, -1.0657958984375, -0.87451171875, -0.6832275390625, -0.491943359375, -0.3006591796875, -0.109375, 0.0819091796875, 0.273193359375, 0.4644775390625, 0.65576171875, 0.8470458984375, 1.038330078125, 1.2296142578125, 1.4208984375, 1.6121826171875, 1.803466796875, 1.9947509765625, 2.18603515625, 2.3773193359375, 2.568603515625, 2.7598876953125, 2.951171875, 3.1424560546875, 3.333740234375, 3.5250244140625, 3.71630859375, 3.9075927734375, 4.098876953125, 4.2901611328125, 4.4814453125, 4.6727294921875, 4.864013671875, 5.0552978515625, 5.24658203125, 5.4378662109375, 5.629150390625, 5.8204345703125, 6.01171875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 0.0, 7.0, 6.0, 9.0, 11.0, 10.0, 27.0, 22.0, 20.0, 30.0, 33.0, 37.0, 56.0, 52.0, 56.0, 49.0, 59.0, 55.0, 52.0, 59.0, 62.0, 35.0, 50.0, 29.0, 34.0, 30.0, 17.0, 20.0, 20.0, 17.0, 7.0, 7.0, 3.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00030040740966796875, -0.00029208511114120483, -0.0002837628126144409, -0.000275440514087677, -0.0002671182155609131, -0.00025879591703414917, -0.00025047361850738525, -0.00024215131998062134, -0.00023382902145385742, -0.0002255067229270935, -0.0002171844244003296, -0.00020886212587356567, -0.00020053982734680176, -0.00019221752882003784, -0.00018389523029327393, -0.00017557293176651, -0.0001672506332397461, -0.00015892833471298218, -0.00015060603618621826, -0.00014228373765945435, -0.00013396143913269043, -0.00012563914060592651, -0.0001173168420791626, -0.00010899454355239868, -0.00010067224502563477, -9.234994649887085e-05, -8.402764797210693e-05, -7.570534944534302e-05, -6.73830509185791e-05, -5.9060752391815186e-05, -5.073845386505127e-05, -4.2416155338287354e-05, -3.409385681152344e-05, -2.577155828475952e-05, -1.7449259757995605e-05, -9.12696123123169e-06, -8.046627044677734e-07, 7.517635822296143e-06, 1.583993434906006e-05, 2.4162232875823975e-05, 3.248453140258789e-05, 4.080682992935181e-05, 4.912912845611572e-05, 5.745142698287964e-05, 6.577372550964355e-05, 7.409602403640747e-05, 8.241832256317139e-05, 9.07406210899353e-05, 9.906291961669922e-05, 0.00010738521814346313, 0.00011570751667022705, 0.00012402981519699097, 0.00013235211372375488, 0.0001406744122505188, 0.00014899671077728271, 0.00015731900930404663, 0.00016564130783081055, 0.00017396360635757446, 0.00018228590488433838, 0.0001906082034111023, 0.0001989305019378662, 0.00020725280046463013, 0.00021557509899139404, 0.00022389739751815796, 0.00023221969604492188]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 5.0, 4.0, 2.0, 7.0, 9.0, 13.0, 22.0, 35.0, 57.0, 73.0, 115.0, 155.0, 258.0, 391.0, 701.0, 1183.0, 2055.0, 3653.0, 6616.0, 12552.0, 24627.0, 49818.0, 103853.0, 202824.0, 269308.0, 185070.0, 92657.0, 44700.0, 22396.0, 11353.0, 6144.0, 3327.0, 1812.0, 1090.0, 621.0, 364.0, 235.0, 166.0, 94.0, 52.0, 47.0, 27.0, 13.0, 18.0, 12.0, 6.0, 8.0, 2.0, 7.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.703125, -4.53765869140625, -4.3721923828125, -4.20672607421875, -4.041259765625, -3.87579345703125, -3.7103271484375, -3.54486083984375, -3.37939453125, -3.21392822265625, -3.0484619140625, -2.88299560546875, -2.717529296875, -2.55206298828125, -2.3865966796875, -2.22113037109375, -2.0556640625, -1.89019775390625, -1.7247314453125, -1.55926513671875, -1.393798828125, -1.22833251953125, -1.0628662109375, -0.89739990234375, -0.73193359375, -0.56646728515625, -0.4010009765625, -0.23553466796875, -0.070068359375, 0.09539794921875, 0.2608642578125, 0.42633056640625, 0.591796875, 0.75726318359375, 0.9227294921875, 1.08819580078125, 1.253662109375, 1.41912841796875, 1.5845947265625, 1.75006103515625, 1.91552734375, 2.08099365234375, 2.2464599609375, 2.41192626953125, 2.577392578125, 2.74285888671875, 2.9083251953125, 3.07379150390625, 3.2392578125, 3.40472412109375, 3.5701904296875, 3.73565673828125, 3.901123046875, 4.06658935546875, 4.2320556640625, 4.39752197265625, 4.56298828125, 4.72845458984375, 4.8939208984375, 5.05938720703125, 5.224853515625, 5.39031982421875, 5.5557861328125, 5.72125244140625, 5.88671875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 9.0, 2.0, 6.0, 8.0, 12.0, 29.0, 34.0, 42.0, 54.0, 70.0, 76.0, 82.0, 93.0, 79.0, 87.0, 75.0, 50.0, 41.0, 32.0, 26.0, 26.0, 16.0, 7.0, 15.0, 6.0, 5.0, 4.0, 2.0, 4.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.728515625, -3.588531494140625, -3.44854736328125, -3.308563232421875, -3.1685791015625, -3.028594970703125, -2.88861083984375, -2.748626708984375, -2.608642578125, -2.468658447265625, -2.32867431640625, -2.188690185546875, -2.0487060546875, -1.908721923828125, -1.76873779296875, -1.628753662109375, -1.48876953125, -1.348785400390625, -1.20880126953125, -1.068817138671875, -0.9288330078125, -0.788848876953125, -0.64886474609375, -0.508880615234375, -0.368896484375, -0.228912353515625, -0.08892822265625, 0.051055908203125, 0.1910400390625, 0.331024169921875, 0.47100830078125, 0.610992431640625, 0.7509765625, 0.890960693359375, 1.03094482421875, 1.170928955078125, 1.3109130859375, 1.450897216796875, 1.59088134765625, 1.730865478515625, 1.870849609375, 2.010833740234375, 2.15081787109375, 2.290802001953125, 2.4307861328125, 2.570770263671875, 2.71075439453125, 2.850738525390625, 2.99072265625, 3.130706787109375, 3.27069091796875, 3.410675048828125, 3.5506591796875, 3.690643310546875, 3.83062744140625, 3.970611572265625, 4.110595703125, 4.250579833984375, 4.39056396484375, 4.530548095703125, 4.6705322265625, 4.810516357421875, 4.95050048828125, 5.090484619140625, 5.23046875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 1.0, 6.0, 9.0, 5.0, 13.0, 15.0, 15.0, 13.0, 21.0, 27.0, 28.0, 22.0, 34.0, 44.0, 39.0, 37.0, 43.0, 41.0, 36.0, 39.0, 48.0, 42.0, 47.0, 44.0, 47.0, 35.0, 34.0, 23.0, 28.0, 31.0, 23.0, 26.0, 11.0, 14.0, 18.0, 7.0, 10.0, 8.0, 8.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.803672790527344, -47.32434844970703, -45.84502410888672, -44.365699768066406, -42.886375427246094, -41.40705490112305, -39.927730560302734, -38.44840621948242, -36.96908187866211, -35.4897575378418, -34.010433197021484, -32.53110885620117, -31.051786422729492, -29.57246208190918, -28.0931396484375, -26.613815307617188, -25.134490966796875, -23.655166625976562, -22.17584228515625, -20.69651985168457, -19.217195510864258, -17.737871170043945, -16.258548736572266, -14.779224395751953, -13.29990005493164, -11.820575714111328, -10.341252326965332, -8.861928939819336, -7.382604598999023, -5.903280735015869, -4.423956871032715, -2.9446334838867188, -1.4653053283691406, 0.014018535614013672, 1.493342399597168, 2.9726662635803223, 4.451990127563477, 5.931313991546631, 7.410637855529785, 8.889961242675781, 10.369285583496094, 11.848609924316406, 13.327933311462402, 14.807256698608398, 16.28658103942871, 17.765905380249023, 19.245227813720703, 20.724552154541016, 22.203876495361328, 23.68320083618164, 25.162525177001953, 26.641847610473633, 28.121171951293945, 29.600496292114258, 31.079818725585938, 32.55914306640625, 34.03846740722656, 35.517791748046875, 36.99711608886719, 38.4764404296875, 39.95576477050781, 41.43508529663086, 42.91440963745117, 44.393733978271484, 45.8730583190918]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 6.0, 6.0, 10.0, 10.0, 11.0, 14.0, 12.0, 20.0, 19.0, 25.0, 27.0, 28.0, 28.0, 21.0, 36.0, 42.0, 41.0, 52.0, 47.0, 35.0, 38.0, 49.0, 43.0, 41.0, 53.0, 38.0, 40.0, 36.0, 24.0, 21.0, 25.0, 15.0, 19.0, 17.0, 14.0, 12.0, 13.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-70.67494201660156, -68.4756088256836, -66.27627563476562, -64.07693481445312, -61.877601623535156, -59.67826843261719, -57.47893524169922, -55.279598236083984, -53.08026123046875, -50.88092803955078, -48.68159103393555, -46.48225784301758, -44.282920837402344, -42.083587646484375, -39.884254455566406, -37.68491744995117, -35.4855842590332, -33.286251068115234, -31.0869140625, -28.88758087158203, -26.688243865966797, -24.488910675048828, -22.289575576782227, -20.090240478515625, -17.890905380249023, -15.691570281982422, -13.49223518371582, -11.292901039123535, -9.093565940856934, -6.894230842590332, -4.694896697998047, -2.4955615997314453, -0.29622650146484375, 1.9031083583831787, 4.102443218231201, 6.3017778396606445, 8.501112937927246, 10.700448036193848, 12.899782180786133, 15.099117279052734, 17.298452377319336, 19.497787475585938, 21.69712257385254, 23.89645767211914, 26.09579086303711, 28.295127868652344, 30.494461059570312, 32.69379425048828, 34.893131256103516, 37.092464447021484, 39.29180145263672, 41.49113464355469, 43.69047164916992, 45.88980484008789, 48.089141845703125, 50.288475036621094, 52.48780822753906, 54.68714141845703, 56.886478424072266, 59.085811614990234, 61.28514862060547, 63.48448181152344, 65.6838150024414, 67.88314819335938, 70.08248901367188]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 5.0, 8.0, 16.0, 16.0, 20.0, 40.0, 49.0, 91.0, 130.0, 197.0, 284.0, 497.0, 730.0, 1136.0, 1888.0, 3085.0, 4863.0, 8065.0, 13501.0, 21709.0, 34146.0, 50712.0, 71553.0, 93629.0, 112269.0, 122030.0, 120105.0, 108332.0, 87928.0, 65625.0, 45958.0, 30236.0, 19388.0, 11837.0, 7146.0, 4371.0, 2505.0, 1606.0, 1002.0, 656.0, 428.0, 259.0, 178.0, 128.0, 74.0, 49.0, 32.0, 20.0, 11.0, 11.0, 4.0, 2.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-30.859375, -29.859619140625, -28.85986328125, -27.860107421875, -26.8603515625, -25.860595703125, -24.86083984375, -23.861083984375, -22.861328125, -21.861572265625, -20.86181640625, -19.862060546875, -18.8623046875, -17.862548828125, -16.86279296875, -15.863037109375, -14.86328125, -13.863525390625, -12.86376953125, -11.864013671875, -10.8642578125, -9.864501953125, -8.86474609375, -7.864990234375, -6.865234375, -5.865478515625, -4.86572265625, -3.865966796875, -2.8662109375, -1.866455078125, -0.86669921875, 0.133056640625, 1.1328125, 2.132568359375, 3.13232421875, 4.132080078125, 5.1318359375, 6.131591796875, 7.13134765625, 8.131103515625, 9.130859375, 10.130615234375, 11.13037109375, 12.130126953125, 13.1298828125, 14.129638671875, 15.12939453125, 16.129150390625, 17.12890625, 18.128662109375, 19.12841796875, 20.128173828125, 21.1279296875, 22.127685546875, 23.12744140625, 24.127197265625, 25.126953125, 26.126708984375, 27.12646484375, 28.126220703125, 29.1259765625, 30.125732421875, 31.12548828125, 32.125244140625, 33.125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 6.0, 10.0, 10.0, 12.0, 13.0, 13.0, 20.0, 19.0, 27.0, 28.0, 28.0, 25.0, 21.0, 39.0, 43.0, 38.0, 52.0, 50.0, 32.0, 40.0, 48.0, 43.0, 43.0, 49.0, 41.0, 39.0, 34.0, 23.0, 22.0, 24.0, 15.0, 19.0, 17.0, 14.0, 13.0, 14.0, 7.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-70.6875, -68.4833984375, -66.279296875, -64.0751953125, -61.87109375, -59.6669921875, -57.462890625, -55.2587890625, -53.0546875, -50.8505859375, -48.646484375, -46.4423828125, -44.23828125, -42.0341796875, -39.830078125, -37.6259765625, -35.421875, -33.2177734375, -31.013671875, -28.8095703125, -26.60546875, -24.4013671875, -22.197265625, -19.9931640625, -17.7890625, -15.5849609375, -13.380859375, -11.1767578125, -8.97265625, -6.7685546875, -4.564453125, -2.3603515625, -0.15625, 2.0478515625, 4.251953125, 6.4560546875, 8.66015625, 10.8642578125, 13.068359375, 15.2724609375, 17.4765625, 19.6806640625, 21.884765625, 24.0888671875, 26.29296875, 28.4970703125, 30.701171875, 32.9052734375, 35.109375, 37.3134765625, 39.517578125, 41.7216796875, 43.92578125, 46.1298828125, 48.333984375, 50.5380859375, 52.7421875, 54.9462890625, 57.150390625, 59.3544921875, 61.55859375, 63.7626953125, 65.966796875, 68.1708984375, 70.375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 0.0, 4.0, 4.0, 9.0, 11.0, 16.0, 21.0, 25.0, 54.0, 73.0, 99.0, 179.0, 213.0, 352.0, 556.0, 793.0, 1156.0, 1863.0, 2829.0, 4385.0, 7093.0, 11146.0, 17543.0, 28177.0, 43004.0, 63614.0, 87667.0, 111343.0, 127940.0, 128908.0, 116314.0, 93076.0, 68116.0, 47300.0, 30673.0, 19581.0, 12445.0, 7906.0, 4945.0, 3067.0, 2092.0, 1296.0, 880.0, 623.0, 404.0, 260.0, 154.0, 132.0, 68.0, 48.0, 31.0, 23.0, 17.0, 14.0, 10.0, 5.0, 2.0, 4.0, 2.0, 5.0], "bins": [-42.84375, -41.5498046875, -40.255859375, -38.9619140625, -37.66796875, -36.3740234375, -35.080078125, -33.7861328125, -32.4921875, -31.1982421875, -29.904296875, -28.6103515625, -27.31640625, -26.0224609375, -24.728515625, -23.4345703125, -22.140625, -20.8466796875, -19.552734375, -18.2587890625, -16.96484375, -15.6708984375, -14.376953125, -13.0830078125, -11.7890625, -10.4951171875, -9.201171875, -7.9072265625, -6.61328125, -5.3193359375, -4.025390625, -2.7314453125, -1.4375, -0.1435546875, 1.150390625, 2.4443359375, 3.73828125, 5.0322265625, 6.326171875, 7.6201171875, 8.9140625, 10.2080078125, 11.501953125, 12.7958984375, 14.08984375, 15.3837890625, 16.677734375, 17.9716796875, 19.265625, 20.5595703125, 21.853515625, 23.1474609375, 24.44140625, 25.7353515625, 27.029296875, 28.3232421875, 29.6171875, 30.9111328125, 32.205078125, 33.4990234375, 34.79296875, 36.0869140625, 37.380859375, 38.6748046875, 39.96875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 4.0, 6.0, 3.0, 6.0, 5.0, 8.0, 14.0, 14.0, 12.0, 14.0, 16.0, 16.0, 23.0, 17.0, 35.0, 29.0, 32.0, 29.0, 27.0, 28.0, 33.0, 40.0, 38.0, 49.0, 38.0, 38.0, 34.0, 43.0, 31.0, 26.0, 42.0, 32.0, 35.0, 21.0, 22.0, 17.0, 15.0, 17.0, 12.0, 15.0, 12.0, 13.0, 8.0, 6.0, 7.0, 4.0, 2.0, 5.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-39.6875, -38.4208984375, -37.154296875, -35.8876953125, -34.62109375, -33.3544921875, -32.087890625, -30.8212890625, -29.5546875, -28.2880859375, -27.021484375, -25.7548828125, -24.48828125, -23.2216796875, -21.955078125, -20.6884765625, -19.421875, -18.1552734375, -16.888671875, -15.6220703125, -14.35546875, -13.0888671875, -11.822265625, -10.5556640625, -9.2890625, -8.0224609375, -6.755859375, -5.4892578125, -4.22265625, -2.9560546875, -1.689453125, -0.4228515625, 0.84375, 2.1103515625, 3.376953125, 4.6435546875, 5.91015625, 7.1767578125, 8.443359375, 9.7099609375, 10.9765625, 12.2431640625, 13.509765625, 14.7763671875, 16.04296875, 17.3095703125, 18.576171875, 19.8427734375, 21.109375, 22.3759765625, 23.642578125, 24.9091796875, 26.17578125, 27.4423828125, 28.708984375, 29.9755859375, 31.2421875, 32.5087890625, 33.775390625, 35.0419921875, 36.30859375, 37.5751953125, 38.841796875, 40.1083984375, 41.375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 4.0, 2.0, 4.0, 4.0, 2.0, 6.0, 14.0, 12.0, 19.0, 25.0, 43.0, 66.0, 86.0, 125.0, 187.0, 241.0, 376.0, 572.0, 859.0, 1358.0, 2135.0, 3600.0, 6005.0, 10056.0, 16664.0, 26851.0, 41991.0, 60955.0, 83831.0, 105127.0, 119271.0, 124373.0, 116012.0, 98603.0, 76939.0, 54939.0, 36828.0, 23474.0, 14546.0, 8817.0, 5142.0, 3066.0, 1900.0, 1147.0, 745.0, 449.0, 356.0, 205.0, 137.0, 123.0, 66.0, 64.0, 46.0, 26.0, 20.0, 15.0, 14.0, 11.0, 7.0, 1.0, 2.0, 3.0, 5.0], "bins": [-13.9921875, -13.5596923828125, -13.127197265625, -12.6947021484375, -12.26220703125, -11.8297119140625, -11.397216796875, -10.9647216796875, -10.5322265625, -10.0997314453125, -9.667236328125, -9.2347412109375, -8.80224609375, -8.3697509765625, -7.937255859375, -7.5047607421875, -7.072265625, -6.6397705078125, -6.207275390625, -5.7747802734375, -5.34228515625, -4.9097900390625, -4.477294921875, -4.0447998046875, -3.6123046875, -3.1798095703125, -2.747314453125, -2.3148193359375, -1.88232421875, -1.4498291015625, -1.017333984375, -0.5848388671875, -0.15234375, 0.2801513671875, 0.712646484375, 1.1451416015625, 1.57763671875, 2.0101318359375, 2.442626953125, 2.8751220703125, 3.3076171875, 3.7401123046875, 4.172607421875, 4.6051025390625, 5.03759765625, 5.4700927734375, 5.902587890625, 6.3350830078125, 6.767578125, 7.2000732421875, 7.632568359375, 8.0650634765625, 8.49755859375, 8.9300537109375, 9.362548828125, 9.7950439453125, 10.2275390625, 10.6600341796875, 11.092529296875, 11.5250244140625, 11.95751953125, 12.3900146484375, 12.822509765625, 13.2550048828125, 13.6875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 6.0, 8.0, 16.0, 16.0, 22.0, 27.0, 39.0, 62.0, 54.0, 44.0, 82.0, 71.0, 72.0, 80.0, 69.0, 58.0, 60.0, 53.0, 47.0, 24.0, 22.0, 16.0, 14.0, 8.0, 8.0, 4.0, 7.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002086639404296875, -0.002007126808166504, -0.0019276142120361328, -0.0018481016159057617, -0.0017685890197753906, -0.0016890764236450195, -0.0016095638275146484, -0.0015300512313842773, -0.0014505386352539062, -0.0013710260391235352, -0.001291513442993164, -0.001212000846862793, -0.0011324882507324219, -0.0010529756546020508, -0.0009734630584716797, -0.0008939504623413086, -0.0008144378662109375, -0.0007349252700805664, -0.0006554126739501953, -0.0005759000778198242, -0.0004963874816894531, -0.00041687488555908203, -0.00033736228942871094, -0.00025784969329833984, -0.00017833709716796875, -9.882450103759766e-05, -1.9311904907226562e-05, 6.020069122314453e-05, 0.00013971328735351562, 0.00021922588348388672, 0.0002987384796142578, 0.0003782510757446289, 0.000457763671875, 0.0005372762680053711, 0.0006167888641357422, 0.0006963014602661133, 0.0007758140563964844, 0.0008553266525268555, 0.0009348392486572266, 0.0010143518447875977, 0.0010938644409179688, 0.0011733770370483398, 0.001252889633178711, 0.001332402229309082, 0.0014119148254394531, 0.0014914274215698242, 0.0015709400177001953, 0.0016504526138305664, 0.0017299652099609375, 0.0018094778060913086, 0.0018889904022216797, 0.0019685029983520508, 0.002048015594482422, 0.002127528190612793, 0.002207040786743164, 0.002286553382873535, 0.0023660659790039062, 0.0024455785751342773, 0.0025250911712646484, 0.0026046037673950195, 0.0026841163635253906, 0.0027636289596557617, 0.002843141555786133, 0.002922654151916504, 0.003002166748046875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 11.0, 4.0, 30.0, 41.0, 50.0, 75.0, 102.0, 205.0, 256.0, 409.0, 675.0, 1089.0, 1650.0, 2726.0, 4366.0, 7042.0, 11203.0, 17398.0, 26621.0, 38833.0, 54257.0, 71909.0, 89236.0, 102736.0, 109649.0, 108408.0, 99458.0, 84364.0, 66537.0, 49547.0, 34796.0, 23595.0, 15420.0, 9698.0, 6185.0, 3768.0, 2314.0, 1415.0, 882.0, 570.0, 394.0, 214.0, 164.0, 94.0, 58.0, 47.0, 23.0, 10.0, 5.0, 9.0, 6.0, 2.0, 2.0, 3.0], "bins": [-14.234375, -13.825927734375, -13.41748046875, -13.009033203125, -12.6005859375, -12.192138671875, -11.78369140625, -11.375244140625, -10.966796875, -10.558349609375, -10.14990234375, -9.741455078125, -9.3330078125, -8.924560546875, -8.51611328125, -8.107666015625, -7.69921875, -7.290771484375, -6.88232421875, -6.473876953125, -6.0654296875, -5.656982421875, -5.24853515625, -4.840087890625, -4.431640625, -4.023193359375, -3.61474609375, -3.206298828125, -2.7978515625, -2.389404296875, -1.98095703125, -1.572509765625, -1.1640625, -0.755615234375, -0.34716796875, 0.061279296875, 0.4697265625, 0.878173828125, 1.28662109375, 1.695068359375, 2.103515625, 2.511962890625, 2.92041015625, 3.328857421875, 3.7373046875, 4.145751953125, 4.55419921875, 4.962646484375, 5.37109375, 5.779541015625, 6.18798828125, 6.596435546875, 7.0048828125, 7.413330078125, 7.82177734375, 8.230224609375, 8.638671875, 9.047119140625, 9.45556640625, 9.864013671875, 10.2724609375, 10.680908203125, 11.08935546875, 11.497802734375, 11.90625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 5.0, 4.0, 9.0, 6.0, 8.0, 12.0, 11.0, 14.0, 15.0, 20.0, 17.0, 17.0, 25.0, 37.0, 34.0, 25.0, 42.0, 28.0, 31.0, 36.0, 37.0, 53.0, 39.0, 52.0, 44.0, 45.0, 41.0, 36.0, 39.0, 26.0, 34.0, 21.0, 12.0, 18.0, 21.0, 19.0, 10.0, 14.0, 14.0, 7.0, 8.0, 4.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 3.0], "bins": [-7.53125, -7.32574462890625, -7.1202392578125, -6.91473388671875, -6.709228515625, -6.50372314453125, -6.2982177734375, -6.09271240234375, -5.88720703125, -5.68170166015625, -5.4761962890625, -5.27069091796875, -5.065185546875, -4.85968017578125, -4.6541748046875, -4.44866943359375, -4.2431640625, -4.03765869140625, -3.8321533203125, -3.62664794921875, -3.421142578125, -3.21563720703125, -3.0101318359375, -2.80462646484375, -2.59912109375, -2.39361572265625, -2.1881103515625, -1.98260498046875, -1.777099609375, -1.57159423828125, -1.3660888671875, -1.16058349609375, -0.955078125, -0.74957275390625, -0.5440673828125, -0.33856201171875, -0.133056640625, 0.07244873046875, 0.2779541015625, 0.48345947265625, 0.68896484375, 0.89447021484375, 1.0999755859375, 1.30548095703125, 1.510986328125, 1.71649169921875, 1.9219970703125, 2.12750244140625, 2.3330078125, 2.53851318359375, 2.7440185546875, 2.94952392578125, 3.155029296875, 3.36053466796875, 3.5660400390625, 3.77154541015625, 3.97705078125, 4.18255615234375, 4.3880615234375, 4.59356689453125, 4.799072265625, 5.00457763671875, 5.2100830078125, 5.41558837890625, 5.62109375]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 4.0, 7.0, 11.0, 7.0, 14.0, 10.0, 19.0, 21.0, 18.0, 26.0, 27.0, 29.0, 38.0, 27.0, 30.0, 32.0, 37.0, 33.0, 45.0, 55.0, 33.0, 48.0, 44.0, 47.0, 36.0, 39.0, 32.0, 29.0, 29.0, 29.0, 23.0, 20.0, 25.0, 18.0, 14.0, 11.0, 11.0, 8.0, 3.0, 7.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-48.345523834228516, -46.852291107177734, -45.35906219482422, -43.86582946777344, -42.372596740722656, -40.879364013671875, -39.386131286621094, -37.89290237426758, -36.3996696472168, -34.906436920166016, -33.4132080078125, -31.91997528076172, -30.426742553710938, -28.933509826660156, -27.440279006958008, -25.94704818725586, -24.453815460205078, -22.960582733154297, -21.46735191345215, -19.97412109375, -18.48088836669922, -16.987655639648438, -15.494424819946289, -14.001193046569824, -12.50796127319336, -11.014729499816895, -9.52149772644043, -8.028265953063965, -6.5350341796875, -5.041802406311035, -3.5485706329345703, -2.0553388595581055, -0.562103271484375, 0.9311285018920898, 2.4243602752685547, 3.9175920486450195, 5.410823822021484, 6.904055595397949, 8.397287368774414, 9.890519142150879, 11.383750915527344, 12.876982688903809, 14.370214462280273, 15.863446235656738, 17.356678009033203, 18.849910736083984, 20.343141555786133, 21.83637237548828, 23.329605102539062, 24.822837829589844, 26.316068649291992, 27.80929946899414, 29.302532196044922, 30.795764923095703, 32.28899383544922, 33.7822265625, 35.27545928955078, 36.76869201660156, 38.261924743652344, 39.75515365600586, 41.24838638305664, 42.74161911010742, 44.23484802246094, 45.72808074951172, 47.2213134765625]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 3.0, 6.0, 7.0, 12.0, 2.0, 14.0, 24.0, 16.0, 17.0, 28.0, 26.0, 29.0, 36.0, 29.0, 35.0, 28.0, 32.0, 28.0, 36.0, 45.0, 45.0, 43.0, 53.0, 47.0, 37.0, 44.0, 42.0, 44.0, 17.0, 21.0, 27.0, 16.0, 30.0, 12.0, 15.0, 10.0, 15.0, 7.0, 9.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.1419677734375, -71.64351654052734, -69.14507293701172, -66.64662170410156, -64.14817810058594, -61.64972686767578, -59.151275634765625, -56.652828216552734, -54.154380798339844, -51.65593338012695, -49.15748596191406, -46.659034729003906, -44.160587310791016, -41.662139892578125, -39.16368865966797, -36.66524124145508, -34.16679382324219, -31.668346405029297, -29.169897079467773, -26.67144775390625, -24.17300033569336, -21.67455291748047, -19.176103591918945, -16.677654266357422, -14.179206848144531, -11.680758476257324, -9.182310104370117, -6.68386173248291, -4.185413360595703, -1.686964988708496, 0.8114833831787109, 3.3099327087402344, 5.808387756347656, 8.306836128234863, 10.80528450012207, 13.303732872009277, 15.802181243896484, 18.300628662109375, 20.7990779876709, 23.297527313232422, 25.795974731445312, 28.294422149658203, 30.792871475219727, 33.29132080078125, 35.78976821899414, 38.28821563720703, 40.78666687011719, 43.28511428833008, 45.78356170654297, 48.28200912475586, 50.78045654296875, 53.278907775878906, 55.7773551940918, 58.27580261230469, 60.774253845214844, 63.272701263427734, 65.77114868164062, 68.26959991455078, 70.7680435180664, 73.26649475097656, 75.76493835449219, 78.26338958740234, 80.7618408203125, 83.26028442382812, 85.75873565673828]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 7.0, 13.0, 24.0, 34.0, 50.0, 66.0, 90.0, 133.0, 144.0, 192.0, 283.0, 382.0, 458.0, 573.0, 764.0, 894.0, 1182.0, 1383.0, 1657.0, 2026.0, 2361.0, 2685.0, 2842.0, 1012617.0, 2862.0, 2712.0, 2525.0, 2190.0, 1866.0, 1530.0, 1313.0, 1070.0, 828.0, 684.0, 525.0, 416.0, 304.0, 245.0, 183.0, 134.0, 121.0, 85.0, 37.0, 43.0, 29.0, 21.0, 5.0, 4.0, 5.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-383.05731201171875, -370.6102294921875, -358.1631164550781, -345.7160339355469, -333.2689514160156, -320.82183837890625, -308.374755859375, -295.92767333984375, -283.4805908203125, -271.03350830078125, -258.5863952636719, -246.13931274414062, -233.69223022460938, -221.24513244628906, -208.79803466796875, -196.3509521484375, -183.90383911132812, -171.4567413330078, -159.00965881347656, -146.56256103515625, -134.115478515625, -121.66838073730469, -109.22128295898438, -96.7741928100586, -84.32710266113281, -71.88001251220703, -59.432918548583984, -46.98582458496094, -34.538734436035156, -22.091644287109375, -9.644546508789062, 2.8025436401367188, 15.249664306640625, 27.69675636291504, 40.14384841918945, 52.5909423828125, 65.03803253173828, 77.48512268066406, 89.93222045898438, 102.37931060791016, 114.82640075683594, 127.27349090576172, 139.7205810546875, 152.1676788330078, 164.61477661132812, 177.06185913085938, 189.5089569091797, 201.9560546875, 214.40313720703125, 226.85023498535156, 239.2973175048828, 251.74441528320312, 264.1914978027344, 276.63861083984375, 289.085693359375, 301.53277587890625, 313.9798583984375, 326.42694091796875, 338.8740539550781, 351.3211364746094, 363.7682189941406, 376.21533203125, 388.66241455078125, 401.1094970703125, 413.5566101074219]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 7.0, 7.0, 15.0, 14.0, 35.0, 32.0, 60.0, 105.0, 145.0, 185.0, 305.0, 450.0, 714.0, 1159.0, 1766.0, 2625.0, 4143.0, 5789.0, 8404.0, 11582.0, 15100.0, 19685.0, 36771.0, 51253180.0, 36742.0, 19663.0, 15029.0, 11387.0, 8496.0, 5920.0, 4035.0, 2669.0, 1809.0, 1150.0, 696.0, 474.0, 328.0, 207.0, 154.0, 94.0, 61.0, 39.0, 34.0, 16.0, 14.0, 10.0, 13.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-333.5635681152344, -322.2576904296875, -310.9517822265625, -299.6459045410156, -288.34002685546875, -277.03411865234375, -265.7282409667969, -254.42234802246094, -243.116455078125, -231.81056213378906, -220.50466918945312, -209.19879150390625, -197.8928985595703, -186.58700561523438, -175.2811279296875, -163.97523498535156, -152.66934204101562, -141.3634490966797, -130.05755615234375, -118.75167846679688, -107.44578552246094, -96.139892578125, -84.8340072631836, -73.52812194824219, -62.22222900390625, -50.91633987426758, -39.610450744628906, -28.304561614990234, -16.998672485351562, -5.692783355712891, 5.613105773925781, 16.918991088867188, 28.22491455078125, 39.53080368041992, 50.836692810058594, 62.142581939697266, 73.44847106933594, 84.75436401367188, 96.06024932861328, 107.36613464355469, 118.67202758789062, 129.97792053222656, 141.2838134765625, 152.58969116210938, 163.8955841064453, 175.20147705078125, 186.50735473632812, 197.81324768066406, 209.119140625, 220.42503356933594, 231.73092651367188, 243.03680419921875, 254.3426971435547, 265.6485900878906, 276.9544677734375, 288.2603759765625, 299.5662536621094, 310.87213134765625, 322.17803955078125, 333.4839172363281, 344.789794921875, 356.095703125, 367.4015808105469, 378.70745849609375, 390.01336669921875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 8.0, 11.0, 14.0, 22.0, 19.0, 28.0, 49.0, 87.0, 103.0, 155.0, 242.0, 353.0, 535.0, 920.0, 1449.0, 2496.0, 4385.0, 8368.0, 16250.0, 35721.0, 92784.0, 289902.0, 1204557.0, 3701703.0, 635767.0, 180877.0, 61994.0, 25565.0, 12017.0, 6285.0, 3504.0, 1949.0, 1160.0, 748.0, 491.0, 295.0, 209.0, 123.0, 92.0, 62.0, 36.0, 24.0, 30.0, 11.0, 10.0, 9.0, 3.0, 7.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-39.8125, -38.580078125, -37.34765625, -36.115234375, -34.8828125, -33.650390625, -32.41796875, -31.185546875, -29.953125, -28.720703125, -27.48828125, -26.255859375, -25.0234375, -23.791015625, -22.55859375, -21.326171875, -20.09375, -18.861328125, -17.62890625, -16.396484375, -15.1640625, -13.931640625, -12.69921875, -11.466796875, -10.234375, -9.001953125, -7.76953125, -6.537109375, -5.3046875, -4.072265625, -2.83984375, -1.607421875, -0.375, 0.857421875, 2.08984375, 3.322265625, 4.5546875, 5.787109375, 7.01953125, 8.251953125, 9.484375, 10.716796875, 11.94921875, 13.181640625, 14.4140625, 15.646484375, 16.87890625, 18.111328125, 19.34375, 20.576171875, 21.80859375, 23.041015625, 24.2734375, 25.505859375, 26.73828125, 27.970703125, 29.203125, 30.435546875, 31.66796875, 32.900390625, 34.1328125, 35.365234375, 36.59765625, 37.830078125, 39.0625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 6.0, 6.0, 5.0, 10.0, 14.0, 16.0, 23.0, 26.0, 37.0, 39.0, 68.0, 60.0, 66.0, 78.0, 612.0, 472.0, 80.0, 69.0, 55.0, 50.0, 46.0, 34.0, 34.0, 21.0, 15.0, 17.0, 13.0, 8.0, 8.0, 9.0, 2.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-93.75, -91.068359375, -88.38671875, -85.705078125, -83.0234375, -80.341796875, -77.66015625, -74.978515625, -72.296875, -69.615234375, -66.93359375, -64.251953125, -61.5703125, -58.888671875, -56.20703125, -53.525390625, -50.84375, -48.162109375, -45.48046875, -42.798828125, -40.1171875, -37.435546875, -34.75390625, -32.072265625, -29.390625, -26.708984375, -24.02734375, -21.345703125, -18.6640625, -15.982421875, -13.30078125, -10.619140625, -7.9375, -5.255859375, -2.57421875, 0.107421875, 2.7890625, 5.470703125, 8.15234375, 10.833984375, 13.515625, 16.197265625, 18.87890625, 21.560546875, 24.2421875, 26.923828125, 29.60546875, 32.287109375, 34.96875, 37.650390625, 40.33203125, 43.013671875, 45.6953125, 48.376953125, 51.05859375, 53.740234375, 56.421875, 59.103515625, 61.78515625, 64.466796875, 67.1484375, 69.830078125, 72.51171875, 75.193359375, 77.875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 4.0, 5.0, 9.0, 8.0, 19.0, 24.0, 53.0, 65.0, 104.0, 130.0, 192.0, 336.0, 466.0, 769.0, 1339.0, 2063.0, 3737.0, 6942.0, 13165.0, 26697.0, 58628.0, 143882.0, 396445.0, 1993532.0, 2911891.0, 448618.0, 158882.0, 63561.0, 28643.0, 13990.0, 7324.0, 4066.0, 2286.0, 1374.0, 800.0, 452.0, 345.0, 188.0, 134.0, 97.0, 58.0, 37.0, 24.0, 17.0, 11.0, 8.0, 1.0, 2.0, 9.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-29.65625, -28.73095703125, -27.8056640625, -26.88037109375, -25.955078125, -25.02978515625, -24.1044921875, -23.17919921875, -22.25390625, -21.32861328125, -20.4033203125, -19.47802734375, -18.552734375, -17.62744140625, -16.7021484375, -15.77685546875, -14.8515625, -13.92626953125, -13.0009765625, -12.07568359375, -11.150390625, -10.22509765625, -9.2998046875, -8.37451171875, -7.44921875, -6.52392578125, -5.5986328125, -4.67333984375, -3.748046875, -2.82275390625, -1.8974609375, -0.97216796875, -0.046875, 0.87841796875, 1.8037109375, 2.72900390625, 3.654296875, 4.57958984375, 5.5048828125, 6.43017578125, 7.35546875, 8.28076171875, 9.2060546875, 10.13134765625, 11.056640625, 11.98193359375, 12.9072265625, 13.83251953125, 14.7578125, 15.68310546875, 16.6083984375, 17.53369140625, 18.458984375, 19.38427734375, 20.3095703125, 21.23486328125, 22.16015625, 23.08544921875, 24.0107421875, 24.93603515625, 25.861328125, 26.78662109375, 27.7119140625, 28.63720703125, 29.5625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 9.0, 9.0, 8.0, 12.0, 11.0, 22.0, 25.0, 14.0, 27.0, 22.0, 31.0, 38.0, 50.0, 39.0, 69.0, 117.0, 317.0, 681.0, 99.0, 54.0, 45.0, 41.0, 38.0, 47.0, 38.0, 32.0, 17.0, 21.0, 20.0, 18.0, 16.0, 3.0, 5.0, 6.0, 6.0, 3.0, 4.0, 5.0, 5.0, 2.0, 0.0, 0.0, 2.0, 3.0], "bins": [-81.375, -79.20068359375, -77.0263671875, -74.85205078125, -72.677734375, -70.50341796875, -68.3291015625, -66.15478515625, -63.98046875, -61.80615234375, -59.6318359375, -57.45751953125, -55.283203125, -53.10888671875, -50.9345703125, -48.76025390625, -46.5859375, -44.41162109375, -42.2373046875, -40.06298828125, -37.888671875, -35.71435546875, -33.5400390625, -31.36572265625, -29.19140625, -27.01708984375, -24.8427734375, -22.66845703125, -20.494140625, -18.31982421875, -16.1455078125, -13.97119140625, -11.796875, -9.62255859375, -7.4482421875, -5.27392578125, -3.099609375, -0.92529296875, 1.2490234375, 3.42333984375, 5.59765625, 7.77197265625, 9.9462890625, 12.12060546875, 14.294921875, 16.46923828125, 18.6435546875, 20.81787109375, 22.9921875, 25.16650390625, 27.3408203125, 29.51513671875, 31.689453125, 33.86376953125, 36.0380859375, 38.21240234375, 40.38671875, 42.56103515625, 44.7353515625, 46.90966796875, 49.083984375, 51.25830078125, 53.4326171875, 55.60693359375, 57.78125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [6.0, 1.0, 2.0, 3.0, 6.0, 4.0, 10.0, 21.0, 22.0, 14.0, 30.0, 36.0, 36.0, 47.0, 41.0, 70.0, 90.0, 112.0, 170.0, 200.0, 278.0, 372.0, 594.0, 719.0, 1211.0, 1821.0, 3146.0, 5685.0, 12442.0, 30833.0, 120597.0, 5946503.0, 110018.0, 29690.0, 12061.0, 5665.0, 3226.0, 1702.0, 1086.0, 776.0, 503.0, 344.0, 306.0, 218.0, 147.0, 147.0, 102.0, 64.0, 69.0, 28.0, 38.0, 45.0, 29.0, 16.0, 13.0, 5.0, 11.0, 6.0, 11.0, 5.0, 0.0, 0.0, 0.0, 3.0], "bins": [-181.5, -175.734375, -169.96875, -164.203125, -158.4375, -152.671875, -146.90625, -141.140625, -135.375, -129.609375, -123.84375, -118.078125, -112.3125, -106.546875, -100.78125, -95.015625, -89.25, -83.484375, -77.71875, -71.953125, -66.1875, -60.421875, -54.65625, -48.890625, -43.125, -37.359375, -31.59375, -25.828125, -20.0625, -14.296875, -8.53125, -2.765625, 3.0, 8.765625, 14.53125, 20.296875, 26.0625, 31.828125, 37.59375, 43.359375, 49.125, 54.890625, 60.65625, 66.421875, 72.1875, 77.953125, 83.71875, 89.484375, 95.25, 101.015625, 106.78125, 112.546875, 118.3125, 124.078125, 129.84375, 135.609375, 141.375, 147.140625, 152.90625, 158.671875, 164.4375, 170.203125, 175.96875, 181.734375, 187.5]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 8.0, 3.0, 8.0, 5.0, 8.0, 5.0, 12.0, 14.0, 10.0, 22.0, 21.0, 29.0, 24.0, 33.0, 40.0, 50.0, 63.0, 187.0, 760.0, 227.0, 74.0, 56.0, 49.0, 49.0, 46.0, 32.0, 34.0, 36.0, 21.0, 22.0, 16.0, 21.0, 8.0, 3.0, 5.0, 2.0, 7.0, 4.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-91.375, -88.5927734375, -85.810546875, -83.0283203125, -80.24609375, -77.4638671875, -74.681640625, -71.8994140625, -69.1171875, -66.3349609375, -63.552734375, -60.7705078125, -57.98828125, -55.2060546875, -52.423828125, -49.6416015625, -46.859375, -44.0771484375, -41.294921875, -38.5126953125, -35.73046875, -32.9482421875, -30.166015625, -27.3837890625, -24.6015625, -21.8193359375, -19.037109375, -16.2548828125, -13.47265625, -10.6904296875, -7.908203125, -5.1259765625, -2.34375, 0.4384765625, 3.220703125, 6.0029296875, 8.78515625, 11.5673828125, 14.349609375, 17.1318359375, 19.9140625, 22.6962890625, 25.478515625, 28.2607421875, 31.04296875, 33.8251953125, 36.607421875, 39.3896484375, 42.171875, 44.9541015625, 47.736328125, 50.5185546875, 53.30078125, 56.0830078125, 58.865234375, 61.6474609375, 64.4296875, 67.2119140625, 69.994140625, 72.7763671875, 75.55859375, 78.3408203125, 81.123046875, 83.9052734375, 86.6875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 6.0, 6.0, 22.0, 58.0, 222.0, 620.0, 43.0, 12.0, 10.0, 2.0, 3.0, 1.0, 2.0, 2.0], "bins": [-2257.08203125, -2216.116943359375, -2175.15185546875, -2134.186767578125, -2093.2216796875, -2052.256591796875, -2011.29150390625, -1970.326416015625, -1929.361328125, -1888.396240234375, -1847.43115234375, -1806.466064453125, -1765.5009765625, -1724.535888671875, -1683.57080078125, -1642.605712890625, -1601.640625, -1560.675537109375, -1519.71044921875, -1478.745361328125, -1437.7802734375, -1396.815185546875, -1355.85009765625, -1314.885009765625, -1273.9200439453125, -1232.9549560546875, -1191.9898681640625, -1151.0247802734375, -1110.0596923828125, -1069.0946044921875, -1028.1295166015625, -987.1644287109375, -946.19921875, -905.234130859375, -864.26904296875, -823.303955078125, -782.3388671875, -741.373779296875, -700.40869140625, -659.443603515625, -618.4785766601562, -577.5134887695312, -536.5484008789062, -495.58331298828125, -454.61822509765625, -413.65313720703125, -372.6880798339844, -331.7229919433594, -290.7579040527344, -249.79281616210938, -208.82772827148438, -167.86265563964844, -126.89756774902344, -85.93247985839844, -44.9674072265625, -4.0023193359375, 36.9627685546875, 77.9278564453125, 118.89293670654297, 159.85801696777344, 200.82310485839844, 241.78819274902344, 282.7532653808594, 323.7183532714844, 364.6834411621094]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 6.0, 5.0, 11.0, 18.0, 38.0, 59.0, 199.0, 510.0, 66.0, 35.0, 22.0, 11.0, 5.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1075.1649169921875, -1030.64794921875, -986.131103515625, -941.6141967773438, -897.0972900390625, -852.5803833007812, -808.0634765625, -763.5465698242188, -719.0296630859375, -674.5127563476562, -629.995849609375, -585.4789428710938, -540.9620361328125, -496.44512939453125, -451.92822265625, -407.41131591796875, -362.8944091796875, -318.37750244140625, -273.860595703125, -229.34368896484375, -184.8267822265625, -140.30987548828125, -95.79296875, -51.27606201171875, -6.7591552734375, 37.75775146484375, 82.274658203125, 126.79156494140625, 171.3084716796875, 215.82537841796875, 260.34228515625, 304.85919189453125, 349.3759765625, 393.89288330078125, 438.4097900390625, 482.92669677734375, 527.443603515625, 571.9605102539062, 616.4774169921875, 660.9943237304688, 705.51123046875, 750.0281372070312, 794.5450439453125, 839.0619506835938, 883.578857421875, 928.0957641601562, 972.6126708984375, 1017.1295776367188, 1061.646484375, 1106.163330078125, 1150.6802978515625, 1195.197265625, 1239.714111328125, 1284.23095703125, 1328.7479248046875, 1373.264892578125, 1417.78173828125, 1462.298583984375, 1506.8155517578125, 1551.33251953125, 1595.849365234375, 1640.3662109375, 1684.8831787109375, 1729.400146484375, 1773.9169921875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 7.0, 6.0, 13.0, 11.0, 11.0, 21.0, 43.0, 56.0, 59.0, 102.0, 135.0, 240.0, 306.0, 549.0, 813.0, 1295.0, 2272.0, 3933.0, 8042.0, 18336.0, 68190.0, 3396356.0, 618486.0, 44598.0, 15062.0, 6476.0, 3340.0, 1800.0, 1128.0, 725.0, 509.0, 330.0, 245.0, 202.0, 148.0, 103.0, 88.0, 67.0, 40.0, 38.0, 19.0, 26.0, 20.0, 8.0, 11.0, 7.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.7265625, -6.485107421875, -6.24365234375, -6.002197265625, -5.7607421875, -5.519287109375, -5.27783203125, -5.036376953125, -4.794921875, -4.553466796875, -4.31201171875, -4.070556640625, -3.8291015625, -3.587646484375, -3.34619140625, -3.104736328125, -2.86328125, -2.621826171875, -2.38037109375, -2.138916015625, -1.8974609375, -1.656005859375, -1.41455078125, -1.173095703125, -0.931640625, -0.690185546875, -0.44873046875, -0.207275390625, 0.0341796875, 0.275634765625, 0.51708984375, 0.758544921875, 1.0, 1.241455078125, 1.48291015625, 1.724365234375, 1.9658203125, 2.207275390625, 2.44873046875, 2.690185546875, 2.931640625, 3.173095703125, 3.41455078125, 3.656005859375, 3.8974609375, 4.138916015625, 4.38037109375, 4.621826171875, 4.86328125, 5.104736328125, 5.34619140625, 5.587646484375, 5.8291015625, 6.070556640625, 6.31201171875, 6.553466796875, 6.794921875, 7.036376953125, 7.27783203125, 7.519287109375, 7.7607421875, 8.002197265625, 8.24365234375, 8.485107421875, 8.7265625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 7.0, 3.0, 6.0, 14.0, 18.0, 56.0, 214.0, 418.0, 162.0, 30.0, 14.0, 10.0, 13.0, 6.0, 8.0, 0.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.59912109375, -0.5787429809570312, -0.5583648681640625, -0.5379867553710938, -0.517608642578125, -0.49723052978515625, -0.4768524169921875, -0.45647430419921875, -0.43609619140625, -0.41571807861328125, -0.3953399658203125, -0.37496185302734375, -0.354583740234375, -0.33420562744140625, -0.3138275146484375, -0.29344940185546875, -0.2730712890625, -0.25269317626953125, -0.2323150634765625, -0.21193695068359375, -0.191558837890625, -0.17118072509765625, -0.1508026123046875, -0.13042449951171875, -0.11004638671875, -0.08966827392578125, -0.0692901611328125, -0.04891204833984375, -0.028533935546875, -0.00815582275390625, 0.0122222900390625, 0.03260040283203125, 0.052978515625, 0.07335662841796875, 0.0937347412109375, 0.11411285400390625, 0.134490966796875, 0.15486907958984375, 0.1752471923828125, 0.19562530517578125, 0.21600341796875, 0.23638153076171875, 0.2567596435546875, 0.27713775634765625, 0.297515869140625, 0.31789398193359375, 0.3382720947265625, 0.35865020751953125, 0.3790283203125, 0.39940643310546875, 0.4197845458984375, 0.44016265869140625, 0.460540771484375, 0.48091888427734375, 0.5012969970703125, 0.5216751098632812, 0.54205322265625, 0.5624313354492188, 0.5828094482421875, 0.6031875610351562, 0.623565673828125, 0.6439437866210938, 0.6643218994140625, 0.6847000122070312, 0.705078125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 7.0, 15.0, 12.0, 13.0, 14.0, 18.0, 28.0, 36.0, 37.0, 65.0, 89.0, 140.0, 220.0, 251.0, 423.0, 699.0, 1389.0, 2739.0, 6181.0, 18210.0, 79353.0, 1111844.0, 2807632.0, 125721.0, 24316.0, 7797.0, 3225.0, 1566.0, 831.0, 502.0, 281.0, 174.0, 142.0, 82.0, 61.0, 41.0, 28.0, 22.0, 14.0, 16.0, 15.0, 12.0, 7.0, 4.0, 2.0, 3.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.2578125, -7.03179931640625, -6.8057861328125, -6.57977294921875, -6.353759765625, -6.12774658203125, -5.9017333984375, -5.67572021484375, -5.44970703125, -5.22369384765625, -4.9976806640625, -4.77166748046875, -4.545654296875, -4.31964111328125, -4.0936279296875, -3.86761474609375, -3.6416015625, -3.41558837890625, -3.1895751953125, -2.96356201171875, -2.737548828125, -2.51153564453125, -2.2855224609375, -2.05950927734375, -1.83349609375, -1.60748291015625, -1.3814697265625, -1.15545654296875, -0.929443359375, -0.70343017578125, -0.4774169921875, -0.25140380859375, -0.025390625, 0.20062255859375, 0.4266357421875, 0.65264892578125, 0.878662109375, 1.10467529296875, 1.3306884765625, 1.55670166015625, 1.78271484375, 2.00872802734375, 2.2347412109375, 2.46075439453125, 2.686767578125, 2.91278076171875, 3.1387939453125, 3.36480712890625, 3.5908203125, 3.81683349609375, 4.0428466796875, 4.26885986328125, 4.494873046875, 4.72088623046875, 4.9468994140625, 5.17291259765625, 5.39892578125, 5.62493896484375, 5.8509521484375, 6.07696533203125, 6.302978515625, 6.52899169921875, 6.7550048828125, 6.98101806640625, 7.20703125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 5.0, 8.0, 5.0, 8.0, 9.0, 11.0, 5.0, 9.0, 17.0, 21.0, 23.0, 28.0, 40.0, 46.0, 69.0, 71.0, 87.0, 116.0, 147.0, 206.0, 312.0, 408.0, 657.0, 424.0, 292.0, 207.0, 164.0, 133.0, 98.0, 92.0, 72.0, 60.0, 46.0, 43.0, 23.0, 32.0, 11.0, 9.0, 21.0, 12.0, 8.0, 9.0, 9.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9716796875, -0.936553955078125, -0.90142822265625, -0.866302490234375, -0.8311767578125, -0.796051025390625, -0.76092529296875, -0.725799560546875, -0.690673828125, -0.655548095703125, -0.62042236328125, -0.585296630859375, -0.5501708984375, -0.515045166015625, -0.47991943359375, -0.444793701171875, -0.40966796875, -0.374542236328125, -0.33941650390625, -0.304290771484375, -0.2691650390625, -0.234039306640625, -0.19891357421875, -0.163787841796875, -0.128662109375, -0.093536376953125, -0.05841064453125, -0.023284912109375, 0.0118408203125, 0.046966552734375, 0.08209228515625, 0.117218017578125, 0.15234375, 0.187469482421875, 0.22259521484375, 0.257720947265625, 0.2928466796875, 0.327972412109375, 0.36309814453125, 0.398223876953125, 0.433349609375, 0.468475341796875, 0.50360107421875, 0.538726806640625, 0.5738525390625, 0.608978271484375, 0.64410400390625, 0.679229736328125, 0.71435546875, 0.749481201171875, 0.78460693359375, 0.819732666015625, 0.8548583984375, 0.889984130859375, 0.92510986328125, 0.960235595703125, 0.995361328125, 1.030487060546875, 1.06561279296875, 1.100738525390625, 1.1358642578125, 1.170989990234375, 1.20611572265625, 1.241241455078125, 1.2763671875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 8.0, 8.0, 4.0, 4.0, 14.0, 20.0, 44.0, 55.0, 126.0, 195.0, 203.0, 127.0, 70.0, 42.0, 28.0, 15.0, 15.0, 13.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.504745483398438, -10.862683296203613, -10.220622062683105, -9.578559875488281, -8.936498641967773, -8.29443645477295, -7.652374267578125, -7.010312557220459, -6.368250846862793, -5.726189136505127, -5.084127426147461, -4.442065238952637, -3.8000035285949707, -3.1579418182373047, -2.5158798694610596, -1.8738179206848145, -1.2317562103271484, -0.5896943807601929, 0.052367448806762695, 0.6944292783737183, 1.3364911079406738, 1.9785528182983398, 2.620614767074585, 3.26267671585083, 3.904738426208496, 4.546800136566162, 5.188861846923828, 5.830924034118652, 6.472985744476318, 7.115047454833984, 7.757109642028809, 8.399171829223633, 9.04123306274414, 9.683295249938965, 10.325356483459473, 10.967418670654297, 11.609479904174805, 12.251542091369629, 12.893604278564453, 13.535665512084961, 14.177727699279785, 14.81978988647461, 15.461851119995117, 16.103912353515625, 16.745975494384766, 17.388036727905273, 18.03009796142578, 18.672161102294922, 19.31422233581543, 19.956283569335938, 20.598346710205078, 21.240407943725586, 21.882469177246094, 22.524532318115234, 23.166593551635742, 23.80865478515625, 24.45071792602539, 25.0927791595459, 25.73484230041504, 26.376903533935547, 27.018964767456055, 27.661026000976562, 28.303089141845703, 28.94515037536621, 29.58721160888672]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 1.0, 6.0, 6.0, 10.0, 10.0, 13.0, 10.0, 14.0, 12.0, 24.0, 27.0, 26.0, 20.0, 32.0, 24.0, 47.0, 45.0, 35.0, 48.0, 42.0, 38.0, 44.0, 33.0, 50.0, 35.0, 36.0, 39.0, 33.0, 40.0, 29.0, 31.0, 22.0, 17.0, 16.0, 13.0, 12.0, 19.0, 9.0, 3.0, 8.0, 10.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.937492370605469, -8.650494575500488, -8.363497734069824, -8.076499938964844, -7.789502143859863, -7.502504825592041, -7.215507507324219, -6.928509712219238, -6.641512393951416, -6.354515075683594, -6.067517280578613, -5.780519962310791, -5.493522644042969, -5.206524848937988, -4.919527530670166, -4.632530212402344, -4.345532417297363, -4.058535099029541, -3.7715373039245605, -3.4845399856567383, -3.197542428970337, -2.9105448722839355, -2.6235475540161133, -2.336549997329712, -2.0495524406433105, -1.7625548839569092, -1.4755574464797974, -1.1885600090026855, -0.9015624523162842, -0.6145648956298828, -0.327567458152771, -0.04057002067565918, 0.24642658233642578, 0.5334240794181824, 0.820421576499939, 1.1074190139770508, 1.3944165706634521, 1.6814141273498535, 1.9684115648269653, 2.255409002304077, 2.5424065589904785, 2.82940411567688, 3.1164016723632812, 3.4033989906311035, 3.690396547317505, 3.9773941040039062, 4.2643914222717285, 4.551388740539551, 4.838386535644531, 5.1253838539123535, 5.412381649017334, 5.699378967285156, 5.986376762390137, 6.273374080657959, 6.560371398925781, 6.847369194030762, 7.134366512298584, 7.421363830566406, 7.708361625671387, 7.995358943939209, 8.282356262207031, 8.569354057312012, 8.856351852416992, 9.143348693847656, 9.430346488952637]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 7.0, 12.0, 16.0, 21.0, 19.0, 36.0, 55.0, 62.0, 118.0, 198.0, 358.0, 631.0, 1262.0, 2820.0, 8120.0, 45048.0, 841935.0, 127070.0, 13283.0, 4041.0, 1572.0, 770.0, 421.0, 256.0, 140.0, 95.0, 63.0, 35.0, 31.0, 22.0, 13.0, 8.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.859375, -8.5882568359375, -8.317138671875, -8.0460205078125, -7.77490234375, -7.5037841796875, -7.232666015625, -6.9615478515625, -6.6904296875, -6.4193115234375, -6.148193359375, -5.8770751953125, -5.60595703125, -5.3348388671875, -5.063720703125, -4.7926025390625, -4.521484375, -4.2503662109375, -3.979248046875, -3.7081298828125, -3.43701171875, -3.1658935546875, -2.894775390625, -2.6236572265625, -2.3525390625, -2.0814208984375, -1.810302734375, -1.5391845703125, -1.26806640625, -0.9969482421875, -0.725830078125, -0.4547119140625, -0.18359375, 0.0875244140625, 0.358642578125, 0.6297607421875, 0.90087890625, 1.1719970703125, 1.443115234375, 1.7142333984375, 1.9853515625, 2.2564697265625, 2.527587890625, 2.7987060546875, 3.06982421875, 3.3409423828125, 3.612060546875, 3.8831787109375, 4.154296875, 4.4254150390625, 4.696533203125, 4.9676513671875, 5.23876953125, 5.5098876953125, 5.781005859375, 6.0521240234375, 6.3232421875, 6.5943603515625, 6.865478515625, 7.1365966796875, 7.40771484375, 7.6788330078125, 7.949951171875, 8.2210693359375, 8.4921875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 7.0, 5.0, 7.0, 13.0, 14.0, 29.0, 54.0, 112.0, 156.0, 198.0, 174.0, 104.0, 46.0, 30.0, 13.0, 12.0, 6.0, 3.0, 5.0, 3.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4892578125, -0.467498779296875, -0.44573974609375, -0.423980712890625, -0.4022216796875, -0.380462646484375, -0.35870361328125, -0.336944580078125, -0.315185546875, -0.293426513671875, -0.27166748046875, -0.249908447265625, -0.2281494140625, -0.206390380859375, -0.18463134765625, -0.162872314453125, -0.14111328125, -0.119354248046875, -0.09759521484375, -0.075836181640625, -0.0540771484375, -0.032318115234375, -0.01055908203125, 0.011199951171875, 0.032958984375, 0.054718017578125, 0.07647705078125, 0.098236083984375, 0.1199951171875, 0.141754150390625, 0.16351318359375, 0.185272216796875, 0.20703125, 0.228790283203125, 0.25054931640625, 0.272308349609375, 0.2940673828125, 0.315826416015625, 0.33758544921875, 0.359344482421875, 0.381103515625, 0.402862548828125, 0.42462158203125, 0.446380615234375, 0.4681396484375, 0.489898681640625, 0.51165771484375, 0.533416748046875, 0.55517578125, 0.576934814453125, 0.59869384765625, 0.620452880859375, 0.6422119140625, 0.663970947265625, 0.68572998046875, 0.707489013671875, 0.729248046875, 0.751007080078125, 0.77276611328125, 0.794525146484375, 0.8162841796875, 0.838043212890625, 0.85980224609375, 0.881561279296875, 0.9033203125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 5.0, 7.0, 7.0, 5.0, 8.0, 6.0, 10.0, 18.0, 24.0, 61.0, 59.0, 102.0, 169.0, 261.0, 477.0, 948.0, 2093.0, 5485.0, 21487.0, 386889.0, 593412.0, 26227.0, 6201.0, 2300.0, 1070.0, 478.0, 263.0, 128.0, 109.0, 83.0, 48.0, 39.0, 24.0, 13.0, 14.0, 12.0, 8.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.6796875, -9.377685546875, -9.07568359375, -8.773681640625, -8.4716796875, -8.169677734375, -7.86767578125, -7.565673828125, -7.263671875, -6.961669921875, -6.65966796875, -6.357666015625, -6.0556640625, -5.753662109375, -5.45166015625, -5.149658203125, -4.84765625, -4.545654296875, -4.24365234375, -3.941650390625, -3.6396484375, -3.337646484375, -3.03564453125, -2.733642578125, -2.431640625, -2.129638671875, -1.82763671875, -1.525634765625, -1.2236328125, -0.921630859375, -0.61962890625, -0.317626953125, -0.015625, 0.286376953125, 0.58837890625, 0.890380859375, 1.1923828125, 1.494384765625, 1.79638671875, 2.098388671875, 2.400390625, 2.702392578125, 3.00439453125, 3.306396484375, 3.6083984375, 3.910400390625, 4.21240234375, 4.514404296875, 4.81640625, 5.118408203125, 5.42041015625, 5.722412109375, 6.0244140625, 6.326416015625, 6.62841796875, 6.930419921875, 7.232421875, 7.534423828125, 7.83642578125, 8.138427734375, 8.4404296875, 8.742431640625, 9.04443359375, 9.346435546875, 9.6484375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 6.0, 5.0, 7.0, 7.0, 7.0, 11.0, 13.0, 15.0, 5.0, 13.0, 20.0, 26.0, 29.0, 30.0, 26.0, 40.0, 44.0, 37.0, 46.0, 51.0, 53.0, 32.0, 51.0, 52.0, 42.0, 44.0, 35.0, 39.0, 30.0, 39.0, 29.0, 17.0, 23.0, 19.0, 16.0, 10.0, 14.0, 10.0, 6.0, 2.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.939453125, -2.853240966796875, -2.76702880859375, -2.680816650390625, -2.5946044921875, -2.508392333984375, -2.42218017578125, -2.335968017578125, -2.249755859375, -2.163543701171875, -2.07733154296875, -1.991119384765625, -1.9049072265625, -1.818695068359375, -1.73248291015625, -1.646270751953125, -1.56005859375, -1.473846435546875, -1.38763427734375, -1.301422119140625, -1.2152099609375, -1.128997802734375, -1.04278564453125, -0.956573486328125, -0.870361328125, -0.784149169921875, -0.69793701171875, -0.611724853515625, -0.5255126953125, -0.439300537109375, -0.35308837890625, -0.266876220703125, -0.1806640625, -0.094451904296875, -0.00823974609375, 0.077972412109375, 0.1641845703125, 0.250396728515625, 0.33660888671875, 0.422821044921875, 0.509033203125, 0.595245361328125, 0.68145751953125, 0.767669677734375, 0.8538818359375, 0.940093994140625, 1.02630615234375, 1.112518310546875, 1.19873046875, 1.284942626953125, 1.37115478515625, 1.457366943359375, 1.5435791015625, 1.629791259765625, 1.71600341796875, 1.802215576171875, 1.888427734375, 1.974639892578125, 2.06085205078125, 2.147064208984375, 2.2332763671875, 2.319488525390625, 2.40570068359375, 2.491912841796875, 2.578125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 6.0, 6.0, 6.0, 18.0, 19.0, 25.0, 33.0, 49.0, 77.0, 130.0, 228.0, 500.0, 1240.0, 4260.0, 27318.0, 915246.0, 88248.0, 7844.0, 1894.0, 673.0, 278.0, 162.0, 89.0, 54.0, 47.0, 28.0, 21.0, 12.0, 10.0, 5.0, 11.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.5234375, -11.1708984375, -10.818359375, -10.4658203125, -10.11328125, -9.7607421875, -9.408203125, -9.0556640625, -8.703125, -8.3505859375, -7.998046875, -7.6455078125, -7.29296875, -6.9404296875, -6.587890625, -6.2353515625, -5.8828125, -5.5302734375, -5.177734375, -4.8251953125, -4.47265625, -4.1201171875, -3.767578125, -3.4150390625, -3.0625, -2.7099609375, -2.357421875, -2.0048828125, -1.65234375, -1.2998046875, -0.947265625, -0.5947265625, -0.2421875, 0.1103515625, 0.462890625, 0.8154296875, 1.16796875, 1.5205078125, 1.873046875, 2.2255859375, 2.578125, 2.9306640625, 3.283203125, 3.6357421875, 3.98828125, 4.3408203125, 4.693359375, 5.0458984375, 5.3984375, 5.7509765625, 6.103515625, 6.4560546875, 6.80859375, 7.1611328125, 7.513671875, 7.8662109375, 8.21875, 8.5712890625, 8.923828125, 9.2763671875, 9.62890625, 9.9814453125, 10.333984375, 10.6865234375, 11.0390625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 4.0, 4.0, 4.0, 9.0, 8.0, 8.0, 6.0, 26.0, 29.0, 35.0, 65.0, 87.0, 116.0, 137.0, 149.0, 107.0, 54.0, 43.0, 21.0, 19.0, 13.0, 10.0, 10.0, 8.0, 4.0, 3.0, 4.0, 3.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.0005340576171875, -0.0005208998918533325, -0.000507742166519165, -0.0004945844411849976, -0.0004814267158508301, -0.0004682689905166626, -0.0004551112651824951, -0.00044195353984832764, -0.00042879581451416016, -0.0004156380891799927, -0.0004024803638458252, -0.0003893226385116577, -0.00037616491317749023, -0.00036300718784332275, -0.0003498494625091553, -0.0003366917371749878, -0.0003235340118408203, -0.00031037628650665283, -0.00029721856117248535, -0.00028406083583831787, -0.0002709031105041504, -0.0002577453851699829, -0.00024458765983581543, -0.00023142993450164795, -0.00021827220916748047, -0.000205114483833313, -0.0001919567584991455, -0.00017879903316497803, -0.00016564130783081055, -0.00015248358249664307, -0.00013932585716247559, -0.0001261681318283081, -0.00011301040649414062, -9.985268115997314e-05, -8.669495582580566e-05, -7.353723049163818e-05, -6.03795051574707e-05, -4.722177982330322e-05, -3.406405448913574e-05, -2.0906329154968262e-05, -7.748603820800781e-06, 5.409121513366699e-06, 1.856684684753418e-05, 3.172457218170166e-05, 4.488229751586914e-05, 5.804002285003662e-05, 7.11977481842041e-05, 8.435547351837158e-05, 9.751319885253906e-05, 0.00011067092418670654, 0.00012382864952087402, 0.0001369863748550415, 0.00015014410018920898, 0.00016330182552337646, 0.00017645955085754395, 0.00018961727619171143, 0.0002027750015258789, 0.0002159327268600464, 0.00022909045219421387, 0.00024224817752838135, 0.00025540590286254883, 0.0002685636281967163, 0.0002817213535308838, 0.00029487907886505127, 0.00030803680419921875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 6.0, 18.0, 18.0, 28.0, 55.0, 118.0, 235.0, 608.0, 1878.0, 8366.0, 125529.0, 883904.0, 22573.0, 3478.0, 1007.0, 370.0, 171.0, 79.0, 53.0, 20.0, 21.0, 8.0, 8.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4453125, -11.0667724609375, -10.688232421875, -10.3096923828125, -9.93115234375, -9.5526123046875, -9.174072265625, -8.7955322265625, -8.4169921875, -8.0384521484375, -7.659912109375, -7.2813720703125, -6.90283203125, -6.5242919921875, -6.145751953125, -5.7672119140625, -5.388671875, -5.0101318359375, -4.631591796875, -4.2530517578125, -3.87451171875, -3.4959716796875, -3.117431640625, -2.7388916015625, -2.3603515625, -1.9818115234375, -1.603271484375, -1.2247314453125, -0.84619140625, -0.4676513671875, -0.089111328125, 0.2894287109375, 0.66796875, 1.0465087890625, 1.425048828125, 1.8035888671875, 2.18212890625, 2.5606689453125, 2.939208984375, 3.3177490234375, 3.6962890625, 4.0748291015625, 4.453369140625, 4.8319091796875, 5.21044921875, 5.5889892578125, 5.967529296875, 6.3460693359375, 6.724609375, 7.1031494140625, 7.481689453125, 7.8602294921875, 8.23876953125, 8.6173095703125, 8.995849609375, 9.3743896484375, 9.7529296875, 10.1314697265625, 10.510009765625, 10.8885498046875, 11.26708984375, 11.6456298828125, 12.024169921875, 12.4027099609375, 12.78125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 8.0, 13.0, 8.0, 15.0, 19.0, 34.0, 31.0, 68.0, 81.0, 116.0, 115.0, 112.0, 114.0, 87.0, 48.0, 40.0, 28.0, 20.0, 9.0, 7.0, 7.0, 7.0, 7.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.6640625, -4.53460693359375, -4.4051513671875, -4.27569580078125, -4.146240234375, -4.01678466796875, -3.8873291015625, -3.75787353515625, -3.62841796875, -3.49896240234375, -3.3695068359375, -3.24005126953125, -3.110595703125, -2.98114013671875, -2.8516845703125, -2.72222900390625, -2.5927734375, -2.46331787109375, -2.3338623046875, -2.20440673828125, -2.074951171875, -1.94549560546875, -1.8160400390625, -1.68658447265625, -1.55712890625, -1.42767333984375, -1.2982177734375, -1.16876220703125, -1.039306640625, -0.90985107421875, -0.7803955078125, -0.65093994140625, -0.521484375, -0.39202880859375, -0.2625732421875, -0.13311767578125, -0.003662109375, 0.12579345703125, 0.2552490234375, 0.38470458984375, 0.51416015625, 0.64361572265625, 0.7730712890625, 0.90252685546875, 1.031982421875, 1.16143798828125, 1.2908935546875, 1.42034912109375, 1.5498046875, 1.67926025390625, 1.8087158203125, 1.93817138671875, 2.067626953125, 2.19708251953125, 2.3265380859375, 2.45599365234375, 2.58544921875, 2.71490478515625, 2.8443603515625, 2.97381591796875, 3.103271484375, 3.23272705078125, 3.3621826171875, 3.49163818359375, 3.62109375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 5.0, 4.0, 3.0, 10.0, 14.0, 47.0, 109.0, 288.0, 279.0, 120.0, 44.0, 22.0, 18.0, 11.0, 5.0, 7.0, 1.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.4100341796875, -32.678707122802734, -30.947376251220703, -29.216049194335938, -27.484718322753906, -25.75339126586914, -24.022062301635742, -22.290733337402344, -20.559404373168945, -18.828075408935547, -17.09674644470215, -15.365418434143066, -13.634089469909668, -11.90276050567627, -10.171432495117188, -8.440103530883789, -6.708774566650391, -4.977445602416992, -3.246117115020752, -1.5147886276245117, 0.21654033660888672, 1.9478693008422852, 3.679197311401367, 5.410526275634766, 7.141855239868164, 8.873184204101562, 10.604513168334961, 12.335841178894043, 14.067170143127441, 15.79849910736084, 17.529827117919922, 19.26115608215332, 20.99248504638672, 22.723814010620117, 24.455142974853516, 26.18647003173828, 27.917800903320312, 29.649127960205078, 31.380456924438477, 33.111785888671875, 34.843116760253906, 36.57444381713867, 38.3057746887207, 40.03710174560547, 41.7684326171875, 43.499759674072266, 45.23108673095703, 46.96241760253906, 48.69374465942383, 50.425071716308594, 52.156402587890625, 53.88772964477539, 55.61906051635742, 57.35038757324219, 59.08171844482422, 60.813045501708984, 62.54437255859375, 64.27570343017578, 66.00702667236328, 67.73835754394531, 69.46968841552734, 71.20101928710938, 72.93234252929688, 74.6636734008789, 76.39500427246094]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 7.0, 0.0, 2.0, 5.0, 3.0, 13.0, 10.0, 25.0, 41.0, 64.0, 82.0, 118.0, 122.0, 128.0, 125.0, 83.0, 65.0, 41.0, 15.0, 16.0, 8.0, 7.0, 5.0, 3.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-64.34403991699219, -62.69165802001953, -61.039276123046875, -59.38689422607422, -57.73451614379883, -56.08213424682617, -54.429752349853516, -52.77737045288086, -51.12499237060547, -49.47261047363281, -47.820228576660156, -46.1678466796875, -44.51546859741211, -42.86308670043945, -41.2107048034668, -39.55832290649414, -37.905941009521484, -36.25355911254883, -34.60117721557617, -32.94879913330078, -31.296417236328125, -29.64403533935547, -27.991653442382812, -26.339271545410156, -24.686891555786133, -23.034509658813477, -21.382129669189453, -19.729747772216797, -18.07736587524414, -16.424985885620117, -14.772603988647461, -13.120223045349121, -11.467842102050781, -9.815461158752441, -8.163080215454102, -6.510698318481445, -4.8583173751831055, -3.2059364318847656, -1.5535545349121094, 0.09882640838623047, 1.7512073516845703, 3.4035885334014893, 5.055969715118408, 6.708351135253906, 8.360732078552246, 10.013113021850586, 11.665494918823242, 13.317875862121582, 14.970256805419922, 16.622638702392578, 18.2750186920166, 19.927400588989258, 21.57978057861328, 23.232162475585938, 24.884544372558594, 26.53692626953125, 28.189306259155273, 29.84168815612793, 31.494068145751953, 33.14645004272461, 34.798831939697266, 36.451210021972656, 38.10359191894531, 39.75597381591797, 41.408355712890625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 6.0, 11.0, 7.0, 11.0, 22.0, 34.0, 57.0, 265.0, 8338.0, 4175632.0, 9395.0, 334.0, 65.0, 28.0, 20.0, 13.0, 8.0, 5.0, 8.0, 7.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.5, -95.5595703125, -92.619140625, -89.6787109375, -86.73828125, -83.7978515625, -80.857421875, -77.9169921875, -74.9765625, -72.0361328125, -69.095703125, -66.1552734375, -63.21484375, -60.2744140625, -57.333984375, -54.3935546875, -51.453125, -48.5126953125, -45.572265625, -42.6318359375, -39.69140625, -36.7509765625, -33.810546875, -30.8701171875, -27.9296875, -24.9892578125, -22.048828125, -19.1083984375, -16.16796875, -13.2275390625, -10.287109375, -7.3466796875, -4.40625, -1.4658203125, 1.474609375, 4.4150390625, 7.35546875, 10.2958984375, 13.236328125, 16.1767578125, 19.1171875, 22.0576171875, 24.998046875, 27.9384765625, 30.87890625, 33.8193359375, 36.759765625, 39.7001953125, 42.640625, 45.5810546875, 48.521484375, 51.4619140625, 54.40234375, 57.3427734375, 60.283203125, 63.2236328125, 66.1640625, 69.1044921875, 72.044921875, 74.9853515625, 77.92578125, 80.8662109375, 83.806640625, 86.7470703125, 89.6875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 5.0, 9.0, 3.0, 9.0, 9.0, 12.0, 15.0, 17.0, 36.0, 54.0, 73.0, 87.0, 88.0, 104.0, 99.0, 102.0, 80.0, 54.0, 55.0, 23.0, 11.0, 11.0, 11.0, 8.0, 7.0, 2.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36083984375, -0.34632110595703125, -0.3318023681640625, -0.31728363037109375, -0.302764892578125, -0.28824615478515625, -0.2737274169921875, -0.25920867919921875, -0.24468994140625, -0.23017120361328125, -0.2156524658203125, -0.20113372802734375, -0.186614990234375, -0.17209625244140625, -0.1575775146484375, -0.14305877685546875, -0.1285400390625, -0.11402130126953125, -0.0995025634765625, -0.08498382568359375, -0.070465087890625, -0.05594635009765625, -0.0414276123046875, -0.02690887451171875, -0.01239013671875, 0.00212860107421875, 0.0166473388671875, 0.03116607666015625, 0.045684814453125, 0.06020355224609375, 0.0747222900390625, 0.08924102783203125, 0.103759765625, 0.11827850341796875, 0.1327972412109375, 0.14731597900390625, 0.161834716796875, 0.17635345458984375, 0.1908721923828125, 0.20539093017578125, 0.21990966796875, 0.23442840576171875, 0.2489471435546875, 0.26346588134765625, 0.277984619140625, 0.29250335693359375, 0.3070220947265625, 0.32154083251953125, 0.3360595703125, 0.35057830810546875, 0.3650970458984375, 0.37961578369140625, 0.394134521484375, 0.40865325927734375, 0.4231719970703125, 0.43769073486328125, 0.45220947265625, 0.46672821044921875, 0.4812469482421875, 0.49576568603515625, 0.510284423828125, 0.5248031616210938, 0.5393218994140625, 0.5538406372070312, 0.568359375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 14.0, 30.0, 93.0, 236.0, 1937.0, 314737.0, 3872608.0, 3713.0, 510.0, 205.0, 95.0, 49.0, 28.0, 20.0, 8.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.390625, -11.918701171875, -10.44677734375, -8.974853515625, -7.5029296875, -6.031005859375, -4.55908203125, -3.087158203125, -1.615234375, -0.143310546875, 1.32861328125, 2.800537109375, 4.2724609375, 5.744384765625, 7.21630859375, 8.688232421875, 10.16015625, 11.632080078125, 13.10400390625, 14.575927734375, 16.0478515625, 17.519775390625, 18.99169921875, 20.463623046875, 21.935546875, 23.407470703125, 24.87939453125, 26.351318359375, 27.8232421875, 29.295166015625, 30.76708984375, 32.239013671875, 33.7109375, 35.182861328125, 36.65478515625, 38.126708984375, 39.5986328125, 41.070556640625, 42.54248046875, 44.014404296875, 45.486328125, 46.958251953125, 48.43017578125, 49.902099609375, 51.3740234375, 52.845947265625, 54.31787109375, 55.789794921875, 57.26171875, 58.733642578125, 60.20556640625, 61.677490234375, 63.1494140625, 64.621337890625, 66.09326171875, 67.565185546875, 69.037109375, 70.509033203125, 71.98095703125, 73.452880859375, 74.9248046875, 76.396728515625, 77.86865234375, 79.340576171875, 80.8125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 7.0, 3.0, 5.0, 9.0, 8.0, 7.0, 12.0, 16.0, 13.0, 14.0, 29.0, 30.0, 53.0, 57.0, 67.0, 110.0, 162.0, 337.0, 1055.0, 868.0, 470.0, 235.0, 138.0, 87.0, 51.0, 35.0, 39.0, 16.0, 22.0, 18.0, 14.0, 17.0, 10.0, 10.0, 9.0, 5.0, 5.0, 1.0, 7.0, 3.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.78955078125, -0.7655563354492188, -0.7415618896484375, -0.7175674438476562, -0.693572998046875, -0.6695785522460938, -0.6455841064453125, -0.6215896606445312, -0.59759521484375, -0.5736007690429688, -0.5496063232421875, -0.5256118774414062, -0.501617431640625, -0.47762298583984375, -0.4536285400390625, -0.42963409423828125, -0.4056396484375, -0.38164520263671875, -0.3576507568359375, -0.33365631103515625, -0.309661865234375, -0.28566741943359375, -0.2616729736328125, -0.23767852783203125, -0.21368408203125, -0.18968963623046875, -0.1656951904296875, -0.14170074462890625, -0.117706298828125, -0.09371185302734375, -0.0697174072265625, -0.04572296142578125, -0.021728515625, 0.00226593017578125, 0.0262603759765625, 0.05025482177734375, 0.074249267578125, 0.09824371337890625, 0.1222381591796875, 0.14623260498046875, 0.17022705078125, 0.19422149658203125, 0.2182159423828125, 0.24221038818359375, 0.266204833984375, 0.29019927978515625, 0.3141937255859375, 0.33818817138671875, 0.3621826171875, 0.38617706298828125, 0.4101715087890625, 0.43416595458984375, 0.458160400390625, 0.48215484619140625, 0.5061492919921875, 0.5301437377929688, 0.55413818359375, 0.5781326293945312, 0.6021270751953125, 0.6261215209960938, 0.650115966796875, 0.6741104125976562, 0.6981048583984375, 0.7220993041992188, 0.74609375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 8.0, 904.0, 99.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.41563606262207, -8.240530014038086, -3.0654239654541016, 2.109682083129883, 7.284788131713867, 12.459894180297852, 17.635000228881836, 22.81010627746582, 27.985212326049805, 33.160316467285156, 38.335426330566406, 43.510528564453125, 48.685638427734375, 53.860740661621094, 59.035850524902344, 64.21095275878906, 69.38606262207031, 74.56117248535156, 79.73627471923828, 84.911376953125, 90.08648681640625, 95.2615966796875, 100.43669891357422, 105.61180114746094, 110.78691101074219, 115.96202087402344, 121.13712310791016, 126.31222534179688, 131.48733520507812, 136.66244506835938, 141.83755493164062, 147.0126495361328, 152.187744140625, 157.36285400390625, 162.5379638671875, 167.7130584716797, 172.88816833496094, 178.0632781982422, 183.23837280273438, 188.41348266601562, 193.58859252929688, 198.76370239257812, 203.93881225585938, 209.11390686035156, 214.2890167236328, 219.46412658691406, 224.63922119140625, 229.8143310546875, 234.98944091796875, 240.16455078125, 245.33966064453125, 250.51475524902344, 255.6898651123047, 260.8649597167969, 266.0400695800781, 271.2151794433594, 276.3902893066406, 281.5653991699219, 286.7405090332031, 291.9156188964844, 297.0906982421875, 302.26580810546875, 307.44091796875, 312.61602783203125, 317.7911376953125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 1.0, 3.0, 11.0, 14.0, 16.0, 33.0, 58.0, 62.0, 105.0, 102.0, 109.0, 103.0, 98.0, 91.0, 70.0, 42.0, 38.0, 21.0, 13.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.060612201690674, -6.711625576019287, -6.3626389503479, -6.013652801513672, -5.664666175842285, -5.315679550170898, -4.966692924499512, -4.617706298828125, -4.268719673156738, -3.9197330474853516, -3.570746660232544, -3.2217600345611572, -2.8727736473083496, -2.523787021636963, -2.174800395965576, -1.8258140087127686, -1.476827621459961, -1.1278411149978638, -0.7788545489311218, -0.4298679828643799, -0.08088147640228271, 0.26810503005981445, 0.6170916557312012, 0.9660780429840088, 1.3150646686553955, 1.6640511751174927, 2.01303768157959, 2.3620243072509766, 2.7110109329223633, 3.059997320175171, 3.4089839458465576, 3.7579703330993652, 4.10695743560791, 4.455944061279297, 4.804930686950684, 5.15391731262207, 5.502903461456299, 5.8518900871276855, 6.200876712799072, 6.549862861633301, 6.8988494873046875, 7.247836112976074, 7.596822738647461, 7.945809364318848, 8.294795989990234, 8.643781661987305, 8.992769241333008, 9.341754913330078, 9.690742492675781, 10.039729118347168, 10.388715744018555, 10.737702369689941, 11.086688995361328, 11.435674667358398, 11.784662246704102, 12.133647918701172, 12.482634544372559, 12.831621170043945, 13.180607795715332, 13.529594421386719, 13.878581047058105, 14.227567672729492, 14.576553344726562, 14.92553997039795, 15.274526596069336]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 5.0, 7.0, 2.0, 4.0, 10.0, 7.0, 14.0, 21.0, 33.0, 49.0, 65.0, 146.0, 318.0, 899.0, 2558.0, 9876.0, 62380.0, 751077.0, 193986.0, 20197.0, 4544.0, 1302.0, 531.0, 220.0, 114.0, 66.0, 33.0, 21.0, 26.0, 12.0, 11.0, 5.0, 6.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-14.40625, -14.0029296875, -13.599609375, -13.1962890625, -12.79296875, -12.3896484375, -11.986328125, -11.5830078125, -11.1796875, -10.7763671875, -10.373046875, -9.9697265625, -9.56640625, -9.1630859375, -8.759765625, -8.3564453125, -7.953125, -7.5498046875, -7.146484375, -6.7431640625, -6.33984375, -5.9365234375, -5.533203125, -5.1298828125, -4.7265625, -4.3232421875, -3.919921875, -3.5166015625, -3.11328125, -2.7099609375, -2.306640625, -1.9033203125, -1.5, -1.0966796875, -0.693359375, -0.2900390625, 0.11328125, 0.5166015625, 0.919921875, 1.3232421875, 1.7265625, 2.1298828125, 2.533203125, 2.9365234375, 3.33984375, 3.7431640625, 4.146484375, 4.5498046875, 4.953125, 5.3564453125, 5.759765625, 6.1630859375, 6.56640625, 6.9697265625, 7.373046875, 7.7763671875, 8.1796875, 8.5830078125, 8.986328125, 9.3896484375, 9.79296875, 10.1962890625, 10.599609375, 11.0029296875, 11.40625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 4.0, 19.0, 19.0, 38.0, 61.0, 86.0, 147.0, 144.0, 127.0, 119.0, 82.0, 48.0, 40.0, 25.0, 17.0, 7.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0732421875, -1.0498313903808594, -1.0264205932617188, -1.0030097961425781, -0.9795989990234375, -0.9561882019042969, -0.9327774047851562, -0.9093666076660156, -0.885955810546875, -0.8625450134277344, -0.8391342163085938, -0.8157234191894531, -0.7923126220703125, -0.7689018249511719, -0.7454910278320312, -0.7220802307128906, -0.69866943359375, -0.6752586364746094, -0.6518478393554688, -0.6284370422363281, -0.6050262451171875, -0.5816154479980469, -0.5582046508789062, -0.5347938537597656, -0.511383056640625, -0.4879722595214844, -0.46456146240234375, -0.4411506652832031, -0.4177398681640625, -0.3943290710449219, -0.37091827392578125, -0.3475074768066406, -0.3240966796875, -0.3006858825683594, -0.27727508544921875, -0.2538642883300781, -0.2304534912109375, -0.20704269409179688, -0.18363189697265625, -0.16022109985351562, -0.136810302734375, -0.11339950561523438, -0.08998870849609375, -0.06657791137695312, -0.0431671142578125, -0.019756317138671875, 0.00365447998046875, 0.027065277099609375, 0.05047607421875, 0.07388687133789062, 0.09729766845703125, 0.12070846557617188, 0.1441192626953125, 0.16753005981445312, 0.19094085693359375, 0.21435165405273438, 0.237762451171875, 0.2611732482910156, 0.28458404541015625, 0.3079948425292969, 0.3314056396484375, 0.3548164367675781, 0.37822723388671875, 0.4016380310058594, 0.425048828125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 3.0, 4.0, 8.0, 9.0, 12.0, 4.0, 11.0, 18.0, 17.0, 19.0, 19.0, 13.0, 28.0, 80.0, 273.0, 2358.0, 188570.0, 852173.0, 4344.0, 345.0, 75.0, 35.0, 22.0, 15.0, 18.0, 9.0, 13.0, 11.0, 11.0, 6.0, 5.0, 9.0, 4.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.828125, -27.012451171875, -26.19677734375, -25.381103515625, -24.5654296875, -23.749755859375, -22.93408203125, -22.118408203125, -21.302734375, -20.487060546875, -19.67138671875, -18.855712890625, -18.0400390625, -17.224365234375, -16.40869140625, -15.593017578125, -14.77734375, -13.961669921875, -13.14599609375, -12.330322265625, -11.5146484375, -10.698974609375, -9.88330078125, -9.067626953125, -8.251953125, -7.436279296875, -6.62060546875, -5.804931640625, -4.9892578125, -4.173583984375, -3.35791015625, -2.542236328125, -1.7265625, -0.910888671875, -0.09521484375, 0.720458984375, 1.5361328125, 2.351806640625, 3.16748046875, 3.983154296875, 4.798828125, 5.614501953125, 6.43017578125, 7.245849609375, 8.0615234375, 8.877197265625, 9.69287109375, 10.508544921875, 11.32421875, 12.139892578125, 12.95556640625, 13.771240234375, 14.5869140625, 15.402587890625, 16.21826171875, 17.033935546875, 17.849609375, 18.665283203125, 19.48095703125, 20.296630859375, 21.1123046875, 21.927978515625, 22.74365234375, 23.559326171875, 24.375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 5.0, 8.0, 9.0, 10.0, 13.0, 19.0, 14.0, 21.0, 18.0, 31.0, 26.0, 37.0, 34.0, 44.0, 38.0, 37.0, 38.0, 40.0, 49.0, 43.0, 41.0, 41.0, 44.0, 45.0, 43.0, 41.0, 35.0, 23.0, 25.0, 27.0, 20.0, 19.0, 16.0, 8.0, 11.0, 8.0, 5.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.046875, -1.9837188720703125, -1.920562744140625, -1.8574066162109375, -1.79425048828125, -1.7310943603515625, -1.667938232421875, -1.6047821044921875, -1.5416259765625, -1.4784698486328125, -1.415313720703125, -1.3521575927734375, -1.28900146484375, -1.2258453369140625, -1.162689208984375, -1.0995330810546875, -1.036376953125, -0.9732208251953125, -0.910064697265625, -0.8469085693359375, -0.78375244140625, -0.7205963134765625, -0.657440185546875, -0.5942840576171875, -0.5311279296875, -0.4679718017578125, -0.404815673828125, -0.3416595458984375, -0.27850341796875, -0.2153472900390625, -0.152191162109375, -0.0890350341796875, -0.02587890625, 0.0372772216796875, 0.100433349609375, 0.1635894775390625, 0.22674560546875, 0.2899017333984375, 0.353057861328125, 0.4162139892578125, 0.4793701171875, 0.5425262451171875, 0.605682373046875, 0.6688385009765625, 0.73199462890625, 0.7951507568359375, 0.858306884765625, 0.9214630126953125, 0.984619140625, 1.0477752685546875, 1.110931396484375, 1.1740875244140625, 1.23724365234375, 1.3003997802734375, 1.363555908203125, 1.4267120361328125, 1.4898681640625, 1.5530242919921875, 1.616180419921875, 1.6793365478515625, 1.74249267578125, 1.8056488037109375, 1.868804931640625, 1.9319610595703125, 1.9951171875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 4.0, 6.0, 21.0, 51.0, 170.0, 1534.0, 1043486.0, 2954.0, 221.0, 52.0, 23.0, 12.0, 3.0, 6.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-124.375, -120.30859375, -116.2421875, -112.17578125, -108.109375, -104.04296875, -99.9765625, -95.91015625, -91.84375, -87.77734375, -83.7109375, -79.64453125, -75.578125, -71.51171875, -67.4453125, -63.37890625, -59.3125, -55.24609375, -51.1796875, -47.11328125, -43.046875, -38.98046875, -34.9140625, -30.84765625, -26.78125, -22.71484375, -18.6484375, -14.58203125, -10.515625, -6.44921875, -2.3828125, 1.68359375, 5.75, 9.81640625, 13.8828125, 17.94921875, 22.015625, 26.08203125, 30.1484375, 34.21484375, 38.28125, 42.34765625, 46.4140625, 50.48046875, 54.546875, 58.61328125, 62.6796875, 66.74609375, 70.8125, 74.87890625, 78.9453125, 83.01171875, 87.078125, 91.14453125, 95.2109375, 99.27734375, 103.34375, 107.41015625, 111.4765625, 115.54296875, 119.609375, 123.67578125, 127.7421875, 131.80859375, 135.875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 6.0, 3.0, 3.0, 8.0, 5.0, 10.0, 5.0, 19.0, 16.0, 16.0, 15.0, 15.0, 25.0, 27.0, 38.0, 38.0, 56.0, 76.0, 103.0, 101.0, 94.0, 62.0, 41.0, 35.0, 32.0, 19.0, 18.0, 24.0, 9.0, 14.0, 10.0, 10.0, 8.0, 5.0, 6.0, 5.0, 3.0, 6.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008368492126464844, -0.0008098185062408447, -0.0007827877998352051, -0.0007557570934295654, -0.0007287263870239258, -0.0007016956806182861, -0.0006746649742126465, -0.0006476342678070068, -0.0006206035614013672, -0.0005935728549957275, -0.0005665421485900879, -0.0005395114421844482, -0.0005124807357788086, -0.00048545002937316895, -0.0004584193229675293, -0.00043138861656188965, -0.00040435791015625, -0.00037732720375061035, -0.0003502964973449707, -0.00032326579093933105, -0.0002962350845336914, -0.00026920437812805176, -0.0002421736717224121, -0.00021514296531677246, -0.0001881122589111328, -0.00016108155250549316, -0.00013405084609985352, -0.00010702013969421387, -7.998943328857422e-05, -5.295872688293457e-05, -2.5928020477294922e-05, 1.1026859283447266e-06, 2.8133392333984375e-05, 5.5164098739624023e-05, 8.219480514526367e-05, 0.00010922551155090332, 0.00013625621795654297, 0.00016328692436218262, 0.00019031763076782227, 0.00021734833717346191, 0.00024437904357910156, 0.0002714097499847412, 0.00029844045639038086, 0.0003254711627960205, 0.00035250186920166016, 0.0003795325756072998, 0.00040656328201293945, 0.0004335939884185791, 0.00046062469482421875, 0.0004876554012298584, 0.000514686107635498, 0.0005417168140411377, 0.0005687475204467773, 0.000595778226852417, 0.0006228089332580566, 0.0006498396396636963, 0.0006768703460693359, 0.0007039010524749756, 0.0007309317588806152, 0.0007579624652862549, 0.0007849931716918945, 0.0008120238780975342, 0.0008390545845031738, 0.0008660852909088135, 0.0008931159973144531]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 3.0, 5.0, 10.0, 7.0, 7.0, 24.0, 28.0, 22.0, 34.0, 40.0, 66.0, 101.0, 147.0, 252.0, 426.0, 730.0, 1712.0, 4251.0, 13401.0, 62114.0, 729740.0, 196809.0, 26033.0, 7275.0, 2717.0, 1157.0, 625.0, 301.0, 178.0, 129.0, 61.0, 46.0, 29.0, 18.0, 17.0, 4.0, 9.0, 10.0, 2.0, 4.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-16.609375, -16.1312255859375, -15.653076171875, -15.1749267578125, -14.69677734375, -14.2186279296875, -13.740478515625, -13.2623291015625, -12.7841796875, -12.3060302734375, -11.827880859375, -11.3497314453125, -10.87158203125, -10.3934326171875, -9.915283203125, -9.4371337890625, -8.958984375, -8.4808349609375, -8.002685546875, -7.5245361328125, -7.04638671875, -6.5682373046875, -6.090087890625, -5.6119384765625, -5.1337890625, -4.6556396484375, -4.177490234375, -3.6993408203125, -3.22119140625, -2.7430419921875, -2.264892578125, -1.7867431640625, -1.30859375, -0.8304443359375, -0.352294921875, 0.1258544921875, 0.60400390625, 1.0821533203125, 1.560302734375, 2.0384521484375, 2.5166015625, 2.9947509765625, 3.472900390625, 3.9510498046875, 4.42919921875, 4.9073486328125, 5.385498046875, 5.8636474609375, 6.341796875, 6.8199462890625, 7.298095703125, 7.7762451171875, 8.25439453125, 8.7325439453125, 9.210693359375, 9.6888427734375, 10.1669921875, 10.6451416015625, 11.123291015625, 11.6014404296875, 12.07958984375, 12.5577392578125, 13.035888671875, 13.5140380859375, 13.9921875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 2.0, 2.0, 7.0, 21.0, 36.0, 49.0, 90.0, 165.0, 228.0, 179.0, 87.0, 56.0, 32.0, 22.0, 5.0, 4.0, 4.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.71875, -13.4100341796875, -13.101318359375, -12.7926025390625, -12.48388671875, -12.1751708984375, -11.866455078125, -11.5577392578125, -11.2490234375, -10.9403076171875, -10.631591796875, -10.3228759765625, -10.01416015625, -9.7054443359375, -9.396728515625, -9.0880126953125, -8.779296875, -8.4705810546875, -8.161865234375, -7.8531494140625, -7.54443359375, -7.2357177734375, -6.927001953125, -6.6182861328125, -6.3095703125, -6.0008544921875, -5.692138671875, -5.3834228515625, -5.07470703125, -4.7659912109375, -4.457275390625, -4.1485595703125, -3.83984375, -3.5311279296875, -3.222412109375, -2.9136962890625, -2.60498046875, -2.2962646484375, -1.987548828125, -1.6788330078125, -1.3701171875, -1.0614013671875, -0.752685546875, -0.4439697265625, -0.13525390625, 0.1734619140625, 0.482177734375, 0.7908935546875, 1.099609375, 1.4083251953125, 1.717041015625, 2.0257568359375, 2.33447265625, 2.6431884765625, 2.951904296875, 3.2606201171875, 3.5693359375, 3.8780517578125, 4.186767578125, 4.4954833984375, 4.80419921875, 5.1129150390625, 5.421630859375, 5.7303466796875, 6.0390625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 10.0, 37.0, 81.0, 173.0, 290.0, 226.0, 96.0, 34.0, 12.0, 15.0, 6.0, 4.0, 5.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-44.779842376708984, -42.96872329711914, -41.1576042175293, -39.34648895263672, -37.535369873046875, -35.72425079345703, -33.91313171386719, -32.102012634277344, -30.290895462036133, -28.47977638244629, -26.668659210205078, -24.857540130615234, -23.04642105102539, -21.23530387878418, -19.424184799194336, -17.613067626953125, -15.801948547363281, -13.990830421447754, -12.179712295532227, -10.368593215942383, -8.557475090026855, -6.746356964111328, -4.935237884521484, -3.124119758605957, -1.3130016326904297, 0.49811673164367676, 2.309235095977783, 4.120353698730469, 5.931471824645996, 7.742589950561523, 9.553709030151367, 11.364827156066895, 13.175949096679688, 14.987067222595215, 16.798185348510742, 18.609304428100586, 20.420421600341797, 22.23154067993164, 24.042659759521484, 25.853778839111328, 27.66489601135254, 29.476015090942383, 31.287132263183594, 33.09825134277344, 34.90937042236328, 36.720489501953125, 38.53160858154297, 40.34272384643555, 42.15384292602539, 43.964962005615234, 45.77608108520508, 47.587196350097656, 49.3983154296875, 51.209434509277344, 53.02055358886719, 54.83167266845703, 56.642791748046875, 58.45391082763672, 60.26502990722656, 62.076148986816406, 63.887264251708984, 65.69837951660156, 67.50950622558594, 69.32061767578125, 71.1317367553711]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 7.0, 9.0, 11.0, 25.0, 22.0, 48.0, 53.0, 60.0, 78.0, 98.0, 90.0, 74.0, 89.0, 69.0, 57.0, 49.0, 42.0, 31.0, 21.0, 23.0, 7.0, 7.0, 9.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.773853302001953, -23.75680160522461, -22.739749908447266, -21.722698211669922, -20.705646514892578, -19.688594818115234, -18.671545028686523, -17.65449333190918, -16.637441635131836, -15.620389938354492, -14.603338241577148, -13.586287498474121, -12.569235801696777, -11.552184104919434, -10.535133361816406, -9.518081665039062, -8.501029968261719, -7.483978271484375, -6.4669270515441895, -5.449875831604004, -4.43282413482666, -3.4157724380493164, -2.398721218109131, -1.3816699981689453, -0.36461830139160156, 0.6524331569671631, 1.6694846153259277, 2.6865360736846924, 3.703587532043457, 4.720639228820801, 5.737690448760986, 6.754741668701172, 7.77178955078125, 8.788841247558594, 9.805892944335938, 10.822943687438965, 11.839995384216309, 12.857047080993652, 13.87409782409668, 14.891149520874023, 15.908201217651367, 16.92525291442871, 17.942304611206055, 18.9593563079834, 19.97640609741211, 20.993457794189453, 22.010509490966797, 23.02756118774414, 24.044612884521484, 25.061664581298828, 26.078716278076172, 27.095767974853516, 28.11281967163086, 29.129871368408203, 30.146921157836914, 31.163972854614258, 32.18102264404297, 33.19807434082031, 34.215126037597656, 35.232177734375, 36.249229431152344, 37.26628112792969, 38.28333282470703, 39.300384521484375, 40.31743621826172]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 8.0, 0.0, 8.0, 2.0, 0.0, 0.0, 2.0, 4.0, 6.0, 14.0, 10.0, 2.0, 12.0, 20.0, 2.0, 26.0, 23.0, 27.0, 54.0, 409.0, 8044.0, 4133207.0, 50964.0, 1053.0, 193.0, 60.0, 35.0, 23.0, 14.0, 4.0, 8.0, 16.0, 14.0, 4.0, 4.0, 4.0, 2.0, 8.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-48.15625, -46.28173828125, -44.4072265625, -42.53271484375, -40.658203125, -38.78369140625, -36.9091796875, -35.03466796875, -33.16015625, -31.28564453125, -29.4111328125, -27.53662109375, -25.662109375, -23.78759765625, -21.9130859375, -20.03857421875, -18.1640625, -16.28955078125, -14.4150390625, -12.54052734375, -10.666015625, -8.79150390625, -6.9169921875, -5.04248046875, -3.16796875, -1.29345703125, 0.5810546875, 2.45556640625, 4.330078125, 6.20458984375, 8.0791015625, 9.95361328125, 11.828125, 13.70263671875, 15.5771484375, 17.45166015625, 19.326171875, 21.20068359375, 23.0751953125, 24.94970703125, 26.82421875, 28.69873046875, 30.5732421875, 32.44775390625, 34.322265625, 36.19677734375, 38.0712890625, 39.94580078125, 41.8203125, 43.69482421875, 45.5693359375, 47.44384765625, 49.318359375, 51.19287109375, 53.0673828125, 54.94189453125, 56.81640625, 58.69091796875, 60.5654296875, 62.43994140625, 64.314453125, 66.18896484375, 68.0634765625, 69.93798828125, 71.8125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 2.0, 5.0, 6.0, 9.0, 7.0, 12.0, 12.0, 22.0, 27.0, 21.0, 32.0, 37.0, 45.0, 59.0, 58.0, 48.0, 61.0, 58.0, 62.0, 54.0, 54.0, 44.0, 37.0, 35.0, 40.0, 30.0, 21.0, 16.0, 14.0, 17.0, 18.0, 11.0, 3.0, 3.0, 7.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.342529296875, -0.3305320739746094, -0.31853485107421875, -0.3065376281738281, -0.2945404052734375, -0.2825431823730469, -0.27054595947265625, -0.2585487365722656, -0.246551513671875, -0.23455429077148438, -0.22255706787109375, -0.21055984497070312, -0.1985626220703125, -0.18656539916992188, -0.17456817626953125, -0.16257095336914062, -0.15057373046875, -0.13857650756835938, -0.12657928466796875, -0.11458206176757812, -0.1025848388671875, -0.09058761596679688, -0.07859039306640625, -0.06659317016601562, -0.054595947265625, -0.042598724365234375, -0.03060150146484375, -0.018604278564453125, -0.0066070556640625, 0.005390167236328125, 0.01738739013671875, 0.029384613037109375, 0.0413818359375, 0.053379058837890625, 0.06537628173828125, 0.07737350463867188, 0.0893707275390625, 0.10136795043945312, 0.11336517333984375, 0.12536239624023438, 0.137359619140625, 0.14935684204101562, 0.16135406494140625, 0.17335128784179688, 0.1853485107421875, 0.19734573364257812, 0.20934295654296875, 0.22134017944335938, 0.23333740234375, 0.24533462524414062, 0.25733184814453125, 0.2693290710449219, 0.2813262939453125, 0.2933235168457031, 0.30532073974609375, 0.3173179626464844, 0.329315185546875, 0.3413124084472656, 0.35330963134765625, 0.3653068542480469, 0.3773040771484375, 0.3893013000488281, 0.40129852294921875, 0.4132957458496094, 0.42529296875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 12.0, 40.0, 93.0, 375.0, 15239.0, 4177200.0, 1187.0, 90.0, 41.0, 12.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-174.125, -170.91796875, -167.7109375, -164.50390625, -161.296875, -158.08984375, -154.8828125, -151.67578125, -148.46875, -145.26171875, -142.0546875, -138.84765625, -135.640625, -132.43359375, -129.2265625, -126.01953125, -122.8125, -119.60546875, -116.3984375, -113.19140625, -109.984375, -106.77734375, -103.5703125, -100.36328125, -97.15625, -93.94921875, -90.7421875, -87.53515625, -84.328125, -81.12109375, -77.9140625, -74.70703125, -71.5, -68.29296875, -65.0859375, -61.87890625, -58.671875, -55.46484375, -52.2578125, -49.05078125, -45.84375, -42.63671875, -39.4296875, -36.22265625, -33.015625, -29.80859375, -26.6015625, -23.39453125, -20.1875, -16.98046875, -13.7734375, -10.56640625, -7.359375, -4.15234375, -0.9453125, 2.26171875, 5.46875, 8.67578125, 11.8828125, 15.08984375, 18.296875, 21.50390625, 24.7109375, 27.91796875, 31.125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 1.0, 7.0, 9.0, 8.0, 14.0, 23.0, 28.0, 52.0, 76.0, 135.0, 231.0, 588.0, 1887.0, 487.0, 202.0, 110.0, 81.0, 47.0, 37.0, 11.0, 13.0, 7.0, 7.0, 3.0, 3.0, 4.0, 0.0, 1.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.361328125, -2.2982635498046875, -2.235198974609375, -2.1721343994140625, -2.10906982421875, -2.0460052490234375, -1.982940673828125, -1.9198760986328125, -1.8568115234375, -1.7937469482421875, -1.730682373046875, -1.6676177978515625, -1.60455322265625, -1.5414886474609375, -1.478424072265625, -1.4153594970703125, -1.352294921875, -1.2892303466796875, -1.226165771484375, -1.1631011962890625, -1.10003662109375, -1.0369720458984375, -0.973907470703125, -0.9108428955078125, -0.8477783203125, -0.7847137451171875, -0.721649169921875, -0.6585845947265625, -0.59552001953125, -0.5324554443359375, -0.469390869140625, -0.4063262939453125, -0.34326171875, -0.2801971435546875, -0.217132568359375, -0.1540679931640625, -0.09100341796875, -0.0279388427734375, 0.035125732421875, 0.0981903076171875, 0.1612548828125, 0.2243194580078125, 0.287384033203125, 0.3504486083984375, 0.41351318359375, 0.4765777587890625, 0.539642333984375, 0.6027069091796875, 0.665771484375, 0.7288360595703125, 0.791900634765625, 0.8549652099609375, 0.91802978515625, 0.9810943603515625, 1.044158935546875, 1.1072235107421875, 1.1702880859375, 1.2333526611328125, 1.296417236328125, 1.3594818115234375, 1.42254638671875, 1.4856109619140625, 1.548675537109375, 1.6117401123046875, 1.6748046875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 906.0, 108.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-430.1242370605469, -422.2818908691406, -414.4395446777344, -406.5971984863281, -398.7548522949219, -390.9125061035156, -383.0701599121094, -375.2278137207031, -367.3854675292969, -359.5431213378906, -351.7007751464844, -343.8584289550781, -336.0160827636719, -328.1737365722656, -320.3313903808594, -312.4890441894531, -304.6466979980469, -296.8043518066406, -288.9620056152344, -281.1196594238281, -273.2773132324219, -265.4349670410156, -257.5926208496094, -249.75027465820312, -241.9079132080078, -234.06556701660156, -226.2232208251953, -218.38087463378906, -210.5385284423828, -202.69618225097656, -194.8538360595703, -187.01148986816406, -179.16912841796875, -171.3267822265625, -163.48443603515625, -155.64208984375, -147.79974365234375, -139.9573974609375, -132.11505126953125, -124.272705078125, -116.43035888671875, -108.5880126953125, -100.74566650390625, -92.9033203125, -85.06097412109375, -77.2186279296875, -69.37628173828125, -61.533931732177734, -53.69158935546875, -45.8492431640625, -38.00689697265625, -30.164548873901367, -22.322202682495117, -14.479854583740234, -6.637508392333984, 1.2048377990722656, 9.047183990478516, 16.889530181884766, 24.731876373291016, 32.57422637939453, 40.41657257080078, 48.25891876220703, 56.10126495361328, 63.94361114501953, 71.78595733642578]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 12.0, 19.0, 15.0, 31.0, 48.0, 62.0, 69.0, 109.0, 95.0, 105.0, 88.0, 88.0, 72.0, 58.0, 43.0, 24.0, 27.0, 17.0, 9.0, 6.0, 7.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.358285903930664, -20.849388122558594, -20.340490341186523, -19.831592559814453, -19.322694778442383, -18.813796997070312, -18.304899215698242, -17.796001434326172, -17.2871036529541, -16.77820587158203, -16.26930809020996, -15.76041030883789, -15.25151252746582, -14.74261474609375, -14.23371696472168, -13.72481918334961, -13.215920448303223, -12.707022666931152, -12.198124885559082, -11.689227104187012, -11.180329322814941, -10.671431541442871, -10.162532806396484, -9.653635025024414, -9.144737243652344, -8.635839462280273, -8.126941680908203, -7.618043899536133, -7.1091461181640625, -6.600248336791992, -6.091350078582764, -5.582452297210693, -5.073554992675781, -4.564657211303711, -4.055759429931641, -3.546861410140991, -3.037963628768921, -2.5290658473968506, -2.020167827606201, -1.5112700462341309, -1.0023722648620605, -0.49347442388534546, 0.015423417091369629, 0.5243213176727295, 1.0332190990447998, 1.5421168804168701, 2.0510149002075195, 2.55991268157959, 3.06881046295166, 3.5777082443237305, 4.086606025695801, 4.595503807067871, 5.104401588439941, 5.613299369812012, 6.12219762802124, 6.6310954093933105, 7.139993190765381, 7.648890972137451, 8.15778923034668, 8.66668701171875, 9.17558479309082, 9.68448257446289, 10.193380355834961, 10.702278137207031, 11.211175918579102]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 9.0, 12.0, 11.0, 15.0, 18.0, 21.0, 25.0, 32.0, 48.0, 49.0, 68.0, 97.0, 372.0, 12238.0, 743638.0, 287306.0, 4004.0, 214.0, 82.0, 53.0, 54.0, 49.0, 22.0, 20.0, 26.0, 17.0, 15.0, 12.0, 6.0, 6.0, 1.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.65625, -19.98681640625, -19.3173828125, -18.64794921875, -17.978515625, -17.30908203125, -16.6396484375, -15.97021484375, -15.30078125, -14.63134765625, -13.9619140625, -13.29248046875, -12.623046875, -11.95361328125, -11.2841796875, -10.61474609375, -9.9453125, -9.27587890625, -8.6064453125, -7.93701171875, -7.267578125, -6.59814453125, -5.9287109375, -5.25927734375, -4.58984375, -3.92041015625, -3.2509765625, -2.58154296875, -1.912109375, -1.24267578125, -0.5732421875, 0.09619140625, 0.765625, 1.43505859375, 2.1044921875, 2.77392578125, 3.443359375, 4.11279296875, 4.7822265625, 5.45166015625, 6.12109375, 6.79052734375, 7.4599609375, 8.12939453125, 8.798828125, 9.46826171875, 10.1376953125, 10.80712890625, 11.4765625, 12.14599609375, 12.8154296875, 13.48486328125, 14.154296875, 14.82373046875, 15.4931640625, 16.16259765625, 16.83203125, 17.50146484375, 18.1708984375, 18.84033203125, 19.509765625, 20.17919921875, 20.8486328125, 21.51806640625, 22.1875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 19.0, 41.0, 84.0, 151.0, 211.0, 214.0, 157.0, 79.0, 43.0, 9.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.904296875, -2.8424072265625, -2.780517578125, -2.7186279296875, -2.65673828125, -2.5948486328125, -2.532958984375, -2.4710693359375, -2.4091796875, -2.3472900390625, -2.285400390625, -2.2235107421875, -2.16162109375, -2.0997314453125, -2.037841796875, -1.9759521484375, -1.9140625, -1.8521728515625, -1.790283203125, -1.7283935546875, -1.66650390625, -1.6046142578125, -1.542724609375, -1.4808349609375, -1.4189453125, -1.3570556640625, -1.295166015625, -1.2332763671875, -1.17138671875, -1.1094970703125, -1.047607421875, -0.9857177734375, -0.923828125, -0.8619384765625, -0.800048828125, -0.7381591796875, -0.67626953125, -0.6143798828125, -0.552490234375, -0.4906005859375, -0.4287109375, -0.3668212890625, -0.304931640625, -0.2430419921875, -0.18115234375, -0.1192626953125, -0.057373046875, 0.0045166015625, 0.06640625, 0.1282958984375, 0.190185546875, 0.2520751953125, 0.31396484375, 0.3758544921875, 0.437744140625, 0.4996337890625, 0.5615234375, 0.6234130859375, 0.685302734375, 0.7471923828125, 0.80908203125, 0.8709716796875, 0.932861328125, 0.9947509765625, 1.056640625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 3.0, 2.0, 2.0, 5.0, 6.0, 7.0, 7.0, 18.0, 18.0, 31.0, 30.0, 57.0, 80.0, 150.0, 254.0, 517.0, 1239.0, 3550.0, 14416.0, 81017.0, 468533.0, 395708.0, 65330.0, 12210.0, 3148.0, 1120.0, 444.0, 252.0, 134.0, 86.0, 49.0, 38.0, 30.0, 16.0, 18.0, 8.0, 12.0, 1.0, 2.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.8125, -8.5079345703125, -8.203369140625, -7.8988037109375, -7.59423828125, -7.2896728515625, -6.985107421875, -6.6805419921875, -6.3759765625, -6.0714111328125, -5.766845703125, -5.4622802734375, -5.15771484375, -4.8531494140625, -4.548583984375, -4.2440185546875, -3.939453125, -3.6348876953125, -3.330322265625, -3.0257568359375, -2.72119140625, -2.4166259765625, -2.112060546875, -1.8074951171875, -1.5029296875, -1.1983642578125, -0.893798828125, -0.5892333984375, -0.28466796875, 0.0198974609375, 0.324462890625, 0.6290283203125, 0.93359375, 1.2381591796875, 1.542724609375, 1.8472900390625, 2.15185546875, 2.4564208984375, 2.760986328125, 3.0655517578125, 3.3701171875, 3.6746826171875, 3.979248046875, 4.2838134765625, 4.58837890625, 4.8929443359375, 5.197509765625, 5.5020751953125, 5.806640625, 6.1112060546875, 6.415771484375, 6.7203369140625, 7.02490234375, 7.3294677734375, 7.634033203125, 7.9385986328125, 8.2431640625, 8.5477294921875, 8.852294921875, 9.1568603515625, 9.46142578125, 9.7659912109375, 10.070556640625, 10.3751220703125, 10.6796875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 5.0, 10.0, 4.0, 8.0, 6.0, 7.0, 19.0, 13.0, 24.0, 34.0, 25.0, 31.0, 33.0, 40.0, 52.0, 38.0, 47.0, 36.0, 47.0, 50.0, 44.0, 42.0, 48.0, 42.0, 32.0, 32.0, 41.0, 41.0, 33.0, 22.0, 18.0, 27.0, 11.0, 9.0, 8.0, 11.0, 7.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.345703125, -3.23114013671875, -3.1165771484375, -3.00201416015625, -2.887451171875, -2.77288818359375, -2.6583251953125, -2.54376220703125, -2.42919921875, -2.31463623046875, -2.2000732421875, -2.08551025390625, -1.970947265625, -1.85638427734375, -1.7418212890625, -1.62725830078125, -1.5126953125, -1.39813232421875, -1.2835693359375, -1.16900634765625, -1.054443359375, -0.93988037109375, -0.8253173828125, -0.71075439453125, -0.59619140625, -0.48162841796875, -0.3670654296875, -0.25250244140625, -0.137939453125, -0.02337646484375, 0.0911865234375, 0.20574951171875, 0.3203125, 0.43487548828125, 0.5494384765625, 0.66400146484375, 0.778564453125, 0.89312744140625, 1.0076904296875, 1.12225341796875, 1.23681640625, 1.35137939453125, 1.4659423828125, 1.58050537109375, 1.695068359375, 1.80963134765625, 1.9241943359375, 2.03875732421875, 2.1533203125, 2.26788330078125, 2.3824462890625, 2.49700927734375, 2.611572265625, 2.72613525390625, 2.8406982421875, 2.95526123046875, 3.06982421875, 3.18438720703125, 3.2989501953125, 3.41351318359375, 3.528076171875, 3.64263916015625, 3.7572021484375, 3.87176513671875, 3.986328125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 3.0, 7.0, 7.0, 12.0, 16.0, 22.0, 29.0, 44.0, 70.0, 145.0, 292.0, 611.0, 1740.0, 5526.0, 24582.0, 169231.0, 644694.0, 168601.0, 24238.0, 5653.0, 1747.0, 605.0, 299.0, 142.0, 80.0, 38.0, 30.0, 30.0, 18.0, 7.0, 12.0, 8.0, 2.0, 1.0, 0.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8515625, -7.5660400390625, -7.280517578125, -6.9949951171875, -6.70947265625, -6.4239501953125, -6.138427734375, -5.8529052734375, -5.5673828125, -5.2818603515625, -4.996337890625, -4.7108154296875, -4.42529296875, -4.1397705078125, -3.854248046875, -3.5687255859375, -3.283203125, -2.9976806640625, -2.712158203125, -2.4266357421875, -2.14111328125, -1.8555908203125, -1.570068359375, -1.2845458984375, -0.9990234375, -0.7135009765625, -0.427978515625, -0.1424560546875, 0.14306640625, 0.4285888671875, 0.714111328125, 0.9996337890625, 1.28515625, 1.5706787109375, 1.856201171875, 2.1417236328125, 2.42724609375, 2.7127685546875, 2.998291015625, 3.2838134765625, 3.5693359375, 3.8548583984375, 4.140380859375, 4.4259033203125, 4.71142578125, 4.9969482421875, 5.282470703125, 5.5679931640625, 5.853515625, 6.1390380859375, 6.424560546875, 6.7100830078125, 6.99560546875, 7.2811279296875, 7.566650390625, 7.8521728515625, 8.1376953125, 8.4232177734375, 8.708740234375, 8.9942626953125, 9.27978515625, 9.5653076171875, 9.850830078125, 10.1363525390625, 10.421875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 7.0, 13.0, 12.0, 14.0, 21.0, 23.0, 38.0, 33.0, 51.0, 53.0, 74.0, 60.0, 103.0, 82.0, 73.0, 61.0, 64.0, 46.0, 38.0, 22.0, 30.0, 18.0, 15.0, 6.0, 10.0, 7.0, 7.0, 5.0, 5.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00069427490234375, -0.0006744042038917542, -0.0006545335054397583, -0.0006346628069877625, -0.0006147921085357666, -0.0005949214100837708, -0.0005750507116317749, -0.000555180013179779, -0.0005353093147277832, -0.0005154386162757874, -0.0004955679178237915, -0.00047569721937179565, -0.0004558265209197998, -0.00043595582246780396, -0.0004160851240158081, -0.00039621442556381226, -0.0003763437271118164, -0.00035647302865982056, -0.0003366023302078247, -0.00031673163175582886, -0.000296860933303833, -0.00027699023485183716, -0.0002571195363998413, -0.00023724883794784546, -0.0002173781394958496, -0.00019750744104385376, -0.0001776367425918579, -0.00015776604413986206, -0.0001378953456878662, -0.00011802464723587036, -9.815394878387451e-05, -7.828325033187866e-05, -5.841255187988281e-05, -3.854185342788696e-05, -1.8671154975891113e-05, 1.1995434761047363e-06, 2.1070241928100586e-05, 4.0940940380096436e-05, 6.0811638832092285e-05, 8.068233728408813e-05, 0.00010055303573608398, 0.00012042373418807983, 0.00014029443264007568, 0.00016016513109207153, 0.00018003582954406738, 0.00019990652799606323, 0.00021977722644805908, 0.00023964792490005493, 0.0002595186233520508, 0.00027938932180404663, 0.0002992600202560425, 0.00031913071870803833, 0.0003390014171600342, 0.00035887211561203003, 0.0003787428140640259, 0.00039861351251602173, 0.0004184842109680176, 0.00043835490942001343, 0.0004582256078720093, 0.0004780963063240051, 0.000497967004776001, 0.0005178377032279968, 0.0005377084016799927, 0.0005575791001319885, 0.0005774497985839844]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 3.0, 2.0, 3.0, 5.0, 10.0, 12.0, 22.0, 24.0, 40.0, 57.0, 102.0, 139.0, 227.0, 407.0, 791.0, 1854.0, 5468.0, 25368.0, 181190.0, 630168.0, 170067.0, 23919.0, 5239.0, 1809.0, 716.0, 349.0, 204.0, 113.0, 74.0, 50.0, 32.0, 22.0, 21.0, 4.0, 9.0, 10.0, 3.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1953125, -7.926513671875, -7.65771484375, -7.388916015625, -7.1201171875, -6.851318359375, -6.58251953125, -6.313720703125, -6.044921875, -5.776123046875, -5.50732421875, -5.238525390625, -4.9697265625, -4.700927734375, -4.43212890625, -4.163330078125, -3.89453125, -3.625732421875, -3.35693359375, -3.088134765625, -2.8193359375, -2.550537109375, -2.28173828125, -2.012939453125, -1.744140625, -1.475341796875, -1.20654296875, -0.937744140625, -0.6689453125, -0.400146484375, -0.13134765625, 0.137451171875, 0.40625, 0.675048828125, 0.94384765625, 1.212646484375, 1.4814453125, 1.750244140625, 2.01904296875, 2.287841796875, 2.556640625, 2.825439453125, 3.09423828125, 3.363037109375, 3.6318359375, 3.900634765625, 4.16943359375, 4.438232421875, 4.70703125, 4.975830078125, 5.24462890625, 5.513427734375, 5.7822265625, 6.051025390625, 6.31982421875, 6.588623046875, 6.857421875, 7.126220703125, 7.39501953125, 7.663818359375, 7.9326171875, 8.201416015625, 8.47021484375, 8.739013671875, 9.0078125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 6.0, 11.0, 4.0, 15.0, 21.0, 33.0, 38.0, 75.0, 89.0, 101.0, 117.0, 92.0, 99.0, 68.0, 60.0, 57.0, 38.0, 23.0, 19.0, 15.0, 9.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.86328125, -5.724822998046875, -5.58636474609375, -5.447906494140625, -5.3094482421875, -5.170989990234375, -5.03253173828125, -4.894073486328125, -4.755615234375, -4.617156982421875, -4.47869873046875, -4.340240478515625, -4.2017822265625, -4.063323974609375, -3.92486572265625, -3.786407470703125, -3.64794921875, -3.509490966796875, -3.37103271484375, -3.232574462890625, -3.0941162109375, -2.955657958984375, -2.81719970703125, -2.678741455078125, -2.540283203125, -2.401824951171875, -2.26336669921875, -2.124908447265625, -1.9864501953125, -1.847991943359375, -1.70953369140625, -1.571075439453125, -1.4326171875, -1.294158935546875, -1.15570068359375, -1.017242431640625, -0.8787841796875, -0.740325927734375, -0.60186767578125, -0.463409423828125, -0.324951171875, -0.186492919921875, -0.04803466796875, 0.090423583984375, 0.2288818359375, 0.367340087890625, 0.50579833984375, 0.644256591796875, 0.78271484375, 0.921173095703125, 1.05963134765625, 1.198089599609375, 1.3365478515625, 1.475006103515625, 1.61346435546875, 1.751922607421875, 1.890380859375, 2.028839111328125, 2.16729736328125, 2.305755615234375, 2.4442138671875, 2.582672119140625, 2.72113037109375, 2.859588623046875, 2.998046875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 8.0, 12.0, 76.0, 507.0, 357.0, 44.0, 9.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-268.2283935546875, -262.7335510253906, -257.23870849609375, -251.7438507080078, -246.24900817871094, -240.75416564941406, -235.2593231201172, -229.76446533203125, -224.26962280273438, -218.7747802734375, -213.27993774414062, -207.7850799560547, -202.2902374267578, -196.79539489746094, -191.30055236816406, -185.80569458007812, -180.31085205078125, -174.81600952148438, -169.3211669921875, -163.82630920410156, -158.3314666748047, -152.8366241455078, -147.34178161621094, -141.846923828125, -136.3520965576172, -130.8572540283203, -125.3624038696289, -119.86756134033203, -114.37271118164062, -108.87786865234375, -103.38302612304688, -97.88817596435547, -92.39332580566406, -86.89848327636719, -81.40363311767578, -75.9087905883789, -70.4139404296875, -64.91909790039062, -59.424251556396484, -53.929405212402344, -48.4345588684082, -42.93971252441406, -37.44486618041992, -31.950021743774414, -26.455175399780273, -20.960329055786133, -15.465484619140625, -9.970638275146484, -4.475791931152344, 1.0190539360046387, 6.513899803161621, 12.008745193481445, 17.503591537475586, 22.998437881469727, 28.493282318115234, 33.988128662109375, 39.482975006103516, 44.977821350097656, 50.4726676940918, 55.96751403808594, 61.46235656738281, 66.95720672607422, 72.4520492553711, 77.9468994140625, 83.44174194335938]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 10.0, 5.0, 9.0, 18.0, 17.0, 32.0, 28.0, 52.0, 45.0, 58.0, 73.0, 66.0, 67.0, 65.0, 79.0, 73.0, 79.0, 51.0, 43.0, 32.0, 30.0, 23.0, 13.0, 13.0, 11.0, 4.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.706134796142578, -27.579944610595703, -26.453752517700195, -25.32756233215332, -24.201370239257812, -23.075180053710938, -21.948989868164062, -20.822799682617188, -19.69660758972168, -18.570417404174805, -17.444225311279297, -16.318035125732422, -15.19184398651123, -14.065652847290039, -12.939462661743164, -11.813271522521973, -10.687080383300781, -9.56088924407959, -8.434698104858398, -7.308507919311523, -6.182316780090332, -5.056125640869141, -3.9299349784851074, -2.803744316101074, -1.6775531768798828, -0.5513622760772705, 0.5748286247253418, 1.701019525527954, 2.8272104263305664, 3.953401565551758, 5.079592227935791, 6.205782890319824, 7.331977844238281, 8.458168983459473, 9.584360122680664, 10.710550308227539, 11.83674144744873, 12.962932586669922, 14.089122772216797, 15.215313911437988, 16.34150505065918, 17.467695236206055, 18.593887329101562, 19.720077514648438, 20.846267700195312, 21.97245979309082, 23.098649978637695, 24.224842071533203, 25.351032257080078, 26.477222442626953, 27.60341453552246, 28.729604721069336, 29.855796813964844, 30.98198699951172, 32.108177185058594, 33.23436737060547, 34.360557556152344, 35.48674774169922, 36.612937927246094, 37.739131927490234, 38.86532211303711, 39.991512298583984, 41.11770248413086, 42.243892669677734, 43.370086669921875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 9.0, 9.0, 23.0, 51.0, 129.0, 348.0, 2011.0, 4034860.0, 155469.0, 1151.0, 168.0, 48.0, 10.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-130.0, -127.3408203125, -124.681640625, -122.0224609375, -119.36328125, -116.7041015625, -114.044921875, -111.3857421875, -108.7265625, -106.0673828125, -103.408203125, -100.7490234375, -98.08984375, -95.4306640625, -92.771484375, -90.1123046875, -87.453125, -84.7939453125, -82.134765625, -79.4755859375, -76.81640625, -74.1572265625, -71.498046875, -68.8388671875, -66.1796875, -63.5205078125, -60.861328125, -58.2021484375, -55.54296875, -52.8837890625, -50.224609375, -47.5654296875, -44.90625, -42.2470703125, -39.587890625, -36.9287109375, -34.26953125, -31.6103515625, -28.951171875, -26.2919921875, -23.6328125, -20.9736328125, -18.314453125, -15.6552734375, -12.99609375, -10.3369140625, -7.677734375, -5.0185546875, -2.359375, 0.2998046875, 2.958984375, 5.6181640625, 8.27734375, 10.9365234375, 13.595703125, 16.2548828125, 18.9140625, 21.5732421875, 24.232421875, 26.8916015625, 29.55078125, 32.2099609375, 34.869140625, 37.5283203125, 40.1875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 11.0, 40.0, 78.0, 145.0, 164.0, 207.0, 176.0, 109.0, 46.0, 24.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.171875, -3.1002197265625, -3.028564453125, -2.9569091796875, -2.88525390625, -2.8135986328125, -2.741943359375, -2.6702880859375, -2.5986328125, -2.5269775390625, -2.455322265625, -2.3836669921875, -2.31201171875, -2.2403564453125, -2.168701171875, -2.0970458984375, -2.025390625, -1.9537353515625, -1.882080078125, -1.8104248046875, -1.73876953125, -1.6671142578125, -1.595458984375, -1.5238037109375, -1.4521484375, -1.3804931640625, -1.308837890625, -1.2371826171875, -1.16552734375, -1.0938720703125, -1.022216796875, -0.9505615234375, -0.87890625, -0.8072509765625, -0.735595703125, -0.6639404296875, -0.59228515625, -0.5206298828125, -0.448974609375, -0.3773193359375, -0.3056640625, -0.2340087890625, -0.162353515625, -0.0906982421875, -0.01904296875, 0.0526123046875, 0.124267578125, 0.1959228515625, 0.267578125, 0.3392333984375, 0.410888671875, 0.4825439453125, 0.55419921875, 0.6258544921875, 0.697509765625, 0.7691650390625, 0.8408203125, 0.9124755859375, 0.984130859375, 1.0557861328125, 1.12744140625, 1.1990966796875, 1.270751953125, 1.3424072265625, 1.4140625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 8.0, 20.0, 34.0, 66.0, 99.0, 176.0, 357.0, 4581.0, 4187377.0, 987.0, 270.0, 140.0, 90.0, 46.0, 24.0, 10.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-216.625, -212.14453125, -207.6640625, -203.18359375, -198.703125, -194.22265625, -189.7421875, -185.26171875, -180.78125, -176.30078125, -171.8203125, -167.33984375, -162.859375, -158.37890625, -153.8984375, -149.41796875, -144.9375, -140.45703125, -135.9765625, -131.49609375, -127.015625, -122.53515625, -118.0546875, -113.57421875, -109.09375, -104.61328125, -100.1328125, -95.65234375, -91.171875, -86.69140625, -82.2109375, -77.73046875, -73.25, -68.76953125, -64.2890625, -59.80859375, -55.328125, -50.84765625, -46.3671875, -41.88671875, -37.40625, -32.92578125, -28.4453125, -23.96484375, -19.484375, -15.00390625, -10.5234375, -6.04296875, -1.5625, 2.91796875, 7.3984375, 11.87890625, 16.359375, 20.83984375, 25.3203125, 29.80078125, 34.28125, 38.76171875, 43.2421875, 47.72265625, 52.203125, 56.68359375, 61.1640625, 65.64453125, 70.125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 7.0, 12.0, 44.0, 158.0, 913.0, 2595.0, 249.0, 65.0, 26.0, 11.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.7265625, -13.47320556640625, -13.2198486328125, -12.96649169921875, -12.713134765625, -12.45977783203125, -12.2064208984375, -11.95306396484375, -11.69970703125, -11.44635009765625, -11.1929931640625, -10.93963623046875, -10.686279296875, -10.43292236328125, -10.1795654296875, -9.92620849609375, -9.6728515625, -9.41949462890625, -9.1661376953125, -8.91278076171875, -8.659423828125, -8.40606689453125, -8.1527099609375, -7.89935302734375, -7.64599609375, -7.39263916015625, -7.1392822265625, -6.88592529296875, -6.632568359375, -6.37921142578125, -6.1258544921875, -5.87249755859375, -5.619140625, -5.36578369140625, -5.1124267578125, -4.85906982421875, -4.605712890625, -4.35235595703125, -4.0989990234375, -3.84564208984375, -3.59228515625, -3.33892822265625, -3.0855712890625, -2.83221435546875, -2.578857421875, -2.32550048828125, -2.0721435546875, -1.81878662109375, -1.5654296875, -1.31207275390625, -1.0587158203125, -0.80535888671875, -0.552001953125, -0.29864501953125, -0.0452880859375, 0.20806884765625, 0.46142578125, 0.71478271484375, 0.9681396484375, 1.22149658203125, 1.474853515625, 1.72821044921875, 1.9815673828125, 2.23492431640625, 2.48828125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 59.0, 837.0, 97.0, 9.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-252.95411682128906, -245.8665771484375, -238.77903747558594, -231.69149780273438, -224.6039581298828, -217.51641845703125, -210.42889404296875, -203.34133911132812, -196.25381469726562, -189.16627502441406, -182.0787353515625, -174.99119567871094, -167.90365600585938, -160.8161163330078, -153.72857666015625, -146.64105224609375, -139.55349731445312, -132.46595764160156, -125.37841796875, -118.29087829589844, -111.20333862304688, -104.11579895019531, -97.02826690673828, -89.94072723388672, -82.85318756103516, -75.7656478881836, -68.67810821533203, -61.590572357177734, -54.50303268432617, -47.41549301147461, -40.32795715332031, -33.24041748046875, -26.152877807617188, -19.065338134765625, -11.977800369262695, -4.890262603759766, 2.197277069091797, 9.28481674194336, 16.372352600097656, 23.45989227294922, 30.54743194580078, 37.634971618652344, 44.722511291503906, 51.8100471496582, 58.897586822509766, 65.98512268066406, 73.07266235351562, 80.16020202636719, 87.24774169921875, 94.33528137207031, 101.42282104492188, 108.51036071777344, 115.597900390625, 122.68544006347656, 129.77297973632812, 136.86050415039062, 143.94805908203125, 151.0355987548828, 158.12313842773438, 165.21067810058594, 172.2982177734375, 179.38575744628906, 186.47329711914062, 193.56082153320312, 200.6483612060547]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 1.0, 11.0, 24.0, 37.0, 50.0, 90.0, 95.0, 137.0, 131.0, 130.0, 107.0, 83.0, 39.0, 31.0, 16.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.93144989013672, -29.90447235107422, -28.87749481201172, -27.85051727294922, -26.82353973388672, -25.79656219482422, -24.769582748413086, -23.742605209350586, -22.715627670288086, -21.688650131225586, -20.661672592163086, -19.634695053100586, -18.607715606689453, -17.580738067626953, -16.553760528564453, -15.526782989501953, -14.499805450439453, -13.472827911376953, -12.445850372314453, -11.418871879577637, -10.391894340515137, -9.364916801452637, -8.33793830871582, -7.31096076965332, -6.28398323059082, -5.25700569152832, -4.230027675628662, -3.203049898147583, -2.176072120666504, -1.149094581604004, -0.1221165657043457, 0.9048614501953125, 1.9318389892578125, 2.9588167667388916, 3.9857945442199707, 5.012772560119629, 6.039750099182129, 7.066727638244629, 8.093706130981445, 9.120683670043945, 10.147661209106445, 11.174638748168945, 12.201616287231445, 13.228594779968262, 14.255572319030762, 15.282549858093262, 16.309528350830078, 17.336505889892578, 18.363483428955078, 19.390460968017578, 20.417438507080078, 21.444416046142578, 22.471393585205078, 23.498371124267578, 24.52535057067871, 25.55232810974121, 26.57930564880371, 27.60628318786621, 28.63326072692871, 29.66023826599121, 30.687217712402344, 31.714195251464844, 32.741172790527344, 33.768150329589844, 34.795127868652344]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 3.0, 4.0, 9.0, 10.0, 17.0, 15.0, 31.0, 22.0, 47.0, 93.0, 129.0, 283.0, 662.0, 2057.0, 12946.0, 326219.0, 675372.0, 25870.0, 3037.0, 884.0, 354.0, 185.0, 97.0, 55.0, 38.0, 32.0, 24.0, 13.0, 18.0, 13.0, 5.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.9375, -30.081298828125, -29.22509765625, -28.368896484375, -27.5126953125, -26.656494140625, -25.80029296875, -24.944091796875, -24.087890625, -23.231689453125, -22.37548828125, -21.519287109375, -20.6630859375, -19.806884765625, -18.95068359375, -18.094482421875, -17.23828125, -16.382080078125, -15.52587890625, -14.669677734375, -13.8134765625, -12.957275390625, -12.10107421875, -11.244873046875, -10.388671875, -9.532470703125, -8.67626953125, -7.820068359375, -6.9638671875, -6.107666015625, -5.25146484375, -4.395263671875, -3.5390625, -2.682861328125, -1.82666015625, -0.970458984375, -0.1142578125, 0.741943359375, 1.59814453125, 2.454345703125, 3.310546875, 4.166748046875, 5.02294921875, 5.879150390625, 6.7353515625, 7.591552734375, 8.44775390625, 9.303955078125, 10.16015625, 11.016357421875, 11.87255859375, 12.728759765625, 13.5849609375, 14.441162109375, 15.29736328125, 16.153564453125, 17.009765625, 17.865966796875, 18.72216796875, 19.578369140625, 20.4345703125, 21.290771484375, 22.14697265625, 23.003173828125, 23.859375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 3.0, 11.0, 34.0, 73.0, 101.0, 144.0, 159.0, 175.0, 145.0, 85.0, 40.0, 18.0, 9.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.56640625, -3.478851318359375, -3.39129638671875, -3.303741455078125, -3.2161865234375, -3.128631591796875, -3.04107666015625, -2.953521728515625, -2.865966796875, -2.778411865234375, -2.69085693359375, -2.603302001953125, -2.5157470703125, -2.428192138671875, -2.34063720703125, -2.253082275390625, -2.16552734375, -2.077972412109375, -1.99041748046875, -1.902862548828125, -1.8153076171875, -1.727752685546875, -1.64019775390625, -1.552642822265625, -1.465087890625, -1.377532958984375, -1.28997802734375, -1.202423095703125, -1.1148681640625, -1.027313232421875, -0.93975830078125, -0.852203369140625, -0.7646484375, -0.677093505859375, -0.58953857421875, -0.501983642578125, -0.4144287109375, -0.326873779296875, -0.23931884765625, -0.151763916015625, -0.064208984375, 0.023345947265625, 0.11090087890625, 0.198455810546875, 0.2860107421875, 0.373565673828125, 0.46112060546875, 0.548675537109375, 0.63623046875, 0.723785400390625, 0.81134033203125, 0.898895263671875, 0.9864501953125, 1.074005126953125, 1.16156005859375, 1.249114990234375, 1.336669921875, 1.424224853515625, 1.51177978515625, 1.599334716796875, 1.6868896484375, 1.774444580078125, 1.86199951171875, 1.949554443359375, 2.037109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 5.0, 5.0, 9.0, 9.0, 11.0, 20.0, 24.0, 26.0, 36.0, 52.0, 68.0, 83.0, 159.0, 303.0, 722.0, 2333.0, 12671.0, 167358.0, 763582.0, 89718.0, 8307.0, 1796.0, 563.0, 244.0, 136.0, 96.0, 59.0, 41.0, 24.0, 28.0, 15.0, 15.0, 16.0, 2.0, 8.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-19.3125, -18.7818603515625, -18.251220703125, -17.7205810546875, -17.18994140625, -16.6593017578125, -16.128662109375, -15.5980224609375, -15.0673828125, -14.5367431640625, -14.006103515625, -13.4754638671875, -12.94482421875, -12.4141845703125, -11.883544921875, -11.3529052734375, -10.822265625, -10.2916259765625, -9.760986328125, -9.2303466796875, -8.69970703125, -8.1690673828125, -7.638427734375, -7.1077880859375, -6.5771484375, -6.0465087890625, -5.515869140625, -4.9852294921875, -4.45458984375, -3.9239501953125, -3.393310546875, -2.8626708984375, -2.33203125, -1.8013916015625, -1.270751953125, -0.7401123046875, -0.20947265625, 0.3211669921875, 0.851806640625, 1.3824462890625, 1.9130859375, 2.4437255859375, 2.974365234375, 3.5050048828125, 4.03564453125, 4.5662841796875, 5.096923828125, 5.6275634765625, 6.158203125, 6.6888427734375, 7.219482421875, 7.7501220703125, 8.28076171875, 8.8114013671875, 9.342041015625, 9.8726806640625, 10.4033203125, 10.9339599609375, 11.464599609375, 11.9952392578125, 12.52587890625, 13.0565185546875, 13.587158203125, 14.1177978515625, 14.6484375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 3.0, 7.0, 3.0, 12.0, 10.0, 12.0, 16.0, 19.0, 43.0, 23.0, 37.0, 44.0, 44.0, 48.0, 50.0, 39.0, 67.0, 64.0, 55.0, 58.0, 42.0, 45.0, 53.0, 36.0, 23.0, 23.0, 29.0, 19.0, 20.0, 13.0, 10.0, 6.0, 11.0, 3.0, 3.0, 8.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.4140625, -6.237548828125, -6.06103515625, -5.884521484375, -5.7080078125, -5.531494140625, -5.35498046875, -5.178466796875, -5.001953125, -4.825439453125, -4.64892578125, -4.472412109375, -4.2958984375, -4.119384765625, -3.94287109375, -3.766357421875, -3.58984375, -3.413330078125, -3.23681640625, -3.060302734375, -2.8837890625, -2.707275390625, -2.53076171875, -2.354248046875, -2.177734375, -2.001220703125, -1.82470703125, -1.648193359375, -1.4716796875, -1.295166015625, -1.11865234375, -0.942138671875, -0.765625, -0.589111328125, -0.41259765625, -0.236083984375, -0.0595703125, 0.116943359375, 0.29345703125, 0.469970703125, 0.646484375, 0.822998046875, 0.99951171875, 1.176025390625, 1.3525390625, 1.529052734375, 1.70556640625, 1.882080078125, 2.05859375, 2.235107421875, 2.41162109375, 2.588134765625, 2.7646484375, 2.941162109375, 3.11767578125, 3.294189453125, 3.470703125, 3.647216796875, 3.82373046875, 4.000244140625, 4.1767578125, 4.353271484375, 4.52978515625, 4.706298828125, 4.8828125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 3.0, 4.0, 7.0, 5.0, 15.0, 19.0, 24.0, 38.0, 64.0, 116.0, 203.0, 409.0, 863.0, 2160.0, 7030.0, 37347.0, 388940.0, 542942.0, 54581.0, 9076.0, 2645.0, 1017.0, 455.0, 254.0, 111.0, 78.0, 48.0, 36.0, 13.0, 5.0, 11.0, 4.0, 12.0, 5.0, 1.0, 2.0, 2.0, 4.0, 6.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.28125, -7.9638671875, -7.646484375, -7.3291015625, -7.01171875, -6.6943359375, -6.376953125, -6.0595703125, -5.7421875, -5.4248046875, -5.107421875, -4.7900390625, -4.47265625, -4.1552734375, -3.837890625, -3.5205078125, -3.203125, -2.8857421875, -2.568359375, -2.2509765625, -1.93359375, -1.6162109375, -1.298828125, -0.9814453125, -0.6640625, -0.3466796875, -0.029296875, 0.2880859375, 0.60546875, 0.9228515625, 1.240234375, 1.5576171875, 1.875, 2.1923828125, 2.509765625, 2.8271484375, 3.14453125, 3.4619140625, 3.779296875, 4.0966796875, 4.4140625, 4.7314453125, 5.048828125, 5.3662109375, 5.68359375, 6.0009765625, 6.318359375, 6.6357421875, 6.953125, 7.2705078125, 7.587890625, 7.9052734375, 8.22265625, 8.5400390625, 8.857421875, 9.1748046875, 9.4921875, 9.8095703125, 10.126953125, 10.4443359375, 10.76171875, 11.0791015625, 11.396484375, 11.7138671875, 12.03125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 7.0, 7.0, 7.0, 6.0, 11.0, 13.0, 30.0, 29.0, 53.0, 60.0, 81.0, 96.0, 95.0, 93.0, 97.0, 74.0, 60.0, 43.0, 32.0, 44.0, 20.0, 16.0, 5.0, 7.0, 4.0, 4.0, 1.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009002685546875, -0.0008752793073654175, -0.000850290060043335, -0.0008253008127212524, -0.0008003115653991699, -0.0007753223180770874, -0.0007503330707550049, -0.0007253438234329224, -0.0007003545761108398, -0.0006753653287887573, -0.0006503760814666748, -0.0006253868341445923, -0.0006003975868225098, -0.0005754083395004272, -0.0005504190921783447, -0.0005254298448562622, -0.0005004405975341797, -0.00047545135021209717, -0.00045046210289001465, -0.00042547285556793213, -0.0004004836082458496, -0.0003754943609237671, -0.00035050511360168457, -0.00032551586627960205, -0.00030052661895751953, -0.000275537371635437, -0.0002505481243133545, -0.00022555887699127197, -0.00020056962966918945, -0.00017558038234710693, -0.00015059113502502441, -0.0001256018877029419, -0.00010061264038085938, -7.562339305877686e-05, -5.0634145736694336e-05, -2.5644898414611816e-05, -6.556510925292969e-07, 2.4333596229553223e-05, 4.932284355163574e-05, 7.431209087371826e-05, 9.930133819580078e-05, 0.0001242905855178833, 0.00014927983283996582, 0.00017426908016204834, 0.00019925832748413086, 0.00022424757480621338, 0.0002492368221282959, 0.0002742260694503784, 0.00029921531677246094, 0.00032420456409454346, 0.000349193811416626, 0.0003741830587387085, 0.000399172306060791, 0.00042416155338287354, 0.00044915080070495605, 0.0004741400480270386, 0.0004991292953491211, 0.0005241185426712036, 0.0005491077899932861, 0.0005740970373153687, 0.0005990862846374512, 0.0006240755319595337, 0.0006490647792816162, 0.0006740540266036987, 0.0006990432739257812]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 11.0, 14.0, 16.0, 24.0, 22.0, 30.0, 46.0, 62.0, 99.0, 191.0, 351.0, 798.0, 1860.0, 6770.0, 41559.0, 383626.0, 532001.0, 66832.0, 9798.0, 2466.0, 985.0, 409.0, 200.0, 122.0, 61.0, 56.0, 41.0, 16.0, 18.0, 14.0, 5.0, 6.0, 3.0, 3.0, 3.0, 5.0, 3.0, 2.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-9.3125, -9.0224609375, -8.732421875, -8.4423828125, -8.15234375, -7.8623046875, -7.572265625, -7.2822265625, -6.9921875, -6.7021484375, -6.412109375, -6.1220703125, -5.83203125, -5.5419921875, -5.251953125, -4.9619140625, -4.671875, -4.3818359375, -4.091796875, -3.8017578125, -3.51171875, -3.2216796875, -2.931640625, -2.6416015625, -2.3515625, -2.0615234375, -1.771484375, -1.4814453125, -1.19140625, -0.9013671875, -0.611328125, -0.3212890625, -0.03125, 0.2587890625, 0.548828125, 0.8388671875, 1.12890625, 1.4189453125, 1.708984375, 1.9990234375, 2.2890625, 2.5791015625, 2.869140625, 3.1591796875, 3.44921875, 3.7392578125, 4.029296875, 4.3193359375, 4.609375, 4.8994140625, 5.189453125, 5.4794921875, 5.76953125, 6.0595703125, 6.349609375, 6.6396484375, 6.9296875, 7.2197265625, 7.509765625, 7.7998046875, 8.08984375, 8.3798828125, 8.669921875, 8.9599609375, 9.25]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 3.0, 3.0, 5.0, 10.0, 5.0, 8.0, 12.0, 19.0, 14.0, 25.0, 30.0, 26.0, 52.0, 48.0, 47.0, 60.0, 82.0, 79.0, 57.0, 72.0, 51.0, 57.0, 57.0, 37.0, 35.0, 21.0, 17.0, 14.0, 15.0, 9.0, 14.0, 9.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.78125, -3.661895751953125, -3.54254150390625, -3.423187255859375, -3.3038330078125, -3.184478759765625, -3.06512451171875, -2.945770263671875, -2.826416015625, -2.707061767578125, -2.58770751953125, -2.468353271484375, -2.3489990234375, -2.229644775390625, -2.11029052734375, -1.990936279296875, -1.87158203125, -1.752227783203125, -1.63287353515625, -1.513519287109375, -1.3941650390625, -1.274810791015625, -1.15545654296875, -1.036102294921875, -0.916748046875, -0.797393798828125, -0.67803955078125, -0.558685302734375, -0.4393310546875, -0.319976806640625, -0.20062255859375, -0.081268310546875, 0.0380859375, 0.157440185546875, 0.27679443359375, 0.396148681640625, 0.5155029296875, 0.634857177734375, 0.75421142578125, 0.873565673828125, 0.992919921875, 1.112274169921875, 1.23162841796875, 1.350982666015625, 1.4703369140625, 1.589691162109375, 1.70904541015625, 1.828399658203125, 1.94775390625, 2.067108154296875, 2.18646240234375, 2.305816650390625, 2.4251708984375, 2.544525146484375, 2.66387939453125, 2.783233642578125, 2.902587890625, 3.021942138671875, 3.14129638671875, 3.260650634765625, 3.3800048828125, 3.499359130859375, 3.61871337890625, 3.738067626953125, 3.857421875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 15.0, 68.0, 353.0, 412.0, 103.0, 42.0, 11.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.497636795043945, -26.170827865600586, -20.84402084350586, -15.5172119140625, -10.19040298461914, -4.863594055175781, 0.4632129669189453, 5.790021896362305, 11.116830825805664, 16.443639755249023, 21.77044677734375, 27.09725570678711, 32.42406463623047, 37.75087356567383, 43.07768249511719, 48.40448760986328, 53.731300354003906, 59.058109283447266, 64.38491821289062, 69.71172332763672, 75.03853607177734, 80.36534118652344, 85.69215393066406, 91.01895904541016, 96.34576416015625, 101.67256927490234, 106.99938201904297, 112.32618713378906, 117.65299987792969, 122.97980499267578, 128.30661010742188, 133.6334228515625, 138.96022033691406, 144.2870330810547, 149.61383056640625, 154.94064331054688, 160.2674560546875, 165.59426879882812, 170.9210662841797, 176.2478790283203, 181.57469177246094, 186.90150451660156, 192.22830200195312, 197.55511474609375, 202.88192749023438, 208.208740234375, 213.53553771972656, 218.8623504638672, 224.18914794921875, 229.51596069335938, 234.84275817871094, 240.16957092285156, 245.4963836669922, 250.8231964111328, 256.1499938964844, 261.476806640625, 266.8036193847656, 272.13043212890625, 277.4572448730469, 282.7840576171875, 288.11083984375, 293.4376525878906, 298.76446533203125, 304.0912780761719, 309.4180908203125]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 8.0, 14.0, 8.0, 14.0, 8.0, 21.0, 25.0, 26.0, 31.0, 40.0, 41.0, 53.0, 58.0, 56.0, 44.0, 70.0, 62.0, 52.0, 48.0, 49.0, 58.0, 33.0, 30.0, 25.0, 19.0, 26.0, 20.0, 12.0, 10.0, 6.0, 9.0, 9.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.592987060546875, -38.282344818115234, -36.97170639038086, -35.66106414794922, -34.350425720214844, -33.0397834777832, -31.729143142700195, -30.418502807617188, -29.10786247253418, -27.797222137451172, -26.486581802368164, -25.175941467285156, -23.865299224853516, -22.55466079711914, -21.2440185546875, -19.933378219604492, -18.622737884521484, -17.312097549438477, -16.00145721435547, -14.690815925598145, -13.380175590515137, -12.069535255432129, -10.758893966674805, -9.448253631591797, -8.137613296508789, -6.826972961425781, -5.516332149505615, -4.205691337585449, -2.8950510025024414, -1.5844106674194336, -0.2737698554992676, 1.0368709564208984, 2.3475112915039062, 3.658151865005493, 4.96879243850708, 6.279433250427246, 7.590073585510254, 8.900713920593262, 10.211355209350586, 11.521995544433594, 12.832635879516602, 14.14327621459961, 15.453916549682617, 16.764556884765625, 18.075199127197266, 19.38583755493164, 20.69647979736328, 22.00712013244629, 23.317760467529297, 24.628400802612305, 25.939041137695312, 27.24968147277832, 28.560321807861328, 29.87096405029297, 31.181604385375977, 32.492244720458984, 33.802886962890625, 35.113529205322266, 36.42416763305664, 37.73480987548828, 39.045448303222656, 40.3560905456543, 41.66672897338867, 42.97737121582031, 44.28800964355469]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 5.0, 15.0, 17.0, 30.0, 47.0, 96.0, 146.0, 394.0, 1762.0, 50196.0, 4123663.0, 16616.0, 963.0, 205.0, 77.0, 16.0, 22.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.0, -74.361328125, -72.72265625, -71.083984375, -69.4453125, -67.806640625, -66.16796875, -64.529296875, -62.890625, -61.251953125, -59.61328125, -57.974609375, -56.3359375, -54.697265625, -53.05859375, -51.419921875, -49.78125, -48.142578125, -46.50390625, -44.865234375, -43.2265625, -41.587890625, -39.94921875, -38.310546875, -36.671875, -35.033203125, -33.39453125, -31.755859375, -30.1171875, -28.478515625, -26.83984375, -25.201171875, -23.5625, -21.923828125, -20.28515625, -18.646484375, -17.0078125, -15.369140625, -13.73046875, -12.091796875, -10.453125, -8.814453125, -7.17578125, -5.537109375, -3.8984375, -2.259765625, -0.62109375, 1.017578125, 2.65625, 4.294921875, 5.93359375, 7.572265625, 9.2109375, 10.849609375, 12.48828125, 14.126953125, 15.765625, 17.404296875, 19.04296875, 20.681640625, 22.3203125, 23.958984375, 25.59765625, 27.236328125, 28.875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 8.0, 17.0, 32.0, 58.0, 100.0, 122.0, 161.0, 171.0, 127.0, 92.0, 60.0, 26.0, 19.0, 5.0, 7.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.91015625, -3.816925048828125, -3.72369384765625, -3.630462646484375, -3.5372314453125, -3.444000244140625, -3.35076904296875, -3.257537841796875, -3.164306640625, -3.071075439453125, -2.97784423828125, -2.884613037109375, -2.7913818359375, -2.698150634765625, -2.60491943359375, -2.511688232421875, -2.41845703125, -2.325225830078125, -2.23199462890625, -2.138763427734375, -2.0455322265625, -1.952301025390625, -1.85906982421875, -1.765838623046875, -1.672607421875, -1.579376220703125, -1.48614501953125, -1.392913818359375, -1.2996826171875, -1.206451416015625, -1.11322021484375, -1.019989013671875, -0.9267578125, -0.833526611328125, -0.74029541015625, -0.647064208984375, -0.5538330078125, -0.460601806640625, -0.36737060546875, -0.274139404296875, -0.180908203125, -0.087677001953125, 0.00555419921875, 0.098785400390625, 0.1920166015625, 0.285247802734375, 0.37847900390625, 0.471710205078125, 0.56494140625, 0.658172607421875, 0.75140380859375, 0.844635009765625, 0.9378662109375, 1.031097412109375, 1.12432861328125, 1.217559814453125, 1.310791015625, 1.404022216796875, 1.49725341796875, 1.590484619140625, 1.6837158203125, 1.776947021484375, 1.87017822265625, 1.963409423828125, 2.056640625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 9.0, 23.0, 38.0, 59.0, 117.0, 248.0, 574.0, 2827.0, 4023252.0, 164987.0, 1427.0, 396.0, 171.0, 66.0, 40.0, 17.0, 12.0, 10.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-125.5, -122.9326171875, -120.365234375, -117.7978515625, -115.23046875, -112.6630859375, -110.095703125, -107.5283203125, -104.9609375, -102.3935546875, -99.826171875, -97.2587890625, -94.69140625, -92.1240234375, -89.556640625, -86.9892578125, -84.421875, -81.8544921875, -79.287109375, -76.7197265625, -74.15234375, -71.5849609375, -69.017578125, -66.4501953125, -63.8828125, -61.3154296875, -58.748046875, -56.1806640625, -53.61328125, -51.0458984375, -48.478515625, -45.9111328125, -43.34375, -40.7763671875, -38.208984375, -35.6416015625, -33.07421875, -30.5068359375, -27.939453125, -25.3720703125, -22.8046875, -20.2373046875, -17.669921875, -15.1025390625, -12.53515625, -9.9677734375, -7.400390625, -4.8330078125, -2.265625, 0.3017578125, 2.869140625, 5.4365234375, 8.00390625, 10.5712890625, 13.138671875, 15.7060546875, 18.2734375, 20.8408203125, 23.408203125, 25.9755859375, 28.54296875, 31.1103515625, 33.677734375, 36.2451171875, 38.8125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 9.0, 15.0, 26.0, 47.0, 138.0, 544.0, 2554.0, 517.0, 122.0, 58.0, 26.0, 13.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.859375, -9.61602783203125, -9.3726806640625, -9.12933349609375, -8.885986328125, -8.64263916015625, -8.3992919921875, -8.15594482421875, -7.91259765625, -7.66925048828125, -7.4259033203125, -7.18255615234375, -6.939208984375, -6.69586181640625, -6.4525146484375, -6.20916748046875, -5.9658203125, -5.72247314453125, -5.4791259765625, -5.23577880859375, -4.992431640625, -4.74908447265625, -4.5057373046875, -4.26239013671875, -4.01904296875, -3.77569580078125, -3.5323486328125, -3.28900146484375, -3.045654296875, -2.80230712890625, -2.5589599609375, -2.31561279296875, -2.072265625, -1.82891845703125, -1.5855712890625, -1.34222412109375, -1.098876953125, -0.85552978515625, -0.6121826171875, -0.36883544921875, -0.12548828125, 0.11785888671875, 0.3612060546875, 0.60455322265625, 0.847900390625, 1.09124755859375, 1.3345947265625, 1.57794189453125, 1.8212890625, 2.06463623046875, 2.3079833984375, 2.55133056640625, 2.794677734375, 3.03802490234375, 3.2813720703125, 3.52471923828125, 3.76806640625, 4.01141357421875, 4.2547607421875, 4.49810791015625, 4.741455078125, 4.98480224609375, 5.2281494140625, 5.47149658203125, 5.71484375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 8.0, 27.0, 446.0, 502.0, 22.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.4884490966797, -135.60340881347656, -129.7183837890625, -123.83334350585938, -117.94830322265625, -112.06326293945312, -106.17823028564453, -100.29319763183594, -94.40815734863281, -88.52311706542969, -82.6380844116211, -76.7530517578125, -70.86801147460938, -64.98297119140625, -59.097938537597656, -53.2129020690918, -47.32786560058594, -41.44282913208008, -35.55779266357422, -29.67275619506836, -23.7877197265625, -17.90268325805664, -12.017646789550781, -6.132610321044922, -0.2475738525390625, 5.637462615966797, 11.522499084472656, 17.407535552978516, 23.292572021484375, 29.177608489990234, 35.062644958496094, 40.94768142700195, 46.83270263671875, 52.71773910522461, 58.60277557373047, 64.48780822753906, 70.37284851074219, 76.25788879394531, 82.1429214477539, 88.0279541015625, 93.91299438476562, 99.79803466796875, 105.68306732177734, 111.56809997558594, 117.45314025878906, 123.33818054199219, 129.22320556640625, 135.10824584960938, 140.9932861328125, 146.87832641601562, 152.76336669921875, 158.6483917236328, 164.53343200683594, 170.41847229003906, 176.30349731445312, 182.18853759765625, 188.07357788085938, 193.9586181640625, 199.84365844726562, 205.7286834716797, 211.6137237548828, 217.49876403808594, 223.3837890625, 229.26882934570312, 235.15386962890625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 11.0, 19.0, 35.0, 43.0, 49.0, 57.0, 61.0, 71.0, 82.0, 87.0, 100.0, 79.0, 72.0, 49.0, 39.0, 45.0, 35.0, 20.0, 14.0, 5.0, 7.0, 10.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.530033111572266, -28.667436599731445, -27.804840087890625, -26.942245483398438, -26.079648971557617, -25.217052459716797, -24.354455947875977, -23.491859436035156, -22.62926483154297, -21.76666831970215, -20.904071807861328, -20.04147720336914, -19.17888069152832, -18.3162841796875, -17.45368766784668, -16.59109115600586, -15.728494644165039, -14.865898132324219, -14.003302574157715, -13.140706062316895, -12.27811050415039, -11.41551399230957, -10.55291748046875, -9.69032096862793, -8.827725410461426, -7.965129375457764, -7.102533340454102, -6.239936828613281, -5.377340793609619, -4.514744758605957, -3.6521482467651367, -2.7895522117614746, -1.9269580841064453, -1.0643619298934937, -0.201765775680542, 0.6608304977416992, 1.5234265327453613, 2.3860225677490234, 3.2486190795898438, 4.111215114593506, 4.973811149597168, 5.83640718460083, 6.699003219604492, 7.5615997314453125, 8.424196243286133, 9.286791801452637, 10.149388313293457, 11.011983871459961, 11.874580383300781, 12.737176895141602, 13.599772453308105, 14.462368965148926, 15.32496452331543, 16.18756103515625, 17.05015754699707, 17.91275405883789, 18.775348663330078, 19.6379451751709, 20.50054168701172, 21.363136291503906, 22.225732803344727, 23.088329315185547, 23.950925827026367, 24.813522338867188, 25.676118850708008]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 4.0, 9.0, 4.0, 10.0, 15.0, 14.0, 16.0, 26.0, 36.0, 54.0, 70.0, 110.0, 124.0, 214.0, 339.0, 578.0, 1176.0, 2947.0, 10095.0, 52548.0, 371704.0, 509122.0, 78751.0, 13668.0, 3685.0, 1381.0, 677.0, 355.0, 230.0, 157.0, 118.0, 74.0, 62.0, 41.0, 27.0, 35.0, 16.0, 13.0, 11.0, 14.0, 10.0, 5.0, 7.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.9453125, -12.4847412109375, -12.024169921875, -11.5635986328125, -11.10302734375, -10.6424560546875, -10.181884765625, -9.7213134765625, -9.2607421875, -8.8001708984375, -8.339599609375, -7.8790283203125, -7.41845703125, -6.9578857421875, -6.497314453125, -6.0367431640625, -5.576171875, -5.1156005859375, -4.655029296875, -4.1944580078125, -3.73388671875, -3.2733154296875, -2.812744140625, -2.3521728515625, -1.8916015625, -1.4310302734375, -0.970458984375, -0.5098876953125, -0.04931640625, 0.4112548828125, 0.871826171875, 1.3323974609375, 1.79296875, 2.2535400390625, 2.714111328125, 3.1746826171875, 3.63525390625, 4.0958251953125, 4.556396484375, 5.0169677734375, 5.4775390625, 5.9381103515625, 6.398681640625, 6.8592529296875, 7.31982421875, 7.7803955078125, 8.240966796875, 8.7015380859375, 9.162109375, 9.6226806640625, 10.083251953125, 10.5438232421875, 11.00439453125, 11.4649658203125, 11.925537109375, 12.3861083984375, 12.8466796875, 13.3072509765625, 13.767822265625, 14.2283935546875, 14.68896484375, 15.1495361328125, 15.610107421875, 16.0706787109375, 16.53125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 10.0, 9.0, 23.0, 29.0, 51.0, 55.0, 100.0, 114.0, 101.0, 115.0, 99.0, 93.0, 53.0, 54.0, 39.0, 28.0, 12.0, 10.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.455078125, -3.36883544921875, -3.2825927734375, -3.19635009765625, -3.110107421875, -3.02386474609375, -2.9376220703125, -2.85137939453125, -2.76513671875, -2.67889404296875, -2.5926513671875, -2.50640869140625, -2.420166015625, -2.33392333984375, -2.2476806640625, -2.16143798828125, -2.0751953125, -1.98895263671875, -1.9027099609375, -1.81646728515625, -1.730224609375, -1.64398193359375, -1.5577392578125, -1.47149658203125, -1.38525390625, -1.29901123046875, -1.2127685546875, -1.12652587890625, -1.040283203125, -0.95404052734375, -0.8677978515625, -0.78155517578125, -0.6953125, -0.60906982421875, -0.5228271484375, -0.43658447265625, -0.350341796875, -0.26409912109375, -0.1778564453125, -0.09161376953125, -0.00537109375, 0.08087158203125, 0.1671142578125, 0.25335693359375, 0.339599609375, 0.42584228515625, 0.5120849609375, 0.59832763671875, 0.6845703125, 0.77081298828125, 0.8570556640625, 0.94329833984375, 1.029541015625, 1.11578369140625, 1.2020263671875, 1.28826904296875, 1.37451171875, 1.46075439453125, 1.5469970703125, 1.63323974609375, 1.719482421875, 1.80572509765625, 1.8919677734375, 1.97821044921875, 2.064453125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 5.0, 5.0, 15.0, 11.0, 31.0, 36.0, 49.0, 104.0, 213.0, 403.0, 1055.0, 4259.0, 47452.0, 849423.0, 135160.0, 7789.0, 1515.0, 526.0, 221.0, 109.0, 61.0, 42.0, 20.0, 14.0, 15.0, 4.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.203125, -17.493408203125, -16.78369140625, -16.073974609375, -15.3642578125, -14.654541015625, -13.94482421875, -13.235107421875, -12.525390625, -11.815673828125, -11.10595703125, -10.396240234375, -9.6865234375, -8.976806640625, -8.26708984375, -7.557373046875, -6.84765625, -6.137939453125, -5.42822265625, -4.718505859375, -4.0087890625, -3.299072265625, -2.58935546875, -1.879638671875, -1.169921875, -0.460205078125, 0.24951171875, 0.959228515625, 1.6689453125, 2.378662109375, 3.08837890625, 3.798095703125, 4.5078125, 5.217529296875, 5.92724609375, 6.636962890625, 7.3466796875, 8.056396484375, 8.76611328125, 9.475830078125, 10.185546875, 10.895263671875, 11.60498046875, 12.314697265625, 13.0244140625, 13.734130859375, 14.44384765625, 15.153564453125, 15.86328125, 16.572998046875, 17.28271484375, 17.992431640625, 18.7021484375, 19.411865234375, 20.12158203125, 20.831298828125, 21.541015625, 22.250732421875, 22.96044921875, 23.670166015625, 24.3798828125, 25.089599609375, 25.79931640625, 26.509033203125, 27.21875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 7.0, 8.0, 8.0, 5.0, 14.0, 16.0, 13.0, 25.0, 43.0, 36.0, 35.0, 59.0, 42.0, 50.0, 60.0, 57.0, 62.0, 73.0, 63.0, 44.0, 50.0, 50.0, 28.0, 41.0, 33.0, 28.0, 12.0, 13.0, 9.0, 5.0, 10.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.15234375, -6.89752197265625, -6.6427001953125, -6.38787841796875, -6.133056640625, -5.87823486328125, -5.6234130859375, -5.36859130859375, -5.11376953125, -4.85894775390625, -4.6041259765625, -4.34930419921875, -4.094482421875, -3.83966064453125, -3.5848388671875, -3.33001708984375, -3.0751953125, -2.82037353515625, -2.5655517578125, -2.31072998046875, -2.055908203125, -1.80108642578125, -1.5462646484375, -1.29144287109375, -1.03662109375, -0.78179931640625, -0.5269775390625, -0.27215576171875, -0.017333984375, 0.23748779296875, 0.4923095703125, 0.74713134765625, 1.001953125, 1.25677490234375, 1.5115966796875, 1.76641845703125, 2.021240234375, 2.27606201171875, 2.5308837890625, 2.78570556640625, 3.04052734375, 3.29534912109375, 3.5501708984375, 3.80499267578125, 4.059814453125, 4.31463623046875, 4.5694580078125, 4.82427978515625, 5.0791015625, 5.33392333984375, 5.5887451171875, 5.84356689453125, 6.098388671875, 6.35321044921875, 6.6080322265625, 6.86285400390625, 7.11767578125, 7.37249755859375, 7.6273193359375, 7.88214111328125, 8.136962890625, 8.39178466796875, 8.6466064453125, 8.90142822265625, 9.15625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 7.0, 9.0, 10.0, 25.0, 35.0, 58.0, 106.0, 216.0, 494.0, 1184.0, 3515.0, 14871.0, 98618.0, 613166.0, 273755.0, 32639.0, 6452.0, 1990.0, 733.0, 317.0, 145.0, 84.0, 45.0, 29.0, 26.0, 9.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.328125, -6.1221923828125, -5.916259765625, -5.7103271484375, -5.50439453125, -5.2984619140625, -5.092529296875, -4.8865966796875, -4.6806640625, -4.4747314453125, -4.268798828125, -4.0628662109375, -3.85693359375, -3.6510009765625, -3.445068359375, -3.2391357421875, -3.033203125, -2.8272705078125, -2.621337890625, -2.4154052734375, -2.20947265625, -2.0035400390625, -1.797607421875, -1.5916748046875, -1.3857421875, -1.1798095703125, -0.973876953125, -0.7679443359375, -0.56201171875, -0.3560791015625, -0.150146484375, 0.0557861328125, 0.26171875, 0.4676513671875, 0.673583984375, 0.8795166015625, 1.08544921875, 1.2913818359375, 1.497314453125, 1.7032470703125, 1.9091796875, 2.1151123046875, 2.321044921875, 2.5269775390625, 2.73291015625, 2.9388427734375, 3.144775390625, 3.3507080078125, 3.556640625, 3.7625732421875, 3.968505859375, 4.1744384765625, 4.38037109375, 4.5863037109375, 4.792236328125, 4.9981689453125, 5.2041015625, 5.4100341796875, 5.615966796875, 5.8218994140625, 6.02783203125, 6.2337646484375, 6.439697265625, 6.6456298828125, 6.8515625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 1.0, 4.0, 12.0, 3.0, 21.0, 24.0, 21.0, 38.0, 41.0, 51.0, 83.0, 96.0, 113.0, 99.0, 77.0, 69.0, 48.0, 58.0, 35.0, 30.0, 14.0, 20.0, 10.0, 8.0, 5.0, 4.0, 3.0, 6.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006079673767089844, -0.0005918741226196289, -0.0005757808685302734, -0.000559687614440918, -0.0005435943603515625, -0.000527501106262207, -0.0005114078521728516, -0.0004953145980834961, -0.0004792213439941406, -0.00046312808990478516, -0.0004470348358154297, -0.0004309415817260742, -0.00041484832763671875, -0.0003987550735473633, -0.0003826618194580078, -0.00036656856536865234, -0.0003504753112792969, -0.0003343820571899414, -0.00031828880310058594, -0.00030219554901123047, -0.000286102294921875, -0.00027000904083251953, -0.00025391578674316406, -0.0002378225326538086, -0.00022172927856445312, -0.00020563602447509766, -0.0001895427703857422, -0.00017344951629638672, -0.00015735626220703125, -0.00014126300811767578, -0.0001251697540283203, -0.00010907649993896484, -9.298324584960938e-05, -7.68899917602539e-05, -6.079673767089844e-05, -4.470348358154297e-05, -2.86102294921875e-05, -1.2516975402832031e-05, 3.5762786865234375e-06, 1.9669532775878906e-05, 3.5762786865234375e-05, 5.1856040954589844e-05, 6.794929504394531e-05, 8.404254913330078e-05, 0.00010013580322265625, 0.00011622905731201172, 0.0001323223114013672, 0.00014841556549072266, 0.00016450881958007812, 0.0001806020736694336, 0.00019669532775878906, 0.00021278858184814453, 0.0002288818359375, 0.00024497509002685547, 0.00026106834411621094, 0.0002771615982055664, 0.0002932548522949219, 0.00030934810638427734, 0.0003254413604736328, 0.0003415346145629883, 0.00035762786865234375, 0.0003737211227416992, 0.0003898143768310547, 0.00040590763092041016, 0.0004220008850097656]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 5.0, 4.0, 9.0, 11.0, 8.0, 21.0, 23.0, 38.0, 71.0, 119.0, 251.0, 620.0, 1770.0, 6314.0, 36881.0, 375119.0, 553421.0, 61253.0, 9009.0, 2147.0, 769.0, 295.0, 163.0, 78.0, 43.0, 39.0, 30.0, 16.0, 5.0, 8.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.5859375, -6.3597412109375, -6.133544921875, -5.9073486328125, -5.68115234375, -5.4549560546875, -5.228759765625, -5.0025634765625, -4.7763671875, -4.5501708984375, -4.323974609375, -4.0977783203125, -3.87158203125, -3.6453857421875, -3.419189453125, -3.1929931640625, -2.966796875, -2.7406005859375, -2.514404296875, -2.2882080078125, -2.06201171875, -1.8358154296875, -1.609619140625, -1.3834228515625, -1.1572265625, -0.9310302734375, -0.704833984375, -0.4786376953125, -0.25244140625, -0.0262451171875, 0.199951171875, 0.4261474609375, 0.65234375, 0.8785400390625, 1.104736328125, 1.3309326171875, 1.55712890625, 1.7833251953125, 2.009521484375, 2.2357177734375, 2.4619140625, 2.6881103515625, 2.914306640625, 3.1405029296875, 3.36669921875, 3.5928955078125, 3.819091796875, 4.0452880859375, 4.271484375, 4.4976806640625, 4.723876953125, 4.9500732421875, 5.17626953125, 5.4024658203125, 5.628662109375, 5.8548583984375, 6.0810546875, 6.3072509765625, 6.533447265625, 6.7596435546875, 6.98583984375, 7.2120361328125, 7.438232421875, 7.6644287109375, 7.890625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 3.0, 3.0, 5.0, 9.0, 13.0, 20.0, 18.0, 19.0, 25.0, 38.0, 62.0, 57.0, 50.0, 96.0, 63.0, 86.0, 77.0, 74.0, 61.0, 46.0, 54.0, 25.0, 21.0, 12.0, 14.0, 12.0, 6.0, 8.0, 1.0, 9.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.779296875, -3.664825439453125, -3.55035400390625, -3.435882568359375, -3.3214111328125, -3.206939697265625, -3.09246826171875, -2.977996826171875, -2.863525390625, -2.749053955078125, -2.63458251953125, -2.520111083984375, -2.4056396484375, -2.291168212890625, -2.17669677734375, -2.062225341796875, -1.94775390625, -1.833282470703125, -1.71881103515625, -1.604339599609375, -1.4898681640625, -1.375396728515625, -1.26092529296875, -1.146453857421875, -1.031982421875, -0.917510986328125, -0.80303955078125, -0.688568115234375, -0.5740966796875, -0.459625244140625, -0.34515380859375, -0.230682373046875, -0.1162109375, -0.001739501953125, 0.11273193359375, 0.227203369140625, 0.3416748046875, 0.456146240234375, 0.57061767578125, 0.685089111328125, 0.799560546875, 0.914031982421875, 1.02850341796875, 1.142974853515625, 1.2574462890625, 1.371917724609375, 1.48638916015625, 1.600860595703125, 1.71533203125, 1.829803466796875, 1.94427490234375, 2.058746337890625, 2.1732177734375, 2.287689208984375, 2.40216064453125, 2.516632080078125, 2.631103515625, 2.745574951171875, 2.86004638671875, 2.974517822265625, 3.0889892578125, 3.203460693359375, 3.31793212890625, 3.432403564453125, 3.546875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 17.0, 293.0, 629.0, 59.0, 12.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.71131896972656, -65.57402801513672, -56.436729431152344, -47.2994384765625, -38.16214370727539, -29.02484893798828, -19.887557983398438, -10.750263214111328, -1.6129684448242188, 7.524325370788574, 16.661619186401367, 25.798912048339844, 34.93620681762695, 44.07350158691406, 53.210792541503906, 62.348087310791016, 71.48538208007812, 80.62267303466797, 89.75997161865234, 98.89726257324219, 108.03456115722656, 117.1718521118164, 126.30914306640625, 135.44644165039062, 144.583740234375, 153.72103881835938, 162.8583221435547, 171.99562072753906, 181.13291931152344, 190.27020263671875, 199.40750122070312, 208.5447998046875, 217.68209838867188, 226.81939697265625, 235.95668029785156, 245.09397888183594, 254.2312774658203, 263.3685607910156, 272.505859375, 281.6431579589844, 290.78045654296875, 299.9177551269531, 309.0550537109375, 318.19232177734375, 327.3296203613281, 336.4669189453125, 345.6042175292969, 354.74151611328125, 363.8787841796875, 373.0160827636719, 382.15338134765625, 391.2906494140625, 400.4279479980469, 409.56524658203125, 418.7025451660156, 427.83984375, 436.9771423339844, 446.11444091796875, 455.2517395019531, 464.3890380859375, 473.52630615234375, 482.6636047363281, 491.8009033203125, 500.9382019042969, 510.07550048828125]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 7.0, 10.0, 9.0, 7.0, 24.0, 26.0, 36.0, 32.0, 49.0, 60.0, 59.0, 70.0, 68.0, 69.0, 61.0, 54.0, 56.0, 47.0, 45.0, 43.0, 36.0, 34.0, 25.0, 19.0, 21.0, 6.0, 10.0, 9.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.18724822998047, -43.58382034301758, -41.98039627075195, -40.37696838378906, -38.77354049682617, -37.17011260986328, -35.566688537597656, -33.963260650634766, -32.359832763671875, -30.756406784057617, -29.152978897094727, -27.54955291748047, -25.946125030517578, -24.34269905090332, -22.739273071289062, -21.135845184326172, -19.532421112060547, -17.92899513244629, -16.3255672454834, -14.72214126586914, -13.118714332580566, -11.515287399291992, -9.911861419677734, -8.30843448638916, -6.705007553100586, -5.101580619812012, -3.4981541633605957, -1.8947277069091797, -0.29130077362060547, 1.3121261596679688, 2.9155521392822266, 4.518979072570801, 6.122406005859375, 7.725832939147949, 9.329259872436523, 10.932685852050781, 12.536112785339355, 14.13953971862793, 15.742965698242188, 17.346393585205078, 18.949819564819336, 20.553245544433594, 22.156673431396484, 23.760099411010742, 25.363525390625, 26.96695327758789, 28.57037925720215, 30.173805236816406, 31.777233123779297, 33.38066101074219, 34.98408508300781, 36.5875129699707, 38.190940856933594, 39.79436492919922, 41.39779281616211, 43.001220703125, 44.604644775390625, 46.208072662353516, 47.81149673461914, 49.41492462158203, 51.01835250854492, 52.62178039550781, 54.22520446777344, 55.82863235473633, 57.43206024169922]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 7.0, 8.0, 11.0, 13.0, 18.0, 21.0, 42.0, 56.0, 92.0, 151.0, 253.0, 621.0, 1655.0, 7574.0, 162692.0, 3990109.0, 25948.0, 3441.0, 867.0, 350.0, 155.0, 90.0, 52.0, 19.0, 13.0, 12.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-42.03125, -41.08154296875, -40.1318359375, -39.18212890625, -38.232421875, -37.28271484375, -36.3330078125, -35.38330078125, -34.43359375, -33.48388671875, -32.5341796875, -31.58447265625, -30.634765625, -29.68505859375, -28.7353515625, -27.78564453125, -26.8359375, -25.88623046875, -24.9365234375, -23.98681640625, -23.037109375, -22.08740234375, -21.1376953125, -20.18798828125, -19.23828125, -18.28857421875, -17.3388671875, -16.38916015625, -15.439453125, -14.48974609375, -13.5400390625, -12.59033203125, -11.640625, -10.69091796875, -9.7412109375, -8.79150390625, -7.841796875, -6.89208984375, -5.9423828125, -4.99267578125, -4.04296875, -3.09326171875, -2.1435546875, -1.19384765625, -0.244140625, 0.70556640625, 1.6552734375, 2.60498046875, 3.5546875, 4.50439453125, 5.4541015625, 6.40380859375, 7.353515625, 8.30322265625, 9.2529296875, 10.20263671875, 11.15234375, 12.10205078125, 13.0517578125, 14.00146484375, 14.951171875, 15.90087890625, 16.8505859375, 17.80029296875, 18.75]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 7.0, 11.0, 10.0, 17.0, 35.0, 43.0, 69.0, 69.0, 91.0, 98.0, 96.0, 92.0, 89.0, 74.0, 63.0, 41.0, 28.0, 31.0, 17.0, 6.0, 9.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.19140625, -3.114501953125, -3.03759765625, -2.960693359375, -2.8837890625, -2.806884765625, -2.72998046875, -2.653076171875, -2.576171875, -2.499267578125, -2.42236328125, -2.345458984375, -2.2685546875, -2.191650390625, -2.11474609375, -2.037841796875, -1.9609375, -1.884033203125, -1.80712890625, -1.730224609375, -1.6533203125, -1.576416015625, -1.49951171875, -1.422607421875, -1.345703125, -1.268798828125, -1.19189453125, -1.114990234375, -1.0380859375, -0.961181640625, -0.88427734375, -0.807373046875, -0.73046875, -0.653564453125, -0.57666015625, -0.499755859375, -0.4228515625, -0.345947265625, -0.26904296875, -0.192138671875, -0.115234375, -0.038330078125, 0.03857421875, 0.115478515625, 0.1923828125, 0.269287109375, 0.34619140625, 0.423095703125, 0.5, 0.576904296875, 0.65380859375, 0.730712890625, 0.8076171875, 0.884521484375, 0.96142578125, 1.038330078125, 1.115234375, 1.192138671875, 1.26904296875, 1.345947265625, 1.4228515625, 1.499755859375, 1.57666015625, 1.653564453125, 1.73046875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 9.0, 18.0, 39.0, 52.0, 80.0, 147.0, 734.0, 4190635.0, 2061.0, 217.0, 101.0, 71.0, 45.0, 31.0, 21.0, 18.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.625, -62.671875, -57.71875, -52.765625, -47.8125, -42.859375, -37.90625, -32.953125, -28.0, -23.046875, -18.09375, -13.140625, -8.1875, -3.234375, 1.71875, 6.671875, 11.625, 16.578125, 21.53125, 26.484375, 31.4375, 36.390625, 41.34375, 46.296875, 51.25, 56.203125, 61.15625, 66.109375, 71.0625, 76.015625, 80.96875, 85.921875, 90.875, 95.828125, 100.78125, 105.734375, 110.6875, 115.640625, 120.59375, 125.546875, 130.5, 135.453125, 140.40625, 145.359375, 150.3125, 155.265625, 160.21875, 165.171875, 170.125, 175.078125, 180.03125, 184.984375, 189.9375, 194.890625, 199.84375, 204.796875, 209.75, 214.703125, 219.65625, 224.609375, 229.5625, 234.515625, 239.46875, 244.421875, 249.375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 18.0, 73.0, 768.0, 3013.0, 167.0, 34.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.890625, -8.450927734375, -8.01123046875, -7.571533203125, -7.1318359375, -6.692138671875, -6.25244140625, -5.812744140625, -5.373046875, -4.933349609375, -4.49365234375, -4.053955078125, -3.6142578125, -3.174560546875, -2.73486328125, -2.295166015625, -1.85546875, -1.415771484375, -0.97607421875, -0.536376953125, -0.0966796875, 0.343017578125, 0.78271484375, 1.222412109375, 1.662109375, 2.101806640625, 2.54150390625, 2.981201171875, 3.4208984375, 3.860595703125, 4.30029296875, 4.739990234375, 5.1796875, 5.619384765625, 6.05908203125, 6.498779296875, 6.9384765625, 7.378173828125, 7.81787109375, 8.257568359375, 8.697265625, 9.136962890625, 9.57666015625, 10.016357421875, 10.4560546875, 10.895751953125, 11.33544921875, 11.775146484375, 12.21484375, 12.654541015625, 13.09423828125, 13.533935546875, 13.9736328125, 14.413330078125, 14.85302734375, 15.292724609375, 15.732421875, 16.172119140625, 16.61181640625, 17.051513671875, 17.4912109375, 17.930908203125, 18.37060546875, 18.810302734375, 19.25]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 11.0, 959.0, 44.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-488.052978515625, -477.8087463378906, -467.5644836425781, -457.32025146484375, -447.07598876953125, -436.8317565917969, -426.5874938964844, -416.34326171875, -406.0989990234375, -395.8547668457031, -385.6105041503906, -375.36627197265625, -365.12200927734375, -354.8777770996094, -344.6335144042969, -334.3892822265625, -324.14501953125, -313.9007873535156, -303.6565246582031, -293.41229248046875, -283.16802978515625, -272.9237976074219, -262.6795349121094, -252.435302734375, -242.19107055664062, -231.9468231201172, -221.70257568359375, -211.4583282470703, -201.21408081054688, -190.96983337402344, -180.7255859375, -170.48135375976562, -160.23709106445312, -149.9928436279297, -139.74859619140625, -129.5043487548828, -119.26010131835938, -109.01585388183594, -98.77161407470703, -88.5273666381836, -78.28311920166016, -68.03887176513672, -57.79462432861328, -47.55038070678711, -37.30613327026367, -27.061885833740234, -16.817642211914062, -6.573394775390625, 3.6708526611328125, 13.915099143981934, 24.159345626831055, 34.40359115600586, 44.6478385925293, 54.892086029052734, 65.1363296508789, 75.38057708740234, 85.62482452392578, 95.86907196044922, 106.11331939697266, 116.35755920410156, 126.601806640625, 136.84605407714844, 147.09030151367188, 157.3345489501953, 167.57879638671875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 4.0, 4.0, 10.0, 20.0, 23.0, 35.0, 47.0, 85.0, 95.0, 115.0, 102.0, 109.0, 84.0, 75.0, 61.0, 46.0, 32.0, 23.0, 18.0, 11.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.2419490814209, -28.393123626708984, -27.54429817199707, -26.695472717285156, -25.846647262573242, -24.997821807861328, -24.148998260498047, -23.3001708984375, -22.45134735107422, -21.602521896362305, -20.75369644165039, -19.904870986938477, -19.056045532226562, -18.20722007751465, -17.358394622802734, -16.509571075439453, -15.660743713378906, -14.811918258666992, -13.963092803955078, -13.114267349243164, -12.26544189453125, -11.416616439819336, -10.567791938781738, -9.718966484069824, -8.87014102935791, -8.021315574645996, -7.172490119934082, -6.323665142059326, -5.474839687347412, -4.626014232635498, -3.777189254760742, -2.928363800048828, -2.0795364379882812, -1.2307111024856567, -0.3818857669830322, 0.46693944931030273, 1.3157649040222168, 2.164590358734131, 3.0134153366088867, 3.862240791320801, 4.711066246032715, 5.559891700744629, 6.408717155456543, 7.257542133331299, 8.106367111206055, 8.955192565917969, 9.804018020629883, 10.652843475341797, 11.501668930053711, 12.350494384765625, 13.199319839477539, 14.048145294189453, 14.896970748901367, 15.745796203613281, 16.594619750976562, 17.44344711303711, 18.29227066040039, 19.141096115112305, 19.98992156982422, 20.838747024536133, 21.687572479248047, 22.53639793395996, 23.385223388671875, 24.234046936035156, 25.082874298095703]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 2.0, 13.0, 20.0, 22.0, 29.0, 64.0, 94.0, 164.0, 356.0, 840.0, 2731.0, 13571.0, 113843.0, 682129.0, 206818.0, 21994.0, 3892.0, 1107.0, 398.0, 203.0, 107.0, 58.0, 33.0, 24.0, 14.0, 17.0, 5.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0], "bins": [-21.484375, -21.0029296875, -20.521484375, -20.0400390625, -19.55859375, -19.0771484375, -18.595703125, -18.1142578125, -17.6328125, -17.1513671875, -16.669921875, -16.1884765625, -15.70703125, -15.2255859375, -14.744140625, -14.2626953125, -13.78125, -13.2998046875, -12.818359375, -12.3369140625, -11.85546875, -11.3740234375, -10.892578125, -10.4111328125, -9.9296875, -9.4482421875, -8.966796875, -8.4853515625, -8.00390625, -7.5224609375, -7.041015625, -6.5595703125, -6.078125, -5.5966796875, -5.115234375, -4.6337890625, -4.15234375, -3.6708984375, -3.189453125, -2.7080078125, -2.2265625, -1.7451171875, -1.263671875, -0.7822265625, -0.30078125, 0.1806640625, 0.662109375, 1.1435546875, 1.625, 2.1064453125, 2.587890625, 3.0693359375, 3.55078125, 4.0322265625, 4.513671875, 4.9951171875, 5.4765625, 5.9580078125, 6.439453125, 6.9208984375, 7.40234375, 7.8837890625, 8.365234375, 8.8466796875, 9.328125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 6.0, 9.0, 11.0, 16.0, 26.0, 31.0, 54.0, 49.0, 55.0, 78.0, 79.0, 79.0, 76.0, 68.0, 71.0, 66.0, 54.0, 40.0, 28.0, 32.0, 29.0, 13.0, 12.0, 4.0, 11.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.251953125, -2.1927642822265625, -2.133575439453125, -2.0743865966796875, -2.01519775390625, -1.9560089111328125, -1.896820068359375, -1.8376312255859375, -1.7784423828125, -1.7192535400390625, -1.660064697265625, -1.6008758544921875, -1.54168701171875, -1.4824981689453125, -1.423309326171875, -1.3641204833984375, -1.304931640625, -1.2457427978515625, -1.186553955078125, -1.1273651123046875, -1.06817626953125, -1.0089874267578125, -0.949798583984375, -0.8906097412109375, -0.8314208984375, -0.7722320556640625, -0.713043212890625, -0.6538543701171875, -0.59466552734375, -0.5354766845703125, -0.476287841796875, -0.4170989990234375, -0.35791015625, -0.2987213134765625, -0.239532470703125, -0.1803436279296875, -0.12115478515625, -0.0619659423828125, -0.002777099609375, 0.0564117431640625, 0.1156005859375, 0.1747894287109375, 0.233978271484375, 0.2931671142578125, 0.35235595703125, 0.4115447998046875, 0.470733642578125, 0.5299224853515625, 0.589111328125, 0.6483001708984375, 0.707489013671875, 0.7666778564453125, 0.82586669921875, 0.8850555419921875, 0.944244384765625, 1.0034332275390625, 1.0626220703125, 1.1218109130859375, 1.180999755859375, 1.2401885986328125, 1.29937744140625, 1.3585662841796875, 1.417755126953125, 1.4769439697265625, 1.5361328125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 3.0, 7.0, 13.0, 14.0, 22.0, 41.0, 47.0, 91.0, 162.0, 255.0, 568.0, 1387.0, 4325.0, 25960.0, 412898.0, 558567.0, 35972.0, 5254.0, 1500.0, 666.0, 327.0, 190.0, 90.0, 61.0, 46.0, 28.0, 16.0, 13.0, 10.0, 7.0, 3.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.0, -18.4874267578125, -17.974853515625, -17.4622802734375, -16.94970703125, -16.4371337890625, -15.924560546875, -15.4119873046875, -14.8994140625, -14.3868408203125, -13.874267578125, -13.3616943359375, -12.84912109375, -12.3365478515625, -11.823974609375, -11.3114013671875, -10.798828125, -10.2862548828125, -9.773681640625, -9.2611083984375, -8.74853515625, -8.2359619140625, -7.723388671875, -7.2108154296875, -6.6982421875, -6.1856689453125, -5.673095703125, -5.1605224609375, -4.64794921875, -4.1353759765625, -3.622802734375, -3.1102294921875, -2.59765625, -2.0850830078125, -1.572509765625, -1.0599365234375, -0.54736328125, -0.0347900390625, 0.477783203125, 0.9903564453125, 1.5029296875, 2.0155029296875, 2.528076171875, 3.0406494140625, 3.55322265625, 4.0657958984375, 4.578369140625, 5.0909423828125, 5.603515625, 6.1160888671875, 6.628662109375, 7.1412353515625, 7.65380859375, 8.1663818359375, 8.678955078125, 9.1915283203125, 9.7041015625, 10.2166748046875, 10.729248046875, 11.2418212890625, 11.75439453125, 12.2669677734375, 12.779541015625, 13.2921142578125, 13.8046875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 6.0, 5.0, 13.0, 17.0, 11.0, 18.0, 22.0, 17.0, 28.0, 29.0, 60.0, 44.0, 49.0, 56.0, 55.0, 59.0, 46.0, 63.0, 59.0, 52.0, 47.0, 43.0, 37.0, 27.0, 24.0, 22.0, 13.0, 22.0, 15.0, 8.0, 6.0, 8.0, 7.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.44921875, -7.222900390625, -6.99658203125, -6.770263671875, -6.5439453125, -6.317626953125, -6.09130859375, -5.864990234375, -5.638671875, -5.412353515625, -5.18603515625, -4.959716796875, -4.7333984375, -4.507080078125, -4.28076171875, -4.054443359375, -3.828125, -3.601806640625, -3.37548828125, -3.149169921875, -2.9228515625, -2.696533203125, -2.47021484375, -2.243896484375, -2.017578125, -1.791259765625, -1.56494140625, -1.338623046875, -1.1123046875, -0.885986328125, -0.65966796875, -0.433349609375, -0.20703125, 0.019287109375, 0.24560546875, 0.471923828125, 0.6982421875, 0.924560546875, 1.15087890625, 1.377197265625, 1.603515625, 1.829833984375, 2.05615234375, 2.282470703125, 2.5087890625, 2.735107421875, 2.96142578125, 3.187744140625, 3.4140625, 3.640380859375, 3.86669921875, 4.093017578125, 4.3193359375, 4.545654296875, 4.77197265625, 4.998291015625, 5.224609375, 5.450927734375, 5.67724609375, 5.903564453125, 6.1298828125, 6.356201171875, 6.58251953125, 6.808837890625, 7.03515625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 3.0, 6.0, 5.0, 10.0, 12.0, 15.0, 26.0, 54.0, 89.0, 111.0, 200.0, 333.0, 682.0, 1636.0, 4207.0, 12731.0, 52772.0, 346907.0, 520123.0, 81336.0, 17876.0, 5595.0, 2013.0, 837.0, 396.0, 212.0, 122.0, 74.0, 54.0, 35.0, 21.0, 18.0, 9.0, 8.0, 10.0, 5.0, 4.0, 2.0, 4.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3515625, -5.1678466796875, -4.984130859375, -4.8004150390625, -4.61669921875, -4.4329833984375, -4.249267578125, -4.0655517578125, -3.8818359375, -3.6981201171875, -3.514404296875, -3.3306884765625, -3.14697265625, -2.9632568359375, -2.779541015625, -2.5958251953125, -2.412109375, -2.2283935546875, -2.044677734375, -1.8609619140625, -1.67724609375, -1.4935302734375, -1.309814453125, -1.1260986328125, -0.9423828125, -0.7586669921875, -0.574951171875, -0.3912353515625, -0.20751953125, -0.0238037109375, 0.159912109375, 0.3436279296875, 0.52734375, 0.7110595703125, 0.894775390625, 1.0784912109375, 1.26220703125, 1.4459228515625, 1.629638671875, 1.8133544921875, 1.9970703125, 2.1807861328125, 2.364501953125, 2.5482177734375, 2.73193359375, 2.9156494140625, 3.099365234375, 3.2830810546875, 3.466796875, 3.6505126953125, 3.834228515625, 4.0179443359375, 4.20166015625, 4.3853759765625, 4.569091796875, 4.7528076171875, 4.9365234375, 5.1202392578125, 5.303955078125, 5.4876708984375, 5.67138671875, 5.8551025390625, 6.038818359375, 6.2225341796875, 6.40625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 9.0, 6.0, 11.0, 16.0, 21.0, 31.0, 39.0, 52.0, 87.0, 109.0, 128.0, 113.0, 114.0, 72.0, 55.0, 44.0, 29.0, 17.0, 10.0, 8.0, 8.0, 10.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006842613220214844, -0.0006606057286262512, -0.0006369501352310181, -0.0006132945418357849, -0.0005896389484405518, -0.0005659833550453186, -0.0005423277616500854, -0.0005186721682548523, -0.0004950165748596191, -0.000471360981464386, -0.00044770538806915283, -0.0004240497946739197, -0.0004003942012786865, -0.00037673860788345337, -0.0003530830144882202, -0.00032942742109298706, -0.0003057718276977539, -0.00028211623430252075, -0.0002584606409072876, -0.00023480504751205444, -0.0002111494541168213, -0.00018749386072158813, -0.00016383826732635498, -0.00014018267393112183, -0.00011652708053588867, -9.287148714065552e-05, -6.921589374542236e-05, -4.556030035018921e-05, -2.1904706954956055e-05, 1.7508864402770996e-06, 2.5406479835510254e-05, 4.906207323074341e-05, 7.271766662597656e-05, 9.637326002120972e-05, 0.00012002885341644287, 0.00014368444681167603, 0.00016734004020690918, 0.00019099563360214233, 0.0002146512269973755, 0.00023830682039260864, 0.0002619624137878418, 0.00028561800718307495, 0.0003092736005783081, 0.00033292919397354126, 0.0003565847873687744, 0.00038024038076400757, 0.0004038959741592407, 0.0004275515675544739, 0.00045120716094970703, 0.0004748627543449402, 0.0004985183477401733, 0.0005221739411354065, 0.0005458295345306396, 0.0005694851279258728, 0.000593140721321106, 0.0006167963147163391, 0.0006404519081115723, 0.0006641075015068054, 0.0006877630949020386, 0.0007114186882972717, 0.0007350742816925049, 0.000758729875087738, 0.0007823854684829712, 0.0008060410618782043, 0.0008296966552734375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 9.0, 7.0, 9.0, 15.0, 23.0, 47.0, 66.0, 120.0, 246.0, 532.0, 1201.0, 3451.0, 14371.0, 109066.0, 740873.0, 153842.0, 17888.0, 4134.0, 1416.0, 612.0, 305.0, 133.0, 71.0, 42.0, 29.0, 16.0, 17.0, 7.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.09375, -5.8643798828125, -5.635009765625, -5.4056396484375, -5.17626953125, -4.9468994140625, -4.717529296875, -4.4881591796875, -4.2587890625, -4.0294189453125, -3.800048828125, -3.5706787109375, -3.34130859375, -3.1119384765625, -2.882568359375, -2.6531982421875, -2.423828125, -2.1944580078125, -1.965087890625, -1.7357177734375, -1.50634765625, -1.2769775390625, -1.047607421875, -0.8182373046875, -0.5888671875, -0.3594970703125, -0.130126953125, 0.0992431640625, 0.32861328125, 0.5579833984375, 0.787353515625, 1.0167236328125, 1.24609375, 1.4754638671875, 1.704833984375, 1.9342041015625, 2.16357421875, 2.3929443359375, 2.622314453125, 2.8516845703125, 3.0810546875, 3.3104248046875, 3.539794921875, 3.7691650390625, 3.99853515625, 4.2279052734375, 4.457275390625, 4.6866455078125, 4.916015625, 5.1453857421875, 5.374755859375, 5.6041259765625, 5.83349609375, 6.0628662109375, 6.292236328125, 6.5216064453125, 6.7509765625, 6.9803466796875, 7.209716796875, 7.4390869140625, 7.66845703125, 7.8978271484375, 8.127197265625, 8.3565673828125, 8.5859375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 6.0, 9.0, 5.0, 10.0, 20.0, 16.0, 20.0, 23.0, 31.0, 40.0, 47.0, 71.0, 82.0, 90.0, 78.0, 84.0, 76.0, 49.0, 43.0, 36.0, 34.0, 19.0, 20.0, 19.0, 16.0, 9.0, 5.0, 6.0, 10.0, 3.0, 4.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.44140625, -3.333831787109375, -3.22625732421875, -3.118682861328125, -3.0111083984375, -2.903533935546875, -2.79595947265625, -2.688385009765625, -2.580810546875, -2.473236083984375, -2.36566162109375, -2.258087158203125, -2.1505126953125, -2.042938232421875, -1.93536376953125, -1.827789306640625, -1.72021484375, -1.612640380859375, -1.50506591796875, -1.397491455078125, -1.2899169921875, -1.182342529296875, -1.07476806640625, -0.967193603515625, -0.859619140625, -0.752044677734375, -0.64447021484375, -0.536895751953125, -0.4293212890625, -0.321746826171875, -0.21417236328125, -0.106597900390625, 0.0009765625, 0.108551025390625, 0.21612548828125, 0.323699951171875, 0.4312744140625, 0.538848876953125, 0.64642333984375, 0.753997802734375, 0.861572265625, 0.969146728515625, 1.07672119140625, 1.184295654296875, 1.2918701171875, 1.399444580078125, 1.50701904296875, 1.614593505859375, 1.72216796875, 1.829742431640625, 1.93731689453125, 2.044891357421875, 2.1524658203125, 2.260040283203125, 2.36761474609375, 2.475189208984375, 2.582763671875, 2.690338134765625, 2.79791259765625, 2.905487060546875, 3.0130615234375, 3.120635986328125, 3.22821044921875, 3.335784912109375, 3.443359375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 9.0, 30.0, 162.0, 400.0, 295.0, 73.0, 24.0, 12.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-245.78265380859375, -240.52084350585938, -235.259033203125, -229.99722290039062, -224.73541259765625, -219.47360229492188, -214.2117919921875, -208.94998168945312, -203.68817138671875, -198.42636108398438, -193.16455078125, -187.90274047851562, -182.64093017578125, -177.37911987304688, -172.1173095703125, -166.85549926757812, -161.59368896484375, -156.33187866210938, -151.070068359375, -145.80825805664062, -140.54644775390625, -135.28463745117188, -130.0228271484375, -124.76101684570312, -119.49922180175781, -114.23741149902344, -108.97560119628906, -103.71379089355469, -98.45198059082031, -93.19017028808594, -87.92835998535156, -82.66654968261719, -77.40473937988281, -72.14292907714844, -66.88111877441406, -61.61930847167969, -56.35749816894531, -51.09568786621094, -45.83388137817383, -40.57207107543945, -35.31026077270508, -30.048450469970703, -24.786640167236328, -19.524831771850586, -14.263021469116211, -9.001211166381836, -3.7394027709960938, 1.5224075317382812, 6.784217834472656, 12.046028137207031, 17.307838439941406, 22.56964683532715, 27.831457138061523, 33.09326934814453, 38.35507583618164, 43.616886138916016, 48.87869644165039, 54.140506744384766, 59.40231704711914, 64.66412353515625, 69.92593383789062, 75.187744140625, 80.44955444335938, 85.71136474609375, 90.97317504882812]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 7.0, 15.0, 8.0, 15.0, 9.0, 23.0, 33.0, 33.0, 47.0, 44.0, 43.0, 69.0, 54.0, 65.0, 61.0, 74.0, 65.0, 56.0, 34.0, 49.0, 30.0, 39.0, 34.0, 24.0, 18.0, 7.0, 6.0, 12.0, 9.0, 2.0, 6.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.54570007324219, -48.94247055053711, -47.339237213134766, -45.73600769042969, -44.13277816772461, -42.52954864501953, -40.92631530761719, -39.32308578491211, -37.71985626220703, -36.11662673950195, -34.51339340209961, -32.91016387939453, -31.306934356689453, -29.703702926635742, -28.10047149658203, -26.497241973876953, -24.89400863647461, -23.2907772064209, -21.68754768371582, -20.08431625366211, -18.48108673095703, -16.87785530090332, -15.27462387084961, -13.671393394470215, -12.06816291809082, -10.464932441711426, -8.861701965332031, -7.25847053527832, -5.655240058898926, -4.052009582519531, -2.4487781524658203, -0.8455476760864258, 0.7576828002929688, 2.3609135150909424, 3.964144229888916, 5.567375183105469, 7.170605659484863, 8.773836135864258, 10.377067565917969, 11.980298042297363, 13.583528518676758, 15.186758995056152, 16.789989471435547, 18.393220901489258, 19.99645233154297, 21.599681854248047, 23.202913284301758, 24.80614471435547, 26.409374237060547, 28.012605667114258, 29.615835189819336, 31.219066619873047, 32.822296142578125, 34.42552947998047, 36.02875900268555, 37.631988525390625, 39.23522186279297, 40.83845138549805, 42.44168472290039, 44.04491424560547, 45.64814376831055, 47.251373291015625, 48.85460662841797, 50.45783615112305, 52.061065673828125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 6.0, 14.0, 11.0, 6.0, 22.0, 23.0, 32.0, 36.0, 45.0, 69.0, 87.0, 129.0, 190.0, 250.0, 428.0, 789.0, 1502.0, 3547.0, 9270.0, 31486.0, 163520.0, 3494122.0, 412112.0, 53680.0, 13996.0, 4825.0, 1963.0, 952.0, 440.0, 290.0, 170.0, 109.0, 62.0, 25.0, 21.0, 10.0, 12.0, 7.0, 4.0, 3.0, 2.0, 1.0, 3.0], "bins": [-17.03125, -16.6322021484375, -16.233154296875, -15.8341064453125, -15.43505859375, -15.0360107421875, -14.636962890625, -14.2379150390625, -13.8388671875, -13.4398193359375, -13.040771484375, -12.6417236328125, -12.24267578125, -11.8436279296875, -11.444580078125, -11.0455322265625, -10.646484375, -10.2474365234375, -9.848388671875, -9.4493408203125, -9.05029296875, -8.6512451171875, -8.252197265625, -7.8531494140625, -7.4541015625, -7.0550537109375, -6.656005859375, -6.2569580078125, -5.85791015625, -5.4588623046875, -5.059814453125, -4.6607666015625, -4.26171875, -3.8626708984375, -3.463623046875, -3.0645751953125, -2.66552734375, -2.2664794921875, -1.867431640625, -1.4683837890625, -1.0693359375, -0.6702880859375, -0.271240234375, 0.1278076171875, 0.52685546875, 0.9259033203125, 1.324951171875, 1.7239990234375, 2.123046875, 2.5220947265625, 2.921142578125, 3.3201904296875, 3.71923828125, 4.1182861328125, 4.517333984375, 4.9163818359375, 5.3154296875, 5.7144775390625, 6.113525390625, 6.5125732421875, 6.91162109375, 7.3106689453125, 7.709716796875, 8.1087646484375, 8.5078125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 2.0, 5.0, 3.0, 4.0, 7.0, 14.0, 27.0, 23.0, 24.0, 42.0, 42.0, 53.0, 57.0, 62.0, 64.0, 65.0, 75.0, 75.0, 68.0, 55.0, 51.0, 34.0, 32.0, 27.0, 27.0, 18.0, 14.0, 12.0, 5.0, 6.0, 3.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0390625, -1.9850921630859375, -1.931121826171875, -1.8771514892578125, -1.82318115234375, -1.7692108154296875, -1.715240478515625, -1.6612701416015625, -1.6072998046875, -1.5533294677734375, -1.499359130859375, -1.4453887939453125, -1.39141845703125, -1.3374481201171875, -1.283477783203125, -1.2295074462890625, -1.175537109375, -1.1215667724609375, -1.067596435546875, -1.0136260986328125, -0.95965576171875, -0.9056854248046875, -0.851715087890625, -0.7977447509765625, -0.7437744140625, -0.6898040771484375, -0.635833740234375, -0.5818634033203125, -0.52789306640625, -0.4739227294921875, -0.419952392578125, -0.3659820556640625, -0.31201171875, -0.2580413818359375, -0.204071044921875, -0.1501007080078125, -0.09613037109375, -0.0421600341796875, 0.011810302734375, 0.0657806396484375, 0.1197509765625, 0.1737213134765625, 0.227691650390625, 0.2816619873046875, 0.33563232421875, 0.3896026611328125, 0.443572998046875, 0.4975433349609375, 0.551513671875, 0.6054840087890625, 0.659454345703125, 0.7134246826171875, 0.76739501953125, 0.8213653564453125, 0.875335693359375, 0.9293060302734375, 0.9832763671875, 1.0372467041015625, 1.091217041015625, 1.1451873779296875, 1.19915771484375, 1.2531280517578125, 1.307098388671875, 1.3610687255859375, 1.4150390625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 6.0, 2.0, 13.0, 14.0, 26.0, 44.0, 70.0, 131.0, 271.0, 697.0, 2265.0, 11418.0, 311102.0, 3833163.0, 28964.0, 4131.0, 1136.0, 380.0, 193.0, 92.0, 60.0, 22.0, 20.0, 16.0, 7.0, 12.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.8125, -23.962890625, -23.11328125, -22.263671875, -21.4140625, -20.564453125, -19.71484375, -18.865234375, -18.015625, -17.166015625, -16.31640625, -15.466796875, -14.6171875, -13.767578125, -12.91796875, -12.068359375, -11.21875, -10.369140625, -9.51953125, -8.669921875, -7.8203125, -6.970703125, -6.12109375, -5.271484375, -4.421875, -3.572265625, -2.72265625, -1.873046875, -1.0234375, -0.173828125, 0.67578125, 1.525390625, 2.375, 3.224609375, 4.07421875, 4.923828125, 5.7734375, 6.623046875, 7.47265625, 8.322265625, 9.171875, 10.021484375, 10.87109375, 11.720703125, 12.5703125, 13.419921875, 14.26953125, 15.119140625, 15.96875, 16.818359375, 17.66796875, 18.517578125, 19.3671875, 20.216796875, 21.06640625, 21.916015625, 22.765625, 23.615234375, 24.46484375, 25.314453125, 26.1640625, 27.013671875, 27.86328125, 28.712890625, 29.5625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 8.0, 6.0, 8.0, 10.0, 16.0, 15.0, 27.0, 34.0, 66.0, 111.0, 251.0, 496.0, 1332.0, 899.0, 374.0, 177.0, 88.0, 42.0, 29.0, 23.0, 10.0, 11.0, 13.0, 6.0, 4.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6015625, -4.456787109375, -4.31201171875, -4.167236328125, -4.0224609375, -3.877685546875, -3.73291015625, -3.588134765625, -3.443359375, -3.298583984375, -3.15380859375, -3.009033203125, -2.8642578125, -2.719482421875, -2.57470703125, -2.429931640625, -2.28515625, -2.140380859375, -1.99560546875, -1.850830078125, -1.7060546875, -1.561279296875, -1.41650390625, -1.271728515625, -1.126953125, -0.982177734375, -0.83740234375, -0.692626953125, -0.5478515625, -0.403076171875, -0.25830078125, -0.113525390625, 0.03125, 0.176025390625, 0.32080078125, 0.465576171875, 0.6103515625, 0.755126953125, 0.89990234375, 1.044677734375, 1.189453125, 1.334228515625, 1.47900390625, 1.623779296875, 1.7685546875, 1.913330078125, 2.05810546875, 2.202880859375, 2.34765625, 2.492431640625, 2.63720703125, 2.781982421875, 2.9267578125, 3.071533203125, 3.21630859375, 3.361083984375, 3.505859375, 3.650634765625, 3.79541015625, 3.940185546875, 4.0849609375, 4.229736328125, 4.37451171875, 4.519287109375, 4.6640625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 70.0, 504.0, 370.0, 47.0, 7.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-180.36361694335938, -175.72744750976562, -171.09127807617188, -166.45510864257812, -161.81893920898438, -157.18276977539062, -152.54660034179688, -147.91043090820312, -143.27426147460938, -138.63809204101562, -134.00192260742188, -129.36575317382812, -124.72958374023438, -120.09341430664062, -115.45724487304688, -110.82107543945312, -106.1849136352539, -101.54874420166016, -96.9125747680664, -92.27640533447266, -87.6402359008789, -83.00406646728516, -78.36790466308594, -73.73173522949219, -69.09556579589844, -64.45939636230469, -59.82322692871094, -55.18705749511719, -50.55088806152344, -45.91471862792969, -41.2785530090332, -36.64238357543945, -32.00621032714844, -27.370040893554688, -22.733871459960938, -18.09770393371582, -13.46153450012207, -8.82536506652832, -4.189197540283203, 0.4469718933105469, 5.083141326904297, 9.719310760498047, 14.35547924041748, 18.991647720336914, 23.627817153930664, 28.263986587524414, 32.90015411376953, 37.53632354736328, 42.17249298095703, 46.80866241455078, 51.44483184814453, 56.08100128173828, 60.71717071533203, 65.35334014892578, 69.989501953125, 74.62567138671875, 79.2618408203125, 83.89801025390625, 88.5341796875, 93.17034912109375, 97.8065185546875, 102.44268798828125, 107.078857421875, 111.71502685546875, 116.3511962890625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 6.0, 7.0, 6.0, 9.0, 10.0, 13.0, 14.0, 23.0, 25.0, 41.0, 40.0, 47.0, 46.0, 48.0, 41.0, 57.0, 51.0, 73.0, 51.0, 65.0, 64.0, 49.0, 44.0, 43.0, 28.0, 28.0, 19.0, 11.0, 15.0, 8.0, 6.0, 4.0, 1.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.07938003540039, -17.502084732055664, -16.924789428710938, -16.34749412536621, -15.770197868347168, -15.192902565002441, -14.615606307983398, -14.038311004638672, -13.461015701293945, -12.883720397949219, -12.306425094604492, -11.72912883758545, -11.151833534240723, -10.574538230895996, -9.997241973876953, -9.419946670532227, -8.8426513671875, -8.265356063842773, -7.688060283660889, -7.110764503479004, -6.533469200134277, -5.956173896789551, -5.378878116607666, -4.801582336425781, -4.224287033081055, -3.646991491317749, -3.0696959495544434, -2.4924004077911377, -1.915104866027832, -1.3378093242645264, -0.7605137825012207, -0.18321800231933594, 0.3940773010253906, 0.9713728427886963, 1.548668384552002, 2.1259639263153076, 2.7032594680786133, 3.280555009841919, 3.8578505516052246, 4.435146331787109, 5.012441635131836, 5.5897369384765625, 6.167032718658447, 6.744328498840332, 7.321623802185059, 7.898919105529785, 8.476215362548828, 9.053510665893555, 9.630805969238281, 10.208101272583008, 10.785396575927734, 11.362692832946777, 11.939988136291504, 12.51728343963623, 13.094579696655273, 13.671875, 14.249170303344727, 14.826465606689453, 15.40376091003418, 15.981057167053223, 16.558353424072266, 17.135648727416992, 17.71294403076172, 18.290239334106445, 18.867534637451172]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 2.0, 2.0, 3.0, 8.0, 5.0, 11.0, 15.0, 14.0, 18.0, 14.0, 25.0, 31.0, 43.0, 63.0, 81.0, 149.0, 201.0, 349.0, 733.0, 1613.0, 3928.0, 11547.0, 40190.0, 168317.0, 525376.0, 222112.0, 50998.0, 14292.0, 4706.0, 1760.0, 799.0, 436.0, 245.0, 137.0, 102.0, 49.0, 39.0, 29.0, 25.0, 23.0, 18.0, 9.0, 10.0, 5.0, 6.0, 7.0, 6.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0], "bins": [-11.9296875, -11.594482421875, -11.25927734375, -10.924072265625, -10.5888671875, -10.253662109375, -9.91845703125, -9.583251953125, -9.248046875, -8.912841796875, -8.57763671875, -8.242431640625, -7.9072265625, -7.572021484375, -7.23681640625, -6.901611328125, -6.56640625, -6.231201171875, -5.89599609375, -5.560791015625, -5.2255859375, -4.890380859375, -4.55517578125, -4.219970703125, -3.884765625, -3.549560546875, -3.21435546875, -2.879150390625, -2.5439453125, -2.208740234375, -1.87353515625, -1.538330078125, -1.203125, -0.867919921875, -0.53271484375, -0.197509765625, 0.1376953125, 0.472900390625, 0.80810546875, 1.143310546875, 1.478515625, 1.813720703125, 2.14892578125, 2.484130859375, 2.8193359375, 3.154541015625, 3.48974609375, 3.824951171875, 4.16015625, 4.495361328125, 4.83056640625, 5.165771484375, 5.5009765625, 5.836181640625, 6.17138671875, 6.506591796875, 6.841796875, 7.177001953125, 7.51220703125, 7.847412109375, 8.1826171875, 8.517822265625, 8.85302734375, 9.188232421875, 9.5234375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 6.0, 4.0, 7.0, 2.0, 14.0, 11.0, 23.0, 18.0, 30.0, 36.0, 29.0, 47.0, 45.0, 76.0, 67.0, 55.0, 59.0, 59.0, 63.0, 51.0, 44.0, 46.0, 52.0, 41.0, 22.0, 23.0, 16.0, 17.0, 13.0, 11.0, 3.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-2.1484375, -2.097686767578125, -2.04693603515625, -1.996185302734375, -1.9454345703125, -1.894683837890625, -1.84393310546875, -1.793182373046875, -1.742431640625, -1.691680908203125, -1.64093017578125, -1.590179443359375, -1.5394287109375, -1.488677978515625, -1.43792724609375, -1.387176513671875, -1.33642578125, -1.285675048828125, -1.23492431640625, -1.184173583984375, -1.1334228515625, -1.082672119140625, -1.03192138671875, -0.981170654296875, -0.930419921875, -0.879669189453125, -0.82891845703125, -0.778167724609375, -0.7274169921875, -0.676666259765625, -0.62591552734375, -0.575164794921875, -0.5244140625, -0.473663330078125, -0.42291259765625, -0.372161865234375, -0.3214111328125, -0.270660400390625, -0.21990966796875, -0.169158935546875, -0.118408203125, -0.067657470703125, -0.01690673828125, 0.033843994140625, 0.0845947265625, 0.135345458984375, 0.18609619140625, 0.236846923828125, 0.28759765625, 0.338348388671875, 0.38909912109375, 0.439849853515625, 0.4906005859375, 0.541351318359375, 0.59210205078125, 0.642852783203125, 0.693603515625, 0.744354248046875, 0.79510498046875, 0.845855712890625, 0.8966064453125, 0.947357177734375, 0.99810791015625, 1.048858642578125, 1.099609375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 5.0, 8.0, 8.0, 15.0, 18.0, 35.0, 51.0, 57.0, 112.0, 191.0, 422.0, 1039.0, 3414.0, 16971.0, 122106.0, 629063.0, 236352.0, 30614.0, 5328.0, 1522.0, 572.0, 255.0, 137.0, 93.0, 45.0, 23.0, 31.0, 15.0, 5.0, 9.0, 5.0, 6.0, 7.0, 5.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.4453125, -12.0963134765625, -11.747314453125, -11.3983154296875, -11.04931640625, -10.7003173828125, -10.351318359375, -10.0023193359375, -9.6533203125, -9.3043212890625, -8.955322265625, -8.6063232421875, -8.25732421875, -7.9083251953125, -7.559326171875, -7.2103271484375, -6.861328125, -6.5123291015625, -6.163330078125, -5.8143310546875, -5.46533203125, -5.1163330078125, -4.767333984375, -4.4183349609375, -4.0693359375, -3.7203369140625, -3.371337890625, -3.0223388671875, -2.67333984375, -2.3243408203125, -1.975341796875, -1.6263427734375, -1.27734375, -0.9283447265625, -0.579345703125, -0.2303466796875, 0.11865234375, 0.4676513671875, 0.816650390625, 1.1656494140625, 1.5146484375, 1.8636474609375, 2.212646484375, 2.5616455078125, 2.91064453125, 3.2596435546875, 3.608642578125, 3.9576416015625, 4.306640625, 4.6556396484375, 5.004638671875, 5.3536376953125, 5.70263671875, 6.0516357421875, 6.400634765625, 6.7496337890625, 7.0986328125, 7.4476318359375, 7.796630859375, 8.1456298828125, 8.49462890625, 8.8436279296875, 9.192626953125, 9.5416259765625, 9.890625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 1.0, 8.0, 10.0, 10.0, 15.0, 12.0, 17.0, 25.0, 20.0, 26.0, 41.0, 31.0, 49.0, 42.0, 40.0, 38.0, 53.0, 49.0, 49.0, 55.0, 47.0, 40.0, 45.0, 35.0, 37.0, 27.0, 44.0, 20.0, 27.0, 15.0, 20.0, 11.0, 11.0, 12.0, 4.0, 3.0, 1.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-7.2421875, -7.04638671875, -6.8505859375, -6.65478515625, -6.458984375, -6.26318359375, -6.0673828125, -5.87158203125, -5.67578125, -5.47998046875, -5.2841796875, -5.08837890625, -4.892578125, -4.69677734375, -4.5009765625, -4.30517578125, -4.109375, -3.91357421875, -3.7177734375, -3.52197265625, -3.326171875, -3.13037109375, -2.9345703125, -2.73876953125, -2.54296875, -2.34716796875, -2.1513671875, -1.95556640625, -1.759765625, -1.56396484375, -1.3681640625, -1.17236328125, -0.9765625, -0.78076171875, -0.5849609375, -0.38916015625, -0.193359375, 0.00244140625, 0.1982421875, 0.39404296875, 0.58984375, 0.78564453125, 0.9814453125, 1.17724609375, 1.373046875, 1.56884765625, 1.7646484375, 1.96044921875, 2.15625, 2.35205078125, 2.5478515625, 2.74365234375, 2.939453125, 3.13525390625, 3.3310546875, 3.52685546875, 3.72265625, 3.91845703125, 4.1142578125, 4.31005859375, 4.505859375, 4.70166015625, 4.8974609375, 5.09326171875, 5.2890625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 6.0, 13.0, 13.0, 21.0, 35.0, 51.0, 109.0, 189.0, 418.0, 1104.0, 3539.0, 14466.0, 93735.0, 726577.0, 178220.0, 22621.0, 4971.0, 1392.0, 570.0, 227.0, 121.0, 53.0, 44.0, 27.0, 14.0, 6.0, 8.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.15234375, -6.86199951171875, -6.5716552734375, -6.28131103515625, -5.990966796875, -5.70062255859375, -5.4102783203125, -5.11993408203125, -4.82958984375, -4.53924560546875, -4.2489013671875, -3.95855712890625, -3.668212890625, -3.37786865234375, -3.0875244140625, -2.79718017578125, -2.5068359375, -2.21649169921875, -1.9261474609375, -1.63580322265625, -1.345458984375, -1.05511474609375, -0.7647705078125, -0.47442626953125, -0.18408203125, 0.10626220703125, 0.3966064453125, 0.68695068359375, 0.977294921875, 1.26763916015625, 1.5579833984375, 1.84832763671875, 2.138671875, 2.42901611328125, 2.7193603515625, 3.00970458984375, 3.300048828125, 3.59039306640625, 3.8807373046875, 4.17108154296875, 4.46142578125, 4.75177001953125, 5.0421142578125, 5.33245849609375, 5.622802734375, 5.91314697265625, 6.2034912109375, 6.49383544921875, 6.7841796875, 7.07452392578125, 7.3648681640625, 7.65521240234375, 7.945556640625, 8.23590087890625, 8.5262451171875, 8.81658935546875, 9.10693359375, 9.39727783203125, 9.6876220703125, 9.97796630859375, 10.268310546875, 10.55865478515625, 10.8489990234375, 11.13934326171875, 11.4296875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 11.0, 3.0, 8.0, 10.0, 13.0, 17.0, 15.0, 18.0, 36.0, 33.0, 53.0, 70.0, 79.0, 119.0, 98.0, 90.0, 69.0, 51.0, 41.0, 34.0, 22.0, 18.0, 18.0, 11.0, 9.0, 10.0, 6.0, 9.0, 3.0, 9.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0005536079406738281, -0.0005383417010307312, -0.0005230754613876343, -0.0005078092217445374, -0.0004925429821014404, -0.0004772767424583435, -0.0004620105028152466, -0.00044674426317214966, -0.00043147802352905273, -0.0004162117838859558, -0.0004009455442428589, -0.00038567930459976196, -0.00037041306495666504, -0.0003551468253135681, -0.0003398805856704712, -0.00032461434602737427, -0.00030934810638427734, -0.0002940818667411804, -0.0002788156270980835, -0.00026354938745498657, -0.00024828314781188965, -0.00023301690816879272, -0.0002177506685256958, -0.00020248442888259888, -0.00018721818923950195, -0.00017195194959640503, -0.0001566857099533081, -0.00014141947031021118, -0.00012615323066711426, -0.00011088699102401733, -9.562075138092041e-05, -8.035451173782349e-05, -6.508827209472656e-05, -4.982203245162964e-05, -3.4555792808532715e-05, -1.928955316543579e-05, -4.023313522338867e-06, 1.1242926120758057e-05, 2.650916576385498e-05, 4.1775405406951904e-05, 5.704164505004883e-05, 7.230788469314575e-05, 8.757412433624268e-05, 0.0001028403639793396, 0.00011810660362243652, 0.00013337284326553345, 0.00014863908290863037, 0.0001639053225517273, 0.00017917156219482422, 0.00019443780183792114, 0.00020970404148101807, 0.000224970281124115, 0.00024023652076721191, 0.00025550276041030884, 0.00027076900005340576, 0.0002860352396965027, 0.0003013014793395996, 0.00031656771898269653, 0.00033183395862579346, 0.0003471001982688904, 0.0003623664379119873, 0.00037763267755508423, 0.00039289891719818115, 0.0004081651568412781, 0.000423431396484375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 6.0, 5.0, 18.0, 32.0, 42.0, 96.0, 163.0, 303.0, 622.0, 1619.0, 5307.0, 26946.0, 271202.0, 671872.0, 56854.0, 9366.0, 2478.0, 821.0, 356.0, 174.0, 102.0, 60.0, 36.0, 27.0, 20.0, 11.0, 5.0, 0.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2734375, -7.95751953125, -7.6416015625, -7.32568359375, -7.009765625, -6.69384765625, -6.3779296875, -6.06201171875, -5.74609375, -5.43017578125, -5.1142578125, -4.79833984375, -4.482421875, -4.16650390625, -3.8505859375, -3.53466796875, -3.21875, -2.90283203125, -2.5869140625, -2.27099609375, -1.955078125, -1.63916015625, -1.3232421875, -1.00732421875, -0.69140625, -0.37548828125, -0.0595703125, 0.25634765625, 0.572265625, 0.88818359375, 1.2041015625, 1.52001953125, 1.8359375, 2.15185546875, 2.4677734375, 2.78369140625, 3.099609375, 3.41552734375, 3.7314453125, 4.04736328125, 4.36328125, 4.67919921875, 4.9951171875, 5.31103515625, 5.626953125, 5.94287109375, 6.2587890625, 6.57470703125, 6.890625, 7.20654296875, 7.5224609375, 7.83837890625, 8.154296875, 8.47021484375, 8.7861328125, 9.10205078125, 9.41796875, 9.73388671875, 10.0498046875, 10.36572265625, 10.681640625, 10.99755859375, 11.3134765625, 11.62939453125, 11.9453125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 8.0, 12.0, 12.0, 7.0, 22.0, 21.0, 36.0, 49.0, 59.0, 76.0, 110.0, 141.0, 108.0, 94.0, 54.0, 48.0, 28.0, 24.0, 17.0, 18.0, 9.0, 3.0, 5.0, 5.0, 8.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.33203125, -5.16278076171875, -4.9935302734375, -4.82427978515625, -4.655029296875, -4.48577880859375, -4.3165283203125, -4.14727783203125, -3.97802734375, -3.80877685546875, -3.6395263671875, -3.47027587890625, -3.301025390625, -3.13177490234375, -2.9625244140625, -2.79327392578125, -2.6240234375, -2.45477294921875, -2.2855224609375, -2.11627197265625, -1.947021484375, -1.77777099609375, -1.6085205078125, -1.43927001953125, -1.27001953125, -1.10076904296875, -0.9315185546875, -0.76226806640625, -0.593017578125, -0.42376708984375, -0.2545166015625, -0.08526611328125, 0.083984375, 0.25323486328125, 0.4224853515625, 0.59173583984375, 0.760986328125, 0.93023681640625, 1.0994873046875, 1.26873779296875, 1.43798828125, 1.60723876953125, 1.7764892578125, 1.94573974609375, 2.114990234375, 2.28424072265625, 2.4534912109375, 2.62274169921875, 2.7919921875, 2.96124267578125, 3.1304931640625, 3.29974365234375, 3.468994140625, 3.63824462890625, 3.8074951171875, 3.97674560546875, 4.14599609375, 4.31524658203125, 4.4844970703125, 4.65374755859375, 4.822998046875, 4.99224853515625, 5.1614990234375, 5.33074951171875, 5.5]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 21.0, 29.0, 89.0, 202.0, 254.0, 220.0, 104.0, 45.0, 23.0, 10.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-131.09078979492188, -127.86033630371094, -124.6298828125, -121.39942932128906, -118.16898345947266, -114.93852996826172, -111.70807647705078, -108.47762298583984, -105.24717712402344, -102.0167236328125, -98.78627014160156, -95.55581665039062, -92.32537078857422, -89.09491729736328, -85.86446380615234, -82.6340103149414, -79.40355682373047, -76.17310333251953, -72.9426498413086, -69.71220397949219, -66.48175048828125, -63.25129699707031, -60.020843505859375, -56.79039001464844, -53.559940338134766, -50.32948684692383, -47.099037170410156, -43.86858367919922, -40.63813018798828, -37.40768051147461, -34.17722702026367, -30.946775436401367, -27.716331481933594, -24.48587989807129, -21.255428314208984, -18.024974822998047, -14.794523239135742, -11.564071655273438, -8.3336181640625, -5.103166580200195, -1.8727149963378906, 1.3577370643615723, 4.588189125061035, 7.818641662597656, 11.049093246459961, 14.279544830322266, 17.509998321533203, 20.740449905395508, 23.970901489257812, 27.201353073120117, 30.431804656982422, 33.66225814819336, 36.89270782470703, 40.12316131591797, 43.353614807128906, 46.584068298339844, 49.814517974853516, 53.04497146606445, 56.275421142578125, 59.50587463378906, 62.736328125, 65.96678161621094, 69.19723510742188, 72.42768096923828, 75.65813446044922]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 5.0, 6.0, 5.0, 7.0, 12.0, 10.0, 12.0, 19.0, 18.0, 25.0, 28.0, 34.0, 33.0, 34.0, 35.0, 36.0, 43.0, 47.0, 47.0, 47.0, 39.0, 43.0, 45.0, 42.0, 45.0, 23.0, 36.0, 35.0, 36.0, 23.0, 29.0, 15.0, 14.0, 12.0, 13.0, 10.0, 13.0, 5.0, 8.0, 10.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.629146575927734, -30.551347732543945, -29.473546981811523, -28.395748138427734, -27.317949295043945, -26.240150451660156, -25.162349700927734, -24.084550857543945, -23.006752014160156, -21.928953170776367, -20.851152420043945, -19.773353576660156, -18.695554733276367, -17.617755889892578, -16.539955139160156, -15.462156295776367, -14.384355545043945, -13.30655574798584, -12.22875690460205, -11.150957107543945, -10.073158264160156, -8.99535846710205, -7.917558670043945, -6.839759349822998, -5.761960029602051, -4.6841607093811035, -3.606361150741577, -2.528561592102051, -1.4507622718811035, -0.37296295166015625, 0.7048368453979492, 1.7826361656188965, 2.8604354858398438, 3.938234806060791, 5.016034126281738, 6.093833923339844, 7.171633243560791, 8.249432563781738, 9.327232360839844, 10.405031204223633, 11.482831001281738, 12.560630798339844, 13.638429641723633, 14.716229438781738, 15.794029235839844, 16.871828079223633, 17.949626922607422, 19.027427673339844, 20.105226516723633, 21.183025360107422, 22.260826110839844, 23.338624954223633, 24.416423797607422, 25.494224548339844, 26.572023391723633, 27.649822235107422, 28.727622985839844, 29.805421829223633, 30.883222579956055, 31.961021423339844, 33.038822174072266, 34.11661911010742, 35.194419860839844, 36.272220611572266, 37.35001754760742]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 3.0, 5.0, 9.0, 10.0, 14.0, 14.0, 22.0, 22.0, 37.0, 64.0, 87.0, 125.0, 200.0, 346.0, 750.0, 1586.0, 4077.0, 12594.0, 61910.0, 3211394.0, 839898.0, 44900.0, 10170.0, 3331.0, 1368.0, 590.0, 337.0, 138.0, 105.0, 53.0, 45.0, 25.0, 17.0, 10.0, 7.0, 10.0, 2.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9921875, -11.604248046875, -11.21630859375, -10.828369140625, -10.4404296875, -10.052490234375, -9.66455078125, -9.276611328125, -8.888671875, -8.500732421875, -8.11279296875, -7.724853515625, -7.3369140625, -6.948974609375, -6.56103515625, -6.173095703125, -5.78515625, -5.397216796875, -5.00927734375, -4.621337890625, -4.2333984375, -3.845458984375, -3.45751953125, -3.069580078125, -2.681640625, -2.293701171875, -1.90576171875, -1.517822265625, -1.1298828125, -0.741943359375, -0.35400390625, 0.033935546875, 0.421875, 0.809814453125, 1.19775390625, 1.585693359375, 1.9736328125, 2.361572265625, 2.74951171875, 3.137451171875, 3.525390625, 3.913330078125, 4.30126953125, 4.689208984375, 5.0771484375, 5.465087890625, 5.85302734375, 6.240966796875, 6.62890625, 7.016845703125, 7.40478515625, 7.792724609375, 8.1806640625, 8.568603515625, 8.95654296875, 9.344482421875, 9.732421875, 10.120361328125, 10.50830078125, 10.896240234375, 11.2841796875, 11.672119140625, 12.06005859375, 12.447998046875, 12.8359375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 2.0, 2.0, 7.0, 9.0, 7.0, 10.0, 18.0, 17.0, 29.0, 31.0, 40.0, 51.0, 72.0, 54.0, 68.0, 54.0, 65.0, 74.0, 55.0, 50.0, 61.0, 40.0, 37.0, 27.0, 34.0, 29.0, 14.0, 9.0, 13.0, 11.0, 5.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.248046875, -2.1935882568359375, -2.139129638671875, -2.0846710205078125, -2.03021240234375, -1.9757537841796875, -1.921295166015625, -1.8668365478515625, -1.8123779296875, -1.7579193115234375, -1.703460693359375, -1.6490020751953125, -1.59454345703125, -1.5400848388671875, -1.485626220703125, -1.4311676025390625, -1.376708984375, -1.3222503662109375, -1.267791748046875, -1.2133331298828125, -1.15887451171875, -1.1044158935546875, -1.049957275390625, -0.9954986572265625, -0.9410400390625, -0.8865814208984375, -0.832122802734375, -0.7776641845703125, -0.72320556640625, -0.6687469482421875, -0.614288330078125, -0.5598297119140625, -0.50537109375, -0.4509124755859375, -0.396453857421875, -0.3419952392578125, -0.28753662109375, -0.2330780029296875, -0.178619384765625, -0.1241607666015625, -0.0697021484375, -0.0152435302734375, 0.039215087890625, 0.0936737060546875, 0.14813232421875, 0.2025909423828125, 0.257049560546875, 0.3115081787109375, 0.365966796875, 0.4204254150390625, 0.474884033203125, 0.5293426513671875, 0.58380126953125, 0.6382598876953125, 0.692718505859375, 0.7471771240234375, 0.8016357421875, 0.8560943603515625, 0.910552978515625, 0.9650115966796875, 1.01947021484375, 1.0739288330078125, 1.128387451171875, 1.1828460693359375, 1.2373046875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 8.0, 1.0, 10.0, 17.0, 20.0, 36.0, 64.0, 60.0, 118.0, 193.0, 348.0, 849.0, 3010.0, 21997.0, 1870014.0, 2269190.0, 23390.0, 3070.0, 935.0, 371.0, 206.0, 142.0, 74.0, 48.0, 28.0, 24.0, 20.0, 12.0, 6.0, 7.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.921875, -20.306640625, -19.69140625, -19.076171875, -18.4609375, -17.845703125, -17.23046875, -16.615234375, -16.0, -15.384765625, -14.76953125, -14.154296875, -13.5390625, -12.923828125, -12.30859375, -11.693359375, -11.078125, -10.462890625, -9.84765625, -9.232421875, -8.6171875, -8.001953125, -7.38671875, -6.771484375, -6.15625, -5.541015625, -4.92578125, -4.310546875, -3.6953125, -3.080078125, -2.46484375, -1.849609375, -1.234375, -0.619140625, -0.00390625, 0.611328125, 1.2265625, 1.841796875, 2.45703125, 3.072265625, 3.6875, 4.302734375, 4.91796875, 5.533203125, 6.1484375, 6.763671875, 7.37890625, 7.994140625, 8.609375, 9.224609375, 9.83984375, 10.455078125, 11.0703125, 11.685546875, 12.30078125, 12.916015625, 13.53125, 14.146484375, 14.76171875, 15.376953125, 15.9921875, 16.607421875, 17.22265625, 17.837890625, 18.453125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 15.0, 11.0, 17.0, 32.0, 55.0, 88.0, 183.0, 498.0, 1886.0, 762.0, 218.0, 108.0, 79.0, 36.0, 27.0, 15.0, 11.0, 11.0, 11.0, 3.0, 3.0, 3.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.81640625, -4.67315673828125, -4.5299072265625, -4.38665771484375, -4.243408203125, -4.10015869140625, -3.9569091796875, -3.81365966796875, -3.67041015625, -3.52716064453125, -3.3839111328125, -3.24066162109375, -3.097412109375, -2.95416259765625, -2.8109130859375, -2.66766357421875, -2.5244140625, -2.38116455078125, -2.2379150390625, -2.09466552734375, -1.951416015625, -1.80816650390625, -1.6649169921875, -1.52166748046875, -1.37841796875, -1.23516845703125, -1.0919189453125, -0.94866943359375, -0.805419921875, -0.66217041015625, -0.5189208984375, -0.37567138671875, -0.232421875, -0.08917236328125, 0.0540771484375, 0.19732666015625, 0.340576171875, 0.48382568359375, 0.6270751953125, 0.77032470703125, 0.91357421875, 1.05682373046875, 1.2000732421875, 1.34332275390625, 1.486572265625, 1.62982177734375, 1.7730712890625, 1.91632080078125, 2.0595703125, 2.20281982421875, 2.3460693359375, 2.48931884765625, 2.632568359375, 2.77581787109375, 2.9190673828125, 3.06231689453125, 3.20556640625, 3.34881591796875, 3.4920654296875, 3.63531494140625, 3.778564453125, 3.92181396484375, 4.0650634765625, 4.20831298828125, 4.3515625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 11.0, 61.0, 271.0, 406.0, 196.0, 49.0, 7.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.64601135253906, -46.456756591796875, -44.26750183105469, -42.0782470703125, -39.88899230957031, -37.699737548828125, -35.51047897338867, -33.321224212646484, -31.131969451904297, -28.94271469116211, -26.753459930419922, -24.5642032623291, -22.374948501586914, -20.185693740844727, -17.996437072753906, -15.807182312011719, -13.617927551269531, -11.428672790527344, -9.23941707611084, -7.050161838531494, -4.860906600952148, -2.671651840209961, -0.48239612579345703, 1.7068595886230469, 3.8961143493652344, 6.08536958694458, 8.274624824523926, 10.46388053894043, 12.653135299682617, 14.842390060424805, 17.031646728515625, 19.220901489257812, 21.41014862060547, 23.599403381347656, 25.788658142089844, 27.977914810180664, 30.16716957092285, 32.356422424316406, 34.54568099975586, 36.73493576049805, 38.924190521240234, 41.11344528198242, 43.30270004272461, 45.4919548034668, 47.68121337890625, 49.87046813964844, 52.059722900390625, 54.24897766113281, 56.438232421875, 58.62748718261719, 60.816741943359375, 63.00599670410156, 65.19525146484375, 67.38450622558594, 69.57376098632812, 71.76301574707031, 73.9522705078125, 76.14152526855469, 78.33078002929688, 80.52003479003906, 82.70928955078125, 84.89854431152344, 87.08779907226562, 89.27705383300781, 91.46631622314453]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 9.0, 15.0, 16.0, 23.0, 26.0, 25.0, 33.0, 43.0, 50.0, 58.0, 63.0, 52.0, 46.0, 59.0, 52.0, 51.0, 54.0, 32.0, 49.0, 45.0, 34.0, 37.0, 33.0, 11.0, 21.0, 19.0, 11.0, 4.0, 5.0, 6.0, 3.0, 6.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.039474487304688, -13.590597152709961, -13.14172077178955, -12.692843437194824, -12.243967056274414, -11.795089721679688, -11.346212387084961, -10.897335052490234, -10.448458671569824, -9.999581336975098, -9.550704956054688, -9.101827621459961, -8.652950286865234, -8.204073905944824, -7.755196571350098, -7.306319713592529, -6.857442855834961, -6.408565998077393, -5.959689140319824, -5.510811805725098, -5.061934947967529, -4.613058090209961, -4.164180755615234, -3.715303897857666, -3.2664270401000977, -2.8175501823425293, -2.368673086166382, -1.919796109199524, -1.470919132232666, -1.0220422744750977, -0.5731651782989502, -0.12428808212280273, 0.3245878219604492, 0.7734647989273071, 1.222341775894165, 1.671218752861023, 2.120095729827881, 2.568972587585449, 3.0178496837615967, 3.466726779937744, 3.9156036376953125, 4.364480495452881, 4.813357353210449, 5.262234687805176, 5.711111545562744, 6.1599884033203125, 6.608865737915039, 7.057742595672607, 7.506619453430176, 7.955496311187744, 8.404373168945312, 8.853250503540039, 9.302127838134766, 9.751004219055176, 10.199881553649902, 10.648757934570312, 11.097635269165039, 11.546512603759766, 11.995388984680176, 12.444266319274902, 12.893142700195312, 13.342020034790039, 13.790897369384766, 14.239774703979492, 14.688651084899902]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 10.0, 13.0, 8.0, 22.0, 47.0, 66.0, 156.0, 245.0, 509.0, 1378.0, 4553.0, 19249.0, 114021.0, 554924.0, 292892.0, 47237.0, 9036.0, 2443.0, 902.0, 402.0, 197.0, 102.0, 59.0, 28.0, 19.0, 10.0, 9.0, 9.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.046875, -14.6260986328125, -14.205322265625, -13.7845458984375, -13.36376953125, -12.9429931640625, -12.522216796875, -12.1014404296875, -11.6806640625, -11.2598876953125, -10.839111328125, -10.4183349609375, -9.99755859375, -9.5767822265625, -9.156005859375, -8.7352294921875, -8.314453125, -7.8936767578125, -7.472900390625, -7.0521240234375, -6.63134765625, -6.2105712890625, -5.789794921875, -5.3690185546875, -4.9482421875, -4.5274658203125, -4.106689453125, -3.6859130859375, -3.26513671875, -2.8443603515625, -2.423583984375, -2.0028076171875, -1.58203125, -1.1612548828125, -0.740478515625, -0.3197021484375, 0.10107421875, 0.5218505859375, 0.942626953125, 1.3634033203125, 1.7841796875, 2.2049560546875, 2.625732421875, 3.0465087890625, 3.46728515625, 3.8880615234375, 4.308837890625, 4.7296142578125, 5.150390625, 5.5711669921875, 5.991943359375, 6.4127197265625, 6.83349609375, 7.2542724609375, 7.675048828125, 8.0958251953125, 8.5166015625, 8.9373779296875, 9.358154296875, 9.7789306640625, 10.19970703125, 10.6204833984375, 11.041259765625, 11.4620361328125, 11.8828125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 6.0, 4.0, 7.0, 16.0, 17.0, 22.0, 22.0, 31.0, 31.0, 41.0, 61.0, 70.0, 68.0, 63.0, 68.0, 61.0, 53.0, 55.0, 49.0, 60.0, 35.0, 37.0, 30.0, 30.0, 17.0, 18.0, 8.0, 8.0, 5.0, 4.0, 8.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.275390625, -2.218017578125, -2.16064453125, -2.103271484375, -2.0458984375, -1.988525390625, -1.93115234375, -1.873779296875, -1.81640625, -1.759033203125, -1.70166015625, -1.644287109375, -1.5869140625, -1.529541015625, -1.47216796875, -1.414794921875, -1.357421875, -1.300048828125, -1.24267578125, -1.185302734375, -1.1279296875, -1.070556640625, -1.01318359375, -0.955810546875, -0.8984375, -0.841064453125, -0.78369140625, -0.726318359375, -0.6689453125, -0.611572265625, -0.55419921875, -0.496826171875, -0.439453125, -0.382080078125, -0.32470703125, -0.267333984375, -0.2099609375, -0.152587890625, -0.09521484375, -0.037841796875, 0.01953125, 0.076904296875, 0.13427734375, 0.191650390625, 0.2490234375, 0.306396484375, 0.36376953125, 0.421142578125, 0.478515625, 0.535888671875, 0.59326171875, 0.650634765625, 0.7080078125, 0.765380859375, 0.82275390625, 0.880126953125, 0.9375, 0.994873046875, 1.05224609375, 1.109619140625, 1.1669921875, 1.224365234375, 1.28173828125, 1.339111328125, 1.396484375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 11.0, 12.0, 12.0, 14.0, 13.0, 45.0, 41.0, 59.0, 84.0, 109.0, 176.0, 258.0, 355.0, 659.0, 1482.0, 4197.0, 16923.0, 90841.0, 458455.0, 384076.0, 70120.0, 13763.0, 3736.0, 1376.0, 660.0, 383.0, 224.0, 142.0, 109.0, 56.0, 47.0, 33.0, 22.0, 16.0, 18.0, 8.0, 10.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.09375, -10.7933349609375, -10.492919921875, -10.1925048828125, -9.89208984375, -9.5916748046875, -9.291259765625, -8.9908447265625, -8.6904296875, -8.3900146484375, -8.089599609375, -7.7891845703125, -7.48876953125, -7.1883544921875, -6.887939453125, -6.5875244140625, -6.287109375, -5.9866943359375, -5.686279296875, -5.3858642578125, -5.08544921875, -4.7850341796875, -4.484619140625, -4.1842041015625, -3.8837890625, -3.5833740234375, -3.282958984375, -2.9825439453125, -2.68212890625, -2.3817138671875, -2.081298828125, -1.7808837890625, -1.48046875, -1.1800537109375, -0.879638671875, -0.5792236328125, -0.27880859375, 0.0216064453125, 0.322021484375, 0.6224365234375, 0.9228515625, 1.2232666015625, 1.523681640625, 1.8240966796875, 2.12451171875, 2.4249267578125, 2.725341796875, 3.0257568359375, 3.326171875, 3.6265869140625, 3.927001953125, 4.2274169921875, 4.52783203125, 4.8282470703125, 5.128662109375, 5.4290771484375, 5.7294921875, 6.0299072265625, 6.330322265625, 6.6307373046875, 6.93115234375, 7.2315673828125, 7.531982421875, 7.8323974609375, 8.1328125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 7.0, 7.0, 7.0, 18.0, 11.0, 7.0, 16.0, 18.0, 27.0, 16.0, 18.0, 30.0, 32.0, 26.0, 34.0, 52.0, 43.0, 40.0, 26.0, 38.0, 38.0, 33.0, 31.0, 43.0, 28.0, 47.0, 54.0, 42.0, 32.0, 37.0, 25.0, 23.0, 25.0, 14.0, 11.0, 14.0, 6.0, 2.0, 7.0, 2.0, 6.0, 9.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.671875, -6.48712158203125, -6.3023681640625, -6.11761474609375, -5.932861328125, -5.74810791015625, -5.5633544921875, -5.37860107421875, -5.19384765625, -5.00909423828125, -4.8243408203125, -4.63958740234375, -4.454833984375, -4.27008056640625, -4.0853271484375, -3.90057373046875, -3.7158203125, -3.53106689453125, -3.3463134765625, -3.16156005859375, -2.976806640625, -2.79205322265625, -2.6072998046875, -2.42254638671875, -2.23779296875, -2.05303955078125, -1.8682861328125, -1.68353271484375, -1.498779296875, -1.31402587890625, -1.1292724609375, -0.94451904296875, -0.759765625, -0.57501220703125, -0.3902587890625, -0.20550537109375, -0.020751953125, 0.16400146484375, 0.3487548828125, 0.53350830078125, 0.71826171875, 0.90301513671875, 1.0877685546875, 1.27252197265625, 1.457275390625, 1.64202880859375, 1.8267822265625, 2.01153564453125, 2.1962890625, 2.38104248046875, 2.5657958984375, 2.75054931640625, 2.935302734375, 3.12005615234375, 3.3048095703125, 3.48956298828125, 3.67431640625, 3.85906982421875, 4.0438232421875, 4.22857666015625, 4.413330078125, 4.59808349609375, 4.7828369140625, 4.96759033203125, 5.15234375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 6.0, 2.0, 4.0, 11.0, 15.0, 15.0, 32.0, 54.0, 73.0, 159.0, 263.0, 477.0, 962.0, 1839.0, 4304.0, 10925.0, 32352.0, 133201.0, 565686.0, 226006.0, 46868.0, 14843.0, 5589.0, 2468.0, 1147.0, 571.0, 276.0, 170.0, 100.0, 54.0, 29.0, 18.0, 14.0, 11.0, 8.0, 7.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.53515625, -5.35455322265625, -5.1739501953125, -4.99334716796875, -4.812744140625, -4.63214111328125, -4.4515380859375, -4.27093505859375, -4.09033203125, -3.90972900390625, -3.7291259765625, -3.54852294921875, -3.367919921875, -3.18731689453125, -3.0067138671875, -2.82611083984375, -2.6455078125, -2.46490478515625, -2.2843017578125, -2.10369873046875, -1.923095703125, -1.74249267578125, -1.5618896484375, -1.38128662109375, -1.20068359375, -1.02008056640625, -0.8394775390625, -0.65887451171875, -0.478271484375, -0.29766845703125, -0.1170654296875, 0.06353759765625, 0.244140625, 0.42474365234375, 0.6053466796875, 0.78594970703125, 0.966552734375, 1.14715576171875, 1.3277587890625, 1.50836181640625, 1.68896484375, 1.86956787109375, 2.0501708984375, 2.23077392578125, 2.411376953125, 2.59197998046875, 2.7725830078125, 2.95318603515625, 3.1337890625, 3.31439208984375, 3.4949951171875, 3.67559814453125, 3.856201171875, 4.03680419921875, 4.2174072265625, 4.39801025390625, 4.57861328125, 4.75921630859375, 4.9398193359375, 5.12042236328125, 5.301025390625, 5.48162841796875, 5.6622314453125, 5.84283447265625, 6.0234375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 4.0, 6.0, 8.0, 7.0, 18.0, 11.0, 12.0, 11.0, 26.0, 22.0, 26.0, 33.0, 36.0, 59.0, 64.0, 76.0, 88.0, 82.0, 77.0, 65.0, 53.0, 43.0, 24.0, 34.0, 23.0, 20.0, 10.0, 14.0, 7.0, 9.0, 4.0, 7.0, 5.0, 6.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0004901885986328125, -0.00047479569911956787, -0.00045940279960632324, -0.0004440099000930786, -0.000428617000579834, -0.00041322410106658936, -0.0003978312015533447, -0.0003824383020401001, -0.00036704540252685547, -0.00035165250301361084, -0.0003362596035003662, -0.0003208667039871216, -0.00030547380447387695, -0.0002900809049606323, -0.0002746880054473877, -0.00025929510593414307, -0.00024390220642089844, -0.0002285093069076538, -0.00021311640739440918, -0.00019772350788116455, -0.00018233060836791992, -0.0001669377088546753, -0.00015154480934143066, -0.00013615190982818604, -0.0001207590103149414, -0.00010536611080169678, -8.997321128845215e-05, -7.458031177520752e-05, -5.918741226196289e-05, -4.379451274871826e-05, -2.8401613235473633e-05, -1.3008713722229004e-05, 2.384185791015625e-06, 1.7777085304260254e-05, 3.316998481750488e-05, 4.856288433074951e-05, 6.395578384399414e-05, 7.934868335723877e-05, 9.47415828704834e-05, 0.00011013448238372803, 0.00012552738189697266, 0.00014092028141021729, 0.00015631318092346191, 0.00017170608043670654, 0.00018709897994995117, 0.0002024918794631958, 0.00021788477897644043, 0.00023327767848968506, 0.0002486705780029297, 0.0002640634775161743, 0.00027945637702941895, 0.0002948492765426636, 0.0003102421760559082, 0.00032563507556915283, 0.00034102797508239746, 0.0003564208745956421, 0.0003718137741088867, 0.00038720667362213135, 0.000402599573135376, 0.0004179924726486206, 0.00043338537216186523, 0.00044877827167510986, 0.0004641711711883545, 0.0004795640707015991, 0.0004949569702148438]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 1.0, 3.0, 7.0, 4.0, 8.0, 11.0, 12.0, 19.0, 39.0, 44.0, 45.0, 92.0, 154.0, 234.0, 360.0, 689.0, 1372.0, 3019.0, 7981.0, 25107.0, 117344.0, 644790.0, 194136.0, 35089.0, 10373.0, 3946.0, 1657.0, 802.0, 448.0, 268.0, 182.0, 112.0, 66.0, 40.0, 29.0, 13.0, 21.0, 14.0, 7.0, 10.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.609375, -6.400390625, -6.19140625, -5.982421875, -5.7734375, -5.564453125, -5.35546875, -5.146484375, -4.9375, -4.728515625, -4.51953125, -4.310546875, -4.1015625, -3.892578125, -3.68359375, -3.474609375, -3.265625, -3.056640625, -2.84765625, -2.638671875, -2.4296875, -2.220703125, -2.01171875, -1.802734375, -1.59375, -1.384765625, -1.17578125, -0.966796875, -0.7578125, -0.548828125, -0.33984375, -0.130859375, 0.078125, 0.287109375, 0.49609375, 0.705078125, 0.9140625, 1.123046875, 1.33203125, 1.541015625, 1.75, 1.958984375, 2.16796875, 2.376953125, 2.5859375, 2.794921875, 3.00390625, 3.212890625, 3.421875, 3.630859375, 3.83984375, 4.048828125, 4.2578125, 4.466796875, 4.67578125, 4.884765625, 5.09375, 5.302734375, 5.51171875, 5.720703125, 5.9296875, 6.138671875, 6.34765625, 6.556640625, 6.765625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 5.0, 2.0, 7.0, 7.0, 8.0, 8.0, 10.0, 16.0, 24.0, 35.0, 51.0, 63.0, 78.0, 139.0, 140.0, 115.0, 79.0, 69.0, 35.0, 31.0, 21.0, 23.0, 10.0, 7.0, 5.0, 6.0, 3.0, 6.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.14453125, -4.968017578125, -4.79150390625, -4.614990234375, -4.4384765625, -4.261962890625, -4.08544921875, -3.908935546875, -3.732421875, -3.555908203125, -3.37939453125, -3.202880859375, -3.0263671875, -2.849853515625, -2.67333984375, -2.496826171875, -2.3203125, -2.143798828125, -1.96728515625, -1.790771484375, -1.6142578125, -1.437744140625, -1.26123046875, -1.084716796875, -0.908203125, -0.731689453125, -0.55517578125, -0.378662109375, -0.2021484375, -0.025634765625, 0.15087890625, 0.327392578125, 0.50390625, 0.680419921875, 0.85693359375, 1.033447265625, 1.2099609375, 1.386474609375, 1.56298828125, 1.739501953125, 1.916015625, 2.092529296875, 2.26904296875, 2.445556640625, 2.6220703125, 2.798583984375, 2.97509765625, 3.151611328125, 3.328125, 3.504638671875, 3.68115234375, 3.857666015625, 4.0341796875, 4.210693359375, 4.38720703125, 4.563720703125, 4.740234375, 4.916748046875, 5.09326171875, 5.269775390625, 5.4462890625, 5.622802734375, 5.79931640625, 5.975830078125, 6.15234375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 27.0, 100.0, 307.0, 342.0, 153.0, 53.0, 11.0, 11.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-245.28428649902344, -240.19454956054688, -235.1048126220703, -230.01507568359375, -224.92532348632812, -219.83558654785156, -214.745849609375, -209.65611267089844, -204.56637573242188, -199.4766387939453, -194.38690185546875, -189.2971649169922, -184.20742797851562, -179.11767578125, -174.02793884277344, -168.93820190429688, -163.8484649658203, -158.75872802734375, -153.6689910888672, -148.57925415039062, -143.489501953125, -138.39976501464844, -133.31002807617188, -128.2202911376953, -123.13055419921875, -118.04081726074219, -112.95108032226562, -107.86133575439453, -102.77159881591797, -97.6818618774414, -92.59211730957031, -87.50238037109375, -82.41265869140625, -77.32292175292969, -72.23318481445312, -67.14344024658203, -62.05370330810547, -56.963966369628906, -51.87422561645508, -46.78448486328125, -41.69474792480469, -36.605010986328125, -31.515270233154297, -26.4255313873291, -21.335792541503906, -16.24605369567871, -11.156314849853516, -6.0665740966796875, -0.976837158203125, 4.11290168762207, 9.202640533447266, 14.292379379272461, 19.382118225097656, 24.47185707092285, 29.561595916748047, 34.651336669921875, 39.74107360839844, 44.830810546875, 49.92055130004883, 55.010292053222656, 60.10002899169922, 65.18976593017578, 70.27951049804688, 75.36924743652344, 80.458984375]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 6.0, 3.0, 2.0, 6.0, 13.0, 20.0, 22.0, 26.0, 22.0, 31.0, 36.0, 46.0, 52.0, 50.0, 61.0, 67.0, 60.0, 71.0, 69.0, 52.0, 59.0, 45.0, 38.0, 35.0, 26.0, 16.0, 19.0, 13.0, 10.0, 5.0, 5.0, 7.0, 7.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.400238037109375, -60.77083969116211, -59.14144515991211, -57.512046813964844, -55.882652282714844, -54.25325393676758, -52.62385559082031, -50.99446105957031, -49.36506271362305, -47.73566436767578, -46.10626983642578, -44.476871490478516, -42.847476959228516, -41.21807861328125, -39.58868408203125, -37.959285736083984, -36.32988739013672, -34.70048904418945, -33.07109451293945, -31.441696166992188, -29.812299728393555, -28.182903289794922, -26.55350685119629, -24.924110412597656, -23.294715881347656, -21.665319442749023, -20.03592300415039, -18.406524658203125, -16.777128219604492, -15.14773178100586, -13.518335342407227, -11.888937950134277, -10.259540557861328, -8.630144119262695, -7.000746726989746, -5.371350288391113, -3.7419533729553223, -2.1125564575195312, -0.48316001892089844, 1.1462373733520508, 2.7756338119506836, 4.405030727386475, 6.034427642822266, 7.663824081420898, 9.293220520019531, 10.92261791229248, 12.552014350891113, 14.181411743164062, 15.810808181762695, 17.440204620361328, 19.06960105895996, 20.698997497558594, 22.32839584350586, 23.957792282104492, 25.587188720703125, 27.21658706665039, 28.84598159790039, 30.475378036499023, 32.104774475097656, 33.73417282104492, 35.36356735229492, 36.99296569824219, 38.62236022949219, 40.25175857543945, 41.88115692138672]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 6.0, 4.0, 10.0, 10.0, 10.0, 19.0, 20.0, 22.0, 41.0, 58.0, 79.0, 141.0, 163.0, 287.0, 477.0, 855.0, 1724.0, 3735.0, 9135.0, 28906.0, 135605.0, 3319166.0, 599520.0, 65754.0, 17112.0, 6019.0, 2560.0, 1257.0, 657.0, 360.0, 203.0, 137.0, 88.0, 48.0, 34.0, 22.0, 14.0, 10.0, 9.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.109375, -11.77099609375, -11.4326171875, -11.09423828125, -10.755859375, -10.41748046875, -10.0791015625, -9.74072265625, -9.40234375, -9.06396484375, -8.7255859375, -8.38720703125, -8.048828125, -7.71044921875, -7.3720703125, -7.03369140625, -6.6953125, -6.35693359375, -6.0185546875, -5.68017578125, -5.341796875, -5.00341796875, -4.6650390625, -4.32666015625, -3.98828125, -3.64990234375, -3.3115234375, -2.97314453125, -2.634765625, -2.29638671875, -1.9580078125, -1.61962890625, -1.28125, -0.94287109375, -0.6044921875, -0.26611328125, 0.072265625, 0.41064453125, 0.7490234375, 1.08740234375, 1.42578125, 1.76416015625, 2.1025390625, 2.44091796875, 2.779296875, 3.11767578125, 3.4560546875, 3.79443359375, 4.1328125, 4.47119140625, 4.8095703125, 5.14794921875, 5.486328125, 5.82470703125, 6.1630859375, 6.50146484375, 6.83984375, 7.17822265625, 7.5166015625, 7.85498046875, 8.193359375, 8.53173828125, 8.8701171875, 9.20849609375, 9.546875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 9.0, 6.0, 21.0, 28.0, 29.0, 46.0, 57.0, 68.0, 80.0, 98.0, 93.0, 91.0, 103.0, 73.0, 56.0, 55.0, 35.0, 28.0, 15.0, 9.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.20703125, -4.112457275390625, -4.01788330078125, -3.923309326171875, -3.8287353515625, -3.734161376953125, -3.63958740234375, -3.545013427734375, -3.450439453125, -3.355865478515625, -3.26129150390625, -3.166717529296875, -3.0721435546875, -2.977569580078125, -2.88299560546875, -2.788421630859375, -2.69384765625, -2.599273681640625, -2.50469970703125, -2.410125732421875, -2.3155517578125, -2.220977783203125, -2.12640380859375, -2.031829833984375, -1.937255859375, -1.842681884765625, -1.74810791015625, -1.653533935546875, -1.5589599609375, -1.464385986328125, -1.36981201171875, -1.275238037109375, -1.1806640625, -1.086090087890625, -0.99151611328125, -0.896942138671875, -0.8023681640625, -0.707794189453125, -0.61322021484375, -0.518646240234375, -0.424072265625, -0.329498291015625, -0.23492431640625, -0.140350341796875, -0.0457763671875, 0.048797607421875, 0.14337158203125, 0.237945556640625, 0.33251953125, 0.427093505859375, 0.52166748046875, 0.616241455078125, 0.7108154296875, 0.805389404296875, 0.89996337890625, 0.994537353515625, 1.089111328125, 1.183685302734375, 1.27825927734375, 1.372833251953125, 1.4674072265625, 1.561981201171875, 1.65655517578125, 1.751129150390625, 1.845703125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 10.0, 11.0, 8.0, 13.0, 53.0, 94.0, 257.0, 831.0, 3137.0, 19763.0, 401153.0, 3694950.0, 64773.0, 7028.0, 1468.0, 447.0, 141.0, 62.0, 36.0, 14.0, 16.0, 10.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.609375, -22.0474853515625, -21.485595703125, -20.9237060546875, -20.36181640625, -19.7999267578125, -19.238037109375, -18.6761474609375, -18.1142578125, -17.5523681640625, -16.990478515625, -16.4285888671875, -15.86669921875, -15.3048095703125, -14.742919921875, -14.1810302734375, -13.619140625, -13.0572509765625, -12.495361328125, -11.9334716796875, -11.37158203125, -10.8096923828125, -10.247802734375, -9.6859130859375, -9.1240234375, -8.5621337890625, -8.000244140625, -7.4383544921875, -6.87646484375, -6.3145751953125, -5.752685546875, -5.1907958984375, -4.62890625, -4.0670166015625, -3.505126953125, -2.9432373046875, -2.38134765625, -1.8194580078125, -1.257568359375, -0.6956787109375, -0.1337890625, 0.4281005859375, 0.989990234375, 1.5518798828125, 2.11376953125, 2.6756591796875, 3.237548828125, 3.7994384765625, 4.361328125, 4.9232177734375, 5.485107421875, 6.0469970703125, 6.60888671875, 7.1707763671875, 7.732666015625, 8.2945556640625, 8.8564453125, 9.4183349609375, 9.980224609375, 10.5421142578125, 11.10400390625, 11.6658935546875, 12.227783203125, 12.7896728515625, 13.3515625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 7.0, 12.0, 15.0, 32.0, 47.0, 62.0, 113.0, 236.0, 527.0, 1606.0, 739.0, 283.0, 153.0, 70.0, 39.0, 42.0, 25.0, 23.0, 15.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.62109375, -5.45880126953125, -5.2965087890625, -5.13421630859375, -4.971923828125, -4.80963134765625, -4.6473388671875, -4.48504638671875, -4.32275390625, -4.16046142578125, -3.9981689453125, -3.83587646484375, -3.673583984375, -3.51129150390625, -3.3489990234375, -3.18670654296875, -3.0244140625, -2.86212158203125, -2.6998291015625, -2.53753662109375, -2.375244140625, -2.21295166015625, -2.0506591796875, -1.88836669921875, -1.72607421875, -1.56378173828125, -1.4014892578125, -1.23919677734375, -1.076904296875, -0.91461181640625, -0.7523193359375, -0.59002685546875, -0.427734375, -0.26544189453125, -0.1031494140625, 0.05914306640625, 0.221435546875, 0.38372802734375, 0.5460205078125, 0.70831298828125, 0.87060546875, 1.03289794921875, 1.1951904296875, 1.35748291015625, 1.519775390625, 1.68206787109375, 1.8443603515625, 2.00665283203125, 2.1689453125, 2.33123779296875, 2.4935302734375, 2.65582275390625, 2.818115234375, 2.98040771484375, 3.1427001953125, 3.30499267578125, 3.46728515625, 3.62957763671875, 3.7918701171875, 3.95416259765625, 4.116455078125, 4.27874755859375, 4.4410400390625, 4.60333251953125, 4.765625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 4.0, 13.0, 16.0, 29.0, 49.0, 95.0, 117.0, 139.0, 133.0, 128.0, 97.0, 50.0, 41.0, 39.0, 19.0, 9.0, 12.0, 4.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.46781539916992, -32.674476623535156, -31.881141662597656, -31.08780288696289, -30.294466018676758, -29.501129150390625, -28.70779037475586, -27.914453506469727, -27.121116638183594, -26.32777976989746, -25.534442901611328, -24.741104125976562, -23.94776725769043, -23.154430389404297, -22.36109161376953, -21.5677547454834, -20.774417877197266, -19.981081008911133, -19.187744140625, -18.394405364990234, -17.6010684967041, -16.80773162841797, -16.014392852783203, -15.22105598449707, -14.427719116210938, -13.634382247924805, -12.841044425964355, -12.047706604003906, -11.254369735717773, -10.46103286743164, -9.667695045471191, -8.874357223510742, -8.081018447875977, -7.2876811027526855, -6.4943437576293945, -5.7010064125061035, -4.9076690673828125, -4.1143317222595215, -3.3209943771362305, -2.5276570320129395, -1.7343196868896484, -0.9409823417663574, -0.1476449966430664, 0.6456923484802246, 1.4390296936035156, 2.2323670387268066, 3.0257043838500977, 3.8190417289733887, 4.61237907409668, 5.405716419219971, 6.199053764343262, 6.992391109466553, 7.785728454589844, 8.579065322875977, 9.372403144836426, 10.165740966796875, 10.959077835083008, 11.75241470336914, 12.54575252532959, 13.339090347290039, 14.132427215576172, 14.925764083862305, 15.719101905822754, 16.512439727783203, 17.305776596069336]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 6.0, 7.0, 10.0, 20.0, 14.0, 35.0, 36.0, 49.0, 48.0, 49.0, 54.0, 58.0, 65.0, 76.0, 73.0, 67.0, 60.0, 49.0, 52.0, 45.0, 23.0, 29.0, 26.0, 13.0, 13.0, 8.0, 7.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.450559616088867, -13.835054397583008, -13.219550132751465, -12.604044914245605, -11.988539695739746, -11.373035430908203, -10.757530212402344, -10.142024993896484, -9.526519775390625, -8.911014556884766, -8.295510292053223, -7.680005073547363, -7.064499855041504, -6.448995113372803, -5.833490371704102, -5.217985153198242, -4.602480888366699, -3.986975908279419, -3.3714709281921387, -2.7559661865234375, -2.1404612064361572, -1.524956226348877, -0.9094514846801758, -0.2939462661743164, 0.32155847549438477, 0.9370633959770203, 1.5525683164596558, 2.1680731773376465, 2.7835781574249268, 3.399083137512207, 4.014587879180908, 4.630093097686768, 5.245597839355469, 5.86110258102417, 6.476607799530029, 7.0921125411987305, 7.70761775970459, 8.323122024536133, 8.938627243041992, 9.554132461547852, 10.169637680053711, 10.78514289855957, 11.400647163391113, 12.016152381896973, 12.631657600402832, 13.247161865234375, 13.862667083740234, 14.478172302246094, 15.093676567077637, 15.709181785583496, 16.32468605041504, 16.9401912689209, 17.555696487426758, 18.171201705932617, 18.786705017089844, 19.402210235595703, 20.017715454101562, 20.633220672607422, 21.24872589111328, 21.86423110961914, 22.479734420776367, 23.095239639282227, 23.710744857788086, 24.326250076293945, 24.941755294799805]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 8.0, 8.0, 8.0, 11.0, 23.0, 25.0, 44.0, 62.0, 81.0, 121.0, 195.0, 297.0, 558.0, 1009.0, 1789.0, 3472.0, 7355.0, 17490.0, 48526.0, 167371.0, 531102.0, 183203.0, 51307.0, 18565.0, 7817.0, 3638.0, 1908.0, 976.0, 581.0, 339.0, 217.0, 141.0, 85.0, 72.0, 37.0, 36.0, 23.0, 19.0, 14.0, 6.0, 3.0, 7.0, 1.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-8.203125, -7.9344482421875, -7.665771484375, -7.3970947265625, -7.12841796875, -6.8597412109375, -6.591064453125, -6.3223876953125, -6.0537109375, -5.7850341796875, -5.516357421875, -5.2476806640625, -4.97900390625, -4.7103271484375, -4.441650390625, -4.1729736328125, -3.904296875, -3.6356201171875, -3.366943359375, -3.0982666015625, -2.82958984375, -2.5609130859375, -2.292236328125, -2.0235595703125, -1.7548828125, -1.4862060546875, -1.217529296875, -0.9488525390625, -0.68017578125, -0.4114990234375, -0.142822265625, 0.1258544921875, 0.39453125, 0.6632080078125, 0.931884765625, 1.2005615234375, 1.46923828125, 1.7379150390625, 2.006591796875, 2.2752685546875, 2.5439453125, 2.8126220703125, 3.081298828125, 3.3499755859375, 3.61865234375, 3.8873291015625, 4.156005859375, 4.4246826171875, 4.693359375, 4.9620361328125, 5.230712890625, 5.4993896484375, 5.76806640625, 6.0367431640625, 6.305419921875, 6.5740966796875, 6.8427734375, 7.1114501953125, 7.380126953125, 7.6488037109375, 7.91748046875, 8.1861572265625, 8.454833984375, 8.7235107421875, 8.9921875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 9.0, 2.0, 3.0, 12.0, 17.0, 17.0, 28.0, 22.0, 32.0, 28.0, 40.0, 32.0, 48.0, 45.0, 47.0, 65.0, 54.0, 50.0, 58.0, 57.0, 50.0, 33.0, 48.0, 34.0, 41.0, 31.0, 29.0, 13.0, 17.0, 6.0, 12.0, 9.0, 8.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9599609375, -1.902008056640625, -1.84405517578125, -1.786102294921875, -1.7281494140625, -1.670196533203125, -1.61224365234375, -1.554290771484375, -1.496337890625, -1.438385009765625, -1.38043212890625, -1.322479248046875, -1.2645263671875, -1.206573486328125, -1.14862060546875, -1.090667724609375, -1.03271484375, -0.974761962890625, -0.91680908203125, -0.858856201171875, -0.8009033203125, -0.742950439453125, -0.68499755859375, -0.627044677734375, -0.569091796875, -0.511138916015625, -0.45318603515625, -0.395233154296875, -0.3372802734375, -0.279327392578125, -0.22137451171875, -0.163421630859375, -0.10546875, -0.047515869140625, 0.01043701171875, 0.068389892578125, 0.1263427734375, 0.184295654296875, 0.24224853515625, 0.300201416015625, 0.358154296875, 0.416107177734375, 0.47406005859375, 0.532012939453125, 0.5899658203125, 0.647918701171875, 0.70587158203125, 0.763824462890625, 0.82177734375, 0.879730224609375, 0.93768310546875, 0.995635986328125, 1.0535888671875, 1.111541748046875, 1.16949462890625, 1.227447509765625, 1.285400390625, 1.343353271484375, 1.40130615234375, 1.459259033203125, 1.5172119140625, 1.575164794921875, 1.63311767578125, 1.691070556640625, 1.7490234375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 5.0, 7.0, 6.0, 10.0, 19.0, 30.0, 39.0, 64.0, 68.0, 133.0, 221.0, 372.0, 863.0, 2235.0, 7945.0, 47062.0, 549871.0, 393254.0, 36182.0, 6602.0, 1882.0, 761.0, 385.0, 190.0, 104.0, 91.0, 41.0, 34.0, 19.0, 18.0, 17.0, 9.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.4296875, -13.9915771484375, -13.553466796875, -13.1153564453125, -12.67724609375, -12.2391357421875, -11.801025390625, -11.3629150390625, -10.9248046875, -10.4866943359375, -10.048583984375, -9.6104736328125, -9.17236328125, -8.7342529296875, -8.296142578125, -7.8580322265625, -7.419921875, -6.9818115234375, -6.543701171875, -6.1055908203125, -5.66748046875, -5.2293701171875, -4.791259765625, -4.3531494140625, -3.9150390625, -3.4769287109375, -3.038818359375, -2.6007080078125, -2.16259765625, -1.7244873046875, -1.286376953125, -0.8482666015625, -0.41015625, 0.0279541015625, 0.466064453125, 0.9041748046875, 1.34228515625, 1.7803955078125, 2.218505859375, 2.6566162109375, 3.0947265625, 3.5328369140625, 3.970947265625, 4.4090576171875, 4.84716796875, 5.2852783203125, 5.723388671875, 6.1614990234375, 6.599609375, 7.0377197265625, 7.475830078125, 7.9139404296875, 8.35205078125, 8.7901611328125, 9.228271484375, 9.6663818359375, 10.1044921875, 10.5426025390625, 10.980712890625, 11.4188232421875, 11.85693359375, 12.2950439453125, 12.733154296875, 13.1712646484375, 13.609375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 1.0, 6.0, 7.0, 7.0, 10.0, 21.0, 17.0, 19.0, 23.0, 25.0, 32.0, 26.0, 38.0, 45.0, 42.0, 41.0, 48.0, 56.0, 40.0, 43.0, 52.0, 53.0, 41.0, 45.0, 38.0, 29.0, 28.0, 32.0, 33.0, 14.0, 24.0, 11.0, 8.0, 12.0, 8.0, 5.0, 1.0, 2.0, 4.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-7.4921875, -7.26239013671875, -7.0325927734375, -6.80279541015625, -6.572998046875, -6.34320068359375, -6.1134033203125, -5.88360595703125, -5.65380859375, -5.42401123046875, -5.1942138671875, -4.96441650390625, -4.734619140625, -4.50482177734375, -4.2750244140625, -4.04522705078125, -3.8154296875, -3.58563232421875, -3.3558349609375, -3.12603759765625, -2.896240234375, -2.66644287109375, -2.4366455078125, -2.20684814453125, -1.97705078125, -1.74725341796875, -1.5174560546875, -1.28765869140625, -1.057861328125, -0.82806396484375, -0.5982666015625, -0.36846923828125, -0.138671875, 0.09112548828125, 0.3209228515625, 0.55072021484375, 0.780517578125, 1.01031494140625, 1.2401123046875, 1.46990966796875, 1.69970703125, 1.92950439453125, 2.1593017578125, 2.38909912109375, 2.618896484375, 2.84869384765625, 3.0784912109375, 3.30828857421875, 3.5380859375, 3.76788330078125, 3.9976806640625, 4.22747802734375, 4.457275390625, 4.68707275390625, 4.9168701171875, 5.14666748046875, 5.37646484375, 5.60626220703125, 5.8360595703125, 6.06585693359375, 6.295654296875, 6.52545166015625, 6.7552490234375, 6.98504638671875, 7.21484375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 10.0, 18.0, 22.0, 42.0, 86.0, 131.0, 298.0, 868.0, 4088.0, 50217.0, 954923.0, 33287.0, 3262.0, 765.0, 273.0, 106.0, 66.0, 36.0, 17.0, 15.0, 10.0, 5.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.484375, -20.894775390625, -20.30517578125, -19.715576171875, -19.1259765625, -18.536376953125, -17.94677734375, -17.357177734375, -16.767578125, -16.177978515625, -15.58837890625, -14.998779296875, -14.4091796875, -13.819580078125, -13.22998046875, -12.640380859375, -12.05078125, -11.461181640625, -10.87158203125, -10.281982421875, -9.6923828125, -9.102783203125, -8.51318359375, -7.923583984375, -7.333984375, -6.744384765625, -6.15478515625, -5.565185546875, -4.9755859375, -4.385986328125, -3.79638671875, -3.206787109375, -2.6171875, -2.027587890625, -1.43798828125, -0.848388671875, -0.2587890625, 0.330810546875, 0.92041015625, 1.510009765625, 2.099609375, 2.689208984375, 3.27880859375, 3.868408203125, 4.4580078125, 5.047607421875, 5.63720703125, 6.226806640625, 6.81640625, 7.406005859375, 7.99560546875, 8.585205078125, 9.1748046875, 9.764404296875, 10.35400390625, 10.943603515625, 11.533203125, 12.122802734375, 12.71240234375, 13.302001953125, 13.8916015625, 14.481201171875, 15.07080078125, 15.660400390625, 16.25]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 4.0, 8.0, 12.0, 6.0, 11.0, 29.0, 43.0, 75.0, 189.0, 314.0, 163.0, 56.0, 33.0, 23.0, 11.0, 6.0, 9.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00205230712890625, -0.0020060762763023376, -0.0019598454236984253, -0.001913614571094513, -0.0018673837184906006, -0.0018211528658866882, -0.0017749220132827759, -0.0017286911606788635, -0.0016824603080749512, -0.0016362294554710388, -0.0015899986028671265, -0.0015437677502632141, -0.0014975368976593018, -0.0014513060450553894, -0.001405075192451477, -0.0013588443398475647, -0.0013126134872436523, -0.00126638263463974, -0.0012201517820358276, -0.0011739209294319153, -0.001127690076828003, -0.0010814592242240906, -0.0010352283716201782, -0.0009889975190162659, -0.0009427666664123535, -0.0008965358138084412, -0.0008503049612045288, -0.0008040741086006165, -0.0007578432559967041, -0.0007116124033927917, -0.0006653815507888794, -0.000619150698184967, -0.0005729198455810547, -0.0005266889929771423, -0.00048045814037323, -0.0004342272877693176, -0.0003879964351654053, -0.0003417655825614929, -0.00029553472995758057, -0.0002493038773536682, -0.00020307302474975586, -0.0001568421721458435, -0.00011061131954193115, -6.43804669380188e-05, -1.8149614334106445e-05, 2.8081238269805908e-05, 7.431209087371826e-05, 0.00012054294347763062, 0.00016677379608154297, 0.00021300464868545532, 0.0002592355012893677, 0.00030546635389328003, 0.0003516972064971924, 0.00039792805910110474, 0.0004441589117050171, 0.0004903897643089294, 0.0005366206169128418, 0.0005828514695167542, 0.0006290823221206665, 0.0006753131747245789, 0.0007215440273284912, 0.0007677748799324036, 0.0008140057325363159, 0.0008602365851402283, 0.0009064674377441406]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 8.0, 9.0, 7.0, 11.0, 27.0, 57.0, 64.0, 163.0, 312.0, 960.0, 5350.0, 188220.0, 842025.0, 9263.0, 1300.0, 411.0, 172.0, 70.0, 54.0, 31.0, 17.0, 10.0, 7.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.28125, -21.6083984375, -20.935546875, -20.2626953125, -19.58984375, -18.9169921875, -18.244140625, -17.5712890625, -16.8984375, -16.2255859375, -15.552734375, -14.8798828125, -14.20703125, -13.5341796875, -12.861328125, -12.1884765625, -11.515625, -10.8427734375, -10.169921875, -9.4970703125, -8.82421875, -8.1513671875, -7.478515625, -6.8056640625, -6.1328125, -5.4599609375, -4.787109375, -4.1142578125, -3.44140625, -2.7685546875, -2.095703125, -1.4228515625, -0.75, -0.0771484375, 0.595703125, 1.2685546875, 1.94140625, 2.6142578125, 3.287109375, 3.9599609375, 4.6328125, 5.3056640625, 5.978515625, 6.6513671875, 7.32421875, 7.9970703125, 8.669921875, 9.3427734375, 10.015625, 10.6884765625, 11.361328125, 12.0341796875, 12.70703125, 13.3798828125, 14.052734375, 14.7255859375, 15.3984375, 16.0712890625, 16.744140625, 17.4169921875, 18.08984375, 18.7626953125, 19.435546875, 20.1083984375, 20.78125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 3.0, 7.0, 4.0, 4.0, 5.0, 13.0, 16.0, 21.0, 22.0, 36.0, 63.0, 111.0, 171.0, 174.0, 129.0, 76.0, 43.0, 31.0, 17.0, 9.0, 8.0, 6.0, 4.0, 2.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.3203125, -7.11126708984375, -6.9022216796875, -6.69317626953125, -6.484130859375, -6.27508544921875, -6.0660400390625, -5.85699462890625, -5.64794921875, -5.43890380859375, -5.2298583984375, -5.02081298828125, -4.811767578125, -4.60272216796875, -4.3936767578125, -4.18463134765625, -3.9755859375, -3.76654052734375, -3.5574951171875, -3.34844970703125, -3.139404296875, -2.93035888671875, -2.7213134765625, -2.51226806640625, -2.30322265625, -2.09417724609375, -1.8851318359375, -1.67608642578125, -1.467041015625, -1.25799560546875, -1.0489501953125, -0.83990478515625, -0.630859375, -0.42181396484375, -0.2127685546875, -0.00372314453125, 0.205322265625, 0.41436767578125, 0.6234130859375, 0.83245849609375, 1.04150390625, 1.25054931640625, 1.4595947265625, 1.66864013671875, 1.877685546875, 2.08673095703125, 2.2957763671875, 2.50482177734375, 2.7138671875, 2.92291259765625, 3.1319580078125, 3.34100341796875, 3.550048828125, 3.75909423828125, 3.9681396484375, 4.17718505859375, 4.38623046875, 4.59527587890625, 4.8043212890625, 5.01336669921875, 5.222412109375, 5.43145751953125, 5.6405029296875, 5.84954833984375, 6.05859375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 5.0, 19.0, 49.0, 176.0, 292.0, 269.0, 127.0, 41.0, 16.0, 7.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-226.10894775390625, -221.2001953125, -216.29144287109375, -211.38270568847656, -206.4739532470703, -201.56520080566406, -196.6564483642578, -191.74769592285156, -186.83895874023438, -181.93020629882812, -177.02145385742188, -172.1127166748047, -167.20396423339844, -162.2952117919922, -157.38645935058594, -152.4777069091797, -147.56895446777344, -142.6602020263672, -137.75144958496094, -132.84271240234375, -127.9339599609375, -123.02520751953125, -118.116455078125, -113.20770263671875, -108.29895782470703, -103.39020538330078, -98.48146057128906, -93.57270812988281, -88.66395568847656, -83.75521087646484, -78.8464584350586, -73.93771362304688, -69.02894592285156, -64.12019348144531, -59.211448669433594, -54.302696228027344, -49.39394760131836, -44.485198974609375, -39.576446533203125, -34.66769790649414, -29.758949279785156, -24.850200653076172, -19.941450119018555, -15.032700538635254, -10.123950958251953, -5.215202331542969, -0.30645179748535156, 4.602298736572266, 9.51104736328125, 14.41979694366455, 19.32854652404785, 24.23729705810547, 29.146045684814453, 34.05479431152344, 38.96354675292969, 43.87229537963867, 48.781044006347656, 53.68979263305664, 58.598541259765625, 63.507293701171875, 68.41604614257812, 73.32479095458984, 78.2335433959961, 83.14228820800781, 88.05104064941406]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 4.0, 3.0, 10.0, 6.0, 11.0, 15.0, 15.0, 14.0, 13.0, 20.0, 23.0, 22.0, 22.0, 24.0, 34.0, 35.0, 34.0, 40.0, 37.0, 36.0, 31.0, 37.0, 41.0, 40.0, 35.0, 38.0, 46.0, 34.0, 26.0, 42.0, 31.0, 26.0, 22.0, 15.0, 23.0, 16.0, 16.0, 13.0, 10.0, 12.0, 9.0, 3.0, 3.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0], "bins": [-33.73252487182617, -32.62526321411133, -31.518001556396484, -30.41073989868164, -29.303478240966797, -28.196216583251953, -27.088956832885742, -25.9816951751709, -24.874433517456055, -23.76717185974121, -22.659910202026367, -21.552648544311523, -20.445388793945312, -19.33812713623047, -18.230865478515625, -17.12360382080078, -16.016342163085938, -14.909080505371094, -13.80181884765625, -12.694558143615723, -11.587296485900879, -10.480034828186035, -9.372774124145508, -8.265512466430664, -7.15825080871582, -6.050989151000977, -4.943727970123291, -3.8364665508270264, -2.7292051315307617, -1.621943473815918, -0.5146822929382324, 0.5925788879394531, 1.6998367309570312, 2.807098150253296, 3.9143595695495605, 5.021620750427246, 6.12888240814209, 7.236144065856934, 8.343404769897461, 9.450666427612305, 10.557928085327148, 11.665189743041992, 12.772451400756836, 13.879712104797363, 14.986973762512207, 16.094234466552734, 17.201496124267578, 18.308757781982422, 19.416019439697266, 20.52328109741211, 21.630542755126953, 22.737804412841797, 23.84506607055664, 24.952327728271484, 26.059587478637695, 27.16684913635254, 28.274110794067383, 29.381372451782227, 30.48863410949707, 31.595895767211914, 32.703155517578125, 33.81041717529297, 34.91767883300781, 36.024940490722656, 37.1322021484375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 7.0, 9.0, 16.0, 11.0, 29.0, 40.0, 55.0, 107.0, 173.0, 392.0, 988.0, 3032.0, 11344.0, 73698.0, 3872231.0, 205713.0, 19341.0, 4534.0, 1428.0, 544.0, 258.0, 140.0, 76.0, 43.0, 27.0, 13.0, 13.0, 11.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.609375, -22.947509765625, -22.28564453125, -21.623779296875, -20.9619140625, -20.300048828125, -19.63818359375, -18.976318359375, -18.314453125, -17.652587890625, -16.99072265625, -16.328857421875, -15.6669921875, -15.005126953125, -14.34326171875, -13.681396484375, -13.01953125, -12.357666015625, -11.69580078125, -11.033935546875, -10.3720703125, -9.710205078125, -9.04833984375, -8.386474609375, -7.724609375, -7.062744140625, -6.40087890625, -5.739013671875, -5.0771484375, -4.415283203125, -3.75341796875, -3.091552734375, -2.4296875, -1.767822265625, -1.10595703125, -0.444091796875, 0.2177734375, 0.879638671875, 1.54150390625, 2.203369140625, 2.865234375, 3.527099609375, 4.18896484375, 4.850830078125, 5.5126953125, 6.174560546875, 6.83642578125, 7.498291015625, 8.16015625, 8.822021484375, 9.48388671875, 10.145751953125, 10.8076171875, 11.469482421875, 12.13134765625, 12.793212890625, 13.455078125, 14.116943359375, 14.77880859375, 15.440673828125, 16.1025390625, 16.764404296875, 17.42626953125, 18.088134765625, 18.75]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 4.0, 8.0, 8.0, 11.0, 8.0, 14.0, 12.0, 23.0, 22.0, 27.0, 24.0, 36.0, 41.0, 32.0, 54.0, 54.0, 61.0, 53.0, 54.0, 46.0, 29.0, 53.0, 49.0, 37.0, 39.0, 33.0, 38.0, 34.0, 23.0, 15.0, 11.0, 14.0, 6.0, 9.0, 5.0, 7.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7626953125, -1.7024078369140625, -1.642120361328125, -1.5818328857421875, -1.52154541015625, -1.4612579345703125, -1.400970458984375, -1.3406829833984375, -1.2803955078125, -1.2201080322265625, -1.159820556640625, -1.0995330810546875, -1.03924560546875, -0.9789581298828125, -0.918670654296875, -0.8583831787109375, -0.798095703125, -0.7378082275390625, -0.677520751953125, -0.6172332763671875, -0.55694580078125, -0.4966583251953125, -0.436370849609375, -0.3760833740234375, -0.3157958984375, -0.2555084228515625, -0.195220947265625, -0.1349334716796875, -0.07464599609375, -0.0143585205078125, 0.045928955078125, 0.1062164306640625, 0.16650390625, 0.2267913818359375, 0.287078857421875, 0.3473663330078125, 0.40765380859375, 0.4679412841796875, 0.528228759765625, 0.5885162353515625, 0.6488037109375, 0.7090911865234375, 0.769378662109375, 0.8296661376953125, 0.88995361328125, 0.9502410888671875, 1.010528564453125, 1.0708160400390625, 1.131103515625, 1.1913909912109375, 1.251678466796875, 1.3119659423828125, 1.37225341796875, 1.4325408935546875, 1.492828369140625, 1.5531158447265625, 1.6134033203125, 1.6736907958984375, 1.733978271484375, 1.7942657470703125, 1.85455322265625, 1.9148406982421875, 1.975128173828125, 2.0354156494140625, 2.095703125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 9.0, 1.0, 12.0, 21.0, 32.0, 68.0, 133.0, 291.0, 748.0, 2316.0, 10074.0, 86451.0, 3914732.0, 160592.0, 14461.0, 2825.0, 871.0, 357.0, 128.0, 80.0, 44.0, 10.0, 9.0, 6.0, 9.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.8125, -23.195556640625, -22.57861328125, -21.961669921875, -21.3447265625, -20.727783203125, -20.11083984375, -19.493896484375, -18.876953125, -18.260009765625, -17.64306640625, -17.026123046875, -16.4091796875, -15.792236328125, -15.17529296875, -14.558349609375, -13.94140625, -13.324462890625, -12.70751953125, -12.090576171875, -11.4736328125, -10.856689453125, -10.23974609375, -9.622802734375, -9.005859375, -8.388916015625, -7.77197265625, -7.155029296875, -6.5380859375, -5.921142578125, -5.30419921875, -4.687255859375, -4.0703125, -3.453369140625, -2.83642578125, -2.219482421875, -1.6025390625, -0.985595703125, -0.36865234375, 0.248291015625, 0.865234375, 1.482177734375, 2.09912109375, 2.716064453125, 3.3330078125, 3.949951171875, 4.56689453125, 5.183837890625, 5.80078125, 6.417724609375, 7.03466796875, 7.651611328125, 8.2685546875, 8.885498046875, 9.50244140625, 10.119384765625, 10.736328125, 11.353271484375, 11.97021484375, 12.587158203125, 13.2041015625, 13.821044921875, 14.43798828125, 15.054931640625, 15.671875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 6.0, 10.0, 9.0, 9.0, 27.0, 37.0, 55.0, 64.0, 140.0, 362.0, 1256.0, 1355.0, 348.0, 137.0, 77.0, 50.0, 29.0, 15.0, 21.0, 16.0, 11.0, 10.0, 9.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.25, -5.10418701171875, -4.9583740234375, -4.81256103515625, -4.666748046875, -4.52093505859375, -4.3751220703125, -4.22930908203125, -4.08349609375, -3.93768310546875, -3.7918701171875, -3.64605712890625, -3.500244140625, -3.35443115234375, -3.2086181640625, -3.06280517578125, -2.9169921875, -2.77117919921875, -2.6253662109375, -2.47955322265625, -2.333740234375, -2.18792724609375, -2.0421142578125, -1.89630126953125, -1.75048828125, -1.60467529296875, -1.4588623046875, -1.31304931640625, -1.167236328125, -1.02142333984375, -0.8756103515625, -0.72979736328125, -0.583984375, -0.43817138671875, -0.2923583984375, -0.14654541015625, -0.000732421875, 0.14508056640625, 0.2908935546875, 0.43670654296875, 0.58251953125, 0.72833251953125, 0.8741455078125, 1.01995849609375, 1.165771484375, 1.31158447265625, 1.4573974609375, 1.60321044921875, 1.7490234375, 1.89483642578125, 2.0406494140625, 2.18646240234375, 2.332275390625, 2.47808837890625, 2.6239013671875, 2.76971435546875, 2.91552734375, 3.06134033203125, 3.2071533203125, 3.35296630859375, 3.498779296875, 3.64459228515625, 3.7904052734375, 3.93621826171875, 4.08203125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 8.0, 36.0, 111.0, 233.0, 317.0, 198.0, 71.0, 18.0, 8.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.51558303833008, -43.651119232177734, -41.78665542602539, -39.92218780517578, -38.05772399902344, -36.193260192871094, -34.32879638671875, -32.464332580566406, -30.59986686706543, -28.735403060913086, -26.87093734741211, -25.006473541259766, -23.142009735107422, -21.277544021606445, -19.4130802154541, -17.548614501953125, -15.684150695800781, -13.819685935974121, -11.955221176147461, -10.090757369995117, -8.226292610168457, -6.361827850341797, -4.497364044189453, -2.632899284362793, -0.7684345245361328, 1.0960299968719482, 2.9604945182800293, 4.824958801269531, 6.689423561096191, 8.553888320922852, 10.418352127075195, 12.282816886901855, 14.14727783203125, 16.011741638183594, 17.87620735168457, 19.740671157836914, 21.60513687133789, 23.469600677490234, 25.334064483642578, 27.198528289794922, 29.0629940032959, 30.927457809448242, 32.79192352294922, 34.65638732910156, 36.520851135253906, 38.38531494140625, 40.249778747558594, 42.1142463684082, 43.97871017456055, 45.84317398071289, 47.707637786865234, 49.572105407714844, 51.43656921386719, 53.30103302001953, 55.165496826171875, 57.02996063232422, 58.89442443847656, 60.758888244628906, 62.62335205078125, 64.4878158569336, 66.35227966308594, 68.21675109863281, 70.08120727539062, 71.9456787109375, 73.81014251708984]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 4.0, 4.0, 11.0, 7.0, 11.0, 10.0, 18.0, 12.0, 14.0, 19.0, 21.0, 24.0, 28.0, 30.0, 28.0, 32.0, 33.0, 31.0, 45.0, 38.0, 41.0, 49.0, 49.0, 30.0, 43.0, 43.0, 39.0, 38.0, 33.0, 36.0, 20.0, 30.0, 19.0, 12.0, 20.0, 12.0, 8.0, 9.0, 12.0, 10.0, 8.0, 4.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0], "bins": [-12.501359939575195, -12.115266799926758, -11.729172706604004, -11.343079566955566, -10.956985473632812, -10.570892333984375, -10.184799194335938, -9.7987060546875, -9.412611961364746, -9.026518821716309, -8.640424728393555, -8.254331588745117, -7.8682379722595215, -7.482144355773926, -7.096051216125488, -6.709957599639893, -6.323863983154297, -5.937770366668701, -5.5516767501831055, -5.165583610534668, -4.779489994049072, -4.393396377563477, -4.007303237915039, -3.6212096214294434, -3.2351160049438477, -2.849022388458252, -2.4629290103912354, -2.0768356323242188, -1.690742015838623, -1.304648518562317, -0.9185550212860107, -0.5324616432189941, -0.14636802673339844, 0.23972547054290771, 0.6258189678192139, 1.01191246509552, 1.3980059623718262, 1.7840994596481323, 2.1701929569244385, 2.556286334991455, 2.942379951477051, 3.3284735679626465, 3.714566946029663, 4.10066032409668, 4.486753940582275, 4.872847557067871, 5.258940696716309, 5.645034313201904, 6.0311279296875, 6.417221546173096, 6.803315162658691, 7.189408302307129, 7.575501918792725, 7.96159553527832, 8.347688674926758, 8.733781814575195, 9.11987590789795, 9.505969047546387, 9.89206314086914, 10.278156280517578, 10.664249420166016, 11.05034351348877, 11.436436653137207, 11.822530746459961, 12.208623886108398]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 5.0, 6.0, 12.0, 20.0, 27.0, 28.0, 39.0, 66.0, 82.0, 125.0, 207.0, 320.0, 585.0, 1001.0, 1862.0, 3505.0, 7923.0, 17030.0, 41560.0, 110471.0, 394825.0, 315453.0, 90364.0, 34547.0, 14657.0, 6666.0, 3204.0, 1629.0, 910.0, 507.0, 297.0, 213.0, 125.0, 78.0, 50.0, 49.0, 26.0, 26.0, 4.0, 12.0, 11.0, 8.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.96875, -6.7276611328125, -6.486572265625, -6.2454833984375, -6.00439453125, -5.7633056640625, -5.522216796875, -5.2811279296875, -5.0400390625, -4.7989501953125, -4.557861328125, -4.3167724609375, -4.07568359375, -3.8345947265625, -3.593505859375, -3.3524169921875, -3.111328125, -2.8702392578125, -2.629150390625, -2.3880615234375, -2.14697265625, -1.9058837890625, -1.664794921875, -1.4237060546875, -1.1826171875, -0.9415283203125, -0.700439453125, -0.4593505859375, -0.21826171875, 0.0228271484375, 0.263916015625, 0.5050048828125, 0.74609375, 0.9871826171875, 1.228271484375, 1.4693603515625, 1.71044921875, 1.9515380859375, 2.192626953125, 2.4337158203125, 2.6748046875, 2.9158935546875, 3.156982421875, 3.3980712890625, 3.63916015625, 3.8802490234375, 4.121337890625, 4.3624267578125, 4.603515625, 4.8446044921875, 5.085693359375, 5.3267822265625, 5.56787109375, 5.8089599609375, 6.050048828125, 6.2911376953125, 6.5322265625, 6.7733154296875, 7.014404296875, 7.2554931640625, 7.49658203125, 7.7376708984375, 7.978759765625, 8.2198486328125, 8.4609375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 7.0, 8.0, 11.0, 8.0, 9.0, 17.0, 12.0, 17.0, 26.0, 32.0, 29.0, 26.0, 34.0, 35.0, 53.0, 47.0, 46.0, 56.0, 40.0, 52.0, 50.0, 44.0, 46.0, 35.0, 39.0, 41.0, 39.0, 31.0, 25.0, 24.0, 16.0, 13.0, 7.0, 5.0, 7.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8203125, -1.758544921875, -1.69677734375, -1.635009765625, -1.5732421875, -1.511474609375, -1.44970703125, -1.387939453125, -1.326171875, -1.264404296875, -1.20263671875, -1.140869140625, -1.0791015625, -1.017333984375, -0.95556640625, -0.893798828125, -0.83203125, -0.770263671875, -0.70849609375, -0.646728515625, -0.5849609375, -0.523193359375, -0.46142578125, -0.399658203125, -0.337890625, -0.276123046875, -0.21435546875, -0.152587890625, -0.0908203125, -0.029052734375, 0.03271484375, 0.094482421875, 0.15625, 0.218017578125, 0.27978515625, 0.341552734375, 0.4033203125, 0.465087890625, 0.52685546875, 0.588623046875, 0.650390625, 0.712158203125, 0.77392578125, 0.835693359375, 0.8974609375, 0.959228515625, 1.02099609375, 1.082763671875, 1.14453125, 1.206298828125, 1.26806640625, 1.329833984375, 1.3916015625, 1.453369140625, 1.51513671875, 1.576904296875, 1.638671875, 1.700439453125, 1.76220703125, 1.823974609375, 1.8857421875, 1.947509765625, 2.00927734375, 2.071044921875, 2.1328125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 7.0, 10.0, 6.0, 15.0, 19.0, 20.0, 29.0, 32.0, 39.0, 76.0, 92.0, 157.0, 243.0, 517.0, 1289.0, 3825.0, 14521.0, 68243.0, 563580.0, 333604.0, 46730.0, 10374.0, 2894.0, 1054.0, 441.0, 229.0, 138.0, 96.0, 86.0, 44.0, 32.0, 24.0, 18.0, 18.0, 13.0, 8.0, 8.0, 6.0, 1.0, 0.0, 9.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-13.1328125, -12.75634765625, -12.3798828125, -12.00341796875, -11.626953125, -11.25048828125, -10.8740234375, -10.49755859375, -10.12109375, -9.74462890625, -9.3681640625, -8.99169921875, -8.615234375, -8.23876953125, -7.8623046875, -7.48583984375, -7.109375, -6.73291015625, -6.3564453125, -5.97998046875, -5.603515625, -5.22705078125, -4.8505859375, -4.47412109375, -4.09765625, -3.72119140625, -3.3447265625, -2.96826171875, -2.591796875, -2.21533203125, -1.8388671875, -1.46240234375, -1.0859375, -0.70947265625, -0.3330078125, 0.04345703125, 0.419921875, 0.79638671875, 1.1728515625, 1.54931640625, 1.92578125, 2.30224609375, 2.6787109375, 3.05517578125, 3.431640625, 3.80810546875, 4.1845703125, 4.56103515625, 4.9375, 5.31396484375, 5.6904296875, 6.06689453125, 6.443359375, 6.81982421875, 7.1962890625, 7.57275390625, 7.94921875, 8.32568359375, 8.7021484375, 9.07861328125, 9.455078125, 9.83154296875, 10.2080078125, 10.58447265625, 10.9609375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 7.0, 3.0, 7.0, 10.0, 8.0, 15.0, 15.0, 28.0, 31.0, 27.0, 31.0, 36.0, 47.0, 49.0, 59.0, 68.0, 55.0, 66.0, 56.0, 48.0, 53.0, 39.0, 47.0, 32.0, 33.0, 25.0, 24.0, 21.0, 13.0, 18.0, 5.0, 11.0, 8.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.34375, -8.0308837890625, -7.718017578125, -7.4051513671875, -7.09228515625, -6.7794189453125, -6.466552734375, -6.1536865234375, -5.8408203125, -5.5279541015625, -5.215087890625, -4.9022216796875, -4.58935546875, -4.2764892578125, -3.963623046875, -3.6507568359375, -3.337890625, -3.0250244140625, -2.712158203125, -2.3992919921875, -2.08642578125, -1.7735595703125, -1.460693359375, -1.1478271484375, -0.8349609375, -0.5220947265625, -0.209228515625, 0.1036376953125, 0.41650390625, 0.7293701171875, 1.042236328125, 1.3551025390625, 1.66796875, 1.9808349609375, 2.293701171875, 2.6065673828125, 2.91943359375, 3.2322998046875, 3.545166015625, 3.8580322265625, 4.1708984375, 4.4837646484375, 4.796630859375, 5.1094970703125, 5.42236328125, 5.7352294921875, 6.048095703125, 6.3609619140625, 6.673828125, 6.9866943359375, 7.299560546875, 7.6124267578125, 7.92529296875, 8.2381591796875, 8.551025390625, 8.8638916015625, 9.1767578125, 9.4896240234375, 9.802490234375, 10.1153564453125, 10.42822265625, 10.7410888671875, 11.053955078125, 11.3668212890625, 11.6796875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 18.0, 22.0, 30.0, 56.0, 94.0, 177.0, 287.0, 516.0, 956.0, 2268.0, 7643.0, 67354.0, 911614.0, 46916.0, 6546.0, 1966.0, 896.0, 482.0, 281.0, 158.0, 107.0, 49.0, 44.0, 24.0, 21.0, 7.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3359375, -11.967041015625, -11.59814453125, -11.229248046875, -10.8603515625, -10.491455078125, -10.12255859375, -9.753662109375, -9.384765625, -9.015869140625, -8.64697265625, -8.278076171875, -7.9091796875, -7.540283203125, -7.17138671875, -6.802490234375, -6.43359375, -6.064697265625, -5.69580078125, -5.326904296875, -4.9580078125, -4.589111328125, -4.22021484375, -3.851318359375, -3.482421875, -3.113525390625, -2.74462890625, -2.375732421875, -2.0068359375, -1.637939453125, -1.26904296875, -0.900146484375, -0.53125, -0.162353515625, 0.20654296875, 0.575439453125, 0.9443359375, 1.313232421875, 1.68212890625, 2.051025390625, 2.419921875, 2.788818359375, 3.15771484375, 3.526611328125, 3.8955078125, 4.264404296875, 4.63330078125, 5.002197265625, 5.37109375, 5.739990234375, 6.10888671875, 6.477783203125, 6.8466796875, 7.215576171875, 7.58447265625, 7.953369140625, 8.322265625, 8.691162109375, 9.06005859375, 9.428955078125, 9.7978515625, 10.166748046875, 10.53564453125, 10.904541015625, 11.2734375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 4.0, 8.0, 21.0, 26.0, 40.0, 92.0, 299.0, 312.0, 106.0, 35.0, 23.0, 12.0, 10.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002483367919921875, -0.002425655722618103, -0.002367943525314331, -0.002310231328010559, -0.002252519130706787, -0.002194806933403015, -0.002137094736099243, -0.002079382538795471, -0.0020216703414916992, -0.0019639581441879272, -0.0019062459468841553, -0.0018485337495803833, -0.0017908215522766113, -0.0017331093549728394, -0.0016753971576690674, -0.0016176849603652954, -0.0015599727630615234, -0.0015022605657577515, -0.0014445483684539795, -0.0013868361711502075, -0.0013291239738464355, -0.0012714117765426636, -0.0012136995792388916, -0.0011559873819351196, -0.0010982751846313477, -0.0010405629873275757, -0.0009828507900238037, -0.0009251385927200317, -0.0008674263954162598, -0.0008097141981124878, -0.0007520020008087158, -0.0006942898035049438, -0.0006365776062011719, -0.0005788654088973999, -0.0005211532115936279, -0.00046344101428985596, -0.000405728816986084, -0.000348016619682312, -0.00029030442237854004, -0.00023259222507476807, -0.0001748800277709961, -0.00011716783046722412, -5.945563316345215e-05, -1.7434358596801758e-06, 5.59687614440918e-05, 0.00011368095874786377, 0.00017139315605163574, 0.00022910535335540771, 0.0002868175506591797, 0.00034452974796295166, 0.00040224194526672363, 0.0004599541425704956, 0.0005176663398742676, 0.0005753785371780396, 0.0006330907344818115, 0.0006908029317855835, 0.0007485151290893555, 0.0008062273263931274, 0.0008639395236968994, 0.0009216517210006714, 0.0009793639183044434, 0.0010370761156082153, 0.0010947883129119873, 0.0011525005102157593, 0.0012102127075195312]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 7.0, 8.0, 10.0, 14.0, 33.0, 56.0, 107.0, 229.0, 634.0, 2433.0, 20362.0, 985848.0, 34340.0, 3171.0, 773.0, 258.0, 131.0, 59.0, 39.0, 16.0, 8.0, 13.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.265625, -20.63232421875, -19.9990234375, -19.36572265625, -18.732421875, -18.09912109375, -17.4658203125, -16.83251953125, -16.19921875, -15.56591796875, -14.9326171875, -14.29931640625, -13.666015625, -13.03271484375, -12.3994140625, -11.76611328125, -11.1328125, -10.49951171875, -9.8662109375, -9.23291015625, -8.599609375, -7.96630859375, -7.3330078125, -6.69970703125, -6.06640625, -5.43310546875, -4.7998046875, -4.16650390625, -3.533203125, -2.89990234375, -2.2666015625, -1.63330078125, -1.0, -0.36669921875, 0.2666015625, 0.89990234375, 1.533203125, 2.16650390625, 2.7998046875, 3.43310546875, 4.06640625, 4.69970703125, 5.3330078125, 5.96630859375, 6.599609375, 7.23291015625, 7.8662109375, 8.49951171875, 9.1328125, 9.76611328125, 10.3994140625, 11.03271484375, 11.666015625, 12.29931640625, 12.9326171875, 13.56591796875, 14.19921875, 14.83251953125, 15.4658203125, 16.09912109375, 16.732421875, 17.36572265625, 17.9990234375, 18.63232421875, 19.265625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 7.0, 12.0, 16.0, 38.0, 73.0, 160.0, 314.0, 200.0, 83.0, 35.0, 21.0, 12.0, 6.0, 4.0, 6.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.578125, -5.2613525390625, -4.944580078125, -4.6278076171875, -4.31103515625, -3.9942626953125, -3.677490234375, -3.3607177734375, -3.0439453125, -2.7271728515625, -2.410400390625, -2.0936279296875, -1.77685546875, -1.4600830078125, -1.143310546875, -0.8265380859375, -0.509765625, -0.1929931640625, 0.123779296875, 0.4405517578125, 0.75732421875, 1.0740966796875, 1.390869140625, 1.7076416015625, 2.0244140625, 2.3411865234375, 2.657958984375, 2.9747314453125, 3.29150390625, 3.6082763671875, 3.925048828125, 4.2418212890625, 4.55859375, 4.8753662109375, 5.192138671875, 5.5089111328125, 5.82568359375, 6.1424560546875, 6.459228515625, 6.7760009765625, 7.0927734375, 7.4095458984375, 7.726318359375, 8.0430908203125, 8.35986328125, 8.6766357421875, 8.993408203125, 9.3101806640625, 9.626953125, 9.9437255859375, 10.260498046875, 10.5772705078125, 10.89404296875, 11.2108154296875, 11.527587890625, 11.8443603515625, 12.1611328125, 12.4779052734375, 12.794677734375, 13.1114501953125, 13.42822265625, 13.7449951171875, 14.061767578125, 14.3785400390625, 14.6953125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 15.0, 31.0, 97.0, 196.0, 343.0, 206.0, 75.0, 22.0, 15.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-166.20159912109375, -161.77169799804688, -157.341796875, -152.91189575195312, -148.4819793701172, -144.0520782470703, -139.62217712402344, -135.19227600097656, -130.7623748779297, -126.33247375488281, -121.9025650024414, -117.47266387939453, -113.04276275634766, -108.61285400390625, -104.18295288085938, -99.7530517578125, -95.3231430053711, -90.89324188232422, -86.46333312988281, -82.03343200683594, -77.60353088378906, -73.17362976074219, -68.74372100830078, -64.3138198852539, -59.883914947509766, -55.454010009765625, -51.02410888671875, -46.59420394897461, -42.16429901123047, -37.734397888183594, -33.30449295043945, -28.874589920043945, -24.44469451904297, -20.01479148864746, -15.584887504577637, -11.154983520507812, -6.725080490112305, -2.295177459716797, 2.1347274780273438, 6.564630508422852, 10.99453353881836, 15.424436569213867, 19.854339599609375, 24.284244537353516, 28.714147567749023, 33.14405059814453, 37.57395553588867, 42.00386047363281, 46.43376159667969, 50.86366653442383, 55.2935676574707, 59.723472595214844, 64.15337371826172, 68.58328247070312, 73.01318359375, 77.44308471679688, 81.87298583984375, 86.30288696289062, 90.73279571533203, 95.1626968383789, 99.59259796142578, 104.02250671386719, 108.45240783691406, 112.88230895996094, 117.31221771240234]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 2.0, 4.0, 10.0, 5.0, 9.0, 15.0, 12.0, 20.0, 10.0, 13.0, 12.0, 28.0, 18.0, 19.0, 26.0, 32.0, 30.0, 36.0, 35.0, 43.0, 41.0, 45.0, 44.0, 34.0, 54.0, 33.0, 36.0, 42.0, 30.0, 25.0, 42.0, 34.0, 22.0, 20.0, 17.0, 15.0, 17.0, 17.0, 9.0, 4.0, 13.0, 8.0, 8.0, 4.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-39.29570388793945, -38.12223434448242, -36.948760986328125, -35.775291442871094, -34.60182189941406, -33.428348541259766, -32.254878997802734, -31.08140754699707, -29.907936096191406, -28.734464645385742, -27.560993194580078, -26.387523651123047, -25.214052200317383, -24.04058074951172, -22.867111206054688, -21.693639755249023, -20.52016830444336, -19.346696853637695, -18.17322540283203, -16.999755859375, -15.826284408569336, -14.652812957763672, -13.479342460632324, -12.305871963500977, -11.132400512695312, -9.958929061889648, -8.7854585647583, -7.611987590789795, -6.438516616821289, -5.265045642852783, -4.091574668884277, -2.9181041717529297, -1.7446327209472656, -0.5711617469787598, 0.6023092269897461, 1.775780200958252, 2.949251174926758, 4.122722148895264, 5.2961931228637695, 6.469663619995117, 7.643135070800781, 8.816606521606445, 9.990077018737793, 11.16354751586914, 12.337018966674805, 13.510490417480469, 14.683960914611816, 15.857431411743164, 17.030902862548828, 18.204374313354492, 19.377845764160156, 20.551315307617188, 21.72478675842285, 22.898258209228516, 24.071727752685547, 25.24519920349121, 26.418670654296875, 27.59214210510254, 28.765613555908203, 29.939083099365234, 31.1125545501709, 32.28602600097656, 33.459495544433594, 34.632965087890625, 35.80643844604492]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 5.0, 4.0, 7.0, 11.0, 19.0, 13.0, 19.0, 34.0, 48.0, 75.0, 145.0, 209.0, 395.0, 632.0, 1136.0, 2225.0, 4397.0, 10196.0, 27639.0, 108289.0, 3578000.0, 379329.0, 51419.0, 16507.0, 6713.0, 2970.0, 1640.0, 923.0, 528.0, 270.0, 159.0, 115.0, 69.0, 45.0, 30.0, 26.0, 10.0, 10.0, 7.0, 7.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.53125, -14.1131591796875, -13.695068359375, -13.2769775390625, -12.85888671875, -12.4407958984375, -12.022705078125, -11.6046142578125, -11.1865234375, -10.7684326171875, -10.350341796875, -9.9322509765625, -9.51416015625, -9.0960693359375, -8.677978515625, -8.2598876953125, -7.841796875, -7.4237060546875, -7.005615234375, -6.5875244140625, -6.16943359375, -5.7513427734375, -5.333251953125, -4.9151611328125, -4.4970703125, -4.0789794921875, -3.660888671875, -3.2427978515625, -2.82470703125, -2.4066162109375, -1.988525390625, -1.5704345703125, -1.15234375, -0.7342529296875, -0.316162109375, 0.1019287109375, 0.52001953125, 0.9381103515625, 1.356201171875, 1.7742919921875, 2.1923828125, 2.6104736328125, 3.028564453125, 3.4466552734375, 3.86474609375, 4.2828369140625, 4.700927734375, 5.1190185546875, 5.537109375, 5.9552001953125, 6.373291015625, 6.7913818359375, 7.20947265625, 7.6275634765625, 8.045654296875, 8.4637451171875, 8.8818359375, 9.2999267578125, 9.718017578125, 10.1361083984375, 10.55419921875, 10.9722900390625, 11.390380859375, 11.8084716796875, 12.2265625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 1.0, 7.0, 15.0, 7.0, 10.0, 14.0, 20.0, 18.0, 18.0, 29.0, 35.0, 20.0, 43.0, 40.0, 42.0, 45.0, 43.0, 44.0, 55.0, 50.0, 36.0, 68.0, 31.0, 38.0, 35.0, 26.0, 35.0, 39.0, 26.0, 25.0, 17.0, 10.0, 17.0, 4.0, 9.0, 3.0, 8.0, 8.0, 2.0, 2.0, 2.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.822265625, -1.759185791015625, -1.69610595703125, -1.633026123046875, -1.5699462890625, -1.506866455078125, -1.44378662109375, -1.380706787109375, -1.317626953125, -1.254547119140625, -1.19146728515625, -1.128387451171875, -1.0653076171875, -1.002227783203125, -0.93914794921875, -0.876068115234375, -0.81298828125, -0.749908447265625, -0.68682861328125, -0.623748779296875, -0.5606689453125, -0.497589111328125, -0.43450927734375, -0.371429443359375, -0.308349609375, -0.245269775390625, -0.18218994140625, -0.119110107421875, -0.0560302734375, 0.007049560546875, 0.07012939453125, 0.133209228515625, 0.1962890625, 0.259368896484375, 0.32244873046875, 0.385528564453125, 0.4486083984375, 0.511688232421875, 0.57476806640625, 0.637847900390625, 0.700927734375, 0.764007568359375, 0.82708740234375, 0.890167236328125, 0.9532470703125, 1.016326904296875, 1.07940673828125, 1.142486572265625, 1.20556640625, 1.268646240234375, 1.33172607421875, 1.394805908203125, 1.4578857421875, 1.520965576171875, 1.58404541015625, 1.647125244140625, 1.710205078125, 1.773284912109375, 1.83636474609375, 1.899444580078125, 1.9625244140625, 2.025604248046875, 2.08868408203125, 2.151763916015625, 2.21484375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 5.0, 10.0, 19.0, 39.0, 83.0, 168.0, 470.0, 1775.0, 12152.0, 200816.0, 3931388.0, 41349.0, 4648.0, 862.0, 267.0, 103.0, 51.0, 38.0, 17.0, 10.0, 9.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.78125, -31.8515625, -30.921875, -29.9921875, -29.0625, -28.1328125, -27.203125, -26.2734375, -25.34375, -24.4140625, -23.484375, -22.5546875, -21.625, -20.6953125, -19.765625, -18.8359375, -17.90625, -16.9765625, -16.046875, -15.1171875, -14.1875, -13.2578125, -12.328125, -11.3984375, -10.46875, -9.5390625, -8.609375, -7.6796875, -6.75, -5.8203125, -4.890625, -3.9609375, -3.03125, -2.1015625, -1.171875, -0.2421875, 0.6875, 1.6171875, 2.546875, 3.4765625, 4.40625, 5.3359375, 6.265625, 7.1953125, 8.125, 9.0546875, 9.984375, 10.9140625, 11.84375, 12.7734375, 13.703125, 14.6328125, 15.5625, 16.4921875, 17.421875, 18.3515625, 19.28125, 20.2109375, 21.140625, 22.0703125, 23.0, 23.9296875, 24.859375, 25.7890625, 26.71875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 8.0, 5.0, 6.0, 7.0, 12.0, 27.0, 40.0, 43.0, 69.0, 156.0, 622.0, 2530.0, 293.0, 119.0, 46.0, 24.0, 20.0, 15.0, 14.0, 7.0, 9.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.671875, -9.419189453125, -9.16650390625, -8.913818359375, -8.6611328125, -8.408447265625, -8.15576171875, -7.903076171875, -7.650390625, -7.397705078125, -7.14501953125, -6.892333984375, -6.6396484375, -6.386962890625, -6.13427734375, -5.881591796875, -5.62890625, -5.376220703125, -5.12353515625, -4.870849609375, -4.6181640625, -4.365478515625, -4.11279296875, -3.860107421875, -3.607421875, -3.354736328125, -3.10205078125, -2.849365234375, -2.5966796875, -2.343994140625, -2.09130859375, -1.838623046875, -1.5859375, -1.333251953125, -1.08056640625, -0.827880859375, -0.5751953125, -0.322509765625, -0.06982421875, 0.182861328125, 0.435546875, 0.688232421875, 0.94091796875, 1.193603515625, 1.4462890625, 1.698974609375, 1.95166015625, 2.204345703125, 2.45703125, 2.709716796875, 2.96240234375, 3.215087890625, 3.4677734375, 3.720458984375, 3.97314453125, 4.225830078125, 4.478515625, 4.731201171875, 4.98388671875, 5.236572265625, 5.4892578125, 5.741943359375, 5.99462890625, 6.247314453125, 6.5]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 10.0, 18.0, 35.0, 73.0, 103.0, 195.0, 206.0, 150.0, 99.0, 46.0, 29.0, 16.0, 6.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.949222564697266, -39.78824234008789, -38.62725830078125, -37.466278076171875, -36.305294036865234, -35.14431381225586, -33.98332977294922, -32.822349548339844, -31.661365509033203, -30.500383377075195, -29.339401245117188, -28.17841911315918, -27.017436981201172, -25.856454849243164, -24.695472717285156, -23.53449249267578, -22.373510360717773, -21.212528228759766, -20.051546096801758, -18.89056396484375, -17.729581832885742, -16.568599700927734, -15.407618522644043, -14.246636390686035, -13.085654258728027, -11.92467212677002, -10.763689994812012, -9.60270881652832, -8.441726684570312, -7.2807440757751465, -6.119762420654297, -4.958780288696289, -3.7977981567382812, -2.6368160247802734, -1.4758341312408447, -0.314852237701416, 0.8461298942565918, 2.0071120262145996, 3.168093681335449, 4.329075813293457, 5.490057945251465, 6.651040077209473, 7.8120222091674805, 8.973003387451172, 10.13398551940918, 11.294967651367188, 12.455949783325195, 13.616931915283203, 14.777914047241211, 15.938896179199219, 17.099878311157227, 18.260860443115234, 19.421842575073242, 20.58282470703125, 21.743804931640625, 22.904788970947266, 24.06576919555664, 25.22675132751465, 26.387733459472656, 27.548715591430664, 28.709697723388672, 29.87067985534668, 31.031661987304688, 32.19264221191406, 33.3536262512207]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 2.0, 6.0, 10.0, 7.0, 11.0, 19.0, 9.0, 12.0, 14.0, 25.0, 27.0, 31.0, 26.0, 25.0, 46.0, 36.0, 41.0, 38.0, 36.0, 38.0, 32.0, 46.0, 51.0, 56.0, 43.0, 37.0, 35.0, 35.0, 27.0, 31.0, 22.0, 16.0, 22.0, 18.0, 19.0, 11.0, 11.0, 4.0, 5.0, 9.0, 1.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-15.395833969116211, -14.941278457641602, -14.486722946166992, -14.0321683883667, -13.57761287689209, -13.12305736541748, -12.668502807617188, -12.213947296142578, -11.759391784667969, -11.30483627319336, -10.85028076171875, -10.395726203918457, -9.941170692443848, -9.486615180969238, -9.032060623168945, -8.577505111694336, -8.122949600219727, -7.668394088745117, -7.213839054107666, -6.759284019470215, -6.3047285079956055, -5.850172996520996, -5.395617961883545, -4.941062927246094, -4.486507415771484, -4.031951904296875, -3.577396869659424, -3.1228415966033936, -2.6682863235473633, -2.213731050491333, -1.7591757774353027, -1.3046205043792725, -0.8500652313232422, -0.3955099582672119, 0.05904531478881836, 0.5136005878448486, 0.9681558609008789, 1.4227111339569092, 1.8772664070129395, 2.3318216800689697, 2.786376953125, 3.2409322261810303, 3.6954874992370605, 4.150042533874512, 4.604598045349121, 5.0591535568237305, 5.513708591461182, 5.968263626098633, 6.422819137573242, 6.877374649047852, 7.331929683685303, 7.786484718322754, 8.241040229797363, 8.695595741271973, 9.150150299072266, 9.604705810546875, 10.059261322021484, 10.513816833496094, 10.968372344970703, 11.422926902770996, 11.877482414245605, 12.332037925720215, 12.786592483520508, 13.241147994995117, 13.695703506469727]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 5.0, 3.0, 10.0, 14.0, 17.0, 30.0, 34.0, 42.0, 68.0, 89.0, 147.0, 222.0, 333.0, 610.0, 980.0, 1924.0, 3650.0, 7139.0, 14848.0, 32579.0, 73963.0, 167821.0, 341786.0, 223030.0, 97282.0, 43136.0, 19584.0, 9104.0, 4522.0, 2337.0, 1319.0, 694.0, 413.0, 290.0, 159.0, 101.0, 91.0, 54.0, 39.0, 33.0, 20.0, 11.0, 8.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.3359375, -7.10430908203125, -6.8726806640625, -6.64105224609375, -6.409423828125, -6.17779541015625, -5.9461669921875, -5.71453857421875, -5.48291015625, -5.25128173828125, -5.0196533203125, -4.78802490234375, -4.556396484375, -4.32476806640625, -4.0931396484375, -3.86151123046875, -3.6298828125, -3.39825439453125, -3.1666259765625, -2.93499755859375, -2.703369140625, -2.47174072265625, -2.2401123046875, -2.00848388671875, -1.77685546875, -1.54522705078125, -1.3135986328125, -1.08197021484375, -0.850341796875, -0.61871337890625, -0.3870849609375, -0.15545654296875, 0.076171875, 0.30780029296875, 0.5394287109375, 0.77105712890625, 1.002685546875, 1.23431396484375, 1.4659423828125, 1.69757080078125, 1.92919921875, 2.16082763671875, 2.3924560546875, 2.62408447265625, 2.855712890625, 3.08734130859375, 3.3189697265625, 3.55059814453125, 3.7822265625, 4.01385498046875, 4.2454833984375, 4.47711181640625, 4.708740234375, 4.94036865234375, 5.1719970703125, 5.40362548828125, 5.63525390625, 5.86688232421875, 6.0985107421875, 6.33013916015625, 6.561767578125, 6.79339599609375, 7.0250244140625, 7.25665283203125, 7.48828125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 5.0, 9.0, 11.0, 7.0, 15.0, 12.0, 14.0, 20.0, 28.0, 20.0, 23.0, 33.0, 37.0, 35.0, 41.0, 39.0, 42.0, 54.0, 50.0, 46.0, 40.0, 44.0, 42.0, 32.0, 38.0, 41.0, 32.0, 29.0, 18.0, 29.0, 25.0, 12.0, 17.0, 15.0, 8.0, 8.0, 9.0, 7.0, 3.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7392578125, -1.6727447509765625, -1.606231689453125, -1.5397186279296875, -1.47320556640625, -1.4066925048828125, -1.340179443359375, -1.2736663818359375, -1.2071533203125, -1.1406402587890625, -1.074127197265625, -1.0076141357421875, -0.94110107421875, -0.8745880126953125, -0.808074951171875, -0.7415618896484375, -0.675048828125, -0.6085357666015625, -0.542022705078125, -0.4755096435546875, -0.40899658203125, -0.3424835205078125, -0.275970458984375, -0.2094573974609375, -0.1429443359375, -0.0764312744140625, -0.009918212890625, 0.0565948486328125, 0.12310791015625, 0.1896209716796875, 0.256134033203125, 0.3226470947265625, 0.38916015625, 0.4556732177734375, 0.522186279296875, 0.5886993408203125, 0.65521240234375, 0.7217254638671875, 0.788238525390625, 0.8547515869140625, 0.9212646484375, 0.9877777099609375, 1.054290771484375, 1.1208038330078125, 1.18731689453125, 1.2538299560546875, 1.320343017578125, 1.3868560791015625, 1.453369140625, 1.5198822021484375, 1.586395263671875, 1.6529083251953125, 1.71942138671875, 1.7859344482421875, 1.852447509765625, 1.9189605712890625, 1.9854736328125, 2.0519866943359375, 2.118499755859375, 2.1850128173828125, 2.25152587890625, 2.3180389404296875, 2.384552001953125, 2.4510650634765625, 2.517578125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 6.0, 5.0, 9.0, 11.0, 18.0, 18.0, 22.0, 35.0, 46.0, 57.0, 91.0, 110.0, 144.0, 204.0, 310.0, 458.0, 804.0, 1903.0, 5277.0, 21444.0, 117915.0, 588033.0, 252464.0, 44054.0, 9215.0, 2762.0, 1101.0, 626.0, 405.0, 238.0, 166.0, 137.0, 90.0, 85.0, 67.0, 61.0, 33.0, 35.0, 25.0, 20.0, 12.0, 11.0, 6.0, 3.0, 6.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.21875, -12.814697265625, -12.41064453125, -12.006591796875, -11.6025390625, -11.198486328125, -10.79443359375, -10.390380859375, -9.986328125, -9.582275390625, -9.17822265625, -8.774169921875, -8.3701171875, -7.966064453125, -7.56201171875, -7.157958984375, -6.75390625, -6.349853515625, -5.94580078125, -5.541748046875, -5.1376953125, -4.733642578125, -4.32958984375, -3.925537109375, -3.521484375, -3.117431640625, -2.71337890625, -2.309326171875, -1.9052734375, -1.501220703125, -1.09716796875, -0.693115234375, -0.2890625, 0.114990234375, 0.51904296875, 0.923095703125, 1.3271484375, 1.731201171875, 2.13525390625, 2.539306640625, 2.943359375, 3.347412109375, 3.75146484375, 4.155517578125, 4.5595703125, 4.963623046875, 5.36767578125, 5.771728515625, 6.17578125, 6.579833984375, 6.98388671875, 7.387939453125, 7.7919921875, 8.196044921875, 8.60009765625, 9.004150390625, 9.408203125, 9.812255859375, 10.21630859375, 10.620361328125, 11.0244140625, 11.428466796875, 11.83251953125, 12.236572265625, 12.640625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 6.0, 11.0, 8.0, 12.0, 17.0, 26.0, 32.0, 28.0, 44.0, 42.0, 67.0, 64.0, 72.0, 74.0, 73.0, 67.0, 70.0, 48.0, 51.0, 43.0, 28.0, 33.0, 18.0, 22.0, 14.0, 8.0, 9.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.859375, -16.323974609375, -15.78857421875, -15.253173828125, -14.7177734375, -14.182373046875, -13.64697265625, -13.111572265625, -12.576171875, -12.040771484375, -11.50537109375, -10.969970703125, -10.4345703125, -9.899169921875, -9.36376953125, -8.828369140625, -8.29296875, -7.757568359375, -7.22216796875, -6.686767578125, -6.1513671875, -5.615966796875, -5.08056640625, -4.545166015625, -4.009765625, -3.474365234375, -2.93896484375, -2.403564453125, -1.8681640625, -1.332763671875, -0.79736328125, -0.261962890625, 0.2734375, 0.808837890625, 1.34423828125, 1.879638671875, 2.4150390625, 2.950439453125, 3.48583984375, 4.021240234375, 4.556640625, 5.092041015625, 5.62744140625, 6.162841796875, 6.6982421875, 7.233642578125, 7.76904296875, 8.304443359375, 8.83984375, 9.375244140625, 9.91064453125, 10.446044921875, 10.9814453125, 11.516845703125, 12.05224609375, 12.587646484375, 13.123046875, 13.658447265625, 14.19384765625, 14.729248046875, 15.2646484375, 15.800048828125, 16.33544921875, 16.870849609375, 17.40625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 11.0, 16.0, 13.0, 12.0, 41.0, 47.0, 119.0, 188.0, 339.0, 747.0, 1746.0, 5455.0, 35083.0, 707034.0, 272345.0, 18900.0, 3867.0, 1326.0, 587.0, 296.0, 137.0, 82.0, 65.0, 29.0, 28.0, 10.0, 9.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0], "bins": [-15.3125, -14.9283447265625, -14.544189453125, -14.1600341796875, -13.77587890625, -13.3917236328125, -13.007568359375, -12.6234130859375, -12.2392578125, -11.8551025390625, -11.470947265625, -11.0867919921875, -10.70263671875, -10.3184814453125, -9.934326171875, -9.5501708984375, -9.166015625, -8.7818603515625, -8.397705078125, -8.0135498046875, -7.62939453125, -7.2452392578125, -6.861083984375, -6.4769287109375, -6.0927734375, -5.7086181640625, -5.324462890625, -4.9403076171875, -4.55615234375, -4.1719970703125, -3.787841796875, -3.4036865234375, -3.01953125, -2.6353759765625, -2.251220703125, -1.8670654296875, -1.48291015625, -1.0987548828125, -0.714599609375, -0.3304443359375, 0.0537109375, 0.4378662109375, 0.822021484375, 1.2061767578125, 1.59033203125, 1.9744873046875, 2.358642578125, 2.7427978515625, 3.126953125, 3.5111083984375, 3.895263671875, 4.2794189453125, 4.66357421875, 5.0477294921875, 5.431884765625, 5.8160400390625, 6.2001953125, 6.5843505859375, 6.968505859375, 7.3526611328125, 7.73681640625, 8.1209716796875, 8.505126953125, 8.8892822265625, 9.2734375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 2.0, 8.0, 3.0, 7.0, 13.0, 21.0, 20.0, 27.0, 55.0, 72.0, 93.0, 239.0, 162.0, 76.0, 54.0, 37.0, 39.0, 22.0, 13.0, 11.0, 4.0, 3.0, 6.0, 9.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0016632080078125, -0.0016224756836891174, -0.0015817433595657349, -0.0015410110354423523, -0.0015002787113189697, -0.0014595463871955872, -0.0014188140630722046, -0.001378081738948822, -0.0013373494148254395, -0.0012966170907020569, -0.0012558847665786743, -0.0012151524424552917, -0.0011744201183319092, -0.0011336877942085266, -0.001092955470085144, -0.0010522231459617615, -0.001011490821838379, -0.0009707584977149963, -0.0009300261735916138, -0.0008892938494682312, -0.0008485615253448486, -0.0008078292012214661, -0.0007670968770980835, -0.0007263645529747009, -0.0006856322288513184, -0.0006448999047279358, -0.0006041675806045532, -0.0005634352564811707, -0.0005227029323577881, -0.0004819706082344055, -0.00044123828411102295, -0.0004005059599876404, -0.0003597736358642578, -0.00031904131174087524, -0.0002783089876174927, -0.0002375766634941101, -0.00019684433937072754, -0.00015611201524734497, -0.0001153796911239624, -7.464736700057983e-05, -3.3915042877197266e-05, 6.817281246185303e-06, 4.754960536956787e-05, 8.828192949295044e-05, 0.000129014253616333, 0.00016974657773971558, 0.00021047890186309814, 0.0002512112259864807, 0.0002919435501098633, 0.00033267587423324585, 0.0003734081983566284, 0.000414140522480011, 0.00045487284660339355, 0.0004956051707267761, 0.0005363374948501587, 0.0005770698189735413, 0.0006178021430969238, 0.0006585344672203064, 0.000699266791343689, 0.0007399991154670715, 0.0007807314395904541, 0.0008214637637138367, 0.0008621960878372192, 0.0009029284119606018, 0.0009436607360839844]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 3.0, 3.0, 4.0, 7.0, 10.0, 24.0, 59.0, 161.0, 452.0, 1335.0, 11963.0, 893069.0, 136478.0, 3772.0, 748.0, 248.0, 114.0, 51.0, 24.0, 8.0, 3.0, 6.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.171875, -28.4737548828125, -27.775634765625, -27.0775146484375, -26.37939453125, -25.6812744140625, -24.983154296875, -24.2850341796875, -23.5869140625, -22.8887939453125, -22.190673828125, -21.4925537109375, -20.79443359375, -20.0963134765625, -19.398193359375, -18.7000732421875, -18.001953125, -17.3038330078125, -16.605712890625, -15.9075927734375, -15.20947265625, -14.5113525390625, -13.813232421875, -13.1151123046875, -12.4169921875, -11.7188720703125, -11.020751953125, -10.3226318359375, -9.62451171875, -8.9263916015625, -8.228271484375, -7.5301513671875, -6.83203125, -6.1339111328125, -5.435791015625, -4.7376708984375, -4.03955078125, -3.3414306640625, -2.643310546875, -1.9451904296875, -1.2470703125, -0.5489501953125, 0.149169921875, 0.8472900390625, 1.54541015625, 2.2435302734375, 2.941650390625, 3.6397705078125, 4.337890625, 5.0360107421875, 5.734130859375, 6.4322509765625, 7.13037109375, 7.8284912109375, 8.526611328125, 9.2247314453125, 9.9228515625, 10.6209716796875, 11.319091796875, 12.0172119140625, 12.71533203125, 13.4134521484375, 14.111572265625, 14.8096923828125, 15.5078125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 9.0, 14.0, 18.0, 32.0, 40.0, 65.0, 108.0, 159.0, 193.0, 146.0, 71.0, 54.0, 36.0, 21.0, 7.0, 4.0, 8.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.1484375, -13.821044921875, -13.49365234375, -13.166259765625, -12.8388671875, -12.511474609375, -12.18408203125, -11.856689453125, -11.529296875, -11.201904296875, -10.87451171875, -10.547119140625, -10.2197265625, -9.892333984375, -9.56494140625, -9.237548828125, -8.91015625, -8.582763671875, -8.25537109375, -7.927978515625, -7.6005859375, -7.273193359375, -6.94580078125, -6.618408203125, -6.291015625, -5.963623046875, -5.63623046875, -5.308837890625, -4.9814453125, -4.654052734375, -4.32666015625, -3.999267578125, -3.671875, -3.344482421875, -3.01708984375, -2.689697265625, -2.3623046875, -2.034912109375, -1.70751953125, -1.380126953125, -1.052734375, -0.725341796875, -0.39794921875, -0.070556640625, 0.2568359375, 0.584228515625, 0.91162109375, 1.239013671875, 1.56640625, 1.893798828125, 2.22119140625, 2.548583984375, 2.8759765625, 3.203369140625, 3.53076171875, 3.858154296875, 4.185546875, 4.512939453125, 4.84033203125, 5.167724609375, 5.4951171875, 5.822509765625, 6.14990234375, 6.477294921875, 6.8046875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 10.0, 24.0, 35.0, 77.0, 122.0, 189.0, 199.0, 141.0, 101.0, 52.0, 17.0, 14.0, 10.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-132.65936279296875, -128.76719665527344, -124.87501525878906, -120.98284912109375, -117.0906753540039, -113.19850158691406, -109.30633544921875, -105.4141616821289, -101.52198791503906, -97.62981414794922, -93.73764038085938, -89.84547424316406, -85.95330047607422, -82.06112670898438, -78.16896057128906, -74.27678680419922, -70.38461303710938, -66.49243927001953, -62.60026931762695, -58.708099365234375, -54.81592559814453, -50.92375183105469, -47.03158187866211, -43.13941192626953, -39.24723815917969, -35.355064392089844, -31.462894439697266, -27.570722579956055, -23.678550720214844, -19.786378860473633, -15.894207000732422, -12.002035140991211, -8.109870910644531, -4.21769905090332, -0.3255271911621094, 3.5666446685791016, 7.4588165283203125, 11.350988388061523, 15.243160247802734, 19.135332107543945, 23.027503967285156, 26.919675827026367, 30.811847686767578, 34.704017639160156, 38.59619140625, 42.488365173339844, 46.38053512573242, 50.272705078125, 54.164878845214844, 58.05705261230469, 61.949222564697266, 65.84139251708984, 69.73356628417969, 73.62574005126953, 77.51791381835938, 81.41007995605469, 85.30225372314453, 89.19442749023438, 93.08659362792969, 96.97876739501953, 100.87094116210938, 104.76311492919922, 108.65528869628906, 112.54745483398438, 116.43962860107422]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 1.0, 4.0, 7.0, 3.0, 8.0, 9.0, 14.0, 7.0, 14.0, 19.0, 21.0, 17.0, 25.0, 38.0, 34.0, 58.0, 43.0, 69.0, 51.0, 67.0, 61.0, 60.0, 50.0, 49.0, 54.0, 31.0, 35.0, 32.0, 18.0, 17.0, 14.0, 20.0, 13.0, 8.0, 5.0, 9.0, 2.0, 3.0, 7.0, 0.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-88.0032958984375, -85.32564544677734, -82.64800262451172, -79.97035217285156, -77.29270935058594, -74.61505889892578, -71.93740844726562, -69.259765625, -66.58211517333984, -63.90446853637695, -61.22682189941406, -58.549171447753906, -55.871524810791016, -53.193878173828125, -50.51622772216797, -47.83858108520508, -45.16093444824219, -42.4832878112793, -39.805641174316406, -37.12799072265625, -34.45034408569336, -31.77269744873047, -29.095048904418945, -26.417400360107422, -23.73975372314453, -21.06210708618164, -18.384458541870117, -15.70681095123291, -13.029163360595703, -10.351515769958496, -7.673868179321289, -4.996219635009766, -2.318572998046875, 0.35907459259033203, 3.036722183227539, 5.714369773864746, 8.392017364501953, 11.06966495513916, 13.747312545776367, 16.42496109008789, 19.10260772705078, 21.780254364013672, 24.457902908325195, 27.13555145263672, 29.81319808959961, 32.4908447265625, 35.168495178222656, 37.84614181518555, 40.52378845214844, 43.20143508911133, 45.87908172607422, 48.556732177734375, 51.234378814697266, 53.912025451660156, 56.58967590332031, 59.2673225402832, 61.944969177246094, 64.62261962890625, 67.30026245117188, 69.97791290283203, 72.65556335449219, 75.33320617675781, 78.01085662841797, 80.68850708007812, 83.36614990234375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 8.0, 13.0, 6.0, 13.0, 26.0, 37.0, 55.0, 95.0, 160.0, 310.0, 586.0, 1177.0, 2403.0, 5789.0, 16126.0, 60312.0, 753648.0, 3232670.0, 86800.0, 21304.0, 7070.0, 2895.0, 1322.0, 648.0, 355.0, 180.0, 114.0, 69.0, 41.0, 15.0, 10.0, 9.0, 4.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.8828125, -12.4549560546875, -12.027099609375, -11.5992431640625, -11.17138671875, -10.7435302734375, -10.315673828125, -9.8878173828125, -9.4599609375, -9.0321044921875, -8.604248046875, -8.1763916015625, -7.74853515625, -7.3206787109375, -6.892822265625, -6.4649658203125, -6.037109375, -5.6092529296875, -5.181396484375, -4.7535400390625, -4.32568359375, -3.8978271484375, -3.469970703125, -3.0421142578125, -2.6142578125, -2.1864013671875, -1.758544921875, -1.3306884765625, -0.90283203125, -0.4749755859375, -0.047119140625, 0.3807373046875, 0.80859375, 1.2364501953125, 1.664306640625, 2.0921630859375, 2.52001953125, 2.9478759765625, 3.375732421875, 3.8035888671875, 4.2314453125, 4.6593017578125, 5.087158203125, 5.5150146484375, 5.94287109375, 6.3707275390625, 6.798583984375, 7.2264404296875, 7.654296875, 8.0821533203125, 8.510009765625, 8.9378662109375, 9.36572265625, 9.7935791015625, 10.221435546875, 10.6492919921875, 11.0771484375, 11.5050048828125, 11.932861328125, 12.3607177734375, 12.78857421875, 13.2164306640625, 13.644287109375, 14.0721435546875, 14.5]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 4.0, 10.0, 4.0, 12.0, 12.0, 11.0, 14.0, 27.0, 33.0, 39.0, 34.0, 33.0, 55.0, 56.0, 60.0, 63.0, 59.0, 71.0, 61.0, 45.0, 43.0, 33.0, 38.0, 44.0, 34.0, 19.0, 21.0, 18.0, 17.0, 7.0, 4.0, 7.0, 6.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.94921875, -3.8441162109375, -3.739013671875, -3.6339111328125, -3.52880859375, -3.4237060546875, -3.318603515625, -3.2135009765625, -3.1083984375, -3.0032958984375, -2.898193359375, -2.7930908203125, -2.68798828125, -2.5828857421875, -2.477783203125, -2.3726806640625, -2.267578125, -2.1624755859375, -2.057373046875, -1.9522705078125, -1.84716796875, -1.7420654296875, -1.636962890625, -1.5318603515625, -1.4267578125, -1.3216552734375, -1.216552734375, -1.1114501953125, -1.00634765625, -0.9012451171875, -0.796142578125, -0.6910400390625, -0.5859375, -0.4808349609375, -0.375732421875, -0.2706298828125, -0.16552734375, -0.0604248046875, 0.044677734375, 0.1497802734375, 0.2548828125, 0.3599853515625, 0.465087890625, 0.5701904296875, 0.67529296875, 0.7803955078125, 0.885498046875, 0.9906005859375, 1.095703125, 1.2008056640625, 1.305908203125, 1.4110107421875, 1.51611328125, 1.6212158203125, 1.726318359375, 1.8314208984375, 1.9365234375, 2.0416259765625, 2.146728515625, 2.2518310546875, 2.35693359375, 2.4620361328125, 2.567138671875, 2.6722412109375, 2.77734375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 7.0, 5.0, 21.0, 26.0, 48.0, 96.0, 159.0, 294.0, 612.0, 2105.0, 14807.0, 335602.0, 3794554.0, 39955.0, 4151.0, 996.0, 393.0, 213.0, 109.0, 56.0, 28.0, 26.0, 16.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.40625, -23.5703125, -22.734375, -21.8984375, -21.0625, -20.2265625, -19.390625, -18.5546875, -17.71875, -16.8828125, -16.046875, -15.2109375, -14.375, -13.5390625, -12.703125, -11.8671875, -11.03125, -10.1953125, -9.359375, -8.5234375, -7.6875, -6.8515625, -6.015625, -5.1796875, -4.34375, -3.5078125, -2.671875, -1.8359375, -1.0, -0.1640625, 0.671875, 1.5078125, 2.34375, 3.1796875, 4.015625, 4.8515625, 5.6875, 6.5234375, 7.359375, 8.1953125, 9.03125, 9.8671875, 10.703125, 11.5390625, 12.375, 13.2109375, 14.046875, 14.8828125, 15.71875, 16.5546875, 17.390625, 18.2265625, 19.0625, 19.8984375, 20.734375, 21.5703125, 22.40625, 23.2421875, 24.078125, 24.9140625, 25.75, 26.5859375, 27.421875, 28.2578125, 29.09375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 10.0, 5.0, 26.0, 44.0, 78.0, 229.0, 2280.0, 1095.0, 167.0, 65.0, 49.0, 14.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.265625, -15.79931640625, -15.3330078125, -14.86669921875, -14.400390625, -13.93408203125, -13.4677734375, -13.00146484375, -12.53515625, -12.06884765625, -11.6025390625, -11.13623046875, -10.669921875, -10.20361328125, -9.7373046875, -9.27099609375, -8.8046875, -8.33837890625, -7.8720703125, -7.40576171875, -6.939453125, -6.47314453125, -6.0068359375, -5.54052734375, -5.07421875, -4.60791015625, -4.1416015625, -3.67529296875, -3.208984375, -2.74267578125, -2.2763671875, -1.81005859375, -1.34375, -0.87744140625, -0.4111328125, 0.05517578125, 0.521484375, 0.98779296875, 1.4541015625, 1.92041015625, 2.38671875, 2.85302734375, 3.3193359375, 3.78564453125, 4.251953125, 4.71826171875, 5.1845703125, 5.65087890625, 6.1171875, 6.58349609375, 7.0498046875, 7.51611328125, 7.982421875, 8.44873046875, 8.9150390625, 9.38134765625, 9.84765625, 10.31396484375, 10.7802734375, 11.24658203125, 11.712890625, 12.17919921875, 12.6455078125, 13.11181640625, 13.578125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 20.0, 44.0, 193.0, 347.0, 284.0, 88.0, 21.0, 7.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.44204711914062, -89.44474029541016, -86.44744110107422, -83.45013427734375, -80.45282745361328, -77.45552062988281, -74.45822143554688, -71.4609146118164, -68.46360778808594, -65.46630096435547, -62.468997955322266, -59.47169494628906, -56.474388122558594, -53.47708511352539, -50.47978210449219, -47.48247528076172, -44.48517608642578, -41.48787307739258, -38.49056625366211, -35.493263244628906, -32.49595642089844, -29.498653411865234, -26.50135040283203, -23.504045486450195, -20.50674057006836, -17.509435653686523, -14.512131690979004, -11.514827728271484, -8.517522811889648, -5.5202178955078125, -2.5229148864746094, 0.47439002990722656, 3.4716873168945312, 6.468991756439209, 9.466296195983887, 12.463600158691406, 15.460905075073242, 18.458209991455078, 21.45551300048828, 24.452817916870117, 27.450122833251953, 30.44742774963379, 33.444732666015625, 36.44203567504883, 39.43933868408203, 42.4366455078125, 45.4339485168457, 48.431251525878906, 51.428558349609375, 54.42586135864258, 57.42316818237305, 60.42047119140625, 63.41777801513672, 66.41508483886719, 69.41238403320312, 72.4096908569336, 75.40699768066406, 78.40430450439453, 81.40160369873047, 84.39891052246094, 87.3962173461914, 90.39352416992188, 93.39082336425781, 96.38813018798828, 99.38542938232422]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 10.0, 12.0, 14.0, 9.0, 13.0, 20.0, 25.0, 26.0, 25.0, 39.0, 36.0, 39.0, 42.0, 44.0, 50.0, 70.0, 50.0, 63.0, 68.0, 41.0, 44.0, 40.0, 38.0, 24.0, 28.0, 25.0, 30.0, 20.0, 16.0, 13.0, 9.0, 7.0, 2.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.645124435424805, -27.810861587524414, -26.976598739624023, -26.142335891723633, -25.308074951171875, -24.473812103271484, -23.639549255371094, -22.805286407470703, -21.971023559570312, -21.136760711669922, -20.30249786376953, -19.46823501586914, -18.63397216796875, -17.79970932006836, -16.9654483795166, -16.13118553161621, -15.29692268371582, -14.46265983581543, -13.628396987915039, -12.794135093688965, -11.959872245788574, -11.125609397888184, -10.29134750366211, -9.457084655761719, -8.622821807861328, -7.7885589599609375, -6.954296588897705, -6.120034217834473, -5.285771369934082, -4.451508522033691, -3.617246150970459, -2.7829837799072266, -1.9487190246582031, -1.1144564151763916, -0.2801938056945801, 0.5540688037872314, 1.388331413269043, 2.2225942611694336, 3.056856632232666, 3.8911190032958984, 4.725381851196289, 5.55964469909668, 6.393907070159912, 7.2281694412231445, 8.062432289123535, 8.896695137023926, 9.73095703125, 10.56521987915039, 11.399482727050781, 12.233745574951172, 13.068008422851562, 13.902270317077637, 14.736533164978027, 15.570796012878418, 16.405057907104492, 17.239320755004883, 18.073583602905273, 18.907846450805664, 19.742109298706055, 20.576372146606445, 21.410633087158203, 22.244895935058594, 23.079158782958984, 23.913421630859375, 24.747684478759766]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 5.0, 15.0, 17.0, 16.0, 25.0, 34.0, 56.0, 80.0, 113.0, 164.0, 232.0, 380.0, 573.0, 895.0, 1455.0, 2496.0, 4446.0, 8009.0, 15663.0, 30735.0, 64640.0, 134068.0, 237374.0, 251021.0, 149826.0, 72756.0, 35194.0, 17196.0, 9179.0, 4843.0, 2696.0, 1601.0, 948.0, 627.0, 366.0, 264.0, 190.0, 114.0, 73.0, 46.0, 29.0, 24.0, 19.0, 19.0, 12.0, 10.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-6.01953125, -5.82586669921875, -5.6322021484375, -5.43853759765625, -5.244873046875, -5.05120849609375, -4.8575439453125, -4.66387939453125, -4.47021484375, -4.27655029296875, -4.0828857421875, -3.88922119140625, -3.695556640625, -3.50189208984375, -3.3082275390625, -3.11456298828125, -2.9208984375, -2.72723388671875, -2.5335693359375, -2.33990478515625, -2.146240234375, -1.95257568359375, -1.7589111328125, -1.56524658203125, -1.37158203125, -1.17791748046875, -0.9842529296875, -0.79058837890625, -0.596923828125, -0.40325927734375, -0.2095947265625, -0.01593017578125, 0.177734375, 0.37139892578125, 0.5650634765625, 0.75872802734375, 0.952392578125, 1.14605712890625, 1.3397216796875, 1.53338623046875, 1.72705078125, 1.92071533203125, 2.1143798828125, 2.30804443359375, 2.501708984375, 2.69537353515625, 2.8890380859375, 3.08270263671875, 3.2763671875, 3.47003173828125, 3.6636962890625, 3.85736083984375, 4.051025390625, 4.24468994140625, 4.4383544921875, 4.63201904296875, 4.82568359375, 5.01934814453125, 5.2130126953125, 5.40667724609375, 5.600341796875, 5.79400634765625, 5.9876708984375, 6.18133544921875, 6.375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 7.0, 5.0, 5.0, 9.0, 6.0, 12.0, 16.0, 20.0, 20.0, 25.0, 26.0, 31.0, 18.0, 43.0, 39.0, 53.0, 54.0, 68.0, 43.0, 54.0, 52.0, 43.0, 44.0, 39.0, 40.0, 29.0, 39.0, 30.0, 25.0, 16.0, 22.0, 17.0, 14.0, 8.0, 7.0, 7.0, 10.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.03125, -2.939666748046875, -2.84808349609375, -2.756500244140625, -2.6649169921875, -2.573333740234375, -2.48175048828125, -2.390167236328125, -2.298583984375, -2.207000732421875, -2.11541748046875, -2.023834228515625, -1.9322509765625, -1.840667724609375, -1.74908447265625, -1.657501220703125, -1.56591796875, -1.474334716796875, -1.38275146484375, -1.291168212890625, -1.1995849609375, -1.108001708984375, -1.01641845703125, -0.924835205078125, -0.833251953125, -0.741668701171875, -0.65008544921875, -0.558502197265625, -0.4669189453125, -0.375335693359375, -0.28375244140625, -0.192169189453125, -0.1005859375, -0.009002685546875, 0.08258056640625, 0.174163818359375, 0.2657470703125, 0.357330322265625, 0.44891357421875, 0.540496826171875, 0.632080078125, 0.723663330078125, 0.81524658203125, 0.906829833984375, 0.9984130859375, 1.089996337890625, 1.18157958984375, 1.273162841796875, 1.36474609375, 1.456329345703125, 1.54791259765625, 1.639495849609375, 1.7310791015625, 1.822662353515625, 1.91424560546875, 2.005828857421875, 2.097412109375, 2.188995361328125, 2.28057861328125, 2.372161865234375, 2.4637451171875, 2.555328369140625, 2.64691162109375, 2.738494873046875, 2.830078125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 9.0, 10.0, 16.0, 15.0, 20.0, 35.0, 42.0, 70.0, 83.0, 115.0, 170.0, 244.0, 385.0, 630.0, 1211.0, 3057.0, 10374.0, 50702.0, 312763.0, 529581.0, 110466.0, 19570.0, 4958.0, 1785.0, 807.0, 451.0, 285.0, 203.0, 139.0, 93.0, 74.0, 56.0, 29.0, 29.0, 17.0, 17.0, 13.0, 4.0, 6.0, 4.0, 1.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8671875, -11.446533203125, -11.02587890625, -10.605224609375, -10.1845703125, -9.763916015625, -9.34326171875, -8.922607421875, -8.501953125, -8.081298828125, -7.66064453125, -7.239990234375, -6.8193359375, -6.398681640625, -5.97802734375, -5.557373046875, -5.13671875, -4.716064453125, -4.29541015625, -3.874755859375, -3.4541015625, -3.033447265625, -2.61279296875, -2.192138671875, -1.771484375, -1.350830078125, -0.93017578125, -0.509521484375, -0.0888671875, 0.331787109375, 0.75244140625, 1.173095703125, 1.59375, 2.014404296875, 2.43505859375, 2.855712890625, 3.2763671875, 3.697021484375, 4.11767578125, 4.538330078125, 4.958984375, 5.379638671875, 5.80029296875, 6.220947265625, 6.6416015625, 7.062255859375, 7.48291015625, 7.903564453125, 8.32421875, 8.744873046875, 9.16552734375, 9.586181640625, 10.0068359375, 10.427490234375, 10.84814453125, 11.268798828125, 11.689453125, 12.110107421875, 12.53076171875, 12.951416015625, 13.3720703125, 13.792724609375, 14.21337890625, 14.634033203125, 15.0546875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 2.0, 8.0, 4.0, 6.0, 3.0, 11.0, 13.0, 11.0, 17.0, 17.0, 27.0, 22.0, 30.0, 25.0, 38.0, 43.0, 32.0, 50.0, 43.0, 43.0, 44.0, 46.0, 56.0, 41.0, 58.0, 38.0, 34.0, 33.0, 39.0, 33.0, 21.0, 26.0, 11.0, 18.0, 6.0, 12.0, 7.0, 8.0, 4.0, 3.0, 1.0, 3.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0078125, -14.5040283203125, -14.000244140625, -13.4964599609375, -12.99267578125, -12.4888916015625, -11.985107421875, -11.4813232421875, -10.9775390625, -10.4737548828125, -9.969970703125, -9.4661865234375, -8.96240234375, -8.4586181640625, -7.954833984375, -7.4510498046875, -6.947265625, -6.4434814453125, -5.939697265625, -5.4359130859375, -4.93212890625, -4.4283447265625, -3.924560546875, -3.4207763671875, -2.9169921875, -2.4132080078125, -1.909423828125, -1.4056396484375, -0.90185546875, -0.3980712890625, 0.105712890625, 0.6094970703125, 1.11328125, 1.6170654296875, 2.120849609375, 2.6246337890625, 3.12841796875, 3.6322021484375, 4.135986328125, 4.6397705078125, 5.1435546875, 5.6473388671875, 6.151123046875, 6.6549072265625, 7.15869140625, 7.6624755859375, 8.166259765625, 8.6700439453125, 9.173828125, 9.6776123046875, 10.181396484375, 10.6851806640625, 11.18896484375, 11.6927490234375, 12.196533203125, 12.7003173828125, 13.2041015625, 13.7078857421875, 14.211669921875, 14.7154541015625, 15.21923828125, 15.7230224609375, 16.226806640625, 16.7305908203125, 17.234375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 7.0, 6.0, 3.0, 2.0, 7.0, 14.0, 22.0, 24.0, 55.0, 113.0, 168.0, 368.0, 961.0, 2359.0, 7394.0, 33033.0, 239687.0, 619509.0, 117705.0, 19219.0, 4954.0, 1664.0, 618.0, 326.0, 137.0, 87.0, 42.0, 27.0, 14.0, 13.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0390625, -6.799072265625, -6.55908203125, -6.319091796875, -6.0791015625, -5.839111328125, -5.59912109375, -5.359130859375, -5.119140625, -4.879150390625, -4.63916015625, -4.399169921875, -4.1591796875, -3.919189453125, -3.67919921875, -3.439208984375, -3.19921875, -2.959228515625, -2.71923828125, -2.479248046875, -2.2392578125, -1.999267578125, -1.75927734375, -1.519287109375, -1.279296875, -1.039306640625, -0.79931640625, -0.559326171875, -0.3193359375, -0.079345703125, 0.16064453125, 0.400634765625, 0.640625, 0.880615234375, 1.12060546875, 1.360595703125, 1.6005859375, 1.840576171875, 2.08056640625, 2.320556640625, 2.560546875, 2.800537109375, 3.04052734375, 3.280517578125, 3.5205078125, 3.760498046875, 4.00048828125, 4.240478515625, 4.48046875, 4.720458984375, 4.96044921875, 5.200439453125, 5.4404296875, 5.680419921875, 5.92041015625, 6.160400390625, 6.400390625, 6.640380859375, 6.88037109375, 7.120361328125, 7.3603515625, 7.600341796875, 7.84033203125, 8.080322265625, 8.3203125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 13.0, 28.0, 37.0, 56.0, 79.0, 123.0, 143.0, 154.0, 115.0, 78.0, 54.0, 39.0, 19.0, 17.0, 10.0, 9.0, 3.0, 2.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00157928466796875, -0.001536548137664795, -0.0014938116073608398, -0.0014510750770568848, -0.0014083385467529297, -0.0013656020164489746, -0.0013228654861450195, -0.0012801289558410645, -0.0012373924255371094, -0.0011946558952331543, -0.0011519193649291992, -0.0011091828346252441, -0.001066446304321289, -0.001023709774017334, -0.000980973243713379, -0.0009382367134094238, -0.0008955001831054688, -0.0008527636528015137, -0.0008100271224975586, -0.0007672905921936035, -0.0007245540618896484, -0.0006818175315856934, -0.0006390810012817383, -0.0005963444709777832, -0.0005536079406738281, -0.000510871410369873, -0.00046813488006591797, -0.0004253983497619629, -0.0003826618194580078, -0.00033992528915405273, -0.00029718875885009766, -0.0002544522285461426, -0.0002117156982421875, -0.00016897916793823242, -0.00012624263763427734, -8.350610733032227e-05, -4.076957702636719e-05, 1.9669532775878906e-06, 4.470348358154297e-05, 8.744001388549805e-05, 0.00013017654418945312, 0.0001729130744934082, 0.00021564960479736328, 0.00025838613510131836, 0.00030112266540527344, 0.0003438591957092285, 0.0003865957260131836, 0.00042933225631713867, 0.00047206878662109375, 0.0005148053169250488, 0.0005575418472290039, 0.000600278377532959, 0.0006430149078369141, 0.0006857514381408691, 0.0007284879684448242, 0.0007712244987487793, 0.0008139610290527344, 0.0008566975593566895, 0.0008994340896606445, 0.0009421706199645996, 0.0009849071502685547, 0.0010276436805725098, 0.0010703802108764648, 0.00111311674118042, 0.001155853271484375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 5.0, 4.0, 9.0, 14.0, 14.0, 21.0, 28.0, 37.0, 84.0, 130.0, 203.0, 312.0, 630.0, 1363.0, 3939.0, 15190.0, 95454.0, 609255.0, 275135.0, 35191.0, 7139.0, 2253.0, 937.0, 488.0, 283.0, 154.0, 88.0, 55.0, 36.0, 28.0, 20.0, 11.0, 14.0, 6.0, 6.0, 7.0, 0.0, 2.0, 0.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.7734375, -8.52093505859375, -8.2684326171875, -8.01593017578125, -7.763427734375, -7.51092529296875, -7.2584228515625, -7.00592041015625, -6.75341796875, -6.50091552734375, -6.2484130859375, -5.99591064453125, -5.743408203125, -5.49090576171875, -5.2384033203125, -4.98590087890625, -4.7333984375, -4.48089599609375, -4.2283935546875, -3.97589111328125, -3.723388671875, -3.47088623046875, -3.2183837890625, -2.96588134765625, -2.71337890625, -2.46087646484375, -2.2083740234375, -1.95587158203125, -1.703369140625, -1.45086669921875, -1.1983642578125, -0.94586181640625, -0.693359375, -0.44085693359375, -0.1883544921875, 0.06414794921875, 0.316650390625, 0.56915283203125, 0.8216552734375, 1.07415771484375, 1.32666015625, 1.57916259765625, 1.8316650390625, 2.08416748046875, 2.336669921875, 2.58917236328125, 2.8416748046875, 3.09417724609375, 3.3466796875, 3.59918212890625, 3.8516845703125, 4.10418701171875, 4.356689453125, 4.60919189453125, 4.8616943359375, 5.11419677734375, 5.36669921875, 5.61920166015625, 5.8717041015625, 6.12420654296875, 6.376708984375, 6.62921142578125, 6.8817138671875, 7.13421630859375, 7.38671875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 11.0, 7.0, 10.0, 11.0, 15.0, 25.0, 29.0, 32.0, 48.0, 70.0, 93.0, 110.0, 101.0, 103.0, 89.0, 63.0, 54.0, 38.0, 36.0, 16.0, 13.0, 9.0, 7.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.7109375, -9.4505615234375, -9.190185546875, -8.9298095703125, -8.66943359375, -8.4090576171875, -8.148681640625, -7.8883056640625, -7.6279296875, -7.3675537109375, -7.107177734375, -6.8468017578125, -6.58642578125, -6.3260498046875, -6.065673828125, -5.8052978515625, -5.544921875, -5.2845458984375, -5.024169921875, -4.7637939453125, -4.50341796875, -4.2430419921875, -3.982666015625, -3.7222900390625, -3.4619140625, -3.2015380859375, -2.941162109375, -2.6807861328125, -2.42041015625, -2.1600341796875, -1.899658203125, -1.6392822265625, -1.37890625, -1.1185302734375, -0.858154296875, -0.5977783203125, -0.33740234375, -0.0770263671875, 0.183349609375, 0.4437255859375, 0.7041015625, 0.9644775390625, 1.224853515625, 1.4852294921875, 1.74560546875, 2.0059814453125, 2.266357421875, 2.5267333984375, 2.787109375, 3.0474853515625, 3.307861328125, 3.5682373046875, 3.82861328125, 4.0889892578125, 4.349365234375, 4.6097412109375, 4.8701171875, 5.1304931640625, 5.390869140625, 5.6512451171875, 5.91162109375, 6.1719970703125, 6.432373046875, 6.6927490234375, 6.953125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 17.0, 58.0, 261.0, 450.0, 178.0, 25.0, 7.0, 5.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-230.19296264648438, -221.15652465820312, -212.12010192871094, -203.08367919921875, -194.0472412109375, -185.01080322265625, -175.97438049316406, -166.93795776367188, -157.90151977539062, -148.86508178710938, -139.8286590576172, -130.792236328125, -121.75579833984375, -112.71936798095703, -103.68293762207031, -94.6465072631836, -85.61007690429688, -76.57364654541016, -67.53721618652344, -58.50078582763672, -49.46435546875, -40.42792510986328, -31.391494750976562, -22.355064392089844, -13.318634033203125, -4.282203674316406, 4.7542266845703125, 13.790657043457031, 22.82708740234375, 31.86351776123047, 40.89994812011719, 49.936378479003906, 58.9727783203125, 68.00920867919922, 77.04563903808594, 86.08206939697266, 95.11849975585938, 104.1549301147461, 113.19136047363281, 122.22779083251953, 131.26422119140625, 140.3006591796875, 149.3370819091797, 158.37350463867188, 167.40994262695312, 176.44638061523438, 185.48280334472656, 194.51922607421875, 203.5556640625, 212.59210205078125, 221.62852478027344, 230.66494750976562, 239.70138549804688, 248.73782348632812, 257.77423095703125, 266.8106689453125, 275.84710693359375, 284.883544921875, 293.91998291015625, 302.9563903808594, 311.9928283691406, 321.0292663574219, 330.065673828125, 339.10211181640625, 348.1385498046875]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 6.0, 2.0, 2.0, 4.0, 4.0, 8.0, 1.0, 2.0, 0.0, 8.0, 8.0, 12.0, 3.0, 18.0, 12.0, 17.0, 29.0, 24.0, 21.0, 32.0, 40.0, 33.0, 30.0, 41.0, 46.0, 40.0, 34.0, 47.0, 38.0, 40.0, 44.0, 42.0, 43.0, 37.0, 26.0, 29.0, 32.0, 13.0, 17.0, 25.0, 16.0, 16.0, 14.0, 8.0, 10.0, 9.0, 7.0, 7.0, 5.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-72.11553955078125, -69.69876098632812, -67.281982421875, -64.86519622802734, -62.44841766357422, -60.031639099121094, -57.6148567199707, -55.19807434082031, -52.78129577636719, -50.36451721191406, -47.94773483276367, -45.53095245361328, -43.114173889160156, -40.69739532470703, -38.28061294555664, -35.86383056640625, -33.447052001953125, -31.030271530151367, -28.61349105834961, -26.19671058654785, -23.779930114746094, -21.363149642944336, -18.946369171142578, -16.52958869934082, -14.112808227539062, -11.696027755737305, -9.279247283935547, -6.862466812133789, -4.445686340332031, -2.0289058685302734, 0.3878746032714844, 2.804655075073242, 5.221443176269531, 7.638223648071289, 10.055004119873047, 12.471784591674805, 14.888565063476562, 17.30534553527832, 19.722126007080078, 22.138906478881836, 24.555686950683594, 26.97246742248535, 29.38924789428711, 31.806028366088867, 34.222808837890625, 36.63958740234375, 39.05636978149414, 41.47315216064453, 43.889930725097656, 46.30670928955078, 48.72349166870117, 51.14027404785156, 53.55705261230469, 55.97383117675781, 58.3906135559082, 60.807395935058594, 63.22417449951172, 65.64095306396484, 68.0577392578125, 70.47451782226562, 72.89129638671875, 75.30807495117188, 77.724853515625, 80.14163970947266, 82.55841827392578]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 6.0, 3.0, 3.0, 2.0, 8.0, 14.0, 10.0, 14.0, 15.0, 20.0, 39.0, 44.0, 57.0, 85.0, 95.0, 153.0, 244.0, 358.0, 660.0, 1278.0, 2838.0, 8025.0, 35370.0, 3910807.0, 204106.0, 19816.0, 5554.0, 2151.0, 1033.0, 505.0, 297.0, 168.0, 126.0, 93.0, 65.0, 59.0, 41.0, 36.0, 22.0, 15.0, 18.0, 14.0, 3.0, 8.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-16.25, -15.7965087890625, -15.343017578125, -14.8895263671875, -14.43603515625, -13.9825439453125, -13.529052734375, -13.0755615234375, -12.6220703125, -12.1685791015625, -11.715087890625, -11.2615966796875, -10.80810546875, -10.3546142578125, -9.901123046875, -9.4476318359375, -8.994140625, -8.5406494140625, -8.087158203125, -7.6336669921875, -7.18017578125, -6.7266845703125, -6.273193359375, -5.8197021484375, -5.3662109375, -4.9127197265625, -4.459228515625, -4.0057373046875, -3.55224609375, -3.0987548828125, -2.645263671875, -2.1917724609375, -1.73828125, -1.2847900390625, -0.831298828125, -0.3778076171875, 0.07568359375, 0.5291748046875, 0.982666015625, 1.4361572265625, 1.8896484375, 2.3431396484375, 2.796630859375, 3.2501220703125, 3.70361328125, 4.1571044921875, 4.610595703125, 5.0640869140625, 5.517578125, 5.9710693359375, 6.424560546875, 6.8780517578125, 7.33154296875, 7.7850341796875, 8.238525390625, 8.6920166015625, 9.1455078125, 9.5989990234375, 10.052490234375, 10.5059814453125, 10.95947265625, 11.4129638671875, 11.866455078125, 12.3199462890625, 12.7734375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 9.0, 7.0, 8.0, 16.0, 11.0, 16.0, 17.0, 18.0, 33.0, 43.0, 26.0, 37.0, 53.0, 47.0, 60.0, 65.0, 59.0, 57.0, 59.0, 50.0, 45.0, 41.0, 48.0, 40.0, 31.0, 24.0, 24.0, 11.0, 12.0, 7.0, 3.0, 9.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.78515625, -4.64996337890625, -4.5147705078125, -4.37957763671875, -4.244384765625, -4.10919189453125, -3.9739990234375, -3.83880615234375, -3.70361328125, -3.56842041015625, -3.4332275390625, -3.29803466796875, -3.162841796875, -3.02764892578125, -2.8924560546875, -2.75726318359375, -2.6220703125, -2.48687744140625, -2.3516845703125, -2.21649169921875, -2.081298828125, -1.94610595703125, -1.8109130859375, -1.67572021484375, -1.54052734375, -1.40533447265625, -1.2701416015625, -1.13494873046875, -0.999755859375, -0.86456298828125, -0.7293701171875, -0.59417724609375, -0.458984375, -0.32379150390625, -0.1885986328125, -0.05340576171875, 0.081787109375, 0.21697998046875, 0.3521728515625, 0.48736572265625, 0.62255859375, 0.75775146484375, 0.8929443359375, 1.02813720703125, 1.163330078125, 1.29852294921875, 1.4337158203125, 1.56890869140625, 1.7041015625, 1.83929443359375, 1.9744873046875, 2.10968017578125, 2.244873046875, 2.38006591796875, 2.5152587890625, 2.65045166015625, 2.78564453125, 2.92083740234375, 3.0560302734375, 3.19122314453125, 3.326416015625, 3.46160888671875, 3.5968017578125, 3.73199462890625, 3.8671875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 13.0, 12.0, 16.0, 16.0, 30.0, 36.0, 60.0, 68.0, 147.0, 236.0, 378.0, 646.0, 1187.0, 3280.0, 14262.0, 197595.0, 3940452.0, 27256.0, 5040.0, 1619.0, 807.0, 425.0, 228.0, 154.0, 95.0, 59.0, 57.0, 32.0, 27.0, 14.0, 11.0, 7.0, 4.0, 9.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.5, -19.9896240234375, -19.479248046875, -18.9688720703125, -18.45849609375, -17.9481201171875, -17.437744140625, -16.9273681640625, -16.4169921875, -15.9066162109375, -15.396240234375, -14.8858642578125, -14.37548828125, -13.8651123046875, -13.354736328125, -12.8443603515625, -12.333984375, -11.8236083984375, -11.313232421875, -10.8028564453125, -10.29248046875, -9.7821044921875, -9.271728515625, -8.7613525390625, -8.2509765625, -7.7406005859375, -7.230224609375, -6.7198486328125, -6.20947265625, -5.6990966796875, -5.188720703125, -4.6783447265625, -4.16796875, -3.6575927734375, -3.147216796875, -2.6368408203125, -2.12646484375, -1.6160888671875, -1.105712890625, -0.5953369140625, -0.0849609375, 0.4254150390625, 0.935791015625, 1.4461669921875, 1.95654296875, 2.4669189453125, 2.977294921875, 3.4876708984375, 3.998046875, 4.5084228515625, 5.018798828125, 5.5291748046875, 6.03955078125, 6.5499267578125, 7.060302734375, 7.5706787109375, 8.0810546875, 8.5914306640625, 9.101806640625, 9.6121826171875, 10.12255859375, 10.6329345703125, 11.143310546875, 11.6536865234375, 12.1640625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 8.0, 18.0, 36.0, 74.0, 2950.0, 818.0, 91.0, 32.0, 16.0, 13.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2890625, -4.1549072265625, -4.020751953125, -3.8865966796875, -3.75244140625, -3.6182861328125, -3.484130859375, -3.3499755859375, -3.2158203125, -3.0816650390625, -2.947509765625, -2.8133544921875, -2.67919921875, -2.5450439453125, -2.410888671875, -2.2767333984375, -2.142578125, -2.0084228515625, -1.874267578125, -1.7401123046875, -1.60595703125, -1.4718017578125, -1.337646484375, -1.2034912109375, -1.0693359375, -0.9351806640625, -0.801025390625, -0.6668701171875, -0.53271484375, -0.3985595703125, -0.264404296875, -0.1302490234375, 0.00390625, 0.1380615234375, 0.272216796875, 0.4063720703125, 0.54052734375, 0.6746826171875, 0.808837890625, 0.9429931640625, 1.0771484375, 1.2113037109375, 1.345458984375, 1.4796142578125, 1.61376953125, 1.7479248046875, 1.882080078125, 2.0162353515625, 2.150390625, 2.2845458984375, 2.418701171875, 2.5528564453125, 2.68701171875, 2.8211669921875, 2.955322265625, 3.0894775390625, 3.2236328125, 3.3577880859375, 3.491943359375, 3.6260986328125, 3.76025390625, 3.8944091796875, 4.028564453125, 4.1627197265625, 4.296875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 14.0, 17.0, 26.0, 74.0, 161.0, 237.0, 222.0, 147.0, 55.0, 27.0, 10.0, 5.0, 1.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.77552318572998, -8.255213737487793, -7.734903335571289, -7.214593887329102, -6.694283962249756, -6.17397403717041, -5.653664588928223, -5.133354663848877, -4.613044738769531, -4.0927348136901855, -3.572425127029419, -3.0521154403686523, -2.5318055152893066, -2.011495590209961, -1.4911859035491943, -0.9708762168884277, -0.45056629180908203, 0.06974351406097412, 0.5900533199310303, 1.1103631258010864, 1.6306729316711426, 2.1509828567504883, 2.671292543411255, 3.1916022300720215, 3.711912155151367, 4.232222080230713, 4.752532005310059, 5.272841453552246, 5.793151378631592, 6.3134613037109375, 6.833770751953125, 7.354080677032471, 7.874391555786133, 8.39470100402832, 8.915011405944824, 9.435320854187012, 9.955631256103516, 10.475940704345703, 10.99625015258789, 11.516559600830078, 12.036870002746582, 12.55717945098877, 13.077489852905273, 13.597799301147461, 14.118108749389648, 14.638419151306152, 15.15872859954834, 15.679039001464844, 16.19934844970703, 16.71965789794922, 17.239967346191406, 17.760278701782227, 18.280588150024414, 18.8008975982666, 19.32120704650879, 19.841516494750977, 20.361827850341797, 20.882137298583984, 21.402446746826172, 21.922758102416992, 22.44306755065918, 22.963376998901367, 23.483686447143555, 24.003995895385742, 24.52430534362793]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 3.0, 13.0, 10.0, 6.0, 11.0, 15.0, 15.0, 22.0, 15.0, 25.0, 19.0, 25.0, 25.0, 23.0, 27.0, 32.0, 31.0, 38.0, 38.0, 47.0, 34.0, 40.0, 41.0, 43.0, 40.0, 46.0, 40.0, 35.0, 24.0, 33.0, 24.0, 23.0, 25.0, 13.0, 20.0, 6.0, 11.0, 13.0, 15.0, 8.0, 1.0, 8.0, 1.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.721169948577881, -4.57758092880249, -4.433992385864258, -4.290403366088867, -4.146814346313477, -4.003225326538086, -3.8596365451812744, -3.716047763824463, -3.5724587440490723, -3.4288697242736816, -3.28528094291687, -3.1416921615600586, -2.998103141784668, -2.8545141220092773, -2.710925340652466, -2.5673365592956543, -2.4237475395202637, -2.280158519744873, -2.1365697383880615, -1.9929808378219604, -1.8493919372558594, -1.7058030366897583, -1.5622141361236572, -1.4186252355575562, -1.275036334991455, -1.131447434425354, -0.9878585338592529, -0.8442696332931519, -0.7006807327270508, -0.5570918321609497, -0.41350293159484863, -0.26991403102874756, -0.12632513046264648, 0.01726377010345459, 0.16085267066955566, 0.30444157123565674, 0.4480304718017578, 0.5916193723678589, 0.73520827293396, 0.878797173500061, 1.022386074066162, 1.1659749746322632, 1.3095638751983643, 1.4531527757644653, 1.5967416763305664, 1.7403305768966675, 1.8839194774627686, 2.02750825881958, 2.1710972785949707, 2.3146862983703613, 2.458275079727173, 2.6018638610839844, 2.745452880859375, 2.8890419006347656, 3.032630681991577, 3.1762194633483887, 3.3198084831237793, 3.46339750289917, 3.6069862842559814, 3.750575065612793, 3.8941640853881836, 4.037753105163574, 4.181342124938965, 4.324930667877197, 4.468519687652588]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 3.0, 3.0, 20.0, 13.0, 18.0, 27.0, 45.0, 59.0, 92.0, 160.0, 302.0, 655.0, 1650.0, 4961.0, 16905.0, 68960.0, 284022.0, 458565.0, 159725.0, 37518.0, 9730.0, 2933.0, 1136.0, 443.0, 235.0, 133.0, 66.0, 50.0, 35.0, 29.0, 16.0, 15.0, 5.0, 4.0, 3.0, 2.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.2890625, -11.9407958984375, -11.592529296875, -11.2442626953125, -10.89599609375, -10.5477294921875, -10.199462890625, -9.8511962890625, -9.5029296875, -9.1546630859375, -8.806396484375, -8.4581298828125, -8.10986328125, -7.7615966796875, -7.413330078125, -7.0650634765625, -6.716796875, -6.3685302734375, -6.020263671875, -5.6719970703125, -5.32373046875, -4.9754638671875, -4.627197265625, -4.2789306640625, -3.9306640625, -3.5823974609375, -3.234130859375, -2.8858642578125, -2.53759765625, -2.1893310546875, -1.841064453125, -1.4927978515625, -1.14453125, -0.7962646484375, -0.447998046875, -0.0997314453125, 0.24853515625, 0.5968017578125, 0.945068359375, 1.2933349609375, 1.6416015625, 1.9898681640625, 2.338134765625, 2.6864013671875, 3.03466796875, 3.3829345703125, 3.731201171875, 4.0794677734375, 4.427734375, 4.7760009765625, 5.124267578125, 5.4725341796875, 5.82080078125, 6.1690673828125, 6.517333984375, 6.8656005859375, 7.2138671875, 7.5621337890625, 7.910400390625, 8.2586669921875, 8.60693359375, 8.9552001953125, 9.303466796875, 9.6517333984375, 10.0]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 5.0, 8.0, 11.0, 10.0, 14.0, 20.0, 17.0, 36.0, 26.0, 38.0, 33.0, 45.0, 48.0, 50.0, 66.0, 63.0, 56.0, 61.0, 59.0, 58.0, 41.0, 48.0, 34.0, 34.0, 28.0, 23.0, 16.0, 15.0, 11.0, 9.0, 6.0, 3.0, 3.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.92578125, -4.78485107421875, -4.6439208984375, -4.50299072265625, -4.362060546875, -4.22113037109375, -4.0802001953125, -3.93927001953125, -3.79833984375, -3.65740966796875, -3.5164794921875, -3.37554931640625, -3.234619140625, -3.09368896484375, -2.9527587890625, -2.81182861328125, -2.6708984375, -2.52996826171875, -2.3890380859375, -2.24810791015625, -2.107177734375, -1.96624755859375, -1.8253173828125, -1.68438720703125, -1.54345703125, -1.40252685546875, -1.2615966796875, -1.12066650390625, -0.979736328125, -0.83880615234375, -0.6978759765625, -0.55694580078125, -0.416015625, -0.27508544921875, -0.1341552734375, 0.00677490234375, 0.147705078125, 0.28863525390625, 0.4295654296875, 0.57049560546875, 0.71142578125, 0.85235595703125, 0.9932861328125, 1.13421630859375, 1.275146484375, 1.41607666015625, 1.5570068359375, 1.69793701171875, 1.8388671875, 1.97979736328125, 2.1207275390625, 2.26165771484375, 2.402587890625, 2.54351806640625, 2.6844482421875, 2.82537841796875, 2.96630859375, 3.10723876953125, 3.2481689453125, 3.38909912109375, 3.530029296875, 3.67095947265625, 3.8118896484375, 3.95281982421875, 4.09375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 3.0, 5.0, 3.0, 7.0, 9.0, 9.0, 17.0, 21.0, 26.0, 39.0, 38.0, 67.0, 103.0, 121.0, 171.0, 253.0, 330.0, 499.0, 906.0, 1872.0, 5406.0, 26603.0, 211315.0, 659698.0, 116835.0, 16498.0, 3924.0, 1450.0, 758.0, 461.0, 314.0, 214.0, 174.0, 97.0, 80.0, 63.0, 45.0, 33.0, 19.0, 30.0, 11.0, 10.0, 5.0, 4.0, 7.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.578125, -13.11572265625, -12.6533203125, -12.19091796875, -11.728515625, -11.26611328125, -10.8037109375, -10.34130859375, -9.87890625, -9.41650390625, -8.9541015625, -8.49169921875, -8.029296875, -7.56689453125, -7.1044921875, -6.64208984375, -6.1796875, -5.71728515625, -5.2548828125, -4.79248046875, -4.330078125, -3.86767578125, -3.4052734375, -2.94287109375, -2.48046875, -2.01806640625, -1.5556640625, -1.09326171875, -0.630859375, -0.16845703125, 0.2939453125, 0.75634765625, 1.21875, 1.68115234375, 2.1435546875, 2.60595703125, 3.068359375, 3.53076171875, 3.9931640625, 4.45556640625, 4.91796875, 5.38037109375, 5.8427734375, 6.30517578125, 6.767578125, 7.22998046875, 7.6923828125, 8.15478515625, 8.6171875, 9.07958984375, 9.5419921875, 10.00439453125, 10.466796875, 10.92919921875, 11.3916015625, 11.85400390625, 12.31640625, 12.77880859375, 13.2412109375, 13.70361328125, 14.166015625, 14.62841796875, 15.0908203125, 15.55322265625, 16.015625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 7.0, 6.0, 8.0, 6.0, 12.0, 12.0, 14.0, 23.0, 22.0, 24.0, 39.0, 38.0, 43.0, 53.0, 50.0, 50.0, 43.0, 55.0, 62.0, 56.0, 50.0, 40.0, 48.0, 36.0, 40.0, 29.0, 26.0, 30.0, 20.0, 12.0, 11.0, 13.0, 9.0, 7.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.75, -20.029541015625, -19.30908203125, -18.588623046875, -17.8681640625, -17.147705078125, -16.42724609375, -15.706787109375, -14.986328125, -14.265869140625, -13.54541015625, -12.824951171875, -12.1044921875, -11.384033203125, -10.66357421875, -9.943115234375, -9.22265625, -8.502197265625, -7.78173828125, -7.061279296875, -6.3408203125, -5.620361328125, -4.89990234375, -4.179443359375, -3.458984375, -2.738525390625, -2.01806640625, -1.297607421875, -0.5771484375, 0.143310546875, 0.86376953125, 1.584228515625, 2.3046875, 3.025146484375, 3.74560546875, 4.466064453125, 5.1865234375, 5.906982421875, 6.62744140625, 7.347900390625, 8.068359375, 8.788818359375, 9.50927734375, 10.229736328125, 10.9501953125, 11.670654296875, 12.39111328125, 13.111572265625, 13.83203125, 14.552490234375, 15.27294921875, 15.993408203125, 16.7138671875, 17.434326171875, 18.15478515625, 18.875244140625, 19.595703125, 20.316162109375, 21.03662109375, 21.757080078125, 22.4775390625, 23.197998046875, 23.91845703125, 24.638916015625, 25.359375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 2.0, 5.0, 11.0, 22.0, 20.0, 35.0, 49.0, 100.0, 145.0, 249.0, 642.0, 1487.0, 5138.0, 25755.0, 223095.0, 666383.0, 105531.0, 14450.0, 3315.0, 1121.0, 445.0, 222.0, 122.0, 66.0, 43.0, 25.0, 20.0, 16.0, 11.0, 7.0, 8.0, 8.0, 6.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-7.96875, -7.76617431640625, -7.5635986328125, -7.36102294921875, -7.158447265625, -6.95587158203125, -6.7532958984375, -6.55072021484375, -6.34814453125, -6.14556884765625, -5.9429931640625, -5.74041748046875, -5.537841796875, -5.33526611328125, -5.1326904296875, -4.93011474609375, -4.7275390625, -4.52496337890625, -4.3223876953125, -4.11981201171875, -3.917236328125, -3.71466064453125, -3.5120849609375, -3.30950927734375, -3.10693359375, -2.90435791015625, -2.7017822265625, -2.49920654296875, -2.296630859375, -2.09405517578125, -1.8914794921875, -1.68890380859375, -1.486328125, -1.28375244140625, -1.0811767578125, -0.87860107421875, -0.676025390625, -0.47344970703125, -0.2708740234375, -0.06829833984375, 0.13427734375, 0.33685302734375, 0.5394287109375, 0.74200439453125, 0.944580078125, 1.14715576171875, 1.3497314453125, 1.55230712890625, 1.7548828125, 1.95745849609375, 2.1600341796875, 2.36260986328125, 2.565185546875, 2.76776123046875, 2.9703369140625, 3.17291259765625, 3.37548828125, 3.57806396484375, 3.7806396484375, 3.98321533203125, 4.185791015625, 4.38836669921875, 4.5909423828125, 4.79351806640625, 4.99609375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 10.0, 16.0, 28.0, 20.0, 43.0, 53.0, 68.0, 68.0, 86.0, 107.0, 98.0, 96.0, 67.0, 54.0, 49.0, 32.0, 18.0, 14.0, 14.0, 12.0, 9.0, 8.0, 8.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006771087646484375, -0.000655055046081543, -0.0006330013275146484, -0.0006109476089477539, -0.0005888938903808594, -0.0005668401718139648, -0.0005447864532470703, -0.0005227327346801758, -0.0005006790161132812, -0.0004786252975463867, -0.0004565715789794922, -0.00043451786041259766, -0.0004124641418457031, -0.0003904104232788086, -0.00036835670471191406, -0.00034630298614501953, -0.000324249267578125, -0.00030219554901123047, -0.00028014183044433594, -0.0002580881118774414, -0.00023603439331054688, -0.00021398067474365234, -0.0001919269561767578, -0.00016987323760986328, -0.00014781951904296875, -0.00012576580047607422, -0.00010371208190917969, -8.165836334228516e-05, -5.9604644775390625e-05, -3.7550926208496094e-05, -1.5497207641601562e-05, 6.556510925292969e-06, 2.86102294921875e-05, 5.066394805908203e-05, 7.271766662597656e-05, 9.47713851928711e-05, 0.00011682510375976562, 0.00013887882232666016, 0.0001609325408935547, 0.00018298625946044922, 0.00020503997802734375, 0.00022709369659423828, 0.0002491474151611328, 0.00027120113372802734, 0.0002932548522949219, 0.0003153085708618164, 0.00033736228942871094, 0.00035941600799560547, 0.0003814697265625, 0.00040352344512939453, 0.00042557716369628906, 0.0004476308822631836, 0.0004696846008300781, 0.0004917383193969727, 0.0005137920379638672, 0.0005358457565307617, 0.0005578994750976562, 0.0005799531936645508, 0.0006020069122314453, 0.0006240606307983398, 0.0006461143493652344, 0.0006681680679321289, 0.0006902217864990234, 0.000712275505065918, 0.0007343292236328125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 3.0, 11.0, 7.0, 14.0, 16.0, 19.0, 35.0, 56.0, 88.0, 132.0, 228.0, 418.0, 838.0, 2013.0, 6694.0, 42405.0, 460080.0, 479923.0, 44547.0, 7004.0, 2075.0, 891.0, 451.0, 247.0, 123.0, 75.0, 51.0, 30.0, 21.0, 15.0, 9.0, 12.0, 6.0, 6.0, 2.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.15234375, -6.9356689453125, -6.718994140625, -6.5023193359375, -6.28564453125, -6.0689697265625, -5.852294921875, -5.6356201171875, -5.4189453125, -5.2022705078125, -4.985595703125, -4.7689208984375, -4.55224609375, -4.3355712890625, -4.118896484375, -3.9022216796875, -3.685546875, -3.4688720703125, -3.252197265625, -3.0355224609375, -2.81884765625, -2.6021728515625, -2.385498046875, -2.1688232421875, -1.9521484375, -1.7354736328125, -1.518798828125, -1.3021240234375, -1.08544921875, -0.8687744140625, -0.652099609375, -0.4354248046875, -0.21875, -0.0020751953125, 0.214599609375, 0.4312744140625, 0.64794921875, 0.8646240234375, 1.081298828125, 1.2979736328125, 1.5146484375, 1.7313232421875, 1.947998046875, 2.1646728515625, 2.38134765625, 2.5980224609375, 2.814697265625, 3.0313720703125, 3.248046875, 3.4647216796875, 3.681396484375, 3.8980712890625, 4.11474609375, 4.3314208984375, 4.548095703125, 4.7647705078125, 4.9814453125, 5.1981201171875, 5.414794921875, 5.6314697265625, 5.84814453125, 6.0648193359375, 6.281494140625, 6.4981689453125, 6.71484375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 7.0, 12.0, 15.0, 20.0, 28.0, 35.0, 63.0, 75.0, 107.0, 121.0, 123.0, 109.0, 86.0, 65.0, 46.0, 37.0, 20.0, 18.0, 10.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.44140625, -6.16302490234375, -5.8846435546875, -5.60626220703125, -5.327880859375, -5.04949951171875, -4.7711181640625, -4.49273681640625, -4.21435546875, -3.93597412109375, -3.6575927734375, -3.37921142578125, -3.100830078125, -2.82244873046875, -2.5440673828125, -2.26568603515625, -1.9873046875, -1.70892333984375, -1.4305419921875, -1.15216064453125, -0.873779296875, -0.59539794921875, -0.3170166015625, -0.03863525390625, 0.23974609375, 0.51812744140625, 0.7965087890625, 1.07489013671875, 1.353271484375, 1.63165283203125, 1.9100341796875, 2.18841552734375, 2.466796875, 2.74517822265625, 3.0235595703125, 3.30194091796875, 3.580322265625, 3.85870361328125, 4.1370849609375, 4.41546630859375, 4.69384765625, 4.97222900390625, 5.2506103515625, 5.52899169921875, 5.807373046875, 6.08575439453125, 6.3641357421875, 6.64251708984375, 6.9208984375, 7.19927978515625, 7.4776611328125, 7.75604248046875, 8.034423828125, 8.31280517578125, 8.5911865234375, 8.86956787109375, 9.14794921875, 9.42633056640625, 9.7047119140625, 9.98309326171875, 10.261474609375, 10.53985595703125, 10.8182373046875, 11.09661865234375, 11.375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 9.0, 29.0, 55.0, 146.0, 262.0, 282.0, 147.0, 48.0, 22.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.33538055419922, -60.4007568359375, -54.46613311767578, -48.53150939941406, -42.596885681152344, -36.662261962890625, -30.727638244628906, -24.793014526367188, -18.85839080810547, -12.92376708984375, -6.989143371582031, -1.0545196533203125, 4.880104064941406, 10.814727783203125, 16.749351501464844, 22.683975219726562, 28.61859893798828, 34.55322265625, 40.48784637451172, 46.42247009277344, 52.357093811035156, 58.291717529296875, 64.2263412475586, 70.16096496582031, 76.09558868408203, 82.03021240234375, 87.96483612060547, 93.89945983886719, 99.8340835571289, 105.76870727539062, 111.70333099365234, 117.63795471191406, 123.57257080078125, 129.5072021484375, 135.4418182373047, 141.37643432617188, 147.31106567382812, 153.24569702148438, 159.18031311035156, 165.11492919921875, 171.049560546875, 176.98419189453125, 182.91880798339844, 188.85342407226562, 194.78805541992188, 200.72268676757812, 206.6573028564453, 212.5919189453125, 218.52655029296875, 224.461181640625, 230.3957977294922, 236.33041381835938, 242.26504516601562, 248.19967651367188, 254.13429260253906, 260.06890869140625, 266.0035400390625, 271.93817138671875, 277.872802734375, 283.8074035644531, 289.7420349121094, 295.6766662597656, 301.61126708984375, 307.5458984375, 313.48052978515625]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 7.0, 6.0, 8.0, 5.0, 13.0, 7.0, 12.0, 15.0, 27.0, 17.0, 29.0, 40.0, 24.0, 36.0, 40.0, 40.0, 45.0, 49.0, 60.0, 55.0, 44.0, 53.0, 46.0, 39.0, 45.0, 23.0, 40.0, 28.0, 26.0, 25.0, 15.0, 17.0, 11.0, 12.0, 5.0, 7.0, 5.0, 10.0, 5.0, 3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-74.71615600585938, -71.97296905517578, -69.22978973388672, -66.48660278320312, -63.74342346191406, -61.00023651123047, -58.25705337524414, -55.51387023925781, -52.770687103271484, -50.027503967285156, -47.28432083129883, -44.5411376953125, -41.797950744628906, -39.054771423339844, -36.31158447265625, -33.56840133666992, -30.825218200683594, -28.082035064697266, -25.338851928710938, -22.595666885375977, -19.85248374938965, -17.10930061340332, -14.36611557006836, -11.622932434082031, -8.879749298095703, -6.136565685272217, -3.3933820724487305, -0.6501979827880859, 2.092985153198242, 4.83616828918457, 7.579353332519531, 10.32253646850586, 13.065719604492188, 15.808902740478516, 18.552085876464844, 21.295270919799805, 24.038454055786133, 26.78163719177246, 29.524822235107422, 32.26800537109375, 35.01118850708008, 37.754371643066406, 40.497554779052734, 43.24073791503906, 45.983924865722656, 48.72710418701172, 51.47029113769531, 54.21347427368164, 56.95665740966797, 59.6998405456543, 62.443023681640625, 65.18621063232422, 67.92938995361328, 70.67257690429688, 73.41575622558594, 76.15894317626953, 78.90213012695312, 81.64531707763672, 84.38849639892578, 87.13168334960938, 89.87486267089844, 92.61804962158203, 95.36123657226562, 98.10441589355469, 100.84759521484375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 11.0, 7.0, 9.0, 12.0, 19.0, 21.0, 31.0, 45.0, 74.0, 107.0, 169.0, 245.0, 388.0, 653.0, 1217.0, 2262.0, 4828.0, 12191.0, 40856.0, 406813.0, 3646729.0, 51807.0, 14265.0, 5657.0, 2555.0, 1396.0, 773.0, 427.0, 258.0, 142.0, 90.0, 69.0, 39.0, 32.0, 24.0, 15.0, 12.0, 11.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 3.0, 1.0], "bins": [-7.62109375, -7.39068603515625, -7.1602783203125, -6.92987060546875, -6.699462890625, -6.46905517578125, -6.2386474609375, -6.00823974609375, -5.77783203125, -5.54742431640625, -5.3170166015625, -5.08660888671875, -4.856201171875, -4.62579345703125, -4.3953857421875, -4.16497802734375, -3.9345703125, -3.70416259765625, -3.4737548828125, -3.24334716796875, -3.012939453125, -2.78253173828125, -2.5521240234375, -2.32171630859375, -2.09130859375, -1.86090087890625, -1.6304931640625, -1.40008544921875, -1.169677734375, -0.93927001953125, -0.7088623046875, -0.47845458984375, -0.248046875, -0.01763916015625, 0.2127685546875, 0.44317626953125, 0.673583984375, 0.90399169921875, 1.1343994140625, 1.36480712890625, 1.59521484375, 1.82562255859375, 2.0560302734375, 2.28643798828125, 2.516845703125, 2.74725341796875, 2.9776611328125, 3.20806884765625, 3.4384765625, 3.66888427734375, 3.8992919921875, 4.12969970703125, 4.360107421875, 4.59051513671875, 4.8209228515625, 5.05133056640625, 5.28173828125, 5.51214599609375, 5.7425537109375, 5.97296142578125, 6.203369140625, 6.43377685546875, 6.6641845703125, 6.89459228515625, 7.125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 11.0, 14.0, 17.0, 17.0, 16.0, 31.0, 44.0, 36.0, 47.0, 57.0, 59.0, 58.0, 78.0, 69.0, 64.0, 56.0, 61.0, 44.0, 40.0, 51.0, 22.0, 24.0, 22.0, 14.0, 9.0, 13.0, 5.0, 4.0, 3.0, 5.0, 2.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.96875, -4.8143310546875, -4.659912109375, -4.5054931640625, -4.35107421875, -4.1966552734375, -4.042236328125, -3.8878173828125, -3.7333984375, -3.5789794921875, -3.424560546875, -3.2701416015625, -3.11572265625, -2.9613037109375, -2.806884765625, -2.6524658203125, -2.498046875, -2.3436279296875, -2.189208984375, -2.0347900390625, -1.88037109375, -1.7259521484375, -1.571533203125, -1.4171142578125, -1.2626953125, -1.1082763671875, -0.953857421875, -0.7994384765625, -0.64501953125, -0.4906005859375, -0.336181640625, -0.1817626953125, -0.02734375, 0.1270751953125, 0.281494140625, 0.4359130859375, 0.59033203125, 0.7447509765625, 0.899169921875, 1.0535888671875, 1.2080078125, 1.3624267578125, 1.516845703125, 1.6712646484375, 1.82568359375, 1.9801025390625, 2.134521484375, 2.2889404296875, 2.443359375, 2.5977783203125, 2.752197265625, 2.9066162109375, 3.06103515625, 3.2154541015625, 3.369873046875, 3.5242919921875, 3.6787109375, 3.8331298828125, 3.987548828125, 4.1419677734375, 4.29638671875, 4.4508056640625, 4.605224609375, 4.7596435546875, 4.9140625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 7.0, 8.0, 13.0, 10.0, 16.0, 18.0, 29.0, 45.0, 53.0, 71.0, 85.0, 123.0, 176.0, 274.0, 430.0, 720.0, 1312.0, 2585.0, 6075.0, 16397.0, 65891.0, 3653314.0, 382646.0, 42057.0, 12224.0, 4662.0, 2126.0, 1099.0, 637.0, 363.0, 233.0, 163.0, 135.0, 72.0, 55.0, 49.0, 32.0, 30.0, 16.0, 13.0, 11.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.87890625, -7.6651611328125, -7.451416015625, -7.2376708984375, -7.02392578125, -6.8101806640625, -6.596435546875, -6.3826904296875, -6.1689453125, -5.9552001953125, -5.741455078125, -5.5277099609375, -5.31396484375, -5.1002197265625, -4.886474609375, -4.6727294921875, -4.458984375, -4.2452392578125, -4.031494140625, -3.8177490234375, -3.60400390625, -3.3902587890625, -3.176513671875, -2.9627685546875, -2.7490234375, -2.5352783203125, -2.321533203125, -2.1077880859375, -1.89404296875, -1.6802978515625, -1.466552734375, -1.2528076171875, -1.0390625, -0.8253173828125, -0.611572265625, -0.3978271484375, -0.18408203125, 0.0296630859375, 0.243408203125, 0.4571533203125, 0.6708984375, 0.8846435546875, 1.098388671875, 1.3121337890625, 1.52587890625, 1.7396240234375, 1.953369140625, 2.1671142578125, 2.380859375, 2.5946044921875, 2.808349609375, 3.0220947265625, 3.23583984375, 3.4495849609375, 3.663330078125, 3.8770751953125, 4.0908203125, 4.3045654296875, 4.518310546875, 4.7320556640625, 4.94580078125, 5.1595458984375, 5.373291015625, 5.5870361328125, 5.80078125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 6.0, 6.0, 18.0, 24.0, 34.0, 91.0, 309.0, 3224.0, 219.0, 61.0, 29.0, 16.0, 10.0, 10.0, 4.0, 2.0, 4.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.923828125, -3.828826904296875, -3.73382568359375, -3.638824462890625, -3.5438232421875, -3.448822021484375, -3.35382080078125, -3.258819580078125, -3.163818359375, -3.068817138671875, -2.97381591796875, -2.878814697265625, -2.7838134765625, -2.688812255859375, -2.59381103515625, -2.498809814453125, -2.40380859375, -2.308807373046875, -2.21380615234375, -2.118804931640625, -2.0238037109375, -1.928802490234375, -1.83380126953125, -1.738800048828125, -1.643798828125, -1.548797607421875, -1.45379638671875, -1.358795166015625, -1.2637939453125, -1.168792724609375, -1.07379150390625, -0.978790283203125, -0.8837890625, -0.788787841796875, -0.69378662109375, -0.598785400390625, -0.5037841796875, -0.408782958984375, -0.31378173828125, -0.218780517578125, -0.123779296875, -0.028778076171875, 0.06622314453125, 0.161224365234375, 0.2562255859375, 0.351226806640625, 0.44622802734375, 0.541229248046875, 0.63623046875, 0.731231689453125, 0.82623291015625, 0.921234130859375, 1.0162353515625, 1.111236572265625, 1.20623779296875, 1.301239013671875, 1.396240234375, 1.491241455078125, 1.58624267578125, 1.681243896484375, 1.7762451171875, 1.871246337890625, 1.96624755859375, 2.061248779296875, 2.15625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 25.0, 72.0, 307.0, 394.0, 157.0, 33.0, 10.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.83179473876953, -34.04258346557617, -33.25336837768555, -32.46415710449219, -31.674945831298828, -30.885732650756836, -30.096519470214844, -29.307308197021484, -28.518095016479492, -27.7288818359375, -26.93967056274414, -26.15045738220215, -25.361244201660156, -24.572032928466797, -23.782819747924805, -22.993606567382812, -22.204395294189453, -21.41518211364746, -20.6259708404541, -19.83675765991211, -19.04754638671875, -18.258333206176758, -17.469120025634766, -16.679908752441406, -15.890695571899414, -15.101483345031738, -14.312271118164062, -13.52305793762207, -12.733845710754395, -11.944633483886719, -11.155420303344727, -10.36620807647705, -9.576997756958008, -8.787785530090332, -7.998572826385498, -7.209360122680664, -6.420147895812988, -5.6309356689453125, -4.8417229652404785, -4.0525102615356445, -3.2632980346679688, -2.474085569381714, -1.684873104095459, -0.8956606388092041, -0.10644817352294922, 0.6827642917633057, 1.4719767570495605, 2.2611894607543945, 3.0504016876220703, 3.839614152908325, 4.62882661819458, 5.418039321899414, 6.20725154876709, 6.996463775634766, 7.7856764793396, 8.574889183044434, 9.36410140991211, 10.153313636779785, 10.942525863647461, 11.731739044189453, 12.520951271057129, 13.310163497924805, 14.099376678466797, 14.888588905334473, 15.677801132202148]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 8.0, 2.0, 4.0, 3.0, 8.0, 11.0, 14.0, 13.0, 18.0, 19.0, 28.0, 21.0, 25.0, 30.0, 27.0, 24.0, 40.0, 34.0, 37.0, 40.0, 38.0, 46.0, 26.0, 42.0, 40.0, 38.0, 30.0, 49.0, 28.0, 30.0, 23.0, 23.0, 23.0, 24.0, 25.0, 15.0, 13.0, 13.0, 16.0, 15.0, 10.0, 9.0, 4.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-3.446737766265869, -3.3314435482025146, -3.21614933013916, -3.1008553504943848, -2.9855611324310303, -2.870266914367676, -2.7549726963043213, -2.639678478240967, -2.5243844985961914, -2.409090280532837, -2.2937960624694824, -2.178502082824707, -2.0632078647613525, -1.947913646697998, -1.8326194286346436, -1.717325210571289, -1.6020309925079346, -1.48673677444458, -1.3714426755905151, -1.2561484575271606, -1.1408543586730957, -1.0255601406097412, -0.9102659225463867, -0.794971764087677, -0.6796776056289673, -0.5643834471702576, -0.44908925890922546, -0.33379507064819336, -0.21850091218948364, -0.10320675373077393, 0.012087464332580566, 0.12738162279129028, 0.24267578125, 0.3579699397087097, 0.4732641279697418, 0.5885583162307739, 0.7038524746894836, 0.8191466331481934, 0.9344408512115479, 1.0497350692749023, 1.1650291681289673, 1.2803233861923218, 1.3956174850463867, 1.5109117031097412, 1.6262059211730957, 1.7415000200271606, 1.8567942380905151, 1.97208833694458, 2.0873825550079346, 2.202676773071289, 2.3179709911346436, 2.433265209197998, 2.5485591888427734, 2.663853406906128, 2.7791476249694824, 2.894441843032837, 3.0097360610961914, 3.125030279159546, 3.2403244972229004, 3.355618476867676, 3.4709126949310303, 3.5862069129943848, 3.7015011310577393, 3.8167953491210938, 3.932089328765869]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 4.0, 3.0, 7.0, 3.0, 14.0, 11.0, 29.0, 35.0, 46.0, 57.0, 101.0, 181.0, 308.0, 492.0, 1021.0, 2218.0, 5228.0, 13665.0, 39933.0, 122785.0, 309499.0, 335294.0, 143692.0, 47092.0, 15977.0, 5830.0, 2471.0, 1142.0, 542.0, 333.0, 195.0, 110.0, 68.0, 40.0, 31.0, 25.0, 27.0, 13.0, 9.0, 7.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.9375, -6.72119140625, -6.5048828125, -6.28857421875, -6.072265625, -5.85595703125, -5.6396484375, -5.42333984375, -5.20703125, -4.99072265625, -4.7744140625, -4.55810546875, -4.341796875, -4.12548828125, -3.9091796875, -3.69287109375, -3.4765625, -3.26025390625, -3.0439453125, -2.82763671875, -2.611328125, -2.39501953125, -2.1787109375, -1.96240234375, -1.74609375, -1.52978515625, -1.3134765625, -1.09716796875, -0.880859375, -0.66455078125, -0.4482421875, -0.23193359375, -0.015625, 0.20068359375, 0.4169921875, 0.63330078125, 0.849609375, 1.06591796875, 1.2822265625, 1.49853515625, 1.71484375, 1.93115234375, 2.1474609375, 2.36376953125, 2.580078125, 2.79638671875, 3.0126953125, 3.22900390625, 3.4453125, 3.66162109375, 3.8779296875, 4.09423828125, 4.310546875, 4.52685546875, 4.7431640625, 4.95947265625, 5.17578125, 5.39208984375, 5.6083984375, 5.82470703125, 6.041015625, 6.25732421875, 6.4736328125, 6.68994140625, 6.90625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 8.0, 9.0, 10.0, 15.0, 13.0, 15.0, 13.0, 29.0, 30.0, 31.0, 46.0, 40.0, 46.0, 51.0, 56.0, 55.0, 69.0, 61.0, 59.0, 49.0, 48.0, 39.0, 34.0, 40.0, 36.0, 14.0, 27.0, 17.0, 11.0, 4.0, 10.0, 4.0, 6.0, 1.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26953125, -4.13360595703125, -3.9976806640625, -3.86175537109375, -3.725830078125, -3.58990478515625, -3.4539794921875, -3.31805419921875, -3.18212890625, -3.04620361328125, -2.9102783203125, -2.77435302734375, -2.638427734375, -2.50250244140625, -2.3665771484375, -2.23065185546875, -2.0947265625, -1.95880126953125, -1.8228759765625, -1.68695068359375, -1.551025390625, -1.41510009765625, -1.2791748046875, -1.14324951171875, -1.00732421875, -0.87139892578125, -0.7354736328125, -0.59954833984375, -0.463623046875, -0.32769775390625, -0.1917724609375, -0.05584716796875, 0.080078125, 0.21600341796875, 0.3519287109375, 0.48785400390625, 0.623779296875, 0.75970458984375, 0.8956298828125, 1.03155517578125, 1.16748046875, 1.30340576171875, 1.4393310546875, 1.57525634765625, 1.711181640625, 1.84710693359375, 1.9830322265625, 2.11895751953125, 2.2548828125, 2.39080810546875, 2.5267333984375, 2.66265869140625, 2.798583984375, 2.93450927734375, 3.0704345703125, 3.20635986328125, 3.34228515625, 3.47821044921875, 3.6141357421875, 3.75006103515625, 3.885986328125, 4.02191162109375, 4.1578369140625, 4.29376220703125, 4.4296875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 6.0, 0.0, 3.0, 6.0, 14.0, 7.0, 18.0, 18.0, 23.0, 26.0, 49.0, 37.0, 60.0, 71.0, 120.0, 170.0, 236.0, 333.0, 458.0, 716.0, 1176.0, 2254.0, 5797.0, 21789.0, 117672.0, 558553.0, 274971.0, 45730.0, 10223.0, 3525.0, 1584.0, 920.0, 567.0, 373.0, 298.0, 191.0, 143.0, 120.0, 69.0, 55.0, 42.0, 32.0, 30.0, 15.0, 15.0, 7.0, 10.0, 6.0, 9.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-9.703125, -9.3973388671875, -9.091552734375, -8.7857666015625, -8.47998046875, -8.1741943359375, -7.868408203125, -7.5626220703125, -7.2568359375, -6.9510498046875, -6.645263671875, -6.3394775390625, -6.03369140625, -5.7279052734375, -5.422119140625, -5.1163330078125, -4.810546875, -4.5047607421875, -4.198974609375, -3.8931884765625, -3.58740234375, -3.2816162109375, -2.975830078125, -2.6700439453125, -2.3642578125, -2.0584716796875, -1.752685546875, -1.4468994140625, -1.14111328125, -0.8353271484375, -0.529541015625, -0.2237548828125, 0.08203125, 0.3878173828125, 0.693603515625, 0.9993896484375, 1.30517578125, 1.6109619140625, 1.916748046875, 2.2225341796875, 2.5283203125, 2.8341064453125, 3.139892578125, 3.4456787109375, 3.75146484375, 4.0572509765625, 4.363037109375, 4.6688232421875, 4.974609375, 5.2803955078125, 5.586181640625, 5.8919677734375, 6.19775390625, 6.5035400390625, 6.809326171875, 7.1151123046875, 7.4208984375, 7.7266845703125, 8.032470703125, 8.3382568359375, 8.64404296875, 8.9498291015625, 9.255615234375, 9.5614013671875, 9.8671875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 9.0, 4.0, 12.0, 12.0, 15.0, 14.0, 7.0, 21.0, 16.0, 19.0, 40.0, 36.0, 37.0, 27.0, 43.0, 52.0, 56.0, 40.0, 71.0, 50.0, 48.0, 56.0, 49.0, 46.0, 30.0, 34.0, 27.0, 31.0, 27.0, 18.0, 9.0, 12.0, 8.0, 5.0, 9.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.296875, -17.725830078125, -17.15478515625, -16.583740234375, -16.0126953125, -15.441650390625, -14.87060546875, -14.299560546875, -13.728515625, -13.157470703125, -12.58642578125, -12.015380859375, -11.4443359375, -10.873291015625, -10.30224609375, -9.731201171875, -9.16015625, -8.589111328125, -8.01806640625, -7.447021484375, -6.8759765625, -6.304931640625, -5.73388671875, -5.162841796875, -4.591796875, -4.020751953125, -3.44970703125, -2.878662109375, -2.3076171875, -1.736572265625, -1.16552734375, -0.594482421875, -0.0234375, 0.547607421875, 1.11865234375, 1.689697265625, 2.2607421875, 2.831787109375, 3.40283203125, 3.973876953125, 4.544921875, 5.115966796875, 5.68701171875, 6.258056640625, 6.8291015625, 7.400146484375, 7.97119140625, 8.542236328125, 9.11328125, 9.684326171875, 10.25537109375, 10.826416015625, 11.3974609375, 11.968505859375, 12.53955078125, 13.110595703125, 13.681640625, 14.252685546875, 14.82373046875, 15.394775390625, 15.9658203125, 16.536865234375, 17.10791015625, 17.678955078125, 18.25]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 13.0, 10.0, 28.0, 49.0, 126.0, 412.0, 1737.0, 34403.0, 982393.0, 27160.0, 1547.0, 418.0, 129.0, 62.0, 35.0, 16.0, 12.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3046875, -8.8502197265625, -8.395751953125, -7.9412841796875, -7.48681640625, -7.0323486328125, -6.577880859375, -6.1234130859375, -5.6689453125, -5.2144775390625, -4.760009765625, -4.3055419921875, -3.85107421875, -3.3966064453125, -2.942138671875, -2.4876708984375, -2.033203125, -1.5787353515625, -1.124267578125, -0.6697998046875, -0.21533203125, 0.2391357421875, 0.693603515625, 1.1480712890625, 1.6025390625, 2.0570068359375, 2.511474609375, 2.9659423828125, 3.42041015625, 3.8748779296875, 4.329345703125, 4.7838134765625, 5.23828125, 5.6927490234375, 6.147216796875, 6.6016845703125, 7.05615234375, 7.5106201171875, 7.965087890625, 8.4195556640625, 8.8740234375, 9.3284912109375, 9.782958984375, 10.2374267578125, 10.69189453125, 11.1463623046875, 11.600830078125, 12.0552978515625, 12.509765625, 12.9642333984375, 13.418701171875, 13.8731689453125, 14.32763671875, 14.7821044921875, 15.236572265625, 15.6910400390625, 16.1455078125, 16.5999755859375, 17.054443359375, 17.5089111328125, 17.96337890625, 18.4178466796875, 18.872314453125, 19.3267822265625, 19.78125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 3.0, 11.0, 7.0, 12.0, 15.0, 28.0, 39.0, 51.0, 89.0, 108.0, 127.0, 135.0, 109.0, 87.0, 50.0, 32.0, 24.0, 21.0, 8.0, 17.0, 8.0, 6.0, 4.0, 2.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0010805130004882812, -0.0010535269975662231, -0.001026540994644165, -0.000999554991722107, -0.0009725689888000488, -0.0009455829858779907, -0.0009185969829559326, -0.0008916109800338745, -0.0008646249771118164, -0.0008376389741897583, -0.0008106529712677002, -0.0007836669683456421, -0.000756680965423584, -0.0007296949625015259, -0.0007027089595794678, -0.0006757229566574097, -0.0006487369537353516, -0.0006217509508132935, -0.0005947649478912354, -0.0005677789449691772, -0.0005407929420471191, -0.000513806939125061, -0.00048682093620300293, -0.0004598349332809448, -0.0004328489303588867, -0.0004058629274368286, -0.0003788769245147705, -0.0003518909215927124, -0.0003249049186706543, -0.0002979189157485962, -0.0002709329128265381, -0.00024394690990447998, -0.00021696090698242188, -0.00018997490406036377, -0.00016298890113830566, -0.00013600289821624756, -0.00010901689529418945, -8.203089237213135e-05, -5.504488945007324e-05, -2.8058886528015137e-05, -1.0728836059570312e-06, 2.5913119316101074e-05, 5.289912223815918e-05, 7.988512516021729e-05, 0.00010687112808227539, 0.0001338571310043335, 0.0001608431339263916, 0.0001878291368484497, 0.0002148151397705078, 0.00024180114269256592, 0.000268787145614624, 0.00029577314853668213, 0.00032275915145874023, 0.00034974515438079834, 0.00037673115730285645, 0.00040371716022491455, 0.00043070316314697266, 0.00045768916606903076, 0.00048467516899108887, 0.000511661171913147, 0.0005386471748352051, 0.0005656331777572632, 0.0005926191806793213, 0.0006196051836013794, 0.0006465911865234375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 0.0, 6.0, 9.0, 12.0, 21.0, 27.0, 51.0, 73.0, 150.0, 290.0, 540.0, 1477.0, 6543.0, 83697.0, 873158.0, 73718.0, 6060.0, 1516.0, 595.0, 259.0, 129.0, 84.0, 47.0, 37.0, 13.0, 13.0, 8.0, 9.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.24609375, -6.97247314453125, -6.6988525390625, -6.42523193359375, -6.151611328125, -5.87799072265625, -5.6043701171875, -5.33074951171875, -5.05712890625, -4.78350830078125, -4.5098876953125, -4.23626708984375, -3.962646484375, -3.68902587890625, -3.4154052734375, -3.14178466796875, -2.8681640625, -2.59454345703125, -2.3209228515625, -2.04730224609375, -1.773681640625, -1.50006103515625, -1.2264404296875, -0.95281982421875, -0.67919921875, -0.40557861328125, -0.1319580078125, 0.14166259765625, 0.415283203125, 0.68890380859375, 0.9625244140625, 1.23614501953125, 1.509765625, 1.78338623046875, 2.0570068359375, 2.33062744140625, 2.604248046875, 2.87786865234375, 3.1514892578125, 3.42510986328125, 3.69873046875, 3.97235107421875, 4.2459716796875, 4.51959228515625, 4.793212890625, 5.06683349609375, 5.3404541015625, 5.61407470703125, 5.8876953125, 6.16131591796875, 6.4349365234375, 6.70855712890625, 6.982177734375, 7.25579833984375, 7.5294189453125, 7.80303955078125, 8.07666015625, 8.35028076171875, 8.6239013671875, 8.89752197265625, 9.171142578125, 9.44476318359375, 9.7183837890625, 9.99200439453125, 10.265625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 8.0, 9.0, 32.0, 54.0, 102.0, 163.0, 193.0, 183.0, 127.0, 67.0, 35.0, 18.0, 11.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-17.296875, -16.94244384765625, -16.5880126953125, -16.23358154296875, -15.879150390625, -15.52471923828125, -15.1702880859375, -14.81585693359375, -14.46142578125, -14.10699462890625, -13.7525634765625, -13.39813232421875, -13.043701171875, -12.68927001953125, -12.3348388671875, -11.98040771484375, -11.6259765625, -11.27154541015625, -10.9171142578125, -10.56268310546875, -10.208251953125, -9.85382080078125, -9.4993896484375, -9.14495849609375, -8.79052734375, -8.43609619140625, -8.0816650390625, -7.72723388671875, -7.372802734375, -7.01837158203125, -6.6639404296875, -6.30950927734375, -5.955078125, -5.60064697265625, -5.2462158203125, -4.89178466796875, -4.537353515625, -4.18292236328125, -3.8284912109375, -3.47406005859375, -3.11962890625, -2.76519775390625, -2.4107666015625, -2.05633544921875, -1.701904296875, -1.34747314453125, -0.9930419921875, -0.63861083984375, -0.2841796875, 0.07025146484375, 0.4246826171875, 0.77911376953125, 1.133544921875, 1.48797607421875, 1.8424072265625, 2.19683837890625, 2.55126953125, 2.90570068359375, 3.2601318359375, 3.61456298828125, 3.968994140625, 4.32342529296875, 4.6778564453125, 5.03228759765625, 5.38671875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 8.0, 16.0, 58.0, 108.0, 220.0, 259.0, 188.0, 83.0, 32.0, 14.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-204.9035186767578, -200.09164428710938, -195.27978515625, -190.46791076660156, -185.65603637695312, -180.84417724609375, -176.0323028564453, -171.22042846679688, -166.4085693359375, -161.59669494628906, -156.7848358154297, -151.97296142578125, -147.1610870361328, -142.34922790527344, -137.537353515625, -132.72549438476562, -127.91361236572266, -123.10174560546875, -118.28987121582031, -113.4780044555664, -108.6661376953125, -103.85426330566406, -99.04239654541016, -94.23052978515625, -89.41865539550781, -84.6067886352539, -79.79491424560547, -74.98304748535156, -70.17118072509766, -65.35931396484375, -60.54743957519531, -55.735572814941406, -50.92371368408203, -46.11184310913086, -41.29997634887695, -36.48810577392578, -31.676237106323242, -26.864368438720703, -22.05249786376953, -17.240631103515625, -12.428760528564453, -7.616891384124756, -2.8050222396850586, 2.006847381591797, 6.818716049194336, 11.630584716796875, 16.442455291748047, 21.254322052001953, 26.066192626953125, 30.878061294555664, 35.6899299621582, 40.501800537109375, 45.31366729736328, 50.12553787231445, 54.937408447265625, 59.74927520751953, 64.56114196777344, 69.37300872802734, 74.18488311767578, 78.99674987792969, 83.8086166381836, 88.6204833984375, 93.43235778808594, 98.24422454833984, 103.05609893798828]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 5.0, 4.0, 6.0, 8.0, 10.0, 10.0, 17.0, 16.0, 14.0, 20.0, 29.0, 25.0, 34.0, 45.0, 45.0, 44.0, 45.0, 40.0, 45.0, 40.0, 54.0, 39.0, 45.0, 32.0, 38.0, 40.0, 30.0, 30.0, 27.0, 22.0, 21.0, 15.0, 18.0, 18.0, 13.0, 10.0, 11.0, 6.0, 6.0, 7.0, 4.0, 1.0, 1.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-74.59950256347656, -72.32041931152344, -70.04133605957031, -67.76225280761719, -65.48316955566406, -63.20408248901367, -60.92499542236328, -58.645912170410156, -56.36682891845703, -54.087745666503906, -51.80866241455078, -49.52957534790039, -47.250492095947266, -44.97140884399414, -42.69232177734375, -40.413238525390625, -38.1341552734375, -35.855072021484375, -33.57598876953125, -31.29690170288086, -29.017818450927734, -26.73873519897461, -24.45965003967285, -22.180564880371094, -19.90148162841797, -17.622398376464844, -15.343313217163086, -13.064229011535645, -10.785144805908203, -8.506060600280762, -6.22697639465332, -3.947892189025879, -1.6688003540039062, 0.6102838516235352, 2.8893680572509766, 5.168452262878418, 7.447536468505859, 9.7266206741333, 12.005704879760742, 14.284789085388184, 16.563873291015625, 18.84295654296875, 21.122041702270508, 23.401126861572266, 25.68021011352539, 27.959293365478516, 30.238378524780273, 32.51746368408203, 34.796546936035156, 37.07563018798828, 39.354713439941406, 41.6338005065918, 43.91288375854492, 46.19196701049805, 48.47105407714844, 50.75013732910156, 53.02922058105469, 55.30830383300781, 57.58738708496094, 59.86647415161133, 62.14555740356445, 64.42464447021484, 66.70372772216797, 68.9828109741211, 71.26189422607422]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 4.0, 10.0, 12.0, 21.0, 19.0, 39.0, 53.0, 77.0, 93.0, 168.0, 286.0, 428.0, 748.0, 1491.0, 3401.0, 9797.0, 51481.0, 4038489.0, 68637.0, 11448.0, 3781.0, 1648.0, 825.0, 467.0, 297.0, 183.0, 104.0, 75.0, 59.0, 46.0, 26.0, 17.0, 10.0, 11.0, 4.0, 7.0, 4.0, 4.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2421875, -8.880615234375, -8.51904296875, -8.157470703125, -7.7958984375, -7.434326171875, -7.07275390625, -6.711181640625, -6.349609375, -5.988037109375, -5.62646484375, -5.264892578125, -4.9033203125, -4.541748046875, -4.18017578125, -3.818603515625, -3.45703125, -3.095458984375, -2.73388671875, -2.372314453125, -2.0107421875, -1.649169921875, -1.28759765625, -0.926025390625, -0.564453125, -0.202880859375, 0.15869140625, 0.520263671875, 0.8818359375, 1.243408203125, 1.60498046875, 1.966552734375, 2.328125, 2.689697265625, 3.05126953125, 3.412841796875, 3.7744140625, 4.135986328125, 4.49755859375, 4.859130859375, 5.220703125, 5.582275390625, 5.94384765625, 6.305419921875, 6.6669921875, 7.028564453125, 7.39013671875, 7.751708984375, 8.11328125, 8.474853515625, 8.83642578125, 9.197998046875, 9.5595703125, 9.921142578125, 10.28271484375, 10.644287109375, 11.005859375, 11.367431640625, 11.72900390625, 12.090576171875, 12.4521484375, 12.813720703125, 13.17529296875, 13.536865234375, 13.8984375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 3.0, 2.0, 10.0, 10.0, 19.0, 11.0, 23.0, 25.0, 29.0, 45.0, 38.0, 50.0, 51.0, 59.0, 56.0, 69.0, 66.0, 72.0, 58.0, 54.0, 47.0, 33.0, 38.0, 34.0, 20.0, 25.0, 13.0, 10.0, 10.0, 13.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.015625, -4.87213134765625, -4.7286376953125, -4.58514404296875, -4.441650390625, -4.29815673828125, -4.1546630859375, -4.01116943359375, -3.86767578125, -3.72418212890625, -3.5806884765625, -3.43719482421875, -3.293701171875, -3.15020751953125, -3.0067138671875, -2.86322021484375, -2.7197265625, -2.57623291015625, -2.4327392578125, -2.28924560546875, -2.145751953125, -2.00225830078125, -1.8587646484375, -1.71527099609375, -1.57177734375, -1.42828369140625, -1.2847900390625, -1.14129638671875, -0.997802734375, -0.85430908203125, -0.7108154296875, -0.56732177734375, -0.423828125, -0.28033447265625, -0.1368408203125, 0.00665283203125, 0.150146484375, 0.29364013671875, 0.4371337890625, 0.58062744140625, 0.72412109375, 0.86761474609375, 1.0111083984375, 1.15460205078125, 1.298095703125, 1.44158935546875, 1.5850830078125, 1.72857666015625, 1.8720703125, 2.01556396484375, 2.1590576171875, 2.30255126953125, 2.446044921875, 2.58953857421875, 2.7330322265625, 2.87652587890625, 3.02001953125, 3.16351318359375, 3.3070068359375, 3.45050048828125, 3.593994140625, 3.73748779296875, 3.8809814453125, 4.02447509765625, 4.16796875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 7.0, 7.0, 8.0, 10.0, 10.0, 26.0, 33.0, 48.0, 54.0, 69.0, 80.0, 105.0, 179.0, 274.0, 345.0, 514.0, 825.0, 1612.0, 3156.0, 7721.0, 25178.0, 206177.0, 3876970.0, 48860.0, 12179.0, 4436.0, 2107.0, 1106.0, 662.0, 401.0, 298.0, 220.0, 163.0, 114.0, 90.0, 61.0, 44.0, 31.0, 26.0, 21.0, 15.0, 9.0, 7.0, 4.0, 6.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.08203125, -5.88067626953125, -5.6793212890625, -5.47796630859375, -5.276611328125, -5.07525634765625, -4.8739013671875, -4.67254638671875, -4.47119140625, -4.26983642578125, -4.0684814453125, -3.86712646484375, -3.665771484375, -3.46441650390625, -3.2630615234375, -3.06170654296875, -2.8603515625, -2.65899658203125, -2.4576416015625, -2.25628662109375, -2.054931640625, -1.85357666015625, -1.6522216796875, -1.45086669921875, -1.24951171875, -1.04815673828125, -0.8468017578125, -0.64544677734375, -0.444091796875, -0.24273681640625, -0.0413818359375, 0.15997314453125, 0.361328125, 0.56268310546875, 0.7640380859375, 0.96539306640625, 1.166748046875, 1.36810302734375, 1.5694580078125, 1.77081298828125, 1.97216796875, 2.17352294921875, 2.3748779296875, 2.57623291015625, 2.777587890625, 2.97894287109375, 3.1802978515625, 3.38165283203125, 3.5830078125, 3.78436279296875, 3.9857177734375, 4.18707275390625, 4.388427734375, 4.58978271484375, 4.7911376953125, 4.99249267578125, 5.19384765625, 5.39520263671875, 5.5965576171875, 5.79791259765625, 5.999267578125, 6.20062255859375, 6.4019775390625, 6.60333251953125, 6.8046875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 0.0, 2.0, 7.0, 11.0, 18.0, 20.0, 39.0, 76.0, 207.0, 3344.0, 183.0, 74.0, 30.0, 12.0, 17.0, 8.0, 8.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.375, -1.318817138671875, -1.26263427734375, -1.206451416015625, -1.1502685546875, -1.094085693359375, -1.03790283203125, -0.981719970703125, -0.925537109375, -0.869354248046875, -0.81317138671875, -0.756988525390625, -0.7008056640625, -0.644622802734375, -0.58843994140625, -0.532257080078125, -0.47607421875, -0.419891357421875, -0.36370849609375, -0.307525634765625, -0.2513427734375, -0.195159912109375, -0.13897705078125, -0.082794189453125, -0.026611328125, 0.029571533203125, 0.08575439453125, 0.141937255859375, 0.1981201171875, 0.254302978515625, 0.31048583984375, 0.366668701171875, 0.4228515625, 0.479034423828125, 0.53521728515625, 0.591400146484375, 0.6475830078125, 0.703765869140625, 0.75994873046875, 0.816131591796875, 0.872314453125, 0.928497314453125, 0.98468017578125, 1.040863037109375, 1.0970458984375, 1.153228759765625, 1.20941162109375, 1.265594482421875, 1.32177734375, 1.377960205078125, 1.43414306640625, 1.490325927734375, 1.5465087890625, 1.602691650390625, 1.65887451171875, 1.715057373046875, 1.771240234375, 1.827423095703125, 1.88360595703125, 1.939788818359375, 1.9959716796875, 2.052154541015625, 2.10833740234375, 2.164520263671875, 2.220703125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 6.0, 20.0, 95.0, 304.0, 340.0, 156.0, 57.0, 14.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.305152893066406, -24.706371307373047, -24.107587814331055, -23.508806228637695, -22.910022735595703, -22.311241149902344, -21.71245765686035, -21.113676071166992, -20.514892578125, -19.91611099243164, -19.31732749938965, -18.71854591369629, -18.119762420654297, -17.520980834960938, -16.922197341918945, -16.323415756225586, -15.724634170532227, -15.12585163116455, -14.527069091796875, -13.9282865524292, -13.329504013061523, -12.730722427368164, -12.131939888000488, -11.533157348632812, -10.934374809265137, -10.335592269897461, -9.736809730529785, -9.13802719116211, -8.53924560546875, -7.940462589263916, -7.341680526733398, -6.742897987365723, -6.144113540649414, -5.545331001281738, -4.9465484619140625, -4.347766399383545, -3.748983860015869, -3.1502013206481934, -2.5514190196990967, -1.95263671875, -1.3538541793823242, -0.755071759223938, -0.15628933906555176, 0.4424930810928345, 1.0412755012512207, 1.6400580406188965, 2.238840341567993, 2.83762264251709, 3.4364051818847656, 4.035187721252441, 4.633970260620117, 5.232752323150635, 5.8315348625183105, 6.430317401885986, 7.029099464416504, 7.62788200378418, 8.226664543151855, 8.825447082519531, 9.424229621887207, 10.023012161254883, 10.621793746948242, 11.220577239990234, 11.819358825683594, 12.41814136505127, 13.016923904418945]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 1.0, 7.0, 3.0, 5.0, 8.0, 13.0, 7.0, 9.0, 12.0, 15.0, 23.0, 17.0, 35.0, 26.0, 36.0, 38.0, 40.0, 46.0, 46.0, 42.0, 49.0, 40.0, 45.0, 53.0, 43.0, 39.0, 35.0, 38.0, 29.0, 34.0, 34.0, 27.0, 21.0, 16.0, 13.0, 11.0, 13.0, 6.0, 5.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.556063652038574, -3.4452922344207764, -3.3345205783843994, -3.2237491607666016, -3.1129777431488037, -3.002206325531006, -2.891434669494629, -2.780663251876831, -2.669891834259033, -2.5591204166412354, -2.4483487606048584, -2.3375773429870605, -2.2268059253692627, -2.116034507751465, -2.005262851715088, -1.89449143409729, -1.7837198972702026, -1.6729483604431152, -1.5621769428253174, -1.45140540599823, -1.3406339883804321, -1.2298624515533447, -1.1190910339355469, -1.0083194971084595, -0.8975480198860168, -0.7867765426635742, -0.6760050654411316, -0.565233588218689, -0.45446208119392395, -0.34369057416915894, -0.2329190969467163, -0.12214761972427368, -0.011376142501831055, 0.09939534217119217, 0.2101668268442154, 0.3209383189678192, 0.43170979619026184, 0.5424813032150269, 0.6532527804374695, 0.7640242576599121, 0.8747957348823547, 0.9855672121047974, 1.0963387489318848, 1.2071101665496826, 1.31788170337677, 1.4286532402038574, 1.5394246578216553, 1.6501960754394531, 1.7609676122665405, 1.871739149093628, 1.9825105667114258, 2.0932819843292236, 2.2040536403656006, 2.3148250579833984, 2.4255964756011963, 2.536367893218994, 2.647139549255371, 2.757910966873169, 2.868682622909546, 2.9794540405273438, 3.0902254581451416, 3.2009968757629395, 3.3117685317993164, 3.4225399494171143, 3.533311367034912]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 9.0, 13.0, 16.0, 18.0, 51.0, 75.0, 118.0, 185.0, 303.0, 565.0, 1051.0, 2071.0, 4325.0, 9722.0, 23530.0, 62011.0, 157102.0, 313352.0, 272348.0, 121631.0, 47069.0, 18082.0, 7528.0, 3514.0, 1748.0, 921.0, 487.0, 259.0, 157.0, 103.0, 56.0, 54.0, 29.0, 16.0, 13.0, 10.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.18359375, -5.00396728515625, -4.8243408203125, -4.64471435546875, -4.465087890625, -4.28546142578125, -4.1058349609375, -3.92620849609375, -3.74658203125, -3.56695556640625, -3.3873291015625, -3.20770263671875, -3.028076171875, -2.84844970703125, -2.6688232421875, -2.48919677734375, -2.3095703125, -2.12994384765625, -1.9503173828125, -1.77069091796875, -1.591064453125, -1.41143798828125, -1.2318115234375, -1.05218505859375, -0.87255859375, -0.69293212890625, -0.5133056640625, -0.33367919921875, -0.154052734375, 0.02557373046875, 0.2052001953125, 0.38482666015625, 0.564453125, 0.74407958984375, 0.9237060546875, 1.10333251953125, 1.282958984375, 1.46258544921875, 1.6422119140625, 1.82183837890625, 2.00146484375, 2.18109130859375, 2.3607177734375, 2.54034423828125, 2.719970703125, 2.89959716796875, 3.0792236328125, 3.25885009765625, 3.4384765625, 3.61810302734375, 3.7977294921875, 3.97735595703125, 4.156982421875, 4.33660888671875, 4.5162353515625, 4.69586181640625, 4.87548828125, 5.05511474609375, 5.2347412109375, 5.41436767578125, 5.593994140625, 5.77362060546875, 5.9532470703125, 6.13287353515625, 6.3125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 4.0, 8.0, 2.0, 8.0, 14.0, 11.0, 22.0, 24.0, 33.0, 35.0, 41.0, 39.0, 44.0, 50.0, 67.0, 51.0, 63.0, 68.0, 63.0, 60.0, 63.0, 29.0, 32.0, 33.0, 27.0, 29.0, 16.0, 20.0, 14.0, 11.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.66015625, -4.52178955078125, -4.3834228515625, -4.24505615234375, -4.106689453125, -3.96832275390625, -3.8299560546875, -3.69158935546875, -3.55322265625, -3.41485595703125, -3.2764892578125, -3.13812255859375, -2.999755859375, -2.86138916015625, -2.7230224609375, -2.58465576171875, -2.4462890625, -2.30792236328125, -2.1695556640625, -2.03118896484375, -1.892822265625, -1.75445556640625, -1.6160888671875, -1.47772216796875, -1.33935546875, -1.20098876953125, -1.0626220703125, -0.92425537109375, -0.785888671875, -0.64752197265625, -0.5091552734375, -0.37078857421875, -0.232421875, -0.09405517578125, 0.0443115234375, 0.18267822265625, 0.321044921875, 0.45941162109375, 0.5977783203125, 0.73614501953125, 0.87451171875, 1.01287841796875, 1.1512451171875, 1.28961181640625, 1.427978515625, 1.56634521484375, 1.7047119140625, 1.84307861328125, 1.9814453125, 2.11981201171875, 2.2581787109375, 2.39654541015625, 2.534912109375, 2.67327880859375, 2.8116455078125, 2.95001220703125, 3.08837890625, 3.22674560546875, 3.3651123046875, 3.50347900390625, 3.641845703125, 3.78021240234375, 3.9185791015625, 4.05694580078125, 4.1953125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 4.0, 5.0, 7.0, 10.0, 14.0, 22.0, 38.0, 37.0, 46.0, 74.0, 95.0, 146.0, 200.0, 232.0, 317.0, 507.0, 864.0, 1430.0, 3451.0, 10261.0, 40759.0, 216758.0, 577547.0, 151351.0, 30031.0, 7906.0, 2767.0, 1310.0, 709.0, 472.0, 308.0, 251.0, 181.0, 134.0, 86.0, 51.0, 47.0, 33.0, 26.0, 16.0, 12.0, 11.0, 11.0, 5.0, 7.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-8.140625, -7.88134765625, -7.6220703125, -7.36279296875, -7.103515625, -6.84423828125, -6.5849609375, -6.32568359375, -6.06640625, -5.80712890625, -5.5478515625, -5.28857421875, -5.029296875, -4.77001953125, -4.5107421875, -4.25146484375, -3.9921875, -3.73291015625, -3.4736328125, -3.21435546875, -2.955078125, -2.69580078125, -2.4365234375, -2.17724609375, -1.91796875, -1.65869140625, -1.3994140625, -1.14013671875, -0.880859375, -0.62158203125, -0.3623046875, -0.10302734375, 0.15625, 0.41552734375, 0.6748046875, 0.93408203125, 1.193359375, 1.45263671875, 1.7119140625, 1.97119140625, 2.23046875, 2.48974609375, 2.7490234375, 3.00830078125, 3.267578125, 3.52685546875, 3.7861328125, 4.04541015625, 4.3046875, 4.56396484375, 4.8232421875, 5.08251953125, 5.341796875, 5.60107421875, 5.8603515625, 6.11962890625, 6.37890625, 6.63818359375, 6.8974609375, 7.15673828125, 7.416015625, 7.67529296875, 7.9345703125, 8.19384765625, 8.453125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 6.0, 5.0, 11.0, 8.0, 6.0, 9.0, 14.0, 16.0, 16.0, 27.0, 19.0, 25.0, 26.0, 33.0, 33.0, 41.0, 36.0, 36.0, 53.0, 42.0, 54.0, 47.0, 39.0, 41.0, 47.0, 50.0, 30.0, 28.0, 19.0, 24.0, 24.0, 19.0, 18.0, 21.0, 20.0, 15.0, 5.0, 9.0, 9.0, 5.0, 3.0, 5.0, 5.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-14.78125, -14.3316650390625, -13.882080078125, -13.4324951171875, -12.98291015625, -12.5333251953125, -12.083740234375, -11.6341552734375, -11.1845703125, -10.7349853515625, -10.285400390625, -9.8358154296875, -9.38623046875, -8.9366455078125, -8.487060546875, -8.0374755859375, -7.587890625, -7.1383056640625, -6.688720703125, -6.2391357421875, -5.78955078125, -5.3399658203125, -4.890380859375, -4.4407958984375, -3.9912109375, -3.5416259765625, -3.092041015625, -2.6424560546875, -2.19287109375, -1.7432861328125, -1.293701171875, -0.8441162109375, -0.39453125, 0.0550537109375, 0.504638671875, 0.9542236328125, 1.40380859375, 1.8533935546875, 2.302978515625, 2.7525634765625, 3.2021484375, 3.6517333984375, 4.101318359375, 4.5509033203125, 5.00048828125, 5.4500732421875, 5.899658203125, 6.3492431640625, 6.798828125, 7.2484130859375, 7.697998046875, 8.1475830078125, 8.59716796875, 9.0467529296875, 9.496337890625, 9.9459228515625, 10.3955078125, 10.8450927734375, 11.294677734375, 11.7442626953125, 12.19384765625, 12.6434326171875, 13.093017578125, 13.5426025390625, 13.9921875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 5.0, 11.0, 9.0, 18.0, 21.0, 53.0, 74.0, 134.0, 319.0, 612.0, 1728.0, 9623.0, 303314.0, 713103.0, 15759.0, 2347.0, 716.0, 320.0, 160.0, 77.0, 37.0, 29.0, 25.0, 17.0, 8.0, 6.0, 10.0, 3.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.3671875, -12.0426025390625, -11.718017578125, -11.3934326171875, -11.06884765625, -10.7442626953125, -10.419677734375, -10.0950927734375, -9.7705078125, -9.4459228515625, -9.121337890625, -8.7967529296875, -8.47216796875, -8.1475830078125, -7.822998046875, -7.4984130859375, -7.173828125, -6.8492431640625, -6.524658203125, -6.2000732421875, -5.87548828125, -5.5509033203125, -5.226318359375, -4.9017333984375, -4.5771484375, -4.2525634765625, -3.927978515625, -3.6033935546875, -3.27880859375, -2.9542236328125, -2.629638671875, -2.3050537109375, -1.98046875, -1.6558837890625, -1.331298828125, -1.0067138671875, -0.68212890625, -0.3575439453125, -0.032958984375, 0.2916259765625, 0.6162109375, 0.9407958984375, 1.265380859375, 1.5899658203125, 1.91455078125, 2.2391357421875, 2.563720703125, 2.8883056640625, 3.212890625, 3.5374755859375, 3.862060546875, 4.1866455078125, 4.51123046875, 4.8358154296875, 5.160400390625, 5.4849853515625, 5.8095703125, 6.1341552734375, 6.458740234375, 6.7833251953125, 7.10791015625, 7.4324951171875, 7.757080078125, 8.0816650390625, 8.40625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 9.0, 5.0, 18.0, 14.0, 27.0, 34.0, 37.0, 39.0, 65.0, 91.0, 119.0, 110.0, 108.0, 76.0, 54.0, 43.0, 29.0, 21.0, 21.0, 7.0, 6.0, 10.0, 7.0, 10.0, 7.0, 10.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006155967712402344, -0.0005943924188613892, -0.0005731880664825439, -0.0005519837141036987, -0.0005307793617248535, -0.0005095750093460083, -0.0004883706569671631, -0.00046716630458831787, -0.00044596195220947266, -0.00042475759983062744, -0.0004035532474517822, -0.000382348895072937, -0.0003611445426940918, -0.0003399401903152466, -0.00031873583793640137, -0.00029753148555755615, -0.00027632713317871094, -0.0002551227807998657, -0.0002339184284210205, -0.0002127140760421753, -0.00019150972366333008, -0.00017030537128448486, -0.00014910101890563965, -0.00012789666652679443, -0.00010669231414794922, -8.5487961769104e-05, -6.428360939025879e-05, -4.3079257011413574e-05, -2.187490463256836e-05, -6.705522537231445e-07, 2.053380012512207e-05, 4.1738152503967285e-05, 6.29425048828125e-05, 8.414685726165771e-05, 0.00010535120964050293, 0.00012655556201934814, 0.00014775991439819336, 0.00016896426677703857, 0.0001901686191558838, 0.000211372971534729, 0.00023257732391357422, 0.00025378167629241943, 0.00027498602867126465, 0.00029619038105010986, 0.0003173947334289551, 0.0003385990858078003, 0.0003598034381866455, 0.0003810077905654907, 0.00040221214294433594, 0.00042341649532318115, 0.00044462084770202637, 0.0004658252000808716, 0.0004870295524597168, 0.000508233904838562, 0.0005294382572174072, 0.0005506426095962524, 0.0005718469619750977, 0.0005930513143539429, 0.0006142556667327881, 0.0006354600191116333, 0.0006566643714904785, 0.0006778687238693237, 0.0006990730762481689, 0.0007202774286270142, 0.0007414817810058594]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 8.0, 12.0, 12.0, 32.0, 32.0, 76.0, 104.0, 189.0, 317.0, 723.0, 1610.0, 5339.0, 27110.0, 414917.0, 556090.0, 32485.0, 6055.0, 1895.0, 752.0, 330.0, 154.0, 95.0, 62.0, 45.0, 32.0, 24.0, 12.0, 5.0, 8.0, 5.0, 9.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.5078125, -6.28375244140625, -6.0596923828125, -5.83563232421875, -5.611572265625, -5.38751220703125, -5.1634521484375, -4.93939208984375, -4.71533203125, -4.49127197265625, -4.2672119140625, -4.04315185546875, -3.819091796875, -3.59503173828125, -3.3709716796875, -3.14691162109375, -2.9228515625, -2.69879150390625, -2.4747314453125, -2.25067138671875, -2.026611328125, -1.80255126953125, -1.5784912109375, -1.35443115234375, -1.13037109375, -0.90631103515625, -0.6822509765625, -0.45819091796875, -0.234130859375, -0.01007080078125, 0.2139892578125, 0.43804931640625, 0.662109375, 0.88616943359375, 1.1102294921875, 1.33428955078125, 1.558349609375, 1.78240966796875, 2.0064697265625, 2.23052978515625, 2.45458984375, 2.67864990234375, 2.9027099609375, 3.12677001953125, 3.350830078125, 3.57489013671875, 3.7989501953125, 4.02301025390625, 4.2470703125, 4.47113037109375, 4.6951904296875, 4.91925048828125, 5.143310546875, 5.36737060546875, 5.5914306640625, 5.81549072265625, 6.03955078125, 6.26361083984375, 6.4876708984375, 6.71173095703125, 6.935791015625, 7.15985107421875, 7.3839111328125, 7.60797119140625, 7.83203125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 9.0, 11.0, 17.0, 25.0, 32.0, 53.0, 81.0, 101.0, 150.0, 137.0, 111.0, 86.0, 71.0, 37.0, 27.0, 12.0, 8.0, 11.0, 7.0, 9.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8671875, -9.621826171875, -9.37646484375, -9.131103515625, -8.8857421875, -8.640380859375, -8.39501953125, -8.149658203125, -7.904296875, -7.658935546875, -7.41357421875, -7.168212890625, -6.9228515625, -6.677490234375, -6.43212890625, -6.186767578125, -5.94140625, -5.696044921875, -5.45068359375, -5.205322265625, -4.9599609375, -4.714599609375, -4.46923828125, -4.223876953125, -3.978515625, -3.733154296875, -3.48779296875, -3.242431640625, -2.9970703125, -2.751708984375, -2.50634765625, -2.260986328125, -2.015625, -1.770263671875, -1.52490234375, -1.279541015625, -1.0341796875, -0.788818359375, -0.54345703125, -0.298095703125, -0.052734375, 0.192626953125, 0.43798828125, 0.683349609375, 0.9287109375, 1.174072265625, 1.41943359375, 1.664794921875, 1.91015625, 2.155517578125, 2.40087890625, 2.646240234375, 2.8916015625, 3.136962890625, 3.38232421875, 3.627685546875, 3.873046875, 4.118408203125, 4.36376953125, 4.609130859375, 4.8544921875, 5.099853515625, 5.34521484375, 5.590576171875, 5.8359375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 12.0, 24.0, 111.0, 354.0, 356.0, 116.0, 23.0, 7.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-247.74440002441406, -240.87088012695312, -233.9973602294922, -227.12384033203125, -220.25030517578125, -213.3767852783203, -206.50326538085938, -199.62974548339844, -192.7562255859375, -185.88270568847656, -179.00918579101562, -172.13565063476562, -165.2621307373047, -158.38861083984375, -151.5150909423828, -144.64157104492188, -137.76803588867188, -130.89451599121094, -124.02098846435547, -117.14746856689453, -110.27394104003906, -103.40042114257812, -96.52690124511719, -89.65338134765625, -82.77985382080078, -75.90633392333984, -69.03280639648438, -62.15928649902344, -55.285762786865234, -48.41223907470703, -41.538719177246094, -34.66519546508789, -27.79168701171875, -20.918163299560547, -14.044641494750977, -7.171119689941406, -0.2975959777832031, 6.575927734375, 13.449447631835938, 20.32297134399414, 27.196495056152344, 34.07001876831055, 40.94354248046875, 47.81706237792969, 54.69058609008789, 61.564109802246094, 68.43762969970703, 75.3111572265625, 82.18467712402344, 89.05819702148438, 95.93172454833984, 102.80524444580078, 109.67877197265625, 116.55229187011719, 123.42581176757812, 130.29933166503906, 137.1728515625, 144.04637145996094, 150.91989135742188, 157.79342651367188, 164.6669464111328, 171.54046630859375, 178.4139862060547, 185.28750610351562, 192.16104125976562]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 8.0, 20.0, 19.0, 14.0, 14.0, 21.0, 24.0, 25.0, 28.0, 35.0, 37.0, 42.0, 41.0, 49.0, 62.0, 58.0, 46.0, 52.0, 58.0, 49.0, 45.0, 44.0, 36.0, 34.0, 26.0, 24.0, 12.0, 16.0, 12.0, 14.0, 8.0, 6.0, 8.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.04206848144531, -72.6947250366211, -70.34737396240234, -68.00003051757812, -65.65267944335938, -63.30533218383789, -60.957984924316406, -58.61064147949219, -56.26329040527344, -53.91594314575195, -51.56859588623047, -49.221248626708984, -46.8739013671875, -44.526554107666016, -42.17920684814453, -39.83186340332031, -37.48451614379883, -35.137168884277344, -32.78982162475586, -30.442474365234375, -28.09512710571289, -25.747779846191406, -23.400434494018555, -21.05308723449707, -18.705739974975586, -16.3583927154541, -14.011045455932617, -11.66369915008545, -9.316351890563965, -6.9690046310424805, -4.6216583251953125, -2.274311065673828, 0.07303619384765625, 2.4203832149505615, 4.767730236053467, 7.115077018737793, 9.462424278259277, 11.809771537780762, 14.15711784362793, 16.504465103149414, 18.8518123626709, 21.199159622192383, 23.546506881713867, 25.89385223388672, 28.241199493408203, 30.588546752929688, 32.93589401245117, 35.283241271972656, 37.63058853149414, 39.977935791015625, 42.32528305053711, 44.672630310058594, 47.01997756958008, 49.36732482910156, 51.71466827392578, 54.06201934814453, 56.40936279296875, 58.756710052490234, 61.10405731201172, 63.4514045715332, 65.79875183105469, 68.1460952758789, 70.49344635009766, 72.84078979492188, 75.18814086914062]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 6.0, 12.0, 6.0, 12.0, 9.0, 15.0, 15.0, 38.0, 45.0, 55.0, 93.0, 144.0, 206.0, 303.0, 551.0, 983.0, 1817.0, 3995.0, 9575.0, 32837.0, 402330.0, 3673607.0, 46299.0, 11938.0, 4528.0, 2051.0, 1146.0, 625.0, 366.0, 215.0, 128.0, 96.0, 56.0, 48.0, 30.0, 17.0, 19.0, 9.0, 12.0, 11.0, 11.0, 6.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.234375, -7.9608154296875, -7.687255859375, -7.4136962890625, -7.14013671875, -6.8665771484375, -6.593017578125, -6.3194580078125, -6.0458984375, -5.7723388671875, -5.498779296875, -5.2252197265625, -4.95166015625, -4.6781005859375, -4.404541015625, -4.1309814453125, -3.857421875, -3.5838623046875, -3.310302734375, -3.0367431640625, -2.76318359375, -2.4896240234375, -2.216064453125, -1.9425048828125, -1.6689453125, -1.3953857421875, -1.121826171875, -0.8482666015625, -0.57470703125, -0.3011474609375, -0.027587890625, 0.2459716796875, 0.51953125, 0.7930908203125, 1.066650390625, 1.3402099609375, 1.61376953125, 1.8873291015625, 2.160888671875, 2.4344482421875, 2.7080078125, 2.9815673828125, 3.255126953125, 3.5286865234375, 3.80224609375, 4.0758056640625, 4.349365234375, 4.6229248046875, 4.896484375, 5.1700439453125, 5.443603515625, 5.7171630859375, 5.99072265625, 6.2642822265625, 6.537841796875, 6.8114013671875, 7.0849609375, 7.3585205078125, 7.632080078125, 7.9056396484375, 8.17919921875, 8.4527587890625, 8.726318359375, 8.9998779296875, 9.2734375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 10.0, 7.0, 6.0, 9.0, 10.0, 17.0, 20.0, 21.0, 19.0, 34.0, 30.0, 42.0, 55.0, 49.0, 42.0, 47.0, 67.0, 60.0, 56.0, 45.0, 53.0, 49.0, 43.0, 32.0, 32.0, 25.0, 15.0, 18.0, 22.0, 14.0, 10.0, 13.0, 10.0, 4.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-4.26171875, -4.137115478515625, -4.01251220703125, -3.887908935546875, -3.7633056640625, -3.638702392578125, -3.51409912109375, -3.389495849609375, -3.264892578125, -3.140289306640625, -3.01568603515625, -2.891082763671875, -2.7664794921875, -2.641876220703125, -2.51727294921875, -2.392669677734375, -2.26806640625, -2.143463134765625, -2.01885986328125, -1.894256591796875, -1.7696533203125, -1.645050048828125, -1.52044677734375, -1.395843505859375, -1.271240234375, -1.146636962890625, -1.02203369140625, -0.897430419921875, -0.7728271484375, -0.648223876953125, -0.52362060546875, -0.399017333984375, -0.2744140625, -0.149810791015625, -0.02520751953125, 0.099395751953125, 0.2239990234375, 0.348602294921875, 0.47320556640625, 0.597808837890625, 0.722412109375, 0.847015380859375, 0.97161865234375, 1.096221923828125, 1.2208251953125, 1.345428466796875, 1.47003173828125, 1.594635009765625, 1.71923828125, 1.843841552734375, 1.96844482421875, 2.093048095703125, 2.2176513671875, 2.342254638671875, 2.46685791015625, 2.591461181640625, 2.716064453125, 2.840667724609375, 2.96527099609375, 3.089874267578125, 3.2144775390625, 3.339080810546875, 3.46368408203125, 3.588287353515625, 3.712890625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 9.0, 16.0, 12.0, 8.0, 12.0, 22.0, 30.0, 24.0, 35.0, 45.0, 51.0, 59.0, 71.0, 75.0, 66.0, 73.0, 85.0, 93.0, 153.0, 877.0, 21994.0, 4160036.0, 9029.0, 565.0, 118.0, 78.0, 56.0, 73.0, 65.0, 64.0, 58.0, 47.0, 54.0, 46.0, 37.0, 32.0, 31.0, 22.0, 13.0, 14.0, 7.0, 8.0, 7.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-37.78125, -36.77099609375, -35.7607421875, -34.75048828125, -33.740234375, -32.72998046875, -31.7197265625, -30.70947265625, -29.69921875, -28.68896484375, -27.6787109375, -26.66845703125, -25.658203125, -24.64794921875, -23.6376953125, -22.62744140625, -21.6171875, -20.60693359375, -19.5966796875, -18.58642578125, -17.576171875, -16.56591796875, -15.5556640625, -14.54541015625, -13.53515625, -12.52490234375, -11.5146484375, -10.50439453125, -9.494140625, -8.48388671875, -7.4736328125, -6.46337890625, -5.453125, -4.44287109375, -3.4326171875, -2.42236328125, -1.412109375, -0.40185546875, 0.6083984375, 1.61865234375, 2.62890625, 3.63916015625, 4.6494140625, 5.65966796875, 6.669921875, 7.68017578125, 8.6904296875, 9.70068359375, 10.7109375, 11.72119140625, 12.7314453125, 13.74169921875, 14.751953125, 15.76220703125, 16.7724609375, 17.78271484375, 18.79296875, 19.80322265625, 20.8134765625, 21.82373046875, 22.833984375, 23.84423828125, 24.8544921875, 25.86474609375, 26.875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 13.0, 40.0, 3528.0, 467.0, 32.0, 6.0, 2.0, 0.0, 0.0, 1.0], "bins": [-34.3125, -33.7091064453125, -33.105712890625, -32.5023193359375, -31.89892578125, -31.2955322265625, -30.692138671875, -30.0887451171875, -29.4853515625, -28.8819580078125, -28.278564453125, -27.6751708984375, -27.07177734375, -26.4683837890625, -25.864990234375, -25.2615966796875, -24.658203125, -24.0548095703125, -23.451416015625, -22.8480224609375, -22.24462890625, -21.6412353515625, -21.037841796875, -20.4344482421875, -19.8310546875, -19.2276611328125, -18.624267578125, -18.0208740234375, -17.41748046875, -16.8140869140625, -16.210693359375, -15.6072998046875, -15.00390625, -14.4005126953125, -13.797119140625, -13.1937255859375, -12.59033203125, -11.9869384765625, -11.383544921875, -10.7801513671875, -10.1767578125, -9.5733642578125, -8.969970703125, -8.3665771484375, -7.76318359375, -7.1597900390625, -6.556396484375, -5.9530029296875, -5.349609375, -4.7462158203125, -4.142822265625, -3.5394287109375, -2.93603515625, -2.3326416015625, -1.729248046875, -1.1258544921875, -0.5224609375, 0.0809326171875, 0.684326171875, 1.2877197265625, 1.89111328125, 2.4945068359375, 3.097900390625, 3.7012939453125, 4.3046875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 14.0, 74.0, 257.0, 461.0, 144.0, 36.0, 11.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.0317611694336, -98.79784393310547, -96.56392669677734, -94.33000946044922, -92.0960922241211, -89.86217498779297, -87.62825775146484, -85.39434051513672, -83.1604232788086, -80.92650604248047, -78.69258880615234, -76.45867156982422, -74.2247543334961, -71.99083709716797, -69.75691986083984, -67.52300262451172, -65.2890853881836, -63.05516815185547, -60.821250915527344, -58.58733367919922, -56.353416442871094, -54.11949920654297, -51.885581970214844, -49.65166473388672, -47.417747497558594, -45.18383026123047, -42.949913024902344, -40.71599578857422, -38.482078552246094, -36.24816131591797, -34.014244079589844, -31.78032684326172, -29.546401977539062, -27.312484741210938, -25.078567504882812, -22.844650268554688, -20.610733032226562, -18.376815795898438, -16.142898559570312, -13.908981323242188, -11.675064086914062, -9.441146850585938, -7.2072296142578125, -4.9733123779296875, -2.7393951416015625, -0.5054779052734375, 1.7284393310546875, 3.9623565673828125, 6.1962738037109375, 8.430191040039062, 10.664108276367188, 12.898025512695312, 15.131942749023438, 17.365859985351562, 19.599777221679688, 21.833694458007812, 24.067611694335938, 26.301528930664062, 28.535446166992188, 30.769363403320312, 33.00328063964844, 35.23719787597656, 37.47111511230469, 39.70503234863281, 41.93894958496094]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 5.0, 3.0, 8.0, 17.0, 11.0, 18.0, 23.0, 39.0, 60.0, 76.0, 98.0, 130.0, 119.0, 111.0, 73.0, 72.0, 46.0, 29.0, 21.0, 12.0, 14.0, 5.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.319488525390625, -44.61859130859375, -42.917694091796875, -41.216796875, -39.515899658203125, -37.81500244140625, -36.114105224609375, -34.4132080078125, -32.712310791015625, -31.01141357421875, -29.310516357421875, -27.609619140625, -25.908721923828125, -24.20782470703125, -22.506929397583008, -20.806032180786133, -19.10513687133789, -17.404239654541016, -15.70334243774414, -14.002446174621582, -12.301548957824707, -10.600651741027832, -8.899755477905273, -7.198858261108398, -5.497961044311523, -3.7970640659332275, -2.0961670875549316, -0.39527034759521484, 1.3056268692016602, 3.006524085998535, 4.707420349121094, 6.408317565917969, 8.109214782714844, 9.810111999511719, 11.511009216308594, 13.211905479431152, 14.912802696228027, 16.61370086669922, 18.31459617614746, 20.015493392944336, 21.71639060974121, 23.417287826538086, 25.11818504333496, 26.819080352783203, 28.519977569580078, 30.220874786376953, 31.921772003173828, 33.6226692199707, 35.32356643676758, 37.02446365356445, 38.72536087036133, 40.4262580871582, 42.12715530395508, 43.82805252075195, 45.52894592285156, 47.22984313964844, 48.93074035644531, 50.63163757324219, 52.33253479003906, 54.03343200683594, 55.73432922363281, 57.43522644042969, 59.13612365722656, 60.83702087402344, 62.53791809082031]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 7.0, 15.0, 13.0, 18.0, 23.0, 42.0, 49.0, 77.0, 125.0, 180.0, 303.0, 499.0, 819.0, 1602.0, 3050.0, 7055.0, 18360.0, 57426.0, 209445.0, 448010.0, 210926.0, 58036.0, 18580.0, 6973.0, 3087.0, 1593.0, 843.0, 483.0, 287.0, 189.0, 128.0, 74.0, 73.0, 52.0, 35.0, 21.0, 12.0, 10.0, 7.0, 7.0, 10.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.50390625, -7.24957275390625, -6.9952392578125, -6.74090576171875, -6.486572265625, -6.23223876953125, -5.9779052734375, -5.72357177734375, -5.46923828125, -5.21490478515625, -4.9605712890625, -4.70623779296875, -4.451904296875, -4.19757080078125, -3.9432373046875, -3.68890380859375, -3.4345703125, -3.18023681640625, -2.9259033203125, -2.67156982421875, -2.417236328125, -2.16290283203125, -1.9085693359375, -1.65423583984375, -1.39990234375, -1.14556884765625, -0.8912353515625, -0.63690185546875, -0.382568359375, -0.12823486328125, 0.1260986328125, 0.38043212890625, 0.634765625, 0.88909912109375, 1.1434326171875, 1.39776611328125, 1.652099609375, 1.90643310546875, 2.1607666015625, 2.41510009765625, 2.66943359375, 2.92376708984375, 3.1781005859375, 3.43243408203125, 3.686767578125, 3.94110107421875, 4.1954345703125, 4.44976806640625, 4.7041015625, 4.95843505859375, 5.2127685546875, 5.46710205078125, 5.721435546875, 5.97576904296875, 6.2301025390625, 6.48443603515625, 6.73876953125, 6.99310302734375, 7.2474365234375, 7.50177001953125, 7.756103515625, 8.01043701171875, 8.2647705078125, 8.51910400390625, 8.7734375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 4.0, 2.0, 7.0, 14.0, 14.0, 15.0, 20.0, 38.0, 38.0, 47.0, 59.0, 74.0, 82.0, 78.0, 93.0, 93.0, 59.0, 55.0, 41.0, 43.0, 33.0, 27.0, 15.0, 19.0, 3.0, 7.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.67578125, -7.45562744140625, -7.2354736328125, -7.01531982421875, -6.795166015625, -6.57501220703125, -6.3548583984375, -6.13470458984375, -5.91455078125, -5.69439697265625, -5.4742431640625, -5.25408935546875, -5.033935546875, -4.81378173828125, -4.5936279296875, -4.37347412109375, -4.1533203125, -3.93316650390625, -3.7130126953125, -3.49285888671875, -3.272705078125, -3.05255126953125, -2.8323974609375, -2.61224365234375, -2.39208984375, -2.17193603515625, -1.9517822265625, -1.73162841796875, -1.511474609375, -1.29132080078125, -1.0711669921875, -0.85101318359375, -0.630859375, -0.41070556640625, -0.1905517578125, 0.02960205078125, 0.249755859375, 0.46990966796875, 0.6900634765625, 0.91021728515625, 1.13037109375, 1.35052490234375, 1.5706787109375, 1.79083251953125, 2.010986328125, 2.23114013671875, 2.4512939453125, 2.67144775390625, 2.8916015625, 3.11175537109375, 3.3319091796875, 3.55206298828125, 3.772216796875, 3.99237060546875, 4.2125244140625, 4.43267822265625, 4.65283203125, 4.87298583984375, 5.0931396484375, 5.31329345703125, 5.533447265625, 5.75360107421875, 5.9737548828125, 6.19390869140625, 6.4140625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 10.0, 11.0, 22.0, 34.0, 101.0, 181.0, 490.0, 1504.0, 9091.0, 929437.0, 102979.0, 3292.0, 869.0, 304.0, 103.0, 54.0, 28.0, 13.0, 11.0, 5.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.59375, -39.31591796875, -38.0380859375, -36.76025390625, -35.482421875, -34.20458984375, -32.9267578125, -31.64892578125, -30.37109375, -29.09326171875, -27.8154296875, -26.53759765625, -25.259765625, -23.98193359375, -22.7041015625, -21.42626953125, -20.1484375, -18.87060546875, -17.5927734375, -16.31494140625, -15.037109375, -13.75927734375, -12.4814453125, -11.20361328125, -9.92578125, -8.64794921875, -7.3701171875, -6.09228515625, -4.814453125, -3.53662109375, -2.2587890625, -0.98095703125, 0.296875, 1.57470703125, 2.8525390625, 4.13037109375, 5.408203125, 6.68603515625, 7.9638671875, 9.24169921875, 10.51953125, 11.79736328125, 13.0751953125, 14.35302734375, 15.630859375, 16.90869140625, 18.1865234375, 19.46435546875, 20.7421875, 22.02001953125, 23.2978515625, 24.57568359375, 25.853515625, 27.13134765625, 28.4091796875, 29.68701171875, 30.96484375, 32.24267578125, 33.5205078125, 34.79833984375, 36.076171875, 37.35400390625, 38.6318359375, 39.90966796875, 41.1875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 7.0, 8.0, 23.0, 45.0, 79.0, 127.0, 159.0, 169.0, 149.0, 115.0, 74.0, 26.0, 18.0, 4.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.5, -65.4013671875, -63.302734375, -61.2041015625, -59.10546875, -57.0068359375, -54.908203125, -52.8095703125, -50.7109375, -48.6123046875, -46.513671875, -44.4150390625, -42.31640625, -40.2177734375, -38.119140625, -36.0205078125, -33.921875, -31.8232421875, -29.724609375, -27.6259765625, -25.52734375, -23.4287109375, -21.330078125, -19.2314453125, -17.1328125, -15.0341796875, -12.935546875, -10.8369140625, -8.73828125, -6.6396484375, -4.541015625, -2.4423828125, -0.34375, 1.7548828125, 3.853515625, 5.9521484375, 8.05078125, 10.1494140625, 12.248046875, 14.3466796875, 16.4453125, 18.5439453125, 20.642578125, 22.7412109375, 24.83984375, 26.9384765625, 29.037109375, 31.1357421875, 33.234375, 35.3330078125, 37.431640625, 39.5302734375, 41.62890625, 43.7275390625, 45.826171875, 47.9248046875, 50.0234375, 52.1220703125, 54.220703125, 56.3193359375, 58.41796875, 60.5166015625, 62.615234375, 64.7138671875, 66.8125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 7.0, 10.0, 11.0, 23.0, 20.0, 45.0, 63.0, 98.0, 201.0, 402.0, 784.0, 2193.0, 8460.0, 77056.0, 829644.0, 114784.0, 10420.0, 2427.0, 961.0, 411.0, 209.0, 106.0, 71.0, 41.0, 35.0, 22.0, 19.0, 10.0, 8.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1953125, -6.0107421875, -5.826171875, -5.6416015625, -5.45703125, -5.2724609375, -5.087890625, -4.9033203125, -4.71875, -4.5341796875, -4.349609375, -4.1650390625, -3.98046875, -3.7958984375, -3.611328125, -3.4267578125, -3.2421875, -3.0576171875, -2.873046875, -2.6884765625, -2.50390625, -2.3193359375, -2.134765625, -1.9501953125, -1.765625, -1.5810546875, -1.396484375, -1.2119140625, -1.02734375, -0.8427734375, -0.658203125, -0.4736328125, -0.2890625, -0.1044921875, 0.080078125, 0.2646484375, 0.44921875, 0.6337890625, 0.818359375, 1.0029296875, 1.1875, 1.3720703125, 1.556640625, 1.7412109375, 1.92578125, 2.1103515625, 2.294921875, 2.4794921875, 2.6640625, 2.8486328125, 3.033203125, 3.2177734375, 3.40234375, 3.5869140625, 3.771484375, 3.9560546875, 4.140625, 4.3251953125, 4.509765625, 4.6943359375, 4.87890625, 5.0634765625, 5.248046875, 5.4326171875, 5.6171875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 3.0, 2.0, 4.0, 8.0, 12.0, 9.0, 13.0, 11.0, 23.0, 25.0, 35.0, 40.0, 47.0, 82.0, 103.0, 131.0, 108.0, 83.0, 60.0, 46.0, 34.0, 22.0, 24.0, 14.0, 11.0, 8.0, 11.0, 4.0, 5.0, 5.0, 2.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0007433891296386719, -0.000720590353012085, -0.000697791576385498, -0.0006749927997589111, -0.0006521940231323242, -0.0006293952465057373, -0.0006065964698791504, -0.0005837976932525635, -0.0005609989166259766, -0.0005382001399993896, -0.0005154013633728027, -0.0004926025867462158, -0.0004698038101196289, -0.000447005033493042, -0.0004242062568664551, -0.00040140748023986816, -0.00037860870361328125, -0.00035580992698669434, -0.0003330111503601074, -0.0003102123737335205, -0.0002874135971069336, -0.0002646148204803467, -0.00024181604385375977, -0.00021901726722717285, -0.00019621849060058594, -0.00017341971397399902, -0.0001506209373474121, -0.0001278221607208252, -0.00010502338409423828, -8.222460746765137e-05, -5.942583084106445e-05, -3.662705421447754e-05, -1.3828277587890625e-05, 8.970499038696289e-06, 3.17692756652832e-05, 5.456805229187012e-05, 7.736682891845703e-05, 0.00010016560554504395, 0.00012296438217163086, 0.00014576315879821777, 0.0001685619354248047, 0.0001913607120513916, 0.00021415948867797852, 0.00023695826530456543, 0.00025975704193115234, 0.00028255581855773926, 0.00030535459518432617, 0.0003281533718109131, 0.0003509521484375, 0.0003737509250640869, 0.00039654970169067383, 0.00041934847831726074, 0.00044214725494384766, 0.00046494603157043457, 0.0004877448081970215, 0.0005105435848236084, 0.0005333423614501953, 0.0005561411380767822, 0.0005789399147033691, 0.0006017386913299561, 0.000624537467956543, 0.0006473362445831299, 0.0006701350212097168, 0.0006929337978363037, 0.0007157325744628906]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 5.0, 6.0, 2.0, 5.0, 7.0, 10.0, 13.0, 27.0, 28.0, 43.0, 53.0, 76.0, 116.0, 211.0, 384.0, 716.0, 1551.0, 3778.0, 13208.0, 93204.0, 727052.0, 179175.0, 20221.0, 4876.0, 1810.0, 851.0, 457.0, 249.0, 141.0, 91.0, 57.0, 29.0, 28.0, 26.0, 10.0, 10.0, 10.0, 7.0, 6.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.84765625, -4.69439697265625, -4.5411376953125, -4.38787841796875, -4.234619140625, -4.08135986328125, -3.9281005859375, -3.77484130859375, -3.62158203125, -3.46832275390625, -3.3150634765625, -3.16180419921875, -3.008544921875, -2.85528564453125, -2.7020263671875, -2.54876708984375, -2.3955078125, -2.24224853515625, -2.0889892578125, -1.93572998046875, -1.782470703125, -1.62921142578125, -1.4759521484375, -1.32269287109375, -1.16943359375, -1.01617431640625, -0.8629150390625, -0.70965576171875, -0.556396484375, -0.40313720703125, -0.2498779296875, -0.09661865234375, 0.056640625, 0.20989990234375, 0.3631591796875, 0.51641845703125, 0.669677734375, 0.82293701171875, 0.9761962890625, 1.12945556640625, 1.28271484375, 1.43597412109375, 1.5892333984375, 1.74249267578125, 1.895751953125, 2.04901123046875, 2.2022705078125, 2.35552978515625, 2.5087890625, 2.66204833984375, 2.8153076171875, 2.96856689453125, 3.121826171875, 3.27508544921875, 3.4283447265625, 3.58160400390625, 3.73486328125, 3.88812255859375, 4.0413818359375, 4.19464111328125, 4.347900390625, 4.50115966796875, 4.6544189453125, 4.80767822265625, 4.9609375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 7.0, 5.0, 16.0, 18.0, 41.0, 48.0, 86.0, 103.0, 133.0, 126.0, 111.0, 102.0, 74.0, 47.0, 30.0, 23.0, 11.0, 7.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.109375, -8.88372802734375, -8.6580810546875, -8.43243408203125, -8.206787109375, -7.98114013671875, -7.7554931640625, -7.52984619140625, -7.30419921875, -7.07855224609375, -6.8529052734375, -6.62725830078125, -6.401611328125, -6.17596435546875, -5.9503173828125, -5.72467041015625, -5.4990234375, -5.27337646484375, -5.0477294921875, -4.82208251953125, -4.596435546875, -4.37078857421875, -4.1451416015625, -3.91949462890625, -3.69384765625, -3.46820068359375, -3.2425537109375, -3.01690673828125, -2.791259765625, -2.56561279296875, -2.3399658203125, -2.11431884765625, -1.888671875, -1.66302490234375, -1.4373779296875, -1.21173095703125, -0.986083984375, -0.76043701171875, -0.5347900390625, -0.30914306640625, -0.08349609375, 0.14215087890625, 0.3677978515625, 0.59344482421875, 0.819091796875, 1.04473876953125, 1.2703857421875, 1.49603271484375, 1.7216796875, 1.94732666015625, 2.1729736328125, 2.39862060546875, 2.624267578125, 2.84991455078125, 3.0755615234375, 3.30120849609375, 3.52685546875, 3.75250244140625, 3.9781494140625, 4.20379638671875, 4.429443359375, 4.65509033203125, 4.8807373046875, 5.10638427734375, 5.33203125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 18.0, 58.0, 254.0, 438.0, 165.0, 42.0, 14.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-260.3667907714844, -251.2064208984375, -242.04605102539062, -232.88568115234375, -223.7252960205078, -214.56492614746094, -205.40455627441406, -196.24417114257812, -187.08380126953125, -177.92343139648438, -168.7630615234375, -159.60269165039062, -150.4423065185547, -141.2819366455078, -132.12156677246094, -122.96118927001953, -113.80082702636719, -104.64045715332031, -95.4800796508789, -86.31970977783203, -77.15933227539062, -67.99896240234375, -58.838592529296875, -49.67821502685547, -40.517845153808594, -31.357471466064453, -22.197099685668945, -13.036727905273438, -3.876354217529297, 5.284019470214844, 14.444389343261719, 23.604766845703125, 32.76513671875, 41.92551040649414, 51.08588409423828, 60.246253967285156, 69.40663146972656, 78.56700134277344, 87.72737121582031, 96.88774871826172, 106.0481185913086, 115.20848846435547, 124.36886596679688, 133.52923583984375, 142.68960571289062, 151.8499755859375, 161.01034545898438, 170.1707305908203, 179.3311004638672, 188.49147033691406, 197.65184020996094, 206.81222534179688, 215.97259521484375, 225.13296508789062, 234.2933349609375, 243.45370483398438, 252.61407470703125, 261.7744445800781, 270.934814453125, 280.0951843261719, 289.25555419921875, 298.41595458984375, 307.5762939453125, 316.7366943359375, 325.8970642089844]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 8.0, 5.0, 7.0, 11.0, 15.0, 17.0, 20.0, 30.0, 35.0, 28.0, 36.0, 52.0, 38.0, 60.0, 61.0, 65.0, 61.0, 62.0, 62.0, 48.0, 49.0, 49.0, 32.0, 31.0, 25.0, 17.0, 15.0, 17.0, 11.0, 7.0, 9.0, 5.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-152.39544677734375, -147.9127197265625, -143.4299774169922, -138.94725036621094, -134.46450805664062, -129.98178100585938, -125.4990463256836, -121.01631164550781, -116.53358459472656, -112.05084991455078, -107.568115234375, -103.08538818359375, -98.60265350341797, -94.11991882324219, -89.6371841430664, -85.15444946289062, -80.67171478271484, -76.18898010253906, -71.70624542236328, -67.2235107421875, -62.74078369140625, -58.25804901123047, -53.77531433105469, -49.292579650878906, -44.80984878540039, -40.32711410522461, -35.844383239746094, -31.361648559570312, -26.878915786743164, -22.396183013916016, -17.913448333740234, -13.430715560913086, -8.947982788085938, -4.465249538421631, 0.01748371124267578, 4.500217437744141, 8.982950210571289, 13.465682983398438, 17.94841766357422, 22.431150436401367, 26.913883209228516, 31.396615982055664, 35.87934875488281, 40.362083435058594, 44.844818115234375, 49.32754898071289, 53.81028366088867, 58.29301452636719, 62.77574920654297, 67.25848388671875, 71.74121856689453, 76.22395324707031, 80.70668029785156, 85.18941497802734, 89.67214965820312, 94.1548843383789, 98.63761901855469, 103.12035369873047, 107.60308837890625, 112.0858154296875, 116.56855010986328, 121.05128479003906, 125.53401947021484, 130.01675415039062, 134.49948120117188]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 9.0, 13.0, 21.0, 24.0, 51.0, 90.0, 134.0, 293.0, 685.0, 1731.0, 5304.0, 20725.0, 213643.0, 3836827.0, 93643.0, 14574.0, 3921.0, 1391.0, 594.0, 268.0, 140.0, 79.0, 48.0, 25.0, 18.0, 8.0, 10.0, 6.0, 6.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.6328125, -11.2735595703125, -10.914306640625, -10.5550537109375, -10.19580078125, -9.8365478515625, -9.477294921875, -9.1180419921875, -8.7587890625, -8.3995361328125, -8.040283203125, -7.6810302734375, -7.32177734375, -6.9625244140625, -6.603271484375, -6.2440185546875, -5.884765625, -5.5255126953125, -5.166259765625, -4.8070068359375, -4.44775390625, -4.0885009765625, -3.729248046875, -3.3699951171875, -3.0107421875, -2.6514892578125, -2.292236328125, -1.9329833984375, -1.57373046875, -1.2144775390625, -0.855224609375, -0.4959716796875, -0.13671875, 0.2225341796875, 0.581787109375, 0.9410400390625, 1.30029296875, 1.6595458984375, 2.018798828125, 2.3780517578125, 2.7373046875, 3.0965576171875, 3.455810546875, 3.8150634765625, 4.17431640625, 4.5335693359375, 4.892822265625, 5.2520751953125, 5.611328125, 5.9705810546875, 6.329833984375, 6.6890869140625, 7.04833984375, 7.4075927734375, 7.766845703125, 8.1260986328125, 8.4853515625, 8.8446044921875, 9.203857421875, 9.5631103515625, 9.92236328125, 10.2816162109375, 10.640869140625, 11.0001220703125, 11.359375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 6.0, 7.0, 14.0, 15.0, 42.0, 34.0, 55.0, 67.0, 77.0, 96.0, 94.0, 110.0, 93.0, 81.0, 64.0, 39.0, 33.0, 17.0, 20.0, 13.0, 6.0, 5.0, 5.0, 3.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.0546875, -7.830322265625, -7.60595703125, -7.381591796875, -7.1572265625, -6.932861328125, -6.70849609375, -6.484130859375, -6.259765625, -6.035400390625, -5.81103515625, -5.586669921875, -5.3623046875, -5.137939453125, -4.91357421875, -4.689208984375, -4.46484375, -4.240478515625, -4.01611328125, -3.791748046875, -3.5673828125, -3.343017578125, -3.11865234375, -2.894287109375, -2.669921875, -2.445556640625, -2.22119140625, -1.996826171875, -1.7724609375, -1.548095703125, -1.32373046875, -1.099365234375, -0.875, -0.650634765625, -0.42626953125, -0.201904296875, 0.0224609375, 0.246826171875, 0.47119140625, 0.695556640625, 0.919921875, 1.144287109375, 1.36865234375, 1.593017578125, 1.8173828125, 2.041748046875, 2.26611328125, 2.490478515625, 2.71484375, 2.939208984375, 3.16357421875, 3.387939453125, 3.6123046875, 3.836669921875, 4.06103515625, 4.285400390625, 4.509765625, 4.734130859375, 4.95849609375, 5.182861328125, 5.4072265625, 5.631591796875, 5.85595703125, 6.080322265625, 6.3046875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 8.0, 11.0, 16.0, 22.0, 34.0, 47.0, 111.0, 226.0, 604.0, 2145.0, 13689.0, 308026.0, 3833708.0, 31101.0, 3326.0, 711.0, 239.0, 102.0, 51.0, 33.0, 15.0, 21.0, 14.0, 6.0, 3.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.8125, -18.189208984375, -17.56591796875, -16.942626953125, -16.3193359375, -15.696044921875, -15.07275390625, -14.449462890625, -13.826171875, -13.202880859375, -12.57958984375, -11.956298828125, -11.3330078125, -10.709716796875, -10.08642578125, -9.463134765625, -8.83984375, -8.216552734375, -7.59326171875, -6.969970703125, -6.3466796875, -5.723388671875, -5.10009765625, -4.476806640625, -3.853515625, -3.230224609375, -2.60693359375, -1.983642578125, -1.3603515625, -0.737060546875, -0.11376953125, 0.509521484375, 1.1328125, 1.756103515625, 2.37939453125, 3.002685546875, 3.6259765625, 4.249267578125, 4.87255859375, 5.495849609375, 6.119140625, 6.742431640625, 7.36572265625, 7.989013671875, 8.6123046875, 9.235595703125, 9.85888671875, 10.482177734375, 11.10546875, 11.728759765625, 12.35205078125, 12.975341796875, 13.5986328125, 14.221923828125, 14.84521484375, 15.468505859375, 16.091796875, 16.715087890625, 17.33837890625, 17.961669921875, 18.5849609375, 19.208251953125, 19.83154296875, 20.454833984375, 21.078125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 3.0, 9.0, 11.0, 16.0, 21.0, 28.0, 33.0, 76.0, 175.0, 813.0, 2301.0, 378.0, 110.0, 43.0, 29.0, 16.0, 4.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.34375, -22.74951171875, -22.1552734375, -21.56103515625, -20.966796875, -20.37255859375, -19.7783203125, -19.18408203125, -18.58984375, -17.99560546875, -17.4013671875, -16.80712890625, -16.212890625, -15.61865234375, -15.0244140625, -14.43017578125, -13.8359375, -13.24169921875, -12.6474609375, -12.05322265625, -11.458984375, -10.86474609375, -10.2705078125, -9.67626953125, -9.08203125, -8.48779296875, -7.8935546875, -7.29931640625, -6.705078125, -6.11083984375, -5.5166015625, -4.92236328125, -4.328125, -3.73388671875, -3.1396484375, -2.54541015625, -1.951171875, -1.35693359375, -0.7626953125, -0.16845703125, 0.42578125, 1.02001953125, 1.6142578125, 2.20849609375, 2.802734375, 3.39697265625, 3.9912109375, 4.58544921875, 5.1796875, 5.77392578125, 6.3681640625, 6.96240234375, 7.556640625, 8.15087890625, 8.7451171875, 9.33935546875, 9.93359375, 10.52783203125, 11.1220703125, 11.71630859375, 12.310546875, 12.90478515625, 13.4990234375, 14.09326171875, 14.6875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 10.0, 23.0, 46.0, 83.0, 139.0, 176.0, 188.0, 146.0, 77.0, 52.0, 25.0, 11.0, 13.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.96214294433594, -72.40230560302734, -69.84246063232422, -67.28262329101562, -64.7227783203125, -62.162940979003906, -59.60309982299805, -57.04325866699219, -54.48341751098633, -51.92357635498047, -49.36373519897461, -46.80389404296875, -44.244056701660156, -41.68421173095703, -39.12437438964844, -36.56453323364258, -34.00469207763672, -31.44485092163086, -28.885009765625, -26.325170516967773, -23.765329360961914, -21.205488204956055, -18.645648956298828, -16.08580780029297, -13.52596664428711, -10.96612548828125, -8.406285285949707, -5.846444606781006, -3.2866039276123047, -0.7267627716064453, 1.8330774307250977, 4.392917633056641, 6.9527587890625, 9.51259994506836, 12.072440147399902, 14.632280349731445, 17.192121505737305, 19.751962661743164, 22.31180191040039, 24.87164306640625, 27.43148422241211, 29.99132537841797, 32.55116653442383, 35.11100769042969, 37.67084503173828, 40.230690002441406, 42.79052734375, 45.35036849975586, 47.91020965576172, 50.47005081176758, 53.02989196777344, 55.5897331237793, 58.149574279785156, 60.70941162109375, 63.26925277709961, 65.82909393310547, 68.38893127441406, 70.94876861572266, 73.50861358642578, 76.06845092773438, 78.6282958984375, 81.1881332397461, 83.74797821044922, 86.30781555175781, 88.86766052246094]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 8.0, 8.0, 9.0, 12.0, 16.0, 38.0, 31.0, 33.0, 47.0, 52.0, 65.0, 66.0, 59.0, 74.0, 82.0, 64.0, 70.0, 50.0, 51.0, 38.0, 36.0, 20.0, 15.0, 18.0, 15.0, 6.0, 10.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.46385192871094, -45.46003341674805, -43.45621109008789, -41.452392578125, -39.448570251464844, -37.44475173950195, -35.44093322753906, -33.437110900878906, -31.433292388916016, -29.429471969604492, -27.42565155029297, -25.421833038330078, -23.418012619018555, -21.41419219970703, -19.41037368774414, -17.406553268432617, -15.402732849121094, -13.39891242980957, -11.395092964172363, -9.391273498535156, -7.387453079223633, -5.383632659912109, -3.3798131942749023, -1.3759937286376953, 0.6278266906738281, 2.6316466331481934, 4.635466575622559, 6.639286518096924, 8.643106460571289, 10.646926879882812, 12.65074634552002, 14.654565811157227, 16.65838623046875, 18.662206649780273, 20.666027069091797, 22.669845581054688, 24.67366600036621, 26.677486419677734, 28.681304931640625, 30.68512535095215, 32.68894577026367, 34.69276428222656, 36.69658660888672, 38.70040512084961, 40.7042236328125, 42.708045959472656, 44.71186447143555, 46.71568298339844, 48.719505310058594, 50.723323822021484, 52.72714614868164, 54.73096466064453, 56.73478698730469, 58.73860549926758, 60.74242401123047, 62.746246337890625, 64.75006103515625, 66.7538833618164, 68.75769805908203, 70.76152038574219, 72.76534271240234, 74.7691650390625, 76.77297973632812, 78.77680206298828, 80.78062438964844]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 9.0, 8.0, 7.0, 7.0, 14.0, 23.0, 32.0, 39.0, 54.0, 100.0, 136.0, 214.0, 321.0, 541.0, 1008.0, 1741.0, 3303.0, 6737.0, 14351.0, 32271.0, 76168.0, 189862.0, 366958.0, 206547.0, 82315.0, 35035.0, 15613.0, 7149.0, 3555.0, 1823.0, 979.0, 567.0, 376.0, 245.0, 143.0, 97.0, 76.0, 41.0, 31.0, 21.0, 14.0, 10.0, 5.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.5625, -5.38616943359375, -5.2098388671875, -5.03350830078125, -4.857177734375, -4.68084716796875, -4.5045166015625, -4.32818603515625, -4.15185546875, -3.97552490234375, -3.7991943359375, -3.62286376953125, -3.446533203125, -3.27020263671875, -3.0938720703125, -2.91754150390625, -2.7412109375, -2.56488037109375, -2.3885498046875, -2.21221923828125, -2.035888671875, -1.85955810546875, -1.6832275390625, -1.50689697265625, -1.33056640625, -1.15423583984375, -0.9779052734375, -0.80157470703125, -0.625244140625, -0.44891357421875, -0.2725830078125, -0.09625244140625, 0.080078125, 0.25640869140625, 0.4327392578125, 0.60906982421875, 0.785400390625, 0.96173095703125, 1.1380615234375, 1.31439208984375, 1.49072265625, 1.66705322265625, 1.8433837890625, 2.01971435546875, 2.196044921875, 2.37237548828125, 2.5487060546875, 2.72503662109375, 2.9013671875, 3.07769775390625, 3.2540283203125, 3.43035888671875, 3.606689453125, 3.78302001953125, 3.9593505859375, 4.13568115234375, 4.31201171875, 4.48834228515625, 4.6646728515625, 4.84100341796875, 5.017333984375, 5.19366455078125, 5.3699951171875, 5.54632568359375, 5.72265625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 3.0, 5.0, 10.0, 14.0, 14.0, 24.0, 22.0, 37.0, 27.0, 33.0, 47.0, 47.0, 64.0, 61.0, 67.0, 72.0, 86.0, 60.0, 46.0, 54.0, 40.0, 33.0, 33.0, 20.0, 16.0, 18.0, 11.0, 9.0, 8.0, 11.0, 7.0, 4.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.07421875, -3.92523193359375, -3.7762451171875, -3.62725830078125, -3.478271484375, -3.32928466796875, -3.1802978515625, -3.03131103515625, -2.88232421875, -2.73333740234375, -2.5843505859375, -2.43536376953125, -2.286376953125, -2.13739013671875, -1.9884033203125, -1.83941650390625, -1.6904296875, -1.54144287109375, -1.3924560546875, -1.24346923828125, -1.094482421875, -0.94549560546875, -0.7965087890625, -0.64752197265625, -0.49853515625, -0.34954833984375, -0.2005615234375, -0.05157470703125, 0.097412109375, 0.24639892578125, 0.3953857421875, 0.54437255859375, 0.693359375, 0.84234619140625, 0.9913330078125, 1.14031982421875, 1.289306640625, 1.43829345703125, 1.5872802734375, 1.73626708984375, 1.88525390625, 2.03424072265625, 2.1832275390625, 2.33221435546875, 2.481201171875, 2.63018798828125, 2.7791748046875, 2.92816162109375, 3.0771484375, 3.22613525390625, 3.3751220703125, 3.52410888671875, 3.673095703125, 3.82208251953125, 3.9710693359375, 4.12005615234375, 4.26904296875, 4.41802978515625, 4.5670166015625, 4.71600341796875, 4.864990234375, 5.01397705078125, 5.1629638671875, 5.31195068359375, 5.4609375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 5.0, 3.0, 3.0, 3.0, 7.0, 8.0, 9.0, 16.0, 18.0, 32.0, 47.0, 87.0, 85.0, 172.0, 234.0, 346.0, 601.0, 1167.0, 2661.0, 8867.0, 66841.0, 749833.0, 191780.0, 18016.0, 3974.0, 1642.0, 819.0, 459.0, 268.0, 169.0, 107.0, 71.0, 51.0, 43.0, 22.0, 30.0, 19.0, 4.0, 13.0, 3.0, 5.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0546875, -13.596923828125, -13.13916015625, -12.681396484375, -12.2236328125, -11.765869140625, -11.30810546875, -10.850341796875, -10.392578125, -9.934814453125, -9.47705078125, -9.019287109375, -8.5615234375, -8.103759765625, -7.64599609375, -7.188232421875, -6.73046875, -6.272705078125, -5.81494140625, -5.357177734375, -4.8994140625, -4.441650390625, -3.98388671875, -3.526123046875, -3.068359375, -2.610595703125, -2.15283203125, -1.695068359375, -1.2373046875, -0.779541015625, -0.32177734375, 0.135986328125, 0.59375, 1.051513671875, 1.50927734375, 1.967041015625, 2.4248046875, 2.882568359375, 3.34033203125, 3.798095703125, 4.255859375, 4.713623046875, 5.17138671875, 5.629150390625, 6.0869140625, 6.544677734375, 7.00244140625, 7.460205078125, 7.91796875, 8.375732421875, 8.83349609375, 9.291259765625, 9.7490234375, 10.206787109375, 10.66455078125, 11.122314453125, 11.580078125, 12.037841796875, 12.49560546875, 12.953369140625, 13.4111328125, 13.868896484375, 14.32666015625, 14.784423828125, 15.2421875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 3.0, 5.0, 11.0, 10.0, 14.0, 21.0, 20.0, 31.0, 34.0, 52.0, 43.0, 61.0, 63.0, 79.0, 69.0, 83.0, 41.0, 52.0, 47.0, 53.0, 50.0, 34.0, 32.0, 24.0, 22.0, 12.0, 9.0, 10.0, 6.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.75, -20.064453125, -19.37890625, -18.693359375, -18.0078125, -17.322265625, -16.63671875, -15.951171875, -15.265625, -14.580078125, -13.89453125, -13.208984375, -12.5234375, -11.837890625, -11.15234375, -10.466796875, -9.78125, -9.095703125, -8.41015625, -7.724609375, -7.0390625, -6.353515625, -5.66796875, -4.982421875, -4.296875, -3.611328125, -2.92578125, -2.240234375, -1.5546875, -0.869140625, -0.18359375, 0.501953125, 1.1875, 1.873046875, 2.55859375, 3.244140625, 3.9296875, 4.615234375, 5.30078125, 5.986328125, 6.671875, 7.357421875, 8.04296875, 8.728515625, 9.4140625, 10.099609375, 10.78515625, 11.470703125, 12.15625, 12.841796875, 13.52734375, 14.212890625, 14.8984375, 15.583984375, 16.26953125, 16.955078125, 17.640625, 18.326171875, 19.01171875, 19.697265625, 20.3828125, 21.068359375, 21.75390625, 22.439453125, 23.125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 16.0, 20.0, 34.0, 60.0, 87.0, 166.0, 402.0, 1022.0, 4293.0, 35798.0, 886615.0, 108928.0, 8354.0, 1687.0, 556.0, 222.0, 92.0, 75.0, 48.0, 21.0, 19.0, 10.0, 8.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5703125, -6.314453125, -6.05859375, -5.802734375, -5.546875, -5.291015625, -5.03515625, -4.779296875, -4.5234375, -4.267578125, -4.01171875, -3.755859375, -3.5, -3.244140625, -2.98828125, -2.732421875, -2.4765625, -2.220703125, -1.96484375, -1.708984375, -1.453125, -1.197265625, -0.94140625, -0.685546875, -0.4296875, -0.173828125, 0.08203125, 0.337890625, 0.59375, 0.849609375, 1.10546875, 1.361328125, 1.6171875, 1.873046875, 2.12890625, 2.384765625, 2.640625, 2.896484375, 3.15234375, 3.408203125, 3.6640625, 3.919921875, 4.17578125, 4.431640625, 4.6875, 4.943359375, 5.19921875, 5.455078125, 5.7109375, 5.966796875, 6.22265625, 6.478515625, 6.734375, 6.990234375, 7.24609375, 7.501953125, 7.7578125, 8.013671875, 8.26953125, 8.525390625, 8.78125, 9.037109375, 9.29296875, 9.548828125, 9.8046875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 8.0, 4.0, 5.0, 6.0, 14.0, 11.0, 20.0, 29.0, 36.0, 60.0, 135.0, 217.0, 163.0, 124.0, 45.0, 35.0, 23.0, 15.0, 14.0, 12.0, 8.0, 6.0, 1.0, 2.0, 7.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012950897216796875, -0.001256793737411499, -0.0012184977531433105, -0.001180201768875122, -0.0011419057846069336, -0.0011036098003387451, -0.0010653138160705566, -0.0010270178318023682, -0.0009887218475341797, -0.0009504258632659912, -0.0009121298789978027, -0.0008738338947296143, -0.0008355379104614258, -0.0007972419261932373, -0.0007589459419250488, -0.0007206499576568604, -0.0006823539733886719, -0.0006440579891204834, -0.0006057620048522949, -0.0005674660205841064, -0.000529170036315918, -0.0004908740520477295, -0.000452578067779541, -0.00041428208351135254, -0.00037598609924316406, -0.0003376901149749756, -0.0002993941307067871, -0.00026109814643859863, -0.00022280216217041016, -0.00018450617790222168, -0.0001462101936340332, -0.00010791420936584473, -6.961822509765625e-05, -3.1322240829467773e-05, 6.973743438720703e-06, 4.526972770690918e-05, 8.356571197509766e-05, 0.00012186169624328613, 0.0001601576805114746, 0.00019845366477966309, 0.00023674964904785156, 0.00027504563331604004, 0.0003133416175842285, 0.000351637601852417, 0.00038993358612060547, 0.00042822957038879395, 0.0004665255546569824, 0.0005048215389251709, 0.0005431175231933594, 0.0005814135074615479, 0.0006197094917297363, 0.0006580054759979248, 0.0006963014602661133, 0.0007345974445343018, 0.0007728934288024902, 0.0008111894130706787, 0.0008494853973388672, 0.0008877813816070557, 0.0009260773658752441, 0.0009643733501434326, 0.001002669334411621, 0.0010409653186798096, 0.001079261302947998, 0.0011175572872161865, 0.001155853271484375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 9.0, 2.0, 3.0, 11.0, 13.0, 20.0, 17.0, 32.0, 64.0, 81.0, 125.0, 157.0, 295.0, 513.0, 1023.0, 2297.0, 5680.0, 19700.0, 124904.0, 766511.0, 100288.0, 17222.0, 5289.0, 2074.0, 938.0, 482.0, 277.0, 161.0, 100.0, 75.0, 56.0, 25.0, 30.0, 29.0, 18.0, 14.0, 3.0, 7.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.67578125, -4.51702880859375, -4.3582763671875, -4.19952392578125, -4.040771484375, -3.88201904296875, -3.7232666015625, -3.56451416015625, -3.40576171875, -3.24700927734375, -3.0882568359375, -2.92950439453125, -2.770751953125, -2.61199951171875, -2.4532470703125, -2.29449462890625, -2.1357421875, -1.97698974609375, -1.8182373046875, -1.65948486328125, -1.500732421875, -1.34197998046875, -1.1832275390625, -1.02447509765625, -0.86572265625, -0.70697021484375, -0.5482177734375, -0.38946533203125, -0.230712890625, -0.07196044921875, 0.0867919921875, 0.24554443359375, 0.404296875, 0.56304931640625, 0.7218017578125, 0.88055419921875, 1.039306640625, 1.19805908203125, 1.3568115234375, 1.51556396484375, 1.67431640625, 1.83306884765625, 1.9918212890625, 2.15057373046875, 2.309326171875, 2.46807861328125, 2.6268310546875, 2.78558349609375, 2.9443359375, 3.10308837890625, 3.2618408203125, 3.42059326171875, 3.579345703125, 3.73809814453125, 3.8968505859375, 4.05560302734375, 4.21435546875, 4.37310791015625, 4.5318603515625, 4.69061279296875, 4.849365234375, 5.00811767578125, 5.1668701171875, 5.32562255859375, 5.484375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 5.0, 6.0, 9.0, 13.0, 16.0, 24.0, 28.0, 28.0, 45.0, 60.0, 68.0, 83.0, 113.0, 106.0, 73.0, 74.0, 59.0, 33.0, 25.0, 23.0, 14.0, 14.0, 12.0, 13.0, 9.0, 5.0, 3.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.17578125, -4.03521728515625, -3.8946533203125, -3.75408935546875, -3.613525390625, -3.47296142578125, -3.3323974609375, -3.19183349609375, -3.05126953125, -2.91070556640625, -2.7701416015625, -2.62957763671875, -2.489013671875, -2.34844970703125, -2.2078857421875, -2.06732177734375, -1.9267578125, -1.78619384765625, -1.6456298828125, -1.50506591796875, -1.364501953125, -1.22393798828125, -1.0833740234375, -0.94281005859375, -0.80224609375, -0.66168212890625, -0.5211181640625, -0.38055419921875, -0.239990234375, -0.09942626953125, 0.0411376953125, 0.18170166015625, 0.322265625, 0.46282958984375, 0.6033935546875, 0.74395751953125, 0.884521484375, 1.02508544921875, 1.1656494140625, 1.30621337890625, 1.44677734375, 1.58734130859375, 1.7279052734375, 1.86846923828125, 2.009033203125, 2.14959716796875, 2.2901611328125, 2.43072509765625, 2.5712890625, 2.71185302734375, 2.8524169921875, 2.99298095703125, 3.133544921875, 3.27410888671875, 3.4146728515625, 3.55523681640625, 3.69580078125, 3.83636474609375, 3.9769287109375, 4.11749267578125, 4.258056640625, 4.39862060546875, 4.5391845703125, 4.67974853515625, 4.8203125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 8.0, 20.0, 35.0, 80.0, 169.0, 255.0, 200.0, 133.0, 52.0, 15.0, 9.0, 6.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.1579818725586, -96.41535949707031, -92.6727294921875, -88.93009948730469, -85.1874771118164, -81.44485473632812, -77.70222473144531, -73.9595947265625, -70.21697235107422, -66.47434997558594, -62.731719970703125, -58.98909378051758, -55.24646759033203, -51.503841400146484, -47.76121520996094, -44.01858901977539, -40.275962829589844, -36.5333366394043, -32.79071044921875, -29.048084259033203, -25.305458068847656, -21.56283187866211, -17.820205688476562, -14.077579498291016, -10.334953308105469, -6.592327117919922, -2.849700927734375, 0.8929252624511719, 4.635551452636719, 8.378177642822266, 12.120803833007812, 15.86343002319336, 19.606063842773438, 23.348690032958984, 27.09131622314453, 30.833942413330078, 34.576568603515625, 38.31919479370117, 42.06182098388672, 45.804447174072266, 49.54707336425781, 53.28969955444336, 57.032325744628906, 60.77495193481445, 64.517578125, 68.26020812988281, 72.0028305053711, 75.74545288085938, 79.48808288574219, 83.230712890625, 86.97333526611328, 90.71595764160156, 94.45858764648438, 98.20121765136719, 101.94384002685547, 105.68646240234375, 109.42909240722656, 113.17172241210938, 116.91434478759766, 120.65696716308594, 124.39959716796875, 128.14222717285156, 131.88485717773438, 135.62747192382812, 139.37010192871094]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 3.0, 7.0, 10.0, 14.0, 11.0, 11.0, 25.0, 23.0, 27.0, 26.0, 53.0, 47.0, 54.0, 86.0, 71.0, 68.0, 69.0, 65.0, 48.0, 51.0, 33.0, 40.0, 33.0, 19.0, 26.0, 13.0, 9.0, 11.0, 12.0, 8.0, 8.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-107.50023651123047, -104.55801391601562, -101.61579132080078, -98.67356872558594, -95.7313461303711, -92.78912353515625, -89.84689331054688, -86.90467834472656, -83.96244812011719, -81.02022552490234, -78.0780029296875, -75.13578033447266, -72.19355773925781, -69.25133514404297, -66.30911254882812, -63.366886138916016, -60.42466735839844, -57.482444763183594, -54.54022216796875, -51.597999572753906, -48.65577697753906, -45.71355438232422, -42.77132797241211, -39.829105377197266, -36.88688278198242, -33.94466018676758, -31.002437591552734, -28.060213088989258, -25.117990493774414, -22.17576789855957, -19.233543395996094, -16.29132080078125, -13.349098205566406, -10.406875610351562, -7.464652061462402, -4.522428512573242, -1.5802059173583984, 1.3620166778564453, 4.304241180419922, 7.246463775634766, 10.18868637084961, 13.130908966064453, 16.073131561279297, 19.015356063842773, 21.957578659057617, 24.89980125427246, 27.842025756835938, 30.78424835205078, 33.726470947265625, 36.66869354248047, 39.61091613769531, 42.553138732910156, 45.495361328125, 48.437583923339844, 51.37981033325195, 54.3220329284668, 57.26425552368164, 60.206478118896484, 63.14870071411133, 66.09092712402344, 69.03314971923828, 71.97537231445312, 74.91759490966797, 77.85981750488281, 80.80204010009766]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 11.0, 11.0, 14.0, 19.0, 24.0, 43.0, 62.0, 89.0, 126.0, 219.0, 519.0, 1741.0, 14787.0, 3951857.0, 217147.0, 5881.0, 918.0, 330.0, 166.0, 111.0, 67.0, 36.0, 28.0, 20.0, 17.0, 8.0, 8.0, 4.0, 5.0, 5.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.03125, -19.283935546875, -18.53662109375, -17.789306640625, -17.0419921875, -16.294677734375, -15.54736328125, -14.800048828125, -14.052734375, -13.305419921875, -12.55810546875, -11.810791015625, -11.0634765625, -10.316162109375, -9.56884765625, -8.821533203125, -8.07421875, -7.326904296875, -6.57958984375, -5.832275390625, -5.0849609375, -4.337646484375, -3.59033203125, -2.843017578125, -2.095703125, -1.348388671875, -0.60107421875, 0.146240234375, 0.8935546875, 1.640869140625, 2.38818359375, 3.135498046875, 3.8828125, 4.630126953125, 5.37744140625, 6.124755859375, 6.8720703125, 7.619384765625, 8.36669921875, 9.114013671875, 9.861328125, 10.608642578125, 11.35595703125, 12.103271484375, 12.8505859375, 13.597900390625, 14.34521484375, 15.092529296875, 15.83984375, 16.587158203125, 17.33447265625, 18.081787109375, 18.8291015625, 19.576416015625, 20.32373046875, 21.071044921875, 21.818359375, 22.565673828125, 23.31298828125, 24.060302734375, 24.8076171875, 25.554931640625, 26.30224609375, 27.049560546875, 27.796875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 8.0, 3.0, 6.0, 15.0, 30.0, 43.0, 66.0, 94.0, 131.0, 162.0, 152.0, 113.0, 74.0, 47.0, 28.0, 15.0, 11.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.2421875, -14.892333984375, -14.54248046875, -14.192626953125, -13.8427734375, -13.492919921875, -13.14306640625, -12.793212890625, -12.443359375, -12.093505859375, -11.74365234375, -11.393798828125, -11.0439453125, -10.694091796875, -10.34423828125, -9.994384765625, -9.64453125, -9.294677734375, -8.94482421875, -8.594970703125, -8.2451171875, -7.895263671875, -7.54541015625, -7.195556640625, -6.845703125, -6.495849609375, -6.14599609375, -5.796142578125, -5.4462890625, -5.096435546875, -4.74658203125, -4.396728515625, -4.046875, -3.697021484375, -3.34716796875, -2.997314453125, -2.6474609375, -2.297607421875, -1.94775390625, -1.597900390625, -1.248046875, -0.898193359375, -0.54833984375, -0.198486328125, 0.1513671875, 0.501220703125, 0.85107421875, 1.200927734375, 1.55078125, 1.900634765625, 2.25048828125, 2.600341796875, 2.9501953125, 3.300048828125, 3.64990234375, 3.999755859375, 4.349609375, 4.699462890625, 5.04931640625, 5.399169921875, 5.7490234375, 6.098876953125, 6.44873046875, 6.798583984375, 7.1484375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 5.0, 14.0, 11.0, 21.0, 24.0, 58.0, 64.0, 109.0, 156.0, 251.0, 461.0, 883.0, 1888.0, 4337.0, 11718.0, 39069.0, 256930.0, 3543980.0, 275769.0, 39888.0, 10939.0, 3925.0, 1667.0, 793.0, 415.0, 309.0, 171.0, 123.0, 86.0, 62.0, 39.0, 34.0, 34.0, 9.0, 14.0, 8.0, 8.0, 2.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.12890625, -6.87884521484375, -6.6287841796875, -6.37872314453125, -6.128662109375, -5.87860107421875, -5.6285400390625, -5.37847900390625, -5.12841796875, -4.87835693359375, -4.6282958984375, -4.37823486328125, -4.128173828125, -3.87811279296875, -3.6280517578125, -3.37799072265625, -3.1279296875, -2.87786865234375, -2.6278076171875, -2.37774658203125, -2.127685546875, -1.87762451171875, -1.6275634765625, -1.37750244140625, -1.12744140625, -0.87738037109375, -0.6273193359375, -0.37725830078125, -0.127197265625, 0.12286376953125, 0.3729248046875, 0.62298583984375, 0.873046875, 1.12310791015625, 1.3731689453125, 1.62322998046875, 1.873291015625, 2.12335205078125, 2.3734130859375, 2.62347412109375, 2.87353515625, 3.12359619140625, 3.3736572265625, 3.62371826171875, 3.873779296875, 4.12384033203125, 4.3739013671875, 4.62396240234375, 4.8740234375, 5.12408447265625, 5.3741455078125, 5.62420654296875, 5.874267578125, 6.12432861328125, 6.3743896484375, 6.62445068359375, 6.87451171875, 7.12457275390625, 7.3746337890625, 7.62469482421875, 7.874755859375, 8.12481689453125, 8.3748779296875, 8.62493896484375, 8.875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 5.0, 5.0, 7.0, 18.0, 16.0, 34.0, 52.0, 113.0, 355.0, 1442.0, 1415.0, 366.0, 113.0, 76.0, 21.0, 15.0, 7.0, 7.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.953125, -10.495849609375, -10.03857421875, -9.581298828125, -9.1240234375, -8.666748046875, -8.20947265625, -7.752197265625, -7.294921875, -6.837646484375, -6.38037109375, -5.923095703125, -5.4658203125, -5.008544921875, -4.55126953125, -4.093994140625, -3.63671875, -3.179443359375, -2.72216796875, -2.264892578125, -1.8076171875, -1.350341796875, -0.89306640625, -0.435791015625, 0.021484375, 0.478759765625, 0.93603515625, 1.393310546875, 1.8505859375, 2.307861328125, 2.76513671875, 3.222412109375, 3.6796875, 4.136962890625, 4.59423828125, 5.051513671875, 5.5087890625, 5.966064453125, 6.42333984375, 6.880615234375, 7.337890625, 7.795166015625, 8.25244140625, 8.709716796875, 9.1669921875, 9.624267578125, 10.08154296875, 10.538818359375, 10.99609375, 11.453369140625, 11.91064453125, 12.367919921875, 12.8251953125, 13.282470703125, 13.73974609375, 14.197021484375, 14.654296875, 15.111572265625, 15.56884765625, 16.026123046875, 16.4833984375, 16.940673828125, 17.39794921875, 17.855224609375, 18.3125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 6.0, 28.0, 68.0, 184.0, 234.0, 223.0, 124.0, 62.0, 32.0, 11.0, 9.0, 4.0, 2.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-122.49754333496094, -119.62767791748047, -116.75782012939453, -113.88795471191406, -111.01809692382812, -108.14823150634766, -105.27836608886719, -102.40850830078125, -99.53864288330078, -96.66877746582031, -93.79891967773438, -90.9290542602539, -88.05918884277344, -85.1893310546875, -82.31946563720703, -79.44960021972656, -76.57974243164062, -73.70987701416016, -70.84001922607422, -67.97015380859375, -65.10029602050781, -62.230430603027344, -59.360565185546875, -56.49070358276367, -53.62084197998047, -50.750980377197266, -47.88111877441406, -45.011253356933594, -42.14139175415039, -39.27153015136719, -36.40166473388672, -33.531803131103516, -30.661949157714844, -27.79208755493164, -24.922224044799805, -22.05236053466797, -19.182498931884766, -16.312637329101562, -13.442773818969727, -10.57291030883789, -7.7030487060546875, -4.833186149597168, -1.9633235931396484, 0.9065389633178711, 3.7764015197753906, 6.64626407623291, 9.51612663269043, 12.385990142822266, 15.255851745605469, 18.125713348388672, 20.995576858520508, 23.865440368652344, 26.735301971435547, 29.60516357421875, 32.47502899169922, 35.34489059448242, 38.214752197265625, 41.08461380004883, 43.95447540283203, 46.8243408203125, 49.6942024230957, 52.564064025878906, 55.433929443359375, 58.30379104614258, 61.17365264892578]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 6.0, 9.0, 14.0, 14.0, 15.0, 28.0, 25.0, 34.0, 47.0, 59.0, 62.0, 57.0, 67.0, 76.0, 67.0, 51.0, 51.0, 48.0, 57.0, 37.0, 30.0, 31.0, 25.0, 25.0, 18.0, 13.0, 13.0, 8.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.78485107421875, -32.36203384399414, -30.9392147064209, -29.516395568847656, -28.093578338623047, -26.670761108398438, -25.247941970825195, -23.825122833251953, -22.402305603027344, -20.979488372802734, -19.556669235229492, -18.13385009765625, -16.71103286743164, -15.288214683532715, -13.865396499633789, -12.442578315734863, -11.019760131835938, -9.596941947937012, -8.174123764038086, -6.75130558013916, -5.328487396240234, -3.9056692123413086, -2.482851028442383, -1.060032844543457, 0.36278533935546875, 1.7856035232543945, 3.2084217071533203, 4.631239891052246, 6.054058074951172, 7.476876258850098, 8.899694442749023, 10.32251262664795, 11.74532699584961, 13.168145179748535, 14.590963363647461, 16.013782501220703, 17.436599731445312, 18.859416961669922, 20.282236099243164, 21.705055236816406, 23.127872467041016, 24.550689697265625, 25.973508834838867, 27.39632797241211, 28.81914520263672, 30.241962432861328, 31.66478157043457, 33.08760070800781, 34.51041793823242, 35.93323516845703, 37.356056213378906, 38.778873443603516, 40.201690673828125, 41.624507904052734, 43.047325134277344, 44.47014617919922, 45.89296340942383, 47.31578063964844, 48.73860168457031, 50.16141891479492, 51.58423614501953, 53.00705337524414, 54.42987060546875, 55.852691650390625, 57.275508880615234]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 8.0, 14.0, 8.0, 16.0, 32.0, 34.0, 58.0, 78.0, 131.0, 169.0, 265.0, 465.0, 738.0, 1345.0, 2485.0, 4837.0, 9789.0, 21434.0, 50626.0, 129081.0, 335383.0, 299191.0, 110865.0, 43944.0, 19058.0, 8666.0, 4389.0, 2311.0, 1272.0, 691.0, 381.0, 270.0, 156.0, 116.0, 74.0, 64.0, 24.0, 24.0, 20.0, 12.0, 5.0, 8.0, 4.0, 4.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.71484375, -5.53582763671875, -5.3568115234375, -5.17779541015625, -4.998779296875, -4.81976318359375, -4.6407470703125, -4.46173095703125, -4.28271484375, -4.10369873046875, -3.9246826171875, -3.74566650390625, -3.566650390625, -3.38763427734375, -3.2086181640625, -3.02960205078125, -2.8505859375, -2.67156982421875, -2.4925537109375, -2.31353759765625, -2.134521484375, -1.95550537109375, -1.7764892578125, -1.59747314453125, -1.41845703125, -1.23944091796875, -1.0604248046875, -0.88140869140625, -0.702392578125, -0.52337646484375, -0.3443603515625, -0.16534423828125, 0.013671875, 0.19268798828125, 0.3717041015625, 0.55072021484375, 0.729736328125, 0.90875244140625, 1.0877685546875, 1.26678466796875, 1.44580078125, 1.62481689453125, 1.8038330078125, 1.98284912109375, 2.161865234375, 2.34088134765625, 2.5198974609375, 2.69891357421875, 2.8779296875, 3.05694580078125, 3.2359619140625, 3.41497802734375, 3.593994140625, 3.77301025390625, 3.9520263671875, 4.13104248046875, 4.31005859375, 4.48907470703125, 4.6680908203125, 4.84710693359375, 5.026123046875, 5.20513916015625, 5.3841552734375, 5.56317138671875, 5.7421875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 14.0, 12.0, 19.0, 16.0, 39.0, 43.0, 63.0, 81.0, 78.0, 87.0, 92.0, 96.0, 84.0, 75.0, 68.0, 47.0, 25.0, 23.0, 14.0, 8.0, 7.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.859375, -8.63421630859375, -8.4090576171875, -8.18389892578125, -7.958740234375, -7.73358154296875, -7.5084228515625, -7.28326416015625, -7.05810546875, -6.83294677734375, -6.6077880859375, -6.38262939453125, -6.157470703125, -5.93231201171875, -5.7071533203125, -5.48199462890625, -5.2568359375, -5.03167724609375, -4.8065185546875, -4.58135986328125, -4.356201171875, -4.13104248046875, -3.9058837890625, -3.68072509765625, -3.45556640625, -3.23040771484375, -3.0052490234375, -2.78009033203125, -2.554931640625, -2.32977294921875, -2.1046142578125, -1.87945556640625, -1.654296875, -1.42913818359375, -1.2039794921875, -0.97882080078125, -0.753662109375, -0.52850341796875, -0.3033447265625, -0.07818603515625, 0.14697265625, 0.37213134765625, 0.5972900390625, 0.82244873046875, 1.047607421875, 1.27276611328125, 1.4979248046875, 1.72308349609375, 1.9482421875, 2.17340087890625, 2.3985595703125, 2.62371826171875, 2.848876953125, 3.07403564453125, 3.2991943359375, 3.52435302734375, 3.74951171875, 3.97467041015625, 4.1998291015625, 4.42498779296875, 4.650146484375, 4.87530517578125, 5.1004638671875, 5.32562255859375, 5.55078125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 5.0, 5.0, 4.0, 10.0, 21.0, 17.0, 40.0, 43.0, 83.0, 91.0, 146.0, 286.0, 433.0, 909.0, 2121.0, 7047.0, 34178.0, 299846.0, 626811.0, 60440.0, 10437.0, 3049.0, 1215.0, 559.0, 294.0, 154.0, 103.0, 76.0, 39.0, 32.0, 19.0, 14.0, 9.0, 6.0, 5.0, 7.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0625, -11.662353515625, -11.26220703125, -10.862060546875, -10.4619140625, -10.061767578125, -9.66162109375, -9.261474609375, -8.861328125, -8.461181640625, -8.06103515625, -7.660888671875, -7.2607421875, -6.860595703125, -6.46044921875, -6.060302734375, -5.66015625, -5.260009765625, -4.85986328125, -4.459716796875, -4.0595703125, -3.659423828125, -3.25927734375, -2.859130859375, -2.458984375, -2.058837890625, -1.65869140625, -1.258544921875, -0.8583984375, -0.458251953125, -0.05810546875, 0.342041015625, 0.7421875, 1.142333984375, 1.54248046875, 1.942626953125, 2.3427734375, 2.742919921875, 3.14306640625, 3.543212890625, 3.943359375, 4.343505859375, 4.74365234375, 5.143798828125, 5.5439453125, 5.944091796875, 6.34423828125, 6.744384765625, 7.14453125, 7.544677734375, 7.94482421875, 8.344970703125, 8.7451171875, 9.145263671875, 9.54541015625, 9.945556640625, 10.345703125, 10.745849609375, 11.14599609375, 11.546142578125, 11.9462890625, 12.346435546875, 12.74658203125, 13.146728515625, 13.546875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 3.0, 6.0, 1.0, 7.0, 7.0, 12.0, 13.0, 17.0, 18.0, 24.0, 30.0, 41.0, 38.0, 51.0, 54.0, 72.0, 58.0, 60.0, 72.0, 72.0, 67.0, 50.0, 40.0, 36.0, 26.0, 33.0, 19.0, 22.0, 12.0, 12.0, 8.0, 10.0, 4.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.28125, -21.6396484375, -20.998046875, -20.3564453125, -19.71484375, -19.0732421875, -18.431640625, -17.7900390625, -17.1484375, -16.5068359375, -15.865234375, -15.2236328125, -14.58203125, -13.9404296875, -13.298828125, -12.6572265625, -12.015625, -11.3740234375, -10.732421875, -10.0908203125, -9.44921875, -8.8076171875, -8.166015625, -7.5244140625, -6.8828125, -6.2412109375, -5.599609375, -4.9580078125, -4.31640625, -3.6748046875, -3.033203125, -2.3916015625, -1.75, -1.1083984375, -0.466796875, 0.1748046875, 0.81640625, 1.4580078125, 2.099609375, 2.7412109375, 3.3828125, 4.0244140625, 4.666015625, 5.3076171875, 5.94921875, 6.5908203125, 7.232421875, 7.8740234375, 8.515625, 9.1572265625, 9.798828125, 10.4404296875, 11.08203125, 11.7236328125, 12.365234375, 13.0068359375, 13.6484375, 14.2900390625, 14.931640625, 15.5732421875, 16.21484375, 16.8564453125, 17.498046875, 18.1396484375, 18.78125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 3.0, 5.0, 10.0, 8.0, 14.0, 16.0, 27.0, 47.0, 122.0, 202.0, 644.0, 2596.0, 30944.0, 1004871.0, 6950.0, 1369.0, 392.0, 146.0, 69.0, 40.0, 23.0, 18.0, 10.0, 10.0, 8.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.3125, -24.4765625, -23.640625, -22.8046875, -21.96875, -21.1328125, -20.296875, -19.4609375, -18.625, -17.7890625, -16.953125, -16.1171875, -15.28125, -14.4453125, -13.609375, -12.7734375, -11.9375, -11.1015625, -10.265625, -9.4296875, -8.59375, -7.7578125, -6.921875, -6.0859375, -5.25, -4.4140625, -3.578125, -2.7421875, -1.90625, -1.0703125, -0.234375, 0.6015625, 1.4375, 2.2734375, 3.109375, 3.9453125, 4.78125, 5.6171875, 6.453125, 7.2890625, 8.125, 8.9609375, 9.796875, 10.6328125, 11.46875, 12.3046875, 13.140625, 13.9765625, 14.8125, 15.6484375, 16.484375, 17.3203125, 18.15625, 18.9921875, 19.828125, 20.6640625, 21.5, 22.3359375, 23.171875, 24.0078125, 24.84375, 25.6796875, 26.515625, 27.3515625, 28.1875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 10.0, 10.0, 19.0, 41.0, 95.0, 270.0, 322.0, 122.0, 45.0, 24.0, 14.0, 9.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.003551483154296875, -0.003474414348602295, -0.003397345542907715, -0.0033202767372131348, -0.0032432079315185547, -0.0031661391258239746, -0.0030890703201293945, -0.0030120015144348145, -0.0029349327087402344, -0.0028578639030456543, -0.0027807950973510742, -0.002703726291656494, -0.002626657485961914, -0.002549588680267334, -0.002472519874572754, -0.002395451068878174, -0.0023183822631835938, -0.0022413134574890137, -0.0021642446517944336, -0.0020871758460998535, -0.0020101070404052734, -0.0019330382347106934, -0.0018559694290161133, -0.0017789006233215332, -0.0017018318176269531, -0.001624763011932373, -0.001547694206237793, -0.0014706254005432129, -0.0013935565948486328, -0.0013164877891540527, -0.0012394189834594727, -0.0011623501777648926, -0.0010852813720703125, -0.0010082125663757324, -0.0009311437606811523, -0.0008540749549865723, -0.0007770061492919922, -0.0006999373435974121, -0.000622868537902832, -0.000545799732208252, -0.0004687309265136719, -0.0003916621208190918, -0.0003145933151245117, -0.00023752450942993164, -0.00016045570373535156, -8.338689804077148e-05, -6.318092346191406e-06, 7.075071334838867e-05, 0.00014781951904296875, 0.00022488832473754883, 0.0003019571304321289, 0.000379025936126709, 0.00045609474182128906, 0.0005331635475158691, 0.0006102323532104492, 0.0006873011589050293, 0.0007643699645996094, 0.0008414387702941895, 0.0009185075759887695, 0.0009955763816833496, 0.0010726451873779297, 0.0011497139930725098, 0.0012267827987670898, 0.00130385160446167, 0.00138092041015625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 10.0, 24.0, 25.0, 55.0, 86.0, 173.0, 344.0, 1170.0, 6873.0, 964426.0, 71123.0, 2934.0, 737.0, 279.0, 123.0, 72.0, 34.0, 22.0, 11.0, 10.0, 7.0, 8.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-30.6875, -29.953369140625, -29.21923828125, -28.485107421875, -27.7509765625, -27.016845703125, -26.28271484375, -25.548583984375, -24.814453125, -24.080322265625, -23.34619140625, -22.612060546875, -21.8779296875, -21.143798828125, -20.40966796875, -19.675537109375, -18.94140625, -18.207275390625, -17.47314453125, -16.739013671875, -16.0048828125, -15.270751953125, -14.53662109375, -13.802490234375, -13.068359375, -12.334228515625, -11.60009765625, -10.865966796875, -10.1318359375, -9.397705078125, -8.66357421875, -7.929443359375, -7.1953125, -6.461181640625, -5.72705078125, -4.992919921875, -4.2587890625, -3.524658203125, -2.79052734375, -2.056396484375, -1.322265625, -0.588134765625, 0.14599609375, 0.880126953125, 1.6142578125, 2.348388671875, 3.08251953125, 3.816650390625, 4.55078125, 5.284912109375, 6.01904296875, 6.753173828125, 7.4873046875, 8.221435546875, 8.95556640625, 9.689697265625, 10.423828125, 11.157958984375, 11.89208984375, 12.626220703125, 13.3603515625, 14.094482421875, 14.82861328125, 15.562744140625, 16.296875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 6.0, 10.0, 25.0, 41.0, 107.0, 235.0, 296.0, 166.0, 63.0, 19.0, 12.0, 6.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.984375, -8.5390625, -8.09375, -7.6484375, -7.203125, -6.7578125, -6.3125, -5.8671875, -5.421875, -4.9765625, -4.53125, -4.0859375, -3.640625, -3.1953125, -2.75, -2.3046875, -1.859375, -1.4140625, -0.96875, -0.5234375, -0.078125, 0.3671875, 0.8125, 1.2578125, 1.703125, 2.1484375, 2.59375, 3.0390625, 3.484375, 3.9296875, 4.375, 4.8203125, 5.265625, 5.7109375, 6.15625, 6.6015625, 7.046875, 7.4921875, 7.9375, 8.3828125, 8.828125, 9.2734375, 9.71875, 10.1640625, 10.609375, 11.0546875, 11.5, 11.9453125, 12.390625, 12.8359375, 13.28125, 13.7265625, 14.171875, 14.6171875, 15.0625, 15.5078125, 15.953125, 16.3984375, 16.84375, 17.2890625, 17.734375, 18.1796875, 18.625, 19.0703125, 19.515625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 7.0, 17.0, 67.0, 140.0, 387.0, 267.0, 79.0, 14.0, 10.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-243.15481567382812, -235.982177734375, -228.8095245361328, -221.6368865966797, -214.4642333984375, -207.29159545898438, -200.11895751953125, -192.94631958007812, -185.77366638183594, -178.6010284423828, -171.42837524414062, -164.2557373046875, -157.08309936523438, -149.9104461669922, -142.73780822753906, -135.56515502929688, -128.39251708984375, -121.2198715209961, -114.04722595214844, -106.87458801269531, -99.70194244384766, -92.529296875, -85.35665893554688, -78.18401336669922, -71.01136779785156, -63.838722229003906, -56.666080474853516, -49.493438720703125, -42.32079315185547, -35.14814758300781, -27.975505828857422, -20.80286407470703, -13.630218505859375, -6.457574844360352, 0.7150688171386719, 7.887712478637695, 15.060356140136719, 22.233001708984375, 29.405643463134766, 36.578285217285156, 43.75093078613281, 50.92357635498047, 58.09621810913086, 65.26885986328125, 72.4415054321289, 79.61415100097656, 86.78678894042969, 93.95943450927734, 101.132080078125, 108.30472564697266, 115.47737121582031, 122.65000915527344, 129.82266235351562, 136.99530029296875, 144.16793823242188, 151.340576171875, 158.5132293701172, 165.6858673095703, 172.8585205078125, 180.03115844726562, 187.20379638671875, 194.37644958496094, 201.54908752441406, 208.72174072265625, 215.89437866210938]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 5.0, 2.0, 11.0, 7.0, 6.0, 6.0, 20.0, 20.0, 19.0, 26.0, 37.0, 36.0, 50.0, 43.0, 44.0, 62.0, 81.0, 86.0, 60.0, 42.0, 42.0, 44.0, 32.0, 38.0, 19.0, 41.0, 29.0, 17.0, 14.0, 18.0, 11.0, 9.0, 8.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-80.77488708496094, -78.02449798583984, -75.27410125732422, -72.52371215820312, -69.7733154296875, -67.0229263305664, -64.27253723144531, -61.52214431762695, -58.771751403808594, -56.021358489990234, -53.270965576171875, -50.52057647705078, -47.77018356323242, -45.01979064941406, -42.26940155029297, -39.51900863647461, -36.76861572265625, -34.01822280883789, -31.267831802368164, -28.517440795898438, -25.767047882080078, -23.01665496826172, -20.266263961791992, -17.515872955322266, -14.765480041503906, -12.015088081359863, -9.26469612121582, -6.514304161071777, -3.7639122009277344, -1.0135202407836914, 1.7368717193603516, 4.487262725830078, 7.237663269042969, 9.988055229187012, 12.738447189331055, 15.488839149475098, 18.23923110961914, 20.9896240234375, 23.740015029907227, 26.490406036376953, 29.240798950195312, 31.991191864013672, 34.74158477783203, 37.491973876953125, 40.242366790771484, 42.992759704589844, 45.74314880371094, 48.4935417175293, 51.243934631347656, 53.994327545166016, 56.744720458984375, 59.49510955810547, 62.24550247192383, 64.99589538574219, 67.74628448486328, 70.49667358398438, 73.2470703125, 75.9974594116211, 78.74785614013672, 81.49824523925781, 84.24864196777344, 86.99903106689453, 89.74942016601562, 92.49981689453125, 95.25020599365234]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 10.0, 12.0, 16.0, 18.0, 27.0, 38.0, 60.0, 110.0, 199.0, 529.0, 1823.0, 8421.0, 66376.0, 3255858.0, 823553.0, 30389.0, 4894.0, 1144.0, 401.0, 178.0, 67.0, 58.0, 27.0, 25.0, 12.0, 13.0, 6.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.203125, -9.8228759765625, -9.442626953125, -9.0623779296875, -8.68212890625, -8.3018798828125, -7.921630859375, -7.5413818359375, -7.1611328125, -6.7808837890625, -6.400634765625, -6.0203857421875, -5.64013671875, -5.2598876953125, -4.879638671875, -4.4993896484375, -4.119140625, -3.7388916015625, -3.358642578125, -2.9783935546875, -2.59814453125, -2.2178955078125, -1.837646484375, -1.4573974609375, -1.0771484375, -0.6968994140625, -0.316650390625, 0.0635986328125, 0.44384765625, 0.8240966796875, 1.204345703125, 1.5845947265625, 1.96484375, 2.3450927734375, 2.725341796875, 3.1055908203125, 3.48583984375, 3.8660888671875, 4.246337890625, 4.6265869140625, 5.0068359375, 5.3870849609375, 5.767333984375, 6.1475830078125, 6.52783203125, 6.9080810546875, 7.288330078125, 7.6685791015625, 8.048828125, 8.4290771484375, 8.809326171875, 9.1895751953125, 9.56982421875, 9.9500732421875, 10.330322265625, 10.7105712890625, 11.0908203125, 11.4710693359375, 11.851318359375, 12.2315673828125, 12.61181640625, 12.9920654296875, 13.372314453125, 13.7525634765625, 14.1328125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 9.0, 8.0, 11.0, 16.0, 34.0, 39.0, 40.0, 51.0, 70.0, 84.0, 65.0, 97.0, 77.0, 98.0, 64.0, 77.0, 44.0, 26.0, 31.0, 28.0, 15.0, 8.0, 10.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.73046875, -3.55059814453125, -3.3707275390625, -3.19085693359375, -3.010986328125, -2.83111572265625, -2.6512451171875, -2.47137451171875, -2.29150390625, -2.11163330078125, -1.9317626953125, -1.75189208984375, -1.572021484375, -1.39215087890625, -1.2122802734375, -1.03240966796875, -0.8525390625, -0.67266845703125, -0.4927978515625, -0.31292724609375, -0.133056640625, 0.04681396484375, 0.2266845703125, 0.40655517578125, 0.58642578125, 0.76629638671875, 0.9461669921875, 1.12603759765625, 1.305908203125, 1.48577880859375, 1.6656494140625, 1.84552001953125, 2.025390625, 2.20526123046875, 2.3851318359375, 2.56500244140625, 2.744873046875, 2.92474365234375, 3.1046142578125, 3.28448486328125, 3.46435546875, 3.64422607421875, 3.8240966796875, 4.00396728515625, 4.183837890625, 4.36370849609375, 4.5435791015625, 4.72344970703125, 4.9033203125, 5.08319091796875, 5.2630615234375, 5.44293212890625, 5.622802734375, 5.80267333984375, 5.9825439453125, 6.16241455078125, 6.34228515625, 6.52215576171875, 6.7020263671875, 6.88189697265625, 7.061767578125, 7.24163818359375, 7.4215087890625, 7.60137939453125, 7.78125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 4.0, 5.0, 11.0, 17.0, 18.0, 28.0, 43.0, 59.0, 102.0, 177.0, 373.0, 772.0, 1877.0, 5885.0, 24604.0, 149394.0, 3286537.0, 659434.0, 49822.0, 9915.0, 2919.0, 1101.0, 512.0, 238.0, 152.0, 88.0, 63.0, 42.0, 29.0, 19.0, 13.0, 10.0, 6.0, 5.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-10.6015625, -10.296630859375, -9.99169921875, -9.686767578125, -9.3818359375, -9.076904296875, -8.77197265625, -8.467041015625, -8.162109375, -7.857177734375, -7.55224609375, -7.247314453125, -6.9423828125, -6.637451171875, -6.33251953125, -6.027587890625, -5.72265625, -5.417724609375, -5.11279296875, -4.807861328125, -4.5029296875, -4.197998046875, -3.89306640625, -3.588134765625, -3.283203125, -2.978271484375, -2.67333984375, -2.368408203125, -2.0634765625, -1.758544921875, -1.45361328125, -1.148681640625, -0.84375, -0.538818359375, -0.23388671875, 0.071044921875, 0.3759765625, 0.680908203125, 0.98583984375, 1.290771484375, 1.595703125, 1.900634765625, 2.20556640625, 2.510498046875, 2.8154296875, 3.120361328125, 3.42529296875, 3.730224609375, 4.03515625, 4.340087890625, 4.64501953125, 4.949951171875, 5.2548828125, 5.559814453125, 5.86474609375, 6.169677734375, 6.474609375, 6.779541015625, 7.08447265625, 7.389404296875, 7.6943359375, 7.999267578125, 8.30419921875, 8.609130859375, 8.9140625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 8.0, 5.0, 5.0, 8.0, 9.0, 12.0, 14.0, 14.0, 24.0, 31.0, 38.0, 49.0, 67.0, 94.0, 118.0, 200.0, 341.0, 603.0, 855.0, 624.0, 406.0, 193.0, 109.0, 74.0, 54.0, 21.0, 26.0, 7.0, 7.0, 11.0, 6.0, 6.0, 7.0, 6.0, 1.0, 4.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.8203125, -7.5716552734375, -7.322998046875, -7.0743408203125, -6.82568359375, -6.5770263671875, -6.328369140625, -6.0797119140625, -5.8310546875, -5.5823974609375, -5.333740234375, -5.0850830078125, -4.83642578125, -4.5877685546875, -4.339111328125, -4.0904541015625, -3.841796875, -3.5931396484375, -3.344482421875, -3.0958251953125, -2.84716796875, -2.5985107421875, -2.349853515625, -2.1011962890625, -1.8525390625, -1.6038818359375, -1.355224609375, -1.1065673828125, -0.85791015625, -0.6092529296875, -0.360595703125, -0.1119384765625, 0.13671875, 0.3853759765625, 0.634033203125, 0.8826904296875, 1.13134765625, 1.3800048828125, 1.628662109375, 1.8773193359375, 2.1259765625, 2.3746337890625, 2.623291015625, 2.8719482421875, 3.12060546875, 3.3692626953125, 3.617919921875, 3.8665771484375, 4.115234375, 4.3638916015625, 4.612548828125, 4.8612060546875, 5.10986328125, 5.3585205078125, 5.607177734375, 5.8558349609375, 6.1044921875, 6.3531494140625, 6.601806640625, 6.8504638671875, 7.09912109375, 7.3477783203125, 7.596435546875, 7.8450927734375, 8.09375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 5.0, 3.0, 13.0, 18.0, 64.0, 98.0, 219.0, 256.0, 169.0, 89.0, 32.0, 10.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-171.29298400878906, -167.5221405029297, -163.7512969970703, -159.98045349121094, -156.20960998535156, -152.4387664794922, -148.6679229736328, -144.89707946777344, -141.12623596191406, -137.3553924560547, -133.5845489501953, -129.81370544433594, -126.04286193847656, -122.27201843261719, -118.50117492675781, -114.73033142089844, -110.95948791503906, -107.18864440917969, -103.41780090332031, -99.64695739746094, -95.87611389160156, -92.10527038574219, -88.33442687988281, -84.56358337402344, -80.79273223876953, -77.02188873291016, -73.25104522705078, -69.4802017211914, -65.70935821533203, -61.938514709472656, -58.16767120361328, -54.396827697753906, -50.62598419189453, -46.855140686035156, -43.08429718017578, -39.313453674316406, -35.54261016845703, -31.771764755249023, -28.00092124938965, -24.230077743530273, -20.4592342376709, -16.688390731811523, -12.917547225952148, -9.146702766418457, -5.375859260559082, -1.6050148010253906, 2.1658287048339844, 5.936672210693359, 9.707515716552734, 13.47835922241211, 17.249202728271484, 21.02004623413086, 24.790889739990234, 28.561735153198242, 32.33258056640625, 36.103424072265625, 39.874267578125, 43.645111083984375, 47.41595458984375, 51.186798095703125, 54.9576416015625, 58.728485107421875, 62.49932861328125, 66.27017211914062, 70.041015625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 6.0, 1.0, 5.0, 6.0, 12.0, 17.0, 23.0, 13.0, 19.0, 29.0, 49.0, 47.0, 43.0, 49.0, 45.0, 35.0, 62.0, 50.0, 55.0, 52.0, 49.0, 58.0, 47.0, 42.0, 38.0, 39.0, 24.0, 19.0, 18.0, 16.0, 4.0, 5.0, 7.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-61.02311706542969, -59.32658386230469, -57.63005065917969, -55.93351364135742, -54.23698043823242, -52.54044723510742, -50.843910217285156, -49.147377014160156, -47.450843811035156, -45.754310607910156, -44.057777404785156, -42.36124038696289, -40.66470718383789, -38.96817398071289, -37.271636962890625, -35.575103759765625, -33.878570556640625, -32.182037353515625, -30.485502243041992, -28.78896713256836, -27.09243392944336, -25.39590072631836, -23.699365615844727, -22.002830505371094, -20.306297302246094, -18.609764099121094, -16.91322898864746, -15.216694831848145, -13.520160675048828, -11.823626518249512, -10.127092361450195, -8.430558204650879, -6.734020233154297, -5.0374860763549805, -3.340951919555664, -1.6444177627563477, 0.05211639404296875, 1.7486505508422852, 3.4451847076416016, 5.141718864440918, 6.838253021240234, 8.53478717803955, 10.231321334838867, 11.927855491638184, 13.6243896484375, 15.320923805236816, 17.017457962036133, 18.713993072509766, 20.410526275634766, 22.107059478759766, 23.8035945892334, 25.50012969970703, 27.19666290283203, 28.89319610595703, 30.589731216430664, 32.2862663269043, 33.9827995300293, 35.6793327331543, 37.37586975097656, 39.07240295410156, 40.76893615722656, 42.46546936035156, 44.16200256347656, 45.85853958129883, 47.55507278442383]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 4.0, 7.0, 13.0, 16.0, 18.0, 28.0, 37.0, 66.0, 101.0, 153.0, 230.0, 376.0, 576.0, 1029.0, 1886.0, 3602.0, 7184.0, 14418.0, 29942.0, 62879.0, 130906.0, 256986.0, 268575.0, 139363.0, 66953.0, 31813.0, 15372.0, 7474.0, 3743.0, 2008.0, 1167.0, 622.0, 335.0, 242.0, 148.0, 81.0, 59.0, 42.0, 36.0, 18.0, 11.0, 10.0, 9.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.5, -4.35955810546875, -4.2191162109375, -4.07867431640625, -3.938232421875, -3.79779052734375, -3.6573486328125, -3.51690673828125, -3.37646484375, -3.23602294921875, -3.0955810546875, -2.95513916015625, -2.814697265625, -2.67425537109375, -2.5338134765625, -2.39337158203125, -2.2529296875, -2.11248779296875, -1.9720458984375, -1.83160400390625, -1.691162109375, -1.55072021484375, -1.4102783203125, -1.26983642578125, -1.12939453125, -0.98895263671875, -0.8485107421875, -0.70806884765625, -0.567626953125, -0.42718505859375, -0.2867431640625, -0.14630126953125, -0.005859375, 0.13458251953125, 0.2750244140625, 0.41546630859375, 0.555908203125, 0.69635009765625, 0.8367919921875, 0.97723388671875, 1.11767578125, 1.25811767578125, 1.3985595703125, 1.53900146484375, 1.679443359375, 1.81988525390625, 1.9603271484375, 2.10076904296875, 2.2412109375, 2.38165283203125, 2.5220947265625, 2.66253662109375, 2.802978515625, 2.94342041015625, 3.0838623046875, 3.22430419921875, 3.36474609375, 3.50518798828125, 3.6456298828125, 3.78607177734375, 3.926513671875, 4.06695556640625, 4.2073974609375, 4.34783935546875, 4.48828125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 6.0, 6.0, 5.0, 6.0, 9.0, 9.0, 12.0, 10.0, 20.0, 14.0, 17.0, 22.0, 36.0, 27.0, 52.0, 39.0, 41.0, 48.0, 51.0, 52.0, 45.0, 46.0, 54.0, 52.0, 53.0, 39.0, 28.0, 32.0, 27.0, 25.0, 23.0, 16.0, 17.0, 12.0, 17.0, 12.0, 6.0, 4.0, 7.0, 7.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-3.638671875, -3.539398193359375, -3.44012451171875, -3.340850830078125, -3.2415771484375, -3.142303466796875, -3.04302978515625, -2.943756103515625, -2.844482421875, -2.745208740234375, -2.64593505859375, -2.546661376953125, -2.4473876953125, -2.348114013671875, -2.24884033203125, -2.149566650390625, -2.05029296875, -1.951019287109375, -1.85174560546875, -1.752471923828125, -1.6531982421875, -1.553924560546875, -1.45465087890625, -1.355377197265625, -1.256103515625, -1.156829833984375, -1.05755615234375, -0.958282470703125, -0.8590087890625, -0.759735107421875, -0.66046142578125, -0.561187744140625, -0.4619140625, -0.362640380859375, -0.26336669921875, -0.164093017578125, -0.0648193359375, 0.034454345703125, 0.13372802734375, 0.233001708984375, 0.332275390625, 0.431549072265625, 0.53082275390625, 0.630096435546875, 0.7293701171875, 0.828643798828125, 0.92791748046875, 1.027191162109375, 1.12646484375, 1.225738525390625, 1.32501220703125, 1.424285888671875, 1.5235595703125, 1.622833251953125, 1.72210693359375, 1.821380615234375, 1.920654296875, 2.019927978515625, 2.11920166015625, 2.218475341796875, 2.3177490234375, 2.417022705078125, 2.51629638671875, 2.615570068359375, 2.71484375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 3.0, 3.0, 1.0, 7.0, 5.0, 8.0, 7.0, 8.0, 16.0, 24.0, 31.0, 40.0, 50.0, 62.0, 97.0, 107.0, 171.0, 222.0, 273.0, 353.0, 559.0, 757.0, 1203.0, 2070.0, 4212.0, 11807.0, 46240.0, 225574.0, 600794.0, 113238.0, 25130.0, 7305.0, 3022.0, 1683.0, 974.0, 682.0, 431.0, 348.0, 264.0, 202.0, 150.0, 126.0, 73.0, 59.0, 35.0, 39.0, 27.0, 24.0, 12.0, 16.0, 8.0, 3.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.421875, -8.1527099609375, -7.883544921875, -7.6143798828125, -7.34521484375, -7.0760498046875, -6.806884765625, -6.5377197265625, -6.2685546875, -5.9993896484375, -5.730224609375, -5.4610595703125, -5.19189453125, -4.9227294921875, -4.653564453125, -4.3843994140625, -4.115234375, -3.8460693359375, -3.576904296875, -3.3077392578125, -3.03857421875, -2.7694091796875, -2.500244140625, -2.2310791015625, -1.9619140625, -1.6927490234375, -1.423583984375, -1.1544189453125, -0.88525390625, -0.6160888671875, -0.346923828125, -0.0777587890625, 0.19140625, 0.4605712890625, 0.729736328125, 0.9989013671875, 1.26806640625, 1.5372314453125, 1.806396484375, 2.0755615234375, 2.3447265625, 2.6138916015625, 2.883056640625, 3.1522216796875, 3.42138671875, 3.6905517578125, 3.959716796875, 4.2288818359375, 4.498046875, 4.7672119140625, 5.036376953125, 5.3055419921875, 5.57470703125, 5.8438720703125, 6.113037109375, 6.3822021484375, 6.6513671875, 6.9205322265625, 7.189697265625, 7.4588623046875, 7.72802734375, 7.9971923828125, 8.266357421875, 8.5355224609375, 8.8046875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 6.0, 7.0, 7.0, 9.0, 7.0, 10.0, 18.0, 11.0, 23.0, 22.0, 24.0, 31.0, 31.0, 34.0, 41.0, 45.0, 40.0, 41.0, 47.0, 50.0, 53.0, 36.0, 40.0, 43.0, 40.0, 36.0, 37.0, 23.0, 28.0, 17.0, 14.0, 26.0, 19.0, 23.0, 16.0, 10.0, 7.0, 6.0, 2.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-12.6015625, -12.192138671875, -11.78271484375, -11.373291015625, -10.9638671875, -10.554443359375, -10.14501953125, -9.735595703125, -9.326171875, -8.916748046875, -8.50732421875, -8.097900390625, -7.6884765625, -7.279052734375, -6.86962890625, -6.460205078125, -6.05078125, -5.641357421875, -5.23193359375, -4.822509765625, -4.4130859375, -4.003662109375, -3.59423828125, -3.184814453125, -2.775390625, -2.365966796875, -1.95654296875, -1.547119140625, -1.1376953125, -0.728271484375, -0.31884765625, 0.090576171875, 0.5, 0.909423828125, 1.31884765625, 1.728271484375, 2.1376953125, 2.547119140625, 2.95654296875, 3.365966796875, 3.775390625, 4.184814453125, 4.59423828125, 5.003662109375, 5.4130859375, 5.822509765625, 6.23193359375, 6.641357421875, 7.05078125, 7.460205078125, 7.86962890625, 8.279052734375, 8.6884765625, 9.097900390625, 9.50732421875, 9.916748046875, 10.326171875, 10.735595703125, 11.14501953125, 11.554443359375, 11.9638671875, 12.373291015625, 12.78271484375, 13.192138671875, 13.6015625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 0.0, 8.0, 8.0, 7.0, 10.0, 12.0, 28.0, 33.0, 51.0, 75.0, 115.0, 175.0, 310.0, 477.0, 853.0, 1846.0, 4872.0, 15736.0, 74247.0, 711578.0, 193740.0, 30669.0, 7925.0, 2883.0, 1229.0, 623.0, 360.0, 238.0, 140.0, 107.0, 53.0, 42.0, 39.0, 17.0, 9.0, 12.0, 8.0, 5.0, 2.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.8828125, -4.733642578125, -4.58447265625, -4.435302734375, -4.2861328125, -4.136962890625, -3.98779296875, -3.838623046875, -3.689453125, -3.540283203125, -3.39111328125, -3.241943359375, -3.0927734375, -2.943603515625, -2.79443359375, -2.645263671875, -2.49609375, -2.346923828125, -2.19775390625, -2.048583984375, -1.8994140625, -1.750244140625, -1.60107421875, -1.451904296875, -1.302734375, -1.153564453125, -1.00439453125, -0.855224609375, -0.7060546875, -0.556884765625, -0.40771484375, -0.258544921875, -0.109375, 0.039794921875, 0.18896484375, 0.338134765625, 0.4873046875, 0.636474609375, 0.78564453125, 0.934814453125, 1.083984375, 1.233154296875, 1.38232421875, 1.531494140625, 1.6806640625, 1.829833984375, 1.97900390625, 2.128173828125, 2.27734375, 2.426513671875, 2.57568359375, 2.724853515625, 2.8740234375, 3.023193359375, 3.17236328125, 3.321533203125, 3.470703125, 3.619873046875, 3.76904296875, 3.918212890625, 4.0673828125, 4.216552734375, 4.36572265625, 4.514892578125, 4.6640625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 3.0, 6.0, 7.0, 4.0, 19.0, 22.0, 24.0, 23.0, 38.0, 53.0, 96.0, 156.0, 178.0, 103.0, 61.0, 49.0, 45.0, 27.0, 18.0, 14.0, 14.0, 8.0, 10.0, 9.0, 5.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008721351623535156, -0.0008265599608421326, -0.0007809847593307495, -0.0007354095578193665, -0.0006898343563079834, -0.0006442591547966003, -0.0005986839532852173, -0.0005531087517738342, -0.0005075335502624512, -0.0004619583487510681, -0.00041638314723968506, -0.000370807945728302, -0.00032523274421691895, -0.0002796575427055359, -0.00023408234119415283, -0.00018850713968276978, -0.00014293193817138672, -9.735673666000366e-05, -5.1781535148620605e-05, -6.206333637237549e-06, 3.936886787414551e-05, 8.494406938552856e-05, 0.00013051927089691162, 0.00017609447240829468, 0.00022166967391967773, 0.0002672448754310608, 0.00031282007694244385, 0.0003583952784538269, 0.00040397047996520996, 0.000449545681476593, 0.0004951208829879761, 0.0005406960844993591, 0.0005862712860107422, 0.0006318464875221252, 0.0006774216890335083, 0.0007229968905448914, 0.0007685720920562744, 0.0008141472935676575, 0.0008597224950790405, 0.0009052976965904236, 0.0009508728981018066, 0.0009964480996131897, 0.0010420233011245728, 0.0010875985026359558, 0.0011331737041473389, 0.001178748905658722, 0.001224324107170105, 0.001269899308681488, 0.001315474510192871, 0.0013610497117042542, 0.0014066249132156372, 0.0014522001147270203, 0.0014977753162384033, 0.0015433505177497864, 0.0015889257192611694, 0.0016345009207725525, 0.0016800761222839355, 0.0017256513237953186, 0.0017712265253067017, 0.0018168017268180847, 0.0018623769283294678, 0.0019079521298408508, 0.001953527331352234, 0.001999102532863617, 0.002044677734375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 2.0, 3.0, 6.0, 10.0, 16.0, 16.0, 24.0, 34.0, 49.0, 83.0, 140.0, 218.0, 429.0, 888.0, 1943.0, 4447.0, 12619.0, 48727.0, 394445.0, 512498.0, 50501.0, 12957.0, 4531.0, 1904.0, 941.0, 425.0, 277.0, 143.0, 111.0, 57.0, 39.0, 16.0, 20.0, 17.0, 9.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.3671875, -4.2216796875, -4.076171875, -3.9306640625, -3.78515625, -3.6396484375, -3.494140625, -3.3486328125, -3.203125, -3.0576171875, -2.912109375, -2.7666015625, -2.62109375, -2.4755859375, -2.330078125, -2.1845703125, -2.0390625, -1.8935546875, -1.748046875, -1.6025390625, -1.45703125, -1.3115234375, -1.166015625, -1.0205078125, -0.875, -0.7294921875, -0.583984375, -0.4384765625, -0.29296875, -0.1474609375, -0.001953125, 0.1435546875, 0.2890625, 0.4345703125, 0.580078125, 0.7255859375, 0.87109375, 1.0166015625, 1.162109375, 1.3076171875, 1.453125, 1.5986328125, 1.744140625, 1.8896484375, 2.03515625, 2.1806640625, 2.326171875, 2.4716796875, 2.6171875, 2.7626953125, 2.908203125, 3.0537109375, 3.19921875, 3.3447265625, 3.490234375, 3.6357421875, 3.78125, 3.9267578125, 4.072265625, 4.2177734375, 4.36328125, 4.5087890625, 4.654296875, 4.7998046875, 4.9453125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 6.0, 14.0, 9.0, 7.0, 5.0, 10.0, 20.0, 23.0, 43.0, 52.0, 55.0, 49.0, 95.0, 114.0, 92.0, 97.0, 67.0, 55.0, 38.0, 29.0, 28.0, 18.0, 22.0, 8.0, 8.0, 11.0, 3.0, 10.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.66796875, -4.53094482421875, -4.3939208984375, -4.25689697265625, -4.119873046875, -3.98284912109375, -3.8458251953125, -3.70880126953125, -3.57177734375, -3.43475341796875, -3.2977294921875, -3.16070556640625, -3.023681640625, -2.88665771484375, -2.7496337890625, -2.61260986328125, -2.4755859375, -2.33856201171875, -2.2015380859375, -2.06451416015625, -1.927490234375, -1.79046630859375, -1.6534423828125, -1.51641845703125, -1.37939453125, -1.24237060546875, -1.1053466796875, -0.96832275390625, -0.831298828125, -0.69427490234375, -0.5572509765625, -0.42022705078125, -0.283203125, -0.14617919921875, -0.0091552734375, 0.12786865234375, 0.264892578125, 0.40191650390625, 0.5389404296875, 0.67596435546875, 0.81298828125, 0.95001220703125, 1.0870361328125, 1.22406005859375, 1.361083984375, 1.49810791015625, 1.6351318359375, 1.77215576171875, 1.9091796875, 2.04620361328125, 2.1832275390625, 2.32025146484375, 2.457275390625, 2.59429931640625, 2.7313232421875, 2.86834716796875, 3.00537109375, 3.14239501953125, 3.2794189453125, 3.41644287109375, 3.553466796875, 3.69049072265625, 3.8275146484375, 3.96453857421875, 4.1015625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 1.0, 7.0, 13.0, 38.0, 99.0, 228.0, 265.0, 154.0, 90.0, 43.0, 21.0, 24.0, 11.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-142.86318969726562, -139.10525512695312, -135.34732055664062, -131.58938598632812, -127.83145141601562, -124.07351684570312, -120.3155746459961, -116.5576400756836, -112.7997055053711, -109.0417709350586, -105.2838363647461, -101.5259017944336, -97.76795959472656, -94.01002502441406, -90.25209045410156, -86.49415588378906, -82.73622131347656, -78.97828674316406, -75.22035217285156, -71.46241760253906, -67.70448303222656, -63.9465446472168, -60.18860626220703, -56.43067169189453, -52.67273712158203, -48.91480255126953, -45.15686798095703, -41.398929595947266, -37.640995025634766, -33.883060455322266, -30.125123977661133, -26.3671875, -22.60924530029297, -18.85131072998047, -15.093374252319336, -11.33543872833252, -7.577503204345703, -3.819568634033203, -0.06163215637207031, 3.6963043212890625, 7.4542388916015625, 11.212174415588379, 14.970109939575195, 18.728046417236328, 22.485980987548828, 26.243915557861328, 30.00185203552246, 33.759788513183594, 37.517723083496094, 41.275657653808594, 45.033592224121094, 48.79153060913086, 52.54946517944336, 56.30739974975586, 60.065338134765625, 63.823272705078125, 67.58120727539062, 71.33914184570312, 75.09707641601562, 78.85501098632812, 82.61294555664062, 86.37088012695312, 90.12882232666016, 93.88675689697266, 97.64469146728516]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 4.0, 7.0, 3.0, 6.0, 7.0, 5.0, 16.0, 14.0, 16.0, 14.0, 28.0, 25.0, 31.0, 29.0, 19.0, 34.0, 42.0, 43.0, 62.0, 69.0, 92.0, 76.0, 53.0, 33.0, 35.0, 36.0, 32.0, 28.0, 25.0, 25.0, 19.0, 23.0, 12.0, 6.0, 13.0, 6.0, 9.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-73.421630859375, -71.5413589477539, -69.66108703613281, -67.78080749511719, -65.9005355834961, -64.020263671875, -62.139991760253906, -60.25971984863281, -58.37944412231445, -56.49917221069336, -54.618896484375, -52.738624572753906, -50.85835266113281, -48.97807693481445, -47.09780502319336, -45.217529296875, -43.337257385253906, -41.45698547363281, -39.57670974731445, -37.69643783569336, -35.816162109375, -33.935890197753906, -32.05561828613281, -30.175344467163086, -28.29507064819336, -26.414796829223633, -24.534523010253906, -22.654251098632812, -20.773977279663086, -18.89370346069336, -17.013431549072266, -15.133157730102539, -13.252883911132812, -11.372610092163086, -9.492337226867676, -7.612063884735107, -5.731790542602539, -3.8515167236328125, -1.9712438583374023, -0.09097099304199219, 1.7893028259277344, 3.6695761680603027, 5.549849510192871, 7.4301228523254395, 9.310396194458008, 11.190670013427734, 13.070942878723145, 14.951215744018555, 16.83148956298828, 18.711763381958008, 20.592037200927734, 22.472309112548828, 24.352582931518555, 26.23285675048828, 28.113128662109375, 29.9934024810791, 31.873676300048828, 33.75394821166992, 35.63422393798828, 37.514495849609375, 39.39476776123047, 41.27504348754883, 43.15531539916992, 45.03559112548828, 46.915863037109375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 9.0, 9.0, 9.0, 19.0, 29.0, 39.0, 65.0, 104.0, 143.0, 261.0, 539.0, 1083.0, 2521.0, 6557.0, 21658.0, 104413.0, 1990193.0, 1928892.0, 103682.0, 22445.0, 6823.0, 2554.0, 1137.0, 489.0, 241.0, 135.0, 74.0, 57.0, 32.0, 29.0, 14.0, 11.0, 11.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.140625, -4.9263916015625, -4.712158203125, -4.4979248046875, -4.28369140625, -4.0694580078125, -3.855224609375, -3.6409912109375, -3.4267578125, -3.2125244140625, -2.998291015625, -2.7840576171875, -2.56982421875, -2.3555908203125, -2.141357421875, -1.9271240234375, -1.712890625, -1.4986572265625, -1.284423828125, -1.0701904296875, -0.85595703125, -0.6417236328125, -0.427490234375, -0.2132568359375, 0.0009765625, 0.2152099609375, 0.429443359375, 0.6436767578125, 0.85791015625, 1.0721435546875, 1.286376953125, 1.5006103515625, 1.71484375, 1.9290771484375, 2.143310546875, 2.3575439453125, 2.57177734375, 2.7860107421875, 3.000244140625, 3.2144775390625, 3.4287109375, 3.6429443359375, 3.857177734375, 4.0714111328125, 4.28564453125, 4.4998779296875, 4.714111328125, 4.9283447265625, 5.142578125, 5.3568115234375, 5.571044921875, 5.7852783203125, 5.99951171875, 6.2137451171875, 6.427978515625, 6.6422119140625, 6.8564453125, 7.0706787109375, 7.284912109375, 7.4991455078125, 7.71337890625, 7.9276123046875, 8.141845703125, 8.3560791015625, 8.5703125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 9.0, 8.0, 15.0, 15.0, 26.0, 31.0, 37.0, 42.0, 38.0, 53.0, 57.0, 65.0, 77.0, 62.0, 63.0, 71.0, 56.0, 59.0, 43.0, 34.0, 28.0, 27.0, 22.0, 23.0, 12.0, 9.0, 4.0, 10.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-5.0234375, -4.90264892578125, -4.7818603515625, -4.66107177734375, -4.540283203125, -4.41949462890625, -4.2987060546875, -4.17791748046875, -4.05712890625, -3.93634033203125, -3.8155517578125, -3.69476318359375, -3.573974609375, -3.45318603515625, -3.3323974609375, -3.21160888671875, -3.0908203125, -2.97003173828125, -2.8492431640625, -2.72845458984375, -2.607666015625, -2.48687744140625, -2.3660888671875, -2.24530029296875, -2.12451171875, -2.00372314453125, -1.8829345703125, -1.76214599609375, -1.641357421875, -1.52056884765625, -1.3997802734375, -1.27899169921875, -1.158203125, -1.03741455078125, -0.9166259765625, -0.79583740234375, -0.675048828125, -0.55426025390625, -0.4334716796875, -0.31268310546875, -0.19189453125, -0.07110595703125, 0.0496826171875, 0.17047119140625, 0.291259765625, 0.41204833984375, 0.5328369140625, 0.65362548828125, 0.7744140625, 0.89520263671875, 1.0159912109375, 1.13677978515625, 1.257568359375, 1.37835693359375, 1.4991455078125, 1.61993408203125, 1.74072265625, 1.86151123046875, 1.9822998046875, 2.10308837890625, 2.223876953125, 2.34466552734375, 2.4654541015625, 2.58624267578125, 2.70703125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 5.0, 1.0, 5.0, 7.0, 9.0, 12.0, 19.0, 28.0, 25.0, 41.0, 67.0, 107.0, 210.0, 350.0, 762.0, 1672.0, 4300.0, 12204.0, 45491.0, 274287.0, 3339343.0, 441286.0, 54485.0, 12873.0, 3871.0, 1380.0, 631.0, 305.0, 169.0, 99.0, 64.0, 43.0, 35.0, 25.0, 21.0, 15.0, 11.0, 10.0, 8.0, 2.0, 4.0, 1.0, 1.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.5, -7.2698974609375, -7.039794921875, -6.8096923828125, -6.57958984375, -6.3494873046875, -6.119384765625, -5.8892822265625, -5.6591796875, -5.4290771484375, -5.198974609375, -4.9688720703125, -4.73876953125, -4.5086669921875, -4.278564453125, -4.0484619140625, -3.818359375, -3.5882568359375, -3.358154296875, -3.1280517578125, -2.89794921875, -2.6678466796875, -2.437744140625, -2.2076416015625, -1.9775390625, -1.7474365234375, -1.517333984375, -1.2872314453125, -1.05712890625, -0.8270263671875, -0.596923828125, -0.3668212890625, -0.13671875, 0.0933837890625, 0.323486328125, 0.5535888671875, 0.78369140625, 1.0137939453125, 1.243896484375, 1.4739990234375, 1.7041015625, 1.9342041015625, 2.164306640625, 2.3944091796875, 2.62451171875, 2.8546142578125, 3.084716796875, 3.3148193359375, 3.544921875, 3.7750244140625, 4.005126953125, 4.2352294921875, 4.46533203125, 4.6954345703125, 4.925537109375, 5.1556396484375, 5.3857421875, 5.6158447265625, 5.845947265625, 6.0760498046875, 6.30615234375, 6.5362548828125, 6.766357421875, 6.9964599609375, 7.2265625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 4.0, 7.0, 5.0, 10.0, 5.0, 11.0, 10.0, 7.0, 18.0, 24.0, 36.0, 41.0, 42.0, 71.0, 97.0, 138.0, 220.0, 332.0, 625.0, 719.0, 611.0, 415.0, 199.0, 127.0, 81.0, 65.0, 41.0, 24.0, 22.0, 17.0, 14.0, 7.0, 6.0, 4.0, 5.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7890625, -6.5860595703125, -6.383056640625, -6.1800537109375, -5.97705078125, -5.7740478515625, -5.571044921875, -5.3680419921875, -5.1650390625, -4.9620361328125, -4.759033203125, -4.5560302734375, -4.35302734375, -4.1500244140625, -3.947021484375, -3.7440185546875, -3.541015625, -3.3380126953125, -3.135009765625, -2.9320068359375, -2.72900390625, -2.5260009765625, -2.322998046875, -2.1199951171875, -1.9169921875, -1.7139892578125, -1.510986328125, -1.3079833984375, -1.10498046875, -0.9019775390625, -0.698974609375, -0.4959716796875, -0.29296875, -0.0899658203125, 0.113037109375, 0.3160400390625, 0.51904296875, 0.7220458984375, 0.925048828125, 1.1280517578125, 1.3310546875, 1.5340576171875, 1.737060546875, 1.9400634765625, 2.14306640625, 2.3460693359375, 2.549072265625, 2.7520751953125, 2.955078125, 3.1580810546875, 3.361083984375, 3.5640869140625, 3.76708984375, 3.9700927734375, 4.173095703125, 4.3760986328125, 4.5791015625, 4.7821044921875, 4.985107421875, 5.1881103515625, 5.39111328125, 5.5941162109375, 5.797119140625, 6.0001220703125, 6.203125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 8.0, 7.0, 23.0, 28.0, 76.0, 193.0, 279.0, 205.0, 119.0, 32.0, 15.0, 9.0, 4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-136.5028839111328, -132.88723754882812, -129.2716064453125, -125.65596008300781, -122.04031372070312, -118.42467498779297, -114.80903625488281, -111.19338989257812, -107.57774353027344, -103.96210479736328, -100.3464584350586, -96.73081970214844, -93.11517333984375, -89.4995346069336, -85.88389587402344, -82.26824951171875, -78.6526107788086, -75.03697204589844, -71.42132568359375, -67.8056869506836, -64.1900405883789, -60.57440185546875, -56.95875930786133, -53.343116760253906, -49.727474212646484, -46.11183166503906, -42.49618911743164, -38.88054656982422, -35.26490783691406, -31.649263381958008, -28.03362274169922, -24.417980194091797, -20.802337646484375, -17.186695098876953, -13.571053504943848, -9.955411911010742, -6.33976936340332, -2.7241268157958984, 0.8915138244628906, 4.5071563720703125, 8.122798919677734, 11.738441467285156, 15.354083061218262, 18.969724655151367, 22.58536720275879, 26.20100975036621, 29.816650390625, 33.43229293823242, 37.047935485839844, 40.663578033447266, 44.27922058105469, 47.894859313964844, 51.51050567626953, 55.12614440917969, 58.74178695678711, 62.35742950439453, 65.97306823730469, 69.58870697021484, 73.20435333251953, 76.81999206542969, 80.43563842773438, 84.05127716064453, 87.66691589355469, 91.28256225585938, 94.89820861816406]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 4.0, 3.0, 7.0, 4.0, 8.0, 9.0, 6.0, 10.0, 8.0, 23.0, 21.0, 20.0, 24.0, 29.0, 21.0, 35.0, 34.0, 29.0, 46.0, 52.0, 45.0, 45.0, 59.0, 57.0, 56.0, 51.0, 38.0, 38.0, 21.0, 32.0, 19.0, 26.0, 20.0, 14.0, 27.0, 13.0, 8.0, 11.0, 10.0, 7.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 4.0], "bins": [-37.55016326904297, -36.526187896728516, -35.50221252441406, -34.478233337402344, -33.45425796508789, -32.43028259277344, -31.40630531311035, -30.382328033447266, -29.358352661132812, -28.33437728881836, -27.310400009155273, -26.286422729492188, -25.262447357177734, -24.23847198486328, -23.214494705200195, -22.19051742553711, -21.166542053222656, -20.142566680908203, -19.118589401245117, -18.09461212158203, -17.070636749267578, -16.046661376953125, -15.022684097290039, -13.99870777130127, -12.9747314453125, -11.95075511932373, -10.926778793334961, -9.902802467346191, -8.878826141357422, -7.854849815368652, -6.830873489379883, -5.806897163391113, -4.782924652099609, -3.75894832611084, -2.7349720001220703, -1.7109956741333008, -0.6870193481445312, 0.3369569778442383, 1.3609333038330078, 2.3849096298217773, 3.408885955810547, 4.432862281799316, 5.456838607788086, 6.4808149337768555, 7.504791259765625, 8.528767585754395, 9.552743911743164, 10.576720237731934, 11.600696563720703, 12.624672889709473, 13.648649215698242, 14.672625541687012, 15.696601867675781, 16.720577239990234, 17.74455451965332, 18.768531799316406, 19.79250717163086, 20.816482543945312, 21.8404598236084, 22.864437103271484, 23.888412475585938, 24.91238784790039, 25.936365127563477, 26.960342407226562, 27.984317779541016]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 3.0, 9.0, 15.0, 16.0, 34.0, 40.0, 67.0, 106.0, 174.0, 256.0, 410.0, 700.0, 1201.0, 1932.0, 3747.0, 7128.0, 14783.0, 33068.0, 79777.0, 211525.0, 365141.0, 195636.0, 73536.0, 30591.0, 13546.0, 6599.0, 3583.0, 1957.0, 1152.0, 663.0, 439.0, 253.0, 155.0, 97.0, 76.0, 48.0, 32.0, 14.0, 11.0, 6.0, 9.0, 5.0, 5.0, 1.0, 8.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.33203125, -4.17425537109375, -4.0164794921875, -3.85870361328125, -3.700927734375, -3.54315185546875, -3.3853759765625, -3.22760009765625, -3.06982421875, -2.91204833984375, -2.7542724609375, -2.59649658203125, -2.438720703125, -2.28094482421875, -2.1231689453125, -1.96539306640625, -1.8076171875, -1.64984130859375, -1.4920654296875, -1.33428955078125, -1.176513671875, -1.01873779296875, -0.8609619140625, -0.70318603515625, -0.54541015625, -0.38763427734375, -0.2298583984375, -0.07208251953125, 0.085693359375, 0.24346923828125, 0.4012451171875, 0.55902099609375, 0.716796875, 0.87457275390625, 1.0323486328125, 1.19012451171875, 1.347900390625, 1.50567626953125, 1.6634521484375, 1.82122802734375, 1.97900390625, 2.13677978515625, 2.2945556640625, 2.45233154296875, 2.610107421875, 2.76788330078125, 2.9256591796875, 3.08343505859375, 3.2412109375, 3.39898681640625, 3.5567626953125, 3.71453857421875, 3.872314453125, 4.03009033203125, 4.1878662109375, 4.34564208984375, 4.50341796875, 4.66119384765625, 4.8189697265625, 4.97674560546875, 5.134521484375, 5.29229736328125, 5.4500732421875, 5.60784912109375, 5.765625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 12.0, 7.0, 5.0, 10.0, 12.0, 12.0, 11.0, 14.0, 19.0, 18.0, 27.0, 29.0, 34.0, 35.0, 32.0, 36.0, 46.0, 47.0, 39.0, 46.0, 51.0, 44.0, 46.0, 41.0, 40.0, 38.0, 34.0, 37.0, 25.0, 29.0, 25.0, 21.0, 11.0, 12.0, 12.0, 7.0, 10.0, 9.0, 6.0, 3.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.54296875, -2.45880126953125, -2.3746337890625, -2.29046630859375, -2.206298828125, -2.12213134765625, -2.0379638671875, -1.95379638671875, -1.86962890625, -1.78546142578125, -1.7012939453125, -1.61712646484375, -1.532958984375, -1.44879150390625, -1.3646240234375, -1.28045654296875, -1.1962890625, -1.11212158203125, -1.0279541015625, -0.94378662109375, -0.859619140625, -0.77545166015625, -0.6912841796875, -0.60711669921875, -0.52294921875, -0.43878173828125, -0.3546142578125, -0.27044677734375, -0.186279296875, -0.10211181640625, -0.0179443359375, 0.06622314453125, 0.150390625, 0.23455810546875, 0.3187255859375, 0.40289306640625, 0.487060546875, 0.57122802734375, 0.6553955078125, 0.73956298828125, 0.82373046875, 0.90789794921875, 0.9920654296875, 1.07623291015625, 1.160400390625, 1.24456787109375, 1.3287353515625, 1.41290283203125, 1.4970703125, 1.58123779296875, 1.6654052734375, 1.74957275390625, 1.833740234375, 1.91790771484375, 2.0020751953125, 2.08624267578125, 2.17041015625, 2.25457763671875, 2.3387451171875, 2.42291259765625, 2.507080078125, 2.59124755859375, 2.6754150390625, 2.75958251953125, 2.84375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 5.0, 7.0, 10.0, 21.0, 21.0, 20.0, 32.0, 52.0, 64.0, 89.0, 118.0, 181.0, 234.0, 348.0, 517.0, 852.0, 1511.0, 3357.0, 9597.0, 39474.0, 244896.0, 636710.0, 83077.0, 16998.0, 5139.0, 2126.0, 1083.0, 613.0, 433.0, 274.0, 195.0, 154.0, 103.0, 67.0, 59.0, 35.0, 28.0, 15.0, 17.0, 12.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.6953125, -10.4000244140625, -10.104736328125, -9.8094482421875, -9.51416015625, -9.2188720703125, -8.923583984375, -8.6282958984375, -8.3330078125, -8.0377197265625, -7.742431640625, -7.4471435546875, -7.15185546875, -6.8565673828125, -6.561279296875, -6.2659912109375, -5.970703125, -5.6754150390625, -5.380126953125, -5.0848388671875, -4.78955078125, -4.4942626953125, -4.198974609375, -3.9036865234375, -3.6083984375, -3.3131103515625, -3.017822265625, -2.7225341796875, -2.42724609375, -2.1319580078125, -1.836669921875, -1.5413818359375, -1.24609375, -0.9508056640625, -0.655517578125, -0.3602294921875, -0.06494140625, 0.2303466796875, 0.525634765625, 0.8209228515625, 1.1162109375, 1.4114990234375, 1.706787109375, 2.0020751953125, 2.29736328125, 2.5926513671875, 2.887939453125, 3.1832275390625, 3.478515625, 3.7738037109375, 4.069091796875, 4.3643798828125, 4.65966796875, 4.9549560546875, 5.250244140625, 5.5455322265625, 5.8408203125, 6.1361083984375, 6.431396484375, 6.7266845703125, 7.02197265625, 7.3172607421875, 7.612548828125, 7.9078369140625, 8.203125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 4.0, 4.0, 7.0, 2.0, 9.0, 4.0, 12.0, 22.0, 14.0, 18.0, 20.0, 25.0, 21.0, 33.0, 28.0, 32.0, 47.0, 51.0, 48.0, 49.0, 50.0, 48.0, 49.0, 54.0, 43.0, 32.0, 33.0, 36.0, 31.0, 31.0, 23.0, 15.0, 15.0, 10.0, 8.0, 13.0, 15.0, 12.0, 8.0, 4.0, 6.0, 5.0, 3.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.828125, -10.5023193359375, -10.176513671875, -9.8507080078125, -9.52490234375, -9.1990966796875, -8.873291015625, -8.5474853515625, -8.2216796875, -7.8958740234375, -7.570068359375, -7.2442626953125, -6.91845703125, -6.5926513671875, -6.266845703125, -5.9410400390625, -5.615234375, -5.2894287109375, -4.963623046875, -4.6378173828125, -4.31201171875, -3.9862060546875, -3.660400390625, -3.3345947265625, -3.0087890625, -2.6829833984375, -2.357177734375, -2.0313720703125, -1.70556640625, -1.3797607421875, -1.053955078125, -0.7281494140625, -0.40234375, -0.0765380859375, 0.249267578125, 0.5750732421875, 0.90087890625, 1.2266845703125, 1.552490234375, 1.8782958984375, 2.2041015625, 2.5299072265625, 2.855712890625, 3.1815185546875, 3.50732421875, 3.8331298828125, 4.158935546875, 4.4847412109375, 4.810546875, 5.1363525390625, 5.462158203125, 5.7879638671875, 6.11376953125, 6.4395751953125, 6.765380859375, 7.0911865234375, 7.4169921875, 7.7427978515625, 8.068603515625, 8.3944091796875, 8.72021484375, 9.0460205078125, 9.371826171875, 9.6976318359375, 10.0234375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 5.0, 7.0, 7.0, 12.0, 18.0, 15.0, 28.0, 46.0, 63.0, 95.0, 155.0, 265.0, 576.0, 1247.0, 3308.0, 10134.0, 41115.0, 238736.0, 640841.0, 84419.0, 18532.0, 5284.0, 1919.0, 800.0, 361.0, 183.0, 136.0, 81.0, 50.0, 31.0, 29.0, 11.0, 15.0, 8.0, 10.0, 5.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.736328125, -3.6331787109375, -3.530029296875, -3.4268798828125, -3.32373046875, -3.2205810546875, -3.117431640625, -3.0142822265625, -2.9111328125, -2.8079833984375, -2.704833984375, -2.6016845703125, -2.49853515625, -2.3953857421875, -2.292236328125, -2.1890869140625, -2.0859375, -1.9827880859375, -1.879638671875, -1.7764892578125, -1.67333984375, -1.5701904296875, -1.467041015625, -1.3638916015625, -1.2607421875, -1.1575927734375, -1.054443359375, -0.9512939453125, -0.84814453125, -0.7449951171875, -0.641845703125, -0.5386962890625, -0.435546875, -0.3323974609375, -0.229248046875, -0.1260986328125, -0.02294921875, 0.0802001953125, 0.183349609375, 0.2864990234375, 0.3896484375, 0.4927978515625, 0.595947265625, 0.6990966796875, 0.80224609375, 0.9053955078125, 1.008544921875, 1.1116943359375, 1.21484375, 1.3179931640625, 1.421142578125, 1.5242919921875, 1.62744140625, 1.7305908203125, 1.833740234375, 1.9368896484375, 2.0400390625, 2.1431884765625, 2.246337890625, 2.3494873046875, 2.45263671875, 2.5557861328125, 2.658935546875, 2.7620849609375, 2.865234375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 5.0, 2.0, 4.0, 10.0, 5.0, 10.0, 12.0, 11.0, 8.0, 16.0, 35.0, 32.0, 41.0, 71.0, 145.0, 169.0, 130.0, 92.0, 36.0, 43.0, 28.0, 16.0, 14.0, 15.0, 9.0, 7.0, 4.0, 4.0, 5.0, 8.0, 2.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.001201629638671875, -0.0011634379625320435, -0.001125246286392212, -0.0010870546102523804, -0.0010488629341125488, -0.0010106712579727173, -0.0009724795818328857, -0.0009342879056930542, -0.0008960962295532227, -0.0008579045534133911, -0.0008197128772735596, -0.000781521201133728, -0.0007433295249938965, -0.0007051378488540649, -0.0006669461727142334, -0.0006287544965744019, -0.0005905628204345703, -0.0005523711442947388, -0.0005141794681549072, -0.0004759877920150757, -0.00043779611587524414, -0.0003996044397354126, -0.00036141276359558105, -0.0003232210874557495, -0.00028502941131591797, -0.0002468377351760864, -0.00020864605903625488, -0.00017045438289642334, -0.0001322627067565918, -9.407103061676025e-05, -5.587935447692871e-05, -1.7687678337097168e-05, 2.0503997802734375e-05, 5.869567394256592e-05, 9.688735008239746e-05, 0.000135079026222229, 0.00017327070236206055, 0.0002114623785018921, 0.00024965405464172363, 0.0002878457307815552, 0.0003260374069213867, 0.00036422908306121826, 0.0004024207592010498, 0.00044061243534088135, 0.0004788041114807129, 0.0005169957876205444, 0.000555187463760376, 0.0005933791399002075, 0.0006315708160400391, 0.0006697624921798706, 0.0007079541683197021, 0.0007461458444595337, 0.0007843375205993652, 0.0008225291967391968, 0.0008607208728790283, 0.0008989125490188599, 0.0009371042251586914, 0.000975295901298523, 0.0010134875774383545, 0.001051679253578186, 0.0010898709297180176, 0.0011280626058578491, 0.0011662542819976807, 0.0012044459581375122, 0.0012426376342773438]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 4.0, 7.0, 6.0, 5.0, 7.0, 11.0, 15.0, 21.0, 31.0, 27.0, 50.0, 74.0, 127.0, 161.0, 277.0, 393.0, 700.0, 1149.0, 2015.0, 3911.0, 8274.0, 19927.0, 61058.0, 252284.0, 549106.0, 97271.0, 29100.0, 11257.0, 5088.0, 2558.0, 1403.0, 787.0, 506.0, 293.0, 192.0, 142.0, 98.0, 62.0, 48.0, 24.0, 16.0, 17.0, 17.0, 5.0, 9.0, 5.0, 4.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.63671875, -2.552154541015625, -2.46759033203125, -2.383026123046875, -2.2984619140625, -2.213897705078125, -2.12933349609375, -2.044769287109375, -1.960205078125, -1.875640869140625, -1.79107666015625, -1.706512451171875, -1.6219482421875, -1.537384033203125, -1.45281982421875, -1.368255615234375, -1.28369140625, -1.199127197265625, -1.11456298828125, -1.029998779296875, -0.9454345703125, -0.860870361328125, -0.77630615234375, -0.691741943359375, -0.607177734375, -0.522613525390625, -0.43804931640625, -0.353485107421875, -0.2689208984375, -0.184356689453125, -0.09979248046875, -0.015228271484375, 0.0693359375, 0.153900146484375, 0.23846435546875, 0.323028564453125, 0.4075927734375, 0.492156982421875, 0.57672119140625, 0.661285400390625, 0.745849609375, 0.830413818359375, 0.91497802734375, 0.999542236328125, 1.0841064453125, 1.168670654296875, 1.25323486328125, 1.337799072265625, 1.42236328125, 1.506927490234375, 1.59149169921875, 1.676055908203125, 1.7606201171875, 1.845184326171875, 1.92974853515625, 2.014312744140625, 2.098876953125, 2.183441162109375, 2.26800537109375, 2.352569580078125, 2.4371337890625, 2.521697998046875, 2.60626220703125, 2.690826416015625, 2.775390625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 4.0, 7.0, 6.0, 13.0, 14.0, 14.0, 13.0, 21.0, 35.0, 27.0, 45.0, 58.0, 54.0, 88.0, 84.0, 85.0, 82.0, 71.0, 56.0, 42.0, 35.0, 29.0, 20.0, 27.0, 12.0, 12.0, 12.0, 8.0, 12.0, 6.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.689453125, -3.59991455078125, -3.5103759765625, -3.42083740234375, -3.331298828125, -3.24176025390625, -3.1522216796875, -3.06268310546875, -2.97314453125, -2.88360595703125, -2.7940673828125, -2.70452880859375, -2.614990234375, -2.52545166015625, -2.4359130859375, -2.34637451171875, -2.2568359375, -2.16729736328125, -2.0777587890625, -1.98822021484375, -1.898681640625, -1.80914306640625, -1.7196044921875, -1.63006591796875, -1.54052734375, -1.45098876953125, -1.3614501953125, -1.27191162109375, -1.182373046875, -1.09283447265625, -1.0032958984375, -0.91375732421875, -0.82421875, -0.73468017578125, -0.6451416015625, -0.55560302734375, -0.466064453125, -0.37652587890625, -0.2869873046875, -0.19744873046875, -0.10791015625, -0.01837158203125, 0.0711669921875, 0.16070556640625, 0.250244140625, 0.33978271484375, 0.4293212890625, 0.51885986328125, 0.6083984375, 0.69793701171875, 0.7874755859375, 0.87701416015625, 0.966552734375, 1.05609130859375, 1.1456298828125, 1.23516845703125, 1.32470703125, 1.41424560546875, 1.5037841796875, 1.59332275390625, 1.682861328125, 1.77239990234375, 1.8619384765625, 1.95147705078125, 2.041015625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 4.0, 9.0, 19.0, 26.0, 54.0, 49.0, 92.0, 160.0, 185.0, 116.0, 83.0, 59.0, 43.0, 27.0, 22.0, 13.0, 5.0, 6.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-53.665138244628906, -52.0051155090332, -50.3450927734375, -48.6850700378418, -47.025047302246094, -45.365020751953125, -43.70499801635742, -42.04497528076172, -40.384952545166016, -38.72492980957031, -37.06490707397461, -35.404884338378906, -33.74485778808594, -32.0848388671875, -30.42481231689453, -28.764789581298828, -27.104766845703125, -25.444744110107422, -23.78472137451172, -22.124696731567383, -20.46467399597168, -18.804651260375977, -17.14462661743164, -15.484603881835938, -13.824581146240234, -12.164558410644531, -10.504534721374512, -8.844511032104492, -7.184488296508789, -5.524465560913086, -3.8644418716430664, -2.204418182373047, -0.5443954467773438, 1.1156277656555176, 2.775650978088379, 4.43567419052124, 6.095697402954102, 7.755720138549805, 9.415743827819824, 11.075767517089844, 12.735790252685547, 14.39581298828125, 16.055835723876953, 17.71586036682129, 19.375883102416992, 21.035905838012695, 22.69593048095703, 24.355953216552734, 26.015975952148438, 27.67599868774414, 29.336021423339844, 30.99604606628418, 32.65606689453125, 34.31609344482422, 35.97611618041992, 37.636138916015625, 39.29616165161133, 40.95618438720703, 42.616207122802734, 44.27622985839844, 45.936256408691406, 47.596275329589844, 49.25630187988281, 50.916324615478516, 52.57634735107422]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 4.0, 7.0, 5.0, 13.0, 10.0, 16.0, 16.0, 25.0, 15.0, 12.0, 25.0, 24.0, 33.0, 40.0, 40.0, 50.0, 54.0, 80.0, 77.0, 71.0, 53.0, 39.0, 46.0, 34.0, 32.0, 28.0, 20.0, 32.0, 21.0, 13.0, 12.0, 14.0, 15.0, 9.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.35382080078125, -46.90304946899414, -45.45227813720703, -44.001502990722656, -42.55073165893555, -41.09996032714844, -39.64918899536133, -38.19841766357422, -36.747642517089844, -35.296871185302734, -33.846099853515625, -32.39532470703125, -30.94455337524414, -29.49378204345703, -28.043010711669922, -26.59223747253418, -25.14146614074707, -23.69069480895996, -22.23992156982422, -20.78915023803711, -19.338376998901367, -17.887605667114258, -16.436832427978516, -14.986061096191406, -13.53528881072998, -12.084516525268555, -10.633744239807129, -9.182971954345703, -7.7322001457214355, -6.28142786026001, -4.830656051635742, -3.3798837661743164, -1.9291114807128906, -0.4783393144607544, 0.9724328517913818, 2.4232048988342285, 3.8739771842956543, 5.32474946975708, 6.775521278381348, 8.226293563842773, 9.6770658493042, 11.127838134765625, 12.57861042022705, 14.029382705688477, 15.480154037475586, 16.930927276611328, 18.381698608398438, 19.832469940185547, 21.28324317932129, 22.7340145111084, 24.18478775024414, 25.63555908203125, 27.086332321166992, 28.5371036529541, 29.987876892089844, 31.438648223876953, 32.88941955566406, 34.34019088745117, 35.79096221923828, 37.241737365722656, 38.692508697509766, 40.143280029296875, 41.594051361083984, 43.044822692871094, 44.49559783935547]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 10.0, 12.0, 3.0, 16.0, 21.0, 34.0, 54.0, 76.0, 175.0, 272.0, 569.0, 1206.0, 3064.0, 8897.0, 33097.0, 281033.0, 3308751.0, 493363.0, 45406.0, 11478.0, 3864.0, 1457.0, 686.0, 315.0, 155.0, 96.0, 65.0, 34.0, 23.0, 17.0, 12.0, 5.0, 1.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.9765625, -6.785888671875, -6.59521484375, -6.404541015625, -6.2138671875, -6.023193359375, -5.83251953125, -5.641845703125, -5.451171875, -5.260498046875, -5.06982421875, -4.879150390625, -4.6884765625, -4.497802734375, -4.30712890625, -4.116455078125, -3.92578125, -3.735107421875, -3.54443359375, -3.353759765625, -3.1630859375, -2.972412109375, -2.78173828125, -2.591064453125, -2.400390625, -2.209716796875, -2.01904296875, -1.828369140625, -1.6376953125, -1.447021484375, -1.25634765625, -1.065673828125, -0.875, -0.684326171875, -0.49365234375, -0.302978515625, -0.1123046875, 0.078369140625, 0.26904296875, 0.459716796875, 0.650390625, 0.841064453125, 1.03173828125, 1.222412109375, 1.4130859375, 1.603759765625, 1.79443359375, 1.985107421875, 2.17578125, 2.366455078125, 2.55712890625, 2.747802734375, 2.9384765625, 3.129150390625, 3.31982421875, 3.510498046875, 3.701171875, 3.891845703125, 4.08251953125, 4.273193359375, 4.4638671875, 4.654541015625, 4.84521484375, 5.035888671875, 5.2265625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 2.0, 5.0, 11.0, 8.0, 9.0, 16.0, 9.0, 14.0, 15.0, 28.0, 28.0, 35.0, 43.0, 52.0, 43.0, 47.0, 46.0, 47.0, 56.0, 51.0, 50.0, 50.0, 45.0, 42.0, 34.0, 45.0, 25.0, 23.0, 20.0, 18.0, 26.0, 15.0, 11.0, 13.0, 13.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.98828125, -2.899993896484375, -2.81170654296875, -2.723419189453125, -2.6351318359375, -2.546844482421875, -2.45855712890625, -2.370269775390625, -2.281982421875, -2.193695068359375, -2.10540771484375, -2.017120361328125, -1.9288330078125, -1.840545654296875, -1.75225830078125, -1.663970947265625, -1.57568359375, -1.487396240234375, -1.39910888671875, -1.310821533203125, -1.2225341796875, -1.134246826171875, -1.04595947265625, -0.957672119140625, -0.869384765625, -0.781097412109375, -0.69281005859375, -0.604522705078125, -0.5162353515625, -0.427947998046875, -0.33966064453125, -0.251373291015625, -0.1630859375, -0.074798583984375, 0.01348876953125, 0.101776123046875, 0.1900634765625, 0.278350830078125, 0.36663818359375, 0.454925537109375, 0.543212890625, 0.631500244140625, 0.71978759765625, 0.808074951171875, 0.8963623046875, 0.984649658203125, 1.07293701171875, 1.161224365234375, 1.24951171875, 1.337799072265625, 1.42608642578125, 1.514373779296875, 1.6026611328125, 1.690948486328125, 1.77923583984375, 1.867523193359375, 1.955810546875, 2.044097900390625, 2.13238525390625, 2.220672607421875, 2.3089599609375, 2.397247314453125, 2.48553466796875, 2.573822021484375, 2.662109375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 5.0, 5.0, 11.0, 16.0, 11.0, 26.0, 21.0, 34.0, 54.0, 103.0, 145.0, 242.0, 726.0, 2290.0, 13604.0, 219988.0, 3861204.0, 85613.0, 7681.0, 1445.0, 456.0, 206.0, 101.0, 67.0, 47.0, 28.0, 34.0, 22.0, 27.0, 19.0, 11.0, 9.0, 2.0, 6.0, 5.0, 8.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7109375, -11.312255859375, -10.91357421875, -10.514892578125, -10.1162109375, -9.717529296875, -9.31884765625, -8.920166015625, -8.521484375, -8.122802734375, -7.72412109375, -7.325439453125, -6.9267578125, -6.528076171875, -6.12939453125, -5.730712890625, -5.33203125, -4.933349609375, -4.53466796875, -4.135986328125, -3.7373046875, -3.338623046875, -2.93994140625, -2.541259765625, -2.142578125, -1.743896484375, -1.34521484375, -0.946533203125, -0.5478515625, -0.149169921875, 0.24951171875, 0.648193359375, 1.046875, 1.445556640625, 1.84423828125, 2.242919921875, 2.6416015625, 3.040283203125, 3.43896484375, 3.837646484375, 4.236328125, 4.635009765625, 5.03369140625, 5.432373046875, 5.8310546875, 6.229736328125, 6.62841796875, 7.027099609375, 7.42578125, 7.824462890625, 8.22314453125, 8.621826171875, 9.0205078125, 9.419189453125, 9.81787109375, 10.216552734375, 10.615234375, 11.013916015625, 11.41259765625, 11.811279296875, 12.2099609375, 12.608642578125, 13.00732421875, 13.406005859375, 13.8046875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 6.0, 4.0, 5.0, 5.0, 6.0, 7.0, 12.0, 19.0, 16.0, 26.0, 38.0, 49.0, 96.0, 125.0, 220.0, 396.0, 670.0, 877.0, 597.0, 368.0, 175.0, 103.0, 82.0, 54.0, 37.0, 19.0, 15.0, 13.0, 8.0, 6.0, 3.0, 4.0, 2.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.5703125, -5.36614990234375, -5.1619873046875, -4.95782470703125, -4.753662109375, -4.54949951171875, -4.3453369140625, -4.14117431640625, -3.93701171875, -3.73284912109375, -3.5286865234375, -3.32452392578125, -3.120361328125, -2.91619873046875, -2.7120361328125, -2.50787353515625, -2.3037109375, -2.09954833984375, -1.8953857421875, -1.69122314453125, -1.487060546875, -1.28289794921875, -1.0787353515625, -0.87457275390625, -0.67041015625, -0.46624755859375, -0.2620849609375, -0.05792236328125, 0.146240234375, 0.35040283203125, 0.5545654296875, 0.75872802734375, 0.962890625, 1.16705322265625, 1.3712158203125, 1.57537841796875, 1.779541015625, 1.98370361328125, 2.1878662109375, 2.39202880859375, 2.59619140625, 2.80035400390625, 3.0045166015625, 3.20867919921875, 3.412841796875, 3.61700439453125, 3.8211669921875, 4.02532958984375, 4.2294921875, 4.43365478515625, 4.6378173828125, 4.84197998046875, 5.046142578125, 5.25030517578125, 5.4544677734375, 5.65863037109375, 5.86279296875, 6.06695556640625, 6.2711181640625, 6.47528076171875, 6.679443359375, 6.88360595703125, 7.0877685546875, 7.29193115234375, 7.49609375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 7.0, 8.0, 20.0, 54.0, 133.0, 261.0, 261.0, 147.0, 55.0, 26.0, 15.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.48782348632812, -102.0858383178711, -98.68384552001953, -95.2818603515625, -91.87986755371094, -88.4778823852539, -85.07589721679688, -81.67390441894531, -78.27191162109375, -74.86992645263672, -71.46793365478516, -68.06594848632812, -64.66395568847656, -61.26197052001953, -57.859981536865234, -54.45799255371094, -51.056007385253906, -47.65401840209961, -44.25202941894531, -40.85004425048828, -37.44805145263672, -34.04606628417969, -30.64407730102539, -27.242088317871094, -23.840099334716797, -20.4381103515625, -17.036121368408203, -13.634134292602539, -10.232145309448242, -6.830156326293945, -3.4281692504882812, -0.026180267333984375, 3.3758087158203125, 6.777797222137451, 10.17978572845459, 13.58177375793457, 16.983762741088867, 20.385751724243164, 23.787738800048828, 27.189727783203125, 30.591716766357422, 33.99370574951172, 37.395694732666016, 40.79768371582031, 44.199668884277344, 47.601661682128906, 51.00364685058594, 54.405635833740234, 57.80762481689453, 61.20961380004883, 64.61160278320312, 68.01358795166016, 71.41558074951172, 74.81756591796875, 78.21955871582031, 81.62154388427734, 85.02352905273438, 88.4255142211914, 91.82750701904297, 95.2294921875, 98.63148498535156, 102.0334701538086, 105.43545532226562, 108.83744812011719, 112.23944091796875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 3.0, 3.0, 5.0, 8.0, 10.0, 10.0, 12.0, 15.0, 21.0, 25.0, 21.0, 30.0, 51.0, 52.0, 53.0, 48.0, 59.0, 57.0, 60.0, 56.0, 56.0, 61.0, 51.0, 47.0, 36.0, 24.0, 27.0, 20.0, 21.0, 18.0, 12.0, 2.0, 8.0, 9.0, 5.0, 7.0, 2.0, 0.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.31557846069336, -28.257265090942383, -27.198951721191406, -26.140636444091797, -25.08232307434082, -24.024009704589844, -22.965694427490234, -21.907381057739258, -20.84906768798828, -19.790754318237305, -18.732440948486328, -17.67412567138672, -16.615812301635742, -15.557498931884766, -14.499184608459473, -13.44087028503418, -12.382556915283203, -11.324243545532227, -10.265929222106934, -9.20761489868164, -8.149301528930664, -7.090987682342529, -6.0326738357543945, -4.97435998916626, -3.916046142578125, -2.8577322959899902, -1.7994184494018555, -0.7411046028137207, 0.31720924377441406, 1.3755230903625488, 2.4338369369506836, 3.4921507835388184, 4.550464630126953, 5.608778476715088, 6.667092323303223, 7.725406169891357, 8.783720016479492, 9.842033386230469, 10.900347709655762, 11.958662033081055, 13.016975402832031, 14.075288772583008, 15.1336030960083, 16.191917419433594, 17.25023078918457, 18.308544158935547, 19.366859436035156, 20.425172805786133, 21.48348617553711, 22.541799545288086, 23.600112915039062, 24.658428192138672, 25.71674156188965, 26.775054931640625, 27.833370208740234, 28.89168357849121, 29.949996948242188, 31.008310317993164, 32.06662368774414, 33.12493896484375, 34.183250427246094, 35.2415657043457, 36.29988098144531, 37.358192443847656, 38.416507720947266]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 7.0, 6.0, 10.0, 21.0, 31.0, 67.0, 86.0, 183.0, 298.0, 562.0, 980.0, 2008.0, 4818.0, 11942.0, 38835.0, 152411.0, 435478.0, 290337.0, 75591.0, 21334.0, 7269.0, 3167.0, 1407.0, 748.0, 425.0, 226.0, 108.0, 74.0, 29.0, 28.0, 18.0, 14.0, 10.0, 6.0, 4.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.1328125, -5.945556640625, -5.75830078125, -5.571044921875, -5.3837890625, -5.196533203125, -5.00927734375, -4.822021484375, -4.634765625, -4.447509765625, -4.26025390625, -4.072998046875, -3.8857421875, -3.698486328125, -3.51123046875, -3.323974609375, -3.13671875, -2.949462890625, -2.76220703125, -2.574951171875, -2.3876953125, -2.200439453125, -2.01318359375, -1.825927734375, -1.638671875, -1.451416015625, -1.26416015625, -1.076904296875, -0.8896484375, -0.702392578125, -0.51513671875, -0.327880859375, -0.140625, 0.046630859375, 0.23388671875, 0.421142578125, 0.6083984375, 0.795654296875, 0.98291015625, 1.170166015625, 1.357421875, 1.544677734375, 1.73193359375, 1.919189453125, 2.1064453125, 2.293701171875, 2.48095703125, 2.668212890625, 2.85546875, 3.042724609375, 3.22998046875, 3.417236328125, 3.6044921875, 3.791748046875, 3.97900390625, 4.166259765625, 4.353515625, 4.540771484375, 4.72802734375, 4.915283203125, 5.1025390625, 5.289794921875, 5.47705078125, 5.664306640625, 5.8515625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 11.0, 6.0, 7.0, 10.0, 10.0, 16.0, 15.0, 20.0, 31.0, 31.0, 27.0, 39.0, 48.0, 36.0, 41.0, 32.0, 49.0, 51.0, 44.0, 47.0, 37.0, 38.0, 38.0, 41.0, 39.0, 29.0, 28.0, 27.0, 23.0, 30.0, 16.0, 16.0, 16.0, 16.0, 8.0, 7.0, 8.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.0078125, -2.923065185546875, -2.83831787109375, -2.753570556640625, -2.6688232421875, -2.584075927734375, -2.49932861328125, -2.414581298828125, -2.329833984375, -2.245086669921875, -2.16033935546875, -2.075592041015625, -1.9908447265625, -1.906097412109375, -1.82135009765625, -1.736602783203125, -1.65185546875, -1.567108154296875, -1.48236083984375, -1.397613525390625, -1.3128662109375, -1.228118896484375, -1.14337158203125, -1.058624267578125, -0.973876953125, -0.889129638671875, -0.80438232421875, -0.719635009765625, -0.6348876953125, -0.550140380859375, -0.46539306640625, -0.380645751953125, -0.2958984375, -0.211151123046875, -0.12640380859375, -0.041656494140625, 0.0430908203125, 0.127838134765625, 0.21258544921875, 0.297332763671875, 0.382080078125, 0.466827392578125, 0.55157470703125, 0.636322021484375, 0.7210693359375, 0.805816650390625, 0.89056396484375, 0.975311279296875, 1.06005859375, 1.144805908203125, 1.22955322265625, 1.314300537109375, 1.3990478515625, 1.483795166015625, 1.56854248046875, 1.653289794921875, 1.738037109375, 1.822784423828125, 1.90753173828125, 1.992279052734375, 2.0770263671875, 2.161773681640625, 2.24652099609375, 2.331268310546875, 2.416015625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 8.0, 7.0, 9.0, 13.0, 34.0, 28.0, 53.0, 82.0, 127.0, 210.0, 342.0, 649.0, 1312.0, 2811.0, 7522.0, 27042.0, 140306.0, 644818.0, 175272.0, 32871.0, 8722.0, 3174.0, 1434.0, 727.0, 371.0, 219.0, 131.0, 87.0, 51.0, 32.0, 23.0, 28.0, 8.0, 7.0, 7.0, 5.0, 3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.9375, -6.71051025390625, -6.4835205078125, -6.25653076171875, -6.029541015625, -5.80255126953125, -5.5755615234375, -5.34857177734375, -5.12158203125, -4.89459228515625, -4.6676025390625, -4.44061279296875, -4.213623046875, -3.98663330078125, -3.7596435546875, -3.53265380859375, -3.3056640625, -3.07867431640625, -2.8516845703125, -2.62469482421875, -2.397705078125, -2.17071533203125, -1.9437255859375, -1.71673583984375, -1.48974609375, -1.26275634765625, -1.0357666015625, -0.80877685546875, -0.581787109375, -0.35479736328125, -0.1278076171875, 0.09918212890625, 0.326171875, 0.55316162109375, 0.7801513671875, 1.00714111328125, 1.234130859375, 1.46112060546875, 1.6881103515625, 1.91510009765625, 2.14208984375, 2.36907958984375, 2.5960693359375, 2.82305908203125, 3.050048828125, 3.27703857421875, 3.5040283203125, 3.73101806640625, 3.9580078125, 4.18499755859375, 4.4119873046875, 4.63897705078125, 4.865966796875, 5.09295654296875, 5.3199462890625, 5.54693603515625, 5.77392578125, 6.00091552734375, 6.2279052734375, 6.45489501953125, 6.681884765625, 6.90887451171875, 7.1358642578125, 7.36285400390625, 7.58984375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 1.0, 8.0, 7.0, 8.0, 6.0, 18.0, 16.0, 24.0, 25.0, 35.0, 42.0, 30.0, 51.0, 51.0, 53.0, 60.0, 58.0, 67.0, 51.0, 39.0, 56.0, 40.0, 39.0, 35.0, 40.0, 23.0, 19.0, 26.0, 12.0, 9.0, 21.0, 8.0, 4.0, 2.0, 4.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.90625, -11.5545654296875, -11.202880859375, -10.8511962890625, -10.49951171875, -10.1478271484375, -9.796142578125, -9.4444580078125, -9.0927734375, -8.7410888671875, -8.389404296875, -8.0377197265625, -7.68603515625, -7.3343505859375, -6.982666015625, -6.6309814453125, -6.279296875, -5.9276123046875, -5.575927734375, -5.2242431640625, -4.87255859375, -4.5208740234375, -4.169189453125, -3.8175048828125, -3.4658203125, -3.1141357421875, -2.762451171875, -2.4107666015625, -2.05908203125, -1.7073974609375, -1.355712890625, -1.0040283203125, -0.65234375, -0.3006591796875, 0.051025390625, 0.4027099609375, 0.75439453125, 1.1060791015625, 1.457763671875, 1.8094482421875, 2.1611328125, 2.5128173828125, 2.864501953125, 3.2161865234375, 3.56787109375, 3.9195556640625, 4.271240234375, 4.6229248046875, 4.974609375, 5.3262939453125, 5.677978515625, 6.0296630859375, 6.38134765625, 6.7330322265625, 7.084716796875, 7.4364013671875, 7.7880859375, 8.1397705078125, 8.491455078125, 8.8431396484375, 9.19482421875, 9.5465087890625, 9.898193359375, 10.2498779296875, 10.6015625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 13.0, 12.0, 8.0, 21.0, 32.0, 35.0, 63.0, 102.0, 159.0, 253.0, 416.0, 804.0, 1399.0, 2894.0, 5766.0, 12863.0, 32104.0, 90996.0, 418502.0, 336029.0, 90100.0, 31527.0, 12667.0, 5673.0, 2778.0, 1446.0, 763.0, 473.0, 235.0, 148.0, 93.0, 44.0, 50.0, 26.0, 15.0, 16.0, 11.0, 6.0, 6.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.962890625, -1.90679931640625, -1.8507080078125, -1.79461669921875, -1.738525390625, -1.68243408203125, -1.6263427734375, -1.57025146484375, -1.51416015625, -1.45806884765625, -1.4019775390625, -1.34588623046875, -1.289794921875, -1.23370361328125, -1.1776123046875, -1.12152099609375, -1.0654296875, -1.00933837890625, -0.9532470703125, -0.89715576171875, -0.841064453125, -0.78497314453125, -0.7288818359375, -0.67279052734375, -0.61669921875, -0.56060791015625, -0.5045166015625, -0.44842529296875, -0.392333984375, -0.33624267578125, -0.2801513671875, -0.22406005859375, -0.16796875, -0.11187744140625, -0.0557861328125, 0.00030517578125, 0.056396484375, 0.11248779296875, 0.1685791015625, 0.22467041015625, 0.28076171875, 0.33685302734375, 0.3929443359375, 0.44903564453125, 0.505126953125, 0.56121826171875, 0.6173095703125, 0.67340087890625, 0.7294921875, 0.78558349609375, 0.8416748046875, 0.89776611328125, 0.953857421875, 1.00994873046875, 1.0660400390625, 1.12213134765625, 1.17822265625, 1.23431396484375, 1.2904052734375, 1.34649658203125, 1.402587890625, 1.45867919921875, 1.5147705078125, 1.57086181640625, 1.626953125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 3.0, 2.0, 8.0, 2.0, 10.0, 14.0, 17.0, 12.0, 22.0, 54.0, 76.0, 91.0, 146.0, 146.0, 112.0, 93.0, 55.0, 44.0, 27.0, 20.0, 8.0, 11.0, 5.0, 5.0, 9.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0009098052978515625, -0.0008807331323623657, -0.0008516609668731689, -0.0008225888013839722, -0.0007935166358947754, -0.0007644444704055786, -0.0007353723049163818, -0.0007063001394271851, -0.0006772279739379883, -0.0006481558084487915, -0.0006190836429595947, -0.000590011477470398, -0.0005609393119812012, -0.0005318671464920044, -0.0005027949810028076, -0.00047372281551361084, -0.00044465065002441406, -0.0004155784845352173, -0.0003865063190460205, -0.00035743415355682373, -0.00032836198806762695, -0.0002992898225784302, -0.0002702176570892334, -0.00024114549160003662, -0.00021207332611083984, -0.00018300116062164307, -0.0001539289951324463, -0.0001248568296432495, -9.578466415405273e-05, -6.671249866485596e-05, -3.764033317565918e-05, -8.568167686462402e-06, 2.0503997802734375e-05, 4.957616329193115e-05, 7.864832878112793e-05, 0.00010772049427032471, 0.00013679265975952148, 0.00016586482524871826, 0.00019493699073791504, 0.00022400915622711182, 0.0002530813217163086, 0.00028215348720550537, 0.00031122565269470215, 0.0003402978181838989, 0.0003693699836730957, 0.0003984421491622925, 0.00042751431465148926, 0.00045658648014068604, 0.0004856586456298828, 0.0005147308111190796, 0.0005438029766082764, 0.0005728751420974731, 0.0006019473075866699, 0.0006310194730758667, 0.0006600916385650635, 0.0006891638040542603, 0.000718235969543457, 0.0007473081350326538, 0.0007763803005218506, 0.0008054524660110474, 0.0008345246315002441, 0.0008635967969894409, 0.0008926689624786377, 0.0009217411279678345, 0.0009508132934570312]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 8.0, 14.0, 14.0, 26.0, 53.0, 88.0, 173.0, 361.0, 704.0, 1642.0, 4646.0, 14760.0, 57730.0, 285811.0, 566907.0, 85566.0, 20195.0, 6002.0, 2136.0, 885.0, 432.0, 193.0, 87.0, 62.0, 28.0, 17.0, 9.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.64453125, -2.5595703125, -2.474609375, -2.3896484375, -2.3046875, -2.2197265625, -2.134765625, -2.0498046875, -1.96484375, -1.8798828125, -1.794921875, -1.7099609375, -1.625, -1.5400390625, -1.455078125, -1.3701171875, -1.28515625, -1.2001953125, -1.115234375, -1.0302734375, -0.9453125, -0.8603515625, -0.775390625, -0.6904296875, -0.60546875, -0.5205078125, -0.435546875, -0.3505859375, -0.265625, -0.1806640625, -0.095703125, -0.0107421875, 0.07421875, 0.1591796875, 0.244140625, 0.3291015625, 0.4140625, 0.4990234375, 0.583984375, 0.6689453125, 0.75390625, 0.8388671875, 0.923828125, 1.0087890625, 1.09375, 1.1787109375, 1.263671875, 1.3486328125, 1.43359375, 1.5185546875, 1.603515625, 1.6884765625, 1.7734375, 1.8583984375, 1.943359375, 2.0283203125, 2.11328125, 2.1982421875, 2.283203125, 2.3681640625, 2.453125, 2.5380859375, 2.623046875, 2.7080078125, 2.79296875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 6.0, 4.0, 16.0, 13.0, 22.0, 16.0, 27.0, 31.0, 39.0, 55.0, 54.0, 84.0, 79.0, 72.0, 86.0, 74.0, 72.0, 59.0, 32.0, 28.0, 26.0, 18.0, 15.0, 17.0, 10.0, 8.0, 5.0, 4.0, 6.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1484375, -2.078094482421875, -2.00775146484375, -1.937408447265625, -1.8670654296875, -1.796722412109375, -1.72637939453125, -1.656036376953125, -1.585693359375, -1.515350341796875, -1.44500732421875, -1.374664306640625, -1.3043212890625, -1.233978271484375, -1.16363525390625, -1.093292236328125, -1.02294921875, -0.952606201171875, -0.88226318359375, -0.811920166015625, -0.7415771484375, -0.671234130859375, -0.60089111328125, -0.530548095703125, -0.460205078125, -0.389862060546875, -0.31951904296875, -0.249176025390625, -0.1788330078125, -0.108489990234375, -0.03814697265625, 0.032196044921875, 0.1025390625, 0.172882080078125, 0.24322509765625, 0.313568115234375, 0.3839111328125, 0.454254150390625, 0.52459716796875, 0.594940185546875, 0.665283203125, 0.735626220703125, 0.80596923828125, 0.876312255859375, 0.9466552734375, 1.016998291015625, 1.08734130859375, 1.157684326171875, 1.22802734375, 1.298370361328125, 1.36871337890625, 1.439056396484375, 1.5093994140625, 1.579742431640625, 1.65008544921875, 1.720428466796875, 1.790771484375, 1.861114501953125, 1.93145751953125, 2.001800537109375, 2.0721435546875, 2.142486572265625, 2.21282958984375, 2.283172607421875, 2.353515625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 4.0, 1.0, 5.0, 7.0, 9.0, 20.0, 32.0, 82.0, 126.0, 257.0, 263.0, 107.0, 48.0, 18.0, 11.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.70498657226562, -81.24508666992188, -78.7851791381836, -76.32527923583984, -73.86537170410156, -71.40547180175781, -68.94557189941406, -66.48567199707031, -64.02576446533203, -61.565860748291016, -59.10595703125, -56.64605712890625, -54.186153411865234, -51.72624969482422, -49.26634979248047, -46.80644607543945, -44.34654235839844, -41.88663864135742, -39.426734924316406, -36.966835021972656, -34.50693130493164, -32.047027587890625, -29.587125778198242, -27.12722396850586, -24.667320251464844, -22.207416534423828, -19.747514724731445, -17.287612915039062, -14.827709197998047, -12.367806434631348, -9.907903671264648, -7.448001861572266, -4.98809814453125, -2.528195381164551, -0.06829261779785156, 2.3916101455688477, 4.851512908935547, 7.311415672302246, 9.771318435668945, 12.231220245361328, 14.691123962402344, 17.15102767944336, 19.610929489135742, 22.070831298828125, 24.53073501586914, 26.990638732910156, 29.45054054260254, 31.910442352294922, 34.37034606933594, 36.83024978637695, 39.29015350341797, 41.75005340576172, 44.209957122802734, 46.66986083984375, 49.1297607421875, 51.589664459228516, 54.04956817626953, 56.50947189331055, 58.96937561035156, 61.42927551269531, 63.88917922973633, 66.34908294677734, 68.8089828491211, 71.26889038085938, 73.72879028320312]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 2.0, 6.0, 5.0, 8.0, 14.0, 5.0, 14.0, 12.0, 15.0, 15.0, 25.0, 20.0, 20.0, 32.0, 28.0, 30.0, 28.0, 38.0, 45.0, 57.0, 61.0, 60.0, 74.0, 43.0, 33.0, 40.0, 27.0, 28.0, 22.0, 14.0, 15.0, 18.0, 18.0, 19.0, 9.0, 18.0, 9.0, 10.0, 10.0, 9.0, 10.0, 6.0, 4.0, 6.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-31.554216384887695, -30.53770637512207, -29.521196365356445, -28.50468635559082, -27.488174438476562, -26.471664428710938, -25.455154418945312, -24.438644409179688, -23.422134399414062, -22.405624389648438, -21.389114379882812, -20.372604370117188, -19.356094360351562, -18.339584350585938, -17.32307243347168, -16.306562423706055, -15.29005241394043, -14.273542404174805, -13.25703239440918, -12.240521430969238, -11.224011421203613, -10.207501411437988, -9.190990447998047, -8.174480438232422, -7.157970428466797, -6.141460418701172, -5.124949932098389, -4.1084394454956055, -3.0919294357299805, -2.0754194259643555, -1.0589089393615723, -0.04239845275878906, 0.9741096496582031, 1.9906198978424072, 3.0071301460266113, 4.0236406326293945, 5.0401506423950195, 6.0566606521606445, 7.073171138763428, 8.089681625366211, 9.106191635131836, 10.122701644897461, 11.139211654663086, 12.155722618103027, 13.172232627868652, 14.188742637634277, 15.205253601074219, 16.221763610839844, 17.23827362060547, 18.254783630371094, 19.27129364013672, 20.287803649902344, 21.30431365966797, 22.320823669433594, 23.33733558654785, 24.353845596313477, 25.3703556060791, 26.386865615844727, 27.40337562561035, 28.419885635375977, 29.436397552490234, 30.45290756225586, 31.469417572021484, 32.48592758178711, 33.502437591552734]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 1.0, 3.0, 7.0, 8.0, 8.0, 11.0, 15.0, 24.0, 43.0, 80.0, 172.0, 495.0, 1246.0, 4243.0, 18424.0, 206570.0, 3630039.0, 302969.0, 22544.0, 4852.0, 1489.0, 529.0, 241.0, 119.0, 54.0, 38.0, 17.0, 12.0, 16.0, 5.0, 4.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.171875, -8.91387939453125, -8.6558837890625, -8.39788818359375, -8.139892578125, -7.88189697265625, -7.6239013671875, -7.36590576171875, -7.10791015625, -6.84991455078125, -6.5919189453125, -6.33392333984375, -6.075927734375, -5.81793212890625, -5.5599365234375, -5.30194091796875, -5.0439453125, -4.78594970703125, -4.5279541015625, -4.26995849609375, -4.011962890625, -3.75396728515625, -3.4959716796875, -3.23797607421875, -2.97998046875, -2.72198486328125, -2.4639892578125, -2.20599365234375, -1.947998046875, -1.69000244140625, -1.4320068359375, -1.17401123046875, -0.916015625, -0.65802001953125, -0.4000244140625, -0.14202880859375, 0.115966796875, 0.37396240234375, 0.6319580078125, 0.88995361328125, 1.14794921875, 1.40594482421875, 1.6639404296875, 1.92193603515625, 2.179931640625, 2.43792724609375, 2.6959228515625, 2.95391845703125, 3.2119140625, 3.46990966796875, 3.7279052734375, 3.98590087890625, 4.243896484375, 4.50189208984375, 4.7598876953125, 5.01788330078125, 5.27587890625, 5.53387451171875, 5.7918701171875, 6.04986572265625, 6.307861328125, 6.56585693359375, 6.8238525390625, 7.08184814453125, 7.33984375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 7.0, 2.0, 7.0, 9.0, 15.0, 6.0, 17.0, 16.0, 17.0, 27.0, 28.0, 29.0, 34.0, 38.0, 49.0, 44.0, 45.0, 57.0, 51.0, 50.0, 48.0, 45.0, 46.0, 47.0, 35.0, 35.0, 35.0, 27.0, 27.0, 20.0, 15.0, 15.0, 13.0, 16.0, 8.0, 9.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.015625, -2.927154541015625, -2.83868408203125, -2.750213623046875, -2.6617431640625, -2.573272705078125, -2.48480224609375, -2.396331787109375, -2.307861328125, -2.219390869140625, -2.13092041015625, -2.042449951171875, -1.9539794921875, -1.865509033203125, -1.77703857421875, -1.688568115234375, -1.60009765625, -1.511627197265625, -1.42315673828125, -1.334686279296875, -1.2462158203125, -1.157745361328125, -1.06927490234375, -0.980804443359375, -0.892333984375, -0.803863525390625, -0.71539306640625, -0.626922607421875, -0.5384521484375, -0.449981689453125, -0.36151123046875, -0.273040771484375, -0.1845703125, -0.096099853515625, -0.00762939453125, 0.080841064453125, 0.1693115234375, 0.257781982421875, 0.34625244140625, 0.434722900390625, 0.523193359375, 0.611663818359375, 0.70013427734375, 0.788604736328125, 0.8770751953125, 0.965545654296875, 1.05401611328125, 1.142486572265625, 1.23095703125, 1.319427490234375, 1.40789794921875, 1.496368408203125, 1.5848388671875, 1.673309326171875, 1.76177978515625, 1.850250244140625, 1.938720703125, 2.027191162109375, 2.11566162109375, 2.204132080078125, 2.2926025390625, 2.381072998046875, 2.46954345703125, 2.558013916015625, 2.646484375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 26.0, 36.0, 82.0, 182.0, 360.0, 1084.0, 9929.0, 2751260.0, 1421442.0, 8182.0, 980.0, 349.0, 155.0, 97.0, 48.0, 25.0, 18.0, 9.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.578125, -17.913818359375, -17.24951171875, -16.585205078125, -15.9208984375, -15.256591796875, -14.59228515625, -13.927978515625, -13.263671875, -12.599365234375, -11.93505859375, -11.270751953125, -10.6064453125, -9.942138671875, -9.27783203125, -8.613525390625, -7.94921875, -7.284912109375, -6.62060546875, -5.956298828125, -5.2919921875, -4.627685546875, -3.96337890625, -3.299072265625, -2.634765625, -1.970458984375, -1.30615234375, -0.641845703125, 0.0224609375, 0.686767578125, 1.35107421875, 2.015380859375, 2.6796875, 3.343994140625, 4.00830078125, 4.672607421875, 5.3369140625, 6.001220703125, 6.66552734375, 7.329833984375, 7.994140625, 8.658447265625, 9.32275390625, 9.987060546875, 10.6513671875, 11.315673828125, 11.97998046875, 12.644287109375, 13.30859375, 13.972900390625, 14.63720703125, 15.301513671875, 15.9658203125, 16.630126953125, 17.29443359375, 17.958740234375, 18.623046875, 19.287353515625, 19.95166015625, 20.615966796875, 21.2802734375, 21.944580078125, 22.60888671875, 23.273193359375, 23.9375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 9.0, 8.0, 13.0, 21.0, 32.0, 37.0, 79.0, 149.0, 318.0, 744.0, 1184.0, 752.0, 350.0, 167.0, 77.0, 47.0, 24.0, 18.0, 12.0, 9.0, 9.0, 2.0, 5.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.26171875, -6.96490478515625, -6.6680908203125, -6.37127685546875, -6.074462890625, -5.77764892578125, -5.4808349609375, -5.18402099609375, -4.88720703125, -4.59039306640625, -4.2935791015625, -3.99676513671875, -3.699951171875, -3.40313720703125, -3.1063232421875, -2.80950927734375, -2.5126953125, -2.21588134765625, -1.9190673828125, -1.62225341796875, -1.325439453125, -1.02862548828125, -0.7318115234375, -0.43499755859375, -0.13818359375, 0.15863037109375, 0.4554443359375, 0.75225830078125, 1.049072265625, 1.34588623046875, 1.6427001953125, 1.93951416015625, 2.236328125, 2.53314208984375, 2.8299560546875, 3.12677001953125, 3.423583984375, 3.72039794921875, 4.0172119140625, 4.31402587890625, 4.61083984375, 4.90765380859375, 5.2044677734375, 5.50128173828125, 5.798095703125, 6.09490966796875, 6.3917236328125, 6.68853759765625, 6.9853515625, 7.28216552734375, 7.5789794921875, 7.87579345703125, 8.172607421875, 8.46942138671875, 8.7662353515625, 9.06304931640625, 9.35986328125, 9.65667724609375, 9.9534912109375, 10.25030517578125, 10.547119140625, 10.84393310546875, 11.1407470703125, 11.43756103515625, 11.734375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 10.0, 18.0, 54.0, 73.0, 105.0, 145.0, 189.0, 141.0, 114.0, 62.0, 31.0, 23.0, 9.0, 8.0, 8.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.0606689453125, -90.87197875976562, -88.68328857421875, -86.4946060180664, -84.30591583251953, -82.11722564697266, -79.92854309082031, -77.73985290527344, -75.55116271972656, -73.36247253417969, -71.17378234863281, -68.98509979248047, -66.7964096069336, -64.60771942138672, -62.41903305053711, -60.2303466796875, -58.041656494140625, -55.85296630859375, -53.66427993774414, -51.47559356689453, -49.286903381347656, -47.09821319580078, -44.90952682495117, -42.72084045410156, -40.53215026855469, -38.34346008300781, -36.1547737121582, -33.966087341308594, -31.77739715576172, -29.588708877563477, -27.400020599365234, -25.211332321166992, -23.02264404296875, -20.833955764770508, -18.645267486572266, -16.456579208374023, -14.267890930175781, -12.079202651977539, -9.890514373779297, -7.701826095581055, -5.5131378173828125, -3.3244495391845703, -1.1357612609863281, 1.052927017211914, 3.2416152954101562, 5.430303573608398, 7.618991851806641, 9.807680130004883, 11.996368408203125, 14.185056686401367, 16.37374496459961, 18.56243324279785, 20.751121520996094, 22.939809799194336, 25.128498077392578, 27.31718635559082, 29.505874633789062, 31.694562911987305, 33.88325119018555, 36.071937561035156, 38.26062774658203, 40.449317932128906, 42.638004302978516, 44.826690673828125, 47.015380859375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 5.0, 7.0, 2.0, 8.0, 6.0, 10.0, 14.0, 13.0, 25.0, 26.0, 34.0, 33.0, 53.0, 59.0, 56.0, 47.0, 55.0, 46.0, 50.0, 56.0, 46.0, 39.0, 40.0, 49.0, 30.0, 35.0, 33.0, 22.0, 26.0, 16.0, 16.0, 10.0, 8.0, 10.0, 5.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.73828887939453, -34.621551513671875, -33.504817962646484, -32.388084411621094, -31.271347045898438, -30.154611587524414, -29.03787612915039, -27.921140670776367, -26.804405212402344, -25.68766975402832, -24.570934295654297, -23.454198837280273, -22.33746337890625, -21.220727920532227, -20.103992462158203, -18.98725700378418, -17.870521545410156, -16.753786087036133, -15.63705062866211, -14.520315170288086, -13.403579711914062, -12.286844253540039, -11.170108795166016, -10.053373336791992, -8.936637878417969, -7.819902420043945, -6.703166961669922, -5.586431503295898, -4.469696044921875, -3.3529605865478516, -2.236225128173828, -1.1194896697998047, -0.002750396728515625, 1.1139850616455078, 2.2307205200195312, 3.3474559783935547, 4.464191436767578, 5.580926895141602, 6.697662353515625, 7.814397811889648, 8.931133270263672, 10.047868728637695, 11.164604187011719, 12.281339645385742, 13.398075103759766, 14.514810562133789, 15.631546020507812, 16.748281478881836, 17.86501693725586, 18.981752395629883, 20.098487854003906, 21.21522331237793, 22.331958770751953, 23.448694229125977, 24.5654296875, 25.682165145874023, 26.798900604248047, 27.91563606262207, 29.032371520996094, 30.149106979370117, 31.26584243774414, 32.38257598876953, 33.49931335449219, 34.616050720214844, 35.732784271240234]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 14.0, 10.0, 14.0, 56.0, 90.0, 165.0, 392.0, 1051.0, 3017.0, 10336.0, 49125.0, 328098.0, 544558.0, 88188.0, 16695.0, 4326.0, 1369.0, 591.0, 234.0, 104.0, 50.0, 30.0, 15.0, 11.0, 8.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.28125, -8.0067138671875, -7.732177734375, -7.4576416015625, -7.18310546875, -6.9085693359375, -6.634033203125, -6.3594970703125, -6.0849609375, -5.8104248046875, -5.535888671875, -5.2613525390625, -4.98681640625, -4.7122802734375, -4.437744140625, -4.1632080078125, -3.888671875, -3.6141357421875, -3.339599609375, -3.0650634765625, -2.79052734375, -2.5159912109375, -2.241455078125, -1.9669189453125, -1.6923828125, -1.4178466796875, -1.143310546875, -0.8687744140625, -0.59423828125, -0.3197021484375, -0.045166015625, 0.2293701171875, 0.50390625, 0.7784423828125, 1.052978515625, 1.3275146484375, 1.60205078125, 1.8765869140625, 2.151123046875, 2.4256591796875, 2.7001953125, 2.9747314453125, 3.249267578125, 3.5238037109375, 3.79833984375, 4.0728759765625, 4.347412109375, 4.6219482421875, 4.896484375, 5.1710205078125, 5.445556640625, 5.7200927734375, 5.99462890625, 6.2691650390625, 6.543701171875, 6.8182373046875, 7.0927734375, 7.3673095703125, 7.641845703125, 7.9163818359375, 8.19091796875, 8.4654541015625, 8.739990234375, 9.0145263671875, 9.2890625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 5.0, 8.0, 8.0, 11.0, 9.0, 7.0, 18.0, 25.0, 16.0, 25.0, 29.0, 37.0, 38.0, 39.0, 42.0, 31.0, 48.0, 41.0, 45.0, 44.0, 47.0, 53.0, 47.0, 47.0, 40.0, 31.0, 32.0, 29.0, 25.0, 24.0, 22.0, 15.0, 15.0, 11.0, 7.0, 9.0, 7.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.041015625, -2.94915771484375, -2.8572998046875, -2.76544189453125, -2.673583984375, -2.58172607421875, -2.4898681640625, -2.39801025390625, -2.30615234375, -2.21429443359375, -2.1224365234375, -2.03057861328125, -1.938720703125, -1.84686279296875, -1.7550048828125, -1.66314697265625, -1.5712890625, -1.47943115234375, -1.3875732421875, -1.29571533203125, -1.203857421875, -1.11199951171875, -1.0201416015625, -0.92828369140625, -0.83642578125, -0.74456787109375, -0.6527099609375, -0.56085205078125, -0.468994140625, -0.37713623046875, -0.2852783203125, -0.19342041015625, -0.1015625, -0.00970458984375, 0.0821533203125, 0.17401123046875, 0.265869140625, 0.35772705078125, 0.4495849609375, 0.54144287109375, 0.63330078125, 0.72515869140625, 0.8170166015625, 0.90887451171875, 1.000732421875, 1.09259033203125, 1.1844482421875, 1.27630615234375, 1.3681640625, 1.46002197265625, 1.5518798828125, 1.64373779296875, 1.735595703125, 1.82745361328125, 1.9193115234375, 2.01116943359375, 2.10302734375, 2.19488525390625, 2.2867431640625, 2.37860107421875, 2.470458984375, 2.56231689453125, 2.6541748046875, 2.74603271484375, 2.837890625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 12.0, 5.0, 19.0, 25.0, 27.0, 32.0, 59.0, 89.0, 143.0, 201.0, 363.0, 667.0, 1414.0, 4193.0, 18018.0, 140661.0, 778332.0, 85434.0, 12858.0, 3364.0, 1184.0, 584.0, 310.0, 194.0, 113.0, 96.0, 51.0, 34.0, 21.0, 14.0, 17.0, 7.0, 1.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.8671875, -8.53125, -8.1953125, -7.859375, -7.5234375, -7.1875, -6.8515625, -6.515625, -6.1796875, -5.84375, -5.5078125, -5.171875, -4.8359375, -4.5, -4.1640625, -3.828125, -3.4921875, -3.15625, -2.8203125, -2.484375, -2.1484375, -1.8125, -1.4765625, -1.140625, -0.8046875, -0.46875, -0.1328125, 0.203125, 0.5390625, 0.875, 1.2109375, 1.546875, 1.8828125, 2.21875, 2.5546875, 2.890625, 3.2265625, 3.5625, 3.8984375, 4.234375, 4.5703125, 4.90625, 5.2421875, 5.578125, 5.9140625, 6.25, 6.5859375, 6.921875, 7.2578125, 7.59375, 7.9296875, 8.265625, 8.6015625, 8.9375, 9.2734375, 9.609375, 9.9453125, 10.28125, 10.6171875, 10.953125, 11.2890625, 11.625, 11.9609375, 12.296875, 12.6328125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 1.0, 5.0, 7.0, 7.0, 7.0, 8.0, 12.0, 11.0, 18.0, 21.0, 15.0, 22.0, 21.0, 28.0, 39.0, 41.0, 46.0, 47.0, 58.0, 56.0, 49.0, 51.0, 57.0, 44.0, 64.0, 42.0, 37.0, 31.0, 35.0, 23.0, 18.0, 14.0, 16.0, 13.0, 9.0, 4.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.859375, -10.48583984375, -10.1123046875, -9.73876953125, -9.365234375, -8.99169921875, -8.6181640625, -8.24462890625, -7.87109375, -7.49755859375, -7.1240234375, -6.75048828125, -6.376953125, -6.00341796875, -5.6298828125, -5.25634765625, -4.8828125, -4.50927734375, -4.1357421875, -3.76220703125, -3.388671875, -3.01513671875, -2.6416015625, -2.26806640625, -1.89453125, -1.52099609375, -1.1474609375, -0.77392578125, -0.400390625, -0.02685546875, 0.3466796875, 0.72021484375, 1.09375, 1.46728515625, 1.8408203125, 2.21435546875, 2.587890625, 2.96142578125, 3.3349609375, 3.70849609375, 4.08203125, 4.45556640625, 4.8291015625, 5.20263671875, 5.576171875, 5.94970703125, 6.3232421875, 6.69677734375, 7.0703125, 7.44384765625, 7.8173828125, 8.19091796875, 8.564453125, 8.93798828125, 9.3115234375, 9.68505859375, 10.05859375, 10.43212890625, 10.8056640625, 11.17919921875, 11.552734375, 11.92626953125, 12.2998046875, 12.67333984375, 13.046875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 15.0, 16.0, 17.0, 18.0, 44.0, 48.0, 90.0, 156.0, 204.0, 405.0, 722.0, 1345.0, 2907.0, 6967.0, 19566.0, 66449.0, 604786.0, 266721.0, 51024.0, 15863.0, 5925.0, 2598.0, 1165.0, 595.0, 343.0, 218.0, 114.0, 70.0, 60.0, 37.0, 17.0, 19.0, 8.0, 4.0, 5.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.044921875, -2.960113525390625, -2.87530517578125, -2.790496826171875, -2.7056884765625, -2.620880126953125, -2.53607177734375, -2.451263427734375, -2.366455078125, -2.281646728515625, -2.19683837890625, -2.112030029296875, -2.0272216796875, -1.942413330078125, -1.85760498046875, -1.772796630859375, -1.68798828125, -1.603179931640625, -1.51837158203125, -1.433563232421875, -1.3487548828125, -1.263946533203125, -1.17913818359375, -1.094329833984375, -1.009521484375, -0.924713134765625, -0.83990478515625, -0.755096435546875, -0.6702880859375, -0.585479736328125, -0.50067138671875, -0.415863037109375, -0.3310546875, -0.246246337890625, -0.16143798828125, -0.076629638671875, 0.0081787109375, 0.092987060546875, 0.17779541015625, 0.262603759765625, 0.347412109375, 0.432220458984375, 0.51702880859375, 0.601837158203125, 0.6866455078125, 0.771453857421875, 0.85626220703125, 0.941070556640625, 1.02587890625, 1.110687255859375, 1.19549560546875, 1.280303955078125, 1.3651123046875, 1.449920654296875, 1.53472900390625, 1.619537353515625, 1.704345703125, 1.789154052734375, 1.87396240234375, 1.958770751953125, 2.0435791015625, 2.128387451171875, 2.21319580078125, 2.298004150390625, 2.3828125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 6.0, 4.0, 3.0, 9.0, 6.0, 15.0, 29.0, 39.0, 62.0, 126.0, 252.0, 203.0, 93.0, 54.0, 30.0, 24.0, 12.0, 7.0, 7.0, 5.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0013713836669921875, -0.0013296008110046387, -0.0012878179550170898, -0.001246035099029541, -0.0012042522430419922, -0.0011624693870544434, -0.0011206865310668945, -0.0010789036750793457, -0.0010371208190917969, -0.000995337963104248, -0.0009535551071166992, -0.0009117722511291504, -0.0008699893951416016, -0.0008282065391540527, -0.0007864236831665039, -0.0007446408271789551, -0.0007028579711914062, -0.0006610751152038574, -0.0006192922592163086, -0.0005775094032287598, -0.0005357265472412109, -0.0004939436912536621, -0.0004521608352661133, -0.00041037797927856445, -0.0003685951232910156, -0.0003268122673034668, -0.00028502941131591797, -0.00024324655532836914, -0.0002014636993408203, -0.00015968084335327148, -0.00011789798736572266, -7.611513137817383e-05, -3.4332275390625e-05, 7.450580596923828e-06, 4.9233436584472656e-05, 9.101629257202148e-05, 0.0001327991485595703, 0.00017458200454711914, 0.00021636486053466797, 0.0002581477165222168, 0.0002999305725097656, 0.00034171342849731445, 0.0003834962844848633, 0.0004252791404724121, 0.00046706199645996094, 0.0005088448524475098, 0.0005506277084350586, 0.0005924105644226074, 0.0006341934204101562, 0.0006759762763977051, 0.0007177591323852539, 0.0007595419883728027, 0.0008013248443603516, 0.0008431077003479004, 0.0008848905563354492, 0.000926673412322998, 0.0009684562683105469, 0.0010102391242980957, 0.0010520219802856445, 0.0010938048362731934, 0.0011355876922607422, 0.001177370548248291, 0.0012191534042358398, 0.0012609362602233887, 0.0013027191162109375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 10.0, 27.0, 26.0, 46.0, 37.0, 69.0, 130.0, 200.0, 296.0, 542.0, 998.0, 1861.0, 4145.0, 10466.0, 33125.0, 144833.0, 706200.0, 103557.0, 25972.0, 8715.0, 3622.0, 1675.0, 788.0, 443.0, 273.0, 165.0, 112.0, 76.0, 41.0, 35.0, 25.0, 18.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.998046875, -2.905517578125, -2.81298828125, -2.720458984375, -2.6279296875, -2.535400390625, -2.44287109375, -2.350341796875, -2.2578125, -2.165283203125, -2.07275390625, -1.980224609375, -1.8876953125, -1.795166015625, -1.70263671875, -1.610107421875, -1.517578125, -1.425048828125, -1.33251953125, -1.239990234375, -1.1474609375, -1.054931640625, -0.96240234375, -0.869873046875, -0.77734375, -0.684814453125, -0.59228515625, -0.499755859375, -0.4072265625, -0.314697265625, -0.22216796875, -0.129638671875, -0.037109375, 0.055419921875, 0.14794921875, 0.240478515625, 0.3330078125, 0.425537109375, 0.51806640625, 0.610595703125, 0.703125, 0.795654296875, 0.88818359375, 0.980712890625, 1.0732421875, 1.165771484375, 1.25830078125, 1.350830078125, 1.443359375, 1.535888671875, 1.62841796875, 1.720947265625, 1.8134765625, 1.906005859375, 1.99853515625, 2.091064453125, 2.18359375, 2.276123046875, 2.36865234375, 2.461181640625, 2.5537109375, 2.646240234375, 2.73876953125, 2.831298828125, 2.923828125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 7.0, 9.0, 9.0, 11.0, 17.0, 25.0, 31.0, 31.0, 45.0, 76.0, 116.0, 165.0, 137.0, 92.0, 63.0, 42.0, 34.0, 21.0, 11.0, 12.0, 16.0, 8.0, 7.0, 4.0, 2.0, 1.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.37890625, -2.2740478515625, -2.169189453125, -2.0643310546875, -1.95947265625, -1.8546142578125, -1.749755859375, -1.6448974609375, -1.5400390625, -1.4351806640625, -1.330322265625, -1.2254638671875, -1.12060546875, -1.0157470703125, -0.910888671875, -0.8060302734375, -0.701171875, -0.5963134765625, -0.491455078125, -0.3865966796875, -0.28173828125, -0.1768798828125, -0.072021484375, 0.0328369140625, 0.1376953125, 0.2425537109375, 0.347412109375, 0.4522705078125, 0.55712890625, 0.6619873046875, 0.766845703125, 0.8717041015625, 0.9765625, 1.0814208984375, 1.186279296875, 1.2911376953125, 1.39599609375, 1.5008544921875, 1.605712890625, 1.7105712890625, 1.8154296875, 1.9202880859375, 2.025146484375, 2.1300048828125, 2.23486328125, 2.3397216796875, 2.444580078125, 2.5494384765625, 2.654296875, 2.7591552734375, 2.864013671875, 2.9688720703125, 3.07373046875, 3.1785888671875, 3.283447265625, 3.3883056640625, 3.4931640625, 3.5980224609375, 3.702880859375, 3.8077392578125, 3.91259765625, 4.0174560546875, 4.122314453125, 4.2271728515625, 4.33203125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 9.0, 19.0, 19.0, 48.0, 71.0, 125.0, 283.0, 220.0, 101.0, 52.0, 25.0, 11.0, 7.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.37322998046875, -61.88349914550781, -59.393768310546875, -56.90403747558594, -54.414306640625, -51.92457580566406, -49.43484115600586, -46.94511032104492, -44.455379486083984, -41.96564865112305, -39.47591781616211, -36.98618698120117, -34.49645233154297, -32.00672149658203, -29.516990661621094, -27.027259826660156, -24.53752899169922, -22.04779815673828, -19.558067321777344, -17.068334579467773, -14.578603744506836, -12.088872909545898, -9.599141120910645, -7.109409332275391, -4.619678497314453, -2.1299471855163574, 0.3597841262817383, 2.849515438079834, 5.33924674987793, 7.828977584838867, 10.318709373474121, 12.808441162109375, 15.298171997070312, 17.78790283203125, 20.277633666992188, 22.767366409301758, 25.257097244262695, 27.746828079223633, 30.236560821533203, 32.72629165649414, 35.21602249145508, 37.705753326416016, 40.19548416137695, 42.68521499633789, 45.174949645996094, 47.66468048095703, 50.15441131591797, 52.644142150878906, 55.133872985839844, 57.62360382080078, 60.11333465576172, 62.603065490722656, 65.0927963256836, 67.58252716064453, 70.07225799560547, 72.56199645996094, 75.05172729492188, 77.54145812988281, 80.03118896484375, 82.52091979980469, 85.01065063476562, 87.50038146972656, 89.9901123046875, 92.47984313964844, 94.96957397460938]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 1.0, 1.0, 6.0, 6.0, 13.0, 9.0, 8.0, 8.0, 15.0, 14.0, 18.0, 13.0, 18.0, 25.0, 18.0, 24.0, 21.0, 32.0, 30.0, 44.0, 56.0, 77.0, 98.0, 80.0, 58.0, 42.0, 27.0, 31.0, 16.0, 27.0, 23.0, 25.0, 14.0, 10.0, 13.0, 14.0, 9.0, 10.0, 8.0, 8.0, 7.0, 7.0, 4.0, 5.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.349151611328125, -38.01227569580078, -36.6754035949707, -35.33852767944336, -34.001651763916016, -32.66477966308594, -31.327903747558594, -29.991029739379883, -28.654155731201172, -27.31728172302246, -25.980405807495117, -24.643531799316406, -23.306657791137695, -21.969783782958984, -20.63290786743164, -19.29603385925293, -17.959157943725586, -16.622283935546875, -15.285408973693848, -13.94853401184082, -12.61166000366211, -11.274785041809082, -9.937910079956055, -8.601036071777344, -7.264161109924316, -5.927286624908447, -4.590412139892578, -3.253537178039551, -1.9166626930236816, -0.5797882080078125, 0.7570867538452148, 2.093960762023926, 3.430835723876953, 4.767710208892822, 6.104584693908691, 7.441459655761719, 8.77833366394043, 10.115208625793457, 11.452083587646484, 12.788957595825195, 14.125832557678223, 15.46270751953125, 16.79958152770996, 18.136455535888672, 19.473331451416016, 20.810205459594727, 22.147079467773438, 23.48395538330078, 24.820829391479492, 26.157703399658203, 27.494579315185547, 28.831453323364258, 30.16832733154297, 31.505203247070312, 32.842079162597656, 34.178951263427734, 35.51582717895508, 36.85270309448242, 38.1895751953125, 39.526451110839844, 40.86332702636719, 42.200199127197266, 43.53707504272461, 44.87394714355469, 46.21082305908203]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 0.0, 2.0, 6.0, 9.0, 18.0, 22.0, 34.0, 39.0, 78.0, 134.0, 347.0, 845.0, 2740.0, 13030.0, 164695.0, 3698256.0, 291817.0, 17061.0, 3424.0, 984.0, 395.0, 145.0, 62.0, 42.0, 37.0, 15.0, 8.0, 10.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.5625, -11.2374267578125, -10.912353515625, -10.5872802734375, -10.26220703125, -9.9371337890625, -9.612060546875, -9.2869873046875, -8.9619140625, -8.6368408203125, -8.311767578125, -7.9866943359375, -7.66162109375, -7.3365478515625, -7.011474609375, -6.6864013671875, -6.361328125, -6.0362548828125, -5.711181640625, -5.3861083984375, -5.06103515625, -4.7359619140625, -4.410888671875, -4.0858154296875, -3.7607421875, -3.4356689453125, -3.110595703125, -2.7855224609375, -2.46044921875, -2.1353759765625, -1.810302734375, -1.4852294921875, -1.16015625, -0.8350830078125, -0.510009765625, -0.1849365234375, 0.14013671875, 0.4652099609375, 0.790283203125, 1.1153564453125, 1.4404296875, 1.7655029296875, 2.090576171875, 2.4156494140625, 2.74072265625, 3.0657958984375, 3.390869140625, 3.7159423828125, 4.041015625, 4.3660888671875, 4.691162109375, 5.0162353515625, 5.34130859375, 5.6663818359375, 5.991455078125, 6.3165283203125, 6.6416015625, 6.9666748046875, 7.291748046875, 7.6168212890625, 7.94189453125, 8.2669677734375, 8.592041015625, 8.9171142578125, 9.2421875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 8.0, 4.0, 10.0, 5.0, 10.0, 14.0, 9.0, 12.0, 23.0, 20.0, 25.0, 31.0, 36.0, 36.0, 40.0, 45.0, 38.0, 55.0, 54.0, 45.0, 55.0, 53.0, 51.0, 44.0, 41.0, 37.0, 36.0, 33.0, 31.0, 18.0, 13.0, 23.0, 12.0, 15.0, 7.0, 6.0, 7.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.994140625, -2.8956298828125, -2.797119140625, -2.6986083984375, -2.60009765625, -2.5015869140625, -2.403076171875, -2.3045654296875, -2.2060546875, -2.1075439453125, -2.009033203125, -1.9105224609375, -1.81201171875, -1.7135009765625, -1.614990234375, -1.5164794921875, -1.41796875, -1.3194580078125, -1.220947265625, -1.1224365234375, -1.02392578125, -0.9254150390625, -0.826904296875, -0.7283935546875, -0.6298828125, -0.5313720703125, -0.432861328125, -0.3343505859375, -0.23583984375, -0.1373291015625, -0.038818359375, 0.0596923828125, 0.158203125, 0.2567138671875, 0.355224609375, 0.4537353515625, 0.55224609375, 0.6507568359375, 0.749267578125, 0.8477783203125, 0.9462890625, 1.0447998046875, 1.143310546875, 1.2418212890625, 1.34033203125, 1.4388427734375, 1.537353515625, 1.6358642578125, 1.734375, 1.8328857421875, 1.931396484375, 2.0299072265625, 2.12841796875, 2.2269287109375, 2.325439453125, 2.4239501953125, 2.5224609375, 2.6209716796875, 2.719482421875, 2.8179931640625, 2.91650390625, 3.0150146484375, 3.113525390625, 3.2120361328125, 3.310546875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 6.0, 7.0, 9.0, 16.0, 13.0, 17.0, 23.0, 27.0, 53.0, 69.0, 108.0, 211.0, 335.0, 746.0, 1940.0, 10261.0, 189519.0, 3907852.0, 73696.0, 6446.0, 1479.0, 620.0, 304.0, 185.0, 103.0, 57.0, 42.0, 42.0, 26.0, 12.0, 13.0, 10.0, 11.0, 8.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0], "bins": [-16.546875, -16.0655517578125, -15.584228515625, -15.1029052734375, -14.62158203125, -14.1402587890625, -13.658935546875, -13.1776123046875, -12.6962890625, -12.2149658203125, -11.733642578125, -11.2523193359375, -10.77099609375, -10.2896728515625, -9.808349609375, -9.3270263671875, -8.845703125, -8.3643798828125, -7.883056640625, -7.4017333984375, -6.92041015625, -6.4390869140625, -5.957763671875, -5.4764404296875, -4.9951171875, -4.5137939453125, -4.032470703125, -3.5511474609375, -3.06982421875, -2.5885009765625, -2.107177734375, -1.6258544921875, -1.14453125, -0.6632080078125, -0.181884765625, 0.2994384765625, 0.78076171875, 1.2620849609375, 1.743408203125, 2.2247314453125, 2.7060546875, 3.1873779296875, 3.668701171875, 4.1500244140625, 4.63134765625, 5.1126708984375, 5.593994140625, 6.0753173828125, 6.556640625, 7.0379638671875, 7.519287109375, 8.0006103515625, 8.48193359375, 8.9632568359375, 9.444580078125, 9.9259033203125, 10.4072265625, 10.8885498046875, 11.369873046875, 11.8511962890625, 12.33251953125, 12.8138427734375, 13.295166015625, 13.7764892578125, 14.2578125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 3.0, 12.0, 10.0, 16.0, 29.0, 32.0, 42.0, 71.0, 101.0, 191.0, 391.0, 627.0, 914.0, 685.0, 426.0, 207.0, 96.0, 72.0, 46.0, 27.0, 22.0, 13.0, 9.0, 6.0, 8.0, 7.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.34375, -7.055419921875, -6.76708984375, -6.478759765625, -6.1904296875, -5.902099609375, -5.61376953125, -5.325439453125, -5.037109375, -4.748779296875, -4.46044921875, -4.172119140625, -3.8837890625, -3.595458984375, -3.30712890625, -3.018798828125, -2.73046875, -2.442138671875, -2.15380859375, -1.865478515625, -1.5771484375, -1.288818359375, -1.00048828125, -0.712158203125, -0.423828125, -0.135498046875, 0.15283203125, 0.441162109375, 0.7294921875, 1.017822265625, 1.30615234375, 1.594482421875, 1.8828125, 2.171142578125, 2.45947265625, 2.747802734375, 3.0361328125, 3.324462890625, 3.61279296875, 3.901123046875, 4.189453125, 4.477783203125, 4.76611328125, 5.054443359375, 5.3427734375, 5.631103515625, 5.91943359375, 6.207763671875, 6.49609375, 6.784423828125, 7.07275390625, 7.361083984375, 7.6494140625, 7.937744140625, 8.22607421875, 8.514404296875, 8.802734375, 9.091064453125, 9.37939453125, 9.667724609375, 9.9560546875, 10.244384765625, 10.53271484375, 10.821044921875, 11.109375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 5.0, 6.0, 12.0, 4.0, 10.0, 18.0, 21.0, 48.0, 61.0, 85.0, 102.0, 98.0, 111.0, 89.0, 88.0, 56.0, 41.0, 35.0, 24.0, 24.0, 14.0, 14.0, 5.0, 7.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.08250045776367, -56.4747314453125, -54.86695861816406, -53.25918960571289, -51.65142059326172, -50.04365158081055, -48.435882568359375, -46.82810974121094, -45.220340728759766, -43.612571716308594, -42.004798889160156, -40.397029876708984, -38.78926086425781, -37.18149185180664, -35.57372283935547, -33.96595001220703, -32.35818099975586, -30.750411987304688, -29.142641067504883, -27.534870147705078, -25.927101135253906, -24.319332122802734, -22.71156120300293, -21.103790283203125, -19.496021270751953, -17.88825225830078, -16.280481338500977, -14.672711372375488, -13.06494140625, -11.457171440124512, -9.849401473999023, -8.241631507873535, -6.633857727050781, -5.026087760925293, -3.4183177947998047, -1.8105478286743164, -0.20277786254882812, 1.4049921035766602, 3.0127620697021484, 4.620532035827637, 6.228302001953125, 7.836071968078613, 9.443841934204102, 11.05161190032959, 12.659381866455078, 14.267151832580566, 15.874921798706055, 17.48269271850586, 19.09046173095703, 20.698230743408203, 22.306001663208008, 23.913772583007812, 25.521541595458984, 27.129310607910156, 28.73708152770996, 30.344852447509766, 31.952621459960938, 33.56039047241211, 35.16815948486328, 36.77593231201172, 38.38370132446289, 39.99147033691406, 41.5992431640625, 43.20701217651367, 44.814781188964844]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 4.0, 3.0, 7.0, 6.0, 9.0, 7.0, 14.0, 9.0, 13.0, 15.0, 15.0, 26.0, 22.0, 18.0, 37.0, 36.0, 38.0, 56.0, 39.0, 39.0, 43.0, 42.0, 33.0, 41.0, 45.0, 33.0, 33.0, 47.0, 27.0, 43.0, 27.0, 21.0, 23.0, 28.0, 27.0, 19.0, 13.0, 9.0, 11.0, 2.0, 12.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-33.074668884277344, -31.95806884765625, -30.841468811035156, -29.724868774414062, -28.60826873779297, -27.491668701171875, -26.37506866455078, -25.258468627929688, -24.141868591308594, -23.0252685546875, -21.908668518066406, -20.792068481445312, -19.67546844482422, -18.558868408203125, -17.44226837158203, -16.325668334960938, -15.209066390991211, -14.092466354370117, -12.975866317749023, -11.85926628112793, -10.742666244506836, -9.626066207885742, -8.509465217590332, -7.392865180969238, -6.2762651443481445, -5.159665107727051, -4.043065071105957, -2.926464557647705, -1.8098645210266113, -0.6932644844055176, 0.4233360290527344, 1.5399360656738281, 2.656536102294922, 3.7731361389160156, 4.889736175537109, 6.006336688995361, 7.122936725616455, 8.23953628540039, 9.3561372756958, 10.472737312316895, 11.589337348937988, 12.705937385559082, 13.822537422180176, 14.939138412475586, 16.05573844909668, 17.172338485717773, 18.288938522338867, 19.40553855895996, 20.522138595581055, 21.63873863220215, 22.755338668823242, 23.871938705444336, 24.98853874206543, 26.105138778686523, 27.22174072265625, 28.338340759277344, 29.454940795898438, 30.57154083251953, 31.688140869140625, 32.80474090576172, 33.92134094238281, 35.037940979003906, 36.154541015625, 37.271141052246094, 38.38774108886719]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 4.0, 9.0, 4.0, 7.0, 15.0, 17.0, 24.0, 32.0, 55.0, 79.0, 86.0, 151.0, 169.0, 307.0, 500.0, 751.0, 1130.0, 1953.0, 3205.0, 5724.0, 10185.0, 19624.0, 39682.0, 88460.0, 219362.0, 345381.0, 171160.0, 70640.0, 32688.0, 16151.0, 8826.0, 4861.0, 2667.0, 1633.0, 1049.0, 662.0, 452.0, 285.0, 168.0, 136.0, 78.0, 59.0, 35.0, 28.0, 19.0, 18.0, 12.0, 6.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.15625, -4.01470947265625, -3.8731689453125, -3.73162841796875, -3.590087890625, -3.44854736328125, -3.3070068359375, -3.16546630859375, -3.02392578125, -2.88238525390625, -2.7408447265625, -2.59930419921875, -2.457763671875, -2.31622314453125, -2.1746826171875, -2.03314208984375, -1.8916015625, -1.75006103515625, -1.6085205078125, -1.46697998046875, -1.325439453125, -1.18389892578125, -1.0423583984375, -0.90081787109375, -0.75927734375, -0.61773681640625, -0.4761962890625, -0.33465576171875, -0.193115234375, -0.05157470703125, 0.0899658203125, 0.23150634765625, 0.373046875, 0.51458740234375, 0.6561279296875, 0.79766845703125, 0.939208984375, 1.08074951171875, 1.2222900390625, 1.36383056640625, 1.50537109375, 1.64691162109375, 1.7884521484375, 1.92999267578125, 2.071533203125, 2.21307373046875, 2.3546142578125, 2.49615478515625, 2.6376953125, 2.77923583984375, 2.9207763671875, 3.06231689453125, 3.203857421875, 3.34539794921875, 3.4869384765625, 3.62847900390625, 3.77001953125, 3.91156005859375, 4.0531005859375, 4.19464111328125, 4.336181640625, 4.47772216796875, 4.6192626953125, 4.76080322265625, 4.90234375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 1.0, 1.0, 9.0, 6.0, 14.0, 15.0, 9.0, 10.0, 19.0, 14.0, 21.0, 24.0, 31.0, 30.0, 35.0, 42.0, 43.0, 45.0, 62.0, 44.0, 58.0, 44.0, 34.0, 50.0, 37.0, 29.0, 36.0, 35.0, 23.0, 36.0, 27.0, 15.0, 15.0, 16.0, 18.0, 12.0, 14.0, 8.0, 8.0, 6.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.11328125, -3.01470947265625, -2.9161376953125, -2.81756591796875, -2.718994140625, -2.62042236328125, -2.5218505859375, -2.42327880859375, -2.32470703125, -2.22613525390625, -2.1275634765625, -2.02899169921875, -1.930419921875, -1.83184814453125, -1.7332763671875, -1.63470458984375, -1.5361328125, -1.43756103515625, -1.3389892578125, -1.24041748046875, -1.141845703125, -1.04327392578125, -0.9447021484375, -0.84613037109375, -0.74755859375, -0.64898681640625, -0.5504150390625, -0.45184326171875, -0.353271484375, -0.25469970703125, -0.1561279296875, -0.05755615234375, 0.041015625, 0.13958740234375, 0.2381591796875, 0.33673095703125, 0.435302734375, 0.53387451171875, 0.6324462890625, 0.73101806640625, 0.82958984375, 0.92816162109375, 1.0267333984375, 1.12530517578125, 1.223876953125, 1.32244873046875, 1.4210205078125, 1.51959228515625, 1.6181640625, 1.71673583984375, 1.8153076171875, 1.91387939453125, 2.012451171875, 2.11102294921875, 2.2095947265625, 2.30816650390625, 2.40673828125, 2.50531005859375, 2.6038818359375, 2.70245361328125, 2.801025390625, 2.89959716796875, 2.9981689453125, 3.09674072265625, 3.1953125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 5.0, 6.0, 10.0, 10.0, 15.0, 23.0, 21.0, 47.0, 61.0, 81.0, 105.0, 224.0, 278.0, 451.0, 795.0, 1582.0, 3674.0, 12752.0, 90053.0, 823811.0, 94419.0, 12913.0, 3736.0, 1469.0, 737.0, 444.0, 273.0, 166.0, 127.0, 77.0, 60.0, 41.0, 19.0, 19.0, 15.0, 10.0, 9.0, 5.0, 7.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.671875, -12.293701171875, -11.91552734375, -11.537353515625, -11.1591796875, -10.781005859375, -10.40283203125, -10.024658203125, -9.646484375, -9.268310546875, -8.89013671875, -8.511962890625, -8.1337890625, -7.755615234375, -7.37744140625, -6.999267578125, -6.62109375, -6.242919921875, -5.86474609375, -5.486572265625, -5.1083984375, -4.730224609375, -4.35205078125, -3.973876953125, -3.595703125, -3.217529296875, -2.83935546875, -2.461181640625, -2.0830078125, -1.704833984375, -1.32666015625, -0.948486328125, -0.5703125, -0.192138671875, 0.18603515625, 0.564208984375, 0.9423828125, 1.320556640625, 1.69873046875, 2.076904296875, 2.455078125, 2.833251953125, 3.21142578125, 3.589599609375, 3.9677734375, 4.345947265625, 4.72412109375, 5.102294921875, 5.48046875, 5.858642578125, 6.23681640625, 6.614990234375, 6.9931640625, 7.371337890625, 7.74951171875, 8.127685546875, 8.505859375, 8.884033203125, 9.26220703125, 9.640380859375, 10.0185546875, 10.396728515625, 10.77490234375, 11.153076171875, 11.53125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 5.0, 1.0, 4.0, 9.0, 4.0, 8.0, 6.0, 10.0, 10.0, 19.0, 33.0, 16.0, 30.0, 39.0, 40.0, 50.0, 42.0, 58.0, 44.0, 59.0, 50.0, 67.0, 52.0, 50.0, 45.0, 42.0, 45.0, 30.0, 22.0, 16.0, 18.0, 14.0, 12.0, 14.0, 12.0, 7.0, 4.0, 1.0, 2.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.1015625, -12.7021484375, -12.302734375, -11.9033203125, -11.50390625, -11.1044921875, -10.705078125, -10.3056640625, -9.90625, -9.5068359375, -9.107421875, -8.7080078125, -8.30859375, -7.9091796875, -7.509765625, -7.1103515625, -6.7109375, -6.3115234375, -5.912109375, -5.5126953125, -5.11328125, -4.7138671875, -4.314453125, -3.9150390625, -3.515625, -3.1162109375, -2.716796875, -2.3173828125, -1.91796875, -1.5185546875, -1.119140625, -0.7197265625, -0.3203125, 0.0791015625, 0.478515625, 0.8779296875, 1.27734375, 1.6767578125, 2.076171875, 2.4755859375, 2.875, 3.2744140625, 3.673828125, 4.0732421875, 4.47265625, 4.8720703125, 5.271484375, 5.6708984375, 6.0703125, 6.4697265625, 6.869140625, 7.2685546875, 7.66796875, 8.0673828125, 8.466796875, 8.8662109375, 9.265625, 9.6650390625, 10.064453125, 10.4638671875, 10.86328125, 11.2626953125, 11.662109375, 12.0615234375, 12.4609375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 3.0, 7.0, 8.0, 12.0, 23.0, 24.0, 46.0, 59.0, 90.0, 138.0, 213.0, 388.0, 728.0, 1391.0, 3352.0, 10549.0, 52125.0, 829399.0, 123537.0, 17513.0, 4868.0, 1942.0, 970.0, 479.0, 235.0, 141.0, 101.0, 55.0, 49.0, 38.0, 26.0, 19.0, 9.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.328125, -6.134521484375, -5.94091796875, -5.747314453125, -5.5537109375, -5.360107421875, -5.16650390625, -4.972900390625, -4.779296875, -4.585693359375, -4.39208984375, -4.198486328125, -4.0048828125, -3.811279296875, -3.61767578125, -3.424072265625, -3.23046875, -3.036865234375, -2.84326171875, -2.649658203125, -2.4560546875, -2.262451171875, -2.06884765625, -1.875244140625, -1.681640625, -1.488037109375, -1.29443359375, -1.100830078125, -0.9072265625, -0.713623046875, -0.52001953125, -0.326416015625, -0.1328125, 0.060791015625, 0.25439453125, 0.447998046875, 0.6416015625, 0.835205078125, 1.02880859375, 1.222412109375, 1.416015625, 1.609619140625, 1.80322265625, 1.996826171875, 2.1904296875, 2.384033203125, 2.57763671875, 2.771240234375, 2.96484375, 3.158447265625, 3.35205078125, 3.545654296875, 3.7392578125, 3.932861328125, 4.12646484375, 4.320068359375, 4.513671875, 4.707275390625, 4.90087890625, 5.094482421875, 5.2880859375, 5.481689453125, 5.67529296875, 5.868896484375, 6.0625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 4.0, 7.0, 10.0, 13.0, 13.0, 31.0, 36.0, 43.0, 81.0, 148.0, 228.0, 136.0, 74.0, 51.0, 24.0, 20.0, 17.0, 10.0, 10.0, 10.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0], "bins": [-0.0018157958984375, -0.0017684698104858398, -0.0017211437225341797, -0.0016738176345825195, -0.0016264915466308594, -0.0015791654586791992, -0.001531839370727539, -0.001484513282775879, -0.0014371871948242188, -0.0013898611068725586, -0.0013425350189208984, -0.0012952089309692383, -0.0012478828430175781, -0.001200556755065918, -0.0011532306671142578, -0.0011059045791625977, -0.0010585784912109375, -0.0010112524032592773, -0.0009639263153076172, -0.000916600227355957, -0.0008692741394042969, -0.0008219480514526367, -0.0007746219635009766, -0.0007272958755493164, -0.0006799697875976562, -0.0006326436996459961, -0.0005853176116943359, -0.0005379915237426758, -0.0004906654357910156, -0.00044333934783935547, -0.0003960132598876953, -0.00034868717193603516, -0.000301361083984375, -0.00025403499603271484, -0.0002067089080810547, -0.00015938282012939453, -0.00011205673217773438, -6.473064422607422e-05, -1.7404556274414062e-05, 2.9921531677246094e-05, 7.724761962890625e-05, 0.0001245737075805664, 0.00017189979553222656, 0.00021922588348388672, 0.0002665519714355469, 0.00031387805938720703, 0.0003612041473388672, 0.00040853023529052734, 0.0004558563232421875, 0.0005031824111938477, 0.0005505084991455078, 0.000597834587097168, 0.0006451606750488281, 0.0006924867630004883, 0.0007398128509521484, 0.0007871389389038086, 0.0008344650268554688, 0.0008817911148071289, 0.0009291172027587891, 0.0009764432907104492, 0.0010237693786621094, 0.0010710954666137695, 0.0011184215545654297, 0.0011657476425170898, 0.00121307373046875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 13.0, 11.0, 18.0, 21.0, 33.0, 57.0, 62.0, 119.0, 233.0, 449.0, 895.0, 2245.0, 6949.0, 31940.0, 354561.0, 605819.0, 33678.0, 7241.0, 2277.0, 916.0, 446.0, 214.0, 119.0, 69.0, 49.0, 41.0, 28.0, 17.0, 6.0, 7.0, 3.0, 4.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.52734375, -5.34912109375, -5.1708984375, -4.99267578125, -4.814453125, -4.63623046875, -4.4580078125, -4.27978515625, -4.1015625, -3.92333984375, -3.7451171875, -3.56689453125, -3.388671875, -3.21044921875, -3.0322265625, -2.85400390625, -2.67578125, -2.49755859375, -2.3193359375, -2.14111328125, -1.962890625, -1.78466796875, -1.6064453125, -1.42822265625, -1.25, -1.07177734375, -0.8935546875, -0.71533203125, -0.537109375, -0.35888671875, -0.1806640625, -0.00244140625, 0.17578125, 0.35400390625, 0.5322265625, 0.71044921875, 0.888671875, 1.06689453125, 1.2451171875, 1.42333984375, 1.6015625, 1.77978515625, 1.9580078125, 2.13623046875, 2.314453125, 2.49267578125, 2.6708984375, 2.84912109375, 3.02734375, 3.20556640625, 3.3837890625, 3.56201171875, 3.740234375, 3.91845703125, 4.0966796875, 4.27490234375, 4.453125, 4.63134765625, 4.8095703125, 4.98779296875, 5.166015625, 5.34423828125, 5.5224609375, 5.70068359375, 5.87890625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 7.0, 6.0, 5.0, 11.0, 7.0, 14.0, 26.0, 40.0, 45.0, 54.0, 83.0, 88.0, 137.0, 121.0, 90.0, 63.0, 49.0, 40.0, 31.0, 33.0, 22.0, 9.0, 11.0, 2.0, 8.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.673828125, -3.520599365234375, -3.36737060546875, -3.214141845703125, -3.0609130859375, -2.907684326171875, -2.75445556640625, -2.601226806640625, -2.447998046875, -2.294769287109375, -2.14154052734375, -1.988311767578125, -1.8350830078125, -1.681854248046875, -1.52862548828125, -1.375396728515625, -1.22216796875, -1.068939208984375, -0.91571044921875, -0.762481689453125, -0.6092529296875, -0.456024169921875, -0.30279541015625, -0.149566650390625, 0.003662109375, 0.156890869140625, 0.31011962890625, 0.463348388671875, 0.6165771484375, 0.769805908203125, 0.92303466796875, 1.076263427734375, 1.2294921875, 1.382720947265625, 1.53594970703125, 1.689178466796875, 1.8424072265625, 1.995635986328125, 2.14886474609375, 2.302093505859375, 2.455322265625, 2.608551025390625, 2.76177978515625, 2.915008544921875, 3.0682373046875, 3.221466064453125, 3.37469482421875, 3.527923583984375, 3.68115234375, 3.834381103515625, 3.98760986328125, 4.140838623046875, 4.2940673828125, 4.447296142578125, 4.60052490234375, 4.753753662109375, 4.906982421875, 5.060211181640625, 5.21343994140625, 5.366668701171875, 5.5198974609375, 5.673126220703125, 5.82635498046875, 5.979583740234375, 6.1328125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 10.0, 6.0, 20.0, 30.0, 77.0, 227.0, 541.0, 80.0, 13.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-419.19970703125, -410.7074890136719, -402.2152404785156, -393.7230224609375, -385.23077392578125, -376.7385559082031, -368.2463073730469, -359.75408935546875, -351.2618408203125, -342.7696228027344, -334.2773742675781, -325.78515625, -317.29290771484375, -308.8006896972656, -300.3084411621094, -291.81622314453125, -283.3240051269531, -274.831787109375, -266.33953857421875, -257.8473205566406, -249.35507202148438, -240.86285400390625, -232.37062072753906, -223.87838745117188, -215.3861541748047, -206.8939208984375, -198.4016876220703, -189.90945434570312, -181.417236328125, -172.92498779296875, -164.43276977539062, -155.94053649902344, -147.4483184814453, -138.95608520507812, -130.46385192871094, -121.97162628173828, -113.4793930053711, -104.9871597290039, -96.49493408203125, -88.00270080566406, -79.51046752929688, -71.01823425292969, -62.526004791259766, -54.033775329589844, -45.541542053222656, -37.04930877685547, -28.557079315185547, -20.064849853515625, -11.572616577148438, -3.080385208129883, 5.411846160888672, 13.904077529907227, 22.39630889892578, 30.88854217529297, 39.38077163696289, 47.87300109863281, 56.365234375, 64.85746765136719, 73.34970092773438, 81.84192657470703, 90.33415985107422, 98.8263931274414, 107.31861877441406, 115.81085205078125, 124.30308532714844]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 7.0, 2.0, 6.0, 4.0, 11.0, 7.0, 10.0, 3.0, 13.0, 21.0, 15.0, 16.0, 30.0, 29.0, 31.0, 36.0, 34.0, 48.0, 62.0, 113.0, 138.0, 58.0, 54.0, 38.0, 26.0, 36.0, 34.0, 14.0, 20.0, 8.0, 13.0, 16.0, 10.0, 10.0, 5.0, 8.0, 4.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.19107437133789, -53.47248077392578, -51.753883361816406, -50.0352897644043, -48.31669616699219, -46.59809875488281, -44.8795051574707, -43.160911560058594, -41.44231414794922, -39.72372055053711, -38.005123138427734, -36.286529541015625, -34.56793212890625, -32.84933853149414, -31.13074493408203, -29.41214942932129, -27.693553924560547, -25.974958419799805, -24.256362915039062, -22.537769317626953, -20.81917381286621, -19.10057830810547, -17.38198471069336, -15.663389205932617, -13.944793701171875, -12.226198196411133, -10.507603645324707, -8.789009094238281, -7.070413589477539, -5.351818084716797, -3.633223533630371, -1.9146289825439453, -0.19603729248046875, 1.5225577354431152, 3.241152763366699, 4.959747791290283, 6.678342819213867, 8.39693832397461, 10.115532875061035, 11.834127426147461, 13.552722930908203, 15.271318435668945, 16.989913940429688, 18.708507537841797, 20.42710304260254, 22.14569854736328, 23.86429214477539, 25.582887649536133, 27.301483154296875, 29.020078659057617, 30.73867416381836, 32.45726776123047, 34.175865173339844, 35.89445877075195, 37.61305236816406, 39.33164978027344, 41.05024337768555, 42.768836975097656, 44.48743438720703, 46.20602798461914, 47.92462158203125, 49.643218994140625, 51.361812591552734, 53.080406188964844, 54.79900360107422]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 6.0, 9.0, 8.0, 14.0, 29.0, 46.0, 48.0, 83.0, 141.0, 207.0, 356.0, 645.0, 1334.0, 2976.0, 7153.0, 21991.0, 96140.0, 874706.0, 2653218.0, 451566.0, 57788.0, 15593.0, 5461.0, 2362.0, 1102.0, 526.0, 310.0, 173.0, 122.0, 45.0, 41.0, 35.0, 23.0, 8.0, 5.0, 4.0, 7.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3125, -9.063232421875, -8.81396484375, -8.564697265625, -8.3154296875, -8.066162109375, -7.81689453125, -7.567626953125, -7.318359375, -7.069091796875, -6.81982421875, -6.570556640625, -6.3212890625, -6.072021484375, -5.82275390625, -5.573486328125, -5.32421875, -5.074951171875, -4.82568359375, -4.576416015625, -4.3271484375, -4.077880859375, -3.82861328125, -3.579345703125, -3.330078125, -3.080810546875, -2.83154296875, -2.582275390625, -2.3330078125, -2.083740234375, -1.83447265625, -1.585205078125, -1.3359375, -1.086669921875, -0.83740234375, -0.588134765625, -0.3388671875, -0.089599609375, 0.15966796875, 0.408935546875, 0.658203125, 0.907470703125, 1.15673828125, 1.406005859375, 1.6552734375, 1.904541015625, 2.15380859375, 2.403076171875, 2.65234375, 2.901611328125, 3.15087890625, 3.400146484375, 3.6494140625, 3.898681640625, 4.14794921875, 4.397216796875, 4.646484375, 4.895751953125, 5.14501953125, 5.394287109375, 5.6435546875, 5.892822265625, 6.14208984375, 6.391357421875, 6.640625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 9.0, 6.0, 8.0, 14.0, 15.0, 18.0, 18.0, 18.0, 28.0, 36.0, 42.0, 41.0, 44.0, 44.0, 64.0, 46.0, 54.0, 54.0, 53.0, 54.0, 37.0, 48.0, 32.0, 39.0, 31.0, 24.0, 27.0, 28.0, 21.0, 9.0, 14.0, 12.0, 10.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.65234375, -2.54205322265625, -2.4317626953125, -2.32147216796875, -2.211181640625, -2.10089111328125, -1.9906005859375, -1.88031005859375, -1.77001953125, -1.65972900390625, -1.5494384765625, -1.43914794921875, -1.328857421875, -1.21856689453125, -1.1082763671875, -0.99798583984375, -0.8876953125, -0.77740478515625, -0.6671142578125, -0.55682373046875, -0.446533203125, -0.33624267578125, -0.2259521484375, -0.11566162109375, -0.00537109375, 0.10491943359375, 0.2152099609375, 0.32550048828125, 0.435791015625, 0.54608154296875, 0.6563720703125, 0.76666259765625, 0.876953125, 0.98724365234375, 1.0975341796875, 1.20782470703125, 1.318115234375, 1.42840576171875, 1.5386962890625, 1.64898681640625, 1.75927734375, 1.86956787109375, 1.9798583984375, 2.09014892578125, 2.200439453125, 2.31072998046875, 2.4210205078125, 2.53131103515625, 2.6416015625, 2.75189208984375, 2.8621826171875, 2.97247314453125, 3.082763671875, 3.19305419921875, 3.3033447265625, 3.41363525390625, 3.52392578125, 3.63421630859375, 3.7445068359375, 3.85479736328125, 3.965087890625, 4.07537841796875, 4.1856689453125, 4.29595947265625, 4.40625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0, 1.0, 7.0, 4.0, 22.0, 66.0, 168.0, 517.0, 5571.0, 4183484.0, 3815.0, 429.0, 127.0, 54.0, 10.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.375, -88.046875, -84.71875, -81.390625, -78.0625, -74.734375, -71.40625, -68.078125, -64.75, -61.421875, -58.09375, -54.765625, -51.4375, -48.109375, -44.78125, -41.453125, -38.125, -34.796875, -31.46875, -28.140625, -24.8125, -21.484375, -18.15625, -14.828125, -11.5, -8.171875, -4.84375, -1.515625, 1.8125, 5.140625, 8.46875, 11.796875, 15.125, 18.453125, 21.78125, 25.109375, 28.4375, 31.765625, 35.09375, 38.421875, 41.75, 45.078125, 48.40625, 51.734375, 55.0625, 58.390625, 61.71875, 65.046875, 68.375, 71.703125, 75.03125, 78.359375, 81.6875, 85.015625, 88.34375, 91.671875, 95.0, 98.328125, 101.65625, 104.984375, 108.3125, 111.640625, 114.96875, 118.296875, 121.625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 23.0, 70.0, 222.0, 788.0, 2010.0, 677.0, 200.0, 59.0, 18.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.0625, -65.67578125, -64.2890625, -62.90234375, -61.515625, -60.12890625, -58.7421875, -57.35546875, -55.96875, -54.58203125, -53.1953125, -51.80859375, -50.421875, -49.03515625, -47.6484375, -46.26171875, -44.875, -43.48828125, -42.1015625, -40.71484375, -39.328125, -37.94140625, -36.5546875, -35.16796875, -33.78125, -32.39453125, -31.0078125, -29.62109375, -28.234375, -26.84765625, -25.4609375, -24.07421875, -22.6875, -21.30078125, -19.9140625, -18.52734375, -17.140625, -15.75390625, -14.3671875, -12.98046875, -11.59375, -10.20703125, -8.8203125, -7.43359375, -6.046875, -4.66015625, -3.2734375, -1.88671875, -0.5, 0.88671875, 2.2734375, 3.66015625, 5.046875, 6.43359375, 7.8203125, 9.20703125, 10.59375, 11.98046875, 13.3671875, 14.75390625, 16.140625, 17.52734375, 18.9140625, 20.30078125, 21.6875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 4.0, 6.0, 6.0, 7.0, 8.0, 17.0, 44.0, 69.0, 171.0, 287.0, 180.0, 95.0, 41.0, 22.0, 16.0, 4.0, 7.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-351.4676818847656, -344.0564880371094, -336.64532470703125, -329.234130859375, -321.8229675292969, -314.4117736816406, -307.0005798339844, -299.58941650390625, -292.17822265625, -284.76702880859375, -277.3558654785156, -269.9446716308594, -262.53350830078125, -255.122314453125, -247.7111358642578, -240.29995727539062, -232.88876342773438, -225.4775848388672, -218.06640625, -210.65521240234375, -203.24403381347656, -195.83285522460938, -188.4216766357422, -181.010498046875, -173.5993194580078, -166.18814086914062, -158.77696228027344, -151.3657684326172, -143.95458984375, -136.5434112548828, -129.13223266601562, -121.7210464477539, -114.30986022949219, -106.898681640625, -99.48749542236328, -92.0763168334961, -84.66513061523438, -77.25395202636719, -69.8427734375, -62.43158721923828, -55.02040481567383, -47.609222412109375, -40.19804000854492, -32.78685760498047, -25.37567710876465, -17.964496612548828, -10.553314208984375, -3.142131805419922, 4.269050598144531, 11.680233001708984, 19.091415405273438, 26.502595901489258, 33.913780212402344, 41.32495880126953, 48.736141204833984, 56.14732360839844, 63.55850601196289, 70.96968841552734, 78.38086700439453, 85.79205322265625, 93.20323181152344, 100.61441040039062, 108.02559661865234, 115.43678283691406, 122.84796142578125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 7.0, 6.0, 7.0, 12.0, 21.0, 28.0, 43.0, 62.0, 87.0, 93.0, 107.0, 126.0, 124.0, 82.0, 62.0, 45.0, 31.0, 17.0, 11.0, 10.0, 5.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-157.00119018554688, -150.85809326171875, -144.71499633789062, -138.5718994140625, -132.42880249023438, -126.28569793701172, -120.14259338378906, -113.99949645996094, -107.85639953613281, -101.71330261230469, -95.57020568847656, -89.4271011352539, -83.28400421142578, -77.14090728759766, -70.997802734375, -64.85470581054688, -58.71160888671875, -52.568511962890625, -46.425411224365234, -40.282310485839844, -34.13921356201172, -27.99611473083496, -21.853015899658203, -15.709915161132812, -9.566818237304688, -3.4237194061279297, 2.719379425048828, 8.862478256225586, 15.005577087402344, 21.1486759185791, 27.29177474975586, 33.43487548828125, 39.577972412109375, 45.7210693359375, 51.86417007446289, 58.00727081298828, 64.1503677368164, 70.29346466064453, 76.43656921386719, 82.57966613769531, 88.72276306152344, 94.86585998535156, 101.00895690917969, 107.15206146240234, 113.29515838623047, 119.4382553100586, 125.58135986328125, 131.72445678710938, 137.8675537109375, 144.01065063476562, 150.15374755859375, 156.29684448242188, 162.43994140625, 168.5830535888672, 174.7261505126953, 180.86924743652344, 187.01234436035156, 193.1554412841797, 199.2985382080078, 205.44163513183594, 211.58474731445312, 217.72784423828125, 223.87094116210938, 230.0140380859375, 236.15713500976562]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 6.0, 6.0, 16.0, 20.0, 20.0, 22.0, 35.0, 44.0, 65.0, 73.0, 83.0, 142.0, 221.0, 341.0, 554.0, 895.0, 1516.0, 2814.0, 5628.0, 12904.0, 35996.0, 144215.0, 628438.0, 150916.0, 37654.0, 13228.0, 5774.0, 2819.0, 1559.0, 851.0, 531.0, 345.0, 223.0, 146.0, 112.0, 81.0, 62.0, 51.0, 42.0, 25.0, 16.0, 16.0, 14.0, 10.0, 9.0, 9.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.37890625, -6.16986083984375, -5.9608154296875, -5.75177001953125, -5.542724609375, -5.33367919921875, -5.1246337890625, -4.91558837890625, -4.70654296875, -4.49749755859375, -4.2884521484375, -4.07940673828125, -3.870361328125, -3.66131591796875, -3.4522705078125, -3.24322509765625, -3.0341796875, -2.82513427734375, -2.6160888671875, -2.40704345703125, -2.197998046875, -1.98895263671875, -1.7799072265625, -1.57086181640625, -1.36181640625, -1.15277099609375, -0.9437255859375, -0.73468017578125, -0.525634765625, -0.31658935546875, -0.1075439453125, 0.10150146484375, 0.310546875, 0.51959228515625, 0.7286376953125, 0.93768310546875, 1.146728515625, 1.35577392578125, 1.5648193359375, 1.77386474609375, 1.98291015625, 2.19195556640625, 2.4010009765625, 2.61004638671875, 2.819091796875, 3.02813720703125, 3.2371826171875, 3.44622802734375, 3.6552734375, 3.86431884765625, 4.0733642578125, 4.28240966796875, 4.491455078125, 4.70050048828125, 4.9095458984375, 5.11859130859375, 5.32763671875, 5.53668212890625, 5.7457275390625, 5.95477294921875, 6.163818359375, 6.37286376953125, 6.5819091796875, 6.79095458984375, 7.0]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 3.0, 7.0, 12.0, 8.0, 13.0, 23.0, 35.0, 43.0, 57.0, 65.0, 74.0, 75.0, 74.0, 77.0, 73.0, 80.0, 63.0, 45.0, 45.0, 36.0, 29.0, 10.0, 18.0, 5.0, 8.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.80078125, -6.575439453125, -6.35009765625, -6.124755859375, -5.8994140625, -5.674072265625, -5.44873046875, -5.223388671875, -4.998046875, -4.772705078125, -4.54736328125, -4.322021484375, -4.0966796875, -3.871337890625, -3.64599609375, -3.420654296875, -3.1953125, -2.969970703125, -2.74462890625, -2.519287109375, -2.2939453125, -2.068603515625, -1.84326171875, -1.617919921875, -1.392578125, -1.167236328125, -0.94189453125, -0.716552734375, -0.4912109375, -0.265869140625, -0.04052734375, 0.184814453125, 0.41015625, 0.635498046875, 0.86083984375, 1.086181640625, 1.3115234375, 1.536865234375, 1.76220703125, 1.987548828125, 2.212890625, 2.438232421875, 2.66357421875, 2.888916015625, 3.1142578125, 3.339599609375, 3.56494140625, 3.790283203125, 4.015625, 4.240966796875, 4.46630859375, 4.691650390625, 4.9169921875, 5.142333984375, 5.36767578125, 5.593017578125, 5.818359375, 6.043701171875, 6.26904296875, 6.494384765625, 6.7197265625, 6.945068359375, 7.17041015625, 7.395751953125, 7.62109375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 4.0, 5.0, 11.0, 18.0, 21.0, 28.0, 43.0, 71.0, 94.0, 202.0, 306.0, 713.0, 2207.0, 13914.0, 860812.0, 159126.0, 8000.0, 1579.0, 578.0, 315.0, 170.0, 97.0, 69.0, 55.0, 27.0, 23.0, 17.0, 9.0, 3.0, 10.0, 4.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.328125, -15.81591796875, -15.3037109375, -14.79150390625, -14.279296875, -13.76708984375, -13.2548828125, -12.74267578125, -12.23046875, -11.71826171875, -11.2060546875, -10.69384765625, -10.181640625, -9.66943359375, -9.1572265625, -8.64501953125, -8.1328125, -7.62060546875, -7.1083984375, -6.59619140625, -6.083984375, -5.57177734375, -5.0595703125, -4.54736328125, -4.03515625, -3.52294921875, -3.0107421875, -2.49853515625, -1.986328125, -1.47412109375, -0.9619140625, -0.44970703125, 0.0625, 0.57470703125, 1.0869140625, 1.59912109375, 2.111328125, 2.62353515625, 3.1357421875, 3.64794921875, 4.16015625, 4.67236328125, 5.1845703125, 5.69677734375, 6.208984375, 6.72119140625, 7.2333984375, 7.74560546875, 8.2578125, 8.77001953125, 9.2822265625, 9.79443359375, 10.306640625, 10.81884765625, 11.3310546875, 11.84326171875, 12.35546875, 12.86767578125, 13.3798828125, 13.89208984375, 14.404296875, 14.91650390625, 15.4287109375, 15.94091796875, 16.453125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 5.0, 8.0, 10.0, 9.0, 6.0, 7.0, 15.0, 18.0, 12.0, 12.0, 29.0, 28.0, 22.0, 44.0, 52.0, 58.0, 63.0, 76.0, 73.0, 87.0, 63.0, 52.0, 41.0, 35.0, 26.0, 21.0, 28.0, 18.0, 16.0, 15.0, 9.0, 9.0, 7.0, 12.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.421875, -17.718017578125, -17.01416015625, -16.310302734375, -15.6064453125, -14.902587890625, -14.19873046875, -13.494873046875, -12.791015625, -12.087158203125, -11.38330078125, -10.679443359375, -9.9755859375, -9.271728515625, -8.56787109375, -7.864013671875, -7.16015625, -6.456298828125, -5.75244140625, -5.048583984375, -4.3447265625, -3.640869140625, -2.93701171875, -2.233154296875, -1.529296875, -0.825439453125, -0.12158203125, 0.582275390625, 1.2861328125, 1.989990234375, 2.69384765625, 3.397705078125, 4.1015625, 4.805419921875, 5.50927734375, 6.213134765625, 6.9169921875, 7.620849609375, 8.32470703125, 9.028564453125, 9.732421875, 10.436279296875, 11.14013671875, 11.843994140625, 12.5478515625, 13.251708984375, 13.95556640625, 14.659423828125, 15.36328125, 16.067138671875, 16.77099609375, 17.474853515625, 18.1787109375, 18.882568359375, 19.58642578125, 20.290283203125, 20.994140625, 21.697998046875, 22.40185546875, 23.105712890625, 23.8095703125, 24.513427734375, 25.21728515625, 25.921142578125, 26.625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 6.0, 12.0, 9.0, 15.0, 28.0, 21.0, 27.0, 55.0, 70.0, 94.0, 151.0, 246.0, 494.0, 1047.0, 3062.0, 13205.0, 200382.0, 807031.0, 16353.0, 3552.0, 1297.0, 591.0, 297.0, 159.0, 96.0, 71.0, 49.0, 27.0, 33.0, 18.0, 12.0, 9.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.677734375, -2.588653564453125, -2.49957275390625, -2.410491943359375, -2.3214111328125, -2.232330322265625, -2.14324951171875, -2.054168701171875, -1.965087890625, -1.876007080078125, -1.78692626953125, -1.697845458984375, -1.6087646484375, -1.519683837890625, -1.43060302734375, -1.341522216796875, -1.25244140625, -1.163360595703125, -1.07427978515625, -0.985198974609375, -0.8961181640625, -0.807037353515625, -0.71795654296875, -0.628875732421875, -0.539794921875, -0.450714111328125, -0.36163330078125, -0.272552490234375, -0.1834716796875, -0.094390869140625, -0.00531005859375, 0.083770751953125, 0.1728515625, 0.261932373046875, 0.35101318359375, 0.440093994140625, 0.5291748046875, 0.618255615234375, 0.70733642578125, 0.796417236328125, 0.885498046875, 0.974578857421875, 1.06365966796875, 1.152740478515625, 1.2418212890625, 1.330902099609375, 1.41998291015625, 1.509063720703125, 1.59814453125, 1.687225341796875, 1.77630615234375, 1.865386962890625, 1.9544677734375, 2.043548583984375, 2.13262939453125, 2.221710205078125, 2.310791015625, 2.399871826171875, 2.48895263671875, 2.578033447265625, 2.6671142578125, 2.756195068359375, 2.84527587890625, 2.934356689453125, 3.0234375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 5.0, 4.0, 12.0, 9.0, 16.0, 15.0, 26.0, 35.0, 46.0, 67.0, 140.0, 201.0, 153.0, 94.0, 55.0, 40.0, 28.0, 21.0, 6.0, 6.0, 7.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005412101745605469, -0.0005235373973846436, -0.0005058646202087402, -0.0004881918430328369, -0.0004705190658569336, -0.0004528462886810303, -0.00043517351150512695, -0.00041750073432922363, -0.0003998279571533203, -0.000382155179977417, -0.00036448240280151367, -0.00034680962562561035, -0.00032913684844970703, -0.0003114640712738037, -0.0002937912940979004, -0.00027611851692199707, -0.00025844573974609375, -0.00024077296257019043, -0.0002231001853942871, -0.0002054274082183838, -0.00018775463104248047, -0.00017008185386657715, -0.00015240907669067383, -0.0001347362995147705, -0.00011706352233886719, -9.939074516296387e-05, -8.171796798706055e-05, -6.404519081115723e-05, -4.6372413635253906e-05, -2.8699636459350586e-05, -1.1026859283447266e-05, 6.645917892456055e-06, 2.4318695068359375e-05, 4.1991472244262695e-05, 5.9664249420166016e-05, 7.733702659606934e-05, 9.500980377197266e-05, 0.00011268258094787598, 0.0001303553581237793, 0.00014802813529968262, 0.00016570091247558594, 0.00018337368965148926, 0.00020104646682739258, 0.0002187192440032959, 0.00023639202117919922, 0.00025406479835510254, 0.00027173757553100586, 0.0002894103527069092, 0.0003070831298828125, 0.0003247559070587158, 0.00034242868423461914, 0.00036010146141052246, 0.0003777742385864258, 0.0003954470157623291, 0.0004131197929382324, 0.00043079257011413574, 0.00044846534729003906, 0.0004661381244659424, 0.0004838109016418457, 0.000501483678817749, 0.0005191564559936523, 0.0005368292331695557, 0.000554502010345459, 0.0005721747875213623, 0.0005898475646972656]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 14.0, 8.0, 15.0, 20.0, 32.0, 48.0, 88.0, 191.0, 376.0, 824.0, 2223.0, 6924.0, 26448.0, 246707.0, 722413.0, 30098.0, 7733.0, 2445.0, 966.0, 410.0, 215.0, 97.0, 75.0, 49.0, 26.0, 23.0, 15.0, 13.0, 8.0, 5.0, 5.0, 6.0, 8.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5927734375, -1.537933349609375, -1.48309326171875, -1.428253173828125, -1.3734130859375, -1.318572998046875, -1.26373291015625, -1.208892822265625, -1.154052734375, -1.099212646484375, -1.04437255859375, -0.989532470703125, -0.9346923828125, -0.879852294921875, -0.82501220703125, -0.770172119140625, -0.71533203125, -0.660491943359375, -0.60565185546875, -0.550811767578125, -0.4959716796875, -0.441131591796875, -0.38629150390625, -0.331451416015625, -0.276611328125, -0.221771240234375, -0.16693115234375, -0.112091064453125, -0.0572509765625, -0.002410888671875, 0.05242919921875, 0.107269287109375, 0.162109375, 0.216949462890625, 0.27178955078125, 0.326629638671875, 0.3814697265625, 0.436309814453125, 0.49114990234375, 0.545989990234375, 0.600830078125, 0.655670166015625, 0.71051025390625, 0.765350341796875, 0.8201904296875, 0.875030517578125, 0.92987060546875, 0.984710693359375, 1.03955078125, 1.094390869140625, 1.14923095703125, 1.204071044921875, 1.2589111328125, 1.313751220703125, 1.36859130859375, 1.423431396484375, 1.478271484375, 1.533111572265625, 1.58795166015625, 1.642791748046875, 1.6976318359375, 1.752471923828125, 1.80731201171875, 1.862152099609375, 1.9169921875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 3.0, 5.0, 4.0, 8.0, 3.0, 15.0, 10.0, 16.0, 26.0, 21.0, 38.0, 62.0, 110.0, 159.0, 179.0, 114.0, 62.0, 48.0, 25.0, 12.0, 11.0, 18.0, 6.0, 6.0, 6.0, 7.0, 4.0, 6.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.130859375, -2.05194091796875, -1.9730224609375, -1.89410400390625, -1.815185546875, -1.73626708984375, -1.6573486328125, -1.57843017578125, -1.49951171875, -1.42059326171875, -1.3416748046875, -1.26275634765625, -1.183837890625, -1.10491943359375, -1.0260009765625, -0.94708251953125, -0.8681640625, -0.78924560546875, -0.7103271484375, -0.63140869140625, -0.552490234375, -0.47357177734375, -0.3946533203125, -0.31573486328125, -0.23681640625, -0.15789794921875, -0.0789794921875, -6.103515625e-05, 0.078857421875, 0.15777587890625, 0.2366943359375, 0.31561279296875, 0.39453125, 0.47344970703125, 0.5523681640625, 0.63128662109375, 0.710205078125, 0.78912353515625, 0.8680419921875, 0.94696044921875, 1.02587890625, 1.10479736328125, 1.1837158203125, 1.26263427734375, 1.341552734375, 1.42047119140625, 1.4993896484375, 1.57830810546875, 1.6572265625, 1.73614501953125, 1.8150634765625, 1.89398193359375, 1.972900390625, 2.05181884765625, 2.1307373046875, 2.20965576171875, 2.28857421875, 2.36749267578125, 2.4464111328125, 2.52532958984375, 2.604248046875, 2.68316650390625, 2.7620849609375, 2.84100341796875, 2.919921875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 18.0, 70.0, 564.0, 241.0, 57.0, 22.0, 13.0, 6.0, 6.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.38475036621094, -92.17329406738281, -85.96183776855469, -79.75038146972656, -73.53892517089844, -67.32746887207031, -61.11601257324219, -54.90455627441406, -48.69309997558594, -42.48164367675781, -36.27018737792969, -30.058731079101562, -23.847274780273438, -17.635818481445312, -11.424362182617188, -5.2129058837890625, 0.9985504150390625, 7.2100067138671875, 13.421463012695312, 19.632919311523438, 25.844375610351562, 32.05583190917969, 38.26728820800781, 44.47874450683594, 50.69020080566406, 56.90165710449219, 63.11311340332031, 69.32456970214844, 75.53602600097656, 81.74748229980469, 87.95893859863281, 94.17039489746094, 100.3818359375, 106.59329223632812, 112.80474853515625, 119.01620483398438, 125.2276611328125, 131.43911743164062, 137.65057373046875, 143.86203002929688, 150.073486328125, 156.28494262695312, 162.49639892578125, 168.70785522460938, 174.9193115234375, 181.13076782226562, 187.34222412109375, 193.55368041992188, 199.76513671875, 205.97659301757812, 212.18804931640625, 218.39950561523438, 224.6109619140625, 230.82241821289062, 237.03387451171875, 243.24533081054688, 249.456787109375, 255.66824340820312, 261.87969970703125, 268.0911560058594, 274.3026123046875, 280.5140686035156, 286.72552490234375, 292.9369812011719, 299.1484375]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 3.0, 4.0, 11.0, 11.0, 12.0, 16.0, 14.0, 27.0, 32.0, 33.0, 26.0, 132.0, 228.0, 178.0, 61.0, 26.0, 29.0, 20.0, 23.0, 23.0, 18.0, 20.0, 10.0, 8.0, 9.0, 8.0, 5.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-103.32322692871094, -100.2532730102539, -97.1833267211914, -94.11337280273438, -91.04342651367188, -87.97347259521484, -84.90351867675781, -81.83357238769531, -78.76362609863281, -75.69367218017578, -72.62372589111328, -69.55377197265625, -66.48382568359375, -63.41387176513672, -60.34392166137695, -57.27397155761719, -54.204017639160156, -51.13406753540039, -48.064117431640625, -44.994163513183594, -41.924217224121094, -38.85426330566406, -35.7843132019043, -32.71436309814453, -29.644412994384766, -26.574462890625, -23.504512786865234, -20.434560775756836, -17.36461067199707, -14.294660568237305, -11.224708557128906, -8.15475845336914, -5.084800720214844, -2.01485013961792, 1.055100440979004, 4.125051498413086, 7.195001602172852, 10.264951705932617, 13.334903717041016, 16.40485382080078, 19.474803924560547, 22.544754028320312, 25.614704132080078, 28.684656143188477, 31.754606246948242, 34.824554443359375, 37.894508361816406, 40.96445846557617, 44.03440856933594, 47.1043586730957, 50.17430877685547, 53.2442626953125, 56.314208984375, 59.38416290283203, 62.4541130065918, 65.52406311035156, 68.59400939941406, 71.6639633178711, 74.7339096069336, 77.80386352539062, 80.87380981445312, 83.94376373291016, 87.01371765136719, 90.08366394042969, 93.15361785888672]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 7.0, 6.0, 12.0, 18.0, 29.0, 36.0, 43.0, 52.0, 68.0, 364.0, 91.0, 60.0, 53.0, 43.0, 45.0, 20.0, 17.0, 12.0, 7.0, 10.0, 5.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.921875, -5.670654296875, -5.41943359375, -5.168212890625, -4.9169921875, -4.665771484375, -4.41455078125, -4.163330078125, -3.912109375, -3.660888671875, -3.40966796875, -3.158447265625, -2.9072265625, -2.656005859375, -2.40478515625, -2.153564453125, -1.90234375, -1.651123046875, -1.39990234375, -1.148681640625, -0.8974609375, -0.646240234375, -0.39501953125, -0.143798828125, 0.107421875, 0.358642578125, 0.60986328125, 0.861083984375, 1.1123046875, 1.363525390625, 1.61474609375, 1.865966796875, 2.1171875, 2.368408203125, 2.61962890625, 2.870849609375, 3.1220703125, 3.373291015625, 3.62451171875, 3.875732421875, 4.126953125, 4.378173828125, 4.62939453125, 4.880615234375, 5.1318359375, 5.383056640625, 5.63427734375, 5.885498046875, 6.13671875, 6.387939453125, 6.63916015625, 6.890380859375, 7.1416015625, 7.392822265625, 7.64404296875, 7.895263671875, 8.146484375, 8.397705078125, 8.64892578125, 8.900146484375, 9.1513671875, 9.402587890625, 9.65380859375, 9.905029296875, 10.15625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 1.0, 8.0, 19.0, 14.0, 19.0, 30.0, 45.0, 83.0, 171.0, 507.0, 1522.0, 8938.0, 8353223.0, 20485.0, 2333.0, 653.0, 239.0, 111.0, 49.0, 35.0, 24.0, 23.0, 12.0, 6.0, 7.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0], "bins": [-69.6004409790039, -67.46888732910156, -65.33732604980469, -63.205772399902344, -61.074214935302734, -58.942657470703125, -56.81110382080078, -54.67954635620117, -52.54798889160156, -50.41643142700195, -48.284873962402344, -46.1533203125, -44.02176284790039, -41.89020538330078, -39.75865173339844, -37.62709426879883, -35.49553680419922, -33.36397933959961, -31.232423782348633, -29.100868225097656, -26.969310760498047, -24.837753295898438, -22.70619773864746, -20.574642181396484, -18.443084716796875, -16.311527252197266, -14.179971694946289, -12.048415184020996, -9.916858673095703, -7.78530216217041, -5.653745651245117, -3.522189140319824, -1.3906326293945312, 0.7409238815307617, 2.8724803924560547, 5.004036903381348, 7.135593414306641, 9.267149925231934, 11.398706436157227, 13.53026294708252, 15.661819458007812, 17.793376922607422, 19.9249324798584, 22.056488037109375, 24.188045501708984, 26.319602966308594, 28.45115852355957, 30.582714080810547, 32.714271545410156, 34.845829010009766, 36.977386474609375, 39.10894012451172, 41.24049758911133, 43.37205505371094, 45.50360870361328, 47.63516616821289, 49.7667236328125, 51.89828109741211, 54.02983856201172, 56.16139221191406, 58.29294967651367, 60.42450714111328, 62.556060791015625, 64.6876220703125, 66.81917572021484]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 4.0, 6.0, 7.0, 2.0, 3.0, 9.0, 5.0, 4.0, 6.0, 5.0, 2.0, 1.0, 4.0, 4.0, 8.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.514328002929688, -26.93609619140625, -25.35786247253418, -23.77962875366211, -22.201396942138672, -20.623165130615234, -19.044931411743164, -17.466697692871094, -15.888465881347656, -14.310233116149902, -12.732000350952148, -11.153767585754395, -9.57553482055664, -7.997302055358887, -6.419069290161133, -4.840836524963379, -3.262603759765625, -1.684370994567871, -0.10613822937011719, 1.4720945358276367, 3.0503273010253906, 4.6285600662231445, 6.206792831420898, 7.785025596618652, 9.363258361816406, 10.94149112701416, 12.519723892211914, 14.097956657409668, 15.676189422607422, 17.25442123413086, 18.83265495300293, 20.410888671875, 21.989120483398438, 23.567352294921875, 25.145586013793945, 26.723819732666016, 28.302051544189453, 29.88028335571289, 31.45851707458496, 33.03675079345703, 34.61498260498047, 36.193214416503906, 37.771446228027344, 39.34968185424805, 40.927913665771484, 42.50614547729492, 44.084381103515625, 45.66261291503906, 47.2408447265625, 48.81907653808594, 50.397308349609375, 51.97554397583008, 53.553775787353516, 55.13200759887695, 56.710243225097656, 58.288475036621094, 59.86670684814453, 61.44493865966797, 63.023170471191406, 64.60140228271484, 66.17964172363281, 67.75787353515625, 69.33610534667969, 70.91433715820312, 72.49256896972656]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 5.0, 4.0, 5.0, 7.0, 14.0, 23.0, 38.0, 51.0, 80.0, 161.0, 294.0, 660.0, 1571.0, 4504.0, 15379.0, 68568.0, 259713.0, 133941.0, 27641.0, 7184.0, 2402.0, 1008.0, 460.0, 245.0, 125.0, 80.0, 42.0, 21.0, 13.0, 16.0, 8.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.1875, -47.5859375, -45.984375, -44.3828125, -42.78125, -41.1796875, -39.578125, -37.9765625, -36.375, -34.7734375, -33.171875, -31.5703125, -29.96875, -28.3671875, -26.765625, -25.1640625, -23.5625, -21.9609375, -20.359375, -18.7578125, -17.15625, -15.5546875, -13.953125, -12.3515625, -10.75, -9.1484375, -7.546875, -5.9453125, -4.34375, -2.7421875, -1.140625, 0.4609375, 2.0625, 3.6640625, 5.265625, 6.8671875, 8.46875, 10.0703125, 11.671875, 13.2734375, 14.875, 16.4765625, 18.078125, 19.6796875, 21.28125, 22.8828125, 24.484375, 26.0859375, 27.6875, 29.2890625, 30.890625, 32.4921875, 34.09375, 35.6953125, 37.296875, 38.8984375, 40.5, 42.1015625, 43.703125, 45.3046875, 46.90625, 48.5078125, 50.109375, 51.7109375, 53.3125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 4.0, 7.0, 6.0, 9.0, 8.0, 18.0, 25.0, 27.0, 30.0, 33.0, 44.0, 52.0, 72.0, 75.0, 73.0, 80.0, 74.0, 65.0, 55.0, 55.0, 40.0, 33.0, 26.0, 15.0, 10.0, 12.0, 7.0, 8.0, 10.0, 5.0, 6.0, 3.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.15234375, -5.96868896484375, -5.7850341796875, -5.60137939453125, -5.417724609375, -5.23406982421875, -5.0504150390625, -4.86676025390625, -4.68310546875, -4.49945068359375, -4.3157958984375, -4.13214111328125, -3.948486328125, -3.76483154296875, -3.5811767578125, -3.39752197265625, -3.2138671875, -3.03021240234375, -2.8465576171875, -2.66290283203125, -2.479248046875, -2.29559326171875, -2.1119384765625, -1.92828369140625, -1.74462890625, -1.56097412109375, -1.3773193359375, -1.19366455078125, -1.010009765625, -0.82635498046875, -0.6427001953125, -0.45904541015625, -0.275390625, -0.09173583984375, 0.0919189453125, 0.27557373046875, 0.459228515625, 0.64288330078125, 0.8265380859375, 1.01019287109375, 1.19384765625, 1.37750244140625, 1.5611572265625, 1.74481201171875, 1.928466796875, 2.11212158203125, 2.2957763671875, 2.47943115234375, 2.6630859375, 2.84674072265625, 3.0303955078125, 3.21405029296875, 3.397705078125, 3.58135986328125, 3.7650146484375, 3.94866943359375, 4.13232421875, 4.31597900390625, 4.4996337890625, 4.68328857421875, 4.866943359375, 5.05059814453125, 5.2342529296875, 5.41790771484375, 5.6015625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 7.0, 8.0, 5.0, 15.0, 14.0, 32.0, 58.0, 82.0, 71.0, 63.0, 39.0, 18.0, 19.0, 12.0, 7.0, 4.0, 6.0, 8.0, 3.0, 3.0, 7.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.826414108276367, -24.456937789916992, -23.087461471557617, -21.71798324584961, -20.348506927490234, -18.97903060913086, -17.609554290771484, -16.24007797241211, -14.870601654052734, -13.50112533569336, -12.131649017333984, -10.762171745300293, -9.392695426940918, -8.023219108581543, -6.653741836547852, -5.284265518188477, -3.9147891998291016, -2.5453126430511475, -1.1758360862731934, 0.19364070892333984, 1.5631170272827148, 2.93259334564209, 4.302070617675781, 5.671546936035156, 7.041023254394531, 8.410499572753906, 9.779975891113281, 11.149453163146973, 12.518929481506348, 13.888405799865723, 15.257883071899414, 16.62735939025879, 17.99683380126953, 19.366310119628906, 20.73578643798828, 22.105262756347656, 23.47473907470703, 24.844215393066406, 26.213693618774414, 27.58316993713379, 28.952646255493164, 30.32212257385254, 31.691598892211914, 33.06107711791992, 34.4305534362793, 35.80002975463867, 37.16950607299805, 38.53898239135742, 39.9084587097168, 41.27793502807617, 42.64741134643555, 44.01688766479492, 45.3863639831543, 46.75584030151367, 48.12532043457031, 49.49479675292969, 50.86427307128906, 52.23374938964844, 53.60322570800781, 54.97270202636719, 56.34217834472656, 57.71165466308594, 59.08113098144531, 60.45060729980469, 61.82008361816406]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 2.0, 3.0, 0.0, 5.0, 5.0, 1.0, 1.0, 5.0, 0.0, 10.0, 14.0, 29.0, 42.0, 59.0, 84.0, 63.0, 56.0, 39.0, 19.0, 17.0, 5.0, 6.0, 5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.326555252075195, -26.490676879882812, -25.65479850769043, -24.818920135498047, -23.983043670654297, -23.14716339111328, -22.31128692626953, -21.47540855407715, -20.639530181884766, -19.803651809692383, -18.9677734375, -18.131895065307617, -17.296016693115234, -16.460140228271484, -15.624261856079102, -14.788383483886719, -13.952505111694336, -13.116626739501953, -12.28074836730957, -11.444870948791504, -10.608992576599121, -9.773114204406738, -8.937236785888672, -8.101358413696289, -7.265480041503906, -6.429601669311523, -5.593723773956299, -4.757845878601074, -3.9219675064086914, -3.0860891342163086, -2.250211238861084, -1.4143333435058594, -0.5784568786621094, 0.25742125511169434, 1.093299388885498, 1.9291775226593018, 2.7650556564331055, 3.6009340286254883, 4.436811923980713, 5.2726898193359375, 6.10856819152832, 6.944446563720703, 7.780324459075928, 8.616202354431152, 9.452080726623535, 10.287959098815918, 11.123836517333984, 11.959714889526367, 12.79559326171875, 13.631471633911133, 14.467350006103516, 15.303227424621582, 16.13910675048828, 16.97498321533203, 17.810861587524414, 18.646739959716797, 19.48261833190918, 20.318496704101562, 21.154375076293945, 21.990253448486328, 22.826129913330078, 23.662010192871094, 24.497886657714844, 25.333765029907227, 26.16964340209961]}, "eval/loss": 5.3852667808532715, "eval/wer": 1.35650535501785, "eval/runtime": 686.8292, "eval/samples_per_second": 3.847, "eval/steps_per_second": 0.482} \ No newline at end of file +{"train/loss": 2.7226, "train/learning_rate": 2.1101543942992875e-05, "train/epoch": 6.73, "train/global_step": 6000, "_runtime": 35174, "_timestamp": 1646982413, "_step": 6003, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 4.0, 0.0, 3.0, 3.0, 4.0, 8.0, 9.0, 17.0, 17.0, 13.0, 12.0, 22.0, 27.0, 29.0, 29.0, 32.0, 34.0, 26.0, 43.0, 38.0, 41.0, 34.0, 43.0, 55.0, 34.0, 32.0, 42.0, 43.0, 41.0, 28.0, 29.0, 45.0, 29.0, 29.0, 13.0, 18.0, 22.0, 15.0, 11.0, 8.0, 8.0, 5.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-14.104436874389648, -13.784018516540527, -13.463600158691406, -13.143182754516602, -12.82276439666748, -12.50234603881836, -12.181928634643555, -11.861510276794434, -11.541091918945312, -11.220673561096191, -10.90025520324707, -10.579837799072266, -10.259419441223145, -9.939001083374023, -9.618583679199219, -9.298165321350098, -8.977746963500977, -8.657328605651855, -8.336910247802734, -8.01649284362793, -7.696074485778809, -7.3756561279296875, -7.055238246917725, -6.734820365905762, -6.414402008056641, -6.0939836502075195, -5.773565769195557, -5.453147888183594, -5.132729530334473, -4.812311172485352, -4.491893291473389, -4.171475410461426, -3.851058006286621, -3.530639886856079, -3.210221767425537, -2.889803647994995, -2.569385528564453, -2.248967409133911, -1.9285492897033691, -1.6081311702728271, -1.2877130508422852, -0.9672949314117432, -0.6468768119812012, -0.3264586925506592, -0.0060405731201171875, 0.3143775463104248, 0.6347956657409668, 0.9552137851715088, 1.2756319046020508, 1.5960500240325928, 1.9164681434631348, 2.2368862628936768, 2.5573043823242188, 2.8777225017547607, 3.1981406211853027, 3.5185587406158447, 3.8389768600463867, 4.159395217895508, 4.479813098907471, 4.800230979919434, 5.120649337768555, 5.441067695617676, 5.761485576629639, 6.081903457641602, 6.402321815490723]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 3.0, 3.0, 14.0, 14.0, 18.0, 15.0, 15.0, 13.0, 23.0, 34.0, 23.0, 25.0, 41.0, 31.0, 33.0, 35.0, 33.0, 46.0, 30.0, 35.0, 44.0, 40.0, 25.0, 22.0, 37.0, 32.0, 24.0, 31.0, 24.0, 25.0, 22.0, 20.0, 28.0, 16.0, 17.0, 21.0, 13.0, 9.0, 19.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0], "bins": [-10.389012336730957, -10.077750205993652, -9.766488075256348, -9.455225944519043, -9.143962860107422, -8.832700729370117, -8.521438598632812, -8.210176467895508, -7.898914337158203, -7.587652206420898, -7.276390075683594, -6.965127468109131, -6.653865337371826, -6.3426032066345215, -6.031340599060059, -5.720078468322754, -5.408816337585449, -5.0975542068481445, -4.78629207611084, -4.475029468536377, -4.163767337799072, -3.8525052070617676, -3.541242837905884, -3.22998046875, -2.9187183380126953, -2.6074562072753906, -2.296193838119507, -1.9849315881729126, -1.6736693382263184, -1.3624070882797241, -1.0511448383331299, -0.7398824691772461, -0.4286203384399414, -0.11735808849334717, 0.19390416145324707, 0.5051664113998413, 0.8164286613464355, 1.1276909112930298, 1.438953161239624, 1.7502155303955078, 2.0614776611328125, 2.372739791870117, 2.684002161026001, 2.9952645301818848, 3.3065266609191895, 3.617788791656494, 3.929051160812378, 4.240313529968262, 4.551575660705566, 4.862837791442871, 5.174099922180176, 5.485362529754639, 5.796624660491943, 6.107886791229248, 6.419149398803711, 6.730411529541016, 7.04167366027832, 7.352935791015625, 7.66419792175293, 7.975460529327393, 8.286722183227539, 8.59798526763916, 8.909247398376465, 9.22050952911377, 9.531771659851074]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 6.0, 9.0, 5.0, 12.0, 20.0, 53.0, 82.0, 134.0, 225.0, 347.0, 588.0, 854.0, 1408.0, 2314.0, 3799.0, 6163.0, 9889.0, 15410.0, 24360.0, 38350.0, 59343.0, 90629.0, 135415.0, 196980.0, 275513.0, 363914.0, 445566.0, 492764.0, 485901.0, 427128.0, 340018.0, 252449.0, 176690.0, 121570.0, 80241.0, 52873.0, 33876.0, 21700.0, 14103.0, 8800.0, 5519.0, 3470.0, 2257.0, 1314.0, 878.0, 512.0, 303.0, 206.0, 131.0, 86.0, 54.0, 22.0, 16.0, 12.0, 10.0, 3.0, 4.0, 1.0, 0.0, 2.0], "bins": [-8.3828125, -8.1197509765625, -7.856689453125, -7.5936279296875, -7.33056640625, -7.0675048828125, -6.804443359375, -6.5413818359375, -6.2783203125, -6.0152587890625, -5.752197265625, -5.4891357421875, -5.22607421875, -4.9630126953125, -4.699951171875, -4.4368896484375, -4.173828125, -3.9107666015625, -3.647705078125, -3.3846435546875, -3.12158203125, -2.8585205078125, -2.595458984375, -2.3323974609375, -2.0693359375, -1.8062744140625, -1.543212890625, -1.2801513671875, -1.01708984375, -0.7540283203125, -0.490966796875, -0.2279052734375, 0.03515625, 0.2982177734375, 0.561279296875, 0.8243408203125, 1.08740234375, 1.3504638671875, 1.613525390625, 1.8765869140625, 2.1396484375, 2.4027099609375, 2.665771484375, 2.9288330078125, 3.19189453125, 3.4549560546875, 3.718017578125, 3.9810791015625, 4.244140625, 4.5072021484375, 4.770263671875, 5.0333251953125, 5.29638671875, 5.5594482421875, 5.822509765625, 6.0855712890625, 6.3486328125, 6.6116943359375, 6.874755859375, 7.1378173828125, 7.40087890625, 7.6639404296875, 7.927001953125, 8.1900634765625, 8.453125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 2.0, 1.0, 3.0, 9.0, 10.0, 14.0, 5.0, 6.0, 12.0, 11.0, 20.0, 16.0, 25.0, 17.0, 31.0, 31.0, 27.0, 33.0, 37.0, 32.0, 29.0, 35.0, 42.0, 42.0, 25.0, 30.0, 38.0, 31.0, 32.0, 24.0, 30.0, 26.0, 17.0, 32.0, 19.0, 21.0, 27.0, 16.0, 19.0, 18.0, 26.0, 16.0, 14.0, 9.0, 8.0, 8.0, 6.0, 9.0, 0.0, 3.0, 4.0, 0.0, 4.0, 0.0, 3.0, 1.0, 1.0], "bins": [-7.421875, -7.18927001953125, -6.9566650390625, -6.72406005859375, -6.491455078125, -6.25885009765625, -6.0262451171875, -5.79364013671875, -5.56103515625, -5.32843017578125, -5.0958251953125, -4.86322021484375, -4.630615234375, -4.39801025390625, -4.1654052734375, -3.93280029296875, -3.7001953125, -3.46759033203125, -3.2349853515625, -3.00238037109375, -2.769775390625, -2.53717041015625, -2.3045654296875, -2.07196044921875, -1.83935546875, -1.60675048828125, -1.3741455078125, -1.14154052734375, -0.908935546875, -0.67633056640625, -0.4437255859375, -0.21112060546875, 0.021484375, 0.25408935546875, 0.4866943359375, 0.71929931640625, 0.951904296875, 1.18450927734375, 1.4171142578125, 1.64971923828125, 1.88232421875, 2.11492919921875, 2.3475341796875, 2.58013916015625, 2.812744140625, 3.04534912109375, 3.2779541015625, 3.51055908203125, 3.7431640625, 3.97576904296875, 4.2083740234375, 4.44097900390625, 4.673583984375, 4.90618896484375, 5.1387939453125, 5.37139892578125, 5.60400390625, 5.83660888671875, 6.0692138671875, 6.30181884765625, 6.534423828125, 6.76702880859375, 6.9996337890625, 7.23223876953125, 7.46484375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 9.0, 18.0, 33.0, 56.0, 75.0, 157.0, 219.0, 397.0, 636.0, 1143.0, 1765.0, 3004.0, 4931.0, 8007.0, 13234.0, 21243.0, 33629.0, 52129.0, 79303.0, 115602.0, 165230.0, 227527.0, 298698.0, 366861.0, 420312.0, 442428.0, 431101.0, 384272.0, 317623.0, 247247.0, 181209.0, 129345.0, 88518.0, 58480.0, 37524.0, 23685.0, 15016.0, 9460.0, 5649.0, 3477.0, 2079.0, 1244.0, 712.0, 398.0, 253.0, 154.0, 79.0, 51.0, 30.0, 18.0, 11.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-7.8515625, -7.6033935546875, -7.355224609375, -7.1070556640625, -6.85888671875, -6.6107177734375, -6.362548828125, -6.1143798828125, -5.8662109375, -5.6180419921875, -5.369873046875, -5.1217041015625, -4.87353515625, -4.6253662109375, -4.377197265625, -4.1290283203125, -3.880859375, -3.6326904296875, -3.384521484375, -3.1363525390625, -2.88818359375, -2.6400146484375, -2.391845703125, -2.1436767578125, -1.8955078125, -1.6473388671875, -1.399169921875, -1.1510009765625, -0.90283203125, -0.6546630859375, -0.406494140625, -0.1583251953125, 0.08984375, 0.3380126953125, 0.586181640625, 0.8343505859375, 1.08251953125, 1.3306884765625, 1.578857421875, 1.8270263671875, 2.0751953125, 2.3233642578125, 2.571533203125, 2.8197021484375, 3.06787109375, 3.3160400390625, 3.564208984375, 3.8123779296875, 4.060546875, 4.3087158203125, 4.556884765625, 4.8050537109375, 5.05322265625, 5.3013916015625, 5.549560546875, 5.7977294921875, 6.0458984375, 6.2940673828125, 6.542236328125, 6.7904052734375, 7.03857421875, 7.2867431640625, 7.534912109375, 7.7830810546875, 8.03125]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 6.0, 7.0, 15.0, 19.0, 18.0, 23.0, 36.0, 37.0, 48.0, 75.0, 86.0, 88.0, 104.0, 128.0, 152.0, 181.0, 166.0, 181.0, 199.0, 203.0, 226.0, 218.0, 200.0, 220.0, 192.0, 167.0, 162.0, 159.0, 134.0, 110.0, 97.0, 73.0, 71.0, 70.0, 42.0, 37.0, 29.0, 22.0, 22.0, 9.0, 16.0, 7.0, 7.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.17578125, -4.04339599609375, -3.9110107421875, -3.77862548828125, -3.646240234375, -3.51385498046875, -3.3814697265625, -3.24908447265625, -3.11669921875, -2.98431396484375, -2.8519287109375, -2.71954345703125, -2.587158203125, -2.45477294921875, -2.3223876953125, -2.19000244140625, -2.0576171875, -1.92523193359375, -1.7928466796875, -1.66046142578125, -1.528076171875, -1.39569091796875, -1.2633056640625, -1.13092041015625, -0.99853515625, -0.86614990234375, -0.7337646484375, -0.60137939453125, -0.468994140625, -0.33660888671875, -0.2042236328125, -0.07183837890625, 0.060546875, 0.19293212890625, 0.3253173828125, 0.45770263671875, 0.590087890625, 0.72247314453125, 0.8548583984375, 0.98724365234375, 1.11962890625, 1.25201416015625, 1.3843994140625, 1.51678466796875, 1.649169921875, 1.78155517578125, 1.9139404296875, 2.04632568359375, 2.1787109375, 2.31109619140625, 2.4434814453125, 2.57586669921875, 2.708251953125, 2.84063720703125, 2.9730224609375, 3.10540771484375, 3.23779296875, 3.37017822265625, 3.5025634765625, 3.63494873046875, 3.767333984375, 3.89971923828125, 4.0321044921875, 4.16448974609375, 4.296875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 9.0, 4.0, 8.0, 3.0, 8.0, 11.0, 15.0, 12.0, 20.0, 18.0, 25.0, 21.0, 24.0, 16.0, 30.0, 23.0, 36.0, 37.0, 36.0, 32.0, 46.0, 45.0, 43.0, 50.0, 43.0, 42.0, 36.0, 41.0, 39.0, 34.0, 27.0, 24.0, 25.0, 15.0, 16.0, 13.0, 16.0, 10.0, 11.0, 3.0, 8.0, 4.0, 5.0, 6.0, 3.0, 7.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-10.4581937789917, -10.15226936340332, -9.846344947814941, -9.540420532226562, -9.234496116638184, -8.928571701049805, -8.622647285461426, -8.316722869873047, -8.010798454284668, -7.704874038696289, -7.39894962310791, -7.093025207519531, -6.787100791931152, -6.481176376342773, -6.1752519607543945, -5.869327545166016, -5.563403129577637, -5.257478713989258, -4.951554298400879, -4.6456298828125, -4.339705467224121, -4.033781051635742, -3.7278566360473633, -3.4219322204589844, -3.1160078048706055, -2.8100833892822266, -2.5041589736938477, -2.1982345581054688, -1.8923101425170898, -1.586385726928711, -1.280461311340332, -0.9745368957519531, -0.6686115264892578, -0.3626871109008789, -0.0567626953125, 0.2491617202758789, 0.5550861358642578, 0.8610105514526367, 1.1669349670410156, 1.4728593826293945, 1.7787837982177734, 2.0847082138061523, 2.3906326293945312, 2.69655704498291, 3.002481460571289, 3.308405876159668, 3.614330291748047, 3.920254707336426, 4.226179122924805, 4.532103538513184, 4.8380279541015625, 5.143952369689941, 5.44987678527832, 5.755801200866699, 6.061725616455078, 6.367650032043457, 6.673574447631836, 6.979498863220215, 7.285423278808594, 7.591347694396973, 7.897272109985352, 8.20319652557373, 8.50912094116211, 8.815045356750488, 9.120969772338867]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 6.0, 2.0, 4.0, 6.0, 11.0, 7.0, 6.0, 14.0, 19.0, 14.0, 13.0, 13.0, 34.0, 29.0, 29.0, 35.0, 33.0, 40.0, 29.0, 36.0, 40.0, 41.0, 40.0, 38.0, 38.0, 35.0, 33.0, 34.0, 28.0, 27.0, 31.0, 27.0, 34.0, 20.0, 19.0, 12.0, 16.0, 18.0, 13.0, 23.0, 16.0, 6.0, 8.0, 4.0, 6.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.67910385131836, -9.376543045043945, -9.073982238769531, -8.771421432495117, -8.468860626220703, -8.166299819946289, -7.863739013671875, -7.561178207397461, -7.258617401123047, -6.956056594848633, -6.653495788574219, -6.350934982299805, -6.048374176025391, -5.745813369750977, -5.4432525634765625, -5.140691757202148, -4.838130950927734, -4.53557014465332, -4.233009338378906, -3.930448532104492, -3.627887725830078, -3.325326919555664, -3.02276611328125, -2.720205307006836, -2.417644500732422, -2.115083694458008, -1.8125228881835938, -1.5099620819091797, -1.2074012756347656, -0.9048404693603516, -0.6022796630859375, -0.29971885681152344, 0.002841949462890625, 0.3054027557373047, 0.6079635620117188, 0.9105243682861328, 1.2130851745605469, 1.515645980834961, 1.818206787109375, 2.120767593383789, 2.423328399658203, 2.725889205932617, 3.0284500122070312, 3.3310108184814453, 3.6335716247558594, 3.9361324310302734, 4.2386932373046875, 4.541254043579102, 4.843814849853516, 5.14637565612793, 5.448936462402344, 5.751497268676758, 6.054058074951172, 6.356618881225586, 6.6591796875, 6.961740493774414, 7.264301300048828, 7.566862106323242, 7.869422912597656, 8.17198371887207, 8.474544525146484, 8.777105331420898, 9.079666137695312, 9.382226943969727, 9.68478775024414]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 6.0, 9.0, 14.0, 29.0, 30.0, 50.0, 68.0, 89.0, 122.0, 197.0, 266.0, 383.0, 546.0, 743.0, 1092.0, 1534.0, 2316.0, 3716.0, 5647.0, 9073.0, 14827.0, 25097.0, 43585.0, 76493.0, 133669.0, 208879.0, 206369.0, 130781.0, 75500.0, 42937.0, 24386.0, 14628.0, 8903.0, 5510.0, 3581.0, 2332.0, 1605.0, 1081.0, 715.0, 493.0, 365.0, 253.0, 162.0, 143.0, 97.0, 73.0, 43.0, 39.0, 26.0, 22.0, 13.0, 6.0, 5.0, 6.0, 2.0, 1.0], "bins": [-5.9609375, -5.7855224609375, -5.610107421875, -5.4346923828125, -5.25927734375, -5.0838623046875, -4.908447265625, -4.7330322265625, -4.5576171875, -4.3822021484375, -4.206787109375, -4.0313720703125, -3.85595703125, -3.6805419921875, -3.505126953125, -3.3297119140625, -3.154296875, -2.9788818359375, -2.803466796875, -2.6280517578125, -2.45263671875, -2.2772216796875, -2.101806640625, -1.9263916015625, -1.7509765625, -1.5755615234375, -1.400146484375, -1.2247314453125, -1.04931640625, -0.8739013671875, -0.698486328125, -0.5230712890625, -0.34765625, -0.1722412109375, 0.003173828125, 0.1785888671875, 0.35400390625, 0.5294189453125, 0.704833984375, 0.8802490234375, 1.0556640625, 1.2310791015625, 1.406494140625, 1.5819091796875, 1.75732421875, 1.9327392578125, 2.108154296875, 2.2835693359375, 2.458984375, 2.6343994140625, 2.809814453125, 2.9852294921875, 3.16064453125, 3.3360595703125, 3.511474609375, 3.6868896484375, 3.8623046875, 4.0377197265625, 4.213134765625, 4.3885498046875, 4.56396484375, 4.7393798828125, 4.914794921875, 5.0902099609375, 5.265625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 3.0, 4.0, 6.0, 12.0, 6.0, 7.0, 13.0, 18.0, 15.0, 11.0, 16.0, 36.0, 26.0, 29.0, 33.0, 33.0, 36.0, 35.0, 32.0, 42.0, 39.0, 46.0, 32.0, 36.0, 39.0, 29.0, 35.0, 26.0, 31.0, 28.0, 29.0, 32.0, 22.0, 20.0, 13.0, 18.0, 14.0, 14.0, 21.0, 17.0, 8.0, 6.0, 7.0, 7.0, 2.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.53125, -9.2353515625, -8.939453125, -8.6435546875, -8.34765625, -8.0517578125, -7.755859375, -7.4599609375, -7.1640625, -6.8681640625, -6.572265625, -6.2763671875, -5.98046875, -5.6845703125, -5.388671875, -5.0927734375, -4.796875, -4.5009765625, -4.205078125, -3.9091796875, -3.61328125, -3.3173828125, -3.021484375, -2.7255859375, -2.4296875, -2.1337890625, -1.837890625, -1.5419921875, -1.24609375, -0.9501953125, -0.654296875, -0.3583984375, -0.0625, 0.2333984375, 0.529296875, 0.8251953125, 1.12109375, 1.4169921875, 1.712890625, 2.0087890625, 2.3046875, 2.6005859375, 2.896484375, 3.1923828125, 3.48828125, 3.7841796875, 4.080078125, 4.3759765625, 4.671875, 4.9677734375, 5.263671875, 5.5595703125, 5.85546875, 6.1513671875, 6.447265625, 6.7431640625, 7.0390625, 7.3349609375, 7.630859375, 7.9267578125, 8.22265625, 8.5185546875, 8.814453125, 9.1103515625, 9.40625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 4.0, 7.0, 13.0, 14.0, 12.0, 17.0, 35.0, 41.0, 67.0, 108.0, 133.0, 203.0, 298.0, 458.0, 702.0, 1123.0, 1909.0, 3400.0, 6616.0, 13928.0, 37788.0, 148093.0, 535589.0, 213666.0, 49833.0, 17287.0, 7653.0, 3859.0, 2137.0, 1273.0, 793.0, 493.0, 298.0, 189.0, 157.0, 108.0, 85.0, 52.0, 41.0, 18.0, 21.0, 10.0, 6.0, 6.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.9375, -9.641845703125, -9.34619140625, -9.050537109375, -8.7548828125, -8.459228515625, -8.16357421875, -7.867919921875, -7.572265625, -7.276611328125, -6.98095703125, -6.685302734375, -6.3896484375, -6.093994140625, -5.79833984375, -5.502685546875, -5.20703125, -4.911376953125, -4.61572265625, -4.320068359375, -4.0244140625, -3.728759765625, -3.43310546875, -3.137451171875, -2.841796875, -2.546142578125, -2.25048828125, -1.954833984375, -1.6591796875, -1.363525390625, -1.06787109375, -0.772216796875, -0.4765625, -0.180908203125, 0.11474609375, 0.410400390625, 0.7060546875, 1.001708984375, 1.29736328125, 1.593017578125, 1.888671875, 2.184326171875, 2.47998046875, 2.775634765625, 3.0712890625, 3.366943359375, 3.66259765625, 3.958251953125, 4.25390625, 4.549560546875, 4.84521484375, 5.140869140625, 5.4365234375, 5.732177734375, 6.02783203125, 6.323486328125, 6.619140625, 6.914794921875, 7.21044921875, 7.506103515625, 7.8017578125, 8.097412109375, 8.39306640625, 8.688720703125, 8.984375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 6.0, 8.0, 15.0, 10.0, 9.0, 15.0, 15.0, 23.0, 25.0, 17.0, 22.0, 22.0, 29.0, 33.0, 30.0, 23.0, 32.0, 30.0, 34.0, 36.0, 23.0, 35.0, 50.0, 50.0, 35.0, 40.0, 24.0, 25.0, 40.0, 24.0, 30.0, 23.0, 27.0, 21.0, 22.0, 20.0, 16.0, 15.0, 8.0, 9.0, 4.0, 9.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 4.0], "bins": [-6.69140625, -6.49725341796875, -6.3031005859375, -6.10894775390625, -5.914794921875, -5.72064208984375, -5.5264892578125, -5.33233642578125, -5.13818359375, -4.94403076171875, -4.7498779296875, -4.55572509765625, -4.361572265625, -4.16741943359375, -3.9732666015625, -3.77911376953125, -3.5849609375, -3.39080810546875, -3.1966552734375, -3.00250244140625, -2.808349609375, -2.61419677734375, -2.4200439453125, -2.22589111328125, -2.03173828125, -1.83758544921875, -1.6434326171875, -1.44927978515625, -1.255126953125, -1.06097412109375, -0.8668212890625, -0.67266845703125, -0.478515625, -0.28436279296875, -0.0902099609375, 0.10394287109375, 0.298095703125, 0.49224853515625, 0.6864013671875, 0.88055419921875, 1.07470703125, 1.26885986328125, 1.4630126953125, 1.65716552734375, 1.851318359375, 2.04547119140625, 2.2396240234375, 2.43377685546875, 2.6279296875, 2.82208251953125, 3.0162353515625, 3.21038818359375, 3.404541015625, 3.59869384765625, 3.7928466796875, 3.98699951171875, 4.18115234375, 4.37530517578125, 4.5694580078125, 4.76361083984375, 4.957763671875, 5.15191650390625, 5.3460693359375, 5.54022216796875, 5.734375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 9.0, 8.0, 11.0, 19.0, 22.0, 33.0, 37.0, 69.0, 112.0, 116.0, 179.0, 307.0, 414.0, 705.0, 1282.0, 2404.0, 5193.0, 13920.0, 61526.0, 726875.0, 194492.0, 25282.0, 7996.0, 3359.0, 1613.0, 947.0, 542.0, 342.0, 222.0, 164.0, 95.0, 84.0, 50.0, 30.0, 35.0, 19.0, 13.0, 16.0, 5.0, 2.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4140625, -6.22393798828125, -6.0338134765625, -5.84368896484375, -5.653564453125, -5.46343994140625, -5.2733154296875, -5.08319091796875, -4.89306640625, -4.70294189453125, -4.5128173828125, -4.32269287109375, -4.132568359375, -3.94244384765625, -3.7523193359375, -3.56219482421875, -3.3720703125, -3.18194580078125, -2.9918212890625, -2.80169677734375, -2.611572265625, -2.42144775390625, -2.2313232421875, -2.04119873046875, -1.85107421875, -1.66094970703125, -1.4708251953125, -1.28070068359375, -1.090576171875, -0.90045166015625, -0.7103271484375, -0.52020263671875, -0.330078125, -0.13995361328125, 0.0501708984375, 0.24029541015625, 0.430419921875, 0.62054443359375, 0.8106689453125, 1.00079345703125, 1.19091796875, 1.38104248046875, 1.5711669921875, 1.76129150390625, 1.951416015625, 2.14154052734375, 2.3316650390625, 2.52178955078125, 2.7119140625, 2.90203857421875, 3.0921630859375, 3.28228759765625, 3.472412109375, 3.66253662109375, 3.8526611328125, 4.04278564453125, 4.23291015625, 4.42303466796875, 4.6131591796875, 4.80328369140625, 4.993408203125, 5.18353271484375, 5.3736572265625, 5.56378173828125, 5.75390625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 8.0, 8.0, 9.0, 31.0, 31.0, 67.0, 130.0, 207.0, 207.0, 143.0, 81.0, 38.0, 14.0, 9.0, 6.0, 4.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0007839202880859375, -0.0007601827383041382, -0.0007364451885223389, -0.0007127076387405396, -0.0006889700889587402, -0.0006652325391769409, -0.0006414949893951416, -0.0006177574396133423, -0.000594019889831543, -0.0005702823400497437, -0.0005465447902679443, -0.000522807240486145, -0.0004990696907043457, -0.0004753321409225464, -0.00045159459114074707, -0.00042785704135894775, -0.00040411949157714844, -0.0003803819417953491, -0.0003566443920135498, -0.0003329068422317505, -0.00030916929244995117, -0.00028543174266815186, -0.00026169419288635254, -0.00023795664310455322, -0.0002142190933227539, -0.0001904815435409546, -0.00016674399375915527, -0.00014300644397735596, -0.00011926889419555664, -9.553134441375732e-05, -7.179379463195801e-05, -4.805624485015869e-05, -2.4318695068359375e-05, -5.811452865600586e-07, 2.3156404495239258e-05, 4.6893954277038574e-05, 7.063150405883789e-05, 9.436905384063721e-05, 0.00011810660362243652, 0.00014184415340423584, 0.00016558170318603516, 0.00018931925296783447, 0.0002130568027496338, 0.0002367943525314331, 0.0002605319023132324, 0.00028426945209503174, 0.00030800700187683105, 0.00033174455165863037, 0.0003554821014404297, 0.000379219651222229, 0.0004029572010040283, 0.00042669475078582764, 0.00045043230056762695, 0.00047416985034942627, 0.0004979074001312256, 0.0005216449499130249, 0.0005453824996948242, 0.0005691200494766235, 0.0005928575992584229, 0.0006165951490402222, 0.0006403326988220215, 0.0006640702486038208, 0.0006878077983856201, 0.0007115453481674194, 0.0007352828979492188]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 3.0, 4.0, 4.0, 11.0, 14.0, 15.0, 18.0, 32.0, 58.0, 77.0, 112.0, 182.0, 241.0, 352.0, 463.0, 772.0, 1204.0, 1992.0, 3574.0, 6789.0, 15402.0, 38476.0, 105845.0, 298430.0, 351526.0, 137010.0, 48183.0, 19131.0, 8445.0, 4118.0, 2192.0, 1262.0, 847.0, 529.0, 367.0, 281.0, 174.0, 129.0, 84.0, 57.0, 52.0, 27.0, 19.0, 23.0, 5.0, 5.0, 8.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.91796875, -4.76947021484375, -4.6209716796875, -4.47247314453125, -4.323974609375, -4.17547607421875, -4.0269775390625, -3.87847900390625, -3.72998046875, -3.58148193359375, -3.4329833984375, -3.28448486328125, -3.135986328125, -2.98748779296875, -2.8389892578125, -2.69049072265625, -2.5419921875, -2.39349365234375, -2.2449951171875, -2.09649658203125, -1.947998046875, -1.79949951171875, -1.6510009765625, -1.50250244140625, -1.35400390625, -1.20550537109375, -1.0570068359375, -0.90850830078125, -0.760009765625, -0.61151123046875, -0.4630126953125, -0.31451416015625, -0.166015625, -0.01751708984375, 0.1309814453125, 0.27947998046875, 0.427978515625, 0.57647705078125, 0.7249755859375, 0.87347412109375, 1.02197265625, 1.17047119140625, 1.3189697265625, 1.46746826171875, 1.615966796875, 1.76446533203125, 1.9129638671875, 2.06146240234375, 2.2099609375, 2.35845947265625, 2.5069580078125, 2.65545654296875, 2.803955078125, 2.95245361328125, 3.1009521484375, 3.24945068359375, 3.39794921875, 3.54644775390625, 3.6949462890625, 3.84344482421875, 3.991943359375, 4.14044189453125, 4.2889404296875, 4.43743896484375, 4.5859375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 9.0, 4.0, 9.0, 8.0, 20.0, 21.0, 28.0, 30.0, 43.0, 86.0, 133.0, 145.0, 127.0, 91.0, 67.0, 51.0, 32.0, 15.0, 21.0, 20.0, 9.0, 8.0, 2.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.208984375, -1.1601715087890625, -1.111358642578125, -1.0625457763671875, -1.01373291015625, -0.9649200439453125, -0.916107177734375, -0.8672943115234375, -0.8184814453125, -0.7696685791015625, -0.720855712890625, -0.6720428466796875, -0.62322998046875, -0.5744171142578125, -0.525604248046875, -0.4767913818359375, -0.427978515625, -0.3791656494140625, -0.330352783203125, -0.2815399169921875, -0.23272705078125, -0.1839141845703125, -0.135101318359375, -0.0862884521484375, -0.0374755859375, 0.0113372802734375, 0.060150146484375, 0.1089630126953125, 0.15777587890625, 0.2065887451171875, 0.255401611328125, 0.3042144775390625, 0.35302734375, 0.4018402099609375, 0.450653076171875, 0.4994659423828125, 0.54827880859375, 0.5970916748046875, 0.645904541015625, 0.6947174072265625, 0.7435302734375, 0.7923431396484375, 0.841156005859375, 0.8899688720703125, 0.93878173828125, 0.9875946044921875, 1.036407470703125, 1.0852203369140625, 1.134033203125, 1.1828460693359375, 1.231658935546875, 1.2804718017578125, 1.32928466796875, 1.3780975341796875, 1.426910400390625, 1.4757232666015625, 1.5245361328125, 1.5733489990234375, 1.622161865234375, 1.6709747314453125, 1.71978759765625, 1.7686004638671875, 1.817413330078125, 1.8662261962890625, 1.9150390625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 5.0, 8.0, 6.0, 9.0, 8.0, 16.0, 12.0, 12.0, 22.0, 16.0, 27.0, 13.0, 22.0, 30.0, 27.0, 26.0, 33.0, 41.0, 44.0, 33.0, 38.0, 47.0, 53.0, 39.0, 39.0, 42.0, 44.0, 40.0, 37.0, 27.0, 23.0, 18.0, 16.0, 23.0, 14.0, 18.0, 13.0, 13.0, 7.0, 7.0, 5.0, 6.0, 7.0, 2.0, 6.0, 3.0, 5.0, 1.0, 1.0, 2.0, 2.0], "bins": [-10.455994606018066, -10.153267860412598, -9.850540161132812, -9.547813415527344, -9.245086669921875, -8.94235897064209, -8.639632225036621, -8.336904525756836, -8.034177780151367, -7.73145055770874, -7.428723335266113, -7.1259965896606445, -6.823269367218018, -6.520542144775391, -6.217815399169922, -5.915088176727295, -5.612360954284668, -5.309633731842041, -5.006906509399414, -4.704179763793945, -4.401452541351318, -4.098725318908691, -3.7959983348846436, -3.4932713508605957, -3.1905441284179688, -2.887816905975342, -2.585089921951294, -2.282362937927246, -1.9796357154846191, -1.6769086122512817, -1.3741815090179443, -1.0714545249938965, -0.7687263488769531, -0.4659992456436157, -0.16327214241027832, 0.13945496082305908, 0.4421820640563965, 0.7449091672897339, 1.0476362705230713, 1.3503632545471191, 1.653090476989746, 1.9558175802230835, 2.258544683456421, 2.5612716674804688, 2.8639988899230957, 3.1667261123657227, 3.4694530963897705, 3.7721800804138184, 4.074907302856445, 4.377634525299072, 4.680361747741699, 4.983088493347168, 5.285815715789795, 5.588542938232422, 5.891269683837891, 6.193996906280518, 6.4967241287231445, 6.7994513511657715, 7.102178573608398, 7.404905319213867, 7.707632541656494, 8.010359764099121, 8.31308650970459, 8.615814208984375, 8.918540954589844]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 6.0, 5.0, 4.0, 11.0, 5.0, 8.0, 10.0, 13.0, 18.0, 14.0, 16.0, 24.0, 27.0, 30.0, 28.0, 31.0, 45.0, 33.0, 40.0, 35.0, 35.0, 44.0, 35.0, 47.0, 31.0, 32.0, 28.0, 35.0, 38.0, 27.0, 23.0, 35.0, 20.0, 26.0, 13.0, 19.0, 17.0, 17.0, 16.0, 18.0, 5.0, 6.0, 10.0, 4.0, 4.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.74306869506836, -9.444079399108887, -9.145090103149414, -8.846100807189941, -8.547111511230469, -8.248123168945312, -7.94913387298584, -7.650144577026367, -7.3511552810668945, -7.052165985107422, -6.753176689147949, -6.454187870025635, -6.155198574066162, -5.8562092781066895, -5.557220458984375, -5.258231163024902, -4.95924186706543, -4.660252571105957, -4.361263275146484, -4.06227445602417, -3.7632851600646973, -3.4642958641052246, -3.165306806564331, -2.8663177490234375, -2.567328453063965, -2.268339157104492, -1.9693500995635986, -1.6703609228134155, -1.3713717460632324, -1.0723825693130493, -0.7733933925628662, -0.47440433502197266, -0.1754150390625, 0.1235741376876831, 0.4225633144378662, 0.7215524911880493, 1.0205416679382324, 1.3195308446884155, 1.6185200214385986, 1.9175090789794922, 2.216498374938965, 2.5154876708984375, 2.814476728439331, 3.1134657859802246, 3.4124550819396973, 3.71144437789917, 4.010433197021484, 4.309422492980957, 4.60841178894043, 4.907401084899902, 5.206390380859375, 5.5053791999816895, 5.804368495941162, 6.103357791900635, 6.402346611022949, 6.701335906982422, 7.0003252029418945, 7.299314498901367, 7.59830379486084, 7.897292613983154, 8.196281433105469, 8.495270729064941, 8.794260025024414, 9.093249320983887, 9.39223861694336]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 9.0, 16.0, 10.0, 30.0, 25.0, 64.0, 104.0, 134.0, 209.0, 295.0, 524.0, 749.0, 1161.0, 1717.0, 2736.0, 3963.0, 5911.0, 8534.0, 12299.0, 17430.0, 23644.0, 32368.0, 42054.0, 52726.0, 63289.0, 74079.0, 82335.0, 86679.0, 87579.0, 83937.0, 76728.0, 66606.0, 55593.0, 44150.0, 34272.0, 25810.0, 18718.0, 13346.0, 9431.0, 6451.0, 4269.0, 2897.0, 1919.0, 1316.0, 866.0, 545.0, 364.0, 229.0, 170.0, 87.0, 83.0, 34.0, 19.0, 23.0, 12.0, 9.0, 3.0, 5.0], "bins": [-7.91796875, -7.6859130859375, -7.453857421875, -7.2218017578125, -6.98974609375, -6.7576904296875, -6.525634765625, -6.2935791015625, -6.0615234375, -5.8294677734375, -5.597412109375, -5.3653564453125, -5.13330078125, -4.9012451171875, -4.669189453125, -4.4371337890625, -4.205078125, -3.9730224609375, -3.740966796875, -3.5089111328125, -3.27685546875, -3.0447998046875, -2.812744140625, -2.5806884765625, -2.3486328125, -2.1165771484375, -1.884521484375, -1.6524658203125, -1.42041015625, -1.1883544921875, -0.956298828125, -0.7242431640625, -0.4921875, -0.2601318359375, -0.028076171875, 0.2039794921875, 0.43603515625, 0.6680908203125, 0.900146484375, 1.1322021484375, 1.3642578125, 1.5963134765625, 1.828369140625, 2.0604248046875, 2.29248046875, 2.5245361328125, 2.756591796875, 2.9886474609375, 3.220703125, 3.4527587890625, 3.684814453125, 3.9168701171875, 4.14892578125, 4.3809814453125, 4.613037109375, 4.8450927734375, 5.0771484375, 5.3092041015625, 5.541259765625, 5.7733154296875, 6.00537109375, 6.2374267578125, 6.469482421875, 6.7015380859375, 6.93359375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 6.0, 2.0, 4.0, 5.0, 5.0, 9.0, 9.0, 6.0, 9.0, 13.0, 17.0, 15.0, 13.0, 26.0, 26.0, 28.0, 30.0, 34.0, 38.0, 34.0, 41.0, 37.0, 35.0, 42.0, 37.0, 41.0, 36.0, 32.0, 29.0, 34.0, 40.0, 27.0, 20.0, 35.0, 23.0, 23.0, 18.0, 20.0, 15.0, 18.0, 13.0, 20.0, 6.0, 8.0, 8.0, 5.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.4921875, -9.2020263671875, -8.911865234375, -8.6217041015625, -8.33154296875, -8.0413818359375, -7.751220703125, -7.4610595703125, -7.1708984375, -6.8807373046875, -6.590576171875, -6.3004150390625, -6.01025390625, -5.7200927734375, -5.429931640625, -5.1397705078125, -4.849609375, -4.5594482421875, -4.269287109375, -3.9791259765625, -3.68896484375, -3.3988037109375, -3.108642578125, -2.8184814453125, -2.5283203125, -2.2381591796875, -1.947998046875, -1.6578369140625, -1.36767578125, -1.0775146484375, -0.787353515625, -0.4971923828125, -0.20703125, 0.0831298828125, 0.373291015625, 0.6634521484375, 0.95361328125, 1.2437744140625, 1.533935546875, 1.8240966796875, 2.1142578125, 2.4044189453125, 2.694580078125, 2.9847412109375, 3.27490234375, 3.5650634765625, 3.855224609375, 4.1453857421875, 4.435546875, 4.7257080078125, 5.015869140625, 5.3060302734375, 5.59619140625, 5.8863525390625, 6.176513671875, 6.4666748046875, 6.7568359375, 7.0469970703125, 7.337158203125, 7.6273193359375, 7.91748046875, 8.2076416015625, 8.497802734375, 8.7879638671875, 9.078125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 7.0, 8.0, 7.0, 12.0, 32.0, 46.0, 82.0, 134.0, 219.0, 319.0, 649.0, 970.0, 1634.0, 2841.0, 4766.0, 7680.0, 12283.0, 19030.0, 29181.0, 42539.0, 60000.0, 78688.0, 97339.0, 110114.0, 115314.0, 109942.0, 96624.0, 78316.0, 59234.0, 42081.0, 28578.0, 18756.0, 12053.0, 7550.0, 4492.0, 2773.0, 1646.0, 993.0, 684.0, 394.0, 217.0, 130.0, 82.0, 39.0, 26.0, 26.0, 12.0, 3.0, 8.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.7734375, -10.4417724609375, -10.110107421875, -9.7784423828125, -9.44677734375, -9.1151123046875, -8.783447265625, -8.4517822265625, -8.1201171875, -7.7884521484375, -7.456787109375, -7.1251220703125, -6.79345703125, -6.4617919921875, -6.130126953125, -5.7984619140625, -5.466796875, -5.1351318359375, -4.803466796875, -4.4718017578125, -4.14013671875, -3.8084716796875, -3.476806640625, -3.1451416015625, -2.8134765625, -2.4818115234375, -2.150146484375, -1.8184814453125, -1.48681640625, -1.1551513671875, -0.823486328125, -0.4918212890625, -0.16015625, 0.1715087890625, 0.503173828125, 0.8348388671875, 1.16650390625, 1.4981689453125, 1.829833984375, 2.1614990234375, 2.4931640625, 2.8248291015625, 3.156494140625, 3.4881591796875, 3.81982421875, 4.1514892578125, 4.483154296875, 4.8148193359375, 5.146484375, 5.4781494140625, 5.809814453125, 6.1414794921875, 6.47314453125, 6.8048095703125, 7.136474609375, 7.4681396484375, 7.7998046875, 8.1314697265625, 8.463134765625, 8.7947998046875, 9.12646484375, 9.4581298828125, 9.789794921875, 10.1214599609375, 10.453125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 3.0, 7.0, 6.0, 3.0, 15.0, 8.0, 15.0, 13.0, 14.0, 20.0, 23.0, 28.0, 29.0, 38.0, 29.0, 31.0, 42.0, 46.0, 53.0, 35.0, 38.0, 33.0, 36.0, 43.0, 27.0, 48.0, 35.0, 39.0, 33.0, 33.0, 27.0, 23.0, 23.0, 11.0, 23.0, 11.0, 7.0, 7.0, 12.0, 6.0, 7.0, 8.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.75390625, -6.54119873046875, -6.3284912109375, -6.11578369140625, -5.903076171875, -5.69036865234375, -5.4776611328125, -5.26495361328125, -5.05224609375, -4.83953857421875, -4.6268310546875, -4.41412353515625, -4.201416015625, -3.98870849609375, -3.7760009765625, -3.56329345703125, -3.3505859375, -3.13787841796875, -2.9251708984375, -2.71246337890625, -2.499755859375, -2.28704833984375, -2.0743408203125, -1.86163330078125, -1.64892578125, -1.43621826171875, -1.2235107421875, -1.01080322265625, -0.798095703125, -0.58538818359375, -0.3726806640625, -0.15997314453125, 0.052734375, 0.26544189453125, 0.4781494140625, 0.69085693359375, 0.903564453125, 1.11627197265625, 1.3289794921875, 1.54168701171875, 1.75439453125, 1.96710205078125, 2.1798095703125, 2.39251708984375, 2.605224609375, 2.81793212890625, 3.0306396484375, 3.24334716796875, 3.4560546875, 3.66876220703125, 3.8814697265625, 4.09417724609375, 4.306884765625, 4.51959228515625, 4.7322998046875, 4.94500732421875, 5.15771484375, 5.37042236328125, 5.5831298828125, 5.79583740234375, 6.008544921875, 6.22125244140625, 6.4339599609375, 6.64666748046875, 6.859375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 0.0, 7.0, 12.0, 14.0, 25.0, 33.0, 50.0, 72.0, 111.0, 178.0, 286.0, 449.0, 675.0, 1174.0, 1789.0, 2920.0, 4696.0, 7919.0, 12719.0, 21007.0, 32963.0, 51622.0, 76936.0, 104877.0, 130370.0, 140888.0, 131122.0, 107062.0, 77524.0, 52492.0, 33711.0, 21307.0, 12976.0, 7872.0, 4802.0, 2918.0, 1795.0, 1164.0, 707.0, 472.0, 307.0, 184.0, 126.0, 72.0, 52.0, 40.0, 28.0, 14.0, 8.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.16796875, -4.039794921875, -3.91162109375, -3.783447265625, -3.6552734375, -3.527099609375, -3.39892578125, -3.270751953125, -3.142578125, -3.014404296875, -2.88623046875, -2.758056640625, -2.6298828125, -2.501708984375, -2.37353515625, -2.245361328125, -2.1171875, -1.989013671875, -1.86083984375, -1.732666015625, -1.6044921875, -1.476318359375, -1.34814453125, -1.219970703125, -1.091796875, -0.963623046875, -0.83544921875, -0.707275390625, -0.5791015625, -0.450927734375, -0.32275390625, -0.194580078125, -0.06640625, 0.061767578125, 0.18994140625, 0.318115234375, 0.4462890625, 0.574462890625, 0.70263671875, 0.830810546875, 0.958984375, 1.087158203125, 1.21533203125, 1.343505859375, 1.4716796875, 1.599853515625, 1.72802734375, 1.856201171875, 1.984375, 2.112548828125, 2.24072265625, 2.368896484375, 2.4970703125, 2.625244140625, 2.75341796875, 2.881591796875, 3.009765625, 3.137939453125, 3.26611328125, 3.394287109375, 3.5224609375, 3.650634765625, 3.77880859375, 3.906982421875, 4.03515625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 6.0, 6.0, 7.0, 12.0, 10.0, 15.0, 18.0, 17.0, 21.0, 29.0, 24.0, 40.0, 41.0, 43.0, 40.0, 46.0, 52.0, 40.0, 53.0, 70.0, 48.0, 67.0, 51.0, 41.0, 37.0, 25.0, 29.0, 20.0, 23.0, 11.0, 12.0, 8.0, 8.0, 5.0, 4.0, 7.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00048279762268066406, -0.0004680268466472626, -0.0004532560706138611, -0.0004384852945804596, -0.0004237145185470581, -0.0004089437425136566, -0.0003941729664802551, -0.00037940219044685364, -0.00036463141441345215, -0.00034986063838005066, -0.00033508986234664917, -0.0003203190863132477, -0.0003055483102798462, -0.0002907775342464447, -0.0002760067582130432, -0.0002612359821796417, -0.00024646520614624023, -0.00023169443011283875, -0.00021692365407943726, -0.00020215287804603577, -0.00018738210201263428, -0.0001726113259792328, -0.0001578405499458313, -0.0001430697739124298, -0.00012829899787902832, -0.00011352822184562683, -9.875744581222534e-05, -8.398666977882385e-05, -6.921589374542236e-05, -5.4445117712020874e-05, -3.9674341678619385e-05, -2.4903565645217896e-05, -1.0132789611816406e-05, 4.637986421585083e-06, 1.9408762454986572e-05, 3.417953848838806e-05, 4.895031452178955e-05, 6.372109055519104e-05, 7.849186658859253e-05, 9.326264262199402e-05, 0.00010803341865539551, 0.000122804194688797, 0.00013757497072219849, 0.00015234574675559998, 0.00016711652278900146, 0.00018188729882240295, 0.00019665807485580444, 0.00021142885088920593, 0.00022619962692260742, 0.0002409704029560089, 0.0002557411789894104, 0.0002705119550228119, 0.0002852827310562134, 0.00030005350708961487, 0.00031482428312301636, 0.00032959505915641785, 0.00034436583518981934, 0.0003591366112232208, 0.0003739073872566223, 0.0003886781632900238, 0.0004034489393234253, 0.0004182197153568268, 0.00043299049139022827, 0.00044776126742362976, 0.00046253204345703125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 8.0, 4.0, 10.0, 7.0, 24.0, 24.0, 50.0, 78.0, 91.0, 170.0, 190.0, 337.0, 480.0, 755.0, 1154.0, 1808.0, 2806.0, 4717.0, 7686.0, 12605.0, 20573.0, 33186.0, 52089.0, 76455.0, 106052.0, 129966.0, 139483.0, 131100.0, 105919.0, 78610.0, 52912.0, 34141.0, 21215.0, 12934.0, 7942.0, 4803.0, 2901.0, 1819.0, 1215.0, 737.0, 496.0, 321.0, 229.0, 155.0, 103.0, 67.0, 49.0, 37.0, 25.0, 10.0, 7.0, 8.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.88671875, -3.763427734375, -3.64013671875, -3.516845703125, -3.3935546875, -3.270263671875, -3.14697265625, -3.023681640625, -2.900390625, -2.777099609375, -2.65380859375, -2.530517578125, -2.4072265625, -2.283935546875, -2.16064453125, -2.037353515625, -1.9140625, -1.790771484375, -1.66748046875, -1.544189453125, -1.4208984375, -1.297607421875, -1.17431640625, -1.051025390625, -0.927734375, -0.804443359375, -0.68115234375, -0.557861328125, -0.4345703125, -0.311279296875, -0.18798828125, -0.064697265625, 0.05859375, 0.181884765625, 0.30517578125, 0.428466796875, 0.5517578125, 0.675048828125, 0.79833984375, 0.921630859375, 1.044921875, 1.168212890625, 1.29150390625, 1.414794921875, 1.5380859375, 1.661376953125, 1.78466796875, 1.907958984375, 2.03125, 2.154541015625, 2.27783203125, 2.401123046875, 2.5244140625, 2.647705078125, 2.77099609375, 2.894287109375, 3.017578125, 3.140869140625, 3.26416015625, 3.387451171875, 3.5107421875, 3.634033203125, 3.75732421875, 3.880615234375, 4.00390625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 3.0, 6.0, 6.0, 13.0, 9.0, 10.0, 18.0, 19.0, 26.0, 21.0, 31.0, 38.0, 48.0, 46.0, 66.0, 76.0, 49.0, 55.0, 57.0, 41.0, 58.0, 48.0, 38.0, 36.0, 31.0, 31.0, 25.0, 17.0, 12.0, 9.0, 13.0, 13.0, 5.0, 9.0, 5.0, 2.0, 5.0, 3.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0234375, -1.959197998046875, -1.89495849609375, -1.830718994140625, -1.7664794921875, -1.702239990234375, -1.63800048828125, -1.573760986328125, -1.509521484375, -1.445281982421875, -1.38104248046875, -1.316802978515625, -1.2525634765625, -1.188323974609375, -1.12408447265625, -1.059844970703125, -0.99560546875, -0.931365966796875, -0.86712646484375, -0.802886962890625, -0.7386474609375, -0.674407958984375, -0.61016845703125, -0.545928955078125, -0.481689453125, -0.417449951171875, -0.35321044921875, -0.288970947265625, -0.2247314453125, -0.160491943359375, -0.09625244140625, -0.032012939453125, 0.0322265625, 0.096466064453125, 0.16070556640625, 0.224945068359375, 0.2891845703125, 0.353424072265625, 0.41766357421875, 0.481903076171875, 0.546142578125, 0.610382080078125, 0.67462158203125, 0.738861083984375, 0.8031005859375, 0.867340087890625, 0.93157958984375, 0.995819091796875, 1.06005859375, 1.124298095703125, 1.18853759765625, 1.252777099609375, 1.3170166015625, 1.381256103515625, 1.44549560546875, 1.509735107421875, 1.573974609375, 1.638214111328125, 1.70245361328125, 1.766693115234375, 1.8309326171875, 1.895172119140625, 1.95941162109375, 2.023651123046875, 2.087890625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 2.0, 11.0, 9.0, 12.0, 8.0, 16.0, 9.0, 18.0, 22.0, 19.0, 37.0, 32.0, 27.0, 21.0, 36.0, 31.0, 37.0, 31.0, 46.0, 33.0, 54.0, 47.0, 39.0, 41.0, 43.0, 40.0, 30.0, 38.0, 31.0, 26.0, 21.0, 15.0, 17.0, 13.0, 14.0, 13.0, 12.0, 6.0, 9.0, 9.0, 4.0, 4.0, 4.0, 1.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.584078788757324, -9.281476020812988, -8.978874206542969, -8.676271438598633, -8.373669624328613, -8.071066856384277, -7.7684645652771, -7.465862274169922, -7.163259983062744, -6.860657691955566, -6.558055400848389, -6.255453109741211, -5.952850341796875, -5.6502485275268555, -5.3476457595825195, -5.045043468475342, -4.742441177368164, -4.439838886260986, -4.137236595153809, -3.8346340656280518, -3.532031774520874, -3.2294294834136963, -2.9268269538879395, -2.6242246627807617, -2.321622371673584, -2.0190200805664062, -1.716417670249939, -1.4138152599334717, -1.111212968826294, -0.8086106777191162, -0.5060082674026489, -0.20340585708618164, 0.0991973876953125, 0.401799738407135, 0.7044020891189575, 1.0070044994354248, 1.3096067905426025, 1.6122090816497803, 1.9148114919662476, 2.217413902282715, 2.5200161933898926, 2.8226184844970703, 3.125220775604248, 3.427823305130005, 3.7304255962371826, 4.033027648925781, 4.335630416870117, 4.638232707977295, 4.940834999084473, 5.24343729019165, 5.546039581298828, 5.848641872406006, 6.151244163513184, 6.4538469314575195, 6.756449222564697, 7.059051513671875, 7.361653804779053, 7.6642560958862305, 7.966858386993408, 8.269460678100586, 8.572063446044922, 8.874665260314941, 9.177268028259277, 9.479869842529297, 9.782472610473633]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 2.0, 7.0, 10.0, 8.0, 7.0, 10.0, 13.0, 16.0, 13.0, 18.0, 26.0, 18.0, 23.0, 25.0, 35.0, 32.0, 39.0, 41.0, 43.0, 44.0, 52.0, 32.0, 45.0, 51.0, 35.0, 35.0, 36.0, 33.0, 37.0, 31.0, 24.0, 21.0, 24.0, 18.0, 22.0, 13.0, 14.0, 9.0, 7.0, 7.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.64548397064209, -10.315455436706543, -9.985426902770996, -9.655397415161133, -9.325368881225586, -8.995340347290039, -8.665311813354492, -8.335283279418945, -8.005254745483398, -7.675226211547852, -7.3451972007751465, -7.0151686668396, -6.6851396560668945, -6.355111122131348, -6.025082588195801, -5.695054054260254, -5.365024566650391, -5.034996032714844, -4.704967021942139, -4.374938488006592, -4.044909477233887, -3.71488094329834, -3.384852409362793, -3.054823637008667, -2.724794864654541, -2.394766092300415, -2.064737319946289, -1.7347087860107422, -1.4046800136566162, -1.0746512413024902, -0.7446225881576538, -0.4145939350128174, -0.084564208984375, 0.2454645037651062, 0.5754932165145874, 0.9055219292640686, 1.2355506420135498, 1.5655794143676758, 1.8956080675125122, 2.2256367206573486, 2.5556654930114746, 2.8856942653656006, 3.2157230377197266, 3.5457515716552734, 3.8757803440093994, 4.205809116363525, 4.535837650299072, 4.865866661071777, 5.195895195007324, 5.525923728942871, 5.855952739715576, 6.185981273651123, 6.516010284423828, 6.846038818359375, 7.176067352294922, 7.506095886230469, 7.836124897003174, 8.166153907775879, 8.496182441711426, 8.826210975646973, 9.15623950958252, 9.486268997192383, 9.81629753112793, 10.146326065063477, 10.476354598999023]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [4.0, 8.0, 6.0, 12.0, 23.0, 25.0, 40.0, 54.0, 97.0, 168.0, 274.0, 428.0, 567.0, 878.0, 1337.0, 2225.0, 3411.0, 5107.0, 7816.0, 12059.0, 18320.0, 27599.0, 42260.0, 62912.0, 92310.0, 133517.0, 186631.0, 253182.0, 326801.0, 393902.0, 439139.0, 446920.0, 414939.0, 354020.0, 280631.0, 211098.0, 152485.0, 106177.0, 72942.0, 49233.0, 32260.0, 21848.0, 13912.0, 9353.0, 6115.0, 3919.0, 2552.0, 1720.0, 1110.0, 721.0, 427.0, 305.0, 186.0, 110.0, 73.0, 53.0, 34.0, 24.0, 10.0, 8.0, 0.0, 4.0, 1.0, 2.0], "bins": [-7.45703125, -7.21795654296875, -6.9788818359375, -6.73980712890625, -6.500732421875, -6.26165771484375, -6.0225830078125, -5.78350830078125, -5.54443359375, -5.30535888671875, -5.0662841796875, -4.82720947265625, -4.588134765625, -4.34906005859375, -4.1099853515625, -3.87091064453125, -3.6318359375, -3.39276123046875, -3.1536865234375, -2.91461181640625, -2.675537109375, -2.43646240234375, -2.1973876953125, -1.95831298828125, -1.71923828125, -1.48016357421875, -1.2410888671875, -1.00201416015625, -0.762939453125, -0.52386474609375, -0.2847900390625, -0.04571533203125, 0.193359375, 0.43243408203125, 0.6715087890625, 0.91058349609375, 1.149658203125, 1.38873291015625, 1.6278076171875, 1.86688232421875, 2.10595703125, 2.34503173828125, 2.5841064453125, 2.82318115234375, 3.062255859375, 3.30133056640625, 3.5404052734375, 3.77947998046875, 4.0185546875, 4.25762939453125, 4.4967041015625, 4.73577880859375, 4.974853515625, 5.21392822265625, 5.4530029296875, 5.69207763671875, 5.93115234375, 6.17022705078125, 6.4093017578125, 6.64837646484375, 6.887451171875, 7.12652587890625, 7.3656005859375, 7.60467529296875, 7.84375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 7.0, 5.0, 7.0, 3.0, 16.0, 11.0, 14.0, 11.0, 13.0, 20.0, 24.0, 20.0, 23.0, 28.0, 33.0, 32.0, 34.0, 37.0, 46.0, 37.0, 53.0, 32.0, 38.0, 40.0, 47.0, 36.0, 33.0, 43.0, 23.0, 30.0, 28.0, 27.0, 23.0, 21.0, 18.0, 14.0, 16.0, 11.0, 7.0, 7.0, 6.0, 8.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.7265625, -8.4583740234375, -8.190185546875, -7.9219970703125, -7.65380859375, -7.3856201171875, -7.117431640625, -6.8492431640625, -6.5810546875, -6.3128662109375, -6.044677734375, -5.7764892578125, -5.50830078125, -5.2401123046875, -4.971923828125, -4.7037353515625, -4.435546875, -4.1673583984375, -3.899169921875, -3.6309814453125, -3.36279296875, -3.0946044921875, -2.826416015625, -2.5582275390625, -2.2900390625, -2.0218505859375, -1.753662109375, -1.4854736328125, -1.21728515625, -0.9490966796875, -0.680908203125, -0.4127197265625, -0.14453125, 0.1236572265625, 0.391845703125, 0.6600341796875, 0.92822265625, 1.1964111328125, 1.464599609375, 1.7327880859375, 2.0009765625, 2.2691650390625, 2.537353515625, 2.8055419921875, 3.07373046875, 3.3419189453125, 3.610107421875, 3.8782958984375, 4.146484375, 4.4146728515625, 4.682861328125, 4.9510498046875, 5.21923828125, 5.4874267578125, 5.755615234375, 6.0238037109375, 6.2919921875, 6.5601806640625, 6.828369140625, 7.0965576171875, 7.36474609375, 7.6329345703125, 7.901123046875, 8.1693115234375, 8.4375]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 8.0, 9.0, 18.0, 29.0, 49.0, 76.0, 141.0, 216.0, 361.0, 617.0, 1046.0, 1672.0, 2845.0, 4583.0, 7457.0, 11930.0, 19071.0, 29816.0, 45279.0, 68769.0, 100653.0, 142537.0, 194644.0, 256983.0, 320425.0, 375054.0, 413644.0, 421271.0, 397908.0, 348375.0, 286333.0, 222656.0, 166025.0, 118230.0, 81797.0, 55477.0, 36400.0, 23242.0, 14591.0, 9244.0, 5832.0, 3534.0, 2188.0, 1288.0, 776.0, 533.0, 254.0, 146.0, 115.0, 50.0, 45.0, 16.0, 15.0, 13.0, 5.0, 1.0, 2.0, 1.0], "bins": [-8.0625, -7.81988525390625, -7.5772705078125, -7.33465576171875, -7.092041015625, -6.84942626953125, -6.6068115234375, -6.36419677734375, -6.12158203125, -5.87896728515625, -5.6363525390625, -5.39373779296875, -5.151123046875, -4.90850830078125, -4.6658935546875, -4.42327880859375, -4.1806640625, -3.93804931640625, -3.6954345703125, -3.45281982421875, -3.210205078125, -2.96759033203125, -2.7249755859375, -2.48236083984375, -2.23974609375, -1.99713134765625, -1.7545166015625, -1.51190185546875, -1.269287109375, -1.02667236328125, -0.7840576171875, -0.54144287109375, -0.298828125, -0.05621337890625, 0.1864013671875, 0.42901611328125, 0.671630859375, 0.91424560546875, 1.1568603515625, 1.39947509765625, 1.64208984375, 1.88470458984375, 2.1273193359375, 2.36993408203125, 2.612548828125, 2.85516357421875, 3.0977783203125, 3.34039306640625, 3.5830078125, 3.82562255859375, 4.0682373046875, 4.31085205078125, 4.553466796875, 4.79608154296875, 5.0386962890625, 5.28131103515625, 5.52392578125, 5.76654052734375, 6.0091552734375, 6.25177001953125, 6.494384765625, 6.73699951171875, 6.9796142578125, 7.22222900390625, 7.46484375]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 9.0, 6.0, 8.0, 9.0, 13.0, 20.0, 17.0, 15.0, 31.0, 49.0, 42.0, 44.0, 50.0, 75.0, 76.0, 83.0, 102.0, 110.0, 138.0, 132.0, 159.0, 169.0, 183.0, 194.0, 193.0, 180.0, 179.0, 179.0, 160.0, 163.0, 182.0, 145.0, 121.0, 129.0, 111.0, 94.0, 82.0, 86.0, 70.0, 44.0, 34.0, 39.0, 25.0, 20.0, 22.0, 20.0, 16.0, 13.0, 11.0, 4.0, 4.0, 3.0, 6.0, 6.0, 6.0, 1.0, 1.0, 2.0], "bins": [-3.6640625, -3.548553466796875, -3.43304443359375, -3.317535400390625, -3.2020263671875, -3.086517333984375, -2.97100830078125, -2.855499267578125, -2.739990234375, -2.624481201171875, -2.50897216796875, -2.393463134765625, -2.2779541015625, -2.162445068359375, -2.04693603515625, -1.931427001953125, -1.81591796875, -1.700408935546875, -1.58489990234375, -1.469390869140625, -1.3538818359375, -1.238372802734375, -1.12286376953125, -1.007354736328125, -0.891845703125, -0.776336669921875, -0.66082763671875, -0.545318603515625, -0.4298095703125, -0.314300537109375, -0.19879150390625, -0.083282470703125, 0.0322265625, 0.147735595703125, 0.26324462890625, 0.378753662109375, 0.4942626953125, 0.609771728515625, 0.72528076171875, 0.840789794921875, 0.956298828125, 1.071807861328125, 1.18731689453125, 1.302825927734375, 1.4183349609375, 1.533843994140625, 1.64935302734375, 1.764862060546875, 1.88037109375, 1.995880126953125, 2.11138916015625, 2.226898193359375, 2.3424072265625, 2.457916259765625, 2.57342529296875, 2.688934326171875, 2.804443359375, 2.919952392578125, 3.03546142578125, 3.150970458984375, 3.2664794921875, 3.381988525390625, 3.49749755859375, 3.613006591796875, 3.728515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 0.0, 7.0, 6.0, 6.0, 9.0, 13.0, 16.0, 25.0, 23.0, 19.0, 28.0, 25.0, 30.0, 28.0, 34.0, 39.0, 53.0, 46.0, 51.0, 46.0, 48.0, 44.0, 36.0, 35.0, 43.0, 35.0, 30.0, 32.0, 43.0, 30.0, 14.0, 13.0, 20.0, 16.0, 9.0, 8.0, 14.0, 5.0, 6.0, 7.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.409661293029785, -10.067312240600586, -9.724963188171387, -9.382614135742188, -9.040265083312988, -8.697916030883789, -8.355566024780273, -8.01321792602539, -7.670868396759033, -7.328519344329834, -6.986170291900635, -6.643820762634277, -6.301471710205078, -5.959122657775879, -5.61677360534668, -5.2744245529174805, -4.932075500488281, -4.589726448059082, -4.247377395629883, -3.9050281047821045, -3.5626790523529053, -3.220329999923706, -2.8779807090759277, -2.5356316566467285, -2.1932826042175293, -1.85093355178833, -1.5085843801498413, -1.1662352085113525, -0.8238861560821533, -0.4815371036529541, -0.13918781280517578, 0.20316123962402344, 0.5455093383789062, 0.8878584504127502, 1.2302075624465942, 1.572556734085083, 1.9149057865142822, 2.2572548389434814, 2.5996041297912598, 2.941953182220459, 3.284302234649658, 3.6266512870788574, 3.9690003395080566, 4.311349868774414, 4.653698921203613, 4.9960479736328125, 5.338397026062012, 5.680746078491211, 6.02309513092041, 6.365444183349609, 6.707793235778809, 7.050142288208008, 7.392491340637207, 7.734840393066406, 8.077190399169922, 8.419538497924805, 8.76188850402832, 9.10423755645752, 9.446586608886719, 9.788935661315918, 10.131284713745117, 10.473633766174316, 10.815982818603516, 11.158332824707031, 11.500680923461914]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 11.0, 9.0, 7.0, 9.0, 9.0, 13.0, 14.0, 11.0, 13.0, 13.0, 21.0, 22.0, 27.0, 29.0, 28.0, 43.0, 38.0, 30.0, 40.0, 42.0, 32.0, 42.0, 26.0, 47.0, 38.0, 36.0, 41.0, 32.0, 35.0, 27.0, 33.0, 19.0, 26.0, 25.0, 12.0, 10.0, 17.0, 11.0, 15.0, 9.0, 4.0, 10.0, 6.0, 5.0, 5.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.375836372375488, -9.074422836303711, -8.773009300231934, -8.471595764160156, -8.170182228088379, -7.868768692016602, -7.567354679107666, -7.265941143035889, -6.964527606964111, -6.663114070892334, -6.361700534820557, -6.060286998748779, -5.758872985839844, -5.457459449768066, -5.156045913696289, -4.854632377624512, -4.553218841552734, -4.251805305480957, -3.9503917694091797, -3.6489779949188232, -3.347564458847046, -3.0461509227752686, -2.744737148284912, -2.4433236122131348, -2.1419100761413574, -1.84049654006958, -1.5390828847885132, -1.2376692295074463, -0.936255693435669, -0.6348421573638916, -0.3334285020828247, -0.03201484680175781, 0.2693977355957031, 0.5708113312721252, 0.8722249269485474, 1.1736385822296143, 1.4750521183013916, 1.776465654373169, 2.0778794288635254, 2.3792929649353027, 2.68070650100708, 2.9821200370788574, 3.2835335731506348, 3.584947347640991, 3.8863608837127686, 4.187774658203125, 4.489188194274902, 4.79060173034668, 5.092015266418457, 5.393428802490234, 5.694842338562012, 5.996255874633789, 6.297669410705566, 6.599082946777344, 6.900496959686279, 7.201910495758057, 7.503324031829834, 7.804737567901611, 8.106151580810547, 8.407565116882324, 8.708978652954102, 9.010392189025879, 9.311805725097656, 9.613219261169434, 9.914632797241211]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 7.0, 10.0, 14.0, 23.0, 35.0, 41.0, 50.0, 94.0, 131.0, 194.0, 269.0, 408.0, 628.0, 1006.0, 1616.0, 2706.0, 4399.0, 7418.0, 12953.0, 23002.0, 41927.0, 74379.0, 127960.0, 192461.0, 206557.0, 147292.0, 88160.0, 49369.0, 27927.0, 15379.0, 8789.0, 5104.0, 3062.0, 1864.0, 1137.0, 743.0, 463.0, 323.0, 198.0, 127.0, 112.0, 64.0, 45.0, 25.0, 26.0, 14.0, 13.0, 13.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.91015625, -5.726318359375, -5.54248046875, -5.358642578125, -5.1748046875, -4.990966796875, -4.80712890625, -4.623291015625, -4.439453125, -4.255615234375, -4.07177734375, -3.887939453125, -3.7041015625, -3.520263671875, -3.33642578125, -3.152587890625, -2.96875, -2.784912109375, -2.60107421875, -2.417236328125, -2.2333984375, -2.049560546875, -1.86572265625, -1.681884765625, -1.498046875, -1.314208984375, -1.13037109375, -0.946533203125, -0.7626953125, -0.578857421875, -0.39501953125, -0.211181640625, -0.02734375, 0.156494140625, 0.34033203125, 0.524169921875, 0.7080078125, 0.891845703125, 1.07568359375, 1.259521484375, 1.443359375, 1.627197265625, 1.81103515625, 1.994873046875, 2.1787109375, 2.362548828125, 2.54638671875, 2.730224609375, 2.9140625, 3.097900390625, 3.28173828125, 3.465576171875, 3.6494140625, 3.833251953125, 4.01708984375, 4.200927734375, 4.384765625, 4.568603515625, 4.75244140625, 4.936279296875, 5.1201171875, 5.303955078125, 5.48779296875, 5.671630859375, 5.85546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 0.0, 2.0, 8.0, 7.0, 11.0, 6.0, 11.0, 11.0, 12.0, 15.0, 13.0, 12.0, 18.0, 20.0, 27.0, 28.0, 26.0, 33.0, 44.0, 36.0, 32.0, 43.0, 38.0, 35.0, 32.0, 45.0, 36.0, 38.0, 32.0, 38.0, 43.0, 17.0, 39.0, 23.0, 20.0, 32.0, 17.0, 10.0, 16.0, 10.0, 9.0, 18.0, 3.0, 10.0, 6.0, 4.0, 6.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.40625, -9.1070556640625, -8.807861328125, -8.5086669921875, -8.20947265625, -7.9102783203125, -7.611083984375, -7.3118896484375, -7.0126953125, -6.7135009765625, -6.414306640625, -6.1151123046875, -5.81591796875, -5.5167236328125, -5.217529296875, -4.9183349609375, -4.619140625, -4.3199462890625, -4.020751953125, -3.7215576171875, -3.42236328125, -3.1231689453125, -2.823974609375, -2.5247802734375, -2.2255859375, -1.9263916015625, -1.627197265625, -1.3280029296875, -1.02880859375, -0.7296142578125, -0.430419921875, -0.1312255859375, 0.16796875, 0.4671630859375, 0.766357421875, 1.0655517578125, 1.36474609375, 1.6639404296875, 1.963134765625, 2.2623291015625, 2.5615234375, 2.8607177734375, 3.159912109375, 3.4591064453125, 3.75830078125, 4.0574951171875, 4.356689453125, 4.6558837890625, 4.955078125, 5.2542724609375, 5.553466796875, 5.8526611328125, 6.15185546875, 6.4510498046875, 6.750244140625, 7.0494384765625, 7.3486328125, 7.6478271484375, 7.947021484375, 8.2462158203125, 8.54541015625, 8.8446044921875, 9.143798828125, 9.4429931640625, 9.7421875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 4.0, 6.0, 4.0, 12.0, 13.0, 22.0, 29.0, 24.0, 44.0, 54.0, 107.0, 106.0, 187.0, 204.0, 344.0, 448.0, 735.0, 1104.0, 1696.0, 2875.0, 5255.0, 10107.0, 21708.0, 52899.0, 138308.0, 326922.0, 287885.0, 113979.0, 44023.0, 18713.0, 8803.0, 4702.0, 2608.0, 1580.0, 932.0, 636.0, 462.0, 267.0, 193.0, 143.0, 117.0, 84.0, 62.0, 32.0, 28.0, 20.0, 21.0, 13.0, 12.0, 7.0, 6.0, 6.0, 3.0, 1.0, 1.0, 2.0, 3.0], "bins": [-6.21875, -6.02972412109375, -5.8406982421875, -5.65167236328125, -5.462646484375, -5.27362060546875, -5.0845947265625, -4.89556884765625, -4.70654296875, -4.51751708984375, -4.3284912109375, -4.13946533203125, -3.950439453125, -3.76141357421875, -3.5723876953125, -3.38336181640625, -3.1943359375, -3.00531005859375, -2.8162841796875, -2.62725830078125, -2.438232421875, -2.24920654296875, -2.0601806640625, -1.87115478515625, -1.68212890625, -1.49310302734375, -1.3040771484375, -1.11505126953125, -0.926025390625, -0.73699951171875, -0.5479736328125, -0.35894775390625, -0.169921875, 0.01910400390625, 0.2081298828125, 0.39715576171875, 0.586181640625, 0.77520751953125, 0.9642333984375, 1.15325927734375, 1.34228515625, 1.53131103515625, 1.7203369140625, 1.90936279296875, 2.098388671875, 2.28741455078125, 2.4764404296875, 2.66546630859375, 2.8544921875, 3.04351806640625, 3.2325439453125, 3.42156982421875, 3.610595703125, 3.79962158203125, 3.9886474609375, 4.17767333984375, 4.36669921875, 4.55572509765625, 4.7447509765625, 4.93377685546875, 5.122802734375, 5.31182861328125, 5.5008544921875, 5.68988037109375, 5.87890625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 0.0, 4.0, 6.0, 3.0, 8.0, 8.0, 12.0, 9.0, 14.0, 9.0, 25.0, 14.0, 27.0, 28.0, 32.0, 27.0, 43.0, 39.0, 37.0, 27.0, 28.0, 44.0, 38.0, 40.0, 41.0, 39.0, 44.0, 32.0, 30.0, 29.0, 32.0, 25.0, 41.0, 29.0, 19.0, 20.0, 17.0, 15.0, 10.0, 12.0, 13.0, 7.0, 7.0, 5.0, 1.0, 6.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0], "bins": [-7.19140625, -6.98876953125, -6.7861328125, -6.58349609375, -6.380859375, -6.17822265625, -5.9755859375, -5.77294921875, -5.5703125, -5.36767578125, -5.1650390625, -4.96240234375, -4.759765625, -4.55712890625, -4.3544921875, -4.15185546875, -3.94921875, -3.74658203125, -3.5439453125, -3.34130859375, -3.138671875, -2.93603515625, -2.7333984375, -2.53076171875, -2.328125, -2.12548828125, -1.9228515625, -1.72021484375, -1.517578125, -1.31494140625, -1.1123046875, -0.90966796875, -0.70703125, -0.50439453125, -0.3017578125, -0.09912109375, 0.103515625, 0.30615234375, 0.5087890625, 0.71142578125, 0.9140625, 1.11669921875, 1.3193359375, 1.52197265625, 1.724609375, 1.92724609375, 2.1298828125, 2.33251953125, 2.53515625, 2.73779296875, 2.9404296875, 3.14306640625, 3.345703125, 3.54833984375, 3.7509765625, 3.95361328125, 4.15625, 4.35888671875, 4.5615234375, 4.76416015625, 4.966796875, 5.16943359375, 5.3720703125, 5.57470703125, 5.77734375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 6.0, 4.0, 15.0, 16.0, 16.0, 36.0, 45.0, 73.0, 88.0, 141.0, 216.0, 353.0, 627.0, 1022.0, 2215.0, 5910.0, 27348.0, 898733.0, 95816.0, 9461.0, 3174.0, 1345.0, 744.0, 397.0, 254.0, 151.0, 100.0, 69.0, 51.0, 38.0, 27.0, 20.0, 10.0, 6.0, 4.0, 11.0, 6.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3046875, -10.924072265625, -10.54345703125, -10.162841796875, -9.7822265625, -9.401611328125, -9.02099609375, -8.640380859375, -8.259765625, -7.879150390625, -7.49853515625, -7.117919921875, -6.7373046875, -6.356689453125, -5.97607421875, -5.595458984375, -5.21484375, -4.834228515625, -4.45361328125, -4.072998046875, -3.6923828125, -3.311767578125, -2.93115234375, -2.550537109375, -2.169921875, -1.789306640625, -1.40869140625, -1.028076171875, -0.6474609375, -0.266845703125, 0.11376953125, 0.494384765625, 0.875, 1.255615234375, 1.63623046875, 2.016845703125, 2.3974609375, 2.778076171875, 3.15869140625, 3.539306640625, 3.919921875, 4.300537109375, 4.68115234375, 5.061767578125, 5.4423828125, 5.822998046875, 6.20361328125, 6.584228515625, 6.96484375, 7.345458984375, 7.72607421875, 8.106689453125, 8.4873046875, 8.867919921875, 9.24853515625, 9.629150390625, 10.009765625, 10.390380859375, 10.77099609375, 11.151611328125, 11.5322265625, 11.912841796875, 12.29345703125, 12.674072265625, 13.0546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 5.0, 13.0, 19.0, 30.0, 83.0, 133.0, 215.0, 216.0, 131.0, 80.0, 33.0, 17.0, 13.0, 3.0, 2.0, 7.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001346588134765625, -0.001316666603088379, -0.0012867450714111328, -0.0012568235397338867, -0.0012269020080566406, -0.0011969804763793945, -0.0011670589447021484, -0.0011371374130249023, -0.0011072158813476562, -0.0010772943496704102, -0.001047372817993164, -0.001017451286315918, -0.0009875297546386719, -0.0009576082229614258, -0.0009276866912841797, -0.0008977651596069336, -0.0008678436279296875, -0.0008379220962524414, -0.0008080005645751953, -0.0007780790328979492, -0.0007481575012207031, -0.000718235969543457, -0.0006883144378662109, -0.0006583929061889648, -0.0006284713745117188, -0.0005985498428344727, -0.0005686283111572266, -0.0005387067794799805, -0.0005087852478027344, -0.0004788637161254883, -0.0004489421844482422, -0.0004190206527709961, -0.00038909912109375, -0.0003591775894165039, -0.0003292560577392578, -0.0002993345260620117, -0.0002694129943847656, -0.00023949146270751953, -0.00020956993103027344, -0.00017964839935302734, -0.00014972686767578125, -0.00011980533599853516, -8.988380432128906e-05, -5.996227264404297e-05, -3.0040740966796875e-05, -1.1920928955078125e-07, 2.9802322387695312e-05, 5.9723854064941406e-05, 8.96453857421875e-05, 0.0001195669174194336, 0.0001494884490966797, 0.00017940998077392578, 0.00020933151245117188, 0.00023925304412841797, 0.00026917457580566406, 0.00029909610748291016, 0.00032901763916015625, 0.00035893917083740234, 0.00038886070251464844, 0.00041878223419189453, 0.0004487037658691406, 0.0004786252975463867, 0.0005085468292236328, 0.0005384683609008789, 0.000568389892578125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 9.0, 7.0, 15.0, 12.0, 25.0, 30.0, 36.0, 54.0, 72.0, 118.0, 139.0, 233.0, 317.0, 459.0, 677.0, 1049.0, 1704.0, 2889.0, 5776.0, 14047.0, 48201.0, 312295.0, 532760.0, 89563.0, 20836.0, 7673.0, 3705.0, 2063.0, 1281.0, 787.0, 517.0, 358.0, 273.0, 166.0, 105.0, 79.0, 50.0, 45.0, 34.0, 27.0, 21.0, 15.0, 15.0, 9.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.203125, -8.92578125, -8.6484375, -8.37109375, -8.09375, -7.81640625, -7.5390625, -7.26171875, -6.984375, -6.70703125, -6.4296875, -6.15234375, -5.875, -5.59765625, -5.3203125, -5.04296875, -4.765625, -4.48828125, -4.2109375, -3.93359375, -3.65625, -3.37890625, -3.1015625, -2.82421875, -2.546875, -2.26953125, -1.9921875, -1.71484375, -1.4375, -1.16015625, -0.8828125, -0.60546875, -0.328125, -0.05078125, 0.2265625, 0.50390625, 0.78125, 1.05859375, 1.3359375, 1.61328125, 1.890625, 2.16796875, 2.4453125, 2.72265625, 3.0, 3.27734375, 3.5546875, 3.83203125, 4.109375, 4.38671875, 4.6640625, 4.94140625, 5.21875, 5.49609375, 5.7734375, 6.05078125, 6.328125, 6.60546875, 6.8828125, 7.16015625, 7.4375, 7.71484375, 7.9921875, 8.26953125, 8.546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 10.0, 10.0, 12.0, 18.0, 15.0, 35.0, 33.0, 64.0, 83.0, 123.0, 129.0, 146.0, 93.0, 63.0, 51.0, 39.0, 20.0, 14.0, 11.0, 7.0, 1.0, 6.0, 3.0, 2.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.083984375, -2.0205078125, -1.95703125, -1.8935546875, -1.830078125, -1.7666015625, -1.703125, -1.6396484375, -1.576171875, -1.5126953125, -1.44921875, -1.3857421875, -1.322265625, -1.2587890625, -1.1953125, -1.1318359375, -1.068359375, -1.0048828125, -0.94140625, -0.8779296875, -0.814453125, -0.7509765625, -0.6875, -0.6240234375, -0.560546875, -0.4970703125, -0.43359375, -0.3701171875, -0.306640625, -0.2431640625, -0.1796875, -0.1162109375, -0.052734375, 0.0107421875, 0.07421875, 0.1376953125, 0.201171875, 0.2646484375, 0.328125, 0.3916015625, 0.455078125, 0.5185546875, 0.58203125, 0.6455078125, 0.708984375, 0.7724609375, 0.8359375, 0.8994140625, 0.962890625, 1.0263671875, 1.08984375, 1.1533203125, 1.216796875, 1.2802734375, 1.34375, 1.4072265625, 1.470703125, 1.5341796875, 1.59765625, 1.6611328125, 1.724609375, 1.7880859375, 1.8515625, 1.9150390625, 1.978515625]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 5.0, 3.0, 1.0, 7.0, 7.0, 7.0, 12.0, 17.0, 19.0, 21.0, 18.0, 36.0, 30.0, 40.0, 32.0, 42.0, 43.0, 42.0, 50.0, 43.0, 55.0, 56.0, 47.0, 40.0, 40.0, 31.0, 34.0, 42.0, 34.0, 32.0, 15.0, 22.0, 12.0, 18.0, 17.0, 5.0, 5.0, 11.0, 8.0, 3.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.436753273010254, -10.071313858032227, -9.7058744430542, -9.340435028076172, -8.974996566772461, -8.609557151794434, -8.244117736816406, -7.878678321838379, -7.51323938369751, -7.147799968719482, -6.782361030578613, -6.416921615600586, -6.051482200622559, -5.6860432624816895, -5.320603847503662, -4.955164909362793, -4.589725494384766, -4.224286079406738, -3.858847141265869, -3.493407726287842, -3.1279685497283936, -2.7625293731689453, -2.397089958190918, -2.0316507816314697, -1.6662116050720215, -1.3007724285125732, -0.9353331327438354, -0.5698938369750977, -0.20445466041564941, 0.16098451614379883, 0.5264239311218262, 0.8918631076812744, 1.2573022842407227, 1.622741460800171, 1.9881807565689087, 2.3536200523376465, 2.7190592288970947, 3.084498405456543, 3.4499378204345703, 3.8153769969940186, 4.180816173553467, 4.546255588531494, 4.911694526672363, 5.277133941650391, 5.642573356628418, 6.008012294769287, 6.3734517097473145, 6.738890647888184, 7.104330062866211, 7.469769477844238, 7.835208415985107, 8.200647354125977, 8.566086769104004, 8.931526184082031, 9.296965599060059, 9.662405014038086, 10.027843475341797, 10.393282890319824, 10.758722305297852, 11.124160766601562, 11.48960018157959, 11.855039596557617, 12.220479011535645, 12.585918426513672, 12.9513578414917]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 8.0, 10.0, 6.0, 6.0, 10.0, 9.0, 21.0, 10.0, 9.0, 17.0, 18.0, 20.0, 25.0, 33.0, 26.0, 34.0, 34.0, 45.0, 35.0, 40.0, 28.0, 41.0, 38.0, 34.0, 45.0, 32.0, 31.0, 39.0, 34.0, 37.0, 32.0, 17.0, 24.0, 27.0, 13.0, 10.0, 20.0, 12.0, 11.0, 13.0, 8.0, 7.0, 7.0, 6.0, 2.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-9.277950286865234, -8.9810209274292, -8.684091567993164, -8.387163162231445, -8.09023380279541, -7.793304443359375, -7.49637508392334, -7.199445724487305, -6.902516841888428, -6.605587482452393, -6.308658599853516, -6.0117292404174805, -5.714799880981445, -5.417870998382568, -5.120941638946533, -4.824012756347656, -4.527083396911621, -4.230154037475586, -3.933225154876709, -3.636295795440674, -3.3393666744232178, -3.0424375534057617, -2.7455081939697266, -2.4485790729522705, -2.1516499519348145, -1.8547208309173584, -1.5577915906906128, -1.2608623504638672, -0.9639332294464111, -0.6670041084289551, -0.3700748682022095, -0.07314562797546387, 0.2237834930419922, 0.520712673664093, 0.8176418542861938, 1.1145710945129395, 1.4115002155303955, 1.7084293365478516, 2.0053586959838867, 2.3022878170013428, 2.599216938018799, 2.896146059036255, 3.193075180053711, 3.490004539489746, 3.786933660507202, 4.083862781524658, 4.380792140960693, 4.67772102355957, 4.9746503829956055, 5.271579742431641, 5.568508625030518, 5.865437984466553, 6.16236686706543, 6.459296226501465, 6.7562255859375, 7.053154945373535, 7.350083827972412, 7.647013187408447, 7.943942070007324, 8.24087142944336, 8.537800788879395, 8.83473014831543, 9.131658554077148, 9.428587913513184, 9.725517272949219]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 10.0, 19.0, 41.0, 64.0, 87.0, 140.0, 201.0, 308.0, 512.0, 808.0, 1218.0, 1875.0, 2797.0, 4252.0, 6347.0, 9439.0, 13961.0, 19428.0, 27074.0, 36860.0, 48352.0, 60769.0, 72483.0, 83123.0, 90918.0, 93244.0, 90123.0, 82869.0, 71880.0, 59426.0, 47097.0, 36006.0, 26697.0, 19235.0, 13383.0, 9374.0, 6214.0, 4206.0, 2739.0, 1805.0, 1174.0, 717.0, 465.0, 279.0, 189.0, 122.0, 81.0, 54.0, 35.0, 17.0, 15.0, 9.0, 6.0, 7.0, 0.0, 1.0], "bins": [-8.484375, -8.2308349609375, -7.977294921875, -7.7237548828125, -7.47021484375, -7.2166748046875, -6.963134765625, -6.7095947265625, -6.4560546875, -6.2025146484375, -5.948974609375, -5.6954345703125, -5.44189453125, -5.1883544921875, -4.934814453125, -4.6812744140625, -4.427734375, -4.1741943359375, -3.920654296875, -3.6671142578125, -3.41357421875, -3.1600341796875, -2.906494140625, -2.6529541015625, -2.3994140625, -2.1458740234375, -1.892333984375, -1.6387939453125, -1.38525390625, -1.1317138671875, -0.878173828125, -0.6246337890625, -0.37109375, -0.1175537109375, 0.135986328125, 0.3895263671875, 0.64306640625, 0.8966064453125, 1.150146484375, 1.4036865234375, 1.6572265625, 1.9107666015625, 2.164306640625, 2.4178466796875, 2.67138671875, 2.9249267578125, 3.178466796875, 3.4320068359375, 3.685546875, 3.9390869140625, 4.192626953125, 4.4461669921875, 4.69970703125, 4.9532470703125, 5.206787109375, 5.4603271484375, 5.7138671875, 5.9674072265625, 6.220947265625, 6.4744873046875, 6.72802734375, 6.9815673828125, 7.235107421875, 7.4886474609375, 7.7421875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 11.0, 8.0, 6.0, 9.0, 10.0, 14.0, 14.0, 11.0, 14.0, 19.0, 18.0, 30.0, 27.0, 24.0, 30.0, 43.0, 37.0, 39.0, 38.0, 30.0, 33.0, 36.0, 40.0, 44.0, 37.0, 30.0, 35.0, 36.0, 30.0, 42.0, 21.0, 22.0, 28.0, 15.0, 11.0, 16.0, 14.0, 12.0, 13.0, 6.0, 12.0, 2.0, 9.0, 3.0, 3.0, 6.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-9.0, -8.7154541015625, -8.430908203125, -8.1463623046875, -7.86181640625, -7.5772705078125, -7.292724609375, -7.0081787109375, -6.7236328125, -6.4390869140625, -6.154541015625, -5.8699951171875, -5.58544921875, -5.3009033203125, -5.016357421875, -4.7318115234375, -4.447265625, -4.1627197265625, -3.878173828125, -3.5936279296875, -3.30908203125, -3.0245361328125, -2.739990234375, -2.4554443359375, -2.1708984375, -1.8863525390625, -1.601806640625, -1.3172607421875, -1.03271484375, -0.7481689453125, -0.463623046875, -0.1790771484375, 0.10546875, 0.3900146484375, 0.674560546875, 0.9591064453125, 1.24365234375, 1.5281982421875, 1.812744140625, 2.0972900390625, 2.3818359375, 2.6663818359375, 2.950927734375, 3.2354736328125, 3.52001953125, 3.8045654296875, 4.089111328125, 4.3736572265625, 4.658203125, 4.9427490234375, 5.227294921875, 5.5118408203125, 5.79638671875, 6.0809326171875, 6.365478515625, 6.6500244140625, 6.9345703125, 7.2191162109375, 7.503662109375, 7.7882080078125, 8.07275390625, 8.3572998046875, 8.641845703125, 8.9263916015625, 9.2109375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 8.0, 7.0, 8.0, 11.0, 27.0, 38.0, 60.0, 90.0, 140.0, 240.0, 327.0, 567.0, 819.0, 1365.0, 2220.0, 3527.0, 5717.0, 8914.0, 13969.0, 21477.0, 32081.0, 46422.0, 63612.0, 83237.0, 100286.0, 112366.0, 114792.0, 106842.0, 91504.0, 72886.0, 54192.0, 37753.0, 25989.0, 17100.0, 11247.0, 6954.0, 4423.0, 2669.0, 1777.0, 1032.0, 679.0, 406.0, 295.0, 172.0, 120.0, 77.0, 52.0, 32.0, 15.0, 9.0, 8.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.8828125, -10.545166015625, -10.20751953125, -9.869873046875, -9.5322265625, -9.194580078125, -8.85693359375, -8.519287109375, -8.181640625, -7.843994140625, -7.50634765625, -7.168701171875, -6.8310546875, -6.493408203125, -6.15576171875, -5.818115234375, -5.48046875, -5.142822265625, -4.80517578125, -4.467529296875, -4.1298828125, -3.792236328125, -3.45458984375, -3.116943359375, -2.779296875, -2.441650390625, -2.10400390625, -1.766357421875, -1.4287109375, -1.091064453125, -0.75341796875, -0.415771484375, -0.078125, 0.259521484375, 0.59716796875, 0.934814453125, 1.2724609375, 1.610107421875, 1.94775390625, 2.285400390625, 2.623046875, 2.960693359375, 3.29833984375, 3.635986328125, 3.9736328125, 4.311279296875, 4.64892578125, 4.986572265625, 5.32421875, 5.661865234375, 5.99951171875, 6.337158203125, 6.6748046875, 7.012451171875, 7.35009765625, 7.687744140625, 8.025390625, 8.363037109375, 8.70068359375, 9.038330078125, 9.3759765625, 9.713623046875, 10.05126953125, 10.388916015625, 10.7265625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 6.0, 4.0, 4.0, 6.0, 12.0, 13.0, 15.0, 9.0, 22.0, 14.0, 24.0, 24.0, 19.0, 28.0, 34.0, 34.0, 31.0, 32.0, 33.0, 48.0, 34.0, 46.0, 44.0, 40.0, 36.0, 36.0, 26.0, 36.0, 27.0, 33.0, 31.0, 29.0, 28.0, 19.0, 17.0, 19.0, 14.0, 12.0, 8.0, 10.0, 8.0, 9.0, 7.0, 5.0, 4.0, 1.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.609375, -6.41082763671875, -6.2122802734375, -6.01373291015625, -5.815185546875, -5.61663818359375, -5.4180908203125, -5.21954345703125, -5.02099609375, -4.82244873046875, -4.6239013671875, -4.42535400390625, -4.226806640625, -4.02825927734375, -3.8297119140625, -3.63116455078125, -3.4326171875, -3.23406982421875, -3.0355224609375, -2.83697509765625, -2.638427734375, -2.43988037109375, -2.2413330078125, -2.04278564453125, -1.84423828125, -1.64569091796875, -1.4471435546875, -1.24859619140625, -1.050048828125, -0.85150146484375, -0.6529541015625, -0.45440673828125, -0.255859375, -0.05731201171875, 0.1412353515625, 0.33978271484375, 0.538330078125, 0.73687744140625, 0.9354248046875, 1.13397216796875, 1.33251953125, 1.53106689453125, 1.7296142578125, 1.92816162109375, 2.126708984375, 2.32525634765625, 2.5238037109375, 2.72235107421875, 2.9208984375, 3.11944580078125, 3.3179931640625, 3.51654052734375, 3.715087890625, 3.91363525390625, 4.1121826171875, 4.31072998046875, 4.50927734375, 4.70782470703125, 4.9063720703125, 5.10491943359375, 5.303466796875, 5.50201416015625, 5.7005615234375, 5.89910888671875, 6.09765625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 11.0, 9.0, 23.0, 34.0, 44.0, 73.0, 121.0, 178.0, 260.0, 402.0, 665.0, 1144.0, 1770.0, 2723.0, 4445.0, 7170.0, 11722.0, 18839.0, 29577.0, 46539.0, 69226.0, 96975.0, 121857.0, 137063.0, 133228.0, 112702.0, 85818.0, 60054.0, 39432.0, 24937.0, 15793.0, 9864.0, 5961.0, 3645.0, 2306.0, 1480.0, 899.0, 551.0, 348.0, 263.0, 143.0, 87.0, 71.0, 41.0, 26.0, 9.0, 11.0, 9.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.2421875, -4.10882568359375, -3.9754638671875, -3.84210205078125, -3.708740234375, -3.57537841796875, -3.4420166015625, -3.30865478515625, -3.17529296875, -3.04193115234375, -2.9085693359375, -2.77520751953125, -2.641845703125, -2.50848388671875, -2.3751220703125, -2.24176025390625, -2.1083984375, -1.97503662109375, -1.8416748046875, -1.70831298828125, -1.574951171875, -1.44158935546875, -1.3082275390625, -1.17486572265625, -1.04150390625, -0.90814208984375, -0.7747802734375, -0.64141845703125, -0.508056640625, -0.37469482421875, -0.2413330078125, -0.10797119140625, 0.025390625, 0.15875244140625, 0.2921142578125, 0.42547607421875, 0.558837890625, 0.69219970703125, 0.8255615234375, 0.95892333984375, 1.09228515625, 1.22564697265625, 1.3590087890625, 1.49237060546875, 1.625732421875, 1.75909423828125, 1.8924560546875, 2.02581787109375, 2.1591796875, 2.29254150390625, 2.4259033203125, 2.55926513671875, 2.692626953125, 2.82598876953125, 2.9593505859375, 3.09271240234375, 3.22607421875, 3.35943603515625, 3.4927978515625, 3.62615966796875, 3.759521484375, 3.89288330078125, 4.0262451171875, 4.15960693359375, 4.29296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 5.0, 10.0, 5.0, 15.0, 14.0, 13.0, 18.0, 25.0, 25.0, 42.0, 59.0, 49.0, 43.0, 40.0, 58.0, 62.0, 51.0, 76.0, 60.0, 44.0, 41.0, 36.0, 44.0, 33.0, 29.0, 29.0, 21.0, 13.0, 11.0, 3.0, 7.0, 4.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005974769592285156, -0.0005784407258033752, -0.0005594044923782349, -0.0005403682589530945, -0.0005213320255279541, -0.0005022957921028137, -0.00048325955867767334, -0.00046422332525253296, -0.0004451870918273926, -0.0004261508584022522, -0.0004071146249771118, -0.00038807839155197144, -0.00036904215812683105, -0.0003500059247016907, -0.0003309696912765503, -0.0003119334578514099, -0.00029289722442626953, -0.00027386099100112915, -0.00025482475757598877, -0.0002357885241508484, -0.000216752290725708, -0.00019771605730056763, -0.00017867982387542725, -0.00015964359045028687, -0.00014060735702514648, -0.0001215711236000061, -0.00010253489017486572, -8.349865674972534e-05, -6.446242332458496e-05, -4.542618989944458e-05, -2.63899564743042e-05, -7.353723049163818e-06, 1.1682510375976562e-05, 3.071874380111694e-05, 4.9754977226257324e-05, 6.87912106513977e-05, 8.782744407653809e-05, 0.00010686367750167847, 0.00012589991092681885, 0.00014493614435195923, 0.0001639723777770996, 0.00018300861120224, 0.00020204484462738037, 0.00022108107805252075, 0.00024011731147766113, 0.0002591535449028015, 0.0002781897783279419, 0.0002972260117530823, 0.00031626224517822266, 0.00033529847860336304, 0.0003543347120285034, 0.0003733709454536438, 0.0003924071788787842, 0.00041144341230392456, 0.00043047964572906494, 0.0004495158791542053, 0.0004685521125793457, 0.0004875883460044861, 0.0005066245794296265, 0.0005256608128547668, 0.0005446970462799072, 0.0005637332797050476, 0.000582769513130188, 0.0006018057465553284, 0.0006208419799804688]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 13.0, 17.0, 24.0, 31.0, 44.0, 65.0, 111.0, 158.0, 252.0, 423.0, 732.0, 1226.0, 2093.0, 3628.0, 6381.0, 11637.0, 19699.0, 34005.0, 56310.0, 86398.0, 120801.0, 148074.0, 153431.0, 133179.0, 101518.0, 67611.0, 42225.0, 24844.0, 14331.0, 8210.0, 4678.0, 2620.0, 1487.0, 881.0, 515.0, 351.0, 183.0, 124.0, 91.0, 46.0, 21.0, 29.0, 15.0, 12.0, 11.0, 7.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.85546875, -4.7047119140625, -4.553955078125, -4.4031982421875, -4.25244140625, -4.1016845703125, -3.950927734375, -3.8001708984375, -3.6494140625, -3.4986572265625, -3.347900390625, -3.1971435546875, -3.04638671875, -2.8956298828125, -2.744873046875, -2.5941162109375, -2.443359375, -2.2926025390625, -2.141845703125, -1.9910888671875, -1.84033203125, -1.6895751953125, -1.538818359375, -1.3880615234375, -1.2373046875, -1.0865478515625, -0.935791015625, -0.7850341796875, -0.63427734375, -0.4835205078125, -0.332763671875, -0.1820068359375, -0.03125, 0.1195068359375, 0.270263671875, 0.4210205078125, 0.57177734375, 0.7225341796875, 0.873291015625, 1.0240478515625, 1.1748046875, 1.3255615234375, 1.476318359375, 1.6270751953125, 1.77783203125, 1.9285888671875, 2.079345703125, 2.2301025390625, 2.380859375, 2.5316162109375, 2.682373046875, 2.8331298828125, 2.98388671875, 3.1346435546875, 3.285400390625, 3.4361572265625, 3.5869140625, 3.7376708984375, 3.888427734375, 4.0391845703125, 4.18994140625, 4.3406982421875, 4.491455078125, 4.6422119140625, 4.79296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 12.0, 5.0, 12.0, 14.0, 11.0, 19.0, 25.0, 27.0, 27.0, 29.0, 34.0, 34.0, 41.0, 47.0, 48.0, 40.0, 56.0, 46.0, 58.0, 54.0, 50.0, 43.0, 29.0, 33.0, 26.0, 41.0, 23.0, 19.0, 11.0, 23.0, 12.0, 4.0, 11.0, 8.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.439453125, -1.3881683349609375, -1.336883544921875, -1.2855987548828125, -1.23431396484375, -1.1830291748046875, -1.131744384765625, -1.0804595947265625, -1.0291748046875, -0.9778900146484375, -0.926605224609375, -0.8753204345703125, -0.82403564453125, -0.7727508544921875, -0.721466064453125, -0.6701812744140625, -0.618896484375, -0.5676116943359375, -0.516326904296875, -0.4650421142578125, -0.41375732421875, -0.3624725341796875, -0.311187744140625, -0.2599029541015625, -0.2086181640625, -0.1573333740234375, -0.106048583984375, -0.0547637939453125, -0.00347900390625, 0.0478057861328125, 0.099090576171875, 0.1503753662109375, 0.20166015625, 0.2529449462890625, 0.304229736328125, 0.3555145263671875, 0.40679931640625, 0.4580841064453125, 0.509368896484375, 0.5606536865234375, 0.6119384765625, 0.6632232666015625, 0.714508056640625, 0.7657928466796875, 0.81707763671875, 0.8683624267578125, 0.919647216796875, 0.9709320068359375, 1.022216796875, 1.0735015869140625, 1.124786376953125, 1.1760711669921875, 1.22735595703125, 1.2786407470703125, 1.329925537109375, 1.3812103271484375, 1.4324951171875, 1.4837799072265625, 1.535064697265625, 1.5863494873046875, 1.63763427734375, 1.6889190673828125, 1.740203857421875, 1.7914886474609375, 1.8427734375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 5.0, 12.0, 8.0, 6.0, 13.0, 14.0, 14.0, 21.0, 21.0, 34.0, 35.0, 36.0, 39.0, 47.0, 43.0, 41.0, 53.0, 43.0, 57.0, 57.0, 50.0, 32.0, 36.0, 40.0, 37.0, 32.0, 26.0, 21.0, 23.0, 19.0, 14.0, 11.0, 19.0, 13.0, 6.0, 7.0, 8.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.24126148223877, -10.870044708251953, -10.498828887939453, -10.127612113952637, -9.75639533996582, -9.38517951965332, -9.013962745666504, -8.642745971679688, -8.271530151367188, -7.900313854217529, -7.529097080230713, -7.157880783081055, -6.786664009094238, -6.41544771194458, -6.044231414794922, -5.6730146408081055, -5.301797866821289, -4.930581569671631, -4.5593647956848145, -4.188148498535156, -3.816931962966919, -3.4457154273986816, -3.0744991302490234, -2.703282594680786, -2.332066059112549, -1.9608495235443115, -1.5896331071853638, -1.218416690826416, -0.8472001552581787, -0.4759836196899414, -0.1047673225402832, 0.2664492130279541, 0.6376657485961914, 1.0088822841644287, 1.3800987005233765, 1.7513151168823242, 2.1225316524505615, 2.493748188018799, 2.864964485168457, 3.2361810207366943, 3.6073975563049316, 3.978614091873169, 4.349830627441406, 4.7210469245910645, 5.092263221740723, 5.463479995727539, 5.834696292877197, 6.2059125900268555, 6.577129364013672, 6.94834566116333, 7.3195624351501465, 7.690778732299805, 8.061995506286621, 8.433212280273438, 8.804428100585938, 9.175644874572754, 9.54686164855957, 9.918078422546387, 10.289294242858887, 10.660511016845703, 11.03172779083252, 11.402944564819336, 11.774160385131836, 12.145377159118652, 12.516592979431152]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 10.0, 10.0, 12.0, 8.0, 9.0, 12.0, 20.0, 14.0, 27.0, 26.0, 30.0, 39.0, 42.0, 33.0, 22.0, 36.0, 32.0, 43.0, 39.0, 47.0, 38.0, 38.0, 43.0, 47.0, 39.0, 31.0, 26.0, 38.0, 28.0, 31.0, 19.0, 23.0, 13.0, 13.0, 12.0, 10.0, 3.0, 11.0, 2.0, 7.0, 5.0, 8.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-11.42354679107666, -11.083907127380371, -10.744266510009766, -10.404626846313477, -10.064986228942871, -9.725346565246582, -9.385705947875977, -9.046066284179688, -8.706426620483398, -8.36678695678711, -8.027146339416504, -7.687506675720215, -7.347866058349609, -7.00822639465332, -6.668586254119873, -6.328946113586426, -5.98930549621582, -5.649665355682373, -5.310025215148926, -4.970385551452637, -4.630744934082031, -4.291105270385742, -3.951465129852295, -3.6118249893188477, -3.2721848487854004, -2.932544708251953, -2.592904567718506, -2.2532646656036377, -1.9136245250701904, -1.5739843845367432, -1.234344482421875, -0.8947043418884277, -0.5550642013549805, -0.21542412042617798, 0.12421596050262451, 0.4638559818267822, 0.8034961223602295, 1.1431362628936768, 1.482776165008545, 1.8224163055419922, 2.1620564460754395, 2.5016965866088867, 2.841336727142334, 3.180976629257202, 3.5206167697906494, 3.8602569103240967, 4.199896812438965, 4.539536952972412, 4.879177093505859, 5.218817234039307, 5.558457374572754, 5.898097038269043, 6.237737655639648, 6.5773773193359375, 6.917017459869385, 7.256657600402832, 7.596297740936279, 7.935937881469727, 8.275577545166016, 8.615218162536621, 8.95485782623291, 9.294498443603516, 9.634138107299805, 9.973777770996094, 10.3134183883667]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 11.0, 13.0, 25.0, 42.0, 51.0, 97.0, 129.0, 230.0, 347.0, 595.0, 866.0, 1443.0, 2376.0, 3671.0, 5884.0, 9457.0, 14870.0, 23456.0, 36857.0, 56913.0, 86738.0, 128732.0, 185494.0, 257788.0, 337411.0, 414545.0, 464928.0, 470876.0, 431344.0, 360255.0, 278020.0, 203408.0, 142787.0, 96658.0, 63999.0, 41802.0, 26756.0, 17041.0, 10714.0, 6634.0, 4237.0, 2559.0, 1572.0, 1009.0, 616.0, 377.0, 253.0, 160.0, 104.0, 60.0, 29.0, 16.0, 13.0, 10.0, 2.0, 2.0, 1.0, 2.0], "bins": [-8.671875, -8.41015625, -8.1484375, -7.88671875, -7.625, -7.36328125, -7.1015625, -6.83984375, -6.578125, -6.31640625, -6.0546875, -5.79296875, -5.53125, -5.26953125, -5.0078125, -4.74609375, -4.484375, -4.22265625, -3.9609375, -3.69921875, -3.4375, -3.17578125, -2.9140625, -2.65234375, -2.390625, -2.12890625, -1.8671875, -1.60546875, -1.34375, -1.08203125, -0.8203125, -0.55859375, -0.296875, -0.03515625, 0.2265625, 0.48828125, 0.75, 1.01171875, 1.2734375, 1.53515625, 1.796875, 2.05859375, 2.3203125, 2.58203125, 2.84375, 3.10546875, 3.3671875, 3.62890625, 3.890625, 4.15234375, 4.4140625, 4.67578125, 4.9375, 5.19921875, 5.4609375, 5.72265625, 5.984375, 6.24609375, 6.5078125, 6.76953125, 7.03125, 7.29296875, 7.5546875, 7.81640625, 8.078125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 12.0, 9.0, 12.0, 7.0, 15.0, 12.0, 17.0, 18.0, 27.0, 30.0, 27.0, 34.0, 41.0, 30.0, 35.0, 27.0, 35.0, 42.0, 35.0, 46.0, 35.0, 41.0, 50.0, 40.0, 38.0, 36.0, 28.0, 28.0, 28.0, 32.0, 20.0, 21.0, 15.0, 14.0, 10.0, 6.0, 14.0, 4.0, 4.0, 4.0, 9.0, 3.0, 4.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-9.5546875, -9.2685546875, -8.982421875, -8.6962890625, -8.41015625, -8.1240234375, -7.837890625, -7.5517578125, -7.265625, -6.9794921875, -6.693359375, -6.4072265625, -6.12109375, -5.8349609375, -5.548828125, -5.2626953125, -4.9765625, -4.6904296875, -4.404296875, -4.1181640625, -3.83203125, -3.5458984375, -3.259765625, -2.9736328125, -2.6875, -2.4013671875, -2.115234375, -1.8291015625, -1.54296875, -1.2568359375, -0.970703125, -0.6845703125, -0.3984375, -0.1123046875, 0.173828125, 0.4599609375, 0.74609375, 1.0322265625, 1.318359375, 1.6044921875, 1.890625, 2.1767578125, 2.462890625, 2.7490234375, 3.03515625, 3.3212890625, 3.607421875, 3.8935546875, 4.1796875, 4.4658203125, 4.751953125, 5.0380859375, 5.32421875, 5.6103515625, 5.896484375, 6.1826171875, 6.46875, 6.7548828125, 7.041015625, 7.3271484375, 7.61328125, 7.8994140625, 8.185546875, 8.4716796875, 8.7578125]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 7.0, 23.0, 19.0, 38.0, 64.0, 122.0, 197.0, 359.0, 580.0, 963.0, 1613.0, 2550.0, 4320.0, 7034.0, 11207.0, 18142.0, 28218.0, 43002.0, 64437.0, 94963.0, 135095.0, 184974.0, 244419.0, 306901.0, 363970.0, 403786.0, 416469.0, 399596.0, 356484.0, 298383.0, 235917.0, 177947.0, 129253.0, 90460.0, 60982.0, 41329.0, 26208.0, 16835.0, 10499.0, 6573.0, 4072.0, 2510.0, 1528.0, 918.0, 567.0, 310.0, 197.0, 120.0, 53.0, 26.0, 27.0, 10.0, 5.0, 5.0, 1.0, 2.0, 1.0], "bins": [-8.4296875, -8.17755126953125, -7.9254150390625, -7.67327880859375, -7.421142578125, -7.16900634765625, -6.9168701171875, -6.66473388671875, -6.41259765625, -6.16046142578125, -5.9083251953125, -5.65618896484375, -5.404052734375, -5.15191650390625, -4.8997802734375, -4.64764404296875, -4.3955078125, -4.14337158203125, -3.8912353515625, -3.63909912109375, -3.386962890625, -3.13482666015625, -2.8826904296875, -2.63055419921875, -2.37841796875, -2.12628173828125, -1.8741455078125, -1.62200927734375, -1.369873046875, -1.11773681640625, -0.8656005859375, -0.61346435546875, -0.361328125, -0.10919189453125, 0.1429443359375, 0.39508056640625, 0.647216796875, 0.89935302734375, 1.1514892578125, 1.40362548828125, 1.65576171875, 1.90789794921875, 2.1600341796875, 2.41217041015625, 2.664306640625, 2.91644287109375, 3.1685791015625, 3.42071533203125, 3.6728515625, 3.92498779296875, 4.1771240234375, 4.42926025390625, 4.681396484375, 4.93353271484375, 5.1856689453125, 5.43780517578125, 5.68994140625, 5.94207763671875, 6.1942138671875, 6.44635009765625, 6.698486328125, 6.95062255859375, 7.2027587890625, 7.45489501953125, 7.70703125]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 6.0, 8.0, 5.0, 8.0, 14.0, 14.0, 16.0, 37.0, 21.0, 34.0, 38.0, 73.0, 57.0, 77.0, 96.0, 100.0, 97.0, 153.0, 175.0, 153.0, 171.0, 157.0, 182.0, 211.0, 204.0, 242.0, 178.0, 194.0, 194.0, 169.0, 142.0, 119.0, 122.0, 99.0, 98.0, 89.0, 55.0, 70.0, 53.0, 35.0, 28.0, 25.0, 24.0, 15.0, 7.0, 3.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.10546875, -3.9705810546875, -3.835693359375, -3.7008056640625, -3.56591796875, -3.4310302734375, -3.296142578125, -3.1612548828125, -3.0263671875, -2.8914794921875, -2.756591796875, -2.6217041015625, -2.48681640625, -2.3519287109375, -2.217041015625, -2.0821533203125, -1.947265625, -1.8123779296875, -1.677490234375, -1.5426025390625, -1.40771484375, -1.2728271484375, -1.137939453125, -1.0030517578125, -0.8681640625, -0.7332763671875, -0.598388671875, -0.4635009765625, -0.32861328125, -0.1937255859375, -0.058837890625, 0.0760498046875, 0.2109375, 0.3458251953125, 0.480712890625, 0.6156005859375, 0.75048828125, 0.8853759765625, 1.020263671875, 1.1551513671875, 1.2900390625, 1.4249267578125, 1.559814453125, 1.6947021484375, 1.82958984375, 1.9644775390625, 2.099365234375, 2.2342529296875, 2.369140625, 2.5040283203125, 2.638916015625, 2.7738037109375, 2.90869140625, 3.0435791015625, 3.178466796875, 3.3133544921875, 3.4482421875, 3.5831298828125, 3.718017578125, 3.8529052734375, 3.98779296875, 4.1226806640625, 4.257568359375, 4.3924560546875, 4.52734375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 0.0, 4.0, 3.0, 4.0, 6.0, 4.0, 9.0, 17.0, 13.0, 19.0, 20.0, 19.0, 25.0, 37.0, 33.0, 25.0, 47.0, 40.0, 56.0, 39.0, 49.0, 38.0, 42.0, 41.0, 39.0, 41.0, 33.0, 38.0, 38.0, 38.0, 27.0, 36.0, 18.0, 22.0, 11.0, 17.0, 16.0, 12.0, 9.0, 5.0, 6.0, 2.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.316300392150879, -9.949918746948242, -9.583538055419922, -9.217156410217285, -8.850774765014648, -8.484393119812012, -8.118011474609375, -7.751630783081055, -7.385249137878418, -7.018867492675781, -6.652486324310303, -6.286105155944824, -5.9197235107421875, -5.553341865539551, -5.186960697174072, -4.820579528808594, -4.454197883605957, -4.08781623840332, -3.721435070037842, -3.355053663253784, -2.9886722564697266, -2.622290849685669, -2.2559094429016113, -1.8895280361175537, -1.523146629333496, -1.1567652225494385, -0.7903838157653809, -0.42400240898132324, -0.057621002197265625, 0.308760404586792, 0.6751418113708496, 1.0415232181549072, 1.4079046249389648, 1.7742860317230225, 2.14066743850708, 2.5070488452911377, 2.8734302520751953, 3.239811658859253, 3.6061930656433105, 3.972574472427368, 4.338955879211426, 4.7053375244140625, 5.071718692779541, 5.4380998611450195, 5.804481506347656, 6.170863151550293, 6.5372443199157715, 6.90362548828125, 7.270007133483887, 7.636388778686523, 8.002769470214844, 8.36915111541748, 8.735532760620117, 9.101914405822754, 9.46829605102539, 9.834676742553711, 10.201058387756348, 10.567440032958984, 10.933820724487305, 11.300202369689941, 11.666584014892578, 12.032965660095215, 12.399347305297852, 12.765727996826172, 13.132109642028809]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 3.0, 4.0, 11.0, 15.0, 17.0, 13.0, 15.0, 24.0, 18.0, 20.0, 30.0, 29.0, 39.0, 43.0, 39.0, 38.0, 45.0, 43.0, 47.0, 40.0, 39.0, 29.0, 44.0, 32.0, 43.0, 36.0, 27.0, 35.0, 28.0, 14.0, 25.0, 23.0, 14.0, 14.0, 12.0, 13.0, 9.0, 7.0, 9.0, 5.0, 2.0, 1.0, 4.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-12.262622833251953, -11.906577110290527, -11.550531387329102, -11.19448471069336, -10.838438987731934, -10.482393264770508, -10.126346588134766, -9.77030086517334, -9.414255142211914, -9.058209419250488, -8.702163696289062, -8.34611701965332, -7.9900712966918945, -7.634025573730469, -7.277979373931885, -6.921933174133301, -6.565887451171875, -6.209841728210449, -5.853795528411865, -5.497749328613281, -5.1417036056518555, -4.78565788269043, -4.429611682891846, -4.073565483093262, -3.717519760131836, -3.361473798751831, -3.005427837371826, -2.6493818759918213, -2.2933359146118164, -1.9372899532318115, -1.5812439918518066, -1.2251980304718018, -0.8691530227661133, -0.5131070613861084, -0.15706110000610352, 0.19898486137390137, 0.5550308227539062, 0.9110767841339111, 1.267122745513916, 1.623168706893921, 1.9792146682739258, 2.3352606296539307, 2.6913065910339355, 3.0473525524139404, 3.4033985137939453, 3.75944447517395, 4.115490436553955, 4.471536636352539, 4.827582359313965, 5.183628082275391, 5.539674282073975, 5.895720481872559, 6.251766204833984, 6.60781192779541, 6.963858127593994, 7.319904327392578, 7.675950050354004, 8.03199577331543, 8.388042449951172, 8.744088172912598, 9.100133895874023, 9.45617961883545, 9.812225341796875, 10.168272018432617, 10.524317741394043]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 6.0, 8.0, 8.0, 10.0, 14.0, 18.0, 34.0, 38.0, 43.0, 81.0, 116.0, 132.0, 222.0, 321.0, 457.0, 685.0, 1020.0, 1467.0, 2257.0, 3382.0, 5095.0, 7898.0, 12325.0, 20359.0, 33789.0, 57878.0, 97281.0, 154349.0, 198757.0, 170044.0, 111096.0, 66275.0, 39641.0, 23321.0, 14127.0, 9015.0, 5655.0, 3589.0, 2463.0, 1585.0, 1132.0, 803.0, 516.0, 373.0, 268.0, 169.0, 131.0, 111.0, 56.0, 54.0, 34.0, 17.0, 17.0, 9.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0], "bins": [-5.31640625, -5.15350341796875, -4.9906005859375, -4.82769775390625, -4.664794921875, -4.50189208984375, -4.3389892578125, -4.17608642578125, -4.01318359375, -3.85028076171875, -3.6873779296875, -3.52447509765625, -3.361572265625, -3.19866943359375, -3.0357666015625, -2.87286376953125, -2.7099609375, -2.54705810546875, -2.3841552734375, -2.22125244140625, -2.058349609375, -1.89544677734375, -1.7325439453125, -1.56964111328125, -1.40673828125, -1.24383544921875, -1.0809326171875, -0.91802978515625, -0.755126953125, -0.59222412109375, -0.4293212890625, -0.26641845703125, -0.103515625, 0.05938720703125, 0.2222900390625, 0.38519287109375, 0.548095703125, 0.71099853515625, 0.8739013671875, 1.03680419921875, 1.19970703125, 1.36260986328125, 1.5255126953125, 1.68841552734375, 1.851318359375, 2.01422119140625, 2.1771240234375, 2.34002685546875, 2.5029296875, 2.66583251953125, 2.8287353515625, 2.99163818359375, 3.154541015625, 3.31744384765625, 3.4803466796875, 3.64324951171875, 3.80615234375, 3.96905517578125, 4.1319580078125, 4.29486083984375, 4.457763671875, 4.62066650390625, 4.7835693359375, 4.94647216796875, 5.109375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 4.0, 8.0, 16.0, 12.0, 12.0, 16.0, 20.0, 23.0, 20.0, 21.0, 30.0, 34.0, 42.0, 41.0, 34.0, 44.0, 41.0, 44.0, 46.0, 36.0, 39.0, 36.0, 37.0, 33.0, 43.0, 30.0, 31.0, 41.0, 19.0, 15.0, 27.0, 18.0, 14.0, 11.0, 12.0, 12.0, 9.0, 8.0, 8.0, 5.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.9375, -11.5865478515625, -11.235595703125, -10.8846435546875, -10.53369140625, -10.1827392578125, -9.831787109375, -9.4808349609375, -9.1298828125, -8.7789306640625, -8.427978515625, -8.0770263671875, -7.72607421875, -7.3751220703125, -7.024169921875, -6.6732177734375, -6.322265625, -5.9713134765625, -5.620361328125, -5.2694091796875, -4.91845703125, -4.5675048828125, -4.216552734375, -3.8656005859375, -3.5146484375, -3.1636962890625, -2.812744140625, -2.4617919921875, -2.11083984375, -1.7598876953125, -1.408935546875, -1.0579833984375, -0.70703125, -0.3560791015625, -0.005126953125, 0.3458251953125, 0.69677734375, 1.0477294921875, 1.398681640625, 1.7496337890625, 2.1005859375, 2.4515380859375, 2.802490234375, 3.1534423828125, 3.50439453125, 3.8553466796875, 4.206298828125, 4.5572509765625, 4.908203125, 5.2591552734375, 5.610107421875, 5.9610595703125, 6.31201171875, 6.6629638671875, 7.013916015625, 7.3648681640625, 7.7158203125, 8.0667724609375, 8.417724609375, 8.7686767578125, 9.11962890625, 9.4705810546875, 9.821533203125, 10.1724853515625, 10.5234375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 11.0, 22.0, 25.0, 36.0, 56.0, 83.0, 144.0, 188.0, 326.0, 462.0, 830.0, 1301.0, 2196.0, 3970.0, 7421.0, 14936.0, 32547.0, 78668.0, 202586.0, 356511.0, 202194.0, 79099.0, 32790.0, 15048.0, 7425.0, 3954.0, 2275.0, 1346.0, 725.0, 500.0, 332.0, 193.0, 113.0, 86.0, 38.0, 37.0, 23.0, 21.0, 10.0, 9.0, 3.0, 7.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.8828125, -4.72271728515625, -4.5626220703125, -4.40252685546875, -4.242431640625, -4.08233642578125, -3.9222412109375, -3.76214599609375, -3.60205078125, -3.44195556640625, -3.2818603515625, -3.12176513671875, -2.961669921875, -2.80157470703125, -2.6414794921875, -2.48138427734375, -2.3212890625, -2.16119384765625, -2.0010986328125, -1.84100341796875, -1.680908203125, -1.52081298828125, -1.3607177734375, -1.20062255859375, -1.04052734375, -0.88043212890625, -0.7203369140625, -0.56024169921875, -0.400146484375, -0.24005126953125, -0.0799560546875, 0.08013916015625, 0.240234375, 0.40032958984375, 0.5604248046875, 0.72052001953125, 0.880615234375, 1.04071044921875, 1.2008056640625, 1.36090087890625, 1.52099609375, 1.68109130859375, 1.8411865234375, 2.00128173828125, 2.161376953125, 2.32147216796875, 2.4815673828125, 2.64166259765625, 2.8017578125, 2.96185302734375, 3.1219482421875, 3.28204345703125, 3.442138671875, 3.60223388671875, 3.7623291015625, 3.92242431640625, 4.08251953125, 4.24261474609375, 4.4027099609375, 4.56280517578125, 4.722900390625, 4.88299560546875, 5.0430908203125, 5.20318603515625, 5.36328125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 5.0, 6.0, 8.0, 7.0, 5.0, 11.0, 11.0, 11.0, 12.0, 18.0, 27.0, 28.0, 26.0, 27.0, 31.0, 49.0, 27.0, 36.0, 49.0, 48.0, 29.0, 35.0, 39.0, 41.0, 38.0, 45.0, 31.0, 35.0, 35.0, 29.0, 21.0, 36.0, 31.0, 19.0, 20.0, 12.0, 16.0, 3.0, 14.0, 9.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-7.5859375, -7.362548828125, -7.13916015625, -6.915771484375, -6.6923828125, -6.468994140625, -6.24560546875, -6.022216796875, -5.798828125, -5.575439453125, -5.35205078125, -5.128662109375, -4.9052734375, -4.681884765625, -4.45849609375, -4.235107421875, -4.01171875, -3.788330078125, -3.56494140625, -3.341552734375, -3.1181640625, -2.894775390625, -2.67138671875, -2.447998046875, -2.224609375, -2.001220703125, -1.77783203125, -1.554443359375, -1.3310546875, -1.107666015625, -0.88427734375, -0.660888671875, -0.4375, -0.214111328125, 0.00927734375, 0.232666015625, 0.4560546875, 0.679443359375, 0.90283203125, 1.126220703125, 1.349609375, 1.572998046875, 1.79638671875, 2.019775390625, 2.2431640625, 2.466552734375, 2.68994140625, 2.913330078125, 3.13671875, 3.360107421875, 3.58349609375, 3.806884765625, 4.0302734375, 4.253662109375, 4.47705078125, 4.700439453125, 4.923828125, 5.147216796875, 5.37060546875, 5.593994140625, 5.8173828125, 6.040771484375, 6.26416015625, 6.487548828125, 6.7109375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 2.0, 8.0, 10.0, 14.0, 25.0, 30.0, 45.0, 74.0, 96.0, 158.0, 212.0, 316.0, 546.0, 925.0, 1699.0, 3254.0, 7532.0, 24364.0, 190477.0, 726873.0, 66921.0, 14132.0, 5105.0, 2415.0, 1263.0, 705.0, 442.0, 291.0, 183.0, 128.0, 92.0, 65.0, 44.0, 25.0, 23.0, 16.0, 10.0, 8.0, 5.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.7265625, -6.5115966796875, -6.296630859375, -6.0816650390625, -5.86669921875, -5.6517333984375, -5.436767578125, -5.2218017578125, -5.0068359375, -4.7918701171875, -4.576904296875, -4.3619384765625, -4.14697265625, -3.9320068359375, -3.717041015625, -3.5020751953125, -3.287109375, -3.0721435546875, -2.857177734375, -2.6422119140625, -2.42724609375, -2.2122802734375, -1.997314453125, -1.7823486328125, -1.5673828125, -1.3524169921875, -1.137451171875, -0.9224853515625, -0.70751953125, -0.4925537109375, -0.277587890625, -0.0626220703125, 0.15234375, 0.3673095703125, 0.582275390625, 0.7972412109375, 1.01220703125, 1.2271728515625, 1.442138671875, 1.6571044921875, 1.8720703125, 2.0870361328125, 2.302001953125, 2.5169677734375, 2.73193359375, 2.9468994140625, 3.161865234375, 3.3768310546875, 3.591796875, 3.8067626953125, 4.021728515625, 4.2366943359375, 4.45166015625, 4.6666259765625, 4.881591796875, 5.0965576171875, 5.3115234375, 5.5264892578125, 5.741455078125, 5.9564208984375, 6.17138671875, 6.3863525390625, 6.601318359375, 6.8162841796875, 7.03125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 7.0, 7.0, 12.0, 18.0, 12.0, 27.0, 55.0, 61.0, 98.0, 131.0, 129.0, 137.0, 91.0, 46.0, 38.0, 24.0, 20.0, 25.0, 8.0, 8.0, 10.0, 4.0, 6.0, 8.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006456375122070312, -0.0006262585520744324, -0.0006068795919418335, -0.0005875006318092346, -0.0005681216716766357, -0.0005487427115440369, -0.000529363751411438, -0.0005099847912788391, -0.0004906058311462402, -0.00047122687101364136, -0.0004518479108810425, -0.0004324689507484436, -0.0004130899906158447, -0.00039371103048324585, -0.00037433207035064697, -0.0003549531102180481, -0.0003355741500854492, -0.00031619518995285034, -0.00029681622982025146, -0.0002774372696876526, -0.0002580583095550537, -0.00023867934942245483, -0.00021930038928985596, -0.00019992142915725708, -0.0001805424690246582, -0.00016116350889205933, -0.00014178454875946045, -0.00012240558862686157, -0.0001030266284942627, -8.364766836166382e-05, -6.426870822906494e-05, -4.4889748096466064e-05, -2.5510787963867188e-05, -6.1318278312683105e-06, 1.3247132301330566e-05, 3.262609243392944e-05, 5.200505256652832e-05, 7.13840126991272e-05, 9.076297283172607e-05, 0.00011014193296432495, 0.00012952089309692383, 0.0001488998532295227, 0.00016827881336212158, 0.00018765777349472046, 0.00020703673362731934, 0.0002264156937599182, 0.0002457946538925171, 0.00026517361402511597, 0.00028455257415771484, 0.0003039315342903137, 0.0003233104944229126, 0.0003426894545555115, 0.00036206841468811035, 0.00038144737482070923, 0.0004008263349533081, 0.000420205295085907, 0.00043958425521850586, 0.00045896321535110474, 0.0004783421754837036, 0.0004977211356163025, 0.0005171000957489014, 0.0005364790558815002, 0.0005558580160140991, 0.000575236976146698, 0.0005946159362792969]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 5.0, 8.0, 10.0, 19.0, 22.0, 28.0, 62.0, 76.0, 94.0, 185.0, 272.0, 398.0, 560.0, 881.0, 1265.0, 2019.0, 2961.0, 4611.0, 7274.0, 12562.0, 23117.0, 48703.0, 122724.0, 313398.0, 295086.0, 112852.0, 45513.0, 21793.0, 11900.0, 7151.0, 4469.0, 2946.0, 1886.0, 1262.0, 820.0, 541.0, 365.0, 265.0, 151.0, 102.0, 52.0, 48.0, 36.0, 17.0, 24.0, 9.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.44140625, -4.29315185546875, -4.1448974609375, -3.99664306640625, -3.848388671875, -3.70013427734375, -3.5518798828125, -3.40362548828125, -3.25537109375, -3.10711669921875, -2.9588623046875, -2.81060791015625, -2.662353515625, -2.51409912109375, -2.3658447265625, -2.21759033203125, -2.0693359375, -1.92108154296875, -1.7728271484375, -1.62457275390625, -1.476318359375, -1.32806396484375, -1.1798095703125, -1.03155517578125, -0.88330078125, -0.73504638671875, -0.5867919921875, -0.43853759765625, -0.290283203125, -0.14202880859375, 0.0062255859375, 0.15447998046875, 0.302734375, 0.45098876953125, 0.5992431640625, 0.74749755859375, 0.895751953125, 1.04400634765625, 1.1922607421875, 1.34051513671875, 1.48876953125, 1.63702392578125, 1.7852783203125, 1.93353271484375, 2.081787109375, 2.23004150390625, 2.3782958984375, 2.52655029296875, 2.6748046875, 2.82305908203125, 2.9713134765625, 3.11956787109375, 3.267822265625, 3.41607666015625, 3.5643310546875, 3.71258544921875, 3.86083984375, 4.00909423828125, 4.1573486328125, 4.30560302734375, 4.453857421875, 4.60211181640625, 4.7503662109375, 4.89862060546875, 5.046875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 8.0, 5.0, 3.0, 3.0, 7.0, 4.0, 5.0, 12.0, 3.0, 9.0, 20.0, 20.0, 26.0, 38.0, 49.0, 67.0, 105.0, 121.0, 119.0, 95.0, 74.0, 45.0, 32.0, 22.0, 19.0, 12.0, 13.0, 6.0, 6.0, 7.0, 8.0, 4.0, 9.0, 4.0, 2.0, 4.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.841796875, -1.7859039306640625, -1.730010986328125, -1.6741180419921875, -1.61822509765625, -1.5623321533203125, -1.506439208984375, -1.4505462646484375, -1.3946533203125, -1.3387603759765625, -1.282867431640625, -1.2269744873046875, -1.17108154296875, -1.1151885986328125, -1.059295654296875, -1.0034027099609375, -0.947509765625, -0.8916168212890625, -0.835723876953125, -0.7798309326171875, -0.72393798828125, -0.6680450439453125, -0.612152099609375, -0.5562591552734375, -0.5003662109375, -0.4444732666015625, -0.388580322265625, -0.3326873779296875, -0.27679443359375, -0.2209014892578125, -0.165008544921875, -0.1091156005859375, -0.05322265625, 0.0026702880859375, 0.058563232421875, 0.1144561767578125, 0.17034912109375, 0.2262420654296875, 0.282135009765625, 0.3380279541015625, 0.3939208984375, 0.4498138427734375, 0.505706787109375, 0.5615997314453125, 0.61749267578125, 0.6733856201171875, 0.729278564453125, 0.7851715087890625, 0.841064453125, 0.8969573974609375, 0.952850341796875, 1.0087432861328125, 1.06463623046875, 1.1205291748046875, 1.176422119140625, 1.2323150634765625, 1.2882080078125, 1.3441009521484375, 1.399993896484375, 1.4558868408203125, 1.51177978515625, 1.5676727294921875, 1.623565673828125, 1.6794586181640625, 1.7353515625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 7.0, 7.0, 3.0, 13.0, 17.0, 9.0, 19.0, 15.0, 25.0, 29.0, 34.0, 29.0, 41.0, 46.0, 55.0, 53.0, 48.0, 46.0, 44.0, 41.0, 35.0, 52.0, 40.0, 38.0, 35.0, 33.0, 36.0, 30.0, 20.0, 14.0, 25.0, 13.0, 12.0, 13.0, 2.0, 5.0, 5.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.796053886413574, -10.41100788116455, -10.025961875915527, -9.640915870666504, -9.25586986541748, -8.87082290649414, -8.485776901245117, -8.100730895996094, -7.71568489074707, -7.330638885498047, -6.945592880249023, -6.560546875, -6.175500392913818, -5.790454387664795, -5.4054083824157715, -5.02036190032959, -4.635316371917725, -4.250270366668701, -3.8652241230010986, -3.480178117752075, -3.0951318740844727, -2.710085868835449, -2.325039863586426, -1.9399936199188232, -1.5549476146697998, -1.1699014902114868, -0.7848554253578186, -0.3998093605041504, -0.014763236045837402, 0.3702828884124756, 0.755328893661499, 1.1403751373291016, 1.525421142578125, 1.910467267036438, 2.295513391494751, 2.6805593967437744, 3.065605640411377, 3.4506516456604004, 3.835697650909424, 4.2207441329956055, 4.605790138244629, 4.990836143493652, 5.375882148742676, 5.760928153991699, 6.145974636077881, 6.531020641326904, 6.916066646575928, 7.301113128662109, 7.686158657073975, 8.071205139160156, 8.45625114440918, 8.841297149658203, 9.226343154907227, 9.61138916015625, 9.996435165405273, 10.381481170654297, 10.76652717590332, 11.151573181152344, 11.536619186401367, 11.92166519165039, 12.306711196899414, 12.691757202148438, 13.076803207397461, 13.4618501663208, 13.846896171569824]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 12.0, 9.0, 11.0, 14.0, 9.0, 20.0, 26.0, 20.0, 24.0, 33.0, 30.0, 39.0, 48.0, 33.0, 34.0, 46.0, 37.0, 49.0, 49.0, 37.0, 37.0, 35.0, 38.0, 42.0, 37.0, 34.0, 29.0, 23.0, 20.0, 22.0, 16.0, 12.0, 19.0, 11.0, 10.0, 11.0, 7.0, 7.0, 6.0, 1.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.813156127929688, -12.449249267578125, -12.085343360900879, -11.721437454223633, -11.35753059387207, -10.993623733520508, -10.629717826843262, -10.265811920166016, -9.901905059814453, -9.53799819946289, -9.174092292785645, -8.810186386108398, -8.446279525756836, -8.082372665405273, -7.718466758728027, -7.354560375213623, -6.990653991699219, -6.6267476081848145, -6.26284122467041, -5.898934841156006, -5.535028457641602, -5.171122074127197, -4.807215690612793, -4.443309307098389, -4.079402923583984, -3.71549654006958, -3.351590156555176, -2.9876837730407715, -2.623777389526367, -2.259871006011963, -1.8959646224975586, -1.5320582389831543, -1.1681509017944336, -0.8042445182800293, -0.440338134765625, -0.0764317512512207, 0.2874746322631836, 0.6513810157775879, 1.0152873992919922, 1.3791937828063965, 1.7431001663208008, 2.107006549835205, 2.4709129333496094, 2.8348193168640137, 3.198725700378418, 3.5626320838928223, 3.9265384674072266, 4.290444850921631, 4.654351234436035, 5.0182576179504395, 5.382164001464844, 5.746070384979248, 6.109976768493652, 6.473883152008057, 6.837789535522461, 7.201695919036865, 7.5656023025512695, 7.929508686065674, 8.293415069580078, 8.65732192993164, 9.021227836608887, 9.385133743286133, 9.749040603637695, 10.112947463989258, 10.476853370666504]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 6.0, 7.0, 8.0, 11.0, 6.0, 26.0, 36.0, 58.0, 78.0, 147.0, 199.0, 311.0, 570.0, 866.0, 1416.0, 2376.0, 3947.0, 6219.0, 9496.0, 14930.0, 23251.0, 34320.0, 48084.0, 65046.0, 82407.0, 97682.0, 107500.0, 109967.0, 103440.0, 89887.0, 73227.0, 55358.0, 40207.0, 27646.0, 18034.0, 11901.0, 7498.0, 4729.0, 2876.0, 1841.0, 1102.0, 684.0, 448.0, 261.0, 175.0, 100.0, 69.0, 45.0, 28.0, 15.0, 11.0, 3.0, 5.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.375, -9.0648193359375, -8.754638671875, -8.4444580078125, -8.13427734375, -7.8240966796875, -7.513916015625, -7.2037353515625, -6.8935546875, -6.5833740234375, -6.273193359375, -5.9630126953125, -5.65283203125, -5.3426513671875, -5.032470703125, -4.7222900390625, -4.412109375, -4.1019287109375, -3.791748046875, -3.4815673828125, -3.17138671875, -2.8612060546875, -2.551025390625, -2.2408447265625, -1.9306640625, -1.6204833984375, -1.310302734375, -1.0001220703125, -0.68994140625, -0.3797607421875, -0.069580078125, 0.2406005859375, 0.55078125, 0.8609619140625, 1.171142578125, 1.4813232421875, 1.79150390625, 2.1016845703125, 2.411865234375, 2.7220458984375, 3.0322265625, 3.3424072265625, 3.652587890625, 3.9627685546875, 4.27294921875, 4.5831298828125, 4.893310546875, 5.2034912109375, 5.513671875, 5.8238525390625, 6.134033203125, 6.4442138671875, 6.75439453125, 7.0645751953125, 7.374755859375, 7.6849365234375, 7.9951171875, 8.3052978515625, 8.615478515625, 8.9256591796875, 9.23583984375, 9.5460205078125, 9.856201171875, 10.1663818359375, 10.4765625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 2.0, 6.0, 10.0, 10.0, 9.0, 16.0, 16.0, 19.0, 21.0, 25.0, 24.0, 31.0, 33.0, 37.0, 48.0, 37.0, 33.0, 48.0, 35.0, 50.0, 40.0, 42.0, 34.0, 39.0, 42.0, 36.0, 33.0, 33.0, 27.0, 26.0, 20.0, 18.0, 17.0, 16.0, 15.0, 10.0, 11.0, 10.0, 8.0, 8.0, 4.0, 0.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1015625, -11.7554931640625, -11.409423828125, -11.0633544921875, -10.71728515625, -10.3712158203125, -10.025146484375, -9.6790771484375, -9.3330078125, -8.9869384765625, -8.640869140625, -8.2947998046875, -7.94873046875, -7.6026611328125, -7.256591796875, -6.9105224609375, -6.564453125, -6.2183837890625, -5.872314453125, -5.5262451171875, -5.18017578125, -4.8341064453125, -4.488037109375, -4.1419677734375, -3.7958984375, -3.4498291015625, -3.103759765625, -2.7576904296875, -2.41162109375, -2.0655517578125, -1.719482421875, -1.3734130859375, -1.02734375, -0.6812744140625, -0.335205078125, 0.0108642578125, 0.35693359375, 0.7030029296875, 1.049072265625, 1.3951416015625, 1.7412109375, 2.0872802734375, 2.433349609375, 2.7794189453125, 3.12548828125, 3.4715576171875, 3.817626953125, 4.1636962890625, 4.509765625, 4.8558349609375, 5.201904296875, 5.5479736328125, 5.89404296875, 6.2401123046875, 6.586181640625, 6.9322509765625, 7.2783203125, 7.6243896484375, 7.970458984375, 8.3165283203125, 8.66259765625, 9.0086669921875, 9.354736328125, 9.7008056640625, 10.046875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 5.0, 8.0, 8.0, 16.0, 20.0, 32.0, 56.0, 68.0, 124.0, 202.0, 301.0, 488.0, 789.0, 1278.0, 2123.0, 3349.0, 5397.0, 9014.0, 14292.0, 22458.0, 33978.0, 49539.0, 68166.0, 88267.0, 104977.0, 115340.0, 115666.0, 106627.0, 89329.0, 69445.0, 50503.0, 34883.0, 23044.0, 14934.0, 9170.0, 5577.0, 3427.0, 2057.0, 1371.0, 837.0, 520.0, 304.0, 193.0, 133.0, 76.0, 60.0, 43.0, 25.0, 16.0, 10.0, 7.0, 0.0, 4.0, 3.0, 1.0, 2.0, 2.0], "bins": [-11.1328125, -10.7957763671875, -10.458740234375, -10.1217041015625, -9.78466796875, -9.4476318359375, -9.110595703125, -8.7735595703125, -8.4365234375, -8.0994873046875, -7.762451171875, -7.4254150390625, -7.08837890625, -6.7513427734375, -6.414306640625, -6.0772705078125, -5.740234375, -5.4031982421875, -5.066162109375, -4.7291259765625, -4.39208984375, -4.0550537109375, -3.718017578125, -3.3809814453125, -3.0439453125, -2.7069091796875, -2.369873046875, -2.0328369140625, -1.69580078125, -1.3587646484375, -1.021728515625, -0.6846923828125, -0.34765625, -0.0106201171875, 0.326416015625, 0.6634521484375, 1.00048828125, 1.3375244140625, 1.674560546875, 2.0115966796875, 2.3486328125, 2.6856689453125, 3.022705078125, 3.3597412109375, 3.69677734375, 4.0338134765625, 4.370849609375, 4.7078857421875, 5.044921875, 5.3819580078125, 5.718994140625, 6.0560302734375, 6.39306640625, 6.7301025390625, 7.067138671875, 7.4041748046875, 7.7412109375, 8.0782470703125, 8.415283203125, 8.7523193359375, 9.08935546875, 9.4263916015625, 9.763427734375, 10.1004638671875, 10.4375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 5.0, 9.0, 5.0, 11.0, 12.0, 20.0, 22.0, 25.0, 15.0, 32.0, 30.0, 35.0, 34.0, 39.0, 44.0, 40.0, 36.0, 32.0, 58.0, 43.0, 48.0, 38.0, 33.0, 28.0, 40.0, 44.0, 40.0, 31.0, 19.0, 27.0, 21.0, 15.0, 13.0, 13.0, 12.0, 16.0, 3.0, 4.0, 4.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.80859375, -7.5697021484375, -7.330810546875, -7.0919189453125, -6.85302734375, -6.6141357421875, -6.375244140625, -6.1363525390625, -5.8974609375, -5.6585693359375, -5.419677734375, -5.1807861328125, -4.94189453125, -4.7030029296875, -4.464111328125, -4.2252197265625, -3.986328125, -3.7474365234375, -3.508544921875, -3.2696533203125, -3.03076171875, -2.7918701171875, -2.552978515625, -2.3140869140625, -2.0751953125, -1.8363037109375, -1.597412109375, -1.3585205078125, -1.11962890625, -0.8807373046875, -0.641845703125, -0.4029541015625, -0.1640625, 0.0748291015625, 0.313720703125, 0.5526123046875, 0.79150390625, 1.0303955078125, 1.269287109375, 1.5081787109375, 1.7470703125, 1.9859619140625, 2.224853515625, 2.4637451171875, 2.70263671875, 2.9415283203125, 3.180419921875, 3.4193115234375, 3.658203125, 3.8970947265625, 4.135986328125, 4.3748779296875, 4.61376953125, 4.8526611328125, 5.091552734375, 5.3304443359375, 5.5693359375, 5.8082275390625, 6.047119140625, 6.2860107421875, 6.52490234375, 6.7637939453125, 7.002685546875, 7.2415771484375, 7.48046875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 8.0, 15.0, 19.0, 22.0, 37.0, 39.0, 64.0, 96.0, 133.0, 201.0, 335.0, 451.0, 717.0, 1156.0, 1912.0, 2985.0, 5123.0, 8514.0, 15091.0, 27037.0, 48088.0, 81693.0, 125855.0, 165203.0, 173426.0, 145353.0, 100606.0, 61519.0, 35479.0, 19758.0, 11035.0, 6494.0, 3713.0, 2306.0, 1415.0, 909.0, 592.0, 385.0, 228.0, 169.0, 112.0, 79.0, 66.0, 27.0, 28.0, 17.0, 8.0, 15.0, 7.0, 4.0, 5.0, 2.0, 3.0, 3.0], "bins": [-6.3671875, -6.18115234375, -5.9951171875, -5.80908203125, -5.623046875, -5.43701171875, -5.2509765625, -5.06494140625, -4.87890625, -4.69287109375, -4.5068359375, -4.32080078125, -4.134765625, -3.94873046875, -3.7626953125, -3.57666015625, -3.390625, -3.20458984375, -3.0185546875, -2.83251953125, -2.646484375, -2.46044921875, -2.2744140625, -2.08837890625, -1.90234375, -1.71630859375, -1.5302734375, -1.34423828125, -1.158203125, -0.97216796875, -0.7861328125, -0.60009765625, -0.4140625, -0.22802734375, -0.0419921875, 0.14404296875, 0.330078125, 0.51611328125, 0.7021484375, 0.88818359375, 1.07421875, 1.26025390625, 1.4462890625, 1.63232421875, 1.818359375, 2.00439453125, 2.1904296875, 2.37646484375, 2.5625, 2.74853515625, 2.9345703125, 3.12060546875, 3.306640625, 3.49267578125, 3.6787109375, 3.86474609375, 4.05078125, 4.23681640625, 4.4228515625, 4.60888671875, 4.794921875, 4.98095703125, 5.1669921875, 5.35302734375, 5.5390625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 4.0, 7.0, 11.0, 10.0, 12.0, 22.0, 22.0, 22.0, 27.0, 36.0, 39.0, 39.0, 46.0, 60.0, 52.0, 59.0, 60.0, 56.0, 50.0, 48.0, 48.0, 26.0, 44.0, 40.0, 30.0, 29.0, 20.0, 14.0, 16.0, 7.0, 5.0, 11.0, 7.0, 5.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006170272827148438, -0.0005972012877464294, -0.0005773752927780151, -0.0005575492978096008, -0.0005377233028411865, -0.0005178973078727722, -0.0004980713129043579, -0.0004782453179359436, -0.0004584193229675293, -0.000438593327999115, -0.0004187673330307007, -0.0003989413380622864, -0.00037911534309387207, -0.00035928934812545776, -0.00033946335315704346, -0.00031963735818862915, -0.00029981136322021484, -0.00027998536825180054, -0.00026015937328338623, -0.00024033337831497192, -0.00022050738334655762, -0.0002006813883781433, -0.000180855393409729, -0.0001610293984413147, -0.0001412034034729004, -0.00012137740850448608, -0.00010155141353607178, -8.172541856765747e-05, -6.189942359924316e-05, -4.207342863082886e-05, -2.224743366241455e-05, -2.421438694000244e-06, 1.7404556274414062e-05, 3.723055124282837e-05, 5.7056546211242676e-05, 7.688254117965698e-05, 9.670853614807129e-05, 0.0001165345311164856, 0.0001363605260848999, 0.0001561865210533142, 0.00017601251602172852, 0.00019583851099014282, 0.00021566450595855713, 0.00023549050092697144, 0.00025531649589538574, 0.00027514249086380005, 0.00029496848583221436, 0.00031479448080062866, 0.00033462047576904297, 0.0003544464707374573, 0.0003742724657058716, 0.0003940984606742859, 0.0004139244556427002, 0.0004337504506111145, 0.0004535764455795288, 0.0004734024405479431, 0.0004932284355163574, 0.0005130544304847717, 0.000532880425453186, 0.0005527064204216003, 0.0005725324153900146, 0.000592358410358429, 0.0006121844053268433, 0.0006320104002952576, 0.0006518363952636719]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 7.0, 13.0, 9.0, 14.0, 16.0, 26.0, 41.0, 55.0, 84.0, 112.0, 171.0, 241.0, 378.0, 541.0, 769.0, 1159.0, 1583.0, 2500.0, 3877.0, 6207.0, 10221.0, 16968.0, 27827.0, 45225.0, 71560.0, 104428.0, 134548.0, 149909.0, 141547.0, 113135.0, 79985.0, 51585.0, 32303.0, 19578.0, 11718.0, 7162.0, 4566.0, 2770.0, 1813.0, 1225.0, 794.0, 574.0, 411.0, 258.0, 171.0, 132.0, 96.0, 73.0, 55.0, 42.0, 26.0, 19.0, 11.0, 11.0, 5.0, 5.0, 1.0, 3.0, 2.0, 3.0], "bins": [-5.4921875, -5.318603515625, -5.14501953125, -4.971435546875, -4.7978515625, -4.624267578125, -4.45068359375, -4.277099609375, -4.103515625, -3.929931640625, -3.75634765625, -3.582763671875, -3.4091796875, -3.235595703125, -3.06201171875, -2.888427734375, -2.71484375, -2.541259765625, -2.36767578125, -2.194091796875, -2.0205078125, -1.846923828125, -1.67333984375, -1.499755859375, -1.326171875, -1.152587890625, -0.97900390625, -0.805419921875, -0.6318359375, -0.458251953125, -0.28466796875, -0.111083984375, 0.0625, 0.236083984375, 0.40966796875, 0.583251953125, 0.7568359375, 0.930419921875, 1.10400390625, 1.277587890625, 1.451171875, 1.624755859375, 1.79833984375, 1.971923828125, 2.1455078125, 2.319091796875, 2.49267578125, 2.666259765625, 2.83984375, 3.013427734375, 3.18701171875, 3.360595703125, 3.5341796875, 3.707763671875, 3.88134765625, 4.054931640625, 4.228515625, 4.402099609375, 4.57568359375, 4.749267578125, 4.9228515625, 5.096435546875, 5.27001953125, 5.443603515625, 5.6171875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 8.0, 10.0, 14.0, 14.0, 16.0, 22.0, 30.0, 28.0, 34.0, 55.0, 57.0, 70.0, 69.0, 73.0, 63.0, 71.0, 50.0, 52.0, 66.0, 39.0, 42.0, 22.0, 21.0, 16.0, 15.0, 8.0, 9.0, 6.0, 4.0, 0.0, 1.0, 4.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-2.53125, -2.448883056640625, -2.36651611328125, -2.284149169921875, -2.2017822265625, -2.119415283203125, -2.03704833984375, -1.954681396484375, -1.872314453125, -1.789947509765625, -1.70758056640625, -1.625213623046875, -1.5428466796875, -1.460479736328125, -1.37811279296875, -1.295745849609375, -1.21337890625, -1.131011962890625, -1.04864501953125, -0.966278076171875, -0.8839111328125, -0.801544189453125, -0.71917724609375, -0.636810302734375, -0.554443359375, -0.472076416015625, -0.38970947265625, -0.307342529296875, -0.2249755859375, -0.142608642578125, -0.06024169921875, 0.022125244140625, 0.1044921875, 0.186859130859375, 0.26922607421875, 0.351593017578125, 0.4339599609375, 0.516326904296875, 0.59869384765625, 0.681060791015625, 0.763427734375, 0.845794677734375, 0.92816162109375, 1.010528564453125, 1.0928955078125, 1.175262451171875, 1.25762939453125, 1.339996337890625, 1.42236328125, 1.504730224609375, 1.58709716796875, 1.669464111328125, 1.7518310546875, 1.834197998046875, 1.91656494140625, 1.998931884765625, 2.081298828125, 2.163665771484375, 2.24603271484375, 2.328399658203125, 2.4107666015625, 2.493133544921875, 2.57550048828125, 2.657867431640625, 2.740234375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 5.0, 3.0, 5.0, 8.0, 8.0, 12.0, 5.0, 17.0, 15.0, 29.0, 24.0, 21.0, 26.0, 35.0, 43.0, 47.0, 40.0, 44.0, 49.0, 36.0, 50.0, 47.0, 37.0, 35.0, 44.0, 42.0, 34.0, 34.0, 26.0, 32.0, 25.0, 28.0, 20.0, 24.0, 8.0, 9.0, 9.0, 6.0, 3.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.549898147583008, -10.191729545593262, -9.833560943603516, -9.475393295288086, -9.11722469329834, -8.759056091308594, -8.400887489318848, -8.042718887329102, -7.684550762176514, -7.326382160186768, -6.96821403503418, -6.610045433044434, -6.2518768310546875, -5.8937087059021, -5.5355401039123535, -5.177371978759766, -4.8192033767700195, -4.461034774780273, -4.1028666496276855, -3.7446980476379395, -3.3865296840667725, -3.0283613204956055, -2.6701927185058594, -2.3120243549346924, -1.9538559913635254, -1.5956876277923584, -1.2375191450119019, -0.8793506622314453, -0.5211822986602783, -0.16301393508911133, 0.19515466690063477, 0.5533230304718018, 0.9114904403686523, 1.2696588039398193, 1.6278272867202759, 1.9859957695007324, 2.3441641330718994, 2.7023324966430664, 3.0605010986328125, 3.4186694622039795, 3.7768378257751465, 4.135006427764893, 4.4931745529174805, 4.851343154907227, 5.209511756896973, 5.5676798820495605, 5.925848484039307, 6.2840166091918945, 6.642185211181641, 7.000353813171387, 7.358521938323975, 7.716690540313721, 8.074858665466309, 8.433027267456055, 8.7911958694458, 9.149364471435547, 9.507532119750977, 9.865700721740723, 10.223869323730469, 10.582036972045898, 10.940205574035645, 11.29837417602539, 11.656542778015137, 12.014711380004883, 12.372879981994629]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 3.0, 5.0, 5.0, 7.0, 18.0, 11.0, 20.0, 14.0, 24.0, 35.0, 29.0, 23.0, 36.0, 29.0, 36.0, 43.0, 56.0, 42.0, 32.0, 41.0, 51.0, 48.0, 45.0, 35.0, 34.0, 26.0, 36.0, 32.0, 30.0, 27.0, 19.0, 18.0, 17.0, 12.0, 21.0, 9.0, 6.0, 7.0, 7.0, 2.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-13.709505081176758, -13.33723258972168, -12.964960098266602, -12.592687606811523, -12.220415115356445, -11.848142623901367, -11.475870132446289, -11.103597640991211, -10.731325149536133, -10.359052658081055, -9.986780166625977, -9.614507675170898, -9.24223518371582, -8.869962692260742, -8.497690200805664, -8.125417709350586, -7.753144264221191, -7.380871772766113, -7.008599281311035, -6.636326789855957, -6.264054298400879, -5.891781806945801, -5.5195088386535645, -5.147236347198486, -4.774963855743408, -4.40269136428833, -4.030418872833252, -3.6581461429595947, -3.2858736515045166, -2.9136011600494385, -2.5413284301757812, -2.169055938720703, -1.7967844009399414, -1.4245119094848633, -1.0522392988204956, -0.6799666881561279, -0.3076941967010498, 0.06457829475402832, 0.43685102462768555, 0.8091235160827637, 1.1813960075378418, 1.55366849899292, 1.9259411096572876, 2.2982137203216553, 2.6704862117767334, 3.0427587032318115, 3.4150314331054688, 3.787303924560547, 4.159576416015625, 4.531848907470703, 4.904121398925781, 5.276393890380859, 5.6486663818359375, 6.020938873291016, 6.393211841583252, 6.76548433303833, 7.137756824493408, 7.510029315948486, 7.8823018074035645, 8.2545747756958, 8.626847267150879, 8.999119758605957, 9.371392250061035, 9.743664741516113, 10.115937232971191]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 11.0, 10.0, 23.0, 38.0, 62.0, 91.0, 146.0, 238.0, 420.0, 724.0, 1148.0, 2005.0, 3293.0, 5302.0, 9013.0, 14774.0, 23587.0, 37705.0, 58117.0, 90957.0, 135359.0, 195405.0, 271458.0, 352605.0, 428961.0, 472991.0, 472024.0, 426246.0, 352805.0, 268685.0, 194300.0, 133283.0, 89167.0, 57700.0, 36628.0, 23087.0, 14293.0, 8588.0, 5308.0, 3144.0, 1855.0, 1119.0, 661.0, 376.0, 256.0, 131.0, 69.0, 56.0, 29.0, 14.0, 12.0, 6.0, 3.0, 1.0, 1.0, 1.0], "bins": [-9.3125, -9.0384521484375, -8.764404296875, -8.4903564453125, -8.21630859375, -7.9422607421875, -7.668212890625, -7.3941650390625, -7.1201171875, -6.8460693359375, -6.572021484375, -6.2979736328125, -6.02392578125, -5.7498779296875, -5.475830078125, -5.2017822265625, -4.927734375, -4.6536865234375, -4.379638671875, -4.1055908203125, -3.83154296875, -3.5574951171875, -3.283447265625, -3.0093994140625, -2.7353515625, -2.4613037109375, -2.187255859375, -1.9132080078125, -1.63916015625, -1.3651123046875, -1.091064453125, -0.8170166015625, -0.54296875, -0.2689208984375, 0.005126953125, 0.2791748046875, 0.55322265625, 0.8272705078125, 1.101318359375, 1.3753662109375, 1.6494140625, 1.9234619140625, 2.197509765625, 2.4715576171875, 2.74560546875, 3.0196533203125, 3.293701171875, 3.5677490234375, 3.841796875, 4.1158447265625, 4.389892578125, 4.6639404296875, 4.93798828125, 5.2120361328125, 5.486083984375, 5.7601318359375, 6.0341796875, 6.3082275390625, 6.582275390625, 6.8563232421875, 7.13037109375, 7.4044189453125, 7.678466796875, 7.9525146484375, 8.2265625]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 5.0, 7.0, 8.0, 9.0, 12.0, 18.0, 13.0, 25.0, 25.0, 33.0, 26.0, 24.0, 39.0, 33.0, 38.0, 40.0, 51.0, 44.0, 38.0, 41.0, 40.0, 51.0, 43.0, 40.0, 30.0, 23.0, 37.0, 32.0, 30.0, 18.0, 18.0, 15.0, 15.0, 20.0, 16.0, 11.0, 4.0, 8.0, 7.0, 3.0, 4.0, 6.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-11.4609375, -11.145263671875, -10.82958984375, -10.513916015625, -10.1982421875, -9.882568359375, -9.56689453125, -9.251220703125, -8.935546875, -8.619873046875, -8.30419921875, -7.988525390625, -7.6728515625, -7.357177734375, -7.04150390625, -6.725830078125, -6.41015625, -6.094482421875, -5.77880859375, -5.463134765625, -5.1474609375, -4.831787109375, -4.51611328125, -4.200439453125, -3.884765625, -3.569091796875, -3.25341796875, -2.937744140625, -2.6220703125, -2.306396484375, -1.99072265625, -1.675048828125, -1.359375, -1.043701171875, -0.72802734375, -0.412353515625, -0.0966796875, 0.218994140625, 0.53466796875, 0.850341796875, 1.166015625, 1.481689453125, 1.79736328125, 2.113037109375, 2.4287109375, 2.744384765625, 3.06005859375, 3.375732421875, 3.69140625, 4.007080078125, 4.32275390625, 4.638427734375, 4.9541015625, 5.269775390625, 5.58544921875, 5.901123046875, 6.216796875, 6.532470703125, 6.84814453125, 7.163818359375, 7.4794921875, 7.795166015625, 8.11083984375, 8.426513671875, 8.7421875]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 6.0, 14.0, 18.0, 32.0, 46.0, 97.0, 137.0, 231.0, 362.0, 663.0, 1011.0, 1727.0, 2769.0, 4569.0, 7138.0, 11590.0, 18281.0, 28356.0, 42404.0, 63441.0, 92574.0, 130143.0, 176899.0, 232033.0, 290523.0, 343948.0, 383431.0, 400492.0, 391579.0, 358237.0, 308882.0, 249979.0, 195120.0, 144438.0, 103793.0, 71738.0, 49058.0, 32290.0, 20886.0, 13386.0, 8525.0, 5275.0, 3292.0, 1858.0, 1240.0, 724.0, 414.0, 254.0, 163.0, 94.0, 46.0, 42.0, 19.0, 9.0, 11.0, 5.0, 3.0, 1.0, 1.0, 1.0], "bins": [-8.046875, -7.792724609375, -7.53857421875, -7.284423828125, -7.0302734375, -6.776123046875, -6.52197265625, -6.267822265625, -6.013671875, -5.759521484375, -5.50537109375, -5.251220703125, -4.9970703125, -4.742919921875, -4.48876953125, -4.234619140625, -3.98046875, -3.726318359375, -3.47216796875, -3.218017578125, -2.9638671875, -2.709716796875, -2.45556640625, -2.201416015625, -1.947265625, -1.693115234375, -1.43896484375, -1.184814453125, -0.9306640625, -0.676513671875, -0.42236328125, -0.168212890625, 0.0859375, 0.340087890625, 0.59423828125, 0.848388671875, 1.1025390625, 1.356689453125, 1.61083984375, 1.864990234375, 2.119140625, 2.373291015625, 2.62744140625, 2.881591796875, 3.1357421875, 3.389892578125, 3.64404296875, 3.898193359375, 4.15234375, 4.406494140625, 4.66064453125, 4.914794921875, 5.1689453125, 5.423095703125, 5.67724609375, 5.931396484375, 6.185546875, 6.439697265625, 6.69384765625, 6.947998046875, 7.2021484375, 7.456298828125, 7.71044921875, 7.964599609375, 8.21875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 1.0, 0.0, 2.0, 3.0, 5.0, 7.0, 10.0, 15.0, 23.0, 25.0, 35.0, 39.0, 47.0, 49.0, 75.0, 67.0, 79.0, 115.0, 132.0, 153.0, 158.0, 180.0, 203.0, 198.0, 200.0, 213.0, 219.0, 216.0, 167.0, 188.0, 178.0, 169.0, 155.0, 124.0, 107.0, 85.0, 93.0, 57.0, 54.0, 47.0, 43.0, 37.0, 22.0, 18.0, 25.0, 14.0, 12.0, 4.0, 6.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.81640625, -4.6710205078125, -4.525634765625, -4.3802490234375, -4.23486328125, -4.0894775390625, -3.944091796875, -3.7987060546875, -3.6533203125, -3.5079345703125, -3.362548828125, -3.2171630859375, -3.07177734375, -2.9263916015625, -2.781005859375, -2.6356201171875, -2.490234375, -2.3448486328125, -2.199462890625, -2.0540771484375, -1.90869140625, -1.7633056640625, -1.617919921875, -1.4725341796875, -1.3271484375, -1.1817626953125, -1.036376953125, -0.8909912109375, -0.74560546875, -0.6002197265625, -0.454833984375, -0.3094482421875, -0.1640625, -0.0186767578125, 0.126708984375, 0.2720947265625, 0.41748046875, 0.5628662109375, 0.708251953125, 0.8536376953125, 0.9990234375, 1.1444091796875, 1.289794921875, 1.4351806640625, 1.58056640625, 1.7259521484375, 1.871337890625, 2.0167236328125, 2.162109375, 2.3074951171875, 2.452880859375, 2.5982666015625, 2.74365234375, 2.8890380859375, 3.034423828125, 3.1798095703125, 3.3251953125, 3.4705810546875, 3.615966796875, 3.7613525390625, 3.90673828125, 4.0521240234375, 4.197509765625, 4.3428955078125, 4.48828125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 3.0, 5.0, 7.0, 7.0, 11.0, 8.0, 17.0, 26.0, 27.0, 21.0, 19.0, 38.0, 27.0, 52.0, 36.0, 70.0, 40.0, 32.0, 39.0, 38.0, 51.0, 42.0, 38.0, 51.0, 32.0, 34.0, 23.0, 31.0, 35.0, 23.0, 19.0, 18.0, 11.0, 8.0, 9.0, 12.0, 10.0, 7.0, 8.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.796188354492188, -9.425966262817383, -9.055744171142578, -8.685522079467773, -8.315299987792969, -7.945078372955322, -7.574856758117676, -7.204634666442871, -6.834412574768066, -6.464190483093262, -6.093968391418457, -5.7237467765808105, -5.353524684906006, -4.983302593231201, -4.613080978393555, -4.24285888671875, -3.8726367950439453, -3.5024147033691406, -3.132192850112915, -2.7619709968566895, -2.3917489051818848, -2.02152681350708, -1.6513049602508545, -1.281083106994629, -0.9108610153198242, -0.5406390428543091, -0.17041707038879395, 0.1998049020767212, 0.5700268745422363, 0.9402488470077515, 1.3104708194732666, 1.6806926727294922, 2.0509138107299805, 2.421135902404785, 2.7913577556610107, 3.1615796089172363, 3.531801700592041, 3.9020237922668457, 4.272245407104492, 4.642467498779297, 5.012689590454102, 5.382911682128906, 5.753133773803711, 6.123355388641357, 6.493577480316162, 6.863799571990967, 7.234021186828613, 7.604243278503418, 7.974465370178223, 8.344687461853027, 8.714909553527832, 9.085131645202637, 9.455352783203125, 9.82557487487793, 10.195796966552734, 10.566019058227539, 10.936241149902344, 11.306463241577148, 11.676685333251953, 12.046907424926758, 12.417129516601562, 12.78735065460205, 13.157572746276855, 13.52779483795166, 13.898016929626465]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 0.0, 3.0, 6.0, 3.0, 7.0, 7.0, 9.0, 12.0, 12.0, 14.0, 23.0, 18.0, 20.0, 28.0, 29.0, 31.0, 23.0, 40.0, 35.0, 45.0, 39.0, 31.0, 35.0, 48.0, 40.0, 41.0, 49.0, 43.0, 35.0, 27.0, 38.0, 36.0, 26.0, 20.0, 23.0, 20.0, 13.0, 20.0, 10.0, 9.0, 11.0, 8.0, 6.0, 4.0, 2.0, 1.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-12.916873931884766, -12.552591323852539, -12.188308715820312, -11.82402515411377, -11.459742546081543, -11.095459938049316, -10.731176376342773, -10.366893768310547, -10.00261116027832, -9.638328552246094, -9.274045944213867, -8.909762382507324, -8.545479774475098, -8.181197166442871, -7.816914081573486, -7.452630996704102, -7.088348388671875, -6.724065780639648, -6.359782695770264, -5.995499610900879, -5.631217002868652, -5.266934394836426, -4.902651309967041, -4.538368225097656, -4.17408561706543, -3.809802770614624, -3.4455199241638184, -3.0812370777130127, -2.716954231262207, -2.3526713848114014, -1.9883885383605957, -1.62410569190979, -1.2598237991333008, -0.8955409526824951, -0.5312581062316895, -0.1669752597808838, 0.19730758666992188, 0.5615904331207275, 0.9258732795715332, 1.2901561260223389, 1.6544389724731445, 2.01872181892395, 2.383004665374756, 2.7472875118255615, 3.111570358276367, 3.475853204727173, 3.8401360511779785, 4.204419136047363, 4.56870174407959, 4.932984352111816, 5.297267436981201, 5.661550521850586, 6.0258331298828125, 6.390115737915039, 6.754398822784424, 7.118681907653809, 7.482964515686035, 7.847247123718262, 8.211530685424805, 8.575813293457031, 8.940095901489258, 9.304378509521484, 9.668661117553711, 10.032944679260254, 10.39722728729248]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 7.0, 9.0, 8.0, 23.0, 22.0, 33.0, 43.0, 57.0, 79.0, 124.0, 171.0, 258.0, 390.0, 542.0, 839.0, 1230.0, 1906.0, 2953.0, 4522.0, 7345.0, 11421.0, 18451.0, 29690.0, 47336.0, 75033.0, 113991.0, 157178.0, 173175.0, 139698.0, 96155.0, 61618.0, 38727.0, 24055.0, 14999.0, 9490.0, 5973.0, 3754.0, 2405.0, 1560.0, 1079.0, 737.0, 471.0, 326.0, 198.0, 133.0, 101.0, 93.0, 46.0, 42.0, 29.0, 10.0, 9.0, 7.0, 8.0, 1.0, 5.0, 2.0, 0.0, 1.0], "bins": [-4.42578125, -4.2886962890625, -4.151611328125, -4.0145263671875, -3.87744140625, -3.7403564453125, -3.603271484375, -3.4661865234375, -3.3291015625, -3.1920166015625, -3.054931640625, -2.9178466796875, -2.78076171875, -2.6436767578125, -2.506591796875, -2.3695068359375, -2.232421875, -2.0953369140625, -1.958251953125, -1.8211669921875, -1.68408203125, -1.5469970703125, -1.409912109375, -1.2728271484375, -1.1357421875, -0.9986572265625, -0.861572265625, -0.7244873046875, -0.58740234375, -0.4503173828125, -0.313232421875, -0.1761474609375, -0.0390625, 0.0980224609375, 0.235107421875, 0.3721923828125, 0.50927734375, 0.6463623046875, 0.783447265625, 0.9205322265625, 1.0576171875, 1.1947021484375, 1.331787109375, 1.4688720703125, 1.60595703125, 1.7430419921875, 1.880126953125, 2.0172119140625, 2.154296875, 2.2913818359375, 2.428466796875, 2.5655517578125, 2.70263671875, 2.8397216796875, 2.976806640625, 3.1138916015625, 3.2509765625, 3.3880615234375, 3.525146484375, 3.6622314453125, 3.79931640625, 3.9364013671875, 4.073486328125, 4.2105712890625, 4.34765625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 6.0, 3.0, 8.0, 8.0, 8.0, 11.0, 13.0, 13.0, 23.0, 18.0, 19.0, 27.0, 30.0, 32.0, 23.0, 41.0, 34.0, 39.0, 45.0, 30.0, 37.0, 50.0, 38.0, 43.0, 47.0, 44.0, 34.0, 26.0, 36.0, 41.0, 23.0, 20.0, 23.0, 20.0, 14.0, 21.0, 8.0, 10.0, 9.0, 10.0, 5.0, 4.0, 1.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-12.78125, -12.419677734375, -12.05810546875, -11.696533203125, -11.3349609375, -10.973388671875, -10.61181640625, -10.250244140625, -9.888671875, -9.527099609375, -9.16552734375, -8.803955078125, -8.4423828125, -8.080810546875, -7.71923828125, -7.357666015625, -6.99609375, -6.634521484375, -6.27294921875, -5.911376953125, -5.5498046875, -5.188232421875, -4.82666015625, -4.465087890625, -4.103515625, -3.741943359375, -3.38037109375, -3.018798828125, -2.6572265625, -2.295654296875, -1.93408203125, -1.572509765625, -1.2109375, -0.849365234375, -0.48779296875, -0.126220703125, 0.2353515625, 0.596923828125, 0.95849609375, 1.320068359375, 1.681640625, 2.043212890625, 2.40478515625, 2.766357421875, 3.1279296875, 3.489501953125, 3.85107421875, 4.212646484375, 4.57421875, 4.935791015625, 5.29736328125, 5.658935546875, 6.0205078125, 6.382080078125, 6.74365234375, 7.105224609375, 7.466796875, 7.828369140625, 8.18994140625, 8.551513671875, 8.9130859375, 9.274658203125, 9.63623046875, 9.997802734375, 10.359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 6.0, 12.0, 15.0, 24.0, 23.0, 43.0, 57.0, 72.0, 117.0, 170.0, 223.0, 327.0, 457.0, 678.0, 1022.0, 1495.0, 2265.0, 3871.0, 6095.0, 10322.0, 18469.0, 33923.0, 65423.0, 128342.0, 227256.0, 241836.0, 144525.0, 73877.0, 37846.0, 20128.0, 11393.0, 6710.0, 4068.0, 2512.0, 1564.0, 1082.0, 687.0, 520.0, 323.0, 245.0, 155.0, 105.0, 72.0, 62.0, 36.0, 37.0, 20.0, 19.0, 5.0, 8.0, 7.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-3.740234375, -3.61993408203125, -3.4996337890625, -3.37933349609375, -3.259033203125, -3.13873291015625, -3.0184326171875, -2.89813232421875, -2.77783203125, -2.65753173828125, -2.5372314453125, -2.41693115234375, -2.296630859375, -2.17633056640625, -2.0560302734375, -1.93572998046875, -1.8154296875, -1.69512939453125, -1.5748291015625, -1.45452880859375, -1.334228515625, -1.21392822265625, -1.0936279296875, -0.97332763671875, -0.85302734375, -0.73272705078125, -0.6124267578125, -0.49212646484375, -0.371826171875, -0.25152587890625, -0.1312255859375, -0.01092529296875, 0.109375, 0.22967529296875, 0.3499755859375, 0.47027587890625, 0.590576171875, 0.71087646484375, 0.8311767578125, 0.95147705078125, 1.07177734375, 1.19207763671875, 1.3123779296875, 1.43267822265625, 1.552978515625, 1.67327880859375, 1.7935791015625, 1.91387939453125, 2.0341796875, 2.15447998046875, 2.2747802734375, 2.39508056640625, 2.515380859375, 2.63568115234375, 2.7559814453125, 2.87628173828125, 2.99658203125, 3.11688232421875, 3.2371826171875, 3.35748291015625, 3.477783203125, 3.59808349609375, 3.7183837890625, 3.83868408203125, 3.958984375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 7.0, 2.0, 8.0, 7.0, 8.0, 11.0, 15.0, 14.0, 16.0, 26.0, 23.0, 29.0, 24.0, 29.0, 22.0, 31.0, 40.0, 32.0, 33.0, 39.0, 38.0, 46.0, 33.0, 34.0, 40.0, 34.0, 45.0, 47.0, 33.0, 25.0, 31.0, 24.0, 28.0, 21.0, 20.0, 14.0, 17.0, 9.0, 18.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.484375, -6.259033203125, -6.03369140625, -5.808349609375, -5.5830078125, -5.357666015625, -5.13232421875, -4.906982421875, -4.681640625, -4.456298828125, -4.23095703125, -4.005615234375, -3.7802734375, -3.554931640625, -3.32958984375, -3.104248046875, -2.87890625, -2.653564453125, -2.42822265625, -2.202880859375, -1.9775390625, -1.752197265625, -1.52685546875, -1.301513671875, -1.076171875, -0.850830078125, -0.62548828125, -0.400146484375, -0.1748046875, 0.050537109375, 0.27587890625, 0.501220703125, 0.7265625, 0.951904296875, 1.17724609375, 1.402587890625, 1.6279296875, 1.853271484375, 2.07861328125, 2.303955078125, 2.529296875, 2.754638671875, 2.97998046875, 3.205322265625, 3.4306640625, 3.656005859375, 3.88134765625, 4.106689453125, 4.33203125, 4.557373046875, 4.78271484375, 5.008056640625, 5.2333984375, 5.458740234375, 5.68408203125, 5.909423828125, 6.134765625, 6.360107421875, 6.58544921875, 6.810791015625, 7.0361328125, 7.261474609375, 7.48681640625, 7.712158203125, 7.9375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 10.0, 7.0, 11.0, 18.0, 16.0, 29.0, 31.0, 58.0, 63.0, 71.0, 108.0, 181.0, 249.0, 400.0, 679.0, 1192.0, 2361.0, 5183.0, 13291.0, 41139.0, 181612.0, 559176.0, 178724.0, 40390.0, 12924.0, 4983.0, 2377.0, 1186.0, 709.0, 462.0, 283.0, 181.0, 143.0, 93.0, 66.0, 42.0, 38.0, 25.0, 13.0, 10.0, 5.0, 7.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.912109375, -2.81964111328125, -2.7271728515625, -2.63470458984375, -2.542236328125, -2.44976806640625, -2.3572998046875, -2.26483154296875, -2.17236328125, -2.07989501953125, -1.9874267578125, -1.89495849609375, -1.802490234375, -1.71002197265625, -1.6175537109375, -1.52508544921875, -1.4326171875, -1.34014892578125, -1.2476806640625, -1.15521240234375, -1.062744140625, -0.97027587890625, -0.8778076171875, -0.78533935546875, -0.69287109375, -0.60040283203125, -0.5079345703125, -0.41546630859375, -0.322998046875, -0.23052978515625, -0.1380615234375, -0.04559326171875, 0.046875, 0.13934326171875, 0.2318115234375, 0.32427978515625, 0.416748046875, 0.50921630859375, 0.6016845703125, 0.69415283203125, 0.78662109375, 0.87908935546875, 0.9715576171875, 1.06402587890625, 1.156494140625, 1.24896240234375, 1.3414306640625, 1.43389892578125, 1.5263671875, 1.61883544921875, 1.7113037109375, 1.80377197265625, 1.896240234375, 1.98870849609375, 2.0811767578125, 2.17364501953125, 2.26611328125, 2.35858154296875, 2.4510498046875, 2.54351806640625, 2.635986328125, 2.72845458984375, 2.8209228515625, 2.91339111328125, 3.005859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 6.0, 9.0, 14.0, 17.0, 14.0, 26.0, 25.0, 34.0, 34.0, 49.0, 65.0, 87.0, 74.0, 72.0, 74.0, 71.0, 66.0, 50.0, 48.0, 36.0, 21.0, 26.0, 9.0, 10.0, 9.0, 6.0, 7.0, 10.0, 6.0, 5.0, 4.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0003323554992675781, -0.0003235321491956711, -0.00031470879912376404, -0.000305885449051857, -0.00029706209897994995, -0.0002882387489080429, -0.00027941539883613586, -0.0002705920487642288, -0.0002617686986923218, -0.00025294534862041473, -0.0002441219985485077, -0.00023529864847660065, -0.0002264752984046936, -0.00021765194833278656, -0.00020882859826087952, -0.00020000524818897247, -0.00019118189811706543, -0.00018235854804515839, -0.00017353519797325134, -0.0001647118479013443, -0.00015588849782943726, -0.0001470651477575302, -0.00013824179768562317, -0.00012941844761371613, -0.00012059509754180908, -0.00011177174746990204, -0.000102948397397995, -9.412504732608795e-05, -8.530169725418091e-05, -7.647834718227386e-05, -6.765499711036682e-05, -5.883164703845978e-05, -5.0008296966552734e-05, -4.118494689464569e-05, -3.236159682273865e-05, -2.3538246750831604e-05, -1.471489667892456e-05, -5.891546607017517e-06, 2.9318034648895264e-06, 1.175515353679657e-05, 2.0578503608703613e-05, 2.9401853680610657e-05, 3.82252037525177e-05, 4.7048553824424744e-05, 5.587190389633179e-05, 6.469525396823883e-05, 7.351860404014587e-05, 8.234195411205292e-05, 9.116530418395996e-05, 9.9988654255867e-05, 0.00010881200432777405, 0.00011763535439968109, 0.00012645870447158813, 0.00013528205454349518, 0.00014410540461540222, 0.00015292875468730927, 0.0001617521047592163, 0.00017057545483112335, 0.0001793988049030304, 0.00018822215497493744, 0.00019704550504684448, 0.00020586885511875153, 0.00021469220519065857, 0.0002235155552625656, 0.00023233890533447266]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 7.0, 4.0, 3.0, 6.0, 12.0, 16.0, 30.0, 35.0, 48.0, 86.0, 112.0, 214.0, 338.0, 446.0, 728.0, 1120.0, 1852.0, 3200.0, 6076.0, 13608.0, 39459.0, 135158.0, 378952.0, 314440.0, 99691.0, 29801.0, 10818.0, 4993.0, 2766.0, 1622.0, 1036.0, 655.0, 427.0, 267.0, 169.0, 122.0, 81.0, 48.0, 34.0, 30.0, 15.0, 9.0, 13.0, 9.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.29296875, -4.1539306640625, -4.014892578125, -3.8758544921875, -3.73681640625, -3.5977783203125, -3.458740234375, -3.3197021484375, -3.1806640625, -3.0416259765625, -2.902587890625, -2.7635498046875, -2.62451171875, -2.4854736328125, -2.346435546875, -2.2073974609375, -2.068359375, -1.9293212890625, -1.790283203125, -1.6512451171875, -1.51220703125, -1.3731689453125, -1.234130859375, -1.0950927734375, -0.9560546875, -0.8170166015625, -0.677978515625, -0.5389404296875, -0.39990234375, -0.2608642578125, -0.121826171875, 0.0172119140625, 0.15625, 0.2952880859375, 0.434326171875, 0.5733642578125, 0.71240234375, 0.8514404296875, 0.990478515625, 1.1295166015625, 1.2685546875, 1.4075927734375, 1.546630859375, 1.6856689453125, 1.82470703125, 1.9637451171875, 2.102783203125, 2.2418212890625, 2.380859375, 2.5198974609375, 2.658935546875, 2.7979736328125, 2.93701171875, 3.0760498046875, 3.215087890625, 3.3541259765625, 3.4931640625, 3.6322021484375, 3.771240234375, 3.9102783203125, 4.04931640625, 4.1883544921875, 4.327392578125, 4.4664306640625, 4.60546875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 5.0, 3.0, 7.0, 12.0, 15.0, 18.0, 28.0, 34.0, 49.0, 75.0, 83.0, 87.0, 91.0, 86.0, 79.0, 75.0, 55.0, 59.0, 38.0, 29.0, 22.0, 10.0, 7.0, 8.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.169921875, -1.1318511962890625, -1.093780517578125, -1.0557098388671875, -1.01763916015625, -0.9795684814453125, -0.941497802734375, -0.9034271240234375, -0.8653564453125, -0.8272857666015625, -0.789215087890625, -0.7511444091796875, -0.71307373046875, -0.6750030517578125, -0.636932373046875, -0.5988616943359375, -0.560791015625, -0.5227203369140625, -0.484649658203125, -0.4465789794921875, -0.40850830078125, -0.3704376220703125, -0.332366943359375, -0.2942962646484375, -0.2562255859375, -0.2181549072265625, -0.180084228515625, -0.1420135498046875, -0.10394287109375, -0.0658721923828125, -0.027801513671875, 0.0102691650390625, 0.04833984375, 0.0864105224609375, 0.124481201171875, 0.1625518798828125, 0.20062255859375, 0.2386932373046875, 0.276763916015625, 0.3148345947265625, 0.3529052734375, 0.3909759521484375, 0.429046630859375, 0.4671173095703125, 0.50518798828125, 0.5432586669921875, 0.581329345703125, 0.6194000244140625, 0.657470703125, 0.6955413818359375, 0.733612060546875, 0.7716827392578125, 0.80975341796875, 0.8478240966796875, 0.885894775390625, 0.9239654541015625, 0.9620361328125, 1.0001068115234375, 1.038177490234375, 1.0762481689453125, 1.11431884765625, 1.1523895263671875, 1.190460205078125, 1.2285308837890625, 1.2666015625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 8.0, 2.0, 9.0, 10.0, 8.0, 6.0, 21.0, 24.0, 24.0, 27.0, 31.0, 32.0, 42.0, 41.0, 60.0, 52.0, 44.0, 42.0, 45.0, 51.0, 41.0, 47.0, 48.0, 39.0, 34.0, 25.0, 35.0, 27.0, 24.0, 21.0, 9.0, 14.0, 11.0, 13.0, 9.0, 6.0, 9.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.889636039733887, -10.494866371154785, -10.10009765625, -9.705327987670898, -9.310558319091797, -8.915788650512695, -8.521018981933594, -8.126250267028809, -7.731480598449707, -7.3367109298706055, -6.941941738128662, -6.547172546386719, -6.152402877807617, -5.757633209228516, -5.362864017486572, -4.968094825744629, -4.573325157165527, -4.178555488586426, -3.7837862968444824, -3.38901686668396, -2.9942474365234375, -2.599478006362915, -2.2047085762023926, -1.8099391460418701, -1.4151697158813477, -1.0204002857208252, -0.6256308555603027, -0.23086142539978027, 0.1639080047607422, 0.5586774349212646, 0.9534468650817871, 1.3482162952423096, 1.742985725402832, 2.1377551555633545, 2.532524585723877, 2.9272940158843994, 3.322063446044922, 3.7168328762054443, 4.111602306365967, 4.50637149810791, 4.901141166687012, 5.295910835266113, 5.690680027008057, 6.08544921875, 6.480218887329102, 6.874988555908203, 7.2697577476501465, 7.66452693939209, 8.059296607971191, 8.454066276550293, 8.848834991455078, 9.24360466003418, 9.638374328613281, 10.033143997192383, 10.427913665771484, 10.82268238067627, 11.217452049255371, 11.612221717834473, 12.006990432739258, 12.40176010131836, 12.796529769897461, 13.191299438476562, 13.586069107055664, 13.98083782196045, 14.37560749053955]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 5.0, 7.0, 11.0, 9.0, 9.0, 18.0, 18.0, 21.0, 22.0, 30.0, 17.0, 32.0, 26.0, 28.0, 33.0, 50.0, 38.0, 33.0, 32.0, 44.0, 39.0, 46.0, 47.0, 44.0, 36.0, 33.0, 31.0, 36.0, 27.0, 30.0, 19.0, 16.0, 18.0, 17.0, 14.0, 9.0, 14.0, 10.0, 7.0, 5.0, 4.0, 1.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.343374252319336, -11.988327026367188, -11.633280754089355, -11.278233528137207, -10.923187255859375, -10.568140029907227, -10.213092803955078, -9.85804557800293, -9.502999305725098, -9.14795207977295, -8.792905807495117, -8.437858581542969, -8.08281135559082, -7.727765083312988, -7.37271785736084, -7.01767110824585, -6.662624359130859, -6.307577610015869, -5.952530860900879, -5.5974836349487305, -5.24243688583374, -4.88739013671875, -4.532342910766602, -4.177296161651611, -3.822249412536621, -3.467202663421631, -3.1121556758880615, -2.757108688354492, -2.402061939239502, -2.0470151901245117, -1.6919682025909424, -1.336921215057373, -0.9818744659423828, -0.626827597618103, -0.27178072929382324, 0.08326613903045654, 0.43831300735473633, 0.7933598756790161, 1.148406744003296, 1.5034537315368652, 1.8585004806518555, 2.2135472297668457, 2.568594217300415, 2.9236412048339844, 3.2786879539489746, 3.633734703063965, 3.988781690597534, 4.3438286781311035, 4.698875427246094, 5.053922176361084, 5.408968925476074, 5.764016151428223, 6.119062900543213, 6.474109649658203, 6.829156875610352, 7.184203624725342, 7.539250373840332, 7.894297122955322, 8.249343872070312, 8.604391098022461, 8.95943832397461, 9.314484596252441, 9.66953182220459, 10.024578094482422, 10.37962532043457]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 6.0, 6.0, 16.0, 27.0, 49.0, 56.0, 85.0, 160.0, 255.0, 417.0, 618.0, 1025.0, 1655.0, 2357.0, 3586.0, 5660.0, 8262.0, 12233.0, 17581.0, 24830.0, 33247.0, 43717.0, 56159.0, 68185.0, 79825.0, 87926.0, 92490.0, 90889.0, 86058.0, 75990.0, 63867.0, 51877.0, 40038.0, 30171.0, 21958.0, 15518.0, 10634.0, 7334.0, 4880.0, 3242.0, 2038.0, 1376.0, 808.0, 523.0, 351.0, 216.0, 149.0, 87.0, 47.0, 36.0, 20.0, 9.0, 8.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-8.59375, -8.32373046875, -8.0537109375, -7.78369140625, -7.513671875, -7.24365234375, -6.9736328125, -6.70361328125, -6.43359375, -6.16357421875, -5.8935546875, -5.62353515625, -5.353515625, -5.08349609375, -4.8134765625, -4.54345703125, -4.2734375, -4.00341796875, -3.7333984375, -3.46337890625, -3.193359375, -2.92333984375, -2.6533203125, -2.38330078125, -2.11328125, -1.84326171875, -1.5732421875, -1.30322265625, -1.033203125, -0.76318359375, -0.4931640625, -0.22314453125, 0.046875, 0.31689453125, 0.5869140625, 0.85693359375, 1.126953125, 1.39697265625, 1.6669921875, 1.93701171875, 2.20703125, 2.47705078125, 2.7470703125, 3.01708984375, 3.287109375, 3.55712890625, 3.8271484375, 4.09716796875, 4.3671875, 4.63720703125, 4.9072265625, 5.17724609375, 5.447265625, 5.71728515625, 5.9873046875, 6.25732421875, 6.52734375, 6.79736328125, 7.0673828125, 7.33740234375, 7.607421875, 7.87744140625, 8.1474609375, 8.41748046875, 8.6875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 8.0, 7.0, 13.0, 5.0, 13.0, 15.0, 20.0, 22.0, 24.0, 26.0, 22.0, 30.0, 28.0, 25.0, 39.0, 45.0, 41.0, 32.0, 34.0, 49.0, 34.0, 43.0, 46.0, 47.0, 34.0, 35.0, 30.0, 33.0, 26.0, 29.0, 19.0, 16.0, 19.0, 17.0, 13.0, 7.0, 16.0, 9.0, 11.0, 0.0, 5.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-11.8203125, -11.4791259765625, -11.137939453125, -10.7967529296875, -10.45556640625, -10.1143798828125, -9.773193359375, -9.4320068359375, -9.0908203125, -8.7496337890625, -8.408447265625, -8.0672607421875, -7.72607421875, -7.3848876953125, -7.043701171875, -6.7025146484375, -6.361328125, -6.0201416015625, -5.678955078125, -5.3377685546875, -4.99658203125, -4.6553955078125, -4.314208984375, -3.9730224609375, -3.6318359375, -3.2906494140625, -2.949462890625, -2.6082763671875, -2.26708984375, -1.9259033203125, -1.584716796875, -1.2435302734375, -0.90234375, -0.5611572265625, -0.219970703125, 0.1212158203125, 0.46240234375, 0.8035888671875, 1.144775390625, 1.4859619140625, 1.8271484375, 2.1683349609375, 2.509521484375, 2.8507080078125, 3.19189453125, 3.5330810546875, 3.874267578125, 4.2154541015625, 4.556640625, 4.8978271484375, 5.239013671875, 5.5802001953125, 5.92138671875, 6.2625732421875, 6.603759765625, 6.9449462890625, 7.2861328125, 7.6273193359375, 7.968505859375, 8.3096923828125, 8.65087890625, 8.9920654296875, 9.333251953125, 9.6744384765625, 10.015625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 7.0, 12.0, 20.0, 33.0, 45.0, 92.0, 118.0, 172.0, 311.0, 431.0, 732.0, 1184.0, 1857.0, 2950.0, 4570.0, 7258.0, 11258.0, 16628.0, 24728.0, 34658.0, 47970.0, 62463.0, 78716.0, 92359.0, 102262.0, 104211.0, 99125.0, 88046.0, 72977.0, 57240.0, 42779.0, 30514.0, 21556.0, 14642.0, 9527.0, 6307.0, 3908.0, 2562.0, 1686.0, 1003.0, 606.0, 375.0, 228.0, 149.0, 88.0, 70.0, 48.0, 27.0, 13.0, 13.0, 10.0, 3.0, 7.0, 3.0, 1.0, 0.0, 3.0], "bins": [-10.2265625, -9.91015625, -9.59375, -9.27734375, -8.9609375, -8.64453125, -8.328125, -8.01171875, -7.6953125, -7.37890625, -7.0625, -6.74609375, -6.4296875, -6.11328125, -5.796875, -5.48046875, -5.1640625, -4.84765625, -4.53125, -4.21484375, -3.8984375, -3.58203125, -3.265625, -2.94921875, -2.6328125, -2.31640625, -2.0, -1.68359375, -1.3671875, -1.05078125, -0.734375, -0.41796875, -0.1015625, 0.21484375, 0.53125, 0.84765625, 1.1640625, 1.48046875, 1.796875, 2.11328125, 2.4296875, 2.74609375, 3.0625, 3.37890625, 3.6953125, 4.01171875, 4.328125, 4.64453125, 4.9609375, 5.27734375, 5.59375, 5.91015625, 6.2265625, 6.54296875, 6.859375, 7.17578125, 7.4921875, 7.80859375, 8.125, 8.44140625, 8.7578125, 9.07421875, 9.390625, 9.70703125, 10.0234375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 6.0, 2.0, 4.0, 2.0, 1.0, 3.0, 7.0, 9.0, 4.0, 6.0, 10.0, 16.0, 11.0, 15.0, 17.0, 27.0, 20.0, 26.0, 31.0, 21.0, 25.0, 39.0, 31.0, 34.0, 42.0, 39.0, 46.0, 48.0, 39.0, 42.0, 35.0, 34.0, 34.0, 38.0, 31.0, 29.0, 31.0, 18.0, 19.0, 24.0, 19.0, 18.0, 7.0, 10.0, 10.0, 8.0, 10.0, 4.0, 1.0, 3.0, 6.0, 3.0, 0.0, 0.0, 1.0, 4.0], "bins": [-7.57421875, -7.3570556640625, -7.139892578125, -6.9227294921875, -6.70556640625, -6.4884033203125, -6.271240234375, -6.0540771484375, -5.8369140625, -5.6197509765625, -5.402587890625, -5.1854248046875, -4.96826171875, -4.7510986328125, -4.533935546875, -4.3167724609375, -4.099609375, -3.8824462890625, -3.665283203125, -3.4481201171875, -3.23095703125, -3.0137939453125, -2.796630859375, -2.5794677734375, -2.3623046875, -2.1451416015625, -1.927978515625, -1.7108154296875, -1.49365234375, -1.2764892578125, -1.059326171875, -0.8421630859375, -0.625, -0.4078369140625, -0.190673828125, 0.0264892578125, 0.24365234375, 0.4608154296875, 0.677978515625, 0.8951416015625, 1.1123046875, 1.3294677734375, 1.546630859375, 1.7637939453125, 1.98095703125, 2.1981201171875, 2.415283203125, 2.6324462890625, 2.849609375, 3.0667724609375, 3.283935546875, 3.5010986328125, 3.71826171875, 3.9354248046875, 4.152587890625, 4.3697509765625, 4.5869140625, 4.8040771484375, 5.021240234375, 5.2384033203125, 5.45556640625, 5.6727294921875, 5.889892578125, 6.1070556640625, 6.32421875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 8.0, 7.0, 8.0, 22.0, 10.0, 25.0, 53.0, 82.0, 132.0, 196.0, 296.0, 538.0, 848.0, 1445.0, 2445.0, 4290.0, 7173.0, 12460.0, 21749.0, 37846.0, 63504.0, 99514.0, 139234.0, 164451.0, 157228.0, 124570.0, 85212.0, 52534.0, 30599.0, 17775.0, 10161.0, 5804.0, 3292.0, 1995.0, 1144.0, 768.0, 418.0, 280.0, 149.0, 113.0, 62.0, 45.0, 26.0, 20.0, 11.0, 11.0, 8.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.56640625, -6.36627197265625, -6.1661376953125, -5.96600341796875, -5.765869140625, -5.56573486328125, -5.3656005859375, -5.16546630859375, -4.96533203125, -4.76519775390625, -4.5650634765625, -4.36492919921875, -4.164794921875, -3.96466064453125, -3.7645263671875, -3.56439208984375, -3.3642578125, -3.16412353515625, -2.9639892578125, -2.76385498046875, -2.563720703125, -2.36358642578125, -2.1634521484375, -1.96331787109375, -1.76318359375, -1.56304931640625, -1.3629150390625, -1.16278076171875, -0.962646484375, -0.76251220703125, -0.5623779296875, -0.36224365234375, -0.162109375, 0.03802490234375, 0.2381591796875, 0.43829345703125, 0.638427734375, 0.83856201171875, 1.0386962890625, 1.23883056640625, 1.43896484375, 1.63909912109375, 1.8392333984375, 2.03936767578125, 2.239501953125, 2.43963623046875, 2.6397705078125, 2.83990478515625, 3.0400390625, 3.24017333984375, 3.4403076171875, 3.64044189453125, 3.840576171875, 4.04071044921875, 4.2408447265625, 4.44097900390625, 4.64111328125, 4.84124755859375, 5.0413818359375, 5.24151611328125, 5.441650390625, 5.64178466796875, 5.8419189453125, 6.04205322265625, 6.2421875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 12.0, 4.0, 14.0, 10.0, 18.0, 14.0, 17.0, 25.0, 36.0, 40.0, 45.0, 62.0, 53.0, 59.0, 54.0, 54.0, 72.0, 49.0, 52.0, 60.0, 46.0, 35.0, 37.0, 33.0, 24.0, 18.0, 12.0, 8.0, 12.0, 8.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006799697875976562, -0.000657007098197937, -0.0006340444087982178, -0.0006110817193984985, -0.0005881190299987793, -0.0005651563405990601, -0.0005421936511993408, -0.0005192309617996216, -0.0004962682723999023, -0.0004733055830001831, -0.00045034289360046387, -0.00042738020420074463, -0.0004044175148010254, -0.00038145482540130615, -0.0003584921360015869, -0.0003355294466018677, -0.00031256675720214844, -0.0002896040678024292, -0.00026664137840270996, -0.00024367868900299072, -0.00022071599960327148, -0.00019775331020355225, -0.000174790620803833, -0.00015182793140411377, -0.00012886524200439453, -0.00010590255260467529, -8.293986320495605e-05, -5.9977173805236816e-05, -3.701448440551758e-05, -1.405179500579834e-05, 8.910894393920898e-06, 3.187358379364014e-05, 5.4836273193359375e-05, 7.779896259307861e-05, 0.00010076165199279785, 0.0001237243413925171, 0.00014668703079223633, 0.00016964972019195557, 0.0001926124095916748, 0.00021557509899139404, 0.00023853778839111328, 0.0002615004777908325, 0.00028446316719055176, 0.000307425856590271, 0.00033038854598999023, 0.00035335123538970947, 0.0003763139247894287, 0.00039927661418914795, 0.0004222393035888672, 0.0004452019929885864, 0.00046816468238830566, 0.0004911273717880249, 0.0005140900611877441, 0.0005370527505874634, 0.0005600154399871826, 0.0005829781293869019, 0.0006059408187866211, 0.0006289035081863403, 0.0006518661975860596, 0.0006748288869857788, 0.000697791576385498, 0.0007207542657852173, 0.0007437169551849365, 0.0007666796445846558, 0.000789642333984375]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 6.0, 6.0, 9.0, 14.0, 12.0, 19.0, 26.0, 44.0, 80.0, 102.0, 156.0, 224.0, 353.0, 527.0, 773.0, 1101.0, 1704.0, 2712.0, 3864.0, 5752.0, 9017.0, 13286.0, 20235.0, 29314.0, 42088.0, 58878.0, 77802.0, 96614.0, 111110.0, 115647.0, 109753.0, 93687.0, 74805.0, 55949.0, 39776.0, 27371.0, 18900.0, 12435.0, 8169.0, 5330.0, 3615.0, 2423.0, 1527.0, 1107.0, 758.0, 500.0, 309.0, 239.0, 147.0, 100.0, 76.0, 36.0, 28.0, 15.0, 15.0, 10.0, 7.0, 3.0, 1.0, 4.0], "bins": [-5.16796875, -5.0133056640625, -4.858642578125, -4.7039794921875, -4.54931640625, -4.3946533203125, -4.239990234375, -4.0853271484375, -3.9306640625, -3.7760009765625, -3.621337890625, -3.4666748046875, -3.31201171875, -3.1573486328125, -3.002685546875, -2.8480224609375, -2.693359375, -2.5386962890625, -2.384033203125, -2.2293701171875, -2.07470703125, -1.9200439453125, -1.765380859375, -1.6107177734375, -1.4560546875, -1.3013916015625, -1.146728515625, -0.9920654296875, -0.83740234375, -0.6827392578125, -0.528076171875, -0.3734130859375, -0.21875, -0.0640869140625, 0.090576171875, 0.2452392578125, 0.39990234375, 0.5545654296875, 0.709228515625, 0.8638916015625, 1.0185546875, 1.1732177734375, 1.327880859375, 1.4825439453125, 1.63720703125, 1.7918701171875, 1.946533203125, 2.1011962890625, 2.255859375, 2.4105224609375, 2.565185546875, 2.7198486328125, 2.87451171875, 3.0291748046875, 3.183837890625, 3.3385009765625, 3.4931640625, 3.6478271484375, 3.802490234375, 3.9571533203125, 4.11181640625, 4.2664794921875, 4.421142578125, 4.5758056640625, 4.73046875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 8.0, 3.0, 5.0, 9.0, 7.0, 15.0, 15.0, 20.0, 28.0, 25.0, 25.0, 47.0, 67.0, 52.0, 62.0, 58.0, 47.0, 57.0, 62.0, 52.0, 50.0, 59.0, 42.0, 27.0, 35.0, 30.0, 27.0, 11.0, 12.0, 3.0, 11.0, 6.0, 7.0, 3.0, 3.0, 3.0, 5.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.5625, -2.479766845703125, -2.39703369140625, -2.314300537109375, -2.2315673828125, -2.148834228515625, -2.06610107421875, -1.983367919921875, -1.900634765625, -1.817901611328125, -1.73516845703125, -1.652435302734375, -1.5697021484375, -1.486968994140625, -1.40423583984375, -1.321502685546875, -1.23876953125, -1.156036376953125, -1.07330322265625, -0.990570068359375, -0.9078369140625, -0.825103759765625, -0.74237060546875, -0.659637451171875, -0.576904296875, -0.494171142578125, -0.41143798828125, -0.328704833984375, -0.2459716796875, -0.163238525390625, -0.08050537109375, 0.002227783203125, 0.0849609375, 0.167694091796875, 0.25042724609375, 0.333160400390625, 0.4158935546875, 0.498626708984375, 0.58135986328125, 0.664093017578125, 0.746826171875, 0.829559326171875, 0.91229248046875, 0.995025634765625, 1.0777587890625, 1.160491943359375, 1.24322509765625, 1.325958251953125, 1.40869140625, 1.491424560546875, 1.57415771484375, 1.656890869140625, 1.7396240234375, 1.822357177734375, 1.90509033203125, 1.987823486328125, 2.070556640625, 2.153289794921875, 2.23602294921875, 2.318756103515625, 2.4014892578125, 2.484222412109375, 2.56695556640625, 2.649688720703125, 2.732421875]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 4.0, 6.0, 7.0, 8.0, 8.0, 14.0, 16.0, 19.0, 16.0, 25.0, 30.0, 35.0, 47.0, 44.0, 47.0, 43.0, 46.0, 55.0, 47.0, 42.0, 48.0, 41.0, 44.0, 31.0, 40.0, 40.0, 34.0, 35.0, 24.0, 19.0, 19.0, 14.0, 10.0, 10.0, 8.0, 9.0, 9.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-12.368993759155273, -11.959609985351562, -11.550226211547852, -11.14084243774414, -10.731457710266113, -10.322073936462402, -9.912690162658691, -9.50330638885498, -9.093921661376953, -8.684537887573242, -8.275154113769531, -7.865769863128662, -7.456385612487793, -7.047001838684082, -6.637618064880371, -6.22823429107666, -5.818850517272949, -5.409466743469238, -5.000082492828369, -4.590698719024658, -4.181314468383789, -3.771930694580078, -3.362546920776367, -2.953162908554077, -2.543778896331787, -2.134394884109497, -1.7250109910964966, -1.315627098083496, -0.906243085861206, -0.496859073638916, -0.08747529983520508, 0.32190871238708496, 0.731292724609375, 1.140676736831665, 1.5500606298446655, 1.959444522857666, 2.368828535079956, 2.778212547302246, 3.187596321105957, 3.596980333328247, 4.006364345550537, 4.415748119354248, 4.825132369995117, 5.234516143798828, 5.643899917602539, 6.053284168243408, 6.462667942047119, 6.872052192687988, 7.281435966491699, 7.69081974029541, 8.100203514099121, 8.509588241577148, 8.91897201538086, 9.32835578918457, 9.737739562988281, 10.147123336791992, 10.556507110595703, 10.965890884399414, 11.375274658203125, 11.784658432006836, 12.194043159484863, 12.603426933288574, 13.012810707092285, 13.422194480895996, 13.831579208374023]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 3.0, 11.0, 8.0, 5.0, 14.0, 18.0, 20.0, 23.0, 24.0, 36.0, 35.0, 35.0, 37.0, 42.0, 42.0, 48.0, 44.0, 57.0, 53.0, 56.0, 48.0, 38.0, 35.0, 39.0, 38.0, 22.0, 28.0, 35.0, 23.0, 14.0, 24.0, 13.0, 6.0, 5.0, 9.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.965024948120117, -13.537736892700195, -13.110448837280273, -12.683160781860352, -12.25587272644043, -11.828584671020508, -11.401296615600586, -10.974007606506348, -10.546719551086426, -10.119431495666504, -9.692143440246582, -9.26485538482666, -8.837567329406738, -8.4102783203125, -7.982990741729736, -7.555702209472656, -7.128414630889893, -6.701126575469971, -6.273838520050049, -5.846549987792969, -5.419261932373047, -4.991973876953125, -4.564685821533203, -4.137397766113281, -3.7101094722747803, -3.2828214168548584, -2.8555331230163574, -2.4282450675964355, -2.0009570121765137, -1.5736687183380127, -1.1463806629180908, -0.7190923690795898, -0.29180431365966797, 0.13548383116722107, 0.5627719759941101, 0.9900600910186768, 1.4173482656478882, 1.8446364402770996, 2.2719244956970215, 2.6992127895355225, 3.1265008449554443, 3.553788900375366, 3.981077194213867, 4.408365249633789, 4.835653305053711, 5.262941360473633, 5.690229415893555, 6.117517948150635, 6.544806003570557, 6.9720940589904785, 7.3993821144104, 7.8266706466674805, 8.253958702087402, 8.681246757507324, 9.108534812927246, 9.535822868347168, 9.96311092376709, 10.390398979187012, 10.817687034606934, 11.244975090026855, 11.672263145446777, 12.099552154541016, 12.526840209960938, 12.95412826538086, 13.381416320800781]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 14.0, 17.0, 22.0, 52.0, 63.0, 105.0, 184.0, 337.0, 575.0, 958.0, 1596.0, 2704.0, 4492.0, 7342.0, 12132.0, 19630.0, 31213.0, 49315.0, 76229.0, 114950.0, 168497.0, 237115.0, 315857.0, 394843.0, 453211.0, 473471.0, 448485.0, 384095.0, 304956.0, 225718.0, 160778.0, 109162.0, 72660.0, 46438.0, 29431.0, 18422.0, 11475.0, 7060.0, 4316.0, 2550.0, 1620.0, 889.0, 514.0, 333.0, 193.0, 115.0, 76.0, 41.0, 15.0, 9.0, 12.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.6875, -8.4111328125, -8.134765625, -7.8583984375, -7.58203125, -7.3056640625, -7.029296875, -6.7529296875, -6.4765625, -6.2001953125, -5.923828125, -5.6474609375, -5.37109375, -5.0947265625, -4.818359375, -4.5419921875, -4.265625, -3.9892578125, -3.712890625, -3.4365234375, -3.16015625, -2.8837890625, -2.607421875, -2.3310546875, -2.0546875, -1.7783203125, -1.501953125, -1.2255859375, -0.94921875, -0.6728515625, -0.396484375, -0.1201171875, 0.15625, 0.4326171875, 0.708984375, 0.9853515625, 1.26171875, 1.5380859375, 1.814453125, 2.0908203125, 2.3671875, 2.6435546875, 2.919921875, 3.1962890625, 3.47265625, 3.7490234375, 4.025390625, 4.3017578125, 4.578125, 4.8544921875, 5.130859375, 5.4072265625, 5.68359375, 5.9599609375, 6.236328125, 6.5126953125, 6.7890625, 7.0654296875, 7.341796875, 7.6181640625, 7.89453125, 8.1708984375, 8.447265625, 8.7236328125, 9.0]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 6.0, 2.0, 4.0, 8.0, 8.0, 12.0, 14.0, 18.0, 23.0, 20.0, 24.0, 32.0, 35.0, 41.0, 34.0, 44.0, 36.0, 46.0, 48.0, 51.0, 63.0, 49.0, 39.0, 46.0, 40.0, 35.0, 34.0, 30.0, 31.0, 25.0, 21.0, 20.0, 19.0, 13.0, 6.0, 9.0, 6.0, 4.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.90625, -11.5421142578125, -11.177978515625, -10.8138427734375, -10.44970703125, -10.0855712890625, -9.721435546875, -9.3572998046875, -8.9931640625, -8.6290283203125, -8.264892578125, -7.9007568359375, -7.53662109375, -7.1724853515625, -6.808349609375, -6.4442138671875, -6.080078125, -5.7159423828125, -5.351806640625, -4.9876708984375, -4.62353515625, -4.2593994140625, -3.895263671875, -3.5311279296875, -3.1669921875, -2.8028564453125, -2.438720703125, -2.0745849609375, -1.71044921875, -1.3463134765625, -0.982177734375, -0.6180419921875, -0.25390625, 0.1102294921875, 0.474365234375, 0.8385009765625, 1.20263671875, 1.5667724609375, 1.930908203125, 2.2950439453125, 2.6591796875, 3.0233154296875, 3.387451171875, 3.7515869140625, 4.11572265625, 4.4798583984375, 4.843994140625, 5.2081298828125, 5.572265625, 5.9364013671875, 6.300537109375, 6.6646728515625, 7.02880859375, 7.3929443359375, 7.757080078125, 8.1212158203125, 8.4853515625, 8.8494873046875, 9.213623046875, 9.5777587890625, 9.94189453125, 10.3060302734375, 10.670166015625, 11.0343017578125, 11.3984375]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 11.0, 18.0, 33.0, 58.0, 102.0, 175.0, 295.0, 540.0, 952.0, 1692.0, 2819.0, 4957.0, 8156.0, 14014.0, 22604.0, 36342.0, 56284.0, 86574.0, 128548.0, 181626.0, 246114.0, 315442.0, 380038.0, 424431.0, 438355.0, 419185.0, 370619.0, 304805.0, 236253.0, 172269.0, 121053.0, 81694.0, 52205.0, 33859.0, 21337.0, 12623.0, 7586.0, 4514.0, 2542.0, 1570.0, 845.0, 512.0, 270.0, 148.0, 98.0, 60.0, 24.0, 21.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0], "bins": [-9.9375, -9.6488037109375, -9.360107421875, -9.0714111328125, -8.78271484375, -8.4940185546875, -8.205322265625, -7.9166259765625, -7.6279296875, -7.3392333984375, -7.050537109375, -6.7618408203125, -6.47314453125, -6.1844482421875, -5.895751953125, -5.6070556640625, -5.318359375, -5.0296630859375, -4.740966796875, -4.4522705078125, -4.16357421875, -3.8748779296875, -3.586181640625, -3.2974853515625, -3.0087890625, -2.7200927734375, -2.431396484375, -2.1427001953125, -1.85400390625, -1.5653076171875, -1.276611328125, -0.9879150390625, -0.69921875, -0.4105224609375, -0.121826171875, 0.1668701171875, 0.45556640625, 0.7442626953125, 1.032958984375, 1.3216552734375, 1.6103515625, 1.8990478515625, 2.187744140625, 2.4764404296875, 2.76513671875, 3.0538330078125, 3.342529296875, 3.6312255859375, 3.919921875, 4.2086181640625, 4.497314453125, 4.7860107421875, 5.07470703125, 5.3634033203125, 5.652099609375, 5.9407958984375, 6.2294921875, 6.5181884765625, 6.806884765625, 7.0955810546875, 7.38427734375, 7.6729736328125, 7.961669921875, 8.2503662109375, 8.5390625]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 3.0, 6.0, 4.0, 7.0, 4.0, 15.0, 17.0, 26.0, 32.0, 35.0, 51.0, 45.0, 58.0, 56.0, 103.0, 101.0, 117.0, 156.0, 154.0, 158.0, 161.0, 175.0, 178.0, 189.0, 203.0, 209.0, 196.0, 217.0, 155.0, 196.0, 141.0, 154.0, 104.0, 114.0, 103.0, 78.0, 61.0, 57.0, 43.0, 40.0, 37.0, 27.0, 22.0, 19.0, 15.0, 11.0, 4.0, 8.0, 4.0, 8.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.29296875, -4.153564453125, -4.01416015625, -3.874755859375, -3.7353515625, -3.595947265625, -3.45654296875, -3.317138671875, -3.177734375, -3.038330078125, -2.89892578125, -2.759521484375, -2.6201171875, -2.480712890625, -2.34130859375, -2.201904296875, -2.0625, -1.923095703125, -1.78369140625, -1.644287109375, -1.5048828125, -1.365478515625, -1.22607421875, -1.086669921875, -0.947265625, -0.807861328125, -0.66845703125, -0.529052734375, -0.3896484375, -0.250244140625, -0.11083984375, 0.028564453125, 0.16796875, 0.307373046875, 0.44677734375, 0.586181640625, 0.7255859375, 0.864990234375, 1.00439453125, 1.143798828125, 1.283203125, 1.422607421875, 1.56201171875, 1.701416015625, 1.8408203125, 1.980224609375, 2.11962890625, 2.259033203125, 2.3984375, 2.537841796875, 2.67724609375, 2.816650390625, 2.9560546875, 3.095458984375, 3.23486328125, 3.374267578125, 3.513671875, 3.653076171875, 3.79248046875, 3.931884765625, 4.0712890625, 4.210693359375, 4.35009765625, 4.489501953125, 4.62890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 1.0, 3.0, 4.0, 4.0, 7.0, 9.0, 4.0, 14.0, 22.0, 20.0, 14.0, 20.0, 28.0, 32.0, 32.0, 39.0, 43.0, 46.0, 34.0, 36.0, 44.0, 40.0, 38.0, 48.0, 36.0, 40.0, 45.0, 35.0, 34.0, 30.0, 34.0, 21.0, 20.0, 14.0, 13.0, 22.0, 10.0, 10.0, 12.0, 10.0, 7.0, 4.0, 5.0, 1.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-11.752127647399902, -11.386536598205566, -11.02094554901123, -10.655354499816895, -10.289764404296875, -9.924173355102539, -9.558582305908203, -9.192991256713867, -8.827400207519531, -8.461809158325195, -8.09621810913086, -7.730627536773682, -7.365036487579346, -6.99944543838501, -6.633854866027832, -6.268263816833496, -5.90267276763916, -5.537081718444824, -5.171490669250488, -4.8059000968933105, -4.440309047698975, -4.074717998504639, -3.709127187728882, -3.343536376953125, -2.977945327758789, -2.612354278564453, -2.2467634677886963, -1.88117253780365, -1.5155816078186035, -1.1499906778335571, -0.7843997478485107, -0.4188089370727539, -0.05321693420410156, 0.3123739957809448, 0.6779649257659912, 1.0435558557510376, 1.409146785736084, 1.7747377157211304, 2.1403286457061768, 2.5059194564819336, 2.8715105056762695, 3.2371015548706055, 3.6026923656463623, 3.968283176422119, 4.333874225616455, 4.699465274810791, 5.065055847167969, 5.430646896362305, 5.796237945556641, 6.161828994750977, 6.5274200439453125, 6.89301061630249, 7.258601665496826, 7.624192714691162, 7.98978328704834, 8.355374336242676, 8.720965385437012, 9.086556434631348, 9.452147483825684, 9.81773853302002, 10.183328628540039, 10.548919677734375, 10.914510726928711, 11.280101776123047, 11.645692825317383]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 6.0, 5.0, 11.0, 8.0, 9.0, 7.0, 16.0, 22.0, 19.0, 25.0, 19.0, 26.0, 29.0, 29.0, 30.0, 36.0, 59.0, 33.0, 47.0, 38.0, 45.0, 40.0, 38.0, 42.0, 46.0, 40.0, 35.0, 39.0, 19.0, 32.0, 28.0, 19.0, 21.0, 12.0, 19.0, 12.0, 18.0, 9.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.673048973083496, -10.298126220703125, -9.923202514648438, -9.548279762268066, -9.173356056213379, -8.798433303833008, -8.42350959777832, -8.04858684539795, -7.67366361618042, -7.298740386962891, -6.923817157745361, -6.548893928527832, -6.173971176147461, -5.799047470092773, -5.424124717712402, -5.049201488494873, -4.674278259277344, -4.2993550300598145, -3.924431800842285, -3.549508810043335, -3.1745855808258057, -2.7996623516082764, -2.424739360809326, -2.049816131591797, -1.6748929023742676, -1.2999696731567383, -0.9250465631484985, -0.5501234531402588, -0.1752002239227295, 0.1997230052947998, 0.57464599609375, 0.9495692253112793, 1.324493408203125, 1.6994166374206543, 2.0743398666381836, 2.449262857437134, 2.824186086654663, 3.1991093158721924, 3.5740323066711426, 3.948955535888672, 4.323878765106201, 4.6988019943237305, 5.07372522354126, 5.448648452758789, 5.82357120513916, 6.198494911193848, 6.573417663574219, 6.948340892791748, 7.323264122009277, 7.698187351226807, 8.073110580444336, 8.448033332824707, 8.822957038879395, 9.197879791259766, 9.572803497314453, 9.947726249694824, 10.322649002075195, 10.697571754455566, 11.072495460510254, 11.447418212890625, 11.822341918945312, 12.197264671325684, 12.572187423706055, 12.947111129760742, 13.32203483581543]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 7.0, 1.0, 5.0, 4.0, 12.0, 11.0, 22.0, 20.0, 32.0, 54.0, 65.0, 112.0, 155.0, 208.0, 310.0, 450.0, 636.0, 945.0, 1510.0, 2305.0, 3648.0, 5515.0, 8432.0, 13644.0, 21602.0, 34547.0, 55758.0, 89922.0, 140696.0, 185234.0, 170190.0, 117499.0, 72995.0, 45247.0, 27758.0, 17429.0, 11145.0, 7075.0, 4585.0, 2941.0, 1963.0, 1299.0, 804.0, 545.0, 380.0, 248.0, 173.0, 122.0, 92.0, 62.0, 65.0, 25.0, 21.0, 15.0, 11.0, 9.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.923828125, -3.796356201171875, -3.66888427734375, -3.541412353515625, -3.4139404296875, -3.286468505859375, -3.15899658203125, -3.031524658203125, -2.904052734375, -2.776580810546875, -2.64910888671875, -2.521636962890625, -2.3941650390625, -2.266693115234375, -2.13922119140625, -2.011749267578125, -1.88427734375, -1.756805419921875, -1.62933349609375, -1.501861572265625, -1.3743896484375, -1.246917724609375, -1.11944580078125, -0.991973876953125, -0.864501953125, -0.737030029296875, -0.60955810546875, -0.482086181640625, -0.3546142578125, -0.227142333984375, -0.09967041015625, 0.027801513671875, 0.1552734375, 0.282745361328125, 0.41021728515625, 0.537689208984375, 0.6651611328125, 0.792633056640625, 0.92010498046875, 1.047576904296875, 1.175048828125, 1.302520751953125, 1.42999267578125, 1.557464599609375, 1.6849365234375, 1.812408447265625, 1.93988037109375, 2.067352294921875, 2.19482421875, 2.322296142578125, 2.44976806640625, 2.577239990234375, 2.7047119140625, 2.832183837890625, 2.95965576171875, 3.087127685546875, 3.214599609375, 3.342071533203125, 3.46954345703125, 3.597015380859375, 3.7244873046875, 3.851959228515625, 3.97943115234375, 4.106903076171875, 4.234375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 7.0, 4.0, 11.0, 8.0, 10.0, 4.0, 19.0, 24.0, 17.0, 25.0, 18.0, 26.0, 28.0, 30.0, 31.0, 40.0, 53.0, 37.0, 44.0, 38.0, 46.0, 42.0, 36.0, 42.0, 47.0, 37.0, 36.0, 43.0, 17.0, 31.0, 30.0, 16.0, 20.0, 13.0, 20.0, 13.0, 17.0, 9.0, 2.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.609375, -10.2357177734375, -9.862060546875, -9.4884033203125, -9.11474609375, -8.7410888671875, -8.367431640625, -7.9937744140625, -7.6201171875, -7.2464599609375, -6.872802734375, -6.4991455078125, -6.12548828125, -5.7518310546875, -5.378173828125, -5.0045166015625, -4.630859375, -4.2572021484375, -3.883544921875, -3.5098876953125, -3.13623046875, -2.7625732421875, -2.388916015625, -2.0152587890625, -1.6416015625, -1.2679443359375, -0.894287109375, -0.5206298828125, -0.14697265625, 0.2266845703125, 0.600341796875, 0.9739990234375, 1.34765625, 1.7213134765625, 2.094970703125, 2.4686279296875, 2.84228515625, 3.2159423828125, 3.589599609375, 3.9632568359375, 4.3369140625, 4.7105712890625, 5.084228515625, 5.4578857421875, 5.83154296875, 6.2052001953125, 6.578857421875, 6.9525146484375, 7.326171875, 7.6998291015625, 8.073486328125, 8.4471435546875, 8.82080078125, 9.1944580078125, 9.568115234375, 9.9417724609375, 10.3154296875, 10.6890869140625, 11.062744140625, 11.4364013671875, 11.81005859375, 12.1837158203125, 12.557373046875, 12.9310302734375, 13.3046875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 6.0, 5.0, 12.0, 20.0, 23.0, 30.0, 50.0, 64.0, 90.0, 132.0, 211.0, 297.0, 400.0, 653.0, 964.0, 1497.0, 2394.0, 4014.0, 7198.0, 13382.0, 27502.0, 62777.0, 160610.0, 334359.0, 249446.0, 99055.0, 41184.0, 18807.0, 9579.0, 5324.0, 3015.0, 1892.0, 1199.0, 764.0, 521.0, 346.0, 249.0, 164.0, 90.0, 77.0, 46.0, 35.0, 13.0, 20.0, 15.0, 7.0, 6.0, 6.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0], "bins": [-5.31640625, -5.154052734375, -4.99169921875, -4.829345703125, -4.6669921875, -4.504638671875, -4.34228515625, -4.179931640625, -4.017578125, -3.855224609375, -3.69287109375, -3.530517578125, -3.3681640625, -3.205810546875, -3.04345703125, -2.881103515625, -2.71875, -2.556396484375, -2.39404296875, -2.231689453125, -2.0693359375, -1.906982421875, -1.74462890625, -1.582275390625, -1.419921875, -1.257568359375, -1.09521484375, -0.932861328125, -0.7705078125, -0.608154296875, -0.44580078125, -0.283447265625, -0.12109375, 0.041259765625, 0.20361328125, 0.365966796875, 0.5283203125, 0.690673828125, 0.85302734375, 1.015380859375, 1.177734375, 1.340087890625, 1.50244140625, 1.664794921875, 1.8271484375, 1.989501953125, 2.15185546875, 2.314208984375, 2.4765625, 2.638916015625, 2.80126953125, 2.963623046875, 3.1259765625, 3.288330078125, 3.45068359375, 3.613037109375, 3.775390625, 3.937744140625, 4.10009765625, 4.262451171875, 4.4248046875, 4.587158203125, 4.74951171875, 4.911865234375, 5.07421875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 6.0, 6.0, 6.0, 8.0, 12.0, 13.0, 11.0, 8.0, 9.0, 19.0, 18.0, 26.0, 21.0, 20.0, 33.0, 35.0, 29.0, 27.0, 32.0, 42.0, 39.0, 46.0, 35.0, 35.0, 38.0, 48.0, 41.0, 35.0, 23.0, 35.0, 28.0, 29.0, 23.0, 19.0, 21.0, 19.0, 22.0, 18.0, 13.0, 12.0, 8.0, 9.0, 11.0, 4.0, 7.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.109375, -6.88604736328125, -6.6627197265625, -6.43939208984375, -6.216064453125, -5.99273681640625, -5.7694091796875, -5.54608154296875, -5.32275390625, -5.09942626953125, -4.8760986328125, -4.65277099609375, -4.429443359375, -4.20611572265625, -3.9827880859375, -3.75946044921875, -3.5361328125, -3.31280517578125, -3.0894775390625, -2.86614990234375, -2.642822265625, -2.41949462890625, -2.1961669921875, -1.97283935546875, -1.74951171875, -1.52618408203125, -1.3028564453125, -1.07952880859375, -0.856201171875, -0.63287353515625, -0.4095458984375, -0.18621826171875, 0.037109375, 0.26043701171875, 0.4837646484375, 0.70709228515625, 0.930419921875, 1.15374755859375, 1.3770751953125, 1.60040283203125, 1.82373046875, 2.04705810546875, 2.2703857421875, 2.49371337890625, 2.717041015625, 2.94036865234375, 3.1636962890625, 3.38702392578125, 3.6103515625, 3.83367919921875, 4.0570068359375, 4.28033447265625, 4.503662109375, 4.72698974609375, 4.9503173828125, 5.17364501953125, 5.39697265625, 5.62030029296875, 5.8436279296875, 6.06695556640625, 6.290283203125, 6.51361083984375, 6.7369384765625, 6.96026611328125, 7.18359375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 9.0, 9.0, 13.0, 18.0, 29.0, 37.0, 45.0, 67.0, 107.0, 131.0, 213.0, 304.0, 458.0, 678.0, 1105.0, 1905.0, 3205.0, 5922.0, 11680.0, 28949.0, 89626.0, 372991.0, 382214.0, 92436.0, 29762.0, 12243.0, 5861.0, 3339.0, 1924.0, 1125.0, 666.0, 462.0, 330.0, 228.0, 150.0, 98.0, 72.0, 48.0, 28.0, 24.0, 14.0, 10.0, 8.0, 5.0, 3.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.40234375, -2.322296142578125, -2.24224853515625, -2.162200927734375, -2.0821533203125, -2.002105712890625, -1.92205810546875, -1.842010498046875, -1.761962890625, -1.681915283203125, -1.60186767578125, -1.521820068359375, -1.4417724609375, -1.361724853515625, -1.28167724609375, -1.201629638671875, -1.12158203125, -1.041534423828125, -0.96148681640625, -0.881439208984375, -0.8013916015625, -0.721343994140625, -0.64129638671875, -0.561248779296875, -0.481201171875, -0.401153564453125, -0.32110595703125, -0.241058349609375, -0.1610107421875, -0.080963134765625, -0.00091552734375, 0.079132080078125, 0.1591796875, 0.239227294921875, 0.31927490234375, 0.399322509765625, 0.4793701171875, 0.559417724609375, 0.63946533203125, 0.719512939453125, 0.799560546875, 0.879608154296875, 0.95965576171875, 1.039703369140625, 1.1197509765625, 1.199798583984375, 1.27984619140625, 1.359893798828125, 1.43994140625, 1.519989013671875, 1.60003662109375, 1.680084228515625, 1.7601318359375, 1.840179443359375, 1.92022705078125, 2.000274658203125, 2.080322265625, 2.160369873046875, 2.24041748046875, 2.320465087890625, 2.4005126953125, 2.480560302734375, 2.56060791015625, 2.640655517578125, 2.720703125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 0.0, 5.0, 13.0, 12.0, 27.0, 29.0, 60.0, 68.0, 120.0, 159.0, 178.0, 127.0, 74.0, 44.0, 31.0, 24.0, 5.0, 9.0, 7.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007534027099609375, -0.0007335394620895386, -0.0007136762142181396, -0.0006938129663467407, -0.0006739497184753418, -0.0006540864706039429, -0.0006342232227325439, -0.000614359974861145, -0.0005944967269897461, -0.0005746334791183472, -0.0005547702312469482, -0.0005349069833755493, -0.0005150437355041504, -0.0004951804876327515, -0.00047531723976135254, -0.0004554539918899536, -0.0004355907440185547, -0.00041572749614715576, -0.00039586424827575684, -0.0003760010004043579, -0.000356137752532959, -0.00033627450466156006, -0.00031641125679016113, -0.0002965480089187622, -0.0002766847610473633, -0.00025682151317596436, -0.00023695826530456543, -0.0002170950174331665, -0.00019723176956176758, -0.00017736852169036865, -0.00015750527381896973, -0.0001376420259475708, -0.00011777877807617188, -9.791553020477295e-05, -7.805228233337402e-05, -5.81890344619751e-05, -3.832578659057617e-05, -1.8462538719177246e-05, 1.4007091522216797e-06, 2.1263957023620605e-05, 4.112720489501953e-05, 6.099045276641846e-05, 8.085370063781738e-05, 0.00010071694850921631, 0.00012058019638061523, 0.00014044344425201416, 0.00016030669212341309, 0.000180169939994812, 0.00020003318786621094, 0.00021989643573760986, 0.0002397596836090088, 0.0002596229314804077, 0.00027948617935180664, 0.00029934942722320557, 0.0003192126750946045, 0.0003390759229660034, 0.00035893917083740234, 0.00037880241870880127, 0.0003986656665802002, 0.0004185289144515991, 0.00043839216232299805, 0.00045825541019439697, 0.0004781186580657959, 0.0004979819059371948, 0.0005178451538085938]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 9.0, 20.0, 23.0, 38.0, 48.0, 64.0, 108.0, 161.0, 233.0, 319.0, 423.0, 643.0, 918.0, 1456.0, 2217.0, 3476.0, 5437.0, 8732.0, 14285.0, 23550.0, 39339.0, 66598.0, 112433.0, 177447.0, 207007.0, 151934.0, 92477.0, 54991.0, 32252.0, 19640.0, 11754.0, 7255.0, 4576.0, 2923.0, 1945.0, 1184.0, 826.0, 559.0, 407.0, 274.0, 169.0, 131.0, 91.0, 61.0, 45.0, 33.0, 15.0, 13.0, 8.0, 4.0, 1.0, 1.0, 3.0], "bins": [-2.384765625, -2.317230224609375, -2.24969482421875, -2.182159423828125, -2.1146240234375, -2.047088623046875, -1.97955322265625, -1.912017822265625, -1.844482421875, -1.776947021484375, -1.70941162109375, -1.641876220703125, -1.5743408203125, -1.506805419921875, -1.43927001953125, -1.371734619140625, -1.30419921875, -1.236663818359375, -1.16912841796875, -1.101593017578125, -1.0340576171875, -0.966522216796875, -0.89898681640625, -0.831451416015625, -0.763916015625, -0.696380615234375, -0.62884521484375, -0.561309814453125, -0.4937744140625, -0.426239013671875, -0.35870361328125, -0.291168212890625, -0.2236328125, -0.156097412109375, -0.08856201171875, -0.021026611328125, 0.0465087890625, 0.114044189453125, 0.18157958984375, 0.249114990234375, 0.316650390625, 0.384185791015625, 0.45172119140625, 0.519256591796875, 0.5867919921875, 0.654327392578125, 0.72186279296875, 0.789398193359375, 0.85693359375, 0.924468994140625, 0.99200439453125, 1.059539794921875, 1.1270751953125, 1.194610595703125, 1.26214599609375, 1.329681396484375, 1.397216796875, 1.464752197265625, 1.53228759765625, 1.599822998046875, 1.6673583984375, 1.734893798828125, 1.80242919921875, 1.869964599609375, 1.9375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 3.0, 5.0, 7.0, 12.0, 5.0, 9.0, 12.0, 21.0, 14.0, 14.0, 24.0, 37.0, 48.0, 44.0, 50.0, 85.0, 86.0, 83.0, 85.0, 69.0, 58.0, 43.0, 31.0, 26.0, 22.0, 22.0, 15.0, 15.0, 10.0, 11.0, 2.0, 5.0, 6.0, 8.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.97265625, -0.9411468505859375, -0.909637451171875, -0.8781280517578125, -0.84661865234375, -0.8151092529296875, -0.783599853515625, -0.7520904541015625, -0.7205810546875, -0.6890716552734375, -0.657562255859375, -0.6260528564453125, -0.59454345703125, -0.5630340576171875, -0.531524658203125, -0.5000152587890625, -0.468505859375, -0.4369964599609375, -0.405487060546875, -0.3739776611328125, -0.34246826171875, -0.3109588623046875, -0.279449462890625, -0.2479400634765625, -0.2164306640625, -0.1849212646484375, -0.153411865234375, -0.1219024658203125, -0.09039306640625, -0.0588836669921875, -0.027374267578125, 0.0041351318359375, 0.03564453125, 0.0671539306640625, 0.098663330078125, 0.1301727294921875, 0.16168212890625, 0.1931915283203125, 0.224700927734375, 0.2562103271484375, 0.2877197265625, 0.3192291259765625, 0.350738525390625, 0.3822479248046875, 0.41375732421875, 0.4452667236328125, 0.476776123046875, 0.5082855224609375, 0.539794921875, 0.5713043212890625, 0.602813720703125, 0.6343231201171875, 0.66583251953125, 0.6973419189453125, 0.728851318359375, 0.7603607177734375, 0.7918701171875, 0.8233795166015625, 0.854888916015625, 0.8863983154296875, 0.91790771484375, 0.9494171142578125, 0.980926513671875, 1.0124359130859375, 1.0439453125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 6.0, 12.0, 11.0, 17.0, 25.0, 17.0, 15.0, 23.0, 35.0, 34.0, 40.0, 37.0, 51.0, 39.0, 37.0, 43.0, 31.0, 46.0, 36.0, 42.0, 48.0, 41.0, 42.0, 26.0, 25.0, 28.0, 29.0, 23.0, 17.0, 19.0, 17.0, 9.0, 11.0, 14.0, 7.0, 5.0, 3.0, 4.0, 3.0, 5.0, 2.0, 4.0, 1.0, 2.0, 4.0, 1.0, 2.0], "bins": [-12.539216995239258, -12.17225456237793, -11.805293083190918, -11.43833065032959, -11.071369171142578, -10.70440673828125, -10.337444305419922, -9.970481872558594, -9.603520393371582, -9.236557960510254, -8.869596481323242, -8.502634048461914, -8.135671615600586, -7.768710136413574, -7.401747703552246, -7.034785747528076, -6.667823791503906, -6.300861835479736, -5.933899879455566, -5.566937446594238, -5.199975490570068, -4.833013534545898, -4.46605110168457, -4.0990891456604, -3.7321271896362305, -3.3651652336120605, -2.9982030391693115, -2.6312408447265625, -2.2642788887023926, -1.897316813468933, -1.5303547382354736, -1.1633925437927246, -0.7964305877685547, -0.4294685125350952, -0.06250643730163574, 0.30445563793182373, 0.6714177131652832, 1.0383797883987427, 1.4053418636322021, 1.7723040580749512, 2.139266014099121, 2.506227970123291, 2.87319016456604, 3.240152359008789, 3.607114315032959, 3.974076271057129, 4.341038703918457, 4.708000659942627, 5.074962615966797, 5.441924571990967, 5.808886528015137, 6.175848960876465, 6.542810916900635, 6.909772872924805, 7.276735305786133, 7.643697261810303, 8.010659217834473, 8.3776216506958, 8.744583129882812, 9.11154556274414, 9.478507995605469, 9.84546947479248, 10.212431907653809, 10.57939338684082, 10.946355819702148]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 5.0, 4.0, 5.0, 11.0, 7.0, 8.0, 13.0, 15.0, 17.0, 23.0, 27.0, 19.0, 24.0, 29.0, 28.0, 36.0, 47.0, 44.0, 44.0, 41.0, 48.0, 39.0, 38.0, 42.0, 41.0, 44.0, 45.0, 25.0, 37.0, 25.0, 38.0, 20.0, 21.0, 21.0, 16.0, 14.0, 14.0, 12.0, 8.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.687249183654785, -10.307353019714355, -9.927456855773926, -9.547560691833496, -9.167664527893066, -8.787768363952637, -8.40787124633789, -8.027975082397461, -7.6480793952941895, -7.26818323135376, -6.88828706741333, -6.508390426635742, -6.1284942626953125, -5.748598098754883, -5.368701934814453, -4.988805770874023, -4.608909606933594, -4.229013442993164, -3.8491172790527344, -3.4692208766937256, -3.089324712753296, -2.709428548812866, -2.3295321464538574, -1.9496359825134277, -1.569739818572998, -1.1898436546325684, -0.8099473714828491, -0.4300510883331299, -0.050154924392700195, 0.3297412395477295, 0.7096376419067383, 1.089533805847168, 1.4694290161132812, 1.849325180053711, 2.2292213439941406, 2.6091177463531494, 2.989013910293579, 3.368910074234009, 3.7488064765930176, 4.128702640533447, 4.508598804473877, 4.888494968414307, 5.268391132354736, 5.648287773132324, 6.028183937072754, 6.408080101013184, 6.787976264953613, 7.167872428894043, 7.547768592834473, 7.927664756774902, 8.307560920715332, 8.687457084655762, 9.067353248596191, 9.447249412536621, 9.827146530151367, 10.207042694091797, 10.586938858032227, 10.966835021972656, 11.346731185913086, 11.726627349853516, 12.106523513793945, 12.486419677734375, 12.866315841674805, 13.246212005615234, 13.626108169555664]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 11.0, 13.0, 19.0, 25.0, 39.0, 53.0, 74.0, 108.0, 186.0, 265.0, 467.0, 811.0, 1214.0, 1977.0, 3418.0, 5458.0, 8712.0, 13782.0, 20896.0, 30913.0, 43796.0, 59539.0, 76691.0, 91955.0, 103898.0, 108897.0, 104075.0, 93807.0, 77975.0, 61346.0, 45324.0, 32315.0, 21757.0, 14217.0, 9284.0, 5886.0, 3668.0, 2145.0, 1353.0, 808.0, 522.0, 305.0, 212.0, 115.0, 71.0, 56.0, 33.0, 26.0, 18.0, 8.0, 6.0, 7.0, 4.0, 2.0, 1.0], "bins": [-11.203125, -10.87890625, -10.5546875, -10.23046875, -9.90625, -9.58203125, -9.2578125, -8.93359375, -8.609375, -8.28515625, -7.9609375, -7.63671875, -7.3125, -6.98828125, -6.6640625, -6.33984375, -6.015625, -5.69140625, -5.3671875, -5.04296875, -4.71875, -4.39453125, -4.0703125, -3.74609375, -3.421875, -3.09765625, -2.7734375, -2.44921875, -2.125, -1.80078125, -1.4765625, -1.15234375, -0.828125, -0.50390625, -0.1796875, 0.14453125, 0.46875, 0.79296875, 1.1171875, 1.44140625, 1.765625, 2.08984375, 2.4140625, 2.73828125, 3.0625, 3.38671875, 3.7109375, 4.03515625, 4.359375, 4.68359375, 5.0078125, 5.33203125, 5.65625, 5.98046875, 6.3046875, 6.62890625, 6.953125, 7.27734375, 7.6015625, 7.92578125, 8.25, 8.57421875, 8.8984375, 9.22265625, 9.546875]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 4.0, 10.0, 7.0, 9.0, 13.0, 13.0, 19.0, 26.0, 23.0, 17.0, 30.0, 23.0, 30.0, 37.0, 46.0, 48.0, 39.0, 44.0, 48.0, 38.0, 39.0, 42.0, 35.0, 49.0, 45.0, 25.0, 38.0, 27.0, 34.0, 20.0, 21.0, 24.0, 12.0, 16.0, 15.0, 11.0, 8.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3125, -9.9461669921875, -9.579833984375, -9.2135009765625, -8.84716796875, -8.4808349609375, -8.114501953125, -7.7481689453125, -7.3818359375, -7.0155029296875, -6.649169921875, -6.2828369140625, -5.91650390625, -5.5501708984375, -5.183837890625, -4.8175048828125, -4.451171875, -4.0848388671875, -3.718505859375, -3.3521728515625, -2.98583984375, -2.6195068359375, -2.253173828125, -1.8868408203125, -1.5205078125, -1.1541748046875, -0.787841796875, -0.4215087890625, -0.05517578125, 0.3111572265625, 0.677490234375, 1.0438232421875, 1.41015625, 1.7764892578125, 2.142822265625, 2.5091552734375, 2.87548828125, 3.2418212890625, 3.608154296875, 3.9744873046875, 4.3408203125, 4.7071533203125, 5.073486328125, 5.4398193359375, 5.80615234375, 6.1724853515625, 6.538818359375, 6.9051513671875, 7.271484375, 7.6378173828125, 8.004150390625, 8.3704833984375, 8.73681640625, 9.1031494140625, 9.469482421875, 9.8358154296875, 10.2021484375, 10.5684814453125, 10.934814453125, 11.3011474609375, 11.66748046875, 12.0338134765625, 12.400146484375, 12.7664794921875, 13.1328125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 6.0, 13.0, 23.0, 30.0, 50.0, 51.0, 94.0, 176.0, 245.0, 473.0, 756.0, 1221.0, 2062.0, 3409.0, 5653.0, 9222.0, 14325.0, 21971.0, 33208.0, 47064.0, 64107.0, 82762.0, 99171.0, 110079.0, 112245.0, 104931.0, 91195.0, 73872.0, 55841.0, 39707.0, 26912.0, 18086.0, 11511.0, 6990.0, 4323.0, 2704.0, 1595.0, 940.0, 588.0, 364.0, 202.0, 145.0, 82.0, 58.0, 29.0, 19.0, 15.0, 12.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-11.21875, -10.88134765625, -10.5439453125, -10.20654296875, -9.869140625, -9.53173828125, -9.1943359375, -8.85693359375, -8.51953125, -8.18212890625, -7.8447265625, -7.50732421875, -7.169921875, -6.83251953125, -6.4951171875, -6.15771484375, -5.8203125, -5.48291015625, -5.1455078125, -4.80810546875, -4.470703125, -4.13330078125, -3.7958984375, -3.45849609375, -3.12109375, -2.78369140625, -2.4462890625, -2.10888671875, -1.771484375, -1.43408203125, -1.0966796875, -0.75927734375, -0.421875, -0.08447265625, 0.2529296875, 0.59033203125, 0.927734375, 1.26513671875, 1.6025390625, 1.93994140625, 2.27734375, 2.61474609375, 2.9521484375, 3.28955078125, 3.626953125, 3.96435546875, 4.3017578125, 4.63916015625, 4.9765625, 5.31396484375, 5.6513671875, 5.98876953125, 6.326171875, 6.66357421875, 7.0009765625, 7.33837890625, 7.67578125, 8.01318359375, 8.3505859375, 8.68798828125, 9.025390625, 9.36279296875, 9.7001953125, 10.03759765625, 10.375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 3.0, 5.0, 9.0, 11.0, 16.0, 15.0, 20.0, 17.0, 20.0, 23.0, 22.0, 25.0, 26.0, 35.0, 38.0, 38.0, 31.0, 53.0, 42.0, 51.0, 49.0, 48.0, 40.0, 40.0, 33.0, 35.0, 33.0, 26.0, 25.0, 29.0, 21.0, 5.0, 20.0, 15.0, 12.0, 19.0, 11.0, 6.0, 7.0, 6.0, 2.0, 5.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9609375, -5.7364501953125, -5.511962890625, -5.2874755859375, -5.06298828125, -4.8385009765625, -4.614013671875, -4.3895263671875, -4.1650390625, -3.9405517578125, -3.716064453125, -3.4915771484375, -3.26708984375, -3.0426025390625, -2.818115234375, -2.5936279296875, -2.369140625, -2.1446533203125, -1.920166015625, -1.6956787109375, -1.47119140625, -1.2467041015625, -1.022216796875, -0.7977294921875, -0.5732421875, -0.3487548828125, -0.124267578125, 0.1002197265625, 0.32470703125, 0.5491943359375, 0.773681640625, 0.9981689453125, 1.22265625, 1.4471435546875, 1.671630859375, 1.8961181640625, 2.12060546875, 2.3450927734375, 2.569580078125, 2.7940673828125, 3.0185546875, 3.2430419921875, 3.467529296875, 3.6920166015625, 3.91650390625, 4.1409912109375, 4.365478515625, 4.5899658203125, 4.814453125, 5.0389404296875, 5.263427734375, 5.4879150390625, 5.71240234375, 5.9368896484375, 6.161376953125, 6.3858642578125, 6.6103515625, 6.8348388671875, 7.059326171875, 7.2838134765625, 7.50830078125, 7.7327880859375, 7.957275390625, 8.1817626953125, 8.40625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 2.0, 3.0, 8.0, 12.0, 19.0, 29.0, 30.0, 58.0, 67.0, 110.0, 195.0, 292.0, 454.0, 776.0, 1408.0, 2377.0, 4473.0, 8099.0, 14801.0, 26562.0, 46181.0, 76825.0, 115277.0, 151923.0, 166184.0, 149072.0, 110850.0, 72899.0, 43564.0, 24630.0, 13964.0, 7556.0, 4163.0, 2417.0, 1336.0, 779.0, 438.0, 276.0, 143.0, 118.0, 69.0, 42.0, 32.0, 18.0, 11.0, 4.0, 12.0, 4.0, 1.0, 1.0, 5.0], "bins": [-7.72265625, -7.51641845703125, -7.3101806640625, -7.10394287109375, -6.897705078125, -6.69146728515625, -6.4852294921875, -6.27899169921875, -6.07275390625, -5.86651611328125, -5.6602783203125, -5.45404052734375, -5.247802734375, -5.04156494140625, -4.8353271484375, -4.62908935546875, -4.4228515625, -4.21661376953125, -4.0103759765625, -3.80413818359375, -3.597900390625, -3.39166259765625, -3.1854248046875, -2.97918701171875, -2.77294921875, -2.56671142578125, -2.3604736328125, -2.15423583984375, -1.947998046875, -1.74176025390625, -1.5355224609375, -1.32928466796875, -1.123046875, -0.91680908203125, -0.7105712890625, -0.50433349609375, -0.298095703125, -0.09185791015625, 0.1143798828125, 0.32061767578125, 0.52685546875, 0.73309326171875, 0.9393310546875, 1.14556884765625, 1.351806640625, 1.55804443359375, 1.7642822265625, 1.97052001953125, 2.1767578125, 2.38299560546875, 2.5892333984375, 2.79547119140625, 3.001708984375, 3.20794677734375, 3.4141845703125, 3.62042236328125, 3.82666015625, 4.03289794921875, 4.2391357421875, 4.44537353515625, 4.651611328125, 4.85784912109375, 5.0640869140625, 5.27032470703125, 5.4765625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 0.0, 0.0, 8.0, 5.0, 7.0, 6.0, 16.0, 14.0, 21.0, 30.0, 30.0, 36.0, 33.0, 34.0, 41.0, 36.0, 48.0, 51.0, 55.0, 56.0, 68.0, 63.0, 52.0, 54.0, 38.0, 44.0, 30.0, 23.0, 27.0, 25.0, 13.0, 7.0, 8.0, 7.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007047653198242188, -0.0006809532642364502, -0.0006571412086486816, -0.0006333291530609131, -0.0006095170974731445, -0.000585705041885376, -0.0005618929862976074, -0.0005380809307098389, -0.0005142688751220703, -0.0004904568195343018, -0.0004666447639465332, -0.00044283270835876465, -0.0004190206527709961, -0.00039520859718322754, -0.000371396541595459, -0.00034758448600769043, -0.0003237724304199219, -0.0002999603748321533, -0.00027614831924438477, -0.0002523362636566162, -0.00022852420806884766, -0.0002047121524810791, -0.00018090009689331055, -0.000157088041305542, -0.00013327598571777344, -0.00010946393013000488, -8.565187454223633e-05, -6.183981895446777e-05, -3.802776336669922e-05, -1.4215707778930664e-05, 9.59634780883789e-06, 3.3408403396606445e-05, 5.7220458984375e-05, 8.103251457214355e-05, 0.00010484457015991211, 0.00012865662574768066, 0.00015246868133544922, 0.00017628073692321777, 0.00020009279251098633, 0.00022390484809875488, 0.00024771690368652344, 0.000271528959274292, 0.00029534101486206055, 0.0003191530704498291, 0.00034296512603759766, 0.0003667771816253662, 0.00039058923721313477, 0.0004144012928009033, 0.0004382133483886719, 0.00046202540397644043, 0.000485837459564209, 0.0005096495151519775, 0.0005334615707397461, 0.0005572736263275146, 0.0005810856819152832, 0.0006048977375030518, 0.0006287097930908203, 0.0006525218486785889, 0.0006763339042663574, 0.000700145959854126, 0.0007239580154418945, 0.0007477700710296631, 0.0007715821266174316, 0.0007953941822052002, 0.0008192062377929688]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 8.0, 8.0, 11.0, 20.0, 25.0, 28.0, 48.0, 92.0, 106.0, 177.0, 300.0, 375.0, 618.0, 944.0, 1455.0, 2319.0, 3597.0, 5533.0, 8714.0, 13892.0, 22127.0, 34432.0, 52479.0, 75988.0, 103239.0, 126217.0, 135748.0, 126598.0, 104909.0, 77845.0, 53495.0, 35235.0, 22720.0, 14353.0, 8972.0, 5753.0, 3573.0, 2267.0, 1495.0, 998.0, 616.0, 419.0, 264.0, 198.0, 110.0, 73.0, 64.0, 42.0, 20.0, 18.0, 12.0, 5.0, 4.0, 2.0, 3.0, 1.0], "bins": [-6.19140625, -6.0120849609375, -5.832763671875, -5.6534423828125, -5.47412109375, -5.2947998046875, -5.115478515625, -4.9361572265625, -4.7568359375, -4.5775146484375, -4.398193359375, -4.2188720703125, -4.03955078125, -3.8602294921875, -3.680908203125, -3.5015869140625, -3.322265625, -3.1429443359375, -2.963623046875, -2.7843017578125, -2.60498046875, -2.4256591796875, -2.246337890625, -2.0670166015625, -1.8876953125, -1.7083740234375, -1.529052734375, -1.3497314453125, -1.17041015625, -0.9910888671875, -0.811767578125, -0.6324462890625, -0.453125, -0.2738037109375, -0.094482421875, 0.0848388671875, 0.26416015625, 0.4434814453125, 0.622802734375, 0.8021240234375, 0.9814453125, 1.1607666015625, 1.340087890625, 1.5194091796875, 1.69873046875, 1.8780517578125, 2.057373046875, 2.2366943359375, 2.416015625, 2.5953369140625, 2.774658203125, 2.9539794921875, 3.13330078125, 3.3126220703125, 3.491943359375, 3.6712646484375, 3.8505859375, 4.0299072265625, 4.209228515625, 4.3885498046875, 4.56787109375, 4.7471923828125, 4.926513671875, 5.1058349609375, 5.28515625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 7.0, 3.0, 1.0, 9.0, 2.0, 11.0, 15.0, 11.0, 13.0, 15.0, 19.0, 27.0, 23.0, 37.0, 36.0, 53.0, 48.0, 62.0, 59.0, 69.0, 69.0, 62.0, 48.0, 36.0, 43.0, 33.0, 29.0, 30.0, 24.0, 21.0, 19.0, 16.0, 12.0, 8.0, 5.0, 8.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.6953125, -2.61627197265625, -2.5372314453125, -2.45819091796875, -2.379150390625, -2.30010986328125, -2.2210693359375, -2.14202880859375, -2.06298828125, -1.98394775390625, -1.9049072265625, -1.82586669921875, -1.746826171875, -1.66778564453125, -1.5887451171875, -1.50970458984375, -1.4306640625, -1.35162353515625, -1.2725830078125, -1.19354248046875, -1.114501953125, -1.03546142578125, -0.9564208984375, -0.87738037109375, -0.79833984375, -0.71929931640625, -0.6402587890625, -0.56121826171875, -0.482177734375, -0.40313720703125, -0.3240966796875, -0.24505615234375, -0.166015625, -0.08697509765625, -0.0079345703125, 0.07110595703125, 0.150146484375, 0.22918701171875, 0.3082275390625, 0.38726806640625, 0.46630859375, 0.54534912109375, 0.6243896484375, 0.70343017578125, 0.782470703125, 0.86151123046875, 0.9405517578125, 1.01959228515625, 1.0986328125, 1.17767333984375, 1.2567138671875, 1.33575439453125, 1.414794921875, 1.49383544921875, 1.5728759765625, 1.65191650390625, 1.73095703125, 1.80999755859375, 1.8890380859375, 1.96807861328125, 2.047119140625, 2.12615966796875, 2.2052001953125, 2.28424072265625, 2.36328125]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 6.0, 10.0, 11.0, 19.0, 17.0, 18.0, 24.0, 23.0, 28.0, 38.0, 42.0, 44.0, 40.0, 47.0, 41.0, 37.0, 39.0, 42.0, 56.0, 42.0, 42.0, 28.0, 37.0, 38.0, 25.0, 26.0, 38.0, 18.0, 11.0, 18.0, 11.0, 12.0, 11.0, 9.0, 12.0, 3.0, 6.0, 4.0, 2.0, 5.0, 3.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.75565242767334, -11.380942344665527, -11.006231307983398, -10.631521224975586, -10.256810188293457, -9.882100105285645, -9.507389068603516, -9.132678985595703, -8.75796890258789, -8.383258819580078, -8.00854778289795, -7.633837699890137, -7.259126663208008, -6.884416580200195, -6.509706020355225, -6.134995460510254, -5.760284423828125, -5.385573863983154, -5.010863304138184, -4.636153221130371, -4.261442184448242, -3.8867318630218506, -3.512021541595459, -3.1373109817504883, -2.7626004219055176, -2.387889862060547, -2.013179302215576, -1.6384689807891846, -1.2637584209442139, -0.8890478610992432, -0.5143375396728516, -0.13962697982788086, 0.23508453369140625, 0.6097950339317322, 0.9845055341720581, 1.3592159748077393, 1.73392653465271, 2.1086370944976807, 2.4833474159240723, 2.858057975769043, 3.2327685356140137, 3.6074790954589844, 3.982189655303955, 4.356900215148926, 4.731610298156738, 5.106321334838867, 5.48103141784668, 5.85574197769165, 6.230452537536621, 6.605163097381592, 6.9798736572265625, 7.354583740234375, 7.729294776916504, 8.104004859924316, 8.478715896606445, 8.853425979614258, 9.22813606262207, 9.602846145629883, 9.977557182312012, 10.352267265319824, 10.726978302001953, 11.101688385009766, 11.476398468017578, 11.851109504699707, 12.225820541381836]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 1.0, 2.0, 3.0, 10.0, 7.0, 8.0, 8.0, 11.0, 4.0, 19.0, 15.0, 25.0, 15.0, 29.0, 25.0, 37.0, 28.0, 25.0, 43.0, 41.0, 34.0, 35.0, 37.0, 38.0, 41.0, 36.0, 35.0, 29.0, 34.0, 30.0, 36.0, 39.0, 30.0, 22.0, 23.0, 20.0, 19.0, 24.0, 20.0, 10.0, 16.0, 9.0, 8.0, 9.0, 5.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.271442413330078, -10.927652359008789, -10.5838623046875, -10.240072250366211, -9.896282196044922, -9.552492141723633, -9.208702087402344, -8.864912033081055, -8.521121978759766, -8.177331924438477, -7.8335418701171875, -7.489751815795898, -7.145961761474609, -6.80217170715332, -6.458381652832031, -6.114591598510742, -5.770801544189453, -5.427011489868164, -5.083221435546875, -4.739431381225586, -4.395641326904297, -4.051851272583008, -3.7080612182617188, -3.3642711639404297, -3.0204811096191406, -2.6766910552978516, -2.3329010009765625, -1.9891109466552734, -1.6453208923339844, -1.3015308380126953, -0.9577407836914062, -0.6139507293701172, -0.27016162872314453, 0.07362842559814453, 0.4174184799194336, 0.7612085342407227, 1.1049985885620117, 1.4487886428833008, 1.7925786972045898, 2.136368751525879, 2.480158805847168, 2.823948860168457, 3.167738914489746, 3.511528968811035, 3.855319023132324, 4.199109077453613, 4.542899131774902, 4.886689186096191, 5.2304792404174805, 5.5742692947387695, 5.918059349060059, 6.261849403381348, 6.605639457702637, 6.949429512023926, 7.293219566345215, 7.637009620666504, 7.980799674987793, 8.324589729309082, 8.668379783630371, 9.01216983795166, 9.35595989227295, 9.699749946594238, 10.043540000915527, 10.387330055236816, 10.731120109558105]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 6.0, 7.0, 16.0, 23.0, 38.0, 57.0, 117.0, 178.0, 341.0, 518.0, 824.0, 1407.0, 2215.0, 3520.0, 5686.0, 8976.0, 14222.0, 21990.0, 34111.0, 50951.0, 77572.0, 112649.0, 159089.0, 216686.0, 283796.0, 349883.0, 402281.0, 429691.0, 423645.0, 385270.0, 325106.0, 259014.0, 194413.0, 141038.0, 97741.0, 66448.0, 44517.0, 29021.0, 18476.0, 12214.0, 7477.0, 4918.0, 3004.0, 1999.0, 1186.0, 738.0, 441.0, 308.0, 191.0, 107.0, 68.0, 40.0, 27.0, 13.0, 5.0, 10.0, 7.0, 3.0, 0.0, 2.0, 2.0], "bins": [-8.0390625, -7.7781982421875, -7.517333984375, -7.2564697265625, -6.99560546875, -6.7347412109375, -6.473876953125, -6.2130126953125, -5.9521484375, -5.6912841796875, -5.430419921875, -5.1695556640625, -4.90869140625, -4.6478271484375, -4.386962890625, -4.1260986328125, -3.865234375, -3.6043701171875, -3.343505859375, -3.0826416015625, -2.82177734375, -2.5609130859375, -2.300048828125, -2.0391845703125, -1.7783203125, -1.5174560546875, -1.256591796875, -0.9957275390625, -0.73486328125, -0.4739990234375, -0.213134765625, 0.0477294921875, 0.30859375, 0.5694580078125, 0.830322265625, 1.0911865234375, 1.35205078125, 1.6129150390625, 1.873779296875, 2.1346435546875, 2.3955078125, 2.6563720703125, 2.917236328125, 3.1781005859375, 3.43896484375, 3.6998291015625, 3.960693359375, 4.2215576171875, 4.482421875, 4.7432861328125, 5.004150390625, 5.2650146484375, 5.52587890625, 5.7867431640625, 6.047607421875, 6.3084716796875, 6.5693359375, 6.8302001953125, 7.091064453125, 7.3519287109375, 7.61279296875, 7.8736572265625, 8.134521484375, 8.3953857421875, 8.65625]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 4.0, 6.0, 6.0, 9.0, 9.0, 9.0, 8.0, 16.0, 12.0, 17.0, 23.0, 23.0, 33.0, 34.0, 28.0, 28.0, 36.0, 44.0, 37.0, 34.0, 38.0, 41.0, 29.0, 47.0, 34.0, 35.0, 27.0, 35.0, 35.0, 40.0, 26.0, 24.0, 30.0, 15.0, 26.0, 22.0, 15.0, 13.0, 13.0, 9.0, 6.0, 11.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.59375, -9.2940673828125, -8.994384765625, -8.6947021484375, -8.39501953125, -8.0953369140625, -7.795654296875, -7.4959716796875, -7.1962890625, -6.8966064453125, -6.596923828125, -6.2972412109375, -5.99755859375, -5.6978759765625, -5.398193359375, -5.0985107421875, -4.798828125, -4.4991455078125, -4.199462890625, -3.8997802734375, -3.60009765625, -3.3004150390625, -3.000732421875, -2.7010498046875, -2.4013671875, -2.1016845703125, -1.802001953125, -1.5023193359375, -1.20263671875, -0.9029541015625, -0.603271484375, -0.3035888671875, -0.00390625, 0.2957763671875, 0.595458984375, 0.8951416015625, 1.19482421875, 1.4945068359375, 1.794189453125, 2.0938720703125, 2.3935546875, 2.6932373046875, 2.992919921875, 3.2926025390625, 3.59228515625, 3.8919677734375, 4.191650390625, 4.4913330078125, 4.791015625, 5.0906982421875, 5.390380859375, 5.6900634765625, 5.98974609375, 6.2894287109375, 6.589111328125, 6.8887939453125, 7.1884765625, 7.4881591796875, 7.787841796875, 8.0875244140625, 8.38720703125, 8.6868896484375, 8.986572265625, 9.2862548828125, 9.5859375]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 4.0, 8.0, 7.0, 18.0, 34.0, 50.0, 95.0, 169.0, 302.0, 524.0, 814.0, 1572.0, 2503.0, 4215.0, 6793.0, 11221.0, 17746.0, 28461.0, 43962.0, 65571.0, 96943.0, 137298.0, 187169.0, 245832.0, 305945.0, 359379.0, 396531.0, 408785.0, 393248.0, 355215.0, 298827.0, 239920.0, 182346.0, 132295.0, 93486.0, 63602.0, 42353.0, 27202.0, 17025.0, 10692.0, 6538.0, 3920.0, 2306.0, 1373.0, 844.0, 469.0, 285.0, 151.0, 99.0, 76.0, 32.0, 19.0, 13.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.7265625, -8.4490966796875, -8.171630859375, -7.8941650390625, -7.61669921875, -7.3392333984375, -7.061767578125, -6.7843017578125, -6.5068359375, -6.2293701171875, -5.951904296875, -5.6744384765625, -5.39697265625, -5.1195068359375, -4.842041015625, -4.5645751953125, -4.287109375, -4.0096435546875, -3.732177734375, -3.4547119140625, -3.17724609375, -2.8997802734375, -2.622314453125, -2.3448486328125, -2.0673828125, -1.7899169921875, -1.512451171875, -1.2349853515625, -0.95751953125, -0.6800537109375, -0.402587890625, -0.1251220703125, 0.15234375, 0.4298095703125, 0.707275390625, 0.9847412109375, 1.26220703125, 1.5396728515625, 1.817138671875, 2.0946044921875, 2.3720703125, 2.6495361328125, 2.927001953125, 3.2044677734375, 3.48193359375, 3.7593994140625, 4.036865234375, 4.3143310546875, 4.591796875, 4.8692626953125, 5.146728515625, 5.4241943359375, 5.70166015625, 5.9791259765625, 6.256591796875, 6.5340576171875, 6.8115234375, 7.0889892578125, 7.366455078125, 7.6439208984375, 7.92138671875, 8.1988525390625, 8.476318359375, 8.7537841796875, 9.03125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 3.0, 7.0, 9.0, 15.0, 16.0, 12.0, 17.0, 29.0, 33.0, 54.0, 60.0, 64.0, 98.0, 101.0, 117.0, 114.0, 153.0, 149.0, 169.0, 183.0, 189.0, 181.0, 222.0, 220.0, 196.0, 175.0, 187.0, 159.0, 145.0, 158.0, 154.0, 127.0, 81.0, 83.0, 86.0, 69.0, 58.0, 29.0, 23.0, 30.0, 20.0, 20.0, 15.0, 16.0, 10.0, 7.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0], "bins": [-4.765625, -4.62213134765625, -4.4786376953125, -4.33514404296875, -4.191650390625, -4.04815673828125, -3.9046630859375, -3.76116943359375, -3.61767578125, -3.47418212890625, -3.3306884765625, -3.18719482421875, -3.043701171875, -2.90020751953125, -2.7567138671875, -2.61322021484375, -2.4697265625, -2.32623291015625, -2.1827392578125, -2.03924560546875, -1.895751953125, -1.75225830078125, -1.6087646484375, -1.46527099609375, -1.32177734375, -1.17828369140625, -1.0347900390625, -0.89129638671875, -0.747802734375, -0.60430908203125, -0.4608154296875, -0.31732177734375, -0.173828125, -0.03033447265625, 0.1131591796875, 0.25665283203125, 0.400146484375, 0.54364013671875, 0.6871337890625, 0.83062744140625, 0.97412109375, 1.11761474609375, 1.2611083984375, 1.40460205078125, 1.548095703125, 1.69158935546875, 1.8350830078125, 1.97857666015625, 2.1220703125, 2.26556396484375, 2.4090576171875, 2.55255126953125, 2.696044921875, 2.83953857421875, 2.9830322265625, 3.12652587890625, 3.27001953125, 3.41351318359375, 3.5570068359375, 3.70050048828125, 3.843994140625, 3.98748779296875, 4.1309814453125, 4.27447509765625, 4.41796875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 6.0, 10.0, 7.0, 11.0, 15.0, 25.0, 21.0, 21.0, 25.0, 33.0, 33.0, 44.0, 45.0, 46.0, 42.0, 52.0, 50.0, 55.0, 58.0, 46.0, 48.0, 38.0, 35.0, 32.0, 31.0, 30.0, 27.0, 15.0, 19.0, 14.0, 18.0, 14.0, 8.0, 4.0, 5.0, 5.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.280447006225586, -14.832430839538574, -14.384414672851562, -13.936399459838867, -13.488383293151855, -13.040367126464844, -12.592350959777832, -12.14433479309082, -11.696318626403809, -11.248302459716797, -10.800286293029785, -10.352270126342773, -9.904254913330078, -9.456238746643066, -9.008222579956055, -8.560206413269043, -8.112190246582031, -7.6641740798950195, -7.216158390045166, -6.768142223358154, -6.320126056671143, -5.872110366821289, -5.424094200134277, -4.976078033447266, -4.52806282043457, -4.080046653747559, -3.632030725479126, -3.1840147972106934, -2.7359986305236816, -2.287982702255249, -1.8399667739868164, -1.3919506072998047, -0.943934440612793, -0.4959184229373932, -0.04790240526199341, 0.400113582611084, 0.8481296300888062, 1.2961456775665283, 1.744161605834961, 2.1921777725219727, 2.6401937007904053, 3.088209629058838, 3.5362257957458496, 3.9842417240142822, 4.432257652282715, 4.880273818969727, 5.328289985656738, 5.77630615234375, 6.2243218421936035, 6.672338008880615, 7.120353698730469, 7.5683698654174805, 8.016386032104492, 8.464402198791504, 8.912418365478516, 9.360433578491211, 9.808449745178223, 10.256465911865234, 10.704482078552246, 11.152498245239258, 11.600513458251953, 12.048529624938965, 12.496545791625977, 12.944561958312988, 13.392578125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 7.0, 6.0, 8.0, 11.0, 5.0, 11.0, 12.0, 11.0, 12.0, 15.0, 16.0, 22.0, 20.0, 28.0, 29.0, 39.0, 25.0, 29.0, 32.0, 33.0, 34.0, 25.0, 34.0, 37.0, 27.0, 43.0, 36.0, 30.0, 34.0, 31.0, 42.0, 29.0, 33.0, 35.0, 20.0, 28.0, 13.0, 10.0, 13.0, 15.0, 12.0, 11.0, 6.0, 8.0, 7.0, 5.0, 7.0, 5.0, 4.0, 2.0, 2.0], "bins": [-11.690108299255371, -11.369203567504883, -11.048298835754395, -10.727394104003906, -10.406488418579102, -10.085583686828613, -9.764678955078125, -9.443774223327637, -9.122869491577148, -8.80196475982666, -8.481060028076172, -8.160155296325684, -7.839250087738037, -7.518345355987549, -7.197440147399902, -6.876535415649414, -6.555630683898926, -6.2347259521484375, -5.913821220397949, -5.592916011810303, -5.2720112800598145, -4.951106548309326, -4.63020133972168, -4.309296607971191, -3.988391876220703, -3.667487144470215, -3.3465821743011475, -3.02567720413208, -2.704772472381592, -2.3838677406311035, -2.062962770462036, -1.7420578002929688, -1.421152114868164, -1.1002472639083862, -0.7793424129486084, -0.45843756198883057, -0.13753271102905273, 0.1833721399307251, 0.5042769908905029, 0.8251819610595703, 1.1460866928100586, 1.4669915437698364, 1.7878963947296143, 2.1088013648986816, 2.42970609664917, 2.750610828399658, 3.0715157985687256, 3.392420768737793, 3.7133255004882812, 4.0342302322387695, 4.355134963989258, 4.676040172576904, 4.996944904327393, 5.317849636077881, 5.638754844665527, 5.959659576416016, 6.280564308166504, 6.601469039916992, 6.9223737716674805, 7.243278980255127, 7.564183712005615, 7.8850884437561035, 8.20599365234375, 8.526898384094238, 8.847803115844727]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 11.0, 6.0, 9.0, 23.0, 28.0, 50.0, 50.0, 76.0, 105.0, 174.0, 222.0, 372.0, 530.0, 798.0, 1312.0, 2044.0, 3258.0, 5196.0, 8333.0, 13325.0, 22034.0, 35516.0, 58495.0, 94247.0, 143054.0, 178797.0, 165225.0, 119475.0, 75721.0, 45879.0, 28177.0, 17335.0, 10574.0, 6613.0, 4127.0, 2605.0, 1639.0, 1097.0, 656.0, 430.0, 304.0, 199.0, 132.0, 76.0, 53.0, 58.0, 38.0, 23.0, 14.0, 16.0, 10.0, 8.0, 5.0, 5.0, 2.0, 3.0], "bins": [-4.0625, -3.942169189453125, -3.82183837890625, -3.701507568359375, -3.5811767578125, -3.460845947265625, -3.34051513671875, -3.220184326171875, -3.099853515625, -2.979522705078125, -2.85919189453125, -2.738861083984375, -2.6185302734375, -2.498199462890625, -2.37786865234375, -2.257537841796875, -2.13720703125, -2.016876220703125, -1.89654541015625, -1.776214599609375, -1.6558837890625, -1.535552978515625, -1.41522216796875, -1.294891357421875, -1.174560546875, -1.054229736328125, -0.93389892578125, -0.813568115234375, -0.6932373046875, -0.572906494140625, -0.45257568359375, -0.332244873046875, -0.2119140625, -0.091583251953125, 0.02874755859375, 0.149078369140625, 0.2694091796875, 0.389739990234375, 0.51007080078125, 0.630401611328125, 0.750732421875, 0.871063232421875, 0.99139404296875, 1.111724853515625, 1.2320556640625, 1.352386474609375, 1.47271728515625, 1.593048095703125, 1.71337890625, 1.833709716796875, 1.95404052734375, 2.074371337890625, 2.1947021484375, 2.315032958984375, 2.43536376953125, 2.555694580078125, 2.676025390625, 2.796356201171875, 2.91668701171875, 3.037017822265625, 3.1573486328125, 3.277679443359375, 3.39801025390625, 3.518341064453125, 3.638671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 7.0, 7.0, 12.0, 3.0, 14.0, 10.0, 11.0, 14.0, 15.0, 14.0, 21.0, 22.0, 29.0, 29.0, 40.0, 26.0, 24.0, 35.0, 33.0, 34.0, 24.0, 34.0, 39.0, 31.0, 40.0, 34.0, 32.0, 37.0, 26.0, 45.0, 26.0, 36.0, 33.0, 25.0, 23.0, 11.0, 11.0, 13.0, 14.0, 14.0, 8.0, 6.0, 9.0, 7.0, 5.0, 8.0, 3.0, 4.0, 2.0, 2.0], "bins": [-11.6953125, -11.37451171875, -11.0537109375, -10.73291015625, -10.412109375, -10.09130859375, -9.7705078125, -9.44970703125, -9.12890625, -8.80810546875, -8.4873046875, -8.16650390625, -7.845703125, -7.52490234375, -7.2041015625, -6.88330078125, -6.5625, -6.24169921875, -5.9208984375, -5.60009765625, -5.279296875, -4.95849609375, -4.6376953125, -4.31689453125, -3.99609375, -3.67529296875, -3.3544921875, -3.03369140625, -2.712890625, -2.39208984375, -2.0712890625, -1.75048828125, -1.4296875, -1.10888671875, -0.7880859375, -0.46728515625, -0.146484375, 0.17431640625, 0.4951171875, 0.81591796875, 1.13671875, 1.45751953125, 1.7783203125, 2.09912109375, 2.419921875, 2.74072265625, 3.0615234375, 3.38232421875, 3.703125, 4.02392578125, 4.3447265625, 4.66552734375, 4.986328125, 5.30712890625, 5.6279296875, 5.94873046875, 6.26953125, 6.59033203125, 6.9111328125, 7.23193359375, 7.552734375, 7.87353515625, 8.1943359375, 8.51513671875, 8.8359375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 5.0, 5.0, 7.0, 7.0, 18.0, 20.0, 26.0, 43.0, 57.0, 76.0, 92.0, 132.0, 188.0, 248.0, 346.0, 517.0, 739.0, 1016.0, 1612.0, 2494.0, 3705.0, 5958.0, 10004.0, 17169.0, 31081.0, 59297.0, 116529.0, 213080.0, 248031.0, 157518.0, 80559.0, 41597.0, 22604.0, 12604.0, 7533.0, 4612.0, 2995.0, 1950.0, 1245.0, 838.0, 575.0, 404.0, 302.0, 191.0, 129.0, 104.0, 79.0, 52.0, 60.0, 42.0, 29.0, 14.0, 11.0, 8.0, 3.0, 3.0, 2.0, 0.0, 1.0, 3.0], "bins": [-3.552734375, -3.4425048828125, -3.332275390625, -3.2220458984375, -3.11181640625, -3.0015869140625, -2.891357421875, -2.7811279296875, -2.6708984375, -2.5606689453125, -2.450439453125, -2.3402099609375, -2.22998046875, -2.1197509765625, -2.009521484375, -1.8992919921875, -1.7890625, -1.6788330078125, -1.568603515625, -1.4583740234375, -1.34814453125, -1.2379150390625, -1.127685546875, -1.0174560546875, -0.9072265625, -0.7969970703125, -0.686767578125, -0.5765380859375, -0.46630859375, -0.3560791015625, -0.245849609375, -0.1356201171875, -0.025390625, 0.0848388671875, 0.195068359375, 0.3052978515625, 0.41552734375, 0.5257568359375, 0.635986328125, 0.7462158203125, 0.8564453125, 0.9666748046875, 1.076904296875, 1.1871337890625, 1.29736328125, 1.4075927734375, 1.517822265625, 1.6280517578125, 1.73828125, 1.8485107421875, 1.958740234375, 2.0689697265625, 2.17919921875, 2.2894287109375, 2.399658203125, 2.5098876953125, 2.6201171875, 2.7303466796875, 2.840576171875, 2.9508056640625, 3.06103515625, 3.1712646484375, 3.281494140625, 3.3917236328125, 3.501953125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 4.0, 6.0, 6.0, 4.0, 4.0, 8.0, 12.0, 11.0, 20.0, 21.0, 15.0, 18.0, 31.0, 31.0, 18.0, 46.0, 31.0, 36.0, 39.0, 32.0, 37.0, 45.0, 39.0, 38.0, 53.0, 47.0, 34.0, 41.0, 39.0, 30.0, 37.0, 28.0, 26.0, 23.0, 12.0, 22.0, 10.0, 13.0, 12.0, 8.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.5625, -7.32177734375, -7.0810546875, -6.84033203125, -6.599609375, -6.35888671875, -6.1181640625, -5.87744140625, -5.63671875, -5.39599609375, -5.1552734375, -4.91455078125, -4.673828125, -4.43310546875, -4.1923828125, -3.95166015625, -3.7109375, -3.47021484375, -3.2294921875, -2.98876953125, -2.748046875, -2.50732421875, -2.2666015625, -2.02587890625, -1.78515625, -1.54443359375, -1.3037109375, -1.06298828125, -0.822265625, -0.58154296875, -0.3408203125, -0.10009765625, 0.140625, 0.38134765625, 0.6220703125, 0.86279296875, 1.103515625, 1.34423828125, 1.5849609375, 1.82568359375, 2.06640625, 2.30712890625, 2.5478515625, 2.78857421875, 3.029296875, 3.27001953125, 3.5107421875, 3.75146484375, 3.9921875, 4.23291015625, 4.4736328125, 4.71435546875, 4.955078125, 5.19580078125, 5.4365234375, 5.67724609375, 5.91796875, 6.15869140625, 6.3994140625, 6.64013671875, 6.880859375, 7.12158203125, 7.3623046875, 7.60302734375, 7.84375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 5.0, 11.0, 14.0, 20.0, 34.0, 36.0, 49.0, 73.0, 117.0, 180.0, 232.0, 407.0, 555.0, 880.0, 1455.0, 2362.0, 4212.0, 7926.0, 15507.0, 37222.0, 113548.0, 422341.0, 305092.0, 79444.0, 28051.0, 12844.0, 6480.0, 3614.0, 2116.0, 1250.0, 852.0, 566.0, 350.0, 198.0, 149.0, 86.0, 84.0, 51.0, 46.0, 21.0, 17.0, 19.0, 10.0, 12.0, 3.0, 5.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-2.40234375, -2.3292236328125, -2.256103515625, -2.1829833984375, -2.10986328125, -2.0367431640625, -1.963623046875, -1.8905029296875, -1.8173828125, -1.7442626953125, -1.671142578125, -1.5980224609375, -1.52490234375, -1.4517822265625, -1.378662109375, -1.3055419921875, -1.232421875, -1.1593017578125, -1.086181640625, -1.0130615234375, -0.93994140625, -0.8668212890625, -0.793701171875, -0.7205810546875, -0.6474609375, -0.5743408203125, -0.501220703125, -0.4281005859375, -0.35498046875, -0.2818603515625, -0.208740234375, -0.1356201171875, -0.0625, 0.0106201171875, 0.083740234375, 0.1568603515625, 0.22998046875, 0.3031005859375, 0.376220703125, 0.4493408203125, 0.5224609375, 0.5955810546875, 0.668701171875, 0.7418212890625, 0.81494140625, 0.8880615234375, 0.961181640625, 1.0343017578125, 1.107421875, 1.1805419921875, 1.253662109375, 1.3267822265625, 1.39990234375, 1.4730224609375, 1.546142578125, 1.6192626953125, 1.6923828125, 1.7655029296875, 1.838623046875, 1.9117431640625, 1.98486328125, 2.0579833984375, 2.131103515625, 2.2042236328125, 2.27734375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 6.0, 8.0, 8.0, 15.0, 13.0, 23.0, 37.0, 40.0, 30.0, 65.0, 54.0, 71.0, 69.0, 77.0, 87.0, 61.0, 54.0, 55.0, 45.0, 34.0, 31.0, 23.0, 22.0, 13.0, 14.0, 14.0, 8.0, 5.0, 7.0, 7.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002162456512451172, -0.00020839646458625793, -0.00020054727792739868, -0.00019269809126853943, -0.00018484890460968018, -0.00017699971795082092, -0.00016915053129196167, -0.00016130134463310242, -0.00015345215797424316, -0.0001456029713153839, -0.00013775378465652466, -0.0001299045979976654, -0.00012205541133880615, -0.0001142062246799469, -0.00010635703802108765, -9.85078513622284e-05, -9.065866470336914e-05, -8.280947804450989e-05, -7.496029138565063e-05, -6.711110472679138e-05, -5.926191806793213e-05, -5.1412731409072876e-05, -4.356354475021362e-05, -3.571435809135437e-05, -2.7865171432495117e-05, -2.0015984773635864e-05, -1.2166798114776611e-05, -4.317611455917358e-06, 3.5315752029418945e-06, 1.1380761861801147e-05, 1.92299485206604e-05, 2.7079135179519653e-05, 3.4928321838378906e-05, 4.277750849723816e-05, 5.062669515609741e-05, 5.8475881814956665e-05, 6.632506847381592e-05, 7.417425513267517e-05, 8.202344179153442e-05, 8.987262845039368e-05, 9.772181510925293e-05, 0.00010557100176811218, 0.00011342018842697144, 0.00012126937508583069, 0.00012911856174468994, 0.0001369677484035492, 0.00014481693506240845, 0.0001526661217212677, 0.00016051530838012695, 0.0001683644950389862, 0.00017621368169784546, 0.0001840628683567047, 0.00019191205501556396, 0.00019976124167442322, 0.00020761042833328247, 0.00021545961499214172, 0.00022330880165100098, 0.00023115798830986023, 0.00023900717496871948, 0.00024685636162757874, 0.000254705548286438, 0.00026255473494529724, 0.0002704039216041565, 0.00027825310826301575, 0.000286102294921875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 4.0, 3.0, 5.0, 15.0, 15.0, 30.0, 32.0, 39.0, 65.0, 90.0, 155.0, 204.0, 299.0, 405.0, 635.0, 875.0, 1148.0, 1856.0, 2664.0, 3960.0, 5755.0, 8466.0, 12807.0, 19184.0, 29778.0, 45329.0, 69338.0, 103702.0, 148486.0, 171850.0, 139421.0, 95676.0, 63282.0, 41390.0, 27062.0, 17938.0, 11767.0, 7801.0, 5385.0, 3650.0, 2524.0, 1689.0, 1166.0, 837.0, 544.0, 394.0, 265.0, 178.0, 135.0, 85.0, 58.0, 39.0, 28.0, 14.0, 11.0, 13.0, 5.0, 5.0, 4.0, 3.0, 6.0], "bins": [-1.708984375, -1.6562347412109375, -1.603485107421875, -1.5507354736328125, -1.49798583984375, -1.4452362060546875, -1.392486572265625, -1.3397369384765625, -1.2869873046875, -1.2342376708984375, -1.181488037109375, -1.1287384033203125, -1.07598876953125, -1.0232391357421875, -0.970489501953125, -0.9177398681640625, -0.864990234375, -0.8122406005859375, -0.759490966796875, -0.7067413330078125, -0.65399169921875, -0.6012420654296875, -0.548492431640625, -0.4957427978515625, -0.4429931640625, -0.3902435302734375, -0.337493896484375, -0.2847442626953125, -0.23199462890625, -0.1792449951171875, -0.126495361328125, -0.0737457275390625, -0.02099609375, 0.0317535400390625, 0.084503173828125, 0.1372528076171875, 0.19000244140625, 0.2427520751953125, 0.295501708984375, 0.3482513427734375, 0.4010009765625, 0.4537506103515625, 0.506500244140625, 0.5592498779296875, 0.61199951171875, 0.6647491455078125, 0.717498779296875, 0.7702484130859375, 0.822998046875, 0.8757476806640625, 0.928497314453125, 0.9812469482421875, 1.03399658203125, 1.0867462158203125, 1.139495849609375, 1.1922454833984375, 1.2449951171875, 1.2977447509765625, 1.350494384765625, 1.4032440185546875, 1.45599365234375, 1.5087432861328125, 1.561492919921875, 1.6142425537109375, 1.6669921875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 2.0, 5.0, 1.0, 4.0, 12.0, 17.0, 13.0, 12.0, 14.0, 20.0, 17.0, 18.0, 34.0, 26.0, 50.0, 33.0, 31.0, 44.0, 47.0, 54.0, 66.0, 69.0, 53.0, 43.0, 51.0, 37.0, 30.0, 33.0, 28.0, 17.0, 11.0, 13.0, 16.0, 10.0, 9.0, 14.0, 12.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.7548828125, -0.7310409545898438, -0.7071990966796875, -0.6833572387695312, -0.659515380859375, -0.6356735229492188, -0.6118316650390625, -0.5879898071289062, -0.56414794921875, -0.5403060913085938, -0.5164642333984375, -0.49262237548828125, -0.468780517578125, -0.44493865966796875, -0.4210968017578125, -0.39725494384765625, -0.3734130859375, -0.34957122802734375, -0.3257293701171875, -0.30188751220703125, -0.278045654296875, -0.25420379638671875, -0.2303619384765625, -0.20652008056640625, -0.18267822265625, -0.15883636474609375, -0.1349945068359375, -0.11115264892578125, -0.087310791015625, -0.06346893310546875, -0.0396270751953125, -0.01578521728515625, 0.008056640625, 0.03189849853515625, 0.0557403564453125, 0.07958221435546875, 0.103424072265625, 0.12726593017578125, 0.1511077880859375, 0.17494964599609375, 0.19879150390625, 0.22263336181640625, 0.2464752197265625, 0.27031707763671875, 0.294158935546875, 0.31800079345703125, 0.3418426513671875, 0.36568450927734375, 0.3895263671875, 0.41336822509765625, 0.4372100830078125, 0.46105194091796875, 0.484893798828125, 0.5087356567382812, 0.5325775146484375, 0.5564193725585938, 0.58026123046875, 0.6041030883789062, 0.6279449462890625, 0.6517868041992188, 0.675628662109375, 0.6994705200195312, 0.7233123779296875, 0.7471542358398438, 0.77099609375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 5.0, 3.0, 7.0, 8.0, 8.0, 3.0, 17.0, 25.0, 22.0, 17.0, 22.0, 26.0, 39.0, 31.0, 47.0, 46.0, 49.0, 42.0, 49.0, 52.0, 59.0, 44.0, 49.0, 51.0, 30.0, 40.0, 36.0, 31.0, 28.0, 17.0, 21.0, 16.0, 14.0, 15.0, 11.0, 4.0, 8.0, 4.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.547548294067383, -15.099172592163086, -14.650796890258789, -14.202422142028809, -13.754046440124512, -13.305670738220215, -12.857295989990234, -12.408920288085938, -11.96054458618164, -11.512168884277344, -11.063793182373047, -10.615418434143066, -10.16704273223877, -9.718667030334473, -9.270292282104492, -8.821916580200195, -8.373540878295898, -7.925165176391602, -7.476789951324463, -7.028414726257324, -6.580039024353027, -6.1316633224487305, -5.683288097381592, -5.234912872314453, -4.786537170410156, -4.338161468505859, -3.8897862434387207, -3.441410779953003, -2.993035316467285, -2.5446598529815674, -2.0962843894958496, -1.6479089260101318, -1.199533462524414, -0.7511579990386963, -0.3027825355529785, 0.14559292793273926, 0.593968391418457, 1.0423438549041748, 1.4907193183898926, 1.9390947818756104, 2.387470245361328, 2.835845708847046, 3.2842211723327637, 3.7325966358184814, 4.180972099304199, 4.629347801208496, 5.077723026275635, 5.526098251342773, 5.97447395324707, 6.422849655151367, 6.871224880218506, 7.3196001052856445, 7.767975807189941, 8.216351509094238, 8.664726257324219, 9.113101959228516, 9.561477661132812, 10.00985336303711, 10.458229064941406, 10.906603813171387, 11.354979515075684, 11.80335521697998, 12.251729965209961, 12.700105667114258, 13.148481369018555]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 7.0, 7.0, 10.0, 6.0, 9.0, 9.0, 15.0, 8.0, 13.0, 23.0, 17.0, 14.0, 24.0, 30.0, 42.0, 27.0, 28.0, 24.0, 33.0, 40.0, 24.0, 31.0, 37.0, 33.0, 40.0, 42.0, 20.0, 33.0, 36.0, 32.0, 34.0, 33.0, 35.0, 31.0, 27.0, 20.0, 14.0, 10.0, 14.0, 13.0, 6.0, 14.0, 4.0, 9.0, 9.0, 4.0, 6.0, 4.0, 1.0, 3.0, 2.0], "bins": [-11.63754940032959, -11.315777778625488, -10.994006156921387, -10.672233581542969, -10.350461959838867, -10.028690338134766, -9.706918716430664, -9.385147094726562, -9.063375473022461, -8.74160385131836, -8.419832229614258, -8.09805965423584, -7.776288032531738, -7.454516410827637, -7.132744789123535, -6.810973167419434, -6.489200592041016, -6.167428970336914, -5.845656871795654, -5.523885250091553, -5.202113151550293, -4.880341529846191, -4.55856990814209, -4.236798286437988, -3.9150261878967285, -3.593254327774048, -3.271482467651367, -2.9497108459472656, -2.627938985824585, -2.3061671257019043, -1.9843953847885132, -1.662623643875122, -1.340850830078125, -1.0190789699554443, -0.6973072290420532, -0.37553542852401733, -0.053763628005981445, 0.2680082321166992, 0.5897799730300903, 0.9115517139434814, 1.233323574066162, 1.5550954341888428, 1.8768671751022339, 2.198638916015625, 2.5204107761383057, 2.8421826362609863, 3.163954257965088, 3.4857261180877686, 3.807497978210449, 4.129269599914551, 4.4510416984558105, 4.772813320159912, 5.094585418701172, 5.416357040405273, 5.738128662109375, 6.059900283813477, 6.381672382354736, 6.703444004058838, 7.025216102600098, 7.346987724304199, 7.668759346008301, 7.9905314445495605, 8.31230354309082, 8.634075164794922, 8.955846786499023]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 5.0, 12.0, 16.0, 14.0, 34.0, 50.0, 79.0, 109.0, 164.0, 276.0, 474.0, 636.0, 970.0, 1432.0, 2189.0, 3241.0, 4881.0, 7091.0, 10283.0, 14449.0, 20225.0, 27292.0, 36390.0, 46029.0, 57780.0, 67315.0, 77341.0, 84110.0, 87169.0, 85750.0, 80476.0, 71862.0, 61787.0, 50600.0, 39861.0, 30838.0, 22800.0, 16854.0, 11941.0, 8357.0, 5745.0, 3904.0, 2587.0, 1750.0, 1206.0, 766.0, 482.0, 307.0, 217.0, 156.0, 113.0, 68.0, 28.0, 27.0, 9.0, 6.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-7.66796875, -7.40985107421875, -7.1517333984375, -6.89361572265625, -6.635498046875, -6.37738037109375, -6.1192626953125, -5.86114501953125, -5.60302734375, -5.34490966796875, -5.0867919921875, -4.82867431640625, -4.570556640625, -4.31243896484375, -4.0543212890625, -3.79620361328125, -3.5380859375, -3.27996826171875, -3.0218505859375, -2.76373291015625, -2.505615234375, -2.24749755859375, -1.9893798828125, -1.73126220703125, -1.47314453125, -1.21502685546875, -0.9569091796875, -0.69879150390625, -0.440673828125, -0.18255615234375, 0.0755615234375, 0.33367919921875, 0.591796875, 0.84991455078125, 1.1080322265625, 1.36614990234375, 1.624267578125, 1.88238525390625, 2.1405029296875, 2.39862060546875, 2.65673828125, 2.91485595703125, 3.1729736328125, 3.43109130859375, 3.689208984375, 3.94732666015625, 4.2054443359375, 4.46356201171875, 4.7216796875, 4.97979736328125, 5.2379150390625, 5.49603271484375, 5.754150390625, 6.01226806640625, 6.2703857421875, 6.52850341796875, 6.78662109375, 7.04473876953125, 7.3028564453125, 7.56097412109375, 7.819091796875, 8.07720947265625, 8.3353271484375, 8.59344482421875, 8.8515625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 8.0, 6.0, 8.0, 5.0, 9.0, 8.0, 15.0, 11.0, 12.0, 22.0, 15.0, 16.0, 27.0, 26.0, 37.0, 37.0, 23.0, 28.0, 26.0, 40.0, 25.0, 33.0, 41.0, 31.0, 31.0, 42.0, 25.0, 31.0, 40.0, 31.0, 33.0, 32.0, 41.0, 28.0, 24.0, 23.0, 14.0, 12.0, 14.0, 11.0, 9.0, 13.0, 5.0, 7.0, 9.0, 5.0, 7.0, 4.0, 1.0, 2.0, 3.0], "bins": [-11.21875, -10.9093017578125, -10.599853515625, -10.2904052734375, -9.98095703125, -9.6715087890625, -9.362060546875, -9.0526123046875, -8.7431640625, -8.4337158203125, -8.124267578125, -7.8148193359375, -7.50537109375, -7.1959228515625, -6.886474609375, -6.5770263671875, -6.267578125, -5.9581298828125, -5.648681640625, -5.3392333984375, -5.02978515625, -4.7203369140625, -4.410888671875, -4.1014404296875, -3.7919921875, -3.4825439453125, -3.173095703125, -2.8636474609375, -2.55419921875, -2.2447509765625, -1.935302734375, -1.6258544921875, -1.31640625, -1.0069580078125, -0.697509765625, -0.3880615234375, -0.07861328125, 0.2308349609375, 0.540283203125, 0.8497314453125, 1.1591796875, 1.4686279296875, 1.778076171875, 2.0875244140625, 2.39697265625, 2.7064208984375, 3.015869140625, 3.3253173828125, 3.634765625, 3.9442138671875, 4.253662109375, 4.5631103515625, 4.87255859375, 5.1820068359375, 5.491455078125, 5.8009033203125, 6.1103515625, 6.4197998046875, 6.729248046875, 7.0386962890625, 7.34814453125, 7.6575927734375, 7.967041015625, 8.2764892578125, 8.5859375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 9.0, 13.0, 13.0, 24.0, 32.0, 65.0, 93.0, 143.0, 298.0, 461.0, 850.0, 1426.0, 2416.0, 4321.0, 7309.0, 12113.0, 20103.0, 31601.0, 47641.0, 68043.0, 90507.0, 110100.0, 122295.0, 122337.0, 111567.0, 91858.0, 69161.0, 49258.0, 32783.0, 20855.0, 12680.0, 7653.0, 4394.0, 2552.0, 1463.0, 848.0, 496.0, 304.0, 169.0, 114.0, 53.0, 54.0, 32.0, 14.0, 11.0, 9.0, 5.0, 2.0, 6.0], "bins": [-13.609375, -13.2515869140625, -12.893798828125, -12.5360107421875, -12.17822265625, -11.8204345703125, -11.462646484375, -11.1048583984375, -10.7470703125, -10.3892822265625, -10.031494140625, -9.6737060546875, -9.31591796875, -8.9581298828125, -8.600341796875, -8.2425537109375, -7.884765625, -7.5269775390625, -7.169189453125, -6.8114013671875, -6.45361328125, -6.0958251953125, -5.738037109375, -5.3802490234375, -5.0224609375, -4.6646728515625, -4.306884765625, -3.9490966796875, -3.59130859375, -3.2335205078125, -2.875732421875, -2.5179443359375, -2.16015625, -1.8023681640625, -1.444580078125, -1.0867919921875, -0.72900390625, -0.3712158203125, -0.013427734375, 0.3443603515625, 0.7021484375, 1.0599365234375, 1.417724609375, 1.7755126953125, 2.13330078125, 2.4910888671875, 2.848876953125, 3.2066650390625, 3.564453125, 3.9222412109375, 4.280029296875, 4.6378173828125, 4.99560546875, 5.3533935546875, 5.711181640625, 6.0689697265625, 6.4267578125, 6.7845458984375, 7.142333984375, 7.5001220703125, 7.85791015625, 8.2156982421875, 8.573486328125, 8.9312744140625, 9.2890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 2.0, 3.0, 8.0, 4.0, 6.0, 10.0, 15.0, 9.0, 17.0, 20.0, 17.0, 29.0, 25.0, 18.0, 41.0, 42.0, 34.0, 35.0, 29.0, 43.0, 43.0, 51.0, 28.0, 46.0, 41.0, 38.0, 34.0, 42.0, 32.0, 34.0, 31.0, 32.0, 19.0, 29.0, 20.0, 14.0, 12.0, 14.0, 4.0, 8.0, 9.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 3.0], "bins": [-8.3125, -8.0875244140625, -7.862548828125, -7.6375732421875, -7.41259765625, -7.1876220703125, -6.962646484375, -6.7376708984375, -6.5126953125, -6.2877197265625, -6.062744140625, -5.8377685546875, -5.61279296875, -5.3878173828125, -5.162841796875, -4.9378662109375, -4.712890625, -4.4879150390625, -4.262939453125, -4.0379638671875, -3.81298828125, -3.5880126953125, -3.363037109375, -3.1380615234375, -2.9130859375, -2.6881103515625, -2.463134765625, -2.2381591796875, -2.01318359375, -1.7882080078125, -1.563232421875, -1.3382568359375, -1.11328125, -0.8883056640625, -0.663330078125, -0.4383544921875, -0.21337890625, 0.0115966796875, 0.236572265625, 0.4615478515625, 0.6865234375, 0.9114990234375, 1.136474609375, 1.3614501953125, 1.58642578125, 1.8114013671875, 2.036376953125, 2.2613525390625, 2.486328125, 2.7113037109375, 2.936279296875, 3.1612548828125, 3.38623046875, 3.6112060546875, 3.836181640625, 4.0611572265625, 4.2861328125, 4.5111083984375, 4.736083984375, 4.9610595703125, 5.18603515625, 5.4110107421875, 5.635986328125, 5.8609619140625, 6.0859375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 12.0, 13.0, 21.0, 27.0, 43.0, 54.0, 94.0, 115.0, 176.0, 309.0, 532.0, 864.0, 1565.0, 2766.0, 5309.0, 10258.0, 20421.0, 39023.0, 71453.0, 117972.0, 165025.0, 184389.0, 163132.0, 115609.0, 69645.0, 37982.0, 19562.0, 10376.0, 5253.0, 2778.0, 1437.0, 874.0, 551.0, 326.0, 199.0, 146.0, 93.0, 56.0, 27.0, 16.0, 22.0, 13.0, 8.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-7.80859375, -7.59454345703125, -7.3804931640625, -7.16644287109375, -6.952392578125, -6.73834228515625, -6.5242919921875, -6.31024169921875, -6.09619140625, -5.88214111328125, -5.6680908203125, -5.45404052734375, -5.239990234375, -5.02593994140625, -4.8118896484375, -4.59783935546875, -4.3837890625, -4.16973876953125, -3.9556884765625, -3.74163818359375, -3.527587890625, -3.31353759765625, -3.0994873046875, -2.88543701171875, -2.67138671875, -2.45733642578125, -2.2432861328125, -2.02923583984375, -1.815185546875, -1.60113525390625, -1.3870849609375, -1.17303466796875, -0.958984375, -0.74493408203125, -0.5308837890625, -0.31683349609375, -0.102783203125, 0.11126708984375, 0.3253173828125, 0.53936767578125, 0.75341796875, 0.96746826171875, 1.1815185546875, 1.39556884765625, 1.609619140625, 1.82366943359375, 2.0377197265625, 2.25177001953125, 2.4658203125, 2.67987060546875, 2.8939208984375, 3.10797119140625, 3.322021484375, 3.53607177734375, 3.7501220703125, 3.96417236328125, 4.17822265625, 4.39227294921875, 4.6063232421875, 4.82037353515625, 5.034423828125, 5.24847412109375, 5.4625244140625, 5.67657470703125, 5.890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 5.0, 5.0, 7.0, 7.0, 16.0, 24.0, 12.0, 19.0, 27.0, 32.0, 46.0, 45.0, 38.0, 49.0, 62.0, 64.0, 60.0, 59.0, 70.0, 61.0, 60.0, 41.0, 37.0, 35.0, 24.0, 22.0, 17.0, 10.0, 9.0, 8.0, 4.0, 5.0, 5.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006856918334960938, -0.0006635934114456177, -0.0006414949893951416, -0.0006193965673446655, -0.0005972981452941895, -0.0005751997232437134, -0.0005531013011932373, -0.0005310028791427612, -0.0005089044570922852, -0.0004868060350418091, -0.000464707612991333, -0.00044260919094085693, -0.00042051076889038086, -0.0003984123468399048, -0.0003763139247894287, -0.00035421550273895264, -0.00033211708068847656, -0.0003100186586380005, -0.0002879202365875244, -0.00026582181453704834, -0.00024372339248657227, -0.0002216249704360962, -0.00019952654838562012, -0.00017742812633514404, -0.00015532970428466797, -0.0001332312822341919, -0.00011113286018371582, -8.903443813323975e-05, -6.693601608276367e-05, -4.48375940322876e-05, -2.2739171981811523e-05, -6.407499313354492e-07, 2.1457672119140625e-05, 4.35560941696167e-05, 6.565451622009277e-05, 8.775293827056885e-05, 0.00010985136032104492, 0.000131949782371521, 0.00015404820442199707, 0.00017614662647247314, 0.00019824504852294922, 0.0002203434705734253, 0.00024244189262390137, 0.00026454031467437744, 0.0002866387367248535, 0.0003087371587753296, 0.00033083558082580566, 0.00035293400287628174, 0.0003750324249267578, 0.0003971308469772339, 0.00041922926902770996, 0.00044132769107818604, 0.0004634261131286621, 0.0004855245351791382, 0.0005076229572296143, 0.0005297213792800903, 0.0005518198013305664, 0.0005739182233810425, 0.0005960166454315186, 0.0006181150674819946, 0.0006402134895324707, 0.0006623119115829468, 0.0006844103336334229, 0.0007065087556838989, 0.000728607177734375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 8.0, 5.0, 7.0, 10.0, 11.0, 23.0, 28.0, 59.0, 61.0, 98.0, 138.0, 223.0, 363.0, 509.0, 742.0, 1129.0, 1762.0, 2819.0, 4458.0, 6702.0, 10791.0, 16812.0, 26482.0, 40100.0, 59050.0, 83024.0, 106454.0, 124956.0, 129607.0, 118818.0, 97089.0, 72197.0, 49910.0, 33797.0, 21615.0, 13901.0, 8762.0, 5801.0, 3581.0, 2274.0, 1482.0, 1022.0, 629.0, 389.0, 309.0, 176.0, 126.0, 88.0, 47.0, 49.0, 23.0, 20.0, 11.0, 8.0, 5.0, 2.0, 6.0, 1.0, 1.0, 1.0], "bins": [-5.53125, -5.35992431640625, -5.1885986328125, -5.01727294921875, -4.845947265625, -4.67462158203125, -4.5032958984375, -4.33197021484375, -4.16064453125, -3.98931884765625, -3.8179931640625, -3.64666748046875, -3.475341796875, -3.30401611328125, -3.1326904296875, -2.96136474609375, -2.7900390625, -2.61871337890625, -2.4473876953125, -2.27606201171875, -2.104736328125, -1.93341064453125, -1.7620849609375, -1.59075927734375, -1.41943359375, -1.24810791015625, -1.0767822265625, -0.90545654296875, -0.734130859375, -0.56280517578125, -0.3914794921875, -0.22015380859375, -0.048828125, 0.12249755859375, 0.2938232421875, 0.46514892578125, 0.636474609375, 0.80780029296875, 0.9791259765625, 1.15045166015625, 1.32177734375, 1.49310302734375, 1.6644287109375, 1.83575439453125, 2.007080078125, 2.17840576171875, 2.3497314453125, 2.52105712890625, 2.6923828125, 2.86370849609375, 3.0350341796875, 3.20635986328125, 3.377685546875, 3.54901123046875, 3.7203369140625, 3.89166259765625, 4.06298828125, 4.23431396484375, 4.4056396484375, 4.57696533203125, 4.748291015625, 4.91961669921875, 5.0909423828125, 5.26226806640625, 5.43359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 3.0, 3.0, 7.0, 2.0, 6.0, 10.0, 7.0, 8.0, 10.0, 12.0, 16.0, 15.0, 21.0, 26.0, 20.0, 29.0, 36.0, 34.0, 43.0, 35.0, 39.0, 51.0, 33.0, 61.0, 39.0, 36.0, 47.0, 51.0, 27.0, 31.0, 32.0, 31.0, 21.0, 21.0, 16.0, 20.0, 19.0, 20.0, 17.0, 10.0, 4.0, 7.0, 5.0, 5.0, 4.0, 7.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0], "bins": [-1.9287109375, -1.8708648681640625, -1.813018798828125, -1.7551727294921875, -1.69732666015625, -1.6394805908203125, -1.581634521484375, -1.5237884521484375, -1.4659423828125, -1.4080963134765625, -1.350250244140625, -1.2924041748046875, -1.23455810546875, -1.1767120361328125, -1.118865966796875, -1.0610198974609375, -1.003173828125, -0.9453277587890625, -0.887481689453125, -0.8296356201171875, -0.77178955078125, -0.7139434814453125, -0.656097412109375, -0.5982513427734375, -0.5404052734375, -0.4825592041015625, -0.424713134765625, -0.3668670654296875, -0.30902099609375, -0.2511749267578125, -0.193328857421875, -0.1354827880859375, -0.07763671875, -0.0197906494140625, 0.038055419921875, 0.0959014892578125, 0.15374755859375, 0.2115936279296875, 0.269439697265625, 0.3272857666015625, 0.3851318359375, 0.4429779052734375, 0.500823974609375, 0.5586700439453125, 0.61651611328125, 0.6743621826171875, 0.732208251953125, 0.7900543212890625, 0.847900390625, 0.9057464599609375, 0.963592529296875, 1.0214385986328125, 1.07928466796875, 1.1371307373046875, 1.194976806640625, 1.2528228759765625, 1.3106689453125, 1.3685150146484375, 1.426361083984375, 1.4842071533203125, 1.54205322265625, 1.5998992919921875, 1.657745361328125, 1.7155914306640625, 1.7734375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 4.0, 2.0, 8.0, 9.0, 9.0, 5.0, 10.0, 10.0, 15.0, 9.0, 27.0, 24.0, 22.0, 18.0, 29.0, 32.0, 42.0, 51.0, 45.0, 52.0, 46.0, 43.0, 47.0, 46.0, 34.0, 40.0, 26.0, 48.0, 31.0, 39.0, 26.0, 29.0, 15.0, 27.0, 18.0, 11.0, 13.0, 6.0, 8.0, 7.0, 6.0, 7.0, 4.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-13.942811965942383, -13.54409122467041, -13.145371437072754, -12.746650695800781, -12.347929954528809, -11.949209213256836, -11.55048942565918, -11.151768684387207, -10.753047943115234, -10.354327201843262, -9.955607414245605, -9.556886672973633, -9.15816593170166, -8.759445190429688, -8.360725402832031, -7.962004661560059, -7.563284873962402, -7.164564609527588, -6.765843868255615, -6.367123603820801, -5.968402862548828, -5.569682598114014, -5.170962333679199, -4.772241592407227, -4.373521327972412, -3.9748008251190186, -3.576080322265625, -3.1773600578308105, -2.778639554977417, -2.3799190521240234, -1.981198787689209, -1.5824782848358154, -1.1837568283081055, -0.7850363850593567, -0.3863159418106079, 0.012404441833496094, 0.41112494468688965, 0.8098454475402832, 1.2085657119750977, 1.6072862148284912, 2.0060067176818848, 2.4047272205352783, 2.803447723388672, 3.2021679878234863, 3.60088849067688, 3.9996089935302734, 4.398329257965088, 4.797049522399902, 5.195770263671875, 5.5944905281066895, 5.993211269378662, 6.391931533813477, 6.790652275085449, 7.189372539520264, 7.588092803955078, 7.986813545227051, 8.385534286499023, 8.784255027770996, 9.182974815368652, 9.581695556640625, 9.980416297912598, 10.37913703918457, 10.777856826782227, 11.1765775680542, 11.575297355651855]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 8.0, 10.0, 3.0, 7.0, 12.0, 11.0, 6.0, 12.0, 17.0, 17.0, 17.0, 17.0, 25.0, 20.0, 24.0, 28.0, 16.0, 28.0, 46.0, 24.0, 29.0, 30.0, 39.0, 40.0, 44.0, 33.0, 31.0, 24.0, 26.0, 25.0, 20.0, 38.0, 31.0, 30.0, 35.0, 20.0, 31.0, 18.0, 22.0, 10.0, 12.0, 8.0, 6.0, 11.0, 11.0, 7.0, 7.0, 7.0, 2.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-10.214995384216309, -9.906293869018555, -9.597591400146484, -9.28888988494873, -8.98018741607666, -8.671485900878906, -8.362783432006836, -8.054081916809082, -7.74537992477417, -7.436677932739258, -7.127975940704346, -6.819273948669434, -6.51057243347168, -6.201869964599609, -5.8931684494018555, -5.584466457366943, -5.275764465332031, -4.967062473297119, -4.658360481262207, -4.349658489227295, -4.040956497192383, -3.73225474357605, -3.423552989959717, -3.1148509979248047, -2.8061490058898926, -2.4974470138549805, -2.1887450218200684, -1.8800432682037354, -1.5713412761688232, -1.2626392841339111, -0.9539374113082886, -0.645235538482666, -0.3365345001220703, -0.02783256769180298, 0.28086936473846436, 0.5895712971687317, 0.898273229598999, 1.2069752216339111, 1.5156770944595337, 1.8243789672851562, 2.1330809593200684, 2.4417829513549805, 2.7504849433898926, 3.0591866970062256, 3.3678886890411377, 3.67659068107605, 3.985292434692383, 4.293994426727295, 4.602696418762207, 4.911398410797119, 5.220100402832031, 5.528802394866943, 5.8375043869018555, 6.146205902099609, 6.4549078941345215, 6.763609886169434, 7.072311878204346, 7.381013870239258, 7.68971586227417, 7.998417854309082, 8.307119369506836, 8.615821838378906, 8.92452335357666, 9.233224868774414, 9.541927337646484]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 9.0, 21.0, 28.0, 49.0, 59.0, 154.0, 254.0, 427.0, 778.0, 1246.0, 2187.0, 3845.0, 6276.0, 10738.0, 17717.0, 28195.0, 45138.0, 70142.0, 105760.0, 154829.0, 217493.0, 291598.0, 366549.0, 426273.0, 457295.0, 446686.0, 399882.0, 330822.0, 255842.0, 186985.0, 129987.0, 86884.0, 56944.0, 36095.0, 22446.0, 13849.0, 8414.0, 5093.0, 3006.0, 1731.0, 1082.0, 667.0, 354.0, 203.0, 115.0, 57.0, 31.0, 29.0, 14.0, 7.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-9.3984375, -9.111572265625, -8.82470703125, -8.537841796875, -8.2509765625, -7.964111328125, -7.67724609375, -7.390380859375, -7.103515625, -6.816650390625, -6.52978515625, -6.242919921875, -5.9560546875, -5.669189453125, -5.38232421875, -5.095458984375, -4.80859375, -4.521728515625, -4.23486328125, -3.947998046875, -3.6611328125, -3.374267578125, -3.08740234375, -2.800537109375, -2.513671875, -2.226806640625, -1.93994140625, -1.653076171875, -1.3662109375, -1.079345703125, -0.79248046875, -0.505615234375, -0.21875, 0.068115234375, 0.35498046875, 0.641845703125, 0.9287109375, 1.215576171875, 1.50244140625, 1.789306640625, 2.076171875, 2.363037109375, 2.64990234375, 2.936767578125, 3.2236328125, 3.510498046875, 3.79736328125, 4.084228515625, 4.37109375, 4.657958984375, 4.94482421875, 5.231689453125, 5.5185546875, 5.805419921875, 6.09228515625, 6.379150390625, 6.666015625, 6.952880859375, 7.23974609375, 7.526611328125, 7.8134765625, 8.100341796875, 8.38720703125, 8.674072265625, 8.9609375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 7.0, 5.0, 6.0, 10.0, 8.0, 8.0, 10.0, 10.0, 13.0, 18.0, 18.0, 14.0, 23.0, 26.0, 22.0, 21.0, 27.0, 31.0, 33.0, 23.0, 32.0, 38.0, 30.0, 40.0, 33.0, 45.0, 28.0, 34.0, 29.0, 25.0, 16.0, 32.0, 29.0, 36.0, 33.0, 26.0, 29.0, 26.0, 13.0, 15.0, 14.0, 8.0, 7.0, 13.0, 7.0, 8.0, 6.0, 7.0, 4.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.8046875, -8.53564453125, -8.2666015625, -7.99755859375, -7.728515625, -7.45947265625, -7.1904296875, -6.92138671875, -6.65234375, -6.38330078125, -6.1142578125, -5.84521484375, -5.576171875, -5.30712890625, -5.0380859375, -4.76904296875, -4.5, -4.23095703125, -3.9619140625, -3.69287109375, -3.423828125, -3.15478515625, -2.8857421875, -2.61669921875, -2.34765625, -2.07861328125, -1.8095703125, -1.54052734375, -1.271484375, -1.00244140625, -0.7333984375, -0.46435546875, -0.1953125, 0.07373046875, 0.3427734375, 0.61181640625, 0.880859375, 1.14990234375, 1.4189453125, 1.68798828125, 1.95703125, 2.22607421875, 2.4951171875, 2.76416015625, 3.033203125, 3.30224609375, 3.5712890625, 3.84033203125, 4.109375, 4.37841796875, 4.6474609375, 4.91650390625, 5.185546875, 5.45458984375, 5.7236328125, 5.99267578125, 6.26171875, 6.53076171875, 6.7998046875, 7.06884765625, 7.337890625, 7.60693359375, 7.8759765625, 8.14501953125, 8.4140625]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 4.0, 6.0, 7.0, 16.0, 30.0, 42.0, 74.0, 115.0, 235.0, 374.0, 641.0, 1128.0, 1837.0, 3228.0, 5130.0, 8262.0, 13733.0, 21282.0, 32540.0, 48994.0, 72767.0, 104514.0, 143638.0, 192250.0, 244760.0, 298619.0, 344450.0, 376524.0, 386966.0, 375167.0, 343233.0, 295511.0, 241415.0, 188709.0, 140264.0, 101830.0, 71260.0, 48502.0, 31634.0, 20505.0, 12949.0, 8391.0, 5121.0, 3014.0, 1863.0, 1177.0, 663.0, 395.0, 226.0, 120.0, 77.0, 44.0, 23.0, 15.0, 8.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-8.578125, -8.3055419921875, -8.032958984375, -7.7603759765625, -7.48779296875, -7.2152099609375, -6.942626953125, -6.6700439453125, -6.3974609375, -6.1248779296875, -5.852294921875, -5.5797119140625, -5.30712890625, -5.0345458984375, -4.761962890625, -4.4893798828125, -4.216796875, -3.9442138671875, -3.671630859375, -3.3990478515625, -3.12646484375, -2.8538818359375, -2.581298828125, -2.3087158203125, -2.0361328125, -1.7635498046875, -1.490966796875, -1.2183837890625, -0.94580078125, -0.6732177734375, -0.400634765625, -0.1280517578125, 0.14453125, 0.4171142578125, 0.689697265625, 0.9622802734375, 1.23486328125, 1.5074462890625, 1.780029296875, 2.0526123046875, 2.3251953125, 2.5977783203125, 2.870361328125, 3.1429443359375, 3.41552734375, 3.6881103515625, 3.960693359375, 4.2332763671875, 4.505859375, 4.7784423828125, 5.051025390625, 5.3236083984375, 5.59619140625, 5.8687744140625, 6.141357421875, 6.4139404296875, 6.6865234375, 6.9591064453125, 7.231689453125, 7.5042724609375, 7.77685546875, 8.0494384765625, 8.322021484375, 8.5946044921875, 8.8671875]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 9.0, 8.0, 14.0, 8.0, 17.0, 20.0, 30.0, 44.0, 53.0, 48.0, 68.0, 71.0, 98.0, 98.0, 125.0, 148.0, 181.0, 180.0, 197.0, 194.0, 230.0, 214.0, 189.0, 215.0, 188.0, 183.0, 196.0, 156.0, 160.0, 141.0, 130.0, 90.0, 73.0, 63.0, 46.0, 45.0, 41.0, 34.0, 24.0, 11.0, 12.0, 11.0, 3.0, 0.0, 2.0, 7.0, 1.0, 3.0, 1.0], "bins": [-5.765625, -5.6092529296875, -5.452880859375, -5.2965087890625, -5.14013671875, -4.9837646484375, -4.827392578125, -4.6710205078125, -4.5146484375, -4.3582763671875, -4.201904296875, -4.0455322265625, -3.88916015625, -3.7327880859375, -3.576416015625, -3.4200439453125, -3.263671875, -3.1072998046875, -2.950927734375, -2.7945556640625, -2.63818359375, -2.4818115234375, -2.325439453125, -2.1690673828125, -2.0126953125, -1.8563232421875, -1.699951171875, -1.5435791015625, -1.38720703125, -1.2308349609375, -1.074462890625, -0.9180908203125, -0.76171875, -0.6053466796875, -0.448974609375, -0.2926025390625, -0.13623046875, 0.0201416015625, 0.176513671875, 0.3328857421875, 0.4892578125, 0.6456298828125, 0.802001953125, 0.9583740234375, 1.11474609375, 1.2711181640625, 1.427490234375, 1.5838623046875, 1.740234375, 1.8966064453125, 2.052978515625, 2.2093505859375, 2.36572265625, 2.5220947265625, 2.678466796875, 2.8348388671875, 2.9912109375, 3.1475830078125, 3.303955078125, 3.4603271484375, 3.61669921875, 3.7730712890625, 3.929443359375, 4.0858154296875, 4.2421875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 8.0, 4.0, 7.0, 3.0, 12.0, 14.0, 19.0, 16.0, 16.0, 22.0, 22.0, 24.0, 26.0, 33.0, 27.0, 34.0, 30.0, 36.0, 40.0, 40.0, 36.0, 49.0, 30.0, 41.0, 38.0, 38.0, 45.0, 31.0, 32.0, 32.0, 34.0, 16.0, 32.0, 24.0, 14.0, 9.0, 11.0, 12.0, 7.0, 9.0, 8.0, 7.0, 3.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.58362865447998, -10.225683212280273, -9.86773681640625, -9.509790420532227, -9.15184497833252, -8.793899536132812, -8.435953140258789, -8.078006744384766, -7.720061302185059, -7.362115383148193, -7.004169464111328, -6.646223545074463, -6.288277626037598, -5.930331707000732, -5.572385787963867, -5.214439868927002, -4.856493949890137, -4.4985480308532715, -4.140602111816406, -3.782656192779541, -3.424710273742676, -3.0667643547058105, -2.7088184356689453, -2.35087251663208, -1.9929265975952148, -1.6349806785583496, -1.2770347595214844, -0.9190888404846191, -0.5611429214477539, -0.20319700241088867, 0.15474891662597656, 0.5126948356628418, 0.8706417083740234, 1.2285876274108887, 1.586533546447754, 1.9444794654846191, 2.3024253845214844, 2.6603713035583496, 3.018317222595215, 3.37626314163208, 3.7342090606689453, 4.0921549797058105, 4.450100898742676, 4.808046817779541, 5.165992736816406, 5.5239386558532715, 5.881884574890137, 6.239830493927002, 6.597776412963867, 6.955722332000732, 7.313668251037598, 7.671614170074463, 8.029560089111328, 8.387506484985352, 8.745451927185059, 9.103397369384766, 9.461343765258789, 9.819290161132812, 10.17723560333252, 10.535181045532227, 10.89312744140625, 11.251073837280273, 11.60901927947998, 11.966964721679688, 12.324911117553711]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 5.0, 5.0, 6.0, 9.0, 13.0, 13.0, 17.0, 16.0, 20.0, 19.0, 23.0, 29.0, 34.0, 33.0, 31.0, 29.0, 41.0, 30.0, 37.0, 37.0, 33.0, 41.0, 39.0, 41.0, 45.0, 30.0, 32.0, 36.0, 24.0, 27.0, 34.0, 31.0, 21.0, 18.0, 16.0, 15.0, 14.0, 9.0, 15.0, 5.0, 13.0, 1.0, 3.0, 5.0, 0.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.981307029724121, -10.63040542602539, -10.279504776000977, -9.928603172302246, -9.577701568603516, -9.226799964904785, -8.875899314880371, -8.52499771118164, -8.17409610748291, -7.823194980621338, -7.472293376922607, -7.121392250061035, -6.770490646362305, -6.419589519500732, -6.06868839263916, -5.71778678894043, -5.366885662078857, -5.015984535217285, -4.665082931518555, -4.314181804656982, -3.963280200958252, -3.6123790740966797, -3.2614777088165283, -2.910576343536377, -2.5596749782562256, -2.208773612976074, -1.8578722476959229, -1.506971001625061, -1.1560696363449097, -0.8051682710647583, -0.4542670249938965, -0.10336565971374512, 0.24753570556640625, 0.5984370708465576, 0.9493383765220642, 1.3002396821975708, 1.6511410474777222, 2.002042293548584, 2.3529436588287354, 2.7038450241088867, 3.054746389389038, 3.4056477546691895, 3.756549119949341, 4.107450485229492, 4.4583516120910645, 4.809253215789795, 5.160154342651367, 5.511055946350098, 5.86195707321167, 6.212858200073242, 6.563759803771973, 6.914660930633545, 7.265562534332275, 7.616463661193848, 7.967365264892578, 8.318265914916992, 8.669167518615723, 9.020069122314453, 9.370969772338867, 9.721871376037598, 10.072772979736328, 10.423674583435059, 10.774575233459473, 11.125476837158203, 11.476378440856934]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 6.0, 6.0, 19.0, 21.0, 27.0, 44.0, 53.0, 64.0, 137.0, 171.0, 264.0, 355.0, 557.0, 889.0, 1318.0, 1949.0, 3053.0, 4923.0, 8397.0, 14561.0, 26529.0, 49329.0, 93077.0, 165142.0, 224868.0, 193920.0, 117207.0, 63333.0, 33050.0, 18348.0, 10242.0, 6008.0, 3723.0, 2347.0, 1494.0, 1050.0, 667.0, 445.0, 305.0, 227.0, 139.0, 75.0, 69.0, 44.0, 29.0, 27.0, 17.0, 12.0, 13.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.90625, -3.782989501953125, -3.65972900390625, -3.536468505859375, -3.4132080078125, -3.289947509765625, -3.16668701171875, -3.043426513671875, -2.920166015625, -2.796905517578125, -2.67364501953125, -2.550384521484375, -2.4271240234375, -2.303863525390625, -2.18060302734375, -2.057342529296875, -1.93408203125, -1.810821533203125, -1.68756103515625, -1.564300537109375, -1.4410400390625, -1.317779541015625, -1.19451904296875, -1.071258544921875, -0.947998046875, -0.824737548828125, -0.70147705078125, -0.578216552734375, -0.4549560546875, -0.331695556640625, -0.20843505859375, -0.085174560546875, 0.0380859375, 0.161346435546875, 0.28460693359375, 0.407867431640625, 0.5311279296875, 0.654388427734375, 0.77764892578125, 0.900909423828125, 1.024169921875, 1.147430419921875, 1.27069091796875, 1.393951416015625, 1.5172119140625, 1.640472412109375, 1.76373291015625, 1.886993408203125, 2.01025390625, 2.133514404296875, 2.25677490234375, 2.380035400390625, 2.5032958984375, 2.626556396484375, 2.74981689453125, 2.873077392578125, 2.996337890625, 3.119598388671875, 3.24285888671875, 3.366119384765625, 3.4893798828125, 3.612640380859375, 3.73590087890625, 3.859161376953125, 3.982421875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 2.0, 8.0, 6.0, 9.0, 12.0, 13.0, 19.0, 17.0, 16.0, 21.0, 23.0, 27.0, 36.0, 31.0, 33.0, 28.0, 37.0, 32.0, 36.0, 41.0, 32.0, 40.0, 39.0, 41.0, 45.0, 32.0, 30.0, 35.0, 24.0, 31.0, 31.0, 32.0, 20.0, 19.0, 16.0, 16.0, 11.0, 12.0, 15.0, 5.0, 11.0, 3.0, 2.0, 5.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.921875, -10.572265625, -10.22265625, -9.873046875, -9.5234375, -9.173828125, -8.82421875, -8.474609375, -8.125, -7.775390625, -7.42578125, -7.076171875, -6.7265625, -6.376953125, -6.02734375, -5.677734375, -5.328125, -4.978515625, -4.62890625, -4.279296875, -3.9296875, -3.580078125, -3.23046875, -2.880859375, -2.53125, -2.181640625, -1.83203125, -1.482421875, -1.1328125, -0.783203125, -0.43359375, -0.083984375, 0.265625, 0.615234375, 0.96484375, 1.314453125, 1.6640625, 2.013671875, 2.36328125, 2.712890625, 3.0625, 3.412109375, 3.76171875, 4.111328125, 4.4609375, 4.810546875, 5.16015625, 5.509765625, 5.859375, 6.208984375, 6.55859375, 6.908203125, 7.2578125, 7.607421875, 7.95703125, 8.306640625, 8.65625, 9.005859375, 9.35546875, 9.705078125, 10.0546875, 10.404296875, 10.75390625, 11.103515625, 11.453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 3.0, 10.0, 11.0, 11.0, 11.0, 18.0, 23.0, 37.0, 43.0, 67.0, 79.0, 117.0, 178.0, 220.0, 338.0, 499.0, 677.0, 1050.0, 1558.0, 2502.0, 4113.0, 6883.0, 12469.0, 24580.0, 52048.0, 119780.0, 256585.0, 287728.0, 147877.0, 63917.0, 29592.0, 14790.0, 7997.0, 4501.0, 2812.0, 1692.0, 1203.0, 788.0, 514.0, 360.0, 262.0, 165.0, 129.0, 89.0, 67.0, 55.0, 35.0, 23.0, 14.0, 14.0, 9.0, 6.0, 6.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.888671875, -3.771270751953125, -3.65386962890625, -3.536468505859375, -3.4190673828125, -3.301666259765625, -3.18426513671875, -3.066864013671875, -2.949462890625, -2.832061767578125, -2.71466064453125, -2.597259521484375, -2.4798583984375, -2.362457275390625, -2.24505615234375, -2.127655029296875, -2.01025390625, -1.892852783203125, -1.77545166015625, -1.658050537109375, -1.5406494140625, -1.423248291015625, -1.30584716796875, -1.188446044921875, -1.071044921875, -0.953643798828125, -0.83624267578125, -0.718841552734375, -0.6014404296875, -0.484039306640625, -0.36663818359375, -0.249237060546875, -0.1318359375, -0.014434814453125, 0.10296630859375, 0.220367431640625, 0.3377685546875, 0.455169677734375, 0.57257080078125, 0.689971923828125, 0.807373046875, 0.924774169921875, 1.04217529296875, 1.159576416015625, 1.2769775390625, 1.394378662109375, 1.51177978515625, 1.629180908203125, 1.74658203125, 1.863983154296875, 1.98138427734375, 2.098785400390625, 2.2161865234375, 2.333587646484375, 2.45098876953125, 2.568389892578125, 2.685791015625, 2.803192138671875, 2.92059326171875, 3.037994384765625, 3.1553955078125, 3.272796630859375, 3.39019775390625, 3.507598876953125, 3.625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 9.0, 7.0, 8.0, 13.0, 9.0, 14.0, 16.0, 19.0, 10.0, 27.0, 23.0, 32.0, 21.0, 24.0, 35.0, 41.0, 41.0, 40.0, 38.0, 41.0, 47.0, 46.0, 40.0, 47.0, 37.0, 38.0, 43.0, 34.0, 31.0, 28.0, 17.0, 22.0, 12.0, 17.0, 19.0, 11.0, 7.0, 5.0, 8.0, 6.0, 8.0, 2.0, 3.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-8.0234375, -7.77685546875, -7.5302734375, -7.28369140625, -7.037109375, -6.79052734375, -6.5439453125, -6.29736328125, -6.05078125, -5.80419921875, -5.5576171875, -5.31103515625, -5.064453125, -4.81787109375, -4.5712890625, -4.32470703125, -4.078125, -3.83154296875, -3.5849609375, -3.33837890625, -3.091796875, -2.84521484375, -2.5986328125, -2.35205078125, -2.10546875, -1.85888671875, -1.6123046875, -1.36572265625, -1.119140625, -0.87255859375, -0.6259765625, -0.37939453125, -0.1328125, 0.11376953125, 0.3603515625, 0.60693359375, 0.853515625, 1.10009765625, 1.3466796875, 1.59326171875, 1.83984375, 2.08642578125, 2.3330078125, 2.57958984375, 2.826171875, 3.07275390625, 3.3193359375, 3.56591796875, 3.8125, 4.05908203125, 4.3056640625, 4.55224609375, 4.798828125, 5.04541015625, 5.2919921875, 5.53857421875, 5.78515625, 6.03173828125, 6.2783203125, 6.52490234375, 6.771484375, 7.01806640625, 7.2646484375, 7.51123046875, 7.7578125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 6.0, 1.0, 10.0, 3.0, 14.0, 24.0, 23.0, 34.0, 50.0, 74.0, 101.0, 143.0, 182.0, 285.0, 385.0, 552.0, 898.0, 1345.0, 2198.0, 3944.0, 7437.0, 15760.0, 40280.0, 139732.0, 485871.0, 244723.0, 61099.0, 21699.0, 9515.0, 4929.0, 2708.0, 1540.0, 951.0, 631.0, 411.0, 302.0, 207.0, 129.0, 103.0, 71.0, 54.0, 40.0, 35.0, 16.0, 15.0, 11.0, 7.0, 5.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8232421875, -1.763824462890625, -1.70440673828125, -1.644989013671875, -1.5855712890625, -1.526153564453125, -1.46673583984375, -1.407318115234375, -1.347900390625, -1.288482666015625, -1.22906494140625, -1.169647216796875, -1.1102294921875, -1.050811767578125, -0.99139404296875, -0.931976318359375, -0.87255859375, -0.813140869140625, -0.75372314453125, -0.694305419921875, -0.6348876953125, -0.575469970703125, -0.51605224609375, -0.456634521484375, -0.397216796875, -0.337799072265625, -0.27838134765625, -0.218963623046875, -0.1595458984375, -0.100128173828125, -0.04071044921875, 0.018707275390625, 0.078125, 0.137542724609375, 0.19696044921875, 0.256378173828125, 0.3157958984375, 0.375213623046875, 0.43463134765625, 0.494049072265625, 0.553466796875, 0.612884521484375, 0.67230224609375, 0.731719970703125, 0.7911376953125, 0.850555419921875, 0.90997314453125, 0.969390869140625, 1.02880859375, 1.088226318359375, 1.14764404296875, 1.207061767578125, 1.2664794921875, 1.325897216796875, 1.38531494140625, 1.444732666015625, 1.504150390625, 1.563568115234375, 1.62298583984375, 1.682403564453125, 1.7418212890625, 1.801239013671875, 1.86065673828125, 1.920074462890625, 1.9794921875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 5.0, 10.0, 7.0, 11.0, 14.0, 15.0, 19.0, 13.0, 35.0, 35.0, 36.0, 44.0, 61.0, 57.0, 62.0, 69.0, 70.0, 62.0, 59.0, 45.0, 37.0, 36.0, 39.0, 27.0, 24.0, 29.0, 13.0, 21.0, 5.0, 9.0, 8.0, 6.0, 3.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00014734268188476562, -0.00014256685972213745, -0.00013779103755950928, -0.0001330152153968811, -0.00012823939323425293, -0.00012346357107162476, -0.00011868774890899658, -0.00011391192674636841, -0.00010913610458374023, -0.00010436028242111206, -9.958446025848389e-05, -9.480863809585571e-05, -9.003281593322754e-05, -8.525699377059937e-05, -8.048117160797119e-05, -7.570534944534302e-05, -7.092952728271484e-05, -6.615370512008667e-05, -6.13778829574585e-05, -5.660206079483032e-05, -5.182623863220215e-05, -4.7050416469573975e-05, -4.22745943069458e-05, -3.749877214431763e-05, -3.272294998168945e-05, -2.794712781906128e-05, -2.3171305656433105e-05, -1.839548349380493e-05, -1.3619661331176758e-05, -8.843839168548584e-06, -4.06801700592041e-06, 7.078051567077637e-07, 5.4836273193359375e-06, 1.0259449481964111e-05, 1.5035271644592285e-05, 1.981109380722046e-05, 2.4586915969848633e-05, 2.9362738132476807e-05, 3.413856029510498e-05, 3.8914382457733154e-05, 4.369020462036133e-05, 4.84660267829895e-05, 5.3241848945617676e-05, 5.801767110824585e-05, 6.279349327087402e-05, 6.75693154335022e-05, 7.234513759613037e-05, 7.712095975875854e-05, 8.189678192138672e-05, 8.667260408401489e-05, 9.144842624664307e-05, 9.622424840927124e-05, 0.00010100007057189941, 0.00010577589273452759, 0.00011055171489715576, 0.00011532753705978394, 0.00012010335922241211, 0.00012487918138504028, 0.00012965500354766846, 0.00013443082571029663, 0.0001392066478729248, 0.00014398247003555298, 0.00014875829219818115, 0.00015353411436080933, 0.0001583099365234375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 4.0, 2.0, 14.0, 14.0, 27.0, 33.0, 64.0, 98.0, 155.0, 240.0, 417.0, 651.0, 1200.0, 2249.0, 4140.0, 7853.0, 15778.0, 35109.0, 83564.0, 205331.0, 329987.0, 207490.0, 85199.0, 35273.0, 16383.0, 7944.0, 4147.0, 2219.0, 1238.0, 712.0, 376.0, 244.0, 147.0, 91.0, 62.0, 27.0, 17.0, 14.0, 12.0, 14.0, 5.0, 11.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.90234375, -2.8182373046875, -2.734130859375, -2.6500244140625, -2.56591796875, -2.4818115234375, -2.397705078125, -2.3135986328125, -2.2294921875, -2.1453857421875, -2.061279296875, -1.9771728515625, -1.89306640625, -1.8089599609375, -1.724853515625, -1.6407470703125, -1.556640625, -1.4725341796875, -1.388427734375, -1.3043212890625, -1.22021484375, -1.1361083984375, -1.052001953125, -0.9678955078125, -0.8837890625, -0.7996826171875, -0.715576171875, -0.6314697265625, -0.54736328125, -0.4632568359375, -0.379150390625, -0.2950439453125, -0.2109375, -0.1268310546875, -0.042724609375, 0.0413818359375, 0.12548828125, 0.2095947265625, 0.293701171875, 0.3778076171875, 0.4619140625, 0.5460205078125, 0.630126953125, 0.7142333984375, 0.79833984375, 0.8824462890625, 0.966552734375, 1.0506591796875, 1.134765625, 1.2188720703125, 1.302978515625, 1.3870849609375, 1.47119140625, 1.5552978515625, 1.639404296875, 1.7235107421875, 1.8076171875, 1.8917236328125, 1.975830078125, 2.0599365234375, 2.14404296875, 2.2281494140625, 2.312255859375, 2.3963623046875, 2.48046875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 10.0, 5.0, 14.0, 17.0, 25.0, 44.0, 41.0, 56.0, 63.0, 90.0, 103.0, 112.0, 109.0, 93.0, 56.0, 33.0, 36.0, 19.0, 20.0, 13.0, 12.0, 14.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1787109375, -1.1479949951171875, -1.117279052734375, -1.0865631103515625, -1.05584716796875, -1.0251312255859375, -0.994415283203125, -0.9636993408203125, -0.9329833984375, -0.9022674560546875, -0.871551513671875, -0.8408355712890625, -0.81011962890625, -0.7794036865234375, -0.748687744140625, -0.7179718017578125, -0.687255859375, -0.6565399169921875, -0.625823974609375, -0.5951080322265625, -0.56439208984375, -0.5336761474609375, -0.502960205078125, -0.4722442626953125, -0.4415283203125, -0.4108123779296875, -0.380096435546875, -0.3493804931640625, -0.31866455078125, -0.2879486083984375, -0.257232666015625, -0.2265167236328125, -0.19580078125, -0.1650848388671875, -0.134368896484375, -0.1036529541015625, -0.07293701171875, -0.0422210693359375, -0.011505126953125, 0.0192108154296875, 0.0499267578125, 0.0806427001953125, 0.111358642578125, 0.1420745849609375, 0.17279052734375, 0.2035064697265625, 0.234222412109375, 0.2649383544921875, 0.295654296875, 0.3263702392578125, 0.357086181640625, 0.3878021240234375, 0.41851806640625, 0.4492340087890625, 0.479949951171875, 0.5106658935546875, 0.5413818359375, 0.5720977783203125, 0.602813720703125, 0.6335296630859375, 0.66424560546875, 0.6949615478515625, 0.725677490234375, 0.7563934326171875, 0.787109375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 2.0, 3.0, 4.0, 7.0, 9.0, 8.0, 15.0, 12.0, 17.0, 22.0, 19.0, 19.0, 21.0, 27.0, 23.0, 37.0, 31.0, 28.0, 36.0, 50.0, 27.0, 39.0, 41.0, 39.0, 39.0, 34.0, 40.0, 38.0, 37.0, 34.0, 37.0, 27.0, 33.0, 13.0, 27.0, 20.0, 14.0, 12.0, 8.0, 7.0, 13.0, 5.0, 7.0, 8.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.514762878417969, -10.161996841430664, -9.80923080444336, -9.456463813781738, -9.103697776794434, -8.750931739807129, -8.398164749145508, -8.045398712158203, -7.692632675170898, -7.339866638183594, -6.987100124359131, -6.634333610534668, -6.281567573547363, -5.928801536560059, -5.576035022735596, -5.223268508911133, -4.870502471923828, -4.517736434936523, -4.1649699211120605, -3.8122036457061768, -3.459437370300293, -3.106671094894409, -2.7539048194885254, -2.4011385440826416, -2.048372268676758, -1.695605993270874, -1.3428397178649902, -0.9900734424591064, -0.6373071670532227, -0.28454089164733887, 0.06822538375854492, 0.4209916591644287, 0.7737579345703125, 1.1265242099761963, 1.47929048538208, 1.8320567607879639, 2.1848230361938477, 2.5375893115997314, 2.8903555870056152, 3.243121862411499, 3.595888137817383, 3.9486544132232666, 4.30142068862915, 4.654187202453613, 5.006953239440918, 5.359719276428223, 5.7124857902526855, 6.065252304077148, 6.418018341064453, 6.770784378051758, 7.123550891876221, 7.476317405700684, 7.829083442687988, 8.181849479675293, 8.534616470336914, 8.887382507324219, 9.240148544311523, 9.592914581298828, 9.945680618286133, 10.298447608947754, 10.651213645935059, 11.003979682922363, 11.356746673583984, 11.709512710571289, 12.062278747558594]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 3.0, 5.0, 3.0, 7.0, 13.0, 10.0, 17.0, 18.0, 18.0, 23.0, 14.0, 30.0, 27.0, 35.0, 30.0, 28.0, 33.0, 34.0, 37.0, 41.0, 25.0, 36.0, 45.0, 38.0, 51.0, 36.0, 32.0, 34.0, 26.0, 28.0, 34.0, 31.0, 24.0, 20.0, 18.0, 18.0, 11.0, 15.0, 8.0, 13.0, 10.0, 7.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.804856300354004, -10.4555082321167, -10.106159210205078, -9.756811141967773, -9.407462120056152, -9.058114051818848, -8.708765029907227, -8.359416961669922, -8.0100679397583, -7.660719394683838, -7.311370849609375, -6.962022304534912, -6.612673759460449, -6.263325214385986, -5.913976669311523, -5.564628601074219, -5.215280055999756, -4.865931510925293, -4.51658296585083, -4.167234420776367, -3.8178858757019043, -3.4685373306274414, -3.1191890239715576, -2.7698404788970947, -2.420491933822632, -2.071143388748169, -1.721794843673706, -1.3724464178085327, -1.0230978727340698, -0.6737493276596069, -0.3244009017944336, 0.024947643280029297, 0.3742961883544922, 0.7236447334289551, 1.072993278503418, 1.4223417043685913, 1.7716902494430542, 2.1210389137268066, 2.4703872203826904, 2.8197357654571533, 3.169084310531616, 3.518432855606079, 3.867781400680542, 4.217129707336426, 4.566478252410889, 4.915826797485352, 5.2651753425598145, 5.614523887634277, 5.96387243270874, 6.313220977783203, 6.662569522857666, 7.011918067932129, 7.361266613006592, 7.710615158081055, 8.05996322631836, 8.40931224822998, 8.758660316467285, 9.10800838470459, 9.457357406616211, 9.806705474853516, 10.156054496765137, 10.505402565002441, 10.854751586914062, 11.204099655151367, 11.553448677062988]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 14.0, 16.0, 26.0, 43.0, 89.0, 150.0, 242.0, 420.0, 694.0, 1147.0, 1877.0, 2964.0, 4906.0, 7567.0, 11830.0, 17842.0, 25957.0, 36653.0, 50227.0, 65330.0, 79486.0, 93150.0, 101037.0, 101978.0, 97260.0, 86087.0, 71956.0, 56433.0, 42567.0, 30443.0, 20930.0, 14411.0, 9243.0, 5979.0, 3783.0, 2236.0, 1376.0, 902.0, 498.0, 336.0, 192.0, 133.0, 52.0, 38.0, 21.0, 14.0, 9.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.7890625, -8.48828125, -8.1875, -7.88671875, -7.5859375, -7.28515625, -6.984375, -6.68359375, -6.3828125, -6.08203125, -5.78125, -5.48046875, -5.1796875, -4.87890625, -4.578125, -4.27734375, -3.9765625, -3.67578125, -3.375, -3.07421875, -2.7734375, -2.47265625, -2.171875, -1.87109375, -1.5703125, -1.26953125, -0.96875, -0.66796875, -0.3671875, -0.06640625, 0.234375, 0.53515625, 0.8359375, 1.13671875, 1.4375, 1.73828125, 2.0390625, 2.33984375, 2.640625, 2.94140625, 3.2421875, 3.54296875, 3.84375, 4.14453125, 4.4453125, 4.74609375, 5.046875, 5.34765625, 5.6484375, 5.94921875, 6.25, 6.55078125, 6.8515625, 7.15234375, 7.453125, 7.75390625, 8.0546875, 8.35546875, 8.65625, 8.95703125, 9.2578125, 9.55859375, 9.859375, 10.16015625, 10.4609375]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 4.0, 4.0, 6.0, 14.0, 9.0, 17.0, 18.0, 16.0, 25.0, 17.0, 23.0, 32.0, 37.0, 25.0, 31.0, 37.0, 28.0, 38.0, 37.0, 31.0, 35.0, 44.0, 39.0, 53.0, 30.0, 34.0, 34.0, 29.0, 20.0, 41.0, 29.0, 26.0, 21.0, 15.0, 19.0, 13.0, 13.0, 9.0, 13.0, 9.0, 8.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.453125, -10.1156005859375, -9.778076171875, -9.4405517578125, -9.10302734375, -8.7655029296875, -8.427978515625, -8.0904541015625, -7.7529296875, -7.4154052734375, -7.077880859375, -6.7403564453125, -6.40283203125, -6.0653076171875, -5.727783203125, -5.3902587890625, -5.052734375, -4.7152099609375, -4.377685546875, -4.0401611328125, -3.70263671875, -3.3651123046875, -3.027587890625, -2.6900634765625, -2.3525390625, -2.0150146484375, -1.677490234375, -1.3399658203125, -1.00244140625, -0.6649169921875, -0.327392578125, 0.0101318359375, 0.34765625, 0.6851806640625, 1.022705078125, 1.3602294921875, 1.69775390625, 2.0352783203125, 2.372802734375, 2.7103271484375, 3.0478515625, 3.3853759765625, 3.722900390625, 4.0604248046875, 4.39794921875, 4.7354736328125, 5.072998046875, 5.4105224609375, 5.748046875, 6.0855712890625, 6.423095703125, 6.7606201171875, 7.09814453125, 7.4356689453125, 7.773193359375, 8.1107177734375, 8.4482421875, 8.7857666015625, 9.123291015625, 9.4608154296875, 9.79833984375, 10.1358642578125, 10.473388671875, 10.8109130859375, 11.1484375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 6.0, 7.0, 14.0, 25.0, 36.0, 62.0, 77.0, 133.0, 218.0, 352.0, 492.0, 771.0, 1253.0, 1820.0, 3014.0, 4718.0, 7217.0, 10831.0, 16167.0, 23579.0, 33465.0, 45805.0, 59657.0, 74116.0, 87787.0, 97082.0, 101062.0, 97658.0, 88495.0, 75738.0, 61387.0, 47044.0, 34628.0, 24526.0, 16942.0, 11452.0, 7439.0, 4934.0, 3044.0, 1955.0, 1274.0, 816.0, 538.0, 330.0, 221.0, 150.0, 82.0, 45.0, 39.0, 19.0, 16.0, 11.0, 9.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.9765625, -8.6827392578125, -8.388916015625, -8.0950927734375, -7.80126953125, -7.5074462890625, -7.213623046875, -6.9197998046875, -6.6259765625, -6.3321533203125, -6.038330078125, -5.7445068359375, -5.45068359375, -5.1568603515625, -4.863037109375, -4.5692138671875, -4.275390625, -3.9815673828125, -3.687744140625, -3.3939208984375, -3.10009765625, -2.8062744140625, -2.512451171875, -2.2186279296875, -1.9248046875, -1.6309814453125, -1.337158203125, -1.0433349609375, -0.74951171875, -0.4556884765625, -0.161865234375, 0.1319580078125, 0.42578125, 0.7196044921875, 1.013427734375, 1.3072509765625, 1.60107421875, 1.8948974609375, 2.188720703125, 2.4825439453125, 2.7763671875, 3.0701904296875, 3.364013671875, 3.6578369140625, 3.95166015625, 4.2454833984375, 4.539306640625, 4.8331298828125, 5.126953125, 5.4207763671875, 5.714599609375, 6.0084228515625, 6.30224609375, 6.5960693359375, 6.889892578125, 7.1837158203125, 7.4775390625, 7.7713623046875, 8.065185546875, 8.3590087890625, 8.65283203125, 8.9466552734375, 9.240478515625, 9.5343017578125, 9.828125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 5.0, 2.0, 5.0, 5.0, 3.0, 10.0, 8.0, 13.0, 17.0, 24.0, 11.0, 11.0, 24.0, 19.0, 30.0, 29.0, 26.0, 37.0, 39.0, 36.0, 52.0, 49.0, 28.0, 31.0, 37.0, 45.0, 48.0, 40.0, 36.0, 39.0, 38.0, 27.0, 23.0, 25.0, 22.0, 20.0, 24.0, 15.0, 12.0, 10.0, 4.0, 6.0, 7.0, 5.0, 7.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.2578125, -7.0216064453125, -6.785400390625, -6.5491943359375, -6.31298828125, -6.0767822265625, -5.840576171875, -5.6043701171875, -5.3681640625, -5.1319580078125, -4.895751953125, -4.6595458984375, -4.42333984375, -4.1871337890625, -3.950927734375, -3.7147216796875, -3.478515625, -3.2423095703125, -3.006103515625, -2.7698974609375, -2.53369140625, -2.2974853515625, -2.061279296875, -1.8250732421875, -1.5888671875, -1.3526611328125, -1.116455078125, -0.8802490234375, -0.64404296875, -0.4078369140625, -0.171630859375, 0.0645751953125, 0.30078125, 0.5369873046875, 0.773193359375, 1.0093994140625, 1.24560546875, 1.4818115234375, 1.718017578125, 1.9542236328125, 2.1904296875, 2.4266357421875, 2.662841796875, 2.8990478515625, 3.13525390625, 3.3714599609375, 3.607666015625, 3.8438720703125, 4.080078125, 4.3162841796875, 4.552490234375, 4.7886962890625, 5.02490234375, 5.2611083984375, 5.497314453125, 5.7335205078125, 5.9697265625, 6.2059326171875, 6.442138671875, 6.6783447265625, 6.91455078125, 7.1507568359375, 7.386962890625, 7.6231689453125, 7.859375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 2.0, 4.0, 14.0, 6.0, 20.0, 23.0, 31.0, 52.0, 61.0, 110.0, 149.0, 230.0, 306.0, 513.0, 722.0, 1241.0, 2108.0, 3525.0, 6263.0, 10745.0, 18454.0, 30984.0, 49766.0, 75907.0, 106376.0, 132618.0, 143685.0, 135653.0, 111648.0, 80526.0, 53859.0, 33868.0, 20480.0, 11721.0, 6868.0, 3983.0, 2344.0, 1380.0, 804.0, 504.0, 327.0, 222.0, 147.0, 100.0, 67.0, 42.0, 38.0, 23.0, 15.0, 14.0, 4.0, 7.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.53515625, -5.35418701171875, -5.1732177734375, -4.99224853515625, -4.811279296875, -4.63031005859375, -4.4493408203125, -4.26837158203125, -4.08740234375, -3.90643310546875, -3.7254638671875, -3.54449462890625, -3.363525390625, -3.18255615234375, -3.0015869140625, -2.82061767578125, -2.6396484375, -2.45867919921875, -2.2777099609375, -2.09674072265625, -1.915771484375, -1.73480224609375, -1.5538330078125, -1.37286376953125, -1.19189453125, -1.01092529296875, -0.8299560546875, -0.64898681640625, -0.468017578125, -0.28704833984375, -0.1060791015625, 0.07489013671875, 0.255859375, 0.43682861328125, 0.6177978515625, 0.79876708984375, 0.979736328125, 1.16070556640625, 1.3416748046875, 1.52264404296875, 1.70361328125, 1.88458251953125, 2.0655517578125, 2.24652099609375, 2.427490234375, 2.60845947265625, 2.7894287109375, 2.97039794921875, 3.1513671875, 3.33233642578125, 3.5133056640625, 3.69427490234375, 3.875244140625, 4.05621337890625, 4.2371826171875, 4.41815185546875, 4.59912109375, 4.78009033203125, 4.9610595703125, 5.14202880859375, 5.322998046875, 5.50396728515625, 5.6849365234375, 5.86590576171875, 6.046875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 3.0, 6.0, 9.0, 8.0, 12.0, 19.0, 13.0, 20.0, 26.0, 28.0, 34.0, 23.0, 34.0, 44.0, 27.0, 46.0, 60.0, 56.0, 47.0, 55.0, 54.0, 43.0, 59.0, 42.0, 46.0, 33.0, 22.0, 31.0, 16.0, 17.0, 13.0, 13.0, 9.0, 8.0, 6.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.0007762908935546875, -0.0007555261254310608, -0.0007347613573074341, -0.0007139965891838074, -0.0006932318210601807, -0.000672467052936554, -0.0006517022848129272, -0.0006309375166893005, -0.0006101727485656738, -0.0005894079804420471, -0.0005686432123184204, -0.0005478784441947937, -0.000527113676071167, -0.0005063489079475403, -0.0004855841398239136, -0.00046481937170028687, -0.00044405460357666016, -0.00042328983545303345, -0.00040252506732940674, -0.00038176029920578003, -0.0003609955310821533, -0.0003402307629585266, -0.0003194659948348999, -0.0002987012267112732, -0.0002779364585876465, -0.0002571716904640198, -0.00023640692234039307, -0.00021564215421676636, -0.00019487738609313965, -0.00017411261796951294, -0.00015334784984588623, -0.00013258308172225952, -0.00011181831359863281, -9.10535454750061e-05, -7.02887773513794e-05, -4.9524009227752686e-05, -2.8759241104125977e-05, -7.994472980499268e-06, 1.2770295143127441e-05, 3.353506326675415e-05, 5.429983139038086e-05, 7.506459951400757e-05, 9.582936763763428e-05, 0.00011659413576126099, 0.0001373589038848877, 0.0001581236720085144, 0.0001788884401321411, 0.00019965320825576782, 0.00022041797637939453, 0.00024118274450302124, 0.00026194751262664795, 0.00028271228075027466, 0.00030347704887390137, 0.0003242418169975281, 0.0003450065851211548, 0.0003657713532447815, 0.0003865361213684082, 0.0004073008894920349, 0.0004280656576156616, 0.00044883042573928833, 0.00046959519386291504, 0.0004903599619865417, 0.0005111247301101685, 0.0005318894982337952, 0.0005526542663574219]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 9.0, 9.0, 7.0, 12.0, 26.0, 33.0, 70.0, 140.0, 223.0, 313.0, 559.0, 982.0, 1682.0, 3060.0, 5492.0, 10246.0, 18484.0, 33366.0, 57483.0, 92055.0, 131103.0, 160577.0, 162238.0, 135478.0, 95763.0, 60516.0, 35026.0, 19546.0, 10700.0, 5756.0, 3138.0, 1898.0, 1022.0, 619.0, 384.0, 226.0, 133.0, 71.0, 58.0, 18.0, 15.0, 10.0, 6.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.515625, -7.2735595703125, -7.031494140625, -6.7894287109375, -6.54736328125, -6.3052978515625, -6.063232421875, -5.8211669921875, -5.5791015625, -5.3370361328125, -5.094970703125, -4.8529052734375, -4.61083984375, -4.3687744140625, -4.126708984375, -3.8846435546875, -3.642578125, -3.4005126953125, -3.158447265625, -2.9163818359375, -2.67431640625, -2.4322509765625, -2.190185546875, -1.9481201171875, -1.7060546875, -1.4639892578125, -1.221923828125, -0.9798583984375, -0.73779296875, -0.4957275390625, -0.253662109375, -0.0115966796875, 0.23046875, 0.4725341796875, 0.714599609375, 0.9566650390625, 1.19873046875, 1.4407958984375, 1.682861328125, 1.9249267578125, 2.1669921875, 2.4090576171875, 2.651123046875, 2.8931884765625, 3.13525390625, 3.3773193359375, 3.619384765625, 3.8614501953125, 4.103515625, 4.3455810546875, 4.587646484375, 4.8297119140625, 5.07177734375, 5.3138427734375, 5.555908203125, 5.7979736328125, 6.0400390625, 6.2821044921875, 6.524169921875, 6.7662353515625, 7.00830078125, 7.2503662109375, 7.492431640625, 7.7344970703125, 7.9765625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 5.0, 7.0, 12.0, 14.0, 10.0, 29.0, 30.0, 30.0, 39.0, 51.0, 51.0, 55.0, 76.0, 70.0, 82.0, 67.0, 68.0, 47.0, 37.0, 45.0, 40.0, 31.0, 27.0, 19.0, 11.0, 10.0, 10.0, 6.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.076171875, -2.97259521484375, -2.8690185546875, -2.76544189453125, -2.661865234375, -2.55828857421875, -2.4547119140625, -2.35113525390625, -2.24755859375, -2.14398193359375, -2.0404052734375, -1.93682861328125, -1.833251953125, -1.72967529296875, -1.6260986328125, -1.52252197265625, -1.4189453125, -1.31536865234375, -1.2117919921875, -1.10821533203125, -1.004638671875, -0.90106201171875, -0.7974853515625, -0.69390869140625, -0.59033203125, -0.48675537109375, -0.3831787109375, -0.27960205078125, -0.176025390625, -0.07244873046875, 0.0311279296875, 0.13470458984375, 0.23828125, 0.34185791015625, 0.4454345703125, 0.54901123046875, 0.652587890625, 0.75616455078125, 0.8597412109375, 0.96331787109375, 1.06689453125, 1.17047119140625, 1.2740478515625, 1.37762451171875, 1.481201171875, 1.58477783203125, 1.6883544921875, 1.79193115234375, 1.8955078125, 1.99908447265625, 2.1026611328125, 2.20623779296875, 2.309814453125, 2.41339111328125, 2.5169677734375, 2.62054443359375, 2.72412109375, 2.82769775390625, 2.9312744140625, 3.03485107421875, 3.138427734375, 3.24200439453125, 3.3455810546875, 3.44915771484375, 3.552734375]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 9.0, 5.0, 8.0, 13.0, 13.0, 13.0, 25.0, 19.0, 15.0, 22.0, 30.0, 33.0, 26.0, 39.0, 23.0, 35.0, 36.0, 40.0, 47.0, 33.0, 44.0, 43.0, 41.0, 45.0, 53.0, 41.0, 44.0, 29.0, 31.0, 24.0, 20.0, 17.0, 19.0, 14.0, 10.0, 7.0, 5.0, 7.0, 6.0, 5.0, 4.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.578670501708984, -11.192037582397461, -10.805404663085938, -10.418771743774414, -10.032139778137207, -9.645506858825684, -9.25887393951416, -8.872241020202637, -8.48560905456543, -8.098976135253906, -7.712343692779541, -7.325710773468018, -6.939078330993652, -6.552445411682129, -6.1658124923706055, -5.779179573059082, -5.392546653747559, -5.005913734436035, -4.61928129196167, -4.2326483726501465, -3.846015691757202, -3.459383010864258, -3.0727500915527344, -2.68611741065979, -2.2994847297668457, -1.9128520488739014, -1.5262192487716675, -1.1395864486694336, -0.7529537677764893, -0.3663210868835449, 0.020311832427978516, 0.40694451332092285, 0.7935762405395508, 1.1802089214324951, 1.566841721534729, 1.953474521636963, 2.3401072025299072, 2.7267398834228516, 3.113372802734375, 3.5000054836273193, 3.8866381645202637, 4.273271083831787, 4.659903526306152, 5.046536445617676, 5.433169364929199, 5.8198018074035645, 6.206434726715088, 6.593067169189453, 6.979700088500977, 7.3663330078125, 7.752965450286865, 8.139598846435547, 8.526230812072754, 8.912863731384277, 9.2994966506958, 9.686129570007324, 10.072761535644531, 10.459394454956055, 10.846027374267578, 11.232660293579102, 11.619292259216309, 12.005925178527832, 12.392558097839355, 12.779191017150879, 13.165823936462402]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 5.0, 8.0, 9.0, 10.0, 23.0, 20.0, 15.0, 19.0, 26.0, 22.0, 26.0, 25.0, 32.0, 28.0, 41.0, 50.0, 31.0, 52.0, 31.0, 37.0, 34.0, 33.0, 41.0, 35.0, 45.0, 37.0, 37.0, 26.0, 28.0, 28.0, 17.0, 22.0, 20.0, 18.0, 17.0, 12.0, 8.0, 4.0, 5.0, 5.0, 2.0, 3.0, 2.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.380697250366211, -11.008035659790039, -10.635375022888184, -10.262714385986328, -9.890052795410156, -9.517391204833984, -9.144730567932129, -8.772069931030273, -8.399408340454102, -8.02674674987793, -7.654086112976074, -7.2814249992370605, -6.908763885498047, -6.536102771759033, -6.1634416580200195, -5.790780544281006, -5.418119430541992, -5.0454583168029785, -4.672797203063965, -4.300136089324951, -3.9274749755859375, -3.554813861846924, -3.18215274810791, -2.8094916343688965, -2.436830520629883, -2.064169406890869, -1.6915082931518555, -1.3188471794128418, -0.9461860656738281, -0.5735249519348145, -0.20086383819580078, 0.1717972755432129, 0.544459342956543, 0.9171204566955566, 1.2897815704345703, 1.662442684173584, 2.0351037979125977, 2.4077649116516113, 2.780426025390625, 3.1530871391296387, 3.5257482528686523, 3.898409366607666, 4.27107048034668, 4.643731594085693, 5.016392707824707, 5.389053821563721, 5.761714935302734, 6.134376049041748, 6.507037162780762, 6.879698276519775, 7.252359390258789, 7.625020503997803, 7.997681617736816, 8.370342254638672, 8.743003845214844, 9.115665435791016, 9.488326072692871, 9.860986709594727, 10.233648300170898, 10.60630989074707, 10.978970527648926, 11.351631164550781, 11.724292755126953, 12.096954345703125, 12.46961498260498]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 6.0, 4.0, 22.0, 20.0, 49.0, 53.0, 111.0, 216.0, 416.0, 615.0, 1101.0, 1733.0, 3060.0, 4900.0, 7845.0, 12793.0, 20259.0, 32113.0, 48900.0, 74258.0, 108393.0, 153381.0, 208827.0, 275501.0, 338902.0, 392371.0, 423160.0, 422425.0, 390641.0, 336118.0, 270581.0, 206546.0, 149774.0, 105660.0, 71551.0, 48018.0, 31387.0, 19782.0, 12573.0, 7723.0, 4872.0, 2988.0, 1725.0, 1154.0, 666.0, 442.0, 248.0, 176.0, 95.0, 51.0, 41.0, 21.0, 12.0, 10.0, 4.0, 0.0, 1.0, 2.0, 1.0], "bins": [-8.8515625, -8.57470703125, -8.2978515625, -8.02099609375, -7.744140625, -7.46728515625, -7.1904296875, -6.91357421875, -6.63671875, -6.35986328125, -6.0830078125, -5.80615234375, -5.529296875, -5.25244140625, -4.9755859375, -4.69873046875, -4.421875, -4.14501953125, -3.8681640625, -3.59130859375, -3.314453125, -3.03759765625, -2.7607421875, -2.48388671875, -2.20703125, -1.93017578125, -1.6533203125, -1.37646484375, -1.099609375, -0.82275390625, -0.5458984375, -0.26904296875, 0.0078125, 0.28466796875, 0.5615234375, 0.83837890625, 1.115234375, 1.39208984375, 1.6689453125, 1.94580078125, 2.22265625, 2.49951171875, 2.7763671875, 3.05322265625, 3.330078125, 3.60693359375, 3.8837890625, 4.16064453125, 4.4375, 4.71435546875, 4.9912109375, 5.26806640625, 5.544921875, 5.82177734375, 6.0986328125, 6.37548828125, 6.65234375, 6.92919921875, 7.2060546875, 7.48291015625, 7.759765625, 8.03662109375, 8.3134765625, 8.59033203125, 8.8671875]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 5.0, 8.0, 3.0, 8.0, 19.0, 19.0, 22.0, 22.0, 17.0, 24.0, 23.0, 29.0, 27.0, 29.0, 38.0, 39.0, 39.0, 38.0, 49.0, 43.0, 25.0, 30.0, 37.0, 35.0, 42.0, 41.0, 35.0, 29.0, 33.0, 26.0, 23.0, 23.0, 11.0, 27.0, 16.0, 17.0, 9.0, 6.0, 6.0, 4.0, 6.0, 1.0, 2.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.609375, -9.2900390625, -8.970703125, -8.6513671875, -8.33203125, -8.0126953125, -7.693359375, -7.3740234375, -7.0546875, -6.7353515625, -6.416015625, -6.0966796875, -5.77734375, -5.4580078125, -5.138671875, -4.8193359375, -4.5, -4.1806640625, -3.861328125, -3.5419921875, -3.22265625, -2.9033203125, -2.583984375, -2.2646484375, -1.9453125, -1.6259765625, -1.306640625, -0.9873046875, -0.66796875, -0.3486328125, -0.029296875, 0.2900390625, 0.609375, 0.9287109375, 1.248046875, 1.5673828125, 1.88671875, 2.2060546875, 2.525390625, 2.8447265625, 3.1640625, 3.4833984375, 3.802734375, 4.1220703125, 4.44140625, 4.7607421875, 5.080078125, 5.3994140625, 5.71875, 6.0380859375, 6.357421875, 6.6767578125, 6.99609375, 7.3154296875, 7.634765625, 7.9541015625, 8.2734375, 8.5927734375, 8.912109375, 9.2314453125, 9.55078125, 9.8701171875, 10.189453125, 10.5087890625, 10.828125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 8.0, 21.0, 13.0, 47.0, 86.0, 121.0, 310.0, 527.0, 929.0, 1740.0, 3124.0, 5521.0, 9433.0, 16046.0, 26932.0, 43783.0, 68772.0, 105239.0, 152669.0, 213773.0, 283335.0, 349839.0, 405741.0, 436985.0, 434927.0, 400247.0, 341703.0, 272725.0, 206600.0, 146296.0, 99543.0, 64936.0, 41310.0, 25371.0, 15152.0, 8963.0, 5138.0, 2829.0, 1566.0, 923.0, 480.0, 289.0, 157.0, 66.0, 34.0, 31.0, 7.0, 6.0, 2.0, 0.0, 1.0, 1.0], "bins": [-11.4453125, -11.1268310546875, -10.808349609375, -10.4898681640625, -10.17138671875, -9.8529052734375, -9.534423828125, -9.2159423828125, -8.8974609375, -8.5789794921875, -8.260498046875, -7.9420166015625, -7.62353515625, -7.3050537109375, -6.986572265625, -6.6680908203125, -6.349609375, -6.0311279296875, -5.712646484375, -5.3941650390625, -5.07568359375, -4.7572021484375, -4.438720703125, -4.1202392578125, -3.8017578125, -3.4832763671875, -3.164794921875, -2.8463134765625, -2.52783203125, -2.2093505859375, -1.890869140625, -1.5723876953125, -1.25390625, -0.9354248046875, -0.616943359375, -0.2984619140625, 0.02001953125, 0.3385009765625, 0.656982421875, 0.9754638671875, 1.2939453125, 1.6124267578125, 1.930908203125, 2.2493896484375, 2.56787109375, 2.8863525390625, 3.204833984375, 3.5233154296875, 3.841796875, 4.1602783203125, 4.478759765625, 4.7972412109375, 5.11572265625, 5.4342041015625, 5.752685546875, 6.0711669921875, 6.3896484375, 6.7081298828125, 7.026611328125, 7.3450927734375, 7.66357421875, 7.9820556640625, 8.300537109375, 8.6190185546875, 8.9375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 7.0, 4.0, 5.0, 4.0, 11.0, 14.0, 23.0, 16.0, 23.0, 34.0, 36.0, 39.0, 52.0, 58.0, 85.0, 92.0, 127.0, 111.0, 135.0, 147.0, 165.0, 190.0, 167.0, 170.0, 196.0, 193.0, 219.0, 182.0, 184.0, 184.0, 175.0, 144.0, 147.0, 105.0, 107.0, 86.0, 62.0, 65.0, 52.0, 66.0, 43.0, 28.0, 31.0, 21.0, 18.0, 12.0, 13.0, 5.0, 5.0, 11.0, 4.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-4.6171875, -4.47027587890625, -4.3233642578125, -4.17645263671875, -4.029541015625, -3.88262939453125, -3.7357177734375, -3.58880615234375, -3.44189453125, -3.29498291015625, -3.1480712890625, -3.00115966796875, -2.854248046875, -2.70733642578125, -2.5604248046875, -2.41351318359375, -2.2666015625, -2.11968994140625, -1.9727783203125, -1.82586669921875, -1.678955078125, -1.53204345703125, -1.3851318359375, -1.23822021484375, -1.09130859375, -0.94439697265625, -0.7974853515625, -0.65057373046875, -0.503662109375, -0.35675048828125, -0.2098388671875, -0.06292724609375, 0.083984375, 0.23089599609375, 0.3778076171875, 0.52471923828125, 0.671630859375, 0.81854248046875, 0.9654541015625, 1.11236572265625, 1.25927734375, 1.40618896484375, 1.5531005859375, 1.70001220703125, 1.846923828125, 1.99383544921875, 2.1407470703125, 2.28765869140625, 2.4345703125, 2.58148193359375, 2.7283935546875, 2.87530517578125, 3.022216796875, 3.16912841796875, 3.3160400390625, 3.46295166015625, 3.60986328125, 3.75677490234375, 3.9036865234375, 4.05059814453125, 4.197509765625, 4.34442138671875, 4.4913330078125, 4.63824462890625, 4.78515625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 9.0, 9.0, 10.0, 9.0, 23.0, 13.0, 25.0, 26.0, 29.0, 33.0, 52.0, 36.0, 49.0, 48.0, 58.0, 50.0, 39.0, 54.0, 44.0, 54.0, 54.0, 44.0, 33.0, 33.0, 35.0, 27.0, 21.0, 19.0, 10.0, 12.0, 9.0, 4.0, 7.0, 6.0, 7.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.173664093017578, -15.68911361694336, -15.204562187194824, -14.720011711120605, -14.235461235046387, -13.750909805297852, -13.266359329223633, -12.781808853149414, -12.297258377075195, -11.812707901000977, -11.328156471252441, -10.843605995178223, -10.359055519104004, -9.874504089355469, -9.38995361328125, -8.905403137207031, -8.420851707458496, -7.936300754547119, -7.4517502784729, -6.967199325561523, -6.482648849487305, -5.998097896575928, -5.513546943664551, -5.028996467590332, -4.544445514678955, -4.059894561767578, -3.5753440856933594, -3.0907931327819824, -2.6062424182891846, -2.1216917037963867, -1.6371407508850098, -1.152590036392212, -0.6680393218994141, -0.18348854780197144, 0.3010622262954712, 0.7856130599975586, 1.2701637744903564, 1.7547144889831543, 2.2392654418945312, 2.723816156387329, 3.208366870880127, 3.692917585372925, 4.177468299865723, 4.6620192527771, 5.146570205688477, 5.631120681762695, 6.115671634674072, 6.600222587585449, 7.084773063659668, 7.569324016571045, 8.053874969482422, 8.53842544555664, 9.02297592163086, 9.507526397705078, 9.992077827453613, 10.476628303527832, 10.961179733276367, 11.445730209350586, 11.930281639099121, 12.41483211517334, 12.899382591247559, 13.383934020996094, 13.868484497070312, 14.353034973144531, 14.83758544921875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 9.0, 6.0, 10.0, 7.0, 7.0, 11.0, 15.0, 16.0, 22.0, 28.0, 18.0, 36.0, 36.0, 28.0, 50.0, 42.0, 37.0, 44.0, 37.0, 37.0, 36.0, 34.0, 42.0, 42.0, 37.0, 31.0, 32.0, 37.0, 32.0, 27.0, 22.0, 25.0, 20.0, 15.0, 20.0, 15.0, 10.0, 5.0, 7.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.958240509033203, -10.571837425231934, -10.185434341430664, -9.799031257629395, -9.412628173828125, -9.026226043701172, -8.639822959899902, -8.253419876098633, -7.867016792297363, -7.480613708496094, -7.094210624694824, -6.707808017730713, -6.321404933929443, -5.935001850128174, -5.5485992431640625, -5.162196159362793, -4.775793075561523, -4.389389991760254, -4.002986907958984, -3.616584300994873, -3.2301812171936035, -2.843778133392334, -2.4573752880096436, -2.070972442626953, -1.6845693588256836, -1.2981663942337036, -0.9117634296417236, -0.5253604650497437, -0.13895750045776367, 0.2474454641342163, 0.6338484287261963, 1.0202512741088867, 1.4066543579101562, 1.7930573225021362, 2.179460287094116, 2.5658631324768066, 2.952266216278076, 3.3386693000793457, 3.725072145462036, 4.111474990844727, 4.497878074645996, 4.884281158447266, 5.270684242248535, 5.6570868492126465, 6.043489933013916, 6.4298930168151855, 6.816295623779297, 7.202698707580566, 7.589101791381836, 7.9755048751831055, 8.361907958984375, 8.748311042785645, 9.134714126586914, 9.521116256713867, 9.907519340515137, 10.293922424316406, 10.680325508117676, 11.066728591918945, 11.453131675720215, 11.839534759521484, 12.225936889648438, 12.612339973449707, 12.998743057250977, 13.385146141052246, 13.771549224853516]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 4.0, 7.0, 12.0, 11.0, 30.0, 37.0, 60.0, 86.0, 122.0, 179.0, 267.0, 400.0, 578.0, 905.0, 1221.0, 2050.0, 3296.0, 5267.0, 8770.0, 14803.0, 25072.0, 43849.0, 76516.0, 126358.0, 179913.0, 190683.0, 147476.0, 91192.0, 53346.0, 30664.0, 17731.0, 10498.0, 6307.0, 3874.0, 2372.0, 1519.0, 989.0, 647.0, 448.0, 319.0, 209.0, 150.0, 109.0, 70.0, 44.0, 28.0, 26.0, 18.0, 7.0, 11.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0], "bins": [-3.060546875, -2.968292236328125, -2.87603759765625, -2.783782958984375, -2.6915283203125, -2.599273681640625, -2.50701904296875, -2.414764404296875, -2.322509765625, -2.230255126953125, -2.13800048828125, -2.045745849609375, -1.9534912109375, -1.861236572265625, -1.76898193359375, -1.676727294921875, -1.58447265625, -1.492218017578125, -1.39996337890625, -1.307708740234375, -1.2154541015625, -1.123199462890625, -1.03094482421875, -0.938690185546875, -0.846435546875, -0.754180908203125, -0.66192626953125, -0.569671630859375, -0.4774169921875, -0.385162353515625, -0.29290771484375, -0.200653076171875, -0.1083984375, -0.016143798828125, 0.07611083984375, 0.168365478515625, 0.2606201171875, 0.352874755859375, 0.44512939453125, 0.537384033203125, 0.629638671875, 0.721893310546875, 0.81414794921875, 0.906402587890625, 0.9986572265625, 1.090911865234375, 1.18316650390625, 1.275421142578125, 1.36767578125, 1.459930419921875, 1.55218505859375, 1.644439697265625, 1.7366943359375, 1.828948974609375, 1.92120361328125, 2.013458251953125, 2.105712890625, 2.197967529296875, 2.29022216796875, 2.382476806640625, 2.4747314453125, 2.566986083984375, 2.65924072265625, 2.751495361328125, 2.84375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 6.0, 8.0, 9.0, 8.0, 8.0, 8.0, 15.0, 18.0, 21.0, 29.0, 17.0, 35.0, 36.0, 29.0, 49.0, 42.0, 37.0, 43.0, 40.0, 34.0, 38.0, 32.0, 42.0, 41.0, 39.0, 30.0, 31.0, 36.0, 37.0, 26.0, 20.0, 25.0, 23.0, 13.0, 20.0, 17.0, 9.0, 6.0, 7.0, 9.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.9765625, -10.5906982421875, -10.204833984375, -9.8189697265625, -9.43310546875, -9.0472412109375, -8.661376953125, -8.2755126953125, -7.8896484375, -7.5037841796875, -7.117919921875, -6.7320556640625, -6.34619140625, -5.9603271484375, -5.574462890625, -5.1885986328125, -4.802734375, -4.4168701171875, -4.031005859375, -3.6451416015625, -3.25927734375, -2.8734130859375, -2.487548828125, -2.1016845703125, -1.7158203125, -1.3299560546875, -0.944091796875, -0.5582275390625, -0.17236328125, 0.2135009765625, 0.599365234375, 0.9852294921875, 1.37109375, 1.7569580078125, 2.142822265625, 2.5286865234375, 2.91455078125, 3.3004150390625, 3.686279296875, 4.0721435546875, 4.4580078125, 4.8438720703125, 5.229736328125, 5.6156005859375, 6.00146484375, 6.3873291015625, 6.773193359375, 7.1590576171875, 7.544921875, 7.9307861328125, 8.316650390625, 8.7025146484375, 9.08837890625, 9.4742431640625, 9.860107421875, 10.2459716796875, 10.6318359375, 11.0177001953125, 11.403564453125, 11.7894287109375, 12.17529296875, 12.5611572265625, 12.947021484375, 13.3328857421875, 13.71875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 5.0, 13.0, 6.0, 16.0, 23.0, 34.0, 43.0, 63.0, 99.0, 133.0, 214.0, 300.0, 407.0, 654.0, 1032.0, 1726.0, 2850.0, 4814.0, 8537.0, 15712.0, 29385.0, 57411.0, 118969.0, 227277.0, 263381.0, 156014.0, 75839.0, 37890.0, 19384.0, 10592.0, 6239.0, 3495.0, 2138.0, 1275.0, 859.0, 534.0, 393.0, 253.0, 153.0, 106.0, 89.0, 59.0, 45.0, 25.0, 26.0, 17.0, 11.0, 5.0, 2.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.31640625, -3.21337890625, -3.1103515625, -3.00732421875, -2.904296875, -2.80126953125, -2.6982421875, -2.59521484375, -2.4921875, -2.38916015625, -2.2861328125, -2.18310546875, -2.080078125, -1.97705078125, -1.8740234375, -1.77099609375, -1.66796875, -1.56494140625, -1.4619140625, -1.35888671875, -1.255859375, -1.15283203125, -1.0498046875, -0.94677734375, -0.84375, -0.74072265625, -0.6376953125, -0.53466796875, -0.431640625, -0.32861328125, -0.2255859375, -0.12255859375, -0.01953125, 0.08349609375, 0.1865234375, 0.28955078125, 0.392578125, 0.49560546875, 0.5986328125, 0.70166015625, 0.8046875, 0.90771484375, 1.0107421875, 1.11376953125, 1.216796875, 1.31982421875, 1.4228515625, 1.52587890625, 1.62890625, 1.73193359375, 1.8349609375, 1.93798828125, 2.041015625, 2.14404296875, 2.2470703125, 2.35009765625, 2.453125, 2.55615234375, 2.6591796875, 2.76220703125, 2.865234375, 2.96826171875, 3.0712890625, 3.17431640625, 3.27734375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 6.0, 11.0, 11.0, 13.0, 13.0, 14.0, 17.0, 28.0, 23.0, 23.0, 28.0, 28.0, 27.0, 33.0, 29.0, 51.0, 31.0, 25.0, 42.0, 28.0, 42.0, 43.0, 50.0, 37.0, 40.0, 39.0, 41.0, 34.0, 21.0, 19.0, 24.0, 19.0, 16.0, 17.0, 11.0, 7.0, 12.0, 9.0, 8.0, 10.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-7.734375, -7.4979248046875, -7.261474609375, -7.0250244140625, -6.78857421875, -6.5521240234375, -6.315673828125, -6.0792236328125, -5.8427734375, -5.6063232421875, -5.369873046875, -5.1334228515625, -4.89697265625, -4.6605224609375, -4.424072265625, -4.1876220703125, -3.951171875, -3.7147216796875, -3.478271484375, -3.2418212890625, -3.00537109375, -2.7689208984375, -2.532470703125, -2.2960205078125, -2.0595703125, -1.8231201171875, -1.586669921875, -1.3502197265625, -1.11376953125, -0.8773193359375, -0.640869140625, -0.4044189453125, -0.16796875, 0.0684814453125, 0.304931640625, 0.5413818359375, 0.77783203125, 1.0142822265625, 1.250732421875, 1.4871826171875, 1.7236328125, 1.9600830078125, 2.196533203125, 2.4329833984375, 2.66943359375, 2.9058837890625, 3.142333984375, 3.3787841796875, 3.615234375, 3.8516845703125, 4.088134765625, 4.3245849609375, 4.56103515625, 4.7974853515625, 5.033935546875, 5.2703857421875, 5.5068359375, 5.7432861328125, 5.979736328125, 6.2161865234375, 6.45263671875, 6.6890869140625, 6.925537109375, 7.1619873046875, 7.3984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 4.0, 3.0, 4.0, 4.0, 4.0, 13.0, 8.0, 23.0, 33.0, 30.0, 46.0, 82.0, 108.0, 170.0, 187.0, 293.0, 390.0, 610.0, 873.0, 1274.0, 1805.0, 3038.0, 4956.0, 8120.0, 14484.0, 26956.0, 54380.0, 123813.0, 265163.0, 279482.0, 135597.0, 59144.0, 28562.0, 15208.0, 8728.0, 5355.0, 3104.0, 2112.0, 1390.0, 875.0, 614.0, 425.0, 279.0, 230.0, 156.0, 134.0, 87.0, 51.0, 46.0, 33.0, 23.0, 17.0, 16.0, 6.0, 6.0, 6.0, 1.0, 4.0, 1.0, 5.0, 0.0, 0.0, 1.0], "bins": [-0.90771484375, -0.8775100708007812, -0.8473052978515625, -0.8171005249023438, -0.786895751953125, -0.7566909790039062, -0.7264862060546875, -0.6962814331054688, -0.66607666015625, -0.6358718872070312, -0.6056671142578125, -0.5754623413085938, -0.545257568359375, -0.5150527954101562, -0.4848480224609375, -0.45464324951171875, -0.4244384765625, -0.39423370361328125, -0.3640289306640625, -0.33382415771484375, -0.303619384765625, -0.27341461181640625, -0.2432098388671875, -0.21300506591796875, -0.18280029296875, -0.15259552001953125, -0.1223907470703125, -0.09218597412109375, -0.061981201171875, -0.03177642822265625, -0.0015716552734375, 0.02863311767578125, 0.058837890625, 0.08904266357421875, 0.1192474365234375, 0.14945220947265625, 0.179656982421875, 0.20986175537109375, 0.2400665283203125, 0.27027130126953125, 0.30047607421875, 0.33068084716796875, 0.3608856201171875, 0.39109039306640625, 0.421295166015625, 0.45149993896484375, 0.4817047119140625, 0.5119094848632812, 0.5421142578125, 0.5723190307617188, 0.6025238037109375, 0.6327285766601562, 0.662933349609375, 0.6931381225585938, 0.7233428955078125, 0.7535476684570312, 0.78375244140625, 0.8139572143554688, 0.8441619873046875, 0.8743667602539062, 0.904571533203125, 0.9347763061523438, 0.9649810791015625, 0.9951858520507812, 1.025390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 10.0, 12.0, 20.0, 19.0, 29.0, 29.0, 38.0, 58.0, 54.0, 64.0, 68.0, 71.0, 61.0, 94.0, 61.0, 49.0, 48.0, 43.0, 37.0, 31.0, 29.0, 10.0, 13.0, 14.0, 11.0, 3.0, 6.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.959936141967773e-05, -9.492877870798111e-05, -9.025819599628448e-05, -8.558761328458786e-05, -8.091703057289124e-05, -7.624644786119461e-05, -7.157586514949799e-05, -6.690528243780136e-05, -6.223469972610474e-05, -5.756411701440811e-05, -5.289353430271149e-05, -4.822295159101486e-05, -4.355236887931824e-05, -3.888178616762161e-05, -3.421120345592499e-05, -2.9540620744228363e-05, -2.4870038032531738e-05, -2.0199455320835114e-05, -1.552887260913849e-05, -1.0858289897441864e-05, -6.187707185745239e-06, -1.5171244740486145e-06, 3.1534582376480103e-06, 7.824040949344635e-06, 1.249462366104126e-05, 1.7165206372737885e-05, 2.183578908443451e-05, 2.6506371796131134e-05, 3.117695450782776e-05, 3.5847537219524384e-05, 4.051811993122101e-05, 4.518870264291763e-05, 4.985928535461426e-05, 5.452986806631088e-05, 5.920045077800751e-05, 6.387103348970413e-05, 6.854161620140076e-05, 7.321219891309738e-05, 7.7882781624794e-05, 8.255336433649063e-05, 8.722394704818726e-05, 9.189452975988388e-05, 9.65651124715805e-05, 0.00010123569518327713, 0.00010590627789497375, 0.00011057686060667038, 0.000115247443318367, 0.00011991802603006363, 0.00012458860874176025, 0.00012925919145345688, 0.0001339297741651535, 0.00013860035687685013, 0.00014327093958854675, 0.00014794152230024338, 0.00015261210501194, 0.00015728268772363663, 0.00016195327043533325, 0.00016662385314702988, 0.0001712944358587265, 0.00017596501857042313, 0.00018063560128211975, 0.00018530618399381638, 0.000189976766705513, 0.00019464734941720963, 0.00019931793212890625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 1.0, 10.0, 12.0, 13.0, 27.0, 41.0, 60.0, 88.0, 129.0, 217.0, 287.0, 422.0, 667.0, 1075.0, 1652.0, 2470.0, 3977.0, 6149.0, 9712.0, 15748.0, 25573.0, 42546.0, 69971.0, 113460.0, 165525.0, 183976.0, 149682.0, 98763.0, 60665.0, 36499.0, 22133.0, 13477.0, 8644.0, 5268.0, 3379.0, 2171.0, 1376.0, 876.0, 627.0, 416.0, 260.0, 164.0, 133.0, 81.0, 49.0, 27.0, 31.0, 13.0, 7.0, 6.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3154296875, -1.2747650146484375, -1.234100341796875, -1.1934356689453125, -1.15277099609375, -1.1121063232421875, -1.071441650390625, -1.0307769775390625, -0.9901123046875, -0.9494476318359375, -0.908782958984375, -0.8681182861328125, -0.82745361328125, -0.7867889404296875, -0.746124267578125, -0.7054595947265625, -0.664794921875, -0.6241302490234375, -0.583465576171875, -0.5428009033203125, -0.50213623046875, -0.4614715576171875, -0.420806884765625, -0.3801422119140625, -0.3394775390625, -0.2988128662109375, -0.258148193359375, -0.2174835205078125, -0.17681884765625, -0.1361541748046875, -0.095489501953125, -0.0548248291015625, -0.01416015625, 0.0265045166015625, 0.067169189453125, 0.1078338623046875, 0.14849853515625, 0.1891632080078125, 0.229827880859375, 0.2704925537109375, 0.3111572265625, 0.3518218994140625, 0.392486572265625, 0.4331512451171875, 0.47381591796875, 0.5144805908203125, 0.555145263671875, 0.5958099365234375, 0.636474609375, 0.6771392822265625, 0.717803955078125, 0.7584686279296875, 0.79913330078125, 0.8397979736328125, 0.880462646484375, 0.9211273193359375, 0.9617919921875, 1.0024566650390625, 1.043121337890625, 1.0837860107421875, 1.12445068359375, 1.1651153564453125, 1.205780029296875, 1.2464447021484375, 1.287109375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 0.0, 7.0, 2.0, 5.0, 7.0, 8.0, 9.0, 16.0, 14.0, 15.0, 31.0, 33.0, 43.0, 46.0, 43.0, 42.0, 46.0, 57.0, 74.0, 58.0, 59.0, 66.0, 58.0, 50.0, 37.0, 30.0, 23.0, 14.0, 12.0, 17.0, 12.0, 11.0, 6.0, 8.0, 7.0, 6.0, 6.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0], "bins": [-0.5029296875, -0.4884834289550781, -0.47403717041015625, -0.4595909118652344, -0.4451446533203125, -0.4306983947753906, -0.41625213623046875, -0.4018058776855469, -0.387359619140625, -0.3729133605957031, -0.35846710205078125, -0.3440208435058594, -0.3295745849609375, -0.3151283264160156, -0.30068206787109375, -0.2862358093261719, -0.27178955078125, -0.2573432922363281, -0.24289703369140625, -0.22845077514648438, -0.2140045166015625, -0.19955825805664062, -0.18511199951171875, -0.17066574096679688, -0.156219482421875, -0.14177322387695312, -0.12732696533203125, -0.11288070678710938, -0.0984344482421875, -0.08398818969726562, -0.06954193115234375, -0.055095672607421875, -0.0406494140625, -0.026203155517578125, -0.01175689697265625, 0.002689361572265625, 0.0171356201171875, 0.031581878662109375, 0.04602813720703125, 0.060474395751953125, 0.074920654296875, 0.08936691284179688, 0.10381317138671875, 0.11825942993164062, 0.1327056884765625, 0.14715194702148438, 0.16159820556640625, 0.17604446411132812, 0.19049072265625, 0.20493698120117188, 0.21938323974609375, 0.23382949829101562, 0.2482757568359375, 0.2627220153808594, 0.27716827392578125, 0.2916145324707031, 0.306060791015625, 0.3205070495605469, 0.33495330810546875, 0.3493995666503906, 0.3638458251953125, 0.3782920837402344, 0.39273834228515625, 0.4071846008300781, 0.421630859375]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 4.0, 3.0, 7.0, 9.0, 14.0, 6.0, 16.0, 17.0, 17.0, 25.0, 28.0, 27.0, 43.0, 38.0, 41.0, 46.0, 48.0, 56.0, 39.0, 54.0, 47.0, 44.0, 46.0, 45.0, 41.0, 33.0, 33.0, 41.0, 29.0, 19.0, 16.0, 13.0, 16.0, 7.0, 9.0, 4.0, 3.0, 7.0, 6.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.841849327087402, -14.381918907165527, -13.921988487243652, -13.462057113647461, -13.002126693725586, -12.542196273803711, -12.082265853881836, -11.622335433959961, -11.16240406036377, -10.702473640441895, -10.24254322052002, -9.782611846923828, -9.322681427001953, -8.862751007080078, -8.402820587158203, -7.94288969039917, -7.482959270477295, -7.02302885055542, -6.563097953796387, -6.103167533874512, -5.6432366371154785, -5.1833062171936035, -4.72337532043457, -4.263444900512695, -3.803514242172241, -3.343583583831787, -2.883652925491333, -2.423722267150879, -1.9637917280197144, -1.5038611888885498, -1.0439305305480957, -0.5839998722076416, -0.1240692138671875, 0.3358614146709442, 0.7957920432090759, 1.2557226419448853, 1.7156533002853394, 2.175583839416504, 2.635514497756958, 3.095445156097412, 3.555375814437866, 4.01530647277832, 4.475236892700195, 4.9351677894592285, 5.3950982093811035, 5.855029106140137, 6.314959526062012, 6.774889945983887, 7.23482084274292, 7.694751262664795, 8.154682159423828, 8.614612579345703, 9.074542999267578, 9.534473419189453, 9.994404792785645, 10.45433521270752, 10.914265632629395, 11.37419605255127, 11.834126472473145, 12.294057846069336, 12.753988265991211, 13.213918685913086, 13.673849105834961, 14.133779525756836, 14.593710899353027]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 11.0, 5.0, 10.0, 7.0, 8.0, 13.0, 14.0, 24.0, 27.0, 19.0, 22.0, 46.0, 28.0, 40.0, 39.0, 48.0, 39.0, 36.0, 41.0, 44.0, 29.0, 40.0, 47.0, 35.0, 33.0, 34.0, 39.0, 30.0, 31.0, 22.0, 24.0, 24.0, 14.0, 18.0, 18.0, 10.0, 5.0, 8.0, 8.0, 6.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.263108253479004, -10.871716499328613, -10.480323791503906, -10.088932037353516, -9.697539329528809, -9.306147575378418, -8.914754867553711, -8.52336311340332, -8.13197135925293, -7.740579128265381, -7.349186897277832, -6.957795143127441, -6.566402435302734, -6.175010681152344, -5.783618450164795, -5.392226219177246, -5.000833511352539, -4.60944128036499, -4.218049049377441, -3.8266570568084717, -3.435264825820923, -3.043872594833374, -2.6524806022644043, -2.2610883712768555, -1.8696961402893066, -1.4783039093017578, -1.0869117975234985, -0.6955196857452393, -0.30412745475769043, 0.0872647762298584, 0.4786567687988281, 0.870048999786377, 1.2614412307739258, 1.6528334617614746, 2.0442256927490234, 2.435617685317993, 2.827009916305542, 3.218402147293091, 3.6097941398620605, 4.001186370849609, 4.392578601837158, 4.783970832824707, 5.175363063812256, 5.566755294799805, 5.958147048950195, 6.349539756774902, 6.740931510925293, 7.132323741912842, 7.523715972900391, 7.9151082038879395, 8.306500434875488, 8.697892189025879, 9.089284896850586, 9.480676651000977, 9.872068405151367, 10.263461112976074, 10.654853820800781, 11.046245574951172, 11.437638282775879, 11.82903003692627, 12.220422744750977, 12.611814498901367, 13.003206253051758, 13.394598960876465, 13.785990715026855]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 5.0, 5.0, 12.0, 12.0, 25.0, 52.0, 81.0, 145.0, 272.0, 451.0, 831.0, 1380.0, 2506.0, 4278.0, 7119.0, 11879.0, 18761.0, 28800.0, 42124.0, 58587.0, 77341.0, 94282.0, 107946.0, 112810.0, 109416.0, 97582.0, 80341.0, 62238.0, 45097.0, 31602.0, 20509.0, 12793.0, 7924.0, 4775.0, 2716.0, 1624.0, 961.0, 555.0, 327.0, 171.0, 92.0, 59.0, 38.0, 13.0, 9.0, 10.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.078125, -9.748779296875, -9.41943359375, -9.090087890625, -8.7607421875, -8.431396484375, -8.10205078125, -7.772705078125, -7.443359375, -7.114013671875, -6.78466796875, -6.455322265625, -6.1259765625, -5.796630859375, -5.46728515625, -5.137939453125, -4.80859375, -4.479248046875, -4.14990234375, -3.820556640625, -3.4912109375, -3.161865234375, -2.83251953125, -2.503173828125, -2.173828125, -1.844482421875, -1.51513671875, -1.185791015625, -0.8564453125, -0.527099609375, -0.19775390625, 0.131591796875, 0.4609375, 0.790283203125, 1.11962890625, 1.448974609375, 1.7783203125, 2.107666015625, 2.43701171875, 2.766357421875, 3.095703125, 3.425048828125, 3.75439453125, 4.083740234375, 4.4130859375, 4.742431640625, 5.07177734375, 5.401123046875, 5.73046875, 6.059814453125, 6.38916015625, 6.718505859375, 7.0478515625, 7.377197265625, 7.70654296875, 8.035888671875, 8.365234375, 8.694580078125, 9.02392578125, 9.353271484375, 9.6826171875, 10.011962890625, 10.34130859375, 10.670654296875, 11.0]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 7.0, 9.0, 11.0, 8.0, 7.0, 9.0, 16.0, 21.0, 19.0, 31.0, 16.0, 49.0, 23.0, 40.0, 42.0, 49.0, 34.0, 44.0, 35.0, 45.0, 32.0, 37.0, 48.0, 40.0, 36.0, 28.0, 42.0, 30.0, 30.0, 21.0, 24.0, 25.0, 19.0, 11.0, 23.0, 8.0, 8.0, 9.0, 7.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.015625, -10.63525390625, -10.2548828125, -9.87451171875, -9.494140625, -9.11376953125, -8.7333984375, -8.35302734375, -7.97265625, -7.59228515625, -7.2119140625, -6.83154296875, -6.451171875, -6.07080078125, -5.6904296875, -5.31005859375, -4.9296875, -4.54931640625, -4.1689453125, -3.78857421875, -3.408203125, -3.02783203125, -2.6474609375, -2.26708984375, -1.88671875, -1.50634765625, -1.1259765625, -0.74560546875, -0.365234375, 0.01513671875, 0.3955078125, 0.77587890625, 1.15625, 1.53662109375, 1.9169921875, 2.29736328125, 2.677734375, 3.05810546875, 3.4384765625, 3.81884765625, 4.19921875, 4.57958984375, 4.9599609375, 5.34033203125, 5.720703125, 6.10107421875, 6.4814453125, 6.86181640625, 7.2421875, 7.62255859375, 8.0029296875, 8.38330078125, 8.763671875, 9.14404296875, 9.5244140625, 9.90478515625, 10.28515625, 10.66552734375, 11.0458984375, 11.42626953125, 11.806640625, 12.18701171875, 12.5673828125, 12.94775390625, 13.328125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 6.0, 7.0, 18.0, 27.0, 29.0, 44.0, 83.0, 96.0, 149.0, 305.0, 407.0, 645.0, 1053.0, 1612.0, 2404.0, 3716.0, 5683.0, 8655.0, 12672.0, 18233.0, 26036.0, 35331.0, 46824.0, 59270.0, 72213.0, 83358.0, 91090.0, 94543.0, 92528.0, 84804.0, 73751.0, 61094.0, 48748.0, 36954.0, 26961.0, 19092.0, 13592.0, 9118.0, 6101.0, 4043.0, 2617.0, 1665.0, 1091.0, 644.0, 450.0, 318.0, 153.0, 119.0, 84.0, 46.0, 30.0, 26.0, 9.0, 5.0, 8.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.640625, -8.366943359375, -8.09326171875, -7.819580078125, -7.5458984375, -7.272216796875, -6.99853515625, -6.724853515625, -6.451171875, -6.177490234375, -5.90380859375, -5.630126953125, -5.3564453125, -5.082763671875, -4.80908203125, -4.535400390625, -4.26171875, -3.988037109375, -3.71435546875, -3.440673828125, -3.1669921875, -2.893310546875, -2.61962890625, -2.345947265625, -2.072265625, -1.798583984375, -1.52490234375, -1.251220703125, -0.9775390625, -0.703857421875, -0.43017578125, -0.156494140625, 0.1171875, 0.390869140625, 0.66455078125, 0.938232421875, 1.2119140625, 1.485595703125, 1.75927734375, 2.032958984375, 2.306640625, 2.580322265625, 2.85400390625, 3.127685546875, 3.4013671875, 3.675048828125, 3.94873046875, 4.222412109375, 4.49609375, 4.769775390625, 5.04345703125, 5.317138671875, 5.5908203125, 5.864501953125, 6.13818359375, 6.411865234375, 6.685546875, 6.959228515625, 7.23291015625, 7.506591796875, 7.7802734375, 8.053955078125, 8.32763671875, 8.601318359375, 8.875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 7.0, 6.0, 4.0, 11.0, 9.0, 10.0, 12.0, 13.0, 15.0, 15.0, 22.0, 23.0, 22.0, 30.0, 27.0, 28.0, 39.0, 29.0, 23.0, 29.0, 44.0, 35.0, 38.0, 25.0, 26.0, 43.0, 39.0, 33.0, 37.0, 28.0, 31.0, 24.0, 28.0, 23.0, 22.0, 23.0, 25.0, 11.0, 16.0, 10.0, 12.0, 15.0, 7.0, 6.0, 1.0, 4.0, 3.0, 7.0, 2.0, 3.0, 1.0, 3.0, 3.0], "bins": [-7.20703125, -6.9986572265625, -6.790283203125, -6.5819091796875, -6.37353515625, -6.1651611328125, -5.956787109375, -5.7484130859375, -5.5400390625, -5.3316650390625, -5.123291015625, -4.9149169921875, -4.70654296875, -4.4981689453125, -4.289794921875, -4.0814208984375, -3.873046875, -3.6646728515625, -3.456298828125, -3.2479248046875, -3.03955078125, -2.8311767578125, -2.622802734375, -2.4144287109375, -2.2060546875, -1.9976806640625, -1.789306640625, -1.5809326171875, -1.37255859375, -1.1641845703125, -0.955810546875, -0.7474365234375, -0.5390625, -0.3306884765625, -0.122314453125, 0.0860595703125, 0.29443359375, 0.5028076171875, 0.711181640625, 0.9195556640625, 1.1279296875, 1.3363037109375, 1.544677734375, 1.7530517578125, 1.96142578125, 2.1697998046875, 2.378173828125, 2.5865478515625, 2.794921875, 3.0032958984375, 3.211669921875, 3.4200439453125, 3.62841796875, 3.8367919921875, 4.045166015625, 4.2535400390625, 4.4619140625, 4.6702880859375, 4.878662109375, 5.0870361328125, 5.29541015625, 5.5037841796875, 5.712158203125, 5.9205322265625, 6.12890625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 10.0, 22.0, 30.0, 55.0, 77.0, 106.0, 181.0, 279.0, 439.0, 642.0, 1066.0, 1691.0, 2790.0, 4339.0, 6916.0, 11103.0, 17903.0, 28122.0, 42957.0, 62653.0, 85729.0, 107381.0, 121930.0, 126182.0, 114944.0, 95152.0, 72082.0, 51278.0, 33974.0, 21996.0, 13790.0, 8593.0, 5399.0, 3202.0, 1942.0, 1259.0, 875.0, 524.0, 314.0, 205.0, 145.0, 95.0, 64.0, 39.0, 26.0, 14.0, 14.0, 8.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0], "bins": [-5.12109375, -4.9669189453125, -4.812744140625, -4.6585693359375, -4.50439453125, -4.3502197265625, -4.196044921875, -4.0418701171875, -3.8876953125, -3.7335205078125, -3.579345703125, -3.4251708984375, -3.27099609375, -3.1168212890625, -2.962646484375, -2.8084716796875, -2.654296875, -2.5001220703125, -2.345947265625, -2.1917724609375, -2.03759765625, -1.8834228515625, -1.729248046875, -1.5750732421875, -1.4208984375, -1.2667236328125, -1.112548828125, -0.9583740234375, -0.80419921875, -0.6500244140625, -0.495849609375, -0.3416748046875, -0.1875, -0.0333251953125, 0.120849609375, 0.2750244140625, 0.42919921875, 0.5833740234375, 0.737548828125, 0.8917236328125, 1.0458984375, 1.2000732421875, 1.354248046875, 1.5084228515625, 1.66259765625, 1.8167724609375, 1.970947265625, 2.1251220703125, 2.279296875, 2.4334716796875, 2.587646484375, 2.7418212890625, 2.89599609375, 3.0501708984375, 3.204345703125, 3.3585205078125, 3.5126953125, 3.6668701171875, 3.821044921875, 3.9752197265625, 4.12939453125, 4.2835693359375, 4.437744140625, 4.5919189453125, 4.74609375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 6.0, 7.0, 7.0, 14.0, 19.0, 13.0, 28.0, 23.0, 37.0, 20.0, 42.0, 29.0, 34.0, 55.0, 42.0, 40.0, 54.0, 52.0, 56.0, 46.0, 49.0, 40.0, 51.0, 32.0, 31.0, 28.0, 22.0, 29.0, 23.0, 16.0, 14.0, 4.0, 6.0, 8.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0007028579711914062, -0.0006838962435722351, -0.000664934515953064, -0.0006459727883338928, -0.0006270110607147217, -0.0006080493330955505, -0.0005890876054763794, -0.0005701258778572083, -0.0005511641502380371, -0.000532202422618866, -0.0005132406949996948, -0.0004942789673805237, -0.00047531723976135254, -0.0004563555121421814, -0.00043739378452301025, -0.0004184320569038391, -0.00039947032928466797, -0.0003805086016654968, -0.0003615468740463257, -0.00034258514642715454, -0.0003236234188079834, -0.00030466169118881226, -0.0002856999635696411, -0.00026673823595046997, -0.00024777650833129883, -0.00022881478071212769, -0.00020985305309295654, -0.0001908913254737854, -0.00017192959785461426, -0.00015296787023544312, -0.00013400614261627197, -0.00011504441499710083, -9.608268737792969e-05, -7.712095975875854e-05, -5.81592321395874e-05, -3.919750452041626e-05, -2.0235776901245117e-05, -1.2740492820739746e-06, 1.7687678337097168e-05, 3.664940595626831e-05, 5.561113357543945e-05, 7.45728611946106e-05, 9.353458881378174e-05, 0.00011249631643295288, 0.00013145804405212402, 0.00015041977167129517, 0.0001693814992904663, 0.00018834322690963745, 0.0002073049545288086, 0.00022626668214797974, 0.0002452284097671509, 0.000264190137386322, 0.00028315186500549316, 0.0003021135926246643, 0.00032107532024383545, 0.0003400370478630066, 0.00035899877548217773, 0.0003779605031013489, 0.00039692223072052, 0.00041588395833969116, 0.0004348456859588623, 0.00045380741357803345, 0.0004727691411972046, 0.0004917308688163757, 0.0005106925964355469]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 6.0, 8.0, 9.0, 12.0, 25.0, 27.0, 71.0, 86.0, 136.0, 250.0, 395.0, 710.0, 1101.0, 1989.0, 3292.0, 5903.0, 10365.0, 18562.0, 32547.0, 54926.0, 86720.0, 123533.0, 152690.0, 158119.0, 136638.0, 100564.0, 66495.0, 40056.0, 23115.0, 13056.0, 7382.0, 4109.0, 2255.0, 1320.0, 782.0, 491.0, 317.0, 189.0, 120.0, 67.0, 38.0, 36.0, 21.0, 14.0, 7.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3203125, -7.08563232421875, -6.8509521484375, -6.61627197265625, -6.381591796875, -6.14691162109375, -5.9122314453125, -5.67755126953125, -5.44287109375, -5.20819091796875, -4.9735107421875, -4.73883056640625, -4.504150390625, -4.26947021484375, -4.0347900390625, -3.80010986328125, -3.5654296875, -3.33074951171875, -3.0960693359375, -2.86138916015625, -2.626708984375, -2.39202880859375, -2.1573486328125, -1.92266845703125, -1.68798828125, -1.45330810546875, -1.2186279296875, -0.98394775390625, -0.749267578125, -0.51458740234375, -0.2799072265625, -0.04522705078125, 0.189453125, 0.42413330078125, 0.6588134765625, 0.89349365234375, 1.128173828125, 1.36285400390625, 1.5975341796875, 1.83221435546875, 2.06689453125, 2.30157470703125, 2.5362548828125, 2.77093505859375, 3.005615234375, 3.24029541015625, 3.4749755859375, 3.70965576171875, 3.9443359375, 4.17901611328125, 4.4136962890625, 4.64837646484375, 4.883056640625, 5.11773681640625, 5.3524169921875, 5.58709716796875, 5.82177734375, 6.05645751953125, 6.2911376953125, 6.52581787109375, 6.760498046875, 6.99517822265625, 7.2298583984375, 7.46453857421875, 7.69921875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 10.0, 11.0, 21.0, 18.0, 24.0, 28.0, 35.0, 50.0, 47.0, 81.0, 85.0, 68.0, 78.0, 66.0, 65.0, 67.0, 55.0, 48.0, 48.0, 20.0, 25.0, 15.0, 17.0, 5.0, 7.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.720703125, -3.6092529296875, -3.497802734375, -3.3863525390625, -3.27490234375, -3.1634521484375, -3.052001953125, -2.9405517578125, -2.8291015625, -2.7176513671875, -2.606201171875, -2.4947509765625, -2.38330078125, -2.2718505859375, -2.160400390625, -2.0489501953125, -1.9375, -1.8260498046875, -1.714599609375, -1.6031494140625, -1.49169921875, -1.3802490234375, -1.268798828125, -1.1573486328125, -1.0458984375, -0.9344482421875, -0.822998046875, -0.7115478515625, -0.60009765625, -0.4886474609375, -0.377197265625, -0.2657470703125, -0.154296875, -0.0428466796875, 0.068603515625, 0.1800537109375, 0.29150390625, 0.4029541015625, 0.514404296875, 0.6258544921875, 0.7373046875, 0.8487548828125, 0.960205078125, 1.0716552734375, 1.18310546875, 1.2945556640625, 1.406005859375, 1.5174560546875, 1.62890625, 1.7403564453125, 1.851806640625, 1.9632568359375, 2.07470703125, 2.1861572265625, 2.297607421875, 2.4090576171875, 2.5205078125, 2.6319580078125, 2.743408203125, 2.8548583984375, 2.96630859375, 3.0777587890625, 3.189208984375, 3.3006591796875, 3.412109375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 2.0, 3.0, 3.0, 4.0, 6.0, 8.0, 8.0, 7.0, 8.0, 9.0, 9.0, 15.0, 26.0, 11.0, 22.0, 22.0, 22.0, 37.0, 26.0, 31.0, 35.0, 38.0, 43.0, 37.0, 54.0, 40.0, 48.0, 40.0, 54.0, 35.0, 43.0, 32.0, 30.0, 22.0, 31.0, 22.0, 19.0, 25.0, 16.0, 6.0, 7.0, 8.0, 7.0, 12.0, 6.0, 4.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.578065872192383, -11.183698654174805, -10.789332389831543, -10.394965171813965, -10.000597953796387, -9.606231689453125, -9.211864471435547, -8.817497253417969, -8.42313003540039, -8.028762817382812, -7.634396076202393, -7.240029335021973, -6.8456621170043945, -6.451295375823975, -6.056928634643555, -5.662561416625977, -5.268195152282715, -4.873828411102295, -4.479461193084717, -4.085094451904297, -3.690727472305298, -3.296360492706299, -2.901993751525879, -2.50762677192688, -2.113259792327881, -1.7188928127288818, -1.3245259523391724, -0.9301590919494629, -0.5357921123504639, -0.14142513275146484, 0.2529416084289551, 0.6473085880279541, 1.0416755676269531, 1.4360425472259521, 1.8304094076156616, 2.224776268005371, 2.61914324760437, 3.013510227203369, 3.407876968383789, 3.802243947982788, 4.196610927581787, 4.590977668762207, 4.985344886779785, 5.379711627960205, 5.774078369140625, 6.168445587158203, 6.562812328338623, 6.957179069519043, 7.351546287536621, 7.745913028717041, 8.140279769897461, 8.534646987915039, 8.929014205932617, 9.323381423950195, 9.717747688293457, 10.112114906311035, 10.506481170654297, 10.900848388671875, 11.295214653015137, 11.689581871032715, 12.083949089050293, 12.478315353393555, 12.872682571411133, 13.267049789428711, 13.661417007446289]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 10.0, 11.0, 9.0, 8.0, 8.0, 11.0, 15.0, 22.0, 16.0, 23.0, 21.0, 28.0, 22.0, 35.0, 37.0, 41.0, 38.0, 37.0, 29.0, 52.0, 42.0, 31.0, 33.0, 29.0, 34.0, 25.0, 32.0, 40.0, 31.0, 41.0, 33.0, 25.0, 15.0, 18.0, 12.0, 13.0, 17.0, 15.0, 9.0, 4.0, 7.0, 9.0, 7.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.059592247009277, -10.678985595703125, -10.298379898071289, -9.917774200439453, -9.5371675491333, -9.156560897827148, -8.775955200195312, -8.395349502563477, -8.014742851257324, -7.63413667678833, -7.253530502319336, -6.872924327850342, -6.492318153381348, -6.1117119789123535, -5.731105804443359, -5.350499629974365, -4.969893455505371, -4.589287281036377, -4.208681106567383, -3.8280749320983887, -3.4474687576293945, -3.0668625831604004, -2.6862564086914062, -2.305650234222412, -1.925044059753418, -1.5444378852844238, -1.1638317108154297, -0.7832255363464355, -0.4026193618774414, -0.022013187408447266, 0.3585929870605469, 0.739199161529541, 1.1198053359985352, 1.5004115104675293, 1.8810176849365234, 2.2616238594055176, 2.6422300338745117, 3.022836208343506, 3.4034423828125, 3.784048557281494, 4.164654731750488, 4.545260906219482, 4.925867080688477, 5.306473255157471, 5.687079429626465, 6.067685604095459, 6.448291778564453, 6.828897953033447, 7.209504127502441, 7.5901103019714355, 7.97071647644043, 8.351322174072266, 8.731928825378418, 9.11253547668457, 9.493141174316406, 9.873746871948242, 10.254353523254395, 10.634960174560547, 11.015565872192383, 11.396171569824219, 11.776778221130371, 12.157384872436523, 12.53799057006836, 12.918596267700195, 13.299202919006348]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 14.0, 31.0, 33.0, 58.0, 119.0, 176.0, 325.0, 548.0, 924.0, 1543.0, 2538.0, 4142.0, 6849.0, 11088.0, 17722.0, 27710.0, 42817.0, 65007.0, 96655.0, 137396.0, 190933.0, 252039.0, 316092.0, 373063.0, 410780.0, 421996.0, 402189.0, 355578.0, 293255.0, 229475.0, 171099.0, 122116.0, 83953.0, 56058.0, 37009.0, 23959.0, 15037.0, 9382.0, 5916.0, 3438.0, 2092.0, 1241.0, 761.0, 459.0, 279.0, 172.0, 82.0, 50.0, 38.0, 21.0, 11.0, 16.0, 2.0, 1.0, 1.0, 1.0], "bins": [-9.4375, -9.154296875, -8.87109375, -8.587890625, -8.3046875, -8.021484375, -7.73828125, -7.455078125, -7.171875, -6.888671875, -6.60546875, -6.322265625, -6.0390625, -5.755859375, -5.47265625, -5.189453125, -4.90625, -4.623046875, -4.33984375, -4.056640625, -3.7734375, -3.490234375, -3.20703125, -2.923828125, -2.640625, -2.357421875, -2.07421875, -1.791015625, -1.5078125, -1.224609375, -0.94140625, -0.658203125, -0.375, -0.091796875, 0.19140625, 0.474609375, 0.7578125, 1.041015625, 1.32421875, 1.607421875, 1.890625, 2.173828125, 2.45703125, 2.740234375, 3.0234375, 3.306640625, 3.58984375, 3.873046875, 4.15625, 4.439453125, 4.72265625, 5.005859375, 5.2890625, 5.572265625, 5.85546875, 6.138671875, 6.421875, 6.705078125, 6.98828125, 7.271484375, 7.5546875, 7.837890625, 8.12109375, 8.404296875, 8.6875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 8.0, 10.0, 11.0, 12.0, 7.0, 9.0, 18.0, 14.0, 18.0, 21.0, 19.0, 31.0, 25.0, 23.0, 39.0, 41.0, 44.0, 33.0, 25.0, 54.0, 40.0, 39.0, 29.0, 21.0, 42.0, 23.0, 32.0, 37.0, 39.0, 34.0, 35.0, 24.0, 25.0, 15.0, 11.0, 20.0, 15.0, 14.0, 6.0, 10.0, 5.0, 9.0, 7.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.359375, -9.02978515625, -8.7001953125, -8.37060546875, -8.041015625, -7.71142578125, -7.3818359375, -7.05224609375, -6.72265625, -6.39306640625, -6.0634765625, -5.73388671875, -5.404296875, -5.07470703125, -4.7451171875, -4.41552734375, -4.0859375, -3.75634765625, -3.4267578125, -3.09716796875, -2.767578125, -2.43798828125, -2.1083984375, -1.77880859375, -1.44921875, -1.11962890625, -0.7900390625, -0.46044921875, -0.130859375, 0.19873046875, 0.5283203125, 0.85791015625, 1.1875, 1.51708984375, 1.8466796875, 2.17626953125, 2.505859375, 2.83544921875, 3.1650390625, 3.49462890625, 3.82421875, 4.15380859375, 4.4833984375, 4.81298828125, 5.142578125, 5.47216796875, 5.8017578125, 6.13134765625, 6.4609375, 6.79052734375, 7.1201171875, 7.44970703125, 7.779296875, 8.10888671875, 8.4384765625, 8.76806640625, 9.09765625, 9.42724609375, 9.7568359375, 10.08642578125, 10.416015625, 10.74560546875, 11.0751953125, 11.40478515625, 11.734375]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 6.0, 5.0, 5.0, 13.0, 13.0, 30.0, 50.0, 107.0, 181.0, 314.0, 552.0, 925.0, 1542.0, 2677.0, 4332.0, 7220.0, 11993.0, 19265.0, 30219.0, 45747.0, 69248.0, 100234.0, 141294.0, 190550.0, 245153.0, 301054.0, 350777.0, 384525.0, 395377.0, 382747.0, 349688.0, 299251.0, 242908.0, 187448.0, 139779.0, 99026.0, 67641.0, 45262.0, 29426.0, 18274.0, 11726.0, 7211.0, 4345.0, 2527.0, 1512.0, 895.0, 498.0, 301.0, 183.0, 101.0, 55.0, 33.0, 29.0, 14.0, 9.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.9921875, -8.6971435546875, -8.402099609375, -8.1070556640625, -7.81201171875, -7.5169677734375, -7.221923828125, -6.9268798828125, -6.6318359375, -6.3367919921875, -6.041748046875, -5.7467041015625, -5.45166015625, -5.1566162109375, -4.861572265625, -4.5665283203125, -4.271484375, -3.9764404296875, -3.681396484375, -3.3863525390625, -3.09130859375, -2.7962646484375, -2.501220703125, -2.2061767578125, -1.9111328125, -1.6160888671875, -1.321044921875, -1.0260009765625, -0.73095703125, -0.4359130859375, -0.140869140625, 0.1541748046875, 0.44921875, 0.7442626953125, 1.039306640625, 1.3343505859375, 1.62939453125, 1.9244384765625, 2.219482421875, 2.5145263671875, 2.8095703125, 3.1046142578125, 3.399658203125, 3.6947021484375, 3.98974609375, 4.2847900390625, 4.579833984375, 4.8748779296875, 5.169921875, 5.4649658203125, 5.760009765625, 6.0550537109375, 6.35009765625, 6.6451416015625, 6.940185546875, 7.2352294921875, 7.5302734375, 7.8253173828125, 8.120361328125, 8.4154052734375, 8.71044921875, 9.0054931640625, 9.300537109375, 9.5955810546875, 9.890625]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 9.0, 4.0, 9.0, 14.0, 17.0, 18.0, 30.0, 40.0, 48.0, 56.0, 72.0, 80.0, 91.0, 105.0, 127.0, 119.0, 110.0, 149.0, 160.0, 200.0, 168.0, 184.0, 211.0, 177.0, 200.0, 185.0, 177.0, 168.0, 155.0, 145.0, 140.0, 114.0, 95.0, 93.0, 72.0, 71.0, 56.0, 53.0, 35.0, 28.0, 27.0, 21.0, 12.0, 18.0, 4.0, 3.0, 1.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.0234375, -4.86700439453125, -4.7105712890625, -4.55413818359375, -4.397705078125, -4.24127197265625, -4.0848388671875, -3.92840576171875, -3.77197265625, -3.61553955078125, -3.4591064453125, -3.30267333984375, -3.146240234375, -2.98980712890625, -2.8333740234375, -2.67694091796875, -2.5205078125, -2.36407470703125, -2.2076416015625, -2.05120849609375, -1.894775390625, -1.73834228515625, -1.5819091796875, -1.42547607421875, -1.26904296875, -1.11260986328125, -0.9561767578125, -0.79974365234375, -0.643310546875, -0.48687744140625, -0.3304443359375, -0.17401123046875, -0.017578125, 0.13885498046875, 0.2952880859375, 0.45172119140625, 0.608154296875, 0.76458740234375, 0.9210205078125, 1.07745361328125, 1.23388671875, 1.39031982421875, 1.5467529296875, 1.70318603515625, 1.859619140625, 2.01605224609375, 2.1724853515625, 2.32891845703125, 2.4853515625, 2.64178466796875, 2.7982177734375, 2.95465087890625, 3.111083984375, 3.26751708984375, 3.4239501953125, 3.58038330078125, 3.73681640625, 3.89324951171875, 4.0496826171875, 4.20611572265625, 4.362548828125, 4.51898193359375, 4.6754150390625, 4.83184814453125, 4.98828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 5.0, 3.0, 5.0, 4.0, 3.0, 11.0, 9.0, 13.0, 10.0, 24.0, 25.0, 18.0, 26.0, 20.0, 26.0, 38.0, 29.0, 47.0, 47.0, 39.0, 51.0, 45.0, 39.0, 46.0, 37.0, 45.0, 36.0, 32.0, 35.0, 31.0, 24.0, 29.0, 35.0, 17.0, 21.0, 11.0, 10.0, 11.0, 8.0, 13.0, 8.0, 4.0, 6.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-15.261646270751953, -14.843293190002441, -14.42494010925293, -14.006586074829102, -13.58823299407959, -13.169879913330078, -12.751526832580566, -12.333173751831055, -11.914820671081543, -11.496467590332031, -11.07811450958252, -10.659761428833008, -10.24140739440918, -9.823054313659668, -9.404701232910156, -8.986348152160645, -8.567995071411133, -8.149641990661621, -7.731288433074951, -7.3129353523254395, -6.894582271575928, -6.476228713989258, -6.057875633239746, -5.639522552490234, -5.221168518066406, -4.8028154373168945, -4.384461879730225, -3.966108798980713, -3.547755718231201, -3.1294023990631104, -2.7110490798950195, -2.292695999145508, -1.874342918395996, -1.4559897184371948, -1.0376365184783936, -0.6192831993103027, -0.20092999935150146, 0.2174232006072998, 0.6357765197753906, 1.0541296005249023, 1.4724829196929932, 1.8908361196517944, 2.3091893196105957, 2.7275426387786865, 3.1458959579467773, 3.564249038696289, 3.98260235786438, 4.4009552001953125, 4.819308757781982, 5.237661838531494, 5.656015396118164, 6.074368476867676, 6.4927215576171875, 6.911074638366699, 7.329428195953369, 7.747781276702881, 8.16613483428955, 8.584487915039062, 9.002840995788574, 9.421194076538086, 9.839548110961914, 10.257901191711426, 10.676254272460938, 11.09460735321045, 11.512960433959961]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 7.0, 4.0, 12.0, 10.0, 5.0, 12.0, 8.0, 10.0, 20.0, 24.0, 26.0, 23.0, 26.0, 37.0, 35.0, 36.0, 19.0, 32.0, 56.0, 40.0, 27.0, 46.0, 26.0, 29.0, 36.0, 25.0, 44.0, 29.0, 27.0, 33.0, 32.0, 29.0, 28.0, 18.0, 16.0, 14.0, 18.0, 11.0, 21.0, 8.0, 7.0, 8.0, 7.0, 3.0, 6.0, 2.0, 5.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.496857643127441, -11.12658405303955, -10.75631046295166, -10.38603687286377, -10.015763282775879, -9.645489692687988, -9.275216102600098, -8.904942512512207, -8.534668922424316, -8.164395332336426, -7.794121742248535, -7.4238481521606445, -7.053574562072754, -6.683300971984863, -6.313027381896973, -5.942753791809082, -5.572480201721191, -5.202206611633301, -4.83193302154541, -4.4616594314575195, -4.091385841369629, -3.7211122512817383, -3.3508386611938477, -2.980565071105957, -2.6102914810180664, -2.240017890930176, -1.8697443008422852, -1.4994707107543945, -1.129197120666504, -0.7589235305786133, -0.38864994049072266, -0.01837635040283203, 0.3518962860107422, 0.7221698760986328, 1.0924434661865234, 1.462717056274414, 1.8329906463623047, 2.2032642364501953, 2.573537826538086, 2.9438114166259766, 3.314085006713867, 3.684358596801758, 4.054632186889648, 4.424905776977539, 4.79517936706543, 5.16545295715332, 5.535726547241211, 5.906000137329102, 6.276273727416992, 6.646547317504883, 7.016820907592773, 7.387094497680664, 7.757368087768555, 8.127641677856445, 8.497915267944336, 8.868188858032227, 9.238462448120117, 9.608736038208008, 9.979009628295898, 10.349283218383789, 10.71955680847168, 11.08983039855957, 11.460103988647461, 11.830377578735352, 12.200651168823242]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 8.0, 7.0, 17.0, 22.0, 28.0, 35.0, 50.0, 79.0, 97.0, 180.0, 216.0, 347.0, 463.0, 708.0, 1122.0, 1575.0, 2484.0, 3980.0, 6312.0, 10062.0, 16443.0, 27984.0, 47033.0, 79884.0, 128989.0, 177279.0, 182685.0, 139492.0, 88198.0, 52704.0, 31261.0, 18491.0, 10985.0, 6847.0, 4276.0, 2858.0, 1753.0, 1136.0, 801.0, 540.0, 361.0, 256.0, 159.0, 105.0, 83.0, 49.0, 31.0, 33.0, 17.0, 20.0, 3.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.818359375, -2.73321533203125, -2.6480712890625, -2.56292724609375, -2.477783203125, -2.39263916015625, -2.3074951171875, -2.22235107421875, -2.13720703125, -2.05206298828125, -1.9669189453125, -1.88177490234375, -1.796630859375, -1.71148681640625, -1.6263427734375, -1.54119873046875, -1.4560546875, -1.37091064453125, -1.2857666015625, -1.20062255859375, -1.115478515625, -1.03033447265625, -0.9451904296875, -0.86004638671875, -0.77490234375, -0.68975830078125, -0.6046142578125, -0.51947021484375, -0.434326171875, -0.34918212890625, -0.2640380859375, -0.17889404296875, -0.09375, -0.00860595703125, 0.0765380859375, 0.16168212890625, 0.246826171875, 0.33197021484375, 0.4171142578125, 0.50225830078125, 0.58740234375, 0.67254638671875, 0.7576904296875, 0.84283447265625, 0.927978515625, 1.01312255859375, 1.0982666015625, 1.18341064453125, 1.2685546875, 1.35369873046875, 1.4388427734375, 1.52398681640625, 1.609130859375, 1.69427490234375, 1.7794189453125, 1.86456298828125, 1.94970703125, 2.03485107421875, 2.1199951171875, 2.20513916015625, 2.290283203125, 2.37542724609375, 2.4605712890625, 2.54571533203125, 2.630859375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 8.0, 4.0, 12.0, 9.0, 6.0, 11.0, 9.0, 10.0, 20.0, 24.0, 28.0, 19.0, 29.0, 34.0, 36.0, 37.0, 18.0, 30.0, 58.0, 39.0, 29.0, 42.0, 30.0, 30.0, 32.0, 28.0, 42.0, 30.0, 26.0, 30.0, 37.0, 27.0, 29.0, 19.0, 15.0, 14.0, 18.0, 12.0, 18.0, 10.0, 8.0, 8.0, 7.0, 3.0, 5.0, 3.0, 5.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.4609375, -11.091064453125, -10.72119140625, -10.351318359375, -9.9814453125, -9.611572265625, -9.24169921875, -8.871826171875, -8.501953125, -8.132080078125, -7.76220703125, -7.392333984375, -7.0224609375, -6.652587890625, -6.28271484375, -5.912841796875, -5.54296875, -5.173095703125, -4.80322265625, -4.433349609375, -4.0634765625, -3.693603515625, -3.32373046875, -2.953857421875, -2.583984375, -2.214111328125, -1.84423828125, -1.474365234375, -1.1044921875, -0.734619140625, -0.36474609375, 0.005126953125, 0.375, 0.744873046875, 1.11474609375, 1.484619140625, 1.8544921875, 2.224365234375, 2.59423828125, 2.964111328125, 3.333984375, 3.703857421875, 4.07373046875, 4.443603515625, 4.8134765625, 5.183349609375, 5.55322265625, 5.923095703125, 6.29296875, 6.662841796875, 7.03271484375, 7.402587890625, 7.7724609375, 8.142333984375, 8.51220703125, 8.882080078125, 9.251953125, 9.621826171875, 9.99169921875, 10.361572265625, 10.7314453125, 11.101318359375, 11.47119140625, 11.841064453125, 12.2109375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 9.0, 8.0, 8.0, 13.0, 16.0, 25.0, 34.0, 59.0, 75.0, 92.0, 148.0, 234.0, 341.0, 497.0, 737.0, 1112.0, 1883.0, 2939.0, 4805.0, 8528.0, 15334.0, 28822.0, 55584.0, 112475.0, 215458.0, 263207.0, 163633.0, 81807.0, 40888.0, 21320.0, 11459.0, 6610.0, 3860.0, 2378.0, 1430.0, 926.0, 600.0, 399.0, 252.0, 187.0, 113.0, 72.0, 53.0, 43.0, 26.0, 19.0, 8.0, 7.0, 10.0, 2.0, 8.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.23046875, -3.13037109375, -3.0302734375, -2.93017578125, -2.830078125, -2.72998046875, -2.6298828125, -2.52978515625, -2.4296875, -2.32958984375, -2.2294921875, -2.12939453125, -2.029296875, -1.92919921875, -1.8291015625, -1.72900390625, -1.62890625, -1.52880859375, -1.4287109375, -1.32861328125, -1.228515625, -1.12841796875, -1.0283203125, -0.92822265625, -0.828125, -0.72802734375, -0.6279296875, -0.52783203125, -0.427734375, -0.32763671875, -0.2275390625, -0.12744140625, -0.02734375, 0.07275390625, 0.1728515625, 0.27294921875, 0.373046875, 0.47314453125, 0.5732421875, 0.67333984375, 0.7734375, 0.87353515625, 0.9736328125, 1.07373046875, 1.173828125, 1.27392578125, 1.3740234375, 1.47412109375, 1.57421875, 1.67431640625, 1.7744140625, 1.87451171875, 1.974609375, 2.07470703125, 2.1748046875, 2.27490234375, 2.375, 2.47509765625, 2.5751953125, 2.67529296875, 2.775390625, 2.87548828125, 2.9755859375, 3.07568359375, 3.17578125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 7.0, 10.0, 7.0, 6.0, 6.0, 13.0, 8.0, 9.0, 16.0, 13.0, 21.0, 30.0, 23.0, 30.0, 31.0, 46.0, 34.0, 36.0, 35.0, 27.0, 42.0, 44.0, 36.0, 38.0, 36.0, 43.0, 42.0, 45.0, 31.0, 26.0, 27.0, 26.0, 25.0, 22.0, 24.0, 21.0, 12.0, 11.0, 12.0, 4.0, 7.0, 1.0, 2.0, 7.0, 7.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.3515625, -8.094970703125, -7.83837890625, -7.581787109375, -7.3251953125, -7.068603515625, -6.81201171875, -6.555419921875, -6.298828125, -6.042236328125, -5.78564453125, -5.529052734375, -5.2724609375, -5.015869140625, -4.75927734375, -4.502685546875, -4.24609375, -3.989501953125, -3.73291015625, -3.476318359375, -3.2197265625, -2.963134765625, -2.70654296875, -2.449951171875, -2.193359375, -1.936767578125, -1.68017578125, -1.423583984375, -1.1669921875, -0.910400390625, -0.65380859375, -0.397216796875, -0.140625, 0.115966796875, 0.37255859375, 0.629150390625, 0.8857421875, 1.142333984375, 1.39892578125, 1.655517578125, 1.912109375, 2.168701171875, 2.42529296875, 2.681884765625, 2.9384765625, 3.195068359375, 3.45166015625, 3.708251953125, 3.96484375, 4.221435546875, 4.47802734375, 4.734619140625, 4.9912109375, 5.247802734375, 5.50439453125, 5.760986328125, 6.017578125, 6.274169921875, 6.53076171875, 6.787353515625, 7.0439453125, 7.300537109375, 7.55712890625, 7.813720703125, 8.0703125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 5.0, 6.0, 4.0, 11.0, 13.0, 14.0, 28.0, 29.0, 44.0, 61.0, 81.0, 110.0, 179.0, 219.0, 341.0, 462.0, 623.0, 1039.0, 1723.0, 2552.0, 4434.0, 8251.0, 17004.0, 41182.0, 128947.0, 427006.0, 281739.0, 75953.0, 27790.0, 12353.0, 6414.0, 3589.0, 2147.0, 1347.0, 896.0, 571.0, 394.0, 296.0, 192.0, 144.0, 96.0, 79.0, 59.0, 31.0, 32.0, 25.0, 16.0, 11.0, 9.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4619140625, -1.417327880859375, -1.37274169921875, -1.328155517578125, -1.2835693359375, -1.238983154296875, -1.19439697265625, -1.149810791015625, -1.105224609375, -1.060638427734375, -1.01605224609375, -0.971466064453125, -0.9268798828125, -0.882293701171875, -0.83770751953125, -0.793121337890625, -0.74853515625, -0.703948974609375, -0.65936279296875, -0.614776611328125, -0.5701904296875, -0.525604248046875, -0.48101806640625, -0.436431884765625, -0.391845703125, -0.347259521484375, -0.30267333984375, -0.258087158203125, -0.2135009765625, -0.168914794921875, -0.12432861328125, -0.079742431640625, -0.03515625, 0.009429931640625, 0.05401611328125, 0.098602294921875, 0.1431884765625, 0.187774658203125, 0.23236083984375, 0.276947021484375, 0.321533203125, 0.366119384765625, 0.41070556640625, 0.455291748046875, 0.4998779296875, 0.544464111328125, 0.58905029296875, 0.633636474609375, 0.67822265625, 0.722808837890625, 0.76739501953125, 0.811981201171875, 0.8565673828125, 0.901153564453125, 0.94573974609375, 0.990325927734375, 1.034912109375, 1.079498291015625, 1.12408447265625, 1.168670654296875, 1.2132568359375, 1.257843017578125, 1.30242919921875, 1.347015380859375, 1.3916015625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 5.0, 9.0, 9.0, 7.0, 16.0, 15.0, 23.0, 26.0, 29.0, 33.0, 47.0, 56.0, 46.0, 57.0, 66.0, 59.0, 61.0, 54.0, 44.0, 58.0, 52.0, 31.0, 39.0, 34.0, 20.0, 17.0, 29.0, 8.0, 11.0, 10.0, 7.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.000125885009765625, -0.00012216903269290924, -0.00011845305562019348, -0.00011473707854747772, -0.00011102110147476196, -0.0001073051244020462, -0.00010358914732933044, -9.987317025661469e-05, -9.615719318389893e-05, -9.244121611118317e-05, -8.872523903846741e-05, -8.500926196575165e-05, -8.129328489303589e-05, -7.757730782032013e-05, -7.386133074760437e-05, -7.014535367488861e-05, -6.642937660217285e-05, -6.271339952945709e-05, -5.899742245674133e-05, -5.5281445384025574e-05, -5.1565468311309814e-05, -4.7849491238594055e-05, -4.4133514165878296e-05, -4.041753709316254e-05, -3.670156002044678e-05, -3.298558294773102e-05, -2.926960587501526e-05, -2.55536288022995e-05, -2.183765172958374e-05, -1.812167465686798e-05, -1.4405697584152222e-05, -1.0689720511436462e-05, -6.973743438720703e-06, -3.257766366004944e-06, 4.5821070671081543e-07, 4.174187779426575e-06, 7.890164852142334e-06, 1.1606141924858093e-05, 1.5322118997573853e-05, 1.9038096070289612e-05, 2.275407314300537e-05, 2.647005021572113e-05, 3.018602728843689e-05, 3.390200436115265e-05, 3.761798143386841e-05, 4.133395850658417e-05, 4.504993557929993e-05, 4.8765912652015686e-05, 5.2481889724731445e-05, 5.6197866797447205e-05, 5.9913843870162964e-05, 6.362982094287872e-05, 6.734579801559448e-05, 7.106177508831024e-05, 7.4777752161026e-05, 7.849372923374176e-05, 8.220970630645752e-05, 8.592568337917328e-05, 8.964166045188904e-05, 9.33576375246048e-05, 9.707361459732056e-05, 0.00010078959167003632, 0.00010450556874275208, 0.00010822154581546783, 0.0001119375228881836]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 4.0, 15.0, 9.0, 18.0, 15.0, 25.0, 40.0, 62.0, 83.0, 108.0, 161.0, 231.0, 343.0, 528.0, 814.0, 1208.0, 1945.0, 3054.0, 4997.0, 8792.0, 15719.0, 29900.0, 62294.0, 137752.0, 262309.0, 257545.0, 133690.0, 60901.0, 29154.0, 14901.0, 8460.0, 4920.0, 2979.0, 1908.0, 1230.0, 775.0, 542.0, 370.0, 249.0, 162.0, 112.0, 75.0, 48.0, 36.0, 29.0, 14.0, 12.0, 9.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.92578125, -1.863616943359375, -1.80145263671875, -1.739288330078125, -1.6771240234375, -1.614959716796875, -1.55279541015625, -1.490631103515625, -1.428466796875, -1.366302490234375, -1.30413818359375, -1.241973876953125, -1.1798095703125, -1.117645263671875, -1.05548095703125, -0.993316650390625, -0.93115234375, -0.868988037109375, -0.80682373046875, -0.744659423828125, -0.6824951171875, -0.620330810546875, -0.55816650390625, -0.496002197265625, -0.433837890625, -0.371673583984375, -0.30950927734375, -0.247344970703125, -0.1851806640625, -0.123016357421875, -0.06085205078125, 0.001312255859375, 0.0634765625, 0.125640869140625, 0.18780517578125, 0.249969482421875, 0.3121337890625, 0.374298095703125, 0.43646240234375, 0.498626708984375, 0.560791015625, 0.622955322265625, 0.68511962890625, 0.747283935546875, 0.8094482421875, 0.871612548828125, 0.93377685546875, 0.995941162109375, 1.05810546875, 1.120269775390625, 1.18243408203125, 1.244598388671875, 1.3067626953125, 1.368927001953125, 1.43109130859375, 1.493255615234375, 1.555419921875, 1.617584228515625, 1.67974853515625, 1.741912841796875, 1.8040771484375, 1.866241455078125, 1.92840576171875, 1.990570068359375, 2.052734375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 9.0, 6.0, 8.0, 7.0, 12.0, 19.0, 50.0, 31.0, 67.0, 74.0, 87.0, 93.0, 80.0, 98.0, 83.0, 74.0, 54.0, 41.0, 25.0, 23.0, 15.0, 16.0, 13.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6962890625, -0.669952392578125, -0.64361572265625, -0.617279052734375, -0.5909423828125, -0.564605712890625, -0.53826904296875, -0.511932373046875, -0.485595703125, -0.459259033203125, -0.43292236328125, -0.406585693359375, -0.3802490234375, -0.353912353515625, -0.32757568359375, -0.301239013671875, -0.27490234375, -0.248565673828125, -0.22222900390625, -0.195892333984375, -0.1695556640625, -0.143218994140625, -0.11688232421875, -0.090545654296875, -0.064208984375, -0.037872314453125, -0.01153564453125, 0.014801025390625, 0.0411376953125, 0.067474365234375, 0.09381103515625, 0.120147705078125, 0.146484375, 0.172821044921875, 0.19915771484375, 0.225494384765625, 0.2518310546875, 0.278167724609375, 0.30450439453125, 0.330841064453125, 0.357177734375, 0.383514404296875, 0.40985107421875, 0.436187744140625, 0.4625244140625, 0.488861083984375, 0.51519775390625, 0.541534423828125, 0.56787109375, 0.594207763671875, 0.62054443359375, 0.646881103515625, 0.6732177734375, 0.699554443359375, 0.72589111328125, 0.752227783203125, 0.778564453125, 0.804901123046875, 0.83123779296875, 0.857574462890625, 0.8839111328125, 0.910247802734375, 0.93658447265625, 0.962921142578125, 0.9892578125]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 8.0, 2.0, 7.0, 2.0, 4.0, 10.0, 11.0, 8.0, 14.0, 28.0, 22.0, 15.0, 26.0, 31.0, 26.0, 35.0, 25.0, 41.0, 48.0, 45.0, 40.0, 55.0, 42.0, 38.0, 52.0, 34.0, 38.0, 34.0, 31.0, 27.0, 26.0, 35.0, 27.0, 19.0, 22.0, 13.0, 11.0, 8.0, 11.0, 11.0, 8.0, 2.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-15.242074012756348, -14.822809219360352, -14.403544425964355, -13.98427963256836, -13.565014839172363, -13.145750045776367, -12.726485252380371, -12.307220458984375, -11.887955665588379, -11.468690872192383, -11.049426078796387, -10.63016128540039, -10.210896492004395, -9.791631698608398, -9.372366905212402, -8.953102111816406, -8.53383731842041, -8.114572525024414, -7.695307731628418, -7.276042938232422, -6.856778144836426, -6.43751335144043, -6.018248558044434, -5.5989837646484375, -5.179718971252441, -4.760454177856445, -4.341189384460449, -3.921924591064453, -3.502659797668457, -3.083395004272461, -2.664130210876465, -2.2448654174804688, -1.8255996704101562, -1.4063348770141602, -0.9870700836181641, -0.567805290222168, -0.14854049682617188, 0.2707242965698242, 0.6899890899658203, 1.1092538833618164, 1.5285186767578125, 1.9477834701538086, 2.3670482635498047, 2.786313056945801, 3.205577850341797, 3.624842643737793, 4.044107437133789, 4.463372230529785, 4.882637023925781, 5.301901817321777, 5.721166610717773, 6.1404314041137695, 6.559696197509766, 6.978960990905762, 7.398225784301758, 7.817490577697754, 8.23675537109375, 8.656020164489746, 9.075284957885742, 9.494549751281738, 9.913814544677734, 10.33307933807373, 10.752344131469727, 11.171608924865723, 11.590873718261719]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 8.0, 5.0, 12.0, 6.0, 7.0, 10.0, 6.0, 14.0, 16.0, 22.0, 23.0, 30.0, 29.0, 27.0, 35.0, 36.0, 24.0, 26.0, 42.0, 48.0, 39.0, 28.0, 43.0, 26.0, 34.0, 29.0, 28.0, 45.0, 28.0, 26.0, 33.0, 31.0, 27.0, 20.0, 18.0, 16.0, 18.0, 14.0, 11.0, 16.0, 7.0, 7.0, 8.0, 5.0, 6.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.507094383239746, -11.1393404006958, -10.771587371826172, -10.403833389282227, -10.036079406738281, -9.668325424194336, -9.30057144165039, -8.932818412780762, -8.565064430236816, -8.197310447692871, -7.829556941986084, -7.461803436279297, -7.094049453735352, -6.726295471191406, -6.358541965484619, -5.990788459777832, -5.623034477233887, -5.255280494689941, -4.887526988983154, -4.519773483276367, -4.152019500732422, -3.7842657566070557, -3.4165120124816895, -3.0487582683563232, -2.681004524230957, -2.313250780105591, -1.9454970359802246, -1.5777432918548584, -1.2099895477294922, -0.842235803604126, -0.47448205947875977, -0.10672831535339355, 0.26102638244628906, 0.6287801265716553, 0.9965338706970215, 1.3642876148223877, 1.732041358947754, 2.09979510307312, 2.4675488471984863, 2.8353025913238525, 3.2030563354492188, 3.570810079574585, 3.938563823699951, 4.306317329406738, 4.674071311950684, 5.041825294494629, 5.409578800201416, 5.777332305908203, 6.145086288452148, 6.512840270996094, 6.880593776702881, 7.248347282409668, 7.616101264953613, 7.983855247497559, 8.351608276367188, 8.719362258911133, 9.087116241455078, 9.454870223999023, 9.822624206542969, 10.190377235412598, 10.558131217956543, 10.925885200500488, 11.293638229370117, 11.661392211914062, 12.029146194458008]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 9.0, 13.0, 28.0, 27.0, 58.0, 100.0, 156.0, 268.0, 406.0, 631.0, 945.0, 1571.0, 2275.0, 3581.0, 5324.0, 7779.0, 11507.0, 16048.0, 22226.0, 29894.0, 39013.0, 49918.0, 59967.0, 70940.0, 78748.0, 84703.0, 86244.0, 84071.0, 78211.0, 69371.0, 59378.0, 48181.0, 37713.0, 28865.0, 21294.0, 15657.0, 11033.0, 7572.0, 5116.0, 3449.0, 2263.0, 1440.0, 931.0, 621.0, 387.0, 255.0, 134.0, 93.0, 58.0, 45.0, 20.0, 12.0, 2.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.3359375, -7.0867919921875, -6.837646484375, -6.5885009765625, -6.33935546875, -6.0902099609375, -5.841064453125, -5.5919189453125, -5.3427734375, -5.0936279296875, -4.844482421875, -4.5953369140625, -4.34619140625, -4.0970458984375, -3.847900390625, -3.5987548828125, -3.349609375, -3.1004638671875, -2.851318359375, -2.6021728515625, -2.35302734375, -2.1038818359375, -1.854736328125, -1.6055908203125, -1.3564453125, -1.1072998046875, -0.858154296875, -0.6090087890625, -0.35986328125, -0.1107177734375, 0.138427734375, 0.3875732421875, 0.63671875, 0.8858642578125, 1.135009765625, 1.3841552734375, 1.63330078125, 1.8824462890625, 2.131591796875, 2.3807373046875, 2.6298828125, 2.8790283203125, 3.128173828125, 3.3773193359375, 3.62646484375, 3.8756103515625, 4.124755859375, 4.3739013671875, 4.623046875, 4.8721923828125, 5.121337890625, 5.3704833984375, 5.61962890625, 5.8687744140625, 6.117919921875, 6.3670654296875, 6.6162109375, 6.8653564453125, 7.114501953125, 7.3636474609375, 7.61279296875, 7.8619384765625, 8.111083984375, 8.3602294921875, 8.609375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 7.0, 6.0, 9.0, 6.0, 10.0, 11.0, 5.0, 15.0, 12.0, 21.0, 24.0, 28.0, 28.0, 29.0, 39.0, 31.0, 27.0, 25.0, 41.0, 48.0, 42.0, 28.0, 40.0, 28.0, 34.0, 29.0, 29.0, 44.0, 28.0, 26.0, 34.0, 35.0, 28.0, 15.0, 21.0, 15.0, 18.0, 15.0, 11.0, 16.0, 9.0, 4.0, 9.0, 5.0, 4.0, 6.0, 4.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.25, -10.8917236328125, -10.533447265625, -10.1751708984375, -9.81689453125, -9.4586181640625, -9.100341796875, -8.7420654296875, -8.3837890625, -8.0255126953125, -7.667236328125, -7.3089599609375, -6.95068359375, -6.5924072265625, -6.234130859375, -5.8758544921875, -5.517578125, -5.1593017578125, -4.801025390625, -4.4427490234375, -4.08447265625, -3.7261962890625, -3.367919921875, -3.0096435546875, -2.6513671875, -2.2930908203125, -1.934814453125, -1.5765380859375, -1.21826171875, -0.8599853515625, -0.501708984375, -0.1434326171875, 0.21484375, 0.5731201171875, 0.931396484375, 1.2896728515625, 1.64794921875, 2.0062255859375, 2.364501953125, 2.7227783203125, 3.0810546875, 3.4393310546875, 3.797607421875, 4.1558837890625, 4.51416015625, 4.8724365234375, 5.230712890625, 5.5889892578125, 5.947265625, 6.3055419921875, 6.663818359375, 7.0220947265625, 7.38037109375, 7.7386474609375, 8.096923828125, 8.4552001953125, 8.8134765625, 9.1717529296875, 9.530029296875, 9.8883056640625, 10.24658203125, 10.6048583984375, 10.963134765625, 11.3214111328125, 11.6796875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 7.0, 6.0, 15.0, 16.0, 26.0, 64.0, 97.0, 163.0, 290.0, 508.0, 948.0, 1652.0, 2719.0, 4480.0, 7779.0, 12509.0, 19758.0, 29983.0, 43417.0, 59825.0, 77869.0, 94813.0, 107560.0, 112182.0, 107883.0, 96229.0, 79089.0, 60940.0, 44552.0, 30545.0, 20243.0, 12996.0, 7991.0, 4747.0, 2749.0, 1682.0, 970.0, 576.0, 280.0, 173.0, 93.0, 61.0, 29.0, 25.0, 14.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5078125, -10.184814453125, -9.86181640625, -9.538818359375, -9.2158203125, -8.892822265625, -8.56982421875, -8.246826171875, -7.923828125, -7.600830078125, -7.27783203125, -6.954833984375, -6.6318359375, -6.308837890625, -5.98583984375, -5.662841796875, -5.33984375, -5.016845703125, -4.69384765625, -4.370849609375, -4.0478515625, -3.724853515625, -3.40185546875, -3.078857421875, -2.755859375, -2.432861328125, -2.10986328125, -1.786865234375, -1.4638671875, -1.140869140625, -0.81787109375, -0.494873046875, -0.171875, 0.151123046875, 0.47412109375, 0.797119140625, 1.1201171875, 1.443115234375, 1.76611328125, 2.089111328125, 2.412109375, 2.735107421875, 3.05810546875, 3.381103515625, 3.7041015625, 4.027099609375, 4.35009765625, 4.673095703125, 4.99609375, 5.319091796875, 5.64208984375, 5.965087890625, 6.2880859375, 6.611083984375, 6.93408203125, 7.257080078125, 7.580078125, 7.903076171875, 8.22607421875, 8.549072265625, 8.8720703125, 9.195068359375, 9.51806640625, 9.841064453125, 10.1640625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 7.0, 2.0, 4.0, 6.0, 3.0, 5.0, 15.0, 12.0, 15.0, 21.0, 17.0, 23.0, 20.0, 24.0, 27.0, 34.0, 34.0, 35.0, 37.0, 38.0, 43.0, 44.0, 43.0, 37.0, 34.0, 38.0, 39.0, 33.0, 36.0, 46.0, 40.0, 27.0, 23.0, 27.0, 28.0, 17.0, 11.0, 10.0, 9.0, 13.0, 9.0, 10.0, 4.0, 3.0, 1.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.7734375, -8.5064697265625, -8.239501953125, -7.9725341796875, -7.70556640625, -7.4385986328125, -7.171630859375, -6.9046630859375, -6.6376953125, -6.3707275390625, -6.103759765625, -5.8367919921875, -5.56982421875, -5.3028564453125, -5.035888671875, -4.7689208984375, -4.501953125, -4.2349853515625, -3.968017578125, -3.7010498046875, -3.43408203125, -3.1671142578125, -2.900146484375, -2.6331787109375, -2.3662109375, -2.0992431640625, -1.832275390625, -1.5653076171875, -1.29833984375, -1.0313720703125, -0.764404296875, -0.4974365234375, -0.23046875, 0.0364990234375, 0.303466796875, 0.5704345703125, 0.83740234375, 1.1043701171875, 1.371337890625, 1.6383056640625, 1.9052734375, 2.1722412109375, 2.439208984375, 2.7061767578125, 2.97314453125, 3.2401123046875, 3.507080078125, 3.7740478515625, 4.041015625, 4.3079833984375, 4.574951171875, 4.8419189453125, 5.10888671875, 5.3758544921875, 5.642822265625, 5.9097900390625, 6.1767578125, 6.4437255859375, 6.710693359375, 6.9776611328125, 7.24462890625, 7.5115966796875, 7.778564453125, 8.0455322265625, 8.3125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 9.0, 11.0, 18.0, 20.0, 31.0, 55.0, 68.0, 100.0, 195.0, 300.0, 568.0, 943.0, 1552.0, 2775.0, 4965.0, 8565.0, 15193.0, 25897.0, 43124.0, 66733.0, 95877.0, 124777.0, 142162.0, 139836.0, 121377.0, 92934.0, 63035.0, 40417.0, 24182.0, 14078.0, 8026.0, 4633.0, 2544.0, 1505.0, 812.0, 492.0, 275.0, 169.0, 101.0, 73.0, 37.0, 29.0, 13.0, 17.0, 6.0, 3.0, 7.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.6796875, -5.5018310546875, -5.323974609375, -5.1461181640625, -4.96826171875, -4.7904052734375, -4.612548828125, -4.4346923828125, -4.2568359375, -4.0789794921875, -3.901123046875, -3.7232666015625, -3.54541015625, -3.3675537109375, -3.189697265625, -3.0118408203125, -2.833984375, -2.6561279296875, -2.478271484375, -2.3004150390625, -2.12255859375, -1.9447021484375, -1.766845703125, -1.5889892578125, -1.4111328125, -1.2332763671875, -1.055419921875, -0.8775634765625, -0.69970703125, -0.5218505859375, -0.343994140625, -0.1661376953125, 0.01171875, 0.1895751953125, 0.367431640625, 0.5452880859375, 0.72314453125, 0.9010009765625, 1.078857421875, 1.2567138671875, 1.4345703125, 1.6124267578125, 1.790283203125, 1.9681396484375, 2.14599609375, 2.3238525390625, 2.501708984375, 2.6795654296875, 2.857421875, 3.0352783203125, 3.213134765625, 3.3909912109375, 3.56884765625, 3.7467041015625, 3.924560546875, 4.1024169921875, 4.2802734375, 4.4581298828125, 4.635986328125, 4.8138427734375, 4.99169921875, 5.1695556640625, 5.347412109375, 5.5252685546875, 5.703125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 7.0, 8.0, 5.0, 16.0, 21.0, 16.0, 19.0, 16.0, 12.0, 21.0, 33.0, 28.0, 48.0, 34.0, 47.0, 39.0, 44.0, 48.0, 52.0, 44.0, 46.0, 41.0, 29.0, 42.0, 27.0, 34.0, 35.0, 30.0, 29.0, 20.0, 17.0, 15.0, 8.0, 13.0, 14.0, 9.0, 12.0, 5.0, 1.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.000606536865234375, -0.0005899891257286072, -0.0005734413862228394, -0.0005568936467170715, -0.0005403459072113037, -0.0005237981677055359, -0.0005072504281997681, -0.0004907026886940002, -0.0004741549491882324, -0.0004576072096824646, -0.0004410594701766968, -0.00042451173067092896, -0.00040796399116516113, -0.0003914162516593933, -0.0003748685121536255, -0.00035832077264785767, -0.00034177303314208984, -0.000325225293636322, -0.0003086775541305542, -0.0002921298146247864, -0.00027558207511901855, -0.00025903433561325073, -0.0002424865961074829, -0.0002259388566017151, -0.00020939111709594727, -0.00019284337759017944, -0.00017629563808441162, -0.0001597478985786438, -0.00014320015907287598, -0.00012665241956710815, -0.00011010468006134033, -9.355694055557251e-05, -7.700920104980469e-05, -6.0461461544036865e-05, -4.391372203826904e-05, -2.736598253250122e-05, -1.0818243026733398e-05, 5.729496479034424e-06, 2.2277235984802246e-05, 3.882497549057007e-05, 5.537271499633789e-05, 7.192045450210571e-05, 8.846819400787354e-05, 0.00010501593351364136, 0.00012156367301940918, 0.000138111412525177, 0.00015465915203094482, 0.00017120689153671265, 0.00018775463104248047, 0.0002043023705482483, 0.0002208501100540161, 0.00023739784955978394, 0.00025394558906555176, 0.0002704933285713196, 0.0002870410680770874, 0.0003035888075828552, 0.00032013654708862305, 0.00033668428659439087, 0.0003532320261001587, 0.0003697797656059265, 0.00038632750511169434, 0.00040287524461746216, 0.00041942298412323, 0.0004359707236289978, 0.0004525184631347656]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 2.0, 4.0, 9.0, 10.0, 10.0, 21.0, 30.0, 63.0, 74.0, 118.0, 173.0, 288.0, 467.0, 775.0, 1245.0, 2103.0, 3413.0, 5686.0, 9694.0, 16325.0, 27727.0, 44665.0, 69633.0, 98776.0, 127312.0, 142706.0, 139227.0, 117153.0, 87486.0, 59265.0, 37616.0, 22883.0, 13579.0, 8012.0, 4842.0, 2750.0, 1682.0, 1040.0, 611.0, 406.0, 237.0, 141.0, 100.0, 59.0, 49.0, 33.0, 23.0, 11.0, 10.0, 5.0, 6.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.00390625, -5.7955322265625, -5.587158203125, -5.3787841796875, -5.17041015625, -4.9620361328125, -4.753662109375, -4.5452880859375, -4.3369140625, -4.1285400390625, -3.920166015625, -3.7117919921875, -3.50341796875, -3.2950439453125, -3.086669921875, -2.8782958984375, -2.669921875, -2.4615478515625, -2.253173828125, -2.0447998046875, -1.83642578125, -1.6280517578125, -1.419677734375, -1.2113037109375, -1.0029296875, -0.7945556640625, -0.586181640625, -0.3778076171875, -0.16943359375, 0.0389404296875, 0.247314453125, 0.4556884765625, 0.6640625, 0.8724365234375, 1.080810546875, 1.2891845703125, 1.49755859375, 1.7059326171875, 1.914306640625, 2.1226806640625, 2.3310546875, 2.5394287109375, 2.747802734375, 2.9561767578125, 3.16455078125, 3.3729248046875, 3.581298828125, 3.7896728515625, 3.998046875, 4.2064208984375, 4.414794921875, 4.6231689453125, 4.83154296875, 5.0399169921875, 5.248291015625, 5.4566650390625, 5.6650390625, 5.8734130859375, 6.081787109375, 6.2901611328125, 6.49853515625, 6.7069091796875, 6.915283203125, 7.1236572265625, 7.33203125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 8.0, 10.0, 16.0, 21.0, 36.0, 38.0, 51.0, 72.0, 90.0, 96.0, 81.0, 93.0, 89.0, 84.0, 62.0, 42.0, 34.0, 15.0, 14.0, 10.0, 8.0, 7.0, 7.0, 8.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.234375, -4.08099365234375, -3.9276123046875, -3.77423095703125, -3.620849609375, -3.46746826171875, -3.3140869140625, -3.16070556640625, -3.00732421875, -2.85394287109375, -2.7005615234375, -2.54718017578125, -2.393798828125, -2.24041748046875, -2.0870361328125, -1.93365478515625, -1.7802734375, -1.62689208984375, -1.4735107421875, -1.32012939453125, -1.166748046875, -1.01336669921875, -0.8599853515625, -0.70660400390625, -0.55322265625, -0.39984130859375, -0.2464599609375, -0.09307861328125, 0.060302734375, 0.21368408203125, 0.3670654296875, 0.52044677734375, 0.673828125, 0.82720947265625, 0.9805908203125, 1.13397216796875, 1.287353515625, 1.44073486328125, 1.5941162109375, 1.74749755859375, 1.90087890625, 2.05426025390625, 2.2076416015625, 2.36102294921875, 2.514404296875, 2.66778564453125, 2.8211669921875, 2.97454833984375, 3.1279296875, 3.28131103515625, 3.4346923828125, 3.58807373046875, 3.741455078125, 3.89483642578125, 4.0482177734375, 4.20159912109375, 4.35498046875, 4.50836181640625, 4.6617431640625, 4.81512451171875, 4.968505859375, 5.12188720703125, 5.2752685546875, 5.42864990234375, 5.58203125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 7.0, 5.0, 8.0, 5.0, 7.0, 12.0, 19.0, 17.0, 28.0, 21.0, 23.0, 23.0, 33.0, 27.0, 33.0, 39.0, 53.0, 39.0, 43.0, 39.0, 39.0, 55.0, 43.0, 42.0, 36.0, 30.0, 26.0, 38.0, 27.0, 25.0, 33.0, 20.0, 21.0, 13.0, 13.0, 13.0, 5.0, 16.0, 9.0, 6.0, 3.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.781293869018555, -12.363321304321289, -11.945348739624023, -11.527376174926758, -11.109403610229492, -10.691431045532227, -10.273458480834961, -9.855485916137695, -9.43751335144043, -9.019540786743164, -8.601568222045898, -8.183595657348633, -7.765623092651367, -7.347650527954102, -6.929677963256836, -6.51170539855957, -6.093733310699463, -5.675760746002197, -5.257788181304932, -4.839815616607666, -4.4218430519104, -4.003870964050293, -3.5858981609344482, -3.1679255962371826, -2.749953031539917, -2.3319804668426514, -1.9140079021453857, -1.4960354566574097, -1.078062891960144, -0.660090446472168, -0.24211788177490234, 0.17585468292236328, 0.5938272476196289, 1.0117998123168945, 1.4297723770141602, 1.8477448225021362, 2.2657175064086914, 2.683689832687378, 3.1016623973846436, 3.519634962081909, 3.937607526779175, 4.355579853057861, 4.773552417755127, 5.191524982452393, 5.609497547149658, 6.027470111846924, 6.4454426765441895, 6.863415241241455, 7.281387805938721, 7.699360370635986, 8.117332458496094, 8.53530502319336, 8.953277587890625, 9.37125015258789, 9.789222717285156, 10.207195281982422, 10.625167846679688, 11.043140411376953, 11.461112976074219, 11.879085540771484, 12.29705810546875, 12.715030670166016, 13.133003234863281, 13.550975799560547, 13.968948364257812]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 6.0, 2.0, 6.0, 2.0, 6.0, 14.0, 4.0, 14.0, 16.0, 19.0, 14.0, 25.0, 30.0, 28.0, 30.0, 22.0, 35.0, 43.0, 38.0, 41.0, 42.0, 46.0, 40.0, 37.0, 41.0, 28.0, 38.0, 29.0, 27.0, 32.0, 28.0, 29.0, 40.0, 21.0, 25.0, 16.0, 18.0, 11.0, 11.0, 12.0, 11.0, 2.0, 7.0, 5.0, 4.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-14.830852508544922, -14.405828475952148, -13.980804443359375, -13.555780410766602, -13.130756378173828, -12.705732345581055, -12.280708312988281, -11.855684280395508, -11.430660247802734, -11.005636215209961, -10.580612182617188, -10.155588150024414, -9.73056411743164, -9.305540084838867, -8.880516052246094, -8.45549201965332, -8.03046703338623, -7.605443000793457, -7.180418968200684, -6.75539493560791, -6.330370903015137, -5.905346870422363, -5.480322360992432, -5.055298328399658, -4.630274295806885, -4.205250263214111, -3.780226230621338, -3.3552019596099854, -2.930177927017212, -2.5051538944244385, -2.080129623413086, -1.6551055908203125, -1.2300825119018555, -0.8050584197044373, -0.38003432750701904, 0.044989824295043945, 0.4700138568878174, 0.8950378894805908, 1.3200621604919434, 1.7450861930847168, 2.1701102256774902, 2.5951342582702637, 3.020158290863037, 3.4451825618743896, 3.870206594467163, 4.295230865478516, 4.720254898071289, 5.1452789306640625, 5.570302963256836, 5.995326995849609, 6.420351028442383, 6.845375061035156, 7.27039909362793, 7.695423126220703, 8.120447158813477, 8.54547119140625, 8.970495223999023, 9.395519256591797, 9.82054328918457, 10.245567321777344, 10.670591354370117, 11.09561538696289, 11.520639419555664, 11.945663452148438, 12.370688438415527]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 8.0, 4.0, 18.0, 23.0, 33.0, 61.0, 97.0, 168.0, 238.0, 445.0, 706.0, 1123.0, 1869.0, 3000.0, 4892.0, 7628.0, 12094.0, 19039.0, 28843.0, 43753.0, 65179.0, 92833.0, 131839.0, 177493.0, 231719.0, 287783.0, 340084.0, 379328.0, 395537.0, 387341.0, 356157.0, 307703.0, 252288.0, 195875.0, 145952.0, 105075.0, 73836.0, 49960.0, 33886.0, 22237.0, 14190.0, 9086.0, 5666.0, 3623.0, 2193.0, 1417.0, 772.0, 466.0, 308.0, 185.0, 114.0, 41.0, 42.0, 25.0, 11.0, 8.0, 4.0, 1.0, 0.0, 2.0], "bins": [-9.0859375, -8.807861328125, -8.52978515625, -8.251708984375, -7.9736328125, -7.695556640625, -7.41748046875, -7.139404296875, -6.861328125, -6.583251953125, -6.30517578125, -6.027099609375, -5.7490234375, -5.470947265625, -5.19287109375, -4.914794921875, -4.63671875, -4.358642578125, -4.08056640625, -3.802490234375, -3.5244140625, -3.246337890625, -2.96826171875, -2.690185546875, -2.412109375, -2.134033203125, -1.85595703125, -1.577880859375, -1.2998046875, -1.021728515625, -0.74365234375, -0.465576171875, -0.1875, 0.090576171875, 0.36865234375, 0.646728515625, 0.9248046875, 1.202880859375, 1.48095703125, 1.759033203125, 2.037109375, 2.315185546875, 2.59326171875, 2.871337890625, 3.1494140625, 3.427490234375, 3.70556640625, 3.983642578125, 4.26171875, 4.539794921875, 4.81787109375, 5.095947265625, 5.3740234375, 5.652099609375, 5.93017578125, 6.208251953125, 6.486328125, 6.764404296875, 7.04248046875, 7.320556640625, 7.5986328125, 7.876708984375, 8.15478515625, 8.432861328125, 8.7109375]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 2.0, 5.0, 7.0, 9.0, 10.0, 7.0, 16.0, 17.0, 15.0, 22.0, 24.0, 39.0, 25.0, 31.0, 26.0, 38.0, 39.0, 43.0, 34.0, 44.0, 53.0, 36.0, 40.0, 31.0, 34.0, 25.0, 34.0, 34.0, 31.0, 21.0, 44.0, 24.0, 24.0, 15.0, 16.0, 16.0, 11.0, 11.0, 9.0, 6.0, 7.0, 6.0, 4.0, 8.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-12.8203125, -12.4451904296875, -12.070068359375, -11.6949462890625, -11.31982421875, -10.9447021484375, -10.569580078125, -10.1944580078125, -9.8193359375, -9.4442138671875, -9.069091796875, -8.6939697265625, -8.31884765625, -7.9437255859375, -7.568603515625, -7.1934814453125, -6.818359375, -6.4432373046875, -6.068115234375, -5.6929931640625, -5.31787109375, -4.9427490234375, -4.567626953125, -4.1925048828125, -3.8173828125, -3.4422607421875, -3.067138671875, -2.6920166015625, -2.31689453125, -1.9417724609375, -1.566650390625, -1.1915283203125, -0.81640625, -0.4412841796875, -0.066162109375, 0.3089599609375, 0.68408203125, 1.0592041015625, 1.434326171875, 1.8094482421875, 2.1845703125, 2.5596923828125, 2.934814453125, 3.3099365234375, 3.68505859375, 4.0601806640625, 4.435302734375, 4.8104248046875, 5.185546875, 5.5606689453125, 5.935791015625, 6.3109130859375, 6.68603515625, 7.0611572265625, 7.436279296875, 7.8114013671875, 8.1865234375, 8.5616455078125, 8.936767578125, 9.3118896484375, 9.68701171875, 10.0621337890625, 10.437255859375, 10.8123779296875, 11.1875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 8.0, 13.0, 24.0, 58.0, 85.0, 120.0, 259.0, 462.0, 773.0, 1326.0, 2248.0, 3978.0, 6403.0, 10794.0, 17424.0, 27852.0, 43248.0, 66161.0, 95829.0, 136080.0, 184670.0, 239919.0, 295793.0, 345790.0, 380985.0, 395161.0, 384950.0, 354823.0, 305503.0, 250648.0, 195396.0, 145423.0, 103545.0, 71462.0, 47592.0, 30703.0, 19192.0, 12077.0, 7202.0, 4233.0, 2604.0, 1464.0, 870.0, 513.0, 285.0, 120.0, 100.0, 56.0, 25.0, 23.0, 8.0, 6.0, 4.0, 1.0, 2.0], "bins": [-10.546875, -10.2420654296875, -9.937255859375, -9.6324462890625, -9.32763671875, -9.0228271484375, -8.718017578125, -8.4132080078125, -8.1083984375, -7.8035888671875, -7.498779296875, -7.1939697265625, -6.88916015625, -6.5843505859375, -6.279541015625, -5.9747314453125, -5.669921875, -5.3651123046875, -5.060302734375, -4.7554931640625, -4.45068359375, -4.1458740234375, -3.841064453125, -3.5362548828125, -3.2314453125, -2.9266357421875, -2.621826171875, -2.3170166015625, -2.01220703125, -1.7073974609375, -1.402587890625, -1.0977783203125, -0.79296875, -0.4881591796875, -0.183349609375, 0.1214599609375, 0.42626953125, 0.7310791015625, 1.035888671875, 1.3406982421875, 1.6455078125, 1.9503173828125, 2.255126953125, 2.5599365234375, 2.86474609375, 3.1695556640625, 3.474365234375, 3.7791748046875, 4.083984375, 4.3887939453125, 4.693603515625, 4.9984130859375, 5.30322265625, 5.6080322265625, 5.912841796875, 6.2176513671875, 6.5224609375, 6.8272705078125, 7.132080078125, 7.4368896484375, 7.74169921875, 8.0465087890625, 8.351318359375, 8.6561279296875, 8.9609375]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 0.0, 5.0, 8.0, 6.0, 9.0, 12.0, 14.0, 29.0, 31.0, 28.0, 38.0, 45.0, 60.0, 60.0, 87.0, 93.0, 118.0, 118.0, 156.0, 146.0, 153.0, 153.0, 178.0, 189.0, 189.0, 167.0, 191.0, 175.0, 190.0, 182.0, 170.0, 153.0, 151.0, 130.0, 112.0, 89.0, 96.0, 63.0, 56.0, 43.0, 40.0, 29.0, 29.0, 26.0, 14.0, 9.0, 13.0, 10.0, 7.0, 6.0, 3.0, 1.0, 1.0, 2.0], "bins": [-5.84765625, -5.683349609375, -5.51904296875, -5.354736328125, -5.1904296875, -5.026123046875, -4.86181640625, -4.697509765625, -4.533203125, -4.368896484375, -4.20458984375, -4.040283203125, -3.8759765625, -3.711669921875, -3.54736328125, -3.383056640625, -3.21875, -3.054443359375, -2.89013671875, -2.725830078125, -2.5615234375, -2.397216796875, -2.23291015625, -2.068603515625, -1.904296875, -1.739990234375, -1.57568359375, -1.411376953125, -1.2470703125, -1.082763671875, -0.91845703125, -0.754150390625, -0.58984375, -0.425537109375, -0.26123046875, -0.096923828125, 0.0673828125, 0.231689453125, 0.39599609375, 0.560302734375, 0.724609375, 0.888916015625, 1.05322265625, 1.217529296875, 1.3818359375, 1.546142578125, 1.71044921875, 1.874755859375, 2.0390625, 2.203369140625, 2.36767578125, 2.531982421875, 2.6962890625, 2.860595703125, 3.02490234375, 3.189208984375, 3.353515625, 3.517822265625, 3.68212890625, 3.846435546875, 4.0107421875, 4.175048828125, 4.33935546875, 4.503662109375, 4.66796875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 1.0, 2.0, 7.0, 5.0, 6.0, 8.0, 11.0, 15.0, 14.0, 12.0, 7.0, 19.0, 24.0, 23.0, 38.0, 37.0, 33.0, 29.0, 41.0, 43.0, 31.0, 34.0, 42.0, 39.0, 47.0, 48.0, 38.0, 45.0, 33.0, 30.0, 29.0, 25.0, 31.0, 26.0, 20.0, 18.0, 11.0, 14.0, 11.0, 14.0, 14.0, 8.0, 7.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-13.379307746887207, -12.9785737991333, -12.577839851379395, -12.177105903625488, -11.776371955871582, -11.375638008117676, -10.974905014038086, -10.57417106628418, -10.173437118530273, -9.772703170776367, -9.371969223022461, -8.971235275268555, -8.570501327514648, -8.169767379760742, -7.769033908843994, -7.368299961090088, -6.967565536499023, -6.566831588745117, -6.166097640991211, -5.765363693237305, -5.364629745483398, -4.963895797729492, -4.563162326812744, -4.162428379058838, -3.7616944313049316, -3.3609604835510254, -2.960226535797119, -2.559492826461792, -2.1587588787078857, -1.7580249309539795, -1.3572912216186523, -0.9565572738647461, -0.5558242797851562, -0.15509039163589478, 0.2456434965133667, 0.6463773250579834, 1.0471112728118896, 1.447845220565796, 1.848578929901123, 2.2493128776550293, 2.6500468254089355, 3.050780773162842, 3.451514720916748, 3.852248430252075, 4.252982139587402, 4.653716087341309, 5.054450035095215, 5.455183982849121, 5.855917930603027, 6.256651878356934, 6.65738582611084, 7.058119773864746, 7.458853721618652, 7.859587669372559, 8.260320663452148, 8.661054611206055, 9.061788558959961, 9.462522506713867, 9.863256454467773, 10.26399040222168, 10.664724349975586, 11.065458297729492, 11.466192245483398, 11.866926193237305, 12.267660140991211]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 6.0, 4.0, 8.0, 3.0, 11.0, 16.0, 10.0, 21.0, 15.0, 19.0, 21.0, 25.0, 28.0, 23.0, 27.0, 31.0, 39.0, 39.0, 39.0, 31.0, 38.0, 37.0, 31.0, 33.0, 36.0, 41.0, 27.0, 35.0, 32.0, 32.0, 28.0, 22.0, 18.0, 33.0, 17.0, 13.0, 16.0, 17.0, 14.0, 15.0, 10.0, 10.0, 6.0, 8.0, 3.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.455949783325195, -12.056567192077637, -11.657184600830078, -11.257801055908203, -10.858418464660645, -10.459035873413086, -10.059653282165527, -9.660270690917969, -9.260887145996094, -8.861504554748535, -8.462121963500977, -8.062738418579102, -7.663355827331543, -7.263973236083984, -6.864590644836426, -6.465208053588867, -6.065825462341309, -5.66644287109375, -5.267059803009033, -4.867677211761475, -4.468294143676758, -4.068911552429199, -3.6695289611816406, -3.270146131515503, -2.8707633018493652, -2.4713804721832275, -2.07199764251709, -1.6726150512695312, -1.2732322216033936, -0.8738493919372559, -0.47446680068969727, -0.07508397102355957, 0.3242979049682617, 0.7236806750297546, 1.1230634450912476, 1.5224461555480957, 1.9218289852142334, 2.321211814880371, 2.7205944061279297, 3.1199772357940674, 3.519360065460205, 3.9187428951263428, 4.3181257247924805, 4.717508316040039, 5.116890907287598, 5.5162739753723145, 5.915656566619873, 6.31503963470459, 6.714422225952148, 7.113804817199707, 7.513187885284424, 7.912570476531982, 8.3119535446167, 8.711336135864258, 9.110718727111816, 9.510101318359375, 9.90948486328125, 10.308867454528809, 10.708250045776367, 11.107633590698242, 11.5070161819458, 11.90639877319336, 12.305781364440918, 12.705163955688477, 13.104546546936035]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 9.0, 7.0, 10.0, 29.0, 37.0, 46.0, 61.0, 118.0, 151.0, 256.0, 412.0, 681.0, 1169.0, 2097.0, 3524.0, 6372.0, 11724.0, 21869.0, 40659.0, 74010.0, 126408.0, 186727.0, 202765.0, 155428.0, 95695.0, 53725.0, 29228.0, 15674.0, 8461.0, 4782.0, 2610.0, 1533.0, 876.0, 508.0, 319.0, 203.0, 129.0, 72.0, 61.0, 41.0, 25.0, 18.0, 7.0, 9.0, 6.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.515625, -2.4295654296875, -2.343505859375, -2.2574462890625, -2.17138671875, -2.0853271484375, -1.999267578125, -1.9132080078125, -1.8271484375, -1.7410888671875, -1.655029296875, -1.5689697265625, -1.48291015625, -1.3968505859375, -1.310791015625, -1.2247314453125, -1.138671875, -1.0526123046875, -0.966552734375, -0.8804931640625, -0.79443359375, -0.7083740234375, -0.622314453125, -0.5362548828125, -0.4501953125, -0.3641357421875, -0.278076171875, -0.1920166015625, -0.10595703125, -0.0198974609375, 0.066162109375, 0.1522216796875, 0.23828125, 0.3243408203125, 0.410400390625, 0.4964599609375, 0.58251953125, 0.6685791015625, 0.754638671875, 0.8406982421875, 0.9267578125, 1.0128173828125, 1.098876953125, 1.1849365234375, 1.27099609375, 1.3570556640625, 1.443115234375, 1.5291748046875, 1.615234375, 1.7012939453125, 1.787353515625, 1.8734130859375, 1.95947265625, 2.0455322265625, 2.131591796875, 2.2176513671875, 2.3037109375, 2.3897705078125, 2.475830078125, 2.5618896484375, 2.64794921875, 2.7340087890625, 2.820068359375, 2.9061279296875, 2.9921875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 6.0, 6.0, 4.0, 8.0, 4.0, 10.0, 16.0, 12.0, 19.0, 14.0, 23.0, 18.0, 27.0, 25.0, 27.0, 24.0, 30.0, 40.0, 40.0, 39.0, 30.0, 38.0, 39.0, 30.0, 31.0, 37.0, 42.0, 27.0, 36.0, 30.0, 32.0, 31.0, 20.0, 19.0, 31.0, 17.0, 14.0, 15.0, 17.0, 14.0, 16.0, 9.0, 10.0, 7.0, 7.0, 3.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.4921875, -12.092529296875, -11.69287109375, -11.293212890625, -10.8935546875, -10.493896484375, -10.09423828125, -9.694580078125, -9.294921875, -8.895263671875, -8.49560546875, -8.095947265625, -7.6962890625, -7.296630859375, -6.89697265625, -6.497314453125, -6.09765625, -5.697998046875, -5.29833984375, -4.898681640625, -4.4990234375, -4.099365234375, -3.69970703125, -3.300048828125, -2.900390625, -2.500732421875, -2.10107421875, -1.701416015625, -1.3017578125, -0.902099609375, -0.50244140625, -0.102783203125, 0.296875, 0.696533203125, 1.09619140625, 1.495849609375, 1.8955078125, 2.295166015625, 2.69482421875, 3.094482421875, 3.494140625, 3.893798828125, 4.29345703125, 4.693115234375, 5.0927734375, 5.492431640625, 5.89208984375, 6.291748046875, 6.69140625, 7.091064453125, 7.49072265625, 7.890380859375, 8.2900390625, 8.689697265625, 9.08935546875, 9.489013671875, 9.888671875, 10.288330078125, 10.68798828125, 11.087646484375, 11.4873046875, 11.886962890625, 12.28662109375, 12.686279296875, 13.0859375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 6.0, 11.0, 11.0, 14.0, 22.0, 28.0, 48.0, 62.0, 73.0, 130.0, 155.0, 211.0, 315.0, 454.0, 624.0, 923.0, 1381.0, 2184.0, 3399.0, 5455.0, 8926.0, 15236.0, 26015.0, 47743.0, 90749.0, 169281.0, 244131.0, 191861.0, 106638.0, 56224.0, 30693.0, 17570.0, 10475.0, 6258.0, 3825.0, 2419.0, 1626.0, 1020.0, 682.0, 494.0, 357.0, 229.0, 191.0, 109.0, 86.0, 63.0, 45.0, 27.0, 33.0, 22.0, 7.0, 8.0, 8.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.701171875, -2.6099853515625, -2.518798828125, -2.4276123046875, -2.33642578125, -2.2452392578125, -2.154052734375, -2.0628662109375, -1.9716796875, -1.8804931640625, -1.789306640625, -1.6981201171875, -1.60693359375, -1.5157470703125, -1.424560546875, -1.3333740234375, -1.2421875, -1.1510009765625, -1.059814453125, -0.9686279296875, -0.87744140625, -0.7862548828125, -0.695068359375, -0.6038818359375, -0.5126953125, -0.4215087890625, -0.330322265625, -0.2391357421875, -0.14794921875, -0.0567626953125, 0.034423828125, 0.1256103515625, 0.216796875, 0.3079833984375, 0.399169921875, 0.4903564453125, 0.58154296875, 0.6727294921875, 0.763916015625, 0.8551025390625, 0.9462890625, 1.0374755859375, 1.128662109375, 1.2198486328125, 1.31103515625, 1.4022216796875, 1.493408203125, 1.5845947265625, 1.67578125, 1.7669677734375, 1.858154296875, 1.9493408203125, 2.04052734375, 2.1317138671875, 2.222900390625, 2.3140869140625, 2.4052734375, 2.4964599609375, 2.587646484375, 2.6788330078125, 2.77001953125, 2.8612060546875, 2.952392578125, 3.0435791015625, 3.134765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 9.0, 4.0, 7.0, 10.0, 11.0, 15.0, 11.0, 15.0, 26.0, 16.0, 17.0, 31.0, 35.0, 25.0, 29.0, 51.0, 29.0, 45.0, 33.0, 38.0, 41.0, 38.0, 45.0, 40.0, 40.0, 36.0, 35.0, 36.0, 30.0, 37.0, 26.0, 24.0, 15.0, 22.0, 12.0, 12.0, 6.0, 12.0, 12.0, 10.0, 2.0, 5.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.75, -8.479248046875, -8.20849609375, -7.937744140625, -7.6669921875, -7.396240234375, -7.12548828125, -6.854736328125, -6.583984375, -6.313232421875, -6.04248046875, -5.771728515625, -5.5009765625, -5.230224609375, -4.95947265625, -4.688720703125, -4.41796875, -4.147216796875, -3.87646484375, -3.605712890625, -3.3349609375, -3.064208984375, -2.79345703125, -2.522705078125, -2.251953125, -1.981201171875, -1.71044921875, -1.439697265625, -1.1689453125, -0.898193359375, -0.62744140625, -0.356689453125, -0.0859375, 0.184814453125, 0.45556640625, 0.726318359375, 0.9970703125, 1.267822265625, 1.53857421875, 1.809326171875, 2.080078125, 2.350830078125, 2.62158203125, 2.892333984375, 3.1630859375, 3.433837890625, 3.70458984375, 3.975341796875, 4.24609375, 4.516845703125, 4.78759765625, 5.058349609375, 5.3291015625, 5.599853515625, 5.87060546875, 6.141357421875, 6.412109375, 6.682861328125, 6.95361328125, 7.224365234375, 7.4951171875, 7.765869140625, 8.03662109375, 8.307373046875, 8.578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 4.0, 7.0, 13.0, 18.0, 20.0, 27.0, 38.0, 51.0, 76.0, 120.0, 152.0, 229.0, 358.0, 555.0, 886.0, 1406.0, 2480.0, 4668.0, 9283.0, 21455.0, 62338.0, 271543.0, 483627.0, 125075.0, 35301.0, 14134.0, 6437.0, 3328.0, 1901.0, 1086.0, 680.0, 388.0, 259.0, 213.0, 118.0, 92.0, 49.0, 33.0, 23.0, 27.0, 12.0, 25.0, 9.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5615234375, -1.5131072998046875, -1.464691162109375, -1.4162750244140625, -1.36785888671875, -1.3194427490234375, -1.271026611328125, -1.2226104736328125, -1.1741943359375, -1.1257781982421875, -1.077362060546875, -1.0289459228515625, -0.98052978515625, -0.9321136474609375, -0.883697509765625, -0.8352813720703125, -0.786865234375, -0.7384490966796875, -0.690032958984375, -0.6416168212890625, -0.59320068359375, -0.5447845458984375, -0.496368408203125, -0.4479522705078125, -0.3995361328125, -0.3511199951171875, -0.302703857421875, -0.2542877197265625, -0.20587158203125, -0.1574554443359375, -0.109039306640625, -0.0606231689453125, -0.01220703125, 0.0362091064453125, 0.084625244140625, 0.1330413818359375, 0.18145751953125, 0.2298736572265625, 0.278289794921875, 0.3267059326171875, 0.3751220703125, 0.4235382080078125, 0.471954345703125, 0.5203704833984375, 0.56878662109375, 0.6172027587890625, 0.665618896484375, 0.7140350341796875, 0.762451171875, 0.8108673095703125, 0.859283447265625, 0.9076995849609375, 0.95611572265625, 1.0045318603515625, 1.052947998046875, 1.1013641357421875, 1.1497802734375, 1.1981964111328125, 1.246612548828125, 1.2950286865234375, 1.34344482421875, 1.3918609619140625, 1.440277099609375, 1.4886932373046875, 1.537109375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 5.0, 6.0, 4.0, 13.0, 15.0, 10.0, 8.0, 15.0, 22.0, 22.0, 34.0, 36.0, 29.0, 46.0, 38.0, 51.0, 53.0, 59.0, 55.0, 51.0, 60.0, 48.0, 44.0, 44.0, 39.0, 33.0, 27.0, 24.0, 28.0, 18.0, 17.0, 9.0, 9.0, 5.0, 2.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.930133819580078e-05, -9.651482105255127e-05, -9.372830390930176e-05, -9.094178676605225e-05, -8.815526962280273e-05, -8.536875247955322e-05, -8.258223533630371e-05, -7.97957181930542e-05, -7.700920104980469e-05, -7.422268390655518e-05, -7.143616676330566e-05, -6.864964962005615e-05, -6.586313247680664e-05, -6.307661533355713e-05, -6.029009819030762e-05, -5.7503581047058105e-05, -5.4717063903808594e-05, -5.193054676055908e-05, -4.914402961730957e-05, -4.635751247406006e-05, -4.357099533081055e-05, -4.0784478187561035e-05, -3.7997961044311523e-05, -3.521144390106201e-05, -3.24249267578125e-05, -2.9638409614562988e-05, -2.6851892471313477e-05, -2.4065375328063965e-05, -2.1278858184814453e-05, -1.849234104156494e-05, -1.570582389831543e-05, -1.2919306755065918e-05, -1.0132789611816406e-05, -7.3462724685668945e-06, -4.559755325317383e-06, -1.773238182067871e-06, 1.0132789611816406e-06, 3.7997961044311523e-06, 6.586313247680664e-06, 9.372830390930176e-06, 1.2159347534179688e-05, 1.49458646774292e-05, 1.773238182067871e-05, 2.0518898963928223e-05, 2.3305416107177734e-05, 2.6091933250427246e-05, 2.8878450393676758e-05, 3.166496753692627e-05, 3.445148468017578e-05, 3.723800182342529e-05, 4.0024518966674805e-05, 4.2811036109924316e-05, 4.559755325317383e-05, 4.838407039642334e-05, 5.117058753967285e-05, 5.395710468292236e-05, 5.6743621826171875e-05, 5.953013896942139e-05, 6.23166561126709e-05, 6.510317325592041e-05, 6.788969039916992e-05, 7.067620754241943e-05, 7.346272468566895e-05, 7.624924182891846e-05, 7.903575897216797e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 6.0, 15.0, 13.0, 20.0, 22.0, 34.0, 42.0, 75.0, 107.0, 145.0, 183.0, 275.0, 343.0, 541.0, 862.0, 1168.0, 1784.0, 2796.0, 4240.0, 7085.0, 11900.0, 21198.0, 40182.0, 80397.0, 159179.0, 247106.0, 216694.0, 120299.0, 59472.0, 30394.0, 16211.0, 9313.0, 5621.0, 3675.0, 2327.0, 1490.0, 998.0, 666.0, 484.0, 404.0, 231.0, 167.0, 111.0, 85.0, 50.0, 48.0, 30.0, 25.0, 19.0, 9.0, 8.0, 3.0, 1.0, 3.0, 3.0, 3.0], "bins": [-1.6533203125, -1.6043853759765625, -1.555450439453125, -1.5065155029296875, -1.45758056640625, -1.4086456298828125, -1.359710693359375, -1.3107757568359375, -1.2618408203125, -1.2129058837890625, -1.163970947265625, -1.1150360107421875, -1.06610107421875, -1.0171661376953125, -0.968231201171875, -0.9192962646484375, -0.870361328125, -0.8214263916015625, -0.772491455078125, -0.7235565185546875, -0.67462158203125, -0.6256866455078125, -0.576751708984375, -0.5278167724609375, -0.4788818359375, -0.4299468994140625, -0.381011962890625, -0.3320770263671875, -0.28314208984375, -0.2342071533203125, -0.185272216796875, -0.1363372802734375, -0.08740234375, -0.0384674072265625, 0.010467529296875, 0.0594024658203125, 0.10833740234375, 0.1572723388671875, 0.206207275390625, 0.2551422119140625, 0.3040771484375, 0.3530120849609375, 0.401947021484375, 0.4508819580078125, 0.49981689453125, 0.5487518310546875, 0.597686767578125, 0.6466217041015625, 0.695556640625, 0.7444915771484375, 0.793426513671875, 0.8423614501953125, 0.89129638671875, 0.9402313232421875, 0.989166259765625, 1.0381011962890625, 1.0870361328125, 1.1359710693359375, 1.184906005859375, 1.2338409423828125, 1.28277587890625, 1.3317108154296875, 1.380645751953125, 1.4295806884765625, 1.478515625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 6.0, 10.0, 3.0, 8.0, 6.0, 13.0, 15.0, 12.0, 7.0, 12.0, 18.0, 30.0, 38.0, 51.0, 73.0, 86.0, 102.0, 95.0, 80.0, 64.0, 49.0, 52.0, 27.0, 22.0, 18.0, 12.0, 16.0, 9.0, 11.0, 7.0, 9.0, 2.0, 9.0, 10.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62939453125, -0.607879638671875, -0.58636474609375, -0.564849853515625, -0.5433349609375, -0.521820068359375, -0.50030517578125, -0.478790283203125, -0.457275390625, -0.435760498046875, -0.41424560546875, -0.392730712890625, -0.3712158203125, -0.349700927734375, -0.32818603515625, -0.306671142578125, -0.28515625, -0.263641357421875, -0.24212646484375, -0.220611572265625, -0.1990966796875, -0.177581787109375, -0.15606689453125, -0.134552001953125, -0.113037109375, -0.091522216796875, -0.07000732421875, -0.048492431640625, -0.0269775390625, -0.005462646484375, 0.01605224609375, 0.037567138671875, 0.05908203125, 0.080596923828125, 0.10211181640625, 0.123626708984375, 0.1451416015625, 0.166656494140625, 0.18817138671875, 0.209686279296875, 0.231201171875, 0.252716064453125, 0.27423095703125, 0.295745849609375, 0.3172607421875, 0.338775634765625, 0.36029052734375, 0.381805419921875, 0.4033203125, 0.424835205078125, 0.44635009765625, 0.467864990234375, 0.4893798828125, 0.510894775390625, 0.53240966796875, 0.553924560546875, 0.575439453125, 0.596954345703125, 0.61846923828125, 0.639984130859375, 0.6614990234375, 0.683013916015625, 0.70452880859375, 0.726043701171875, 0.74755859375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 6.0, 5.0, 6.0, 9.0, 6.0, 18.0, 15.0, 11.0, 14.0, 12.0, 19.0, 27.0, 33.0, 27.0, 42.0, 32.0, 37.0, 39.0, 38.0, 37.0, 35.0, 46.0, 43.0, 50.0, 43.0, 35.0, 39.0, 31.0, 35.0, 18.0, 27.0, 28.0, 30.0, 17.0, 8.0, 16.0, 14.0, 15.0, 9.0, 7.0, 8.0, 8.0, 0.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-13.17137336730957, -12.766740798950195, -12.36210823059082, -11.957475662231445, -11.55284309387207, -11.148210525512695, -10.74357795715332, -10.338946342468262, -9.934313774108887, -9.529681205749512, -9.125048637390137, -8.720416069030762, -8.315783500671387, -7.91115140914917, -7.506518840789795, -7.101886749267578, -6.697253704071045, -6.29262113571167, -5.887988567352295, -5.483356475830078, -5.078723907470703, -4.674091339111328, -4.269458770751953, -3.8648264408111572, -3.4601938724517822, -3.0555613040924072, -2.6509289741516113, -2.2462964057922363, -1.8416639566421509, -1.4370315074920654, -1.0323989391326904, -0.6277666091918945, -0.22313404083251953, 0.1814984381198883, 0.5861309170722961, 0.9907634258270264, 1.3953958749771118, 1.8000283241271973, 2.2046608924865723, 2.609293222427368, 3.013925790786743, 3.418558359146118, 3.823190689086914, 4.227823257446289, 4.632455825805664, 5.037088394165039, 5.441720962524414, 5.846353054046631, 6.250985622406006, 6.655618190765381, 7.060250759124756, 7.464882850646973, 7.869515419006348, 8.274147987365723, 8.678780555725098, 9.083413124084473, 9.488045692443848, 9.892678260803223, 10.297310829162598, 10.701943397521973, 11.106575965881348, 11.511207580566406, 11.915840148925781, 12.320472717285156, 12.725105285644531]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 5.0, 5.0, 8.0, 5.0, 9.0, 13.0, 15.0, 18.0, 17.0, 19.0, 25.0, 24.0, 23.0, 26.0, 27.0, 31.0, 49.0, 35.0, 33.0, 36.0, 37.0, 36.0, 32.0, 35.0, 46.0, 31.0, 27.0, 35.0, 33.0, 33.0, 26.0, 24.0, 23.0, 26.0, 11.0, 19.0, 19.0, 14.0, 14.0, 15.0, 10.0, 5.0, 11.0, 3.0, 1.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.595891952514648, -12.190874099731445, -11.785857200622559, -11.380839347839355, -10.975821495056152, -10.570804595947266, -10.165786743164062, -9.76076889038086, -9.355751037597656, -8.950733184814453, -8.545716285705566, -8.140698432922363, -7.73568058013916, -7.330663204193115, -6.92564582824707, -6.520627975463867, -6.1156110763549805, -5.7105937004089355, -5.305575847625732, -4.9005584716796875, -4.495540618896484, -4.0905232429504395, -3.6855058670043945, -3.2804882526397705, -2.8754706382751465, -2.4704530239105225, -2.0654354095458984, -1.6604180335998535, -1.2554004192352295, -0.8503828048706055, -0.44536542892456055, -0.04034781455993652, 0.3646688461303711, 0.7696864008903503, 1.1747039556503296, 1.579721450805664, 1.984739065170288, 2.389756679534912, 2.794774055480957, 3.199791669845581, 3.604809284210205, 4.00982666015625, 4.414844512939453, 4.819861888885498, 5.224879264831543, 5.629897117614746, 6.034914493560791, 6.439931869506836, 6.844949722290039, 7.249967098236084, 7.654984951019287, 8.060002326965332, 8.465020179748535, 8.870037078857422, 9.275054931640625, 9.680072784423828, 10.085090637207031, 10.490108489990234, 10.895125389099121, 11.300143241882324, 11.705161094665527, 12.110177993774414, 12.515195846557617, 12.92021369934082, 13.325230598449707]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 11.0, 15.0, 24.0, 41.0, 92.0, 151.0, 229.0, 397.0, 655.0, 888.0, 1549.0, 2266.0, 3573.0, 5487.0, 8058.0, 11825.0, 16806.0, 23099.0, 31165.0, 40658.0, 51360.0, 62040.0, 72326.0, 80875.0, 85377.0, 86894.0, 84367.0, 77451.0, 68331.0, 57449.0, 46822.0, 36353.0, 27701.0, 20141.0, 14579.0, 9997.0, 6772.0, 4575.0, 2985.0, 1924.0, 1269.0, 744.0, 494.0, 299.0, 186.0, 96.0, 61.0, 47.0, 25.0, 6.0, 12.0, 10.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.2109375, -7.948486328125, -7.68603515625, -7.423583984375, -7.1611328125, -6.898681640625, -6.63623046875, -6.373779296875, -6.111328125, -5.848876953125, -5.58642578125, -5.323974609375, -5.0615234375, -4.799072265625, -4.53662109375, -4.274169921875, -4.01171875, -3.749267578125, -3.48681640625, -3.224365234375, -2.9619140625, -2.699462890625, -2.43701171875, -2.174560546875, -1.912109375, -1.649658203125, -1.38720703125, -1.124755859375, -0.8623046875, -0.599853515625, -0.33740234375, -0.074951171875, 0.1875, 0.449951171875, 0.71240234375, 0.974853515625, 1.2373046875, 1.499755859375, 1.76220703125, 2.024658203125, 2.287109375, 2.549560546875, 2.81201171875, 3.074462890625, 3.3369140625, 3.599365234375, 3.86181640625, 4.124267578125, 4.38671875, 4.649169921875, 4.91162109375, 5.174072265625, 5.4365234375, 5.698974609375, 5.96142578125, 6.223876953125, 6.486328125, 6.748779296875, 7.01123046875, 7.273681640625, 7.5361328125, 7.798583984375, 8.06103515625, 8.323486328125, 8.5859375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 4.0, 7.0, 3.0, 7.0, 7.0, 5.0, 18.0, 14.0, 17.0, 16.0, 16.0, 25.0, 25.0, 25.0, 25.0, 27.0, 30.0, 40.0, 44.0, 36.0, 26.0, 44.0, 39.0, 27.0, 38.0, 38.0, 40.0, 24.0, 34.0, 31.0, 39.0, 25.0, 24.0, 20.0, 30.0, 14.0, 14.0, 21.0, 12.0, 18.0, 12.0, 12.0, 6.0, 8.0, 7.0, 1.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.265625, -11.8736572265625, -11.481689453125, -11.0897216796875, -10.69775390625, -10.3057861328125, -9.913818359375, -9.5218505859375, -9.1298828125, -8.7379150390625, -8.345947265625, -7.9539794921875, -7.56201171875, -7.1700439453125, -6.778076171875, -6.3861083984375, -5.994140625, -5.6021728515625, -5.210205078125, -4.8182373046875, -4.42626953125, -4.0343017578125, -3.642333984375, -3.2503662109375, -2.8583984375, -2.4664306640625, -2.074462890625, -1.6824951171875, -1.29052734375, -0.8985595703125, -0.506591796875, -0.1146240234375, 0.27734375, 0.6693115234375, 1.061279296875, 1.4532470703125, 1.84521484375, 2.2371826171875, 2.629150390625, 3.0211181640625, 3.4130859375, 3.8050537109375, 4.197021484375, 4.5889892578125, 4.98095703125, 5.3729248046875, 5.764892578125, 6.1568603515625, 6.548828125, 6.9407958984375, 7.332763671875, 7.7247314453125, 8.11669921875, 8.5086669921875, 8.900634765625, 9.2926025390625, 9.6845703125, 10.0765380859375, 10.468505859375, 10.8604736328125, 11.25244140625, 11.6444091796875, 12.036376953125, 12.4283447265625, 12.8203125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 0.0, 4.0, 23.0, 19.0, 29.0, 42.0, 91.0, 118.0, 207.0, 355.0, 562.0, 905.0, 1443.0, 2262.0, 3312.0, 5159.0, 7841.0, 11457.0, 16282.0, 23081.0, 31517.0, 41594.0, 53295.0, 65025.0, 76127.0, 85084.0, 90213.0, 90553.0, 86065.0, 78305.0, 66813.0, 55558.0, 43882.0, 33112.0, 24478.0, 17549.0, 12175.0, 8326.0, 5567.0, 3617.0, 2406.0, 1525.0, 976.0, 636.0, 391.0, 218.0, 136.0, 73.0, 56.0, 39.0, 26.0, 19.0, 6.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1875, -7.9154052734375, -7.643310546875, -7.3712158203125, -7.09912109375, -6.8270263671875, -6.554931640625, -6.2828369140625, -6.0107421875, -5.7386474609375, -5.466552734375, -5.1944580078125, -4.92236328125, -4.6502685546875, -4.378173828125, -4.1060791015625, -3.833984375, -3.5618896484375, -3.289794921875, -3.0177001953125, -2.74560546875, -2.4735107421875, -2.201416015625, -1.9293212890625, -1.6572265625, -1.3851318359375, -1.113037109375, -0.8409423828125, -0.56884765625, -0.2967529296875, -0.024658203125, 0.2474365234375, 0.51953125, 0.7916259765625, 1.063720703125, 1.3358154296875, 1.60791015625, 1.8800048828125, 2.152099609375, 2.4241943359375, 2.6962890625, 2.9683837890625, 3.240478515625, 3.5125732421875, 3.78466796875, 4.0567626953125, 4.328857421875, 4.6009521484375, 4.873046875, 5.1451416015625, 5.417236328125, 5.6893310546875, 5.96142578125, 6.2335205078125, 6.505615234375, 6.7777099609375, 7.0498046875, 7.3218994140625, 7.593994140625, 7.8660888671875, 8.13818359375, 8.4102783203125, 8.682373046875, 8.9544677734375, 9.2265625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 5.0, 5.0, 2.0, 3.0, 7.0, 12.0, 13.0, 14.0, 15.0, 29.0, 16.0, 20.0, 28.0, 31.0, 14.0, 36.0, 34.0, 38.0, 37.0, 43.0, 35.0, 28.0, 36.0, 23.0, 37.0, 48.0, 40.0, 35.0, 27.0, 38.0, 39.0, 32.0, 25.0, 22.0, 26.0, 15.0, 16.0, 11.0, 10.0, 7.0, 9.0, 13.0, 9.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.2890625, -8.0181884765625, -7.747314453125, -7.4764404296875, -7.20556640625, -6.9346923828125, -6.663818359375, -6.3929443359375, -6.1220703125, -5.8511962890625, -5.580322265625, -5.3094482421875, -5.03857421875, -4.7677001953125, -4.496826171875, -4.2259521484375, -3.955078125, -3.6842041015625, -3.413330078125, -3.1424560546875, -2.87158203125, -2.6007080078125, -2.329833984375, -2.0589599609375, -1.7880859375, -1.5172119140625, -1.246337890625, -0.9754638671875, -0.70458984375, -0.4337158203125, -0.162841796875, 0.1080322265625, 0.37890625, 0.6497802734375, 0.920654296875, 1.1915283203125, 1.46240234375, 1.7332763671875, 2.004150390625, 2.2750244140625, 2.5458984375, 2.8167724609375, 3.087646484375, 3.3585205078125, 3.62939453125, 3.9002685546875, 4.171142578125, 4.4420166015625, 4.712890625, 4.9837646484375, 5.254638671875, 5.5255126953125, 5.79638671875, 6.0672607421875, 6.338134765625, 6.6090087890625, 6.8798828125, 7.1507568359375, 7.421630859375, 7.6925048828125, 7.96337890625, 8.2342529296875, 8.505126953125, 8.7760009765625, 9.046875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 6.0, 9.0, 12.0, 9.0, 21.0, 38.0, 50.0, 73.0, 111.0, 202.0, 304.0, 434.0, 666.0, 1063.0, 1544.0, 2458.0, 3735.0, 5754.0, 8673.0, 13370.0, 19719.0, 28707.0, 40113.0, 54434.0, 69987.0, 85386.0, 98179.0, 104143.0, 103062.0, 94886.0, 81527.0, 65492.0, 50294.0, 36769.0, 25571.0, 17544.0, 11709.0, 7841.0, 5172.0, 3315.0, 2099.0, 1379.0, 971.0, 567.0, 410.0, 246.0, 153.0, 110.0, 89.0, 52.0, 46.0, 26.0, 11.0, 11.0, 6.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.16796875, -4.03289794921875, -3.8978271484375, -3.76275634765625, -3.627685546875, -3.49261474609375, -3.3575439453125, -3.22247314453125, -3.08740234375, -2.95233154296875, -2.8172607421875, -2.68218994140625, -2.547119140625, -2.41204833984375, -2.2769775390625, -2.14190673828125, -2.0068359375, -1.87176513671875, -1.7366943359375, -1.60162353515625, -1.466552734375, -1.33148193359375, -1.1964111328125, -1.06134033203125, -0.92626953125, -0.79119873046875, -0.6561279296875, -0.52105712890625, -0.385986328125, -0.25091552734375, -0.1158447265625, 0.01922607421875, 0.154296875, 0.28936767578125, 0.4244384765625, 0.55950927734375, 0.694580078125, 0.82965087890625, 0.9647216796875, 1.09979248046875, 1.23486328125, 1.36993408203125, 1.5050048828125, 1.64007568359375, 1.775146484375, 1.91021728515625, 2.0452880859375, 2.18035888671875, 2.3154296875, 2.45050048828125, 2.5855712890625, 2.72064208984375, 2.855712890625, 2.99078369140625, 3.1258544921875, 3.26092529296875, 3.39599609375, 3.53106689453125, 3.6661376953125, 3.80120849609375, 3.936279296875, 4.07135009765625, 4.2064208984375, 4.34149169921875, 4.4765625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 6.0, 7.0, 9.0, 7.0, 11.0, 10.0, 18.0, 17.0, 17.0, 18.0, 33.0, 24.0, 23.0, 40.0, 48.0, 32.0, 30.0, 46.0, 43.0, 49.0, 48.0, 43.0, 53.0, 38.0, 41.0, 34.0, 31.0, 37.0, 26.0, 26.0, 24.0, 23.0, 24.0, 18.0, 12.0, 6.0, 7.0, 4.0, 6.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005769729614257812, -0.0005591660737991333, -0.0005413591861724854, -0.0005235522985458374, -0.0005057454109191895, -0.0004879385232925415, -0.00047013163566589355, -0.0004523247480392456, -0.00043451786041259766, -0.0004167109727859497, -0.00039890408515930176, -0.0003810971975326538, -0.00036329030990600586, -0.0003454834222793579, -0.00032767653465270996, -0.000309869647026062, -0.00029206275939941406, -0.0002742558717727661, -0.00025644898414611816, -0.00023864209651947021, -0.00022083520889282227, -0.00020302832126617432, -0.00018522143363952637, -0.00016741454601287842, -0.00014960765838623047, -0.00013180077075958252, -0.00011399388313293457, -9.618699550628662e-05, -7.838010787963867e-05, -6.057322025299072e-05, -4.2766332626342773e-05, -2.4959444999694824e-05, -7.152557373046875e-06, 1.0654330253601074e-05, 2.8461217880249023e-05, 4.626810550689697e-05, 6.407499313354492e-05, 8.188188076019287e-05, 9.968876838684082e-05, 0.00011749565601348877, 0.00013530254364013672, 0.00015310943126678467, 0.00017091631889343262, 0.00018872320652008057, 0.00020653009414672852, 0.00022433698177337646, 0.00024214386940002441, 0.00025995075702667236, 0.0002777576446533203, 0.00029556453227996826, 0.0003133714199066162, 0.00033117830753326416, 0.0003489851951599121, 0.00036679208278656006, 0.000384598970413208, 0.00040240585803985596, 0.0004202127456665039, 0.00043801963329315186, 0.0004558265209197998, 0.00047363340854644775, 0.0004914402961730957, 0.0005092471837997437, 0.0005270540714263916, 0.0005448609590530396, 0.0005626678466796875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 11.0, 16.0, 21.0, 36.0, 65.0, 103.0, 149.0, 245.0, 373.0, 603.0, 963.0, 1581.0, 2614.0, 4212.0, 7069.0, 11242.0, 18101.0, 27959.0, 42861.0, 61657.0, 83941.0, 104521.0, 119798.0, 123334.0, 114953.0, 96448.0, 74097.0, 53311.0, 36085.0, 23522.0, 14811.0, 9171.0, 5649.0, 3426.0, 2186.0, 1287.0, 799.0, 509.0, 289.0, 197.0, 131.0, 75.0, 42.0, 37.0, 14.0, 15.0, 16.0, 9.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-6.1484375, -5.9637451171875, -5.779052734375, -5.5943603515625, -5.40966796875, -5.2249755859375, -5.040283203125, -4.8555908203125, -4.6708984375, -4.4862060546875, -4.301513671875, -4.1168212890625, -3.93212890625, -3.7474365234375, -3.562744140625, -3.3780517578125, -3.193359375, -3.0086669921875, -2.823974609375, -2.6392822265625, -2.45458984375, -2.2698974609375, -2.085205078125, -1.9005126953125, -1.7158203125, -1.5311279296875, -1.346435546875, -1.1617431640625, -0.97705078125, -0.7923583984375, -0.607666015625, -0.4229736328125, -0.23828125, -0.0535888671875, 0.131103515625, 0.3157958984375, 0.50048828125, 0.6851806640625, 0.869873046875, 1.0545654296875, 1.2392578125, 1.4239501953125, 1.608642578125, 1.7933349609375, 1.97802734375, 2.1627197265625, 2.347412109375, 2.5321044921875, 2.716796875, 2.9014892578125, 3.086181640625, 3.2708740234375, 3.45556640625, 3.6402587890625, 3.824951171875, 4.0096435546875, 4.1943359375, 4.3790283203125, 4.563720703125, 4.7484130859375, 4.93310546875, 5.1177978515625, 5.302490234375, 5.4871826171875, 5.671875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 8.0, 7.0, 8.0, 16.0, 9.0, 12.0, 25.0, 12.0, 18.0, 25.0, 44.0, 40.0, 35.0, 48.0, 44.0, 39.0, 52.0, 44.0, 52.0, 45.0, 47.0, 43.0, 54.0, 43.0, 42.0, 31.0, 35.0, 20.0, 21.0, 23.0, 8.0, 12.0, 10.0, 10.0, 7.0, 5.0, 2.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.365234375, -2.2862548828125, -2.207275390625, -2.1282958984375, -2.04931640625, -1.9703369140625, -1.891357421875, -1.8123779296875, -1.7333984375, -1.6544189453125, -1.575439453125, -1.4964599609375, -1.41748046875, -1.3385009765625, -1.259521484375, -1.1805419921875, -1.1015625, -1.0225830078125, -0.943603515625, -0.8646240234375, -0.78564453125, -0.7066650390625, -0.627685546875, -0.5487060546875, -0.4697265625, -0.3907470703125, -0.311767578125, -0.2327880859375, -0.15380859375, -0.0748291015625, 0.004150390625, 0.0831298828125, 0.162109375, 0.2410888671875, 0.320068359375, 0.3990478515625, 0.47802734375, 0.5570068359375, 0.635986328125, 0.7149658203125, 0.7939453125, 0.8729248046875, 0.951904296875, 1.0308837890625, 1.10986328125, 1.1888427734375, 1.267822265625, 1.3468017578125, 1.42578125, 1.5047607421875, 1.583740234375, 1.6627197265625, 1.74169921875, 1.8206787109375, 1.899658203125, 1.9786376953125, 2.0576171875, 2.1365966796875, 2.215576171875, 2.2945556640625, 2.37353515625, 2.4525146484375, 2.531494140625, 2.6104736328125, 2.689453125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 3.0, 4.0, 6.0, 5.0, 7.0, 12.0, 5.0, 12.0, 6.0, 24.0, 27.0, 23.0, 25.0, 23.0, 31.0, 34.0, 40.0, 33.0, 47.0, 42.0, 53.0, 45.0, 33.0, 41.0, 37.0, 44.0, 34.0, 39.0, 35.0, 37.0, 26.0, 25.0, 30.0, 21.0, 13.0, 8.0, 13.0, 20.0, 13.0, 5.0, 9.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.258975982666016, -11.840922355651855, -11.422869682312012, -11.004816055297852, -10.586762428283691, -10.168708801269531, -9.750656127929688, -9.332602500915527, -8.914548873901367, -8.496495246887207, -8.078442573547363, -7.660388946533203, -7.242335319519043, -6.824282169342041, -6.406229019165039, -5.988175392150879, -5.570122718811035, -5.152069568634033, -4.734015941619873, -4.315962791442871, -3.89790940284729, -3.479856014251709, -3.061802864074707, -2.643749475479126, -2.225696086883545, -1.8076426982879639, -1.3895894289016724, -0.9715361595153809, -0.5534827709197998, -0.13542938232421875, 0.2826237678527832, 0.7006771564483643, 1.1187314987182617, 1.5367848873138428, 1.9548381567001343, 2.372891426086426, 2.790944814682007, 3.208998203277588, 3.62705135345459, 4.04510498046875, 4.463158130645752, 4.881211280822754, 5.299264907836914, 5.717318058013916, 6.135371208190918, 6.553424835205078, 6.97147798538208, 7.389531135559082, 7.807584762573242, 8.225638389587402, 8.643691062927246, 9.061744689941406, 9.479798316955566, 9.897851943969727, 10.31590461730957, 10.73395824432373, 11.15201187133789, 11.57006549835205, 11.988118171691895, 12.406171798706055, 12.824225425720215, 13.242279052734375, 13.660331726074219, 14.078385353088379, 14.496438026428223]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 7.0, 5.0, 9.0, 7.0, 2.0, 4.0, 8.0, 9.0, 16.0, 13.0, 24.0, 23.0, 20.0, 26.0, 35.0, 27.0, 34.0, 30.0, 40.0, 28.0, 35.0, 23.0, 36.0, 27.0, 43.0, 30.0, 43.0, 45.0, 32.0, 33.0, 31.0, 18.0, 33.0, 30.0, 27.0, 23.0, 10.0, 20.0, 20.0, 23.0, 16.0, 11.0, 6.0, 6.0, 2.0, 3.0, 2.0, 4.0, 3.0, 1.0, 4.0, 3.0, 3.0, 1.0, 1.0], "bins": [-14.283504486083984, -13.853324890136719, -13.423145294189453, -12.992965698242188, -12.562786102294922, -12.132606506347656, -11.702427864074707, -11.272248268127441, -10.842068672180176, -10.41188907623291, -9.981709480285645, -9.551529884338379, -9.12135124206543, -8.691171646118164, -8.260992050170898, -7.830812454223633, -7.400632858276367, -6.970453262329102, -6.540273666381836, -6.1100945472717285, -5.679914951324463, -5.249735355377197, -4.81955623626709, -4.389376640319824, -3.9591970443725586, -3.529017448425293, -3.0988380908966064, -2.66865873336792, -2.2384791374206543, -1.8082995414733887, -1.3781201839447021, -0.9479408264160156, -0.5177621841430664, -0.08758270740509033, 0.34259676933288574, 0.7727762460708618, 1.202955722808838, 1.6331353187561035, 2.06331467628479, 2.4934940338134766, 2.923673629760742, 3.353853225708008, 3.7840325832366943, 4.214211940765381, 4.6443915367126465, 5.074571132659912, 5.5047502517700195, 5.934929847717285, 6.365109443664551, 6.795289039611816, 7.225468635559082, 7.6556477546691895, 8.085826873779297, 8.516006469726562, 8.946186065673828, 9.376365661621094, 9.80654525756836, 10.236724853515625, 10.66690444946289, 11.097084045410156, 11.527263641357422, 11.957443237304688, 12.387621879577637, 12.817801475524902, 13.247981071472168]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 13.0, 26.0, 32.0, 53.0, 95.0, 120.0, 252.0, 385.0, 601.0, 908.0, 1484.0, 2386.0, 3948.0, 6133.0, 9481.0, 14867.0, 22909.0, 34173.0, 50825.0, 74028.0, 105503.0, 144804.0, 193267.0, 246506.0, 300130.0, 346664.0, 378673.0, 386931.0, 374350.0, 338674.0, 290730.0, 237321.0, 183953.0, 137274.0, 99229.0, 69708.0, 48035.0, 31809.0, 21016.0, 13665.0, 8782.0, 5577.0, 3495.0, 2125.0, 1322.0, 791.0, 506.0, 298.0, 184.0, 96.0, 70.0, 33.0, 26.0, 7.0, 7.0, 2.0, 3.0, 3.0], "bins": [-9.7265625, -9.4354248046875, -9.144287109375, -8.8531494140625, -8.56201171875, -8.2708740234375, -7.979736328125, -7.6885986328125, -7.3974609375, -7.1063232421875, -6.815185546875, -6.5240478515625, -6.23291015625, -5.9417724609375, -5.650634765625, -5.3594970703125, -5.068359375, -4.7772216796875, -4.486083984375, -4.1949462890625, -3.90380859375, -3.6126708984375, -3.321533203125, -3.0303955078125, -2.7392578125, -2.4481201171875, -2.156982421875, -1.8658447265625, -1.57470703125, -1.2835693359375, -0.992431640625, -0.7012939453125, -0.41015625, -0.1190185546875, 0.172119140625, 0.4632568359375, 0.75439453125, 1.0455322265625, 1.336669921875, 1.6278076171875, 1.9189453125, 2.2100830078125, 2.501220703125, 2.7923583984375, 3.08349609375, 3.3746337890625, 3.665771484375, 3.9569091796875, 4.248046875, 4.5391845703125, 4.830322265625, 5.1214599609375, 5.41259765625, 5.7037353515625, 5.994873046875, 6.2860107421875, 6.5771484375, 6.8682861328125, 7.159423828125, 7.4505615234375, 7.74169921875, 8.0328369140625, 8.323974609375, 8.6151123046875, 8.90625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 2.0, 5.0, 8.0, 10.0, 4.0, 5.0, 3.0, 9.0, 9.0, 11.0, 14.0, 27.0, 20.0, 18.0, 30.0, 35.0, 25.0, 32.0, 27.0, 37.0, 35.0, 39.0, 21.0, 30.0, 25.0, 44.0, 37.0, 32.0, 49.0, 31.0, 38.0, 26.0, 23.0, 25.0, 26.0, 35.0, 24.0, 13.0, 17.0, 19.0, 25.0, 18.0, 9.0, 10.0, 7.0, 1.0, 4.0, 2.0, 3.0, 3.0, 1.0, 4.0, 4.0, 1.0, 2.0, 2.0], "bins": [-12.6875, -12.3055419921875, -11.923583984375, -11.5416259765625, -11.15966796875, -10.7777099609375, -10.395751953125, -10.0137939453125, -9.6318359375, -9.2498779296875, -8.867919921875, -8.4859619140625, -8.10400390625, -7.7220458984375, -7.340087890625, -6.9581298828125, -6.576171875, -6.1942138671875, -5.812255859375, -5.4302978515625, -5.04833984375, -4.6663818359375, -4.284423828125, -3.9024658203125, -3.5205078125, -3.1385498046875, -2.756591796875, -2.3746337890625, -1.99267578125, -1.6107177734375, -1.228759765625, -0.8468017578125, -0.46484375, -0.0828857421875, 0.299072265625, 0.6810302734375, 1.06298828125, 1.4449462890625, 1.826904296875, 2.2088623046875, 2.5908203125, 2.9727783203125, 3.354736328125, 3.7366943359375, 4.11865234375, 4.5006103515625, 4.882568359375, 5.2645263671875, 5.646484375, 6.0284423828125, 6.410400390625, 6.7923583984375, 7.17431640625, 7.5562744140625, 7.938232421875, 8.3201904296875, 8.7021484375, 9.0841064453125, 9.466064453125, 9.8480224609375, 10.22998046875, 10.6119384765625, 10.993896484375, 11.3758544921875, 11.7578125]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 5.0, 9.0, 17.0, 24.0, 48.0, 70.0, 142.0, 207.0, 356.0, 571.0, 962.0, 1731.0, 2516.0, 4228.0, 6857.0, 10594.0, 16272.0, 25056.0, 37239.0, 54156.0, 77201.0, 106267.0, 142176.0, 183903.0, 228781.0, 273577.0, 312054.0, 339258.0, 352237.0, 349502.0, 329485.0, 293829.0, 252922.0, 209530.0, 165111.0, 124887.0, 92048.0, 66349.0, 45716.0, 31092.0, 20828.0, 13616.0, 8652.0, 5477.0, 3462.0, 2051.0, 1289.0, 766.0, 495.0, 281.0, 160.0, 113.0, 44.0, 27.0, 22.0, 13.0, 7.0, 4.0, 2.0, 3.0], "bins": [-9.421875, -9.1343994140625, -8.846923828125, -8.5594482421875, -8.27197265625, -7.9844970703125, -7.697021484375, -7.4095458984375, -7.1220703125, -6.8345947265625, -6.547119140625, -6.2596435546875, -5.97216796875, -5.6846923828125, -5.397216796875, -5.1097412109375, -4.822265625, -4.5347900390625, -4.247314453125, -3.9598388671875, -3.67236328125, -3.3848876953125, -3.097412109375, -2.8099365234375, -2.5224609375, -2.2349853515625, -1.947509765625, -1.6600341796875, -1.37255859375, -1.0850830078125, -0.797607421875, -0.5101318359375, -0.22265625, 0.0648193359375, 0.352294921875, 0.6397705078125, 0.92724609375, 1.2147216796875, 1.502197265625, 1.7896728515625, 2.0771484375, 2.3646240234375, 2.652099609375, 2.9395751953125, 3.22705078125, 3.5145263671875, 3.802001953125, 4.0894775390625, 4.376953125, 4.6644287109375, 4.951904296875, 5.2393798828125, 5.52685546875, 5.8143310546875, 6.101806640625, 6.3892822265625, 6.6767578125, 6.9642333984375, 7.251708984375, 7.5391845703125, 7.82666015625, 8.1141357421875, 8.401611328125, 8.6890869140625, 8.9765625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 10.0, 9.0, 8.0, 7.0, 8.0, 24.0, 20.0, 25.0, 25.0, 34.0, 59.0, 74.0, 79.0, 90.0, 110.0, 109.0, 148.0, 144.0, 149.0, 171.0, 171.0, 198.0, 193.0, 183.0, 170.0, 196.0, 195.0, 184.0, 169.0, 162.0, 151.0, 108.0, 102.0, 111.0, 99.0, 69.0, 76.0, 45.0, 42.0, 35.0, 38.0, 25.0, 15.0, 10.0, 12.0, 4.0, 3.0, 6.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.76953125, -5.582275390625, -5.39501953125, -5.207763671875, -5.0205078125, -4.833251953125, -4.64599609375, -4.458740234375, -4.271484375, -4.084228515625, -3.89697265625, -3.709716796875, -3.5224609375, -3.335205078125, -3.14794921875, -2.960693359375, -2.7734375, -2.586181640625, -2.39892578125, -2.211669921875, -2.0244140625, -1.837158203125, -1.64990234375, -1.462646484375, -1.275390625, -1.088134765625, -0.90087890625, -0.713623046875, -0.5263671875, -0.339111328125, -0.15185546875, 0.035400390625, 0.22265625, 0.409912109375, 0.59716796875, 0.784423828125, 0.9716796875, 1.158935546875, 1.34619140625, 1.533447265625, 1.720703125, 1.907958984375, 2.09521484375, 2.282470703125, 2.4697265625, 2.656982421875, 2.84423828125, 3.031494140625, 3.21875, 3.406005859375, 3.59326171875, 3.780517578125, 3.9677734375, 4.155029296875, 4.34228515625, 4.529541015625, 4.716796875, 4.904052734375, 5.09130859375, 5.278564453125, 5.4658203125, 5.653076171875, 5.84033203125, 6.027587890625, 6.21484375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 9.0, 5.0, 10.0, 9.0, 13.0, 21.0, 28.0, 25.0, 19.0, 36.0, 19.0, 33.0, 22.0, 36.0, 46.0, 34.0, 53.0, 36.0, 46.0, 47.0, 44.0, 43.0, 48.0, 45.0, 27.0, 35.0, 25.0, 31.0, 28.0, 26.0, 18.0, 13.0, 15.0, 8.0, 10.0, 8.0, 11.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.842455863952637, -14.399292945861816, -13.95612907409668, -13.51296615600586, -13.069803237915039, -12.626640319824219, -12.183477401733398, -11.740313529968262, -11.297150611877441, -10.853987693786621, -10.410823822021484, -9.967660903930664, -9.524497985839844, -9.081335067749023, -8.638172149658203, -8.195008277893066, -7.751845359802246, -7.308682441711426, -6.865519046783447, -6.422355651855469, -5.979192733764648, -5.536029815673828, -5.09286642074585, -4.649703025817871, -4.206540107727051, -3.7633769512176514, -3.320213794708252, -2.8770506381988525, -2.433887481689453, -1.9907243251800537, -1.5475611686706543, -1.1043980121612549, -0.6612358093261719, -0.21807265281677246, 0.22509050369262695, 0.6682536602020264, 1.1114168167114258, 1.5545799732208252, 1.9977431297302246, 2.440906286239624, 2.8840694427490234, 3.327232599258423, 3.7703957557678223, 4.213559150695801, 4.656722068786621, 5.099884986877441, 5.54304838180542, 5.986211776733398, 6.429374694824219, 6.872537612915039, 7.315701007843018, 7.758864402770996, 8.202027320861816, 8.645190238952637, 9.088354110717773, 9.531517028808594, 9.974679946899414, 10.417842864990234, 10.861005783081055, 11.304169654846191, 11.747332572937012, 12.190495491027832, 12.633659362792969, 13.076822280883789, 13.51998519897461]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 7.0, 4.0, 11.0, 7.0, 16.0, 15.0, 15.0, 15.0, 10.0, 26.0, 21.0, 24.0, 28.0, 28.0, 37.0, 34.0, 45.0, 28.0, 38.0, 46.0, 34.0, 37.0, 33.0, 41.0, 27.0, 38.0, 33.0, 42.0, 28.0, 29.0, 26.0, 33.0, 15.0, 15.0, 23.0, 16.0, 13.0, 7.0, 13.0, 4.0, 7.0, 7.0, 3.0, 5.0, 2.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0], "bins": [-15.027436256408691, -14.58669662475586, -14.145956993103027, -13.705217361450195, -13.264477729797363, -12.823738098144531, -12.3829984664917, -11.942258834838867, -11.501519203186035, -11.060779571533203, -10.620039939880371, -10.179300308227539, -9.738560676574707, -9.297821044921875, -8.857081413269043, -8.416341781616211, -7.975601673126221, -7.534862041473389, -7.094122409820557, -6.653382778167725, -6.212643146514893, -5.771903038024902, -5.33116340637207, -4.890423774719238, -4.449684143066406, -4.008944511413574, -3.568204879760742, -3.12746524810791, -2.686725616455078, -2.245985746383667, -1.805246114730835, -1.364506483078003, -0.92376708984375, -0.4830274283885956, -0.04228776693344116, 0.39845192432403564, 0.8391915559768677, 1.2799313068389893, 1.7206709384918213, 2.1614105701446533, 2.6021502017974854, 3.0428898334503174, 3.4836294651031494, 3.9243693351745605, 4.365108966827393, 4.805848598480225, 5.246588230133057, 5.687327861785889, 6.128067493438721, 6.568807125091553, 7.009546756744385, 7.450286388397217, 7.891026020050049, 8.331766128540039, 8.772505760192871, 9.213245391845703, 9.653985023498535, 10.094724655151367, 10.5354642868042, 10.976203918457031, 11.416943550109863, 11.857683181762695, 12.298422813415527, 12.73916244506836, 13.179902076721191]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 11.0, 5.0, 10.0, 10.0, 17.0, 27.0, 38.0, 43.0, 95.0, 98.0, 137.0, 218.0, 366.0, 528.0, 737.0, 1191.0, 1856.0, 2993.0, 4917.0, 7931.0, 13384.0, 22555.0, 37947.0, 63435.0, 98655.0, 141623.0, 169179.0, 159199.0, 120014.0, 78917.0, 48678.0, 29293.0, 17628.0, 10205.0, 6206.0, 3776.0, 2303.0, 1488.0, 984.0, 560.0, 406.0, 292.0, 180.0, 121.0, 87.0, 71.0, 44.0, 30.0, 21.0, 15.0, 14.0, 8.0, 10.0, 2.0, 5.0, 3.0], "bins": [-2.62109375, -2.545654296875, -2.47021484375, -2.394775390625, -2.3193359375, -2.243896484375, -2.16845703125, -2.093017578125, -2.017578125, -1.942138671875, -1.86669921875, -1.791259765625, -1.7158203125, -1.640380859375, -1.56494140625, -1.489501953125, -1.4140625, -1.338623046875, -1.26318359375, -1.187744140625, -1.1123046875, -1.036865234375, -0.96142578125, -0.885986328125, -0.810546875, -0.735107421875, -0.65966796875, -0.584228515625, -0.5087890625, -0.433349609375, -0.35791015625, -0.282470703125, -0.20703125, -0.131591796875, -0.05615234375, 0.019287109375, 0.0947265625, 0.170166015625, 0.24560546875, 0.321044921875, 0.396484375, 0.471923828125, 0.54736328125, 0.622802734375, 0.6982421875, 0.773681640625, 0.84912109375, 0.924560546875, 1.0, 1.075439453125, 1.15087890625, 1.226318359375, 1.3017578125, 1.377197265625, 1.45263671875, 1.528076171875, 1.603515625, 1.678955078125, 1.75439453125, 1.829833984375, 1.9052734375, 1.980712890625, 2.05615234375, 2.131591796875, 2.20703125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 7.0, 4.0, 11.0, 7.0, 16.0, 16.0, 14.0, 14.0, 11.0, 28.0, 18.0, 25.0, 29.0, 27.0, 37.0, 35.0, 44.0, 28.0, 39.0, 44.0, 35.0, 38.0, 33.0, 41.0, 26.0, 38.0, 33.0, 40.0, 29.0, 30.0, 26.0, 33.0, 13.0, 17.0, 23.0, 16.0, 13.0, 6.0, 14.0, 4.0, 7.0, 8.0, 2.0, 5.0, 2.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0], "bins": [-14.96875, -14.5284423828125, -14.088134765625, -13.6478271484375, -13.20751953125, -12.7672119140625, -12.326904296875, -11.8865966796875, -11.4462890625, -11.0059814453125, -10.565673828125, -10.1253662109375, -9.68505859375, -9.2447509765625, -8.804443359375, -8.3641357421875, -7.923828125, -7.4835205078125, -7.043212890625, -6.6029052734375, -6.16259765625, -5.7222900390625, -5.281982421875, -4.8416748046875, -4.4013671875, -3.9610595703125, -3.520751953125, -3.0804443359375, -2.64013671875, -2.1998291015625, -1.759521484375, -1.3192138671875, -0.87890625, -0.4385986328125, 0.001708984375, 0.4420166015625, 0.88232421875, 1.3226318359375, 1.762939453125, 2.2032470703125, 2.6435546875, 3.0838623046875, 3.524169921875, 3.9644775390625, 4.40478515625, 4.8450927734375, 5.285400390625, 5.7257080078125, 6.166015625, 6.6063232421875, 7.046630859375, 7.4869384765625, 7.92724609375, 8.3675537109375, 8.807861328125, 9.2481689453125, 9.6884765625, 10.1287841796875, 10.569091796875, 11.0093994140625, 11.44970703125, 11.8900146484375, 12.330322265625, 12.7706298828125, 13.2109375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 14.0, 11.0, 14.0, 25.0, 31.0, 48.0, 60.0, 97.0, 147.0, 195.0, 266.0, 444.0, 626.0, 980.0, 1645.0, 2580.0, 4127.0, 7111.0, 12328.0, 22252.0, 42919.0, 84027.0, 165514.0, 254747.0, 211072.0, 113449.0, 56713.0, 29325.0, 15905.0, 8613.0, 5041.0, 2981.0, 1819.0, 1143.0, 761.0, 499.0, 307.0, 196.0, 146.0, 116.0, 73.0, 47.0, 35.0, 40.0, 16.0, 17.0, 10.0, 9.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.3515625, -3.245880126953125, -3.14019775390625, -3.034515380859375, -2.9288330078125, -2.823150634765625, -2.71746826171875, -2.611785888671875, -2.506103515625, -2.400421142578125, -2.29473876953125, -2.189056396484375, -2.0833740234375, -1.977691650390625, -1.87200927734375, -1.766326904296875, -1.66064453125, -1.554962158203125, -1.44927978515625, -1.343597412109375, -1.2379150390625, -1.132232666015625, -1.02655029296875, -0.920867919921875, -0.815185546875, -0.709503173828125, -0.60382080078125, -0.498138427734375, -0.3924560546875, -0.286773681640625, -0.18109130859375, -0.075408935546875, 0.0302734375, 0.135955810546875, 0.24163818359375, 0.347320556640625, 0.4530029296875, 0.558685302734375, 0.66436767578125, 0.770050048828125, 0.875732421875, 0.981414794921875, 1.08709716796875, 1.192779541015625, 1.2984619140625, 1.404144287109375, 1.50982666015625, 1.615509033203125, 1.72119140625, 1.826873779296875, 1.93255615234375, 2.038238525390625, 2.1439208984375, 2.249603271484375, 2.35528564453125, 2.460968017578125, 2.566650390625, 2.672332763671875, 2.77801513671875, 2.883697509765625, 2.9893798828125, 3.095062255859375, 3.20074462890625, 3.306427001953125, 3.412109375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 2.0, 6.0, 8.0, 8.0, 8.0, 15.0, 15.0, 14.0, 28.0, 26.0, 25.0, 29.0, 32.0, 30.0, 31.0, 33.0, 37.0, 37.0, 36.0, 45.0, 50.0, 43.0, 37.0, 40.0, 38.0, 36.0, 34.0, 35.0, 35.0, 30.0, 26.0, 18.0, 10.0, 24.0, 12.0, 16.0, 2.0, 8.0, 17.0, 2.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-10.234375, -9.93505859375, -9.6357421875, -9.33642578125, -9.037109375, -8.73779296875, -8.4384765625, -8.13916015625, -7.83984375, -7.54052734375, -7.2412109375, -6.94189453125, -6.642578125, -6.34326171875, -6.0439453125, -5.74462890625, -5.4453125, -5.14599609375, -4.8466796875, -4.54736328125, -4.248046875, -3.94873046875, -3.6494140625, -3.35009765625, -3.05078125, -2.75146484375, -2.4521484375, -2.15283203125, -1.853515625, -1.55419921875, -1.2548828125, -0.95556640625, -0.65625, -0.35693359375, -0.0576171875, 0.24169921875, 0.541015625, 0.84033203125, 1.1396484375, 1.43896484375, 1.73828125, 2.03759765625, 2.3369140625, 2.63623046875, 2.935546875, 3.23486328125, 3.5341796875, 3.83349609375, 4.1328125, 4.43212890625, 4.7314453125, 5.03076171875, 5.330078125, 5.62939453125, 5.9287109375, 6.22802734375, 6.52734375, 6.82666015625, 7.1259765625, 7.42529296875, 7.724609375, 8.02392578125, 8.3232421875, 8.62255859375, 8.921875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 10.0, 8.0, 20.0, 13.0, 35.0, 46.0, 60.0, 65.0, 120.0, 129.0, 217.0, 315.0, 451.0, 619.0, 1023.0, 1494.0, 2313.0, 3596.0, 5945.0, 10615.0, 19656.0, 41520.0, 103582.0, 284524.0, 335601.0, 132458.0, 50523.0, 23210.0, 12108.0, 6884.0, 4010.0, 2491.0, 1584.0, 1062.0, 699.0, 459.0, 312.0, 236.0, 166.0, 102.0, 85.0, 52.0, 43.0, 26.0, 30.0, 16.0, 8.0, 8.0, 3.0, 3.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.05078125, -1.0170135498046875, -0.983245849609375, -0.9494781494140625, -0.91571044921875, -0.8819427490234375, -0.848175048828125, -0.8144073486328125, -0.7806396484375, -0.7468719482421875, -0.713104248046875, -0.6793365478515625, -0.64556884765625, -0.6118011474609375, -0.578033447265625, -0.5442657470703125, -0.510498046875, -0.4767303466796875, -0.442962646484375, -0.4091949462890625, -0.37542724609375, -0.3416595458984375, -0.307891845703125, -0.2741241455078125, -0.2403564453125, -0.2065887451171875, -0.172821044921875, -0.1390533447265625, -0.10528564453125, -0.0715179443359375, -0.037750244140625, -0.0039825439453125, 0.02978515625, 0.0635528564453125, 0.097320556640625, 0.1310882568359375, 0.16485595703125, 0.1986236572265625, 0.232391357421875, 0.2661590576171875, 0.2999267578125, 0.3336944580078125, 0.367462158203125, 0.4012298583984375, 0.43499755859375, 0.4687652587890625, 0.502532958984375, 0.5363006591796875, 0.570068359375, 0.6038360595703125, 0.637603759765625, 0.6713714599609375, 0.70513916015625, 0.7389068603515625, 0.772674560546875, 0.8064422607421875, 0.8402099609375, 0.8739776611328125, 0.907745361328125, 0.9415130615234375, 0.97528076171875, 1.0090484619140625, 1.042816162109375, 1.0765838623046875, 1.1103515625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 5.0, 3.0, 6.0, 11.0, 15.0, 16.0, 12.0, 19.0, 21.0, 28.0, 33.0, 30.0, 33.0, 38.0, 29.0, 43.0, 38.0, 37.0, 39.0, 47.0, 55.0, 53.0, 50.0, 50.0, 39.0, 45.0, 32.0, 28.0, 22.0, 20.0, 18.0, 17.0, 16.0, 12.0, 12.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.43865966796875e-05, -7.17993825674057e-05, -6.92121684551239e-05, -6.66249543428421e-05, -6.40377402305603e-05, -6.14505261182785e-05, -5.8863312005996704e-05, -5.6276097893714905e-05, -5.3688883781433105e-05, -5.1101669669151306e-05, -4.851445555686951e-05, -4.592724144458771e-05, -4.334002733230591e-05, -4.075281322002411e-05, -3.816559910774231e-05, -3.557838499546051e-05, -3.299117088317871e-05, -3.040395677089691e-05, -2.7816742658615112e-05, -2.5229528546333313e-05, -2.2642314434051514e-05, -2.0055100321769714e-05, -1.7467886209487915e-05, -1.4880672097206116e-05, -1.2293457984924316e-05, -9.706243872642517e-06, -7.119029760360718e-06, -4.5318156480789185e-06, -1.944601535797119e-06, 6.426125764846802e-07, 3.2298266887664795e-06, 5.817040801048279e-06, 8.404254913330078e-06, 1.0991469025611877e-05, 1.3578683137893677e-05, 1.6165897250175476e-05, 1.8753111362457275e-05, 2.1340325474739075e-05, 2.3927539587020874e-05, 2.6514753699302673e-05, 2.9101967811584473e-05, 3.168918192386627e-05, 3.427639603614807e-05, 3.686361014842987e-05, 3.945082426071167e-05, 4.203803837299347e-05, 4.462525248527527e-05, 4.721246659755707e-05, 4.979968070983887e-05, 5.2386894822120667e-05, 5.4974108934402466e-05, 5.7561323046684265e-05, 6.0148537158966064e-05, 6.273575127124786e-05, 6.532296538352966e-05, 6.791017949581146e-05, 7.049739360809326e-05, 7.308460772037506e-05, 7.567182183265686e-05, 7.825903594493866e-05, 8.084625005722046e-05, 8.343346416950226e-05, 8.602067828178406e-05, 8.860789239406586e-05, 9.119510650634766e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 4.0, 9.0, 11.0, 9.0, 18.0, 17.0, 29.0, 37.0, 56.0, 81.0, 100.0, 181.0, 273.0, 402.0, 655.0, 982.0, 1503.0, 2274.0, 3771.0, 5974.0, 9914.0, 16708.0, 29238.0, 51951.0, 93278.0, 159641.0, 217307.0, 186318.0, 115471.0, 64415.0, 35859.0, 20406.0, 12121.0, 7350.0, 4518.0, 2726.0, 1702.0, 1130.0, 711.0, 470.0, 303.0, 213.0, 128.0, 82.0, 65.0, 49.0, 42.0, 14.0, 11.0, 14.0, 9.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.3212890625, -1.278228759765625, -1.23516845703125, -1.192108154296875, -1.1490478515625, -1.105987548828125, -1.06292724609375, -1.019866943359375, -0.976806640625, -0.933746337890625, -0.89068603515625, -0.847625732421875, -0.8045654296875, -0.761505126953125, -0.71844482421875, -0.675384521484375, -0.63232421875, -0.589263916015625, -0.54620361328125, -0.503143310546875, -0.4600830078125, -0.417022705078125, -0.37396240234375, -0.330902099609375, -0.287841796875, -0.244781494140625, -0.20172119140625, -0.158660888671875, -0.1156005859375, -0.072540283203125, -0.02947998046875, 0.013580322265625, 0.056640625, 0.099700927734375, 0.14276123046875, 0.185821533203125, 0.2288818359375, 0.271942138671875, 0.31500244140625, 0.358062744140625, 0.401123046875, 0.444183349609375, 0.48724365234375, 0.530303955078125, 0.5733642578125, 0.616424560546875, 0.65948486328125, 0.702545166015625, 0.74560546875, 0.788665771484375, 0.83172607421875, 0.874786376953125, 0.9178466796875, 0.960906982421875, 1.00396728515625, 1.047027587890625, 1.090087890625, 1.133148193359375, 1.17620849609375, 1.219268798828125, 1.2623291015625, 1.305389404296875, 1.34844970703125, 1.391510009765625, 1.4345703125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 4.0, 4.0, 6.0, 5.0, 5.0, 9.0, 15.0, 10.0, 10.0, 23.0, 23.0, 29.0, 31.0, 31.0, 39.0, 46.0, 52.0, 44.0, 66.0, 49.0, 53.0, 41.0, 44.0, 59.0, 35.0, 42.0, 28.0, 27.0, 27.0, 17.0, 20.0, 14.0, 25.0, 12.0, 6.0, 11.0, 9.0, 5.0, 9.0, 7.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.4609375, -0.4478912353515625, -0.434844970703125, -0.4217987060546875, -0.40875244140625, -0.3957061767578125, -0.382659912109375, -0.3696136474609375, -0.3565673828125, -0.3435211181640625, -0.330474853515625, -0.3174285888671875, -0.30438232421875, -0.2913360595703125, -0.278289794921875, -0.2652435302734375, -0.252197265625, -0.2391510009765625, -0.226104736328125, -0.2130584716796875, -0.20001220703125, -0.1869659423828125, -0.173919677734375, -0.1608734130859375, -0.1478271484375, -0.1347808837890625, -0.121734619140625, -0.1086883544921875, -0.09564208984375, -0.0825958251953125, -0.069549560546875, -0.0565032958984375, -0.04345703125, -0.0304107666015625, -0.017364501953125, -0.0043182373046875, 0.00872802734375, 0.0217742919921875, 0.034820556640625, 0.0478668212890625, 0.0609130859375, 0.0739593505859375, 0.087005615234375, 0.1000518798828125, 0.11309814453125, 0.1261444091796875, 0.139190673828125, 0.1522369384765625, 0.165283203125, 0.1783294677734375, 0.191375732421875, 0.2044219970703125, 0.21746826171875, 0.2305145263671875, 0.243560791015625, 0.2566070556640625, 0.2696533203125, 0.2826995849609375, 0.295745849609375, 0.3087921142578125, 0.32183837890625, 0.3348846435546875, 0.347930908203125, 0.3609771728515625, 0.3740234375]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 10.0, 6.0, 5.0, 10.0, 14.0, 13.0, 32.0, 24.0, 13.0, 35.0, 32.0, 22.0, 26.0, 27.0, 45.0, 41.0, 53.0, 32.0, 43.0, 55.0, 43.0, 40.0, 49.0, 43.0, 34.0, 29.0, 36.0, 27.0, 23.0, 25.0, 25.0, 16.0, 17.0, 9.0, 8.0, 13.0, 7.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.107321739196777, -14.661651611328125, -14.215982437133789, -13.770312309265137, -13.324642181396484, -12.878972053527832, -12.43330192565918, -11.987632751464844, -11.541962623596191, -11.096292495727539, -10.650623321533203, -10.20495319366455, -9.759283065795898, -9.313612937927246, -8.867942810058594, -8.422273635864258, -7.9766035079956055, -7.530933380126953, -7.085263729095459, -6.639594078063965, -6.1939239501953125, -5.74825382232666, -5.302584171295166, -4.856914520263672, -4.4112443923950195, -3.9655745029449463, -3.519904613494873, -3.0742347240448, -2.6285648345947266, -2.1828949451446533, -1.73722505569458, -1.2915551662445068, -0.8458852767944336, -0.40021538734436035, 0.04545450210571289, 0.49112439155578613, 0.9367942810058594, 1.3824641704559326, 1.8281340599060059, 2.273803949356079, 2.7194738388061523, 3.1651437282562256, 3.610813617706299, 4.056483268737793, 4.502153396606445, 4.947823524475098, 5.393493175506592, 5.839162826538086, 6.284832954406738, 6.730503082275391, 7.176172733306885, 7.621842384338379, 8.067512512207031, 8.513182640075684, 8.958852767944336, 9.404521942138672, 9.850192070007324, 10.295862197875977, 10.741531372070312, 11.187201499938965, 11.632871627807617, 12.07854175567627, 12.524211883544922, 12.969881057739258, 13.41555118560791]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 8.0, 6.0, 6.0, 7.0, 6.0, 11.0, 18.0, 15.0, 15.0, 10.0, 16.0, 27.0, 20.0, 21.0, 32.0, 23.0, 41.0, 36.0, 42.0, 28.0, 39.0, 48.0, 32.0, 36.0, 37.0, 39.0, 24.0, 37.0, 34.0, 41.0, 28.0, 31.0, 21.0, 32.0, 17.0, 16.0, 18.0, 19.0, 12.0, 8.0, 10.0, 6.0, 5.0, 9.0, 2.0, 5.0, 2.0, 4.0, 4.0, 0.0, 4.0, 0.0, 1.0], "bins": [-14.735434532165527, -14.299111366271973, -13.862788200378418, -13.426465034484863, -12.990141868591309, -12.553818702697754, -12.1174955368042, -11.681172370910645, -11.24484920501709, -10.808526039123535, -10.37220287322998, -9.935879707336426, -9.499556541442871, -9.063233375549316, -8.626910209655762, -8.190587043762207, -7.754263877868652, -7.317940711975098, -6.881617546081543, -6.445294380187988, -6.008971214294434, -5.572648048400879, -5.136324882507324, -4.7000017166137695, -4.263678550720215, -3.82735538482666, -3.3910322189331055, -2.954709053039551, -2.518385887145996, -2.0820627212524414, -1.6457395553588867, -1.209416389465332, -0.7730932235717773, -0.33677005767822266, 0.09955310821533203, 0.5358762741088867, 0.9721994400024414, 1.408522605895996, 1.8448457717895508, 2.2811689376831055, 2.71749210357666, 3.153815269470215, 3.5901384353637695, 4.026461601257324, 4.462784767150879, 4.899107933044434, 5.335431098937988, 5.771754264831543, 6.208077430725098, 6.644400596618652, 7.080723762512207, 7.517046928405762, 7.953370094299316, 8.389693260192871, 8.826016426086426, 9.26233959197998, 9.698662757873535, 10.13498592376709, 10.571309089660645, 11.0076322555542, 11.443955421447754, 11.880278587341309, 12.316601753234863, 12.752924919128418, 13.189248085021973]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 5.0, 8.0, 19.0, 29.0, 37.0, 61.0, 117.0, 167.0, 258.0, 407.0, 617.0, 1092.0, 1642.0, 2493.0, 3833.0, 5758.0, 8343.0, 11899.0, 16830.0, 22943.0, 30347.0, 39371.0, 49002.0, 58827.0, 68143.0, 75995.0, 80996.0, 82823.0, 81408.0, 76320.0, 69221.0, 59819.0, 49689.0, 40177.0, 31087.0, 23533.0, 16906.0, 12465.0, 8593.0, 5859.0, 4034.0, 2647.0, 1677.0, 1103.0, 769.0, 440.0, 276.0, 200.0, 112.0, 65.0, 44.0, 24.0, 18.0, 13.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.0234375, -7.7607421875, -7.498046875, -7.2353515625, -6.97265625, -6.7099609375, -6.447265625, -6.1845703125, -5.921875, -5.6591796875, -5.396484375, -5.1337890625, -4.87109375, -4.6083984375, -4.345703125, -4.0830078125, -3.8203125, -3.5576171875, -3.294921875, -3.0322265625, -2.76953125, -2.5068359375, -2.244140625, -1.9814453125, -1.71875, -1.4560546875, -1.193359375, -0.9306640625, -0.66796875, -0.4052734375, -0.142578125, 0.1201171875, 0.3828125, 0.6455078125, 0.908203125, 1.1708984375, 1.43359375, 1.6962890625, 1.958984375, 2.2216796875, 2.484375, 2.7470703125, 3.009765625, 3.2724609375, 3.53515625, 3.7978515625, 4.060546875, 4.3232421875, 4.5859375, 4.8486328125, 5.111328125, 5.3740234375, 5.63671875, 5.8994140625, 6.162109375, 6.4248046875, 6.6875, 6.9501953125, 7.212890625, 7.4755859375, 7.73828125, 8.0009765625, 8.263671875, 8.5263671875, 8.7890625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 7.0, 5.0, 6.0, 9.0, 5.0, 13.0, 15.0, 16.0, 16.0, 8.0, 19.0, 26.0, 23.0, 19.0, 31.0, 24.0, 40.0, 41.0, 39.0, 27.0, 44.0, 41.0, 35.0, 31.0, 40.0, 36.0, 28.0, 39.0, 34.0, 36.0, 28.0, 31.0, 24.0, 30.0, 17.0, 17.0, 21.0, 13.0, 14.0, 8.0, 9.0, 4.0, 6.0, 10.0, 1.0, 6.0, 2.0, 2.0, 5.0, 1.0, 4.0, 0.0, 1.0], "bins": [-14.2265625, -13.8043212890625, -13.382080078125, -12.9598388671875, -12.53759765625, -12.1153564453125, -11.693115234375, -11.2708740234375, -10.8486328125, -10.4263916015625, -10.004150390625, -9.5819091796875, -9.15966796875, -8.7374267578125, -8.315185546875, -7.8929443359375, -7.470703125, -7.0484619140625, -6.626220703125, -6.2039794921875, -5.78173828125, -5.3594970703125, -4.937255859375, -4.5150146484375, -4.0927734375, -3.6705322265625, -3.248291015625, -2.8260498046875, -2.40380859375, -1.9815673828125, -1.559326171875, -1.1370849609375, -0.71484375, -0.2926025390625, 0.129638671875, 0.5518798828125, 0.97412109375, 1.3963623046875, 1.818603515625, 2.2408447265625, 2.6630859375, 3.0853271484375, 3.507568359375, 3.9298095703125, 4.35205078125, 4.7742919921875, 5.196533203125, 5.6187744140625, 6.041015625, 6.4632568359375, 6.885498046875, 7.3077392578125, 7.72998046875, 8.1522216796875, 8.574462890625, 8.9967041015625, 9.4189453125, 9.8411865234375, 10.263427734375, 10.6856689453125, 11.10791015625, 11.5301513671875, 11.952392578125, 12.3746337890625, 12.796875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 14.0, 16.0, 19.0, 53.0, 74.0, 107.0, 173.0, 276.0, 447.0, 685.0, 1120.0, 1717.0, 2591.0, 4050.0, 5881.0, 8862.0, 12879.0, 17502.0, 24331.0, 32832.0, 42320.0, 52565.0, 63238.0, 73118.0, 80722.0, 85583.0, 85495.0, 82584.0, 75799.0, 66525.0, 56174.0, 45300.0, 35871.0, 26397.0, 19757.0, 14161.0, 9851.0, 6666.0, 4552.0, 2850.0, 1940.0, 1259.0, 840.0, 506.0, 300.0, 229.0, 139.0, 73.0, 38.0, 30.0, 18.0, 15.0, 10.0, 4.0, 2.0, 2.0], "bins": [-9.421875, -9.14599609375, -8.8701171875, -8.59423828125, -8.318359375, -8.04248046875, -7.7666015625, -7.49072265625, -7.21484375, -6.93896484375, -6.6630859375, -6.38720703125, -6.111328125, -5.83544921875, -5.5595703125, -5.28369140625, -5.0078125, -4.73193359375, -4.4560546875, -4.18017578125, -3.904296875, -3.62841796875, -3.3525390625, -3.07666015625, -2.80078125, -2.52490234375, -2.2490234375, -1.97314453125, -1.697265625, -1.42138671875, -1.1455078125, -0.86962890625, -0.59375, -0.31787109375, -0.0419921875, 0.23388671875, 0.509765625, 0.78564453125, 1.0615234375, 1.33740234375, 1.61328125, 1.88916015625, 2.1650390625, 2.44091796875, 2.716796875, 2.99267578125, 3.2685546875, 3.54443359375, 3.8203125, 4.09619140625, 4.3720703125, 4.64794921875, 4.923828125, 5.19970703125, 5.4755859375, 5.75146484375, 6.02734375, 6.30322265625, 6.5791015625, 6.85498046875, 7.130859375, 7.40673828125, 7.6826171875, 7.95849609375, 8.234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 2.0, 6.0, 8.0, 3.0, 5.0, 8.0, 10.0, 12.0, 13.0, 22.0, 18.0, 13.0, 19.0, 16.0, 19.0, 26.0, 30.0, 37.0, 32.0, 40.0, 37.0, 40.0, 32.0, 45.0, 41.0, 38.0, 30.0, 27.0, 38.0, 41.0, 28.0, 21.0, 28.0, 26.0, 31.0, 29.0, 18.0, 16.0, 13.0, 8.0, 15.0, 10.0, 10.0, 10.0, 4.0, 5.0, 5.0, 9.0, 3.0, 3.0, 1.0, 0.0, 5.0, 1.0, 1.0, 2.0], "bins": [-8.78125, -8.5059814453125, -8.230712890625, -7.9554443359375, -7.68017578125, -7.4049072265625, -7.129638671875, -6.8543701171875, -6.5791015625, -6.3038330078125, -6.028564453125, -5.7532958984375, -5.47802734375, -5.2027587890625, -4.927490234375, -4.6522216796875, -4.376953125, -4.1016845703125, -3.826416015625, -3.5511474609375, -3.27587890625, -3.0006103515625, -2.725341796875, -2.4500732421875, -2.1748046875, -1.8995361328125, -1.624267578125, -1.3489990234375, -1.07373046875, -0.7984619140625, -0.523193359375, -0.2479248046875, 0.02734375, 0.3026123046875, 0.577880859375, 0.8531494140625, 1.12841796875, 1.4036865234375, 1.678955078125, 1.9542236328125, 2.2294921875, 2.5047607421875, 2.780029296875, 3.0552978515625, 3.33056640625, 3.6058349609375, 3.881103515625, 4.1563720703125, 4.431640625, 4.7069091796875, 4.982177734375, 5.2574462890625, 5.53271484375, 5.8079833984375, 6.083251953125, 6.3585205078125, 6.6337890625, 6.9090576171875, 7.184326171875, 7.4595947265625, 7.73486328125, 8.0101318359375, 8.285400390625, 8.5606689453125, 8.8359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 7.0, 4.0, 8.0, 15.0, 22.0, 26.0, 36.0, 78.0, 118.0, 194.0, 357.0, 590.0, 947.0, 1530.0, 2666.0, 4620.0, 7813.0, 13266.0, 21062.0, 33146.0, 50152.0, 71311.0, 94147.0, 113610.0, 124790.0, 122699.0, 109077.0, 88364.0, 65476.0, 45633.0, 29822.0, 18851.0, 11402.0, 6815.0, 4098.0, 2435.0, 1373.0, 817.0, 438.0, 292.0, 165.0, 102.0, 80.0, 33.0, 22.0, 17.0, 7.0, 7.0, 11.0, 4.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-5.86328125, -5.6793212890625, -5.495361328125, -5.3114013671875, -5.12744140625, -4.9434814453125, -4.759521484375, -4.5755615234375, -4.3916015625, -4.2076416015625, -4.023681640625, -3.8397216796875, -3.65576171875, -3.4718017578125, -3.287841796875, -3.1038818359375, -2.919921875, -2.7359619140625, -2.552001953125, -2.3680419921875, -2.18408203125, -2.0001220703125, -1.816162109375, -1.6322021484375, -1.4482421875, -1.2642822265625, -1.080322265625, -0.8963623046875, -0.71240234375, -0.5284423828125, -0.344482421875, -0.1605224609375, 0.0234375, 0.2073974609375, 0.391357421875, 0.5753173828125, 0.75927734375, 0.9432373046875, 1.127197265625, 1.3111572265625, 1.4951171875, 1.6790771484375, 1.863037109375, 2.0469970703125, 2.23095703125, 2.4149169921875, 2.598876953125, 2.7828369140625, 2.966796875, 3.1507568359375, 3.334716796875, 3.5186767578125, 3.70263671875, 3.8865966796875, 4.070556640625, 4.2545166015625, 4.4384765625, 4.6224365234375, 4.806396484375, 4.9903564453125, 5.17431640625, 5.3582763671875, 5.542236328125, 5.7261962890625, 5.91015625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 4.0, 5.0, 6.0, 7.0, 12.0, 16.0, 34.0, 24.0, 23.0, 30.0, 35.0, 29.0, 25.0, 36.0, 47.0, 42.0, 35.0, 52.0, 49.0, 44.0, 46.0, 43.0, 51.0, 50.0, 35.0, 28.0, 24.0, 29.0, 18.0, 16.0, 17.0, 12.0, 12.0, 7.0, 6.0, 5.0, 4.0, 12.0, 5.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0007319450378417969, -0.0007120594382286072, -0.0006921738386154175, -0.0006722882390022278, -0.0006524026393890381, -0.0006325170397758484, -0.0006126314401626587, -0.000592745840549469, -0.0005728602409362793, -0.0005529746413230896, -0.0005330890417098999, -0.0005132034420967102, -0.0004933178424835205, -0.0004734322428703308, -0.0004535466432571411, -0.0004336610436439514, -0.0004137754440307617, -0.000393889844417572, -0.0003740042448043823, -0.0003541186451911926, -0.00033423304557800293, -0.00031434744596481323, -0.00029446184635162354, -0.00027457624673843384, -0.00025469064712524414, -0.00023480504751205444, -0.00021491944789886475, -0.00019503384828567505, -0.00017514824867248535, -0.00015526264905929565, -0.00013537704944610596, -0.00011549144983291626, -9.560585021972656e-05, -7.572025060653687e-05, -5.583465099334717e-05, -3.594905138015747e-05, -1.6063451766967773e-05, 3.822147846221924e-06, 2.370774745941162e-05, 4.359334707260132e-05, 6.347894668579102e-05, 8.336454629898071e-05, 0.00010325014591217041, 0.0001231357455253601, 0.0001430213451385498, 0.0001629069447517395, 0.0001827925443649292, 0.0002026781439781189, 0.0002225637435913086, 0.0002424493432044983, 0.000262334942817688, 0.0002822205424308777, 0.0003021061420440674, 0.0003219917416572571, 0.0003418773412704468, 0.0003617629408836365, 0.00038164854049682617, 0.00040153414011001587, 0.00042141973972320557, 0.00044130533933639526, 0.00046119093894958496, 0.00048107653856277466, 0.0005009621381759644, 0.000520847737789154, 0.0005407333374023438]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 5.0, 6.0, 10.0, 9.0, 15.0, 36.0, 46.0, 67.0, 139.0, 190.0, 279.0, 462.0, 774.0, 1268.0, 2224.0, 3698.0, 6224.0, 10457.0, 17360.0, 28400.0, 44084.0, 66103.0, 92241.0, 116281.0, 132643.0, 132311.0, 117156.0, 92764.0, 66346.0, 45050.0, 28429.0, 17421.0, 10578.0, 6177.0, 3780.0, 2196.0, 1301.0, 788.0, 433.0, 292.0, 182.0, 114.0, 84.0, 47.0, 34.0, 24.0, 13.0, 12.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2578125, -7.03106689453125, -6.8043212890625, -6.57757568359375, -6.350830078125, -6.12408447265625, -5.8973388671875, -5.67059326171875, -5.44384765625, -5.21710205078125, -4.9903564453125, -4.76361083984375, -4.536865234375, -4.31011962890625, -4.0833740234375, -3.85662841796875, -3.6298828125, -3.40313720703125, -3.1763916015625, -2.94964599609375, -2.722900390625, -2.49615478515625, -2.2694091796875, -2.04266357421875, -1.81591796875, -1.58917236328125, -1.3624267578125, -1.13568115234375, -0.908935546875, -0.68218994140625, -0.4554443359375, -0.22869873046875, -0.001953125, 0.22479248046875, 0.4515380859375, 0.67828369140625, 0.905029296875, 1.13177490234375, 1.3585205078125, 1.58526611328125, 1.81201171875, 2.03875732421875, 2.2655029296875, 2.49224853515625, 2.718994140625, 2.94573974609375, 3.1724853515625, 3.39923095703125, 3.6259765625, 3.85272216796875, 4.0794677734375, 4.30621337890625, 4.532958984375, 4.75970458984375, 4.9864501953125, 5.21319580078125, 5.43994140625, 5.66668701171875, 5.8934326171875, 6.12017822265625, 6.346923828125, 6.57366943359375, 6.8004150390625, 7.02716064453125, 7.25390625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 2.0, 7.0, 9.0, 6.0, 7.0, 14.0, 16.0, 13.0, 26.0, 31.0, 26.0, 33.0, 36.0, 22.0, 46.0, 39.0, 59.0, 39.0, 64.0, 46.0, 56.0, 48.0, 32.0, 37.0, 41.0, 33.0, 24.0, 20.0, 20.0, 30.0, 21.0, 18.0, 11.0, 15.0, 5.0, 6.0, 7.0, 7.0, 1.0, 8.0, 8.0, 4.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3359375, -2.249359130859375, -2.16278076171875, -2.076202392578125, -1.9896240234375, -1.903045654296875, -1.81646728515625, -1.729888916015625, -1.643310546875, -1.556732177734375, -1.47015380859375, -1.383575439453125, -1.2969970703125, -1.210418701171875, -1.12384033203125, -1.037261962890625, -0.95068359375, -0.864105224609375, -0.77752685546875, -0.690948486328125, -0.6043701171875, -0.517791748046875, -0.43121337890625, -0.344635009765625, -0.258056640625, -0.171478271484375, -0.08489990234375, 0.001678466796875, 0.0882568359375, 0.174835205078125, 0.26141357421875, 0.347991943359375, 0.4345703125, 0.521148681640625, 0.60772705078125, 0.694305419921875, 0.7808837890625, 0.867462158203125, 0.95404052734375, 1.040618896484375, 1.127197265625, 1.213775634765625, 1.30035400390625, 1.386932373046875, 1.4735107421875, 1.560089111328125, 1.64666748046875, 1.733245849609375, 1.81982421875, 1.906402587890625, 1.99298095703125, 2.079559326171875, 2.1661376953125, 2.252716064453125, 2.33929443359375, 2.425872802734375, 2.512451171875, 2.599029541015625, 2.68560791015625, 2.772186279296875, 2.8587646484375, 2.945343017578125, 3.03192138671875, 3.118499755859375, 3.205078125]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 8.0, 3.0, 3.0, 4.0, 8.0, 6.0, 12.0, 11.0, 19.0, 14.0, 26.0, 19.0, 18.0, 21.0, 34.0, 27.0, 36.0, 38.0, 52.0, 28.0, 48.0, 38.0, 37.0, 42.0, 59.0, 41.0, 22.0, 30.0, 23.0, 42.0, 33.0, 33.0, 23.0, 26.0, 21.0, 17.0, 17.0, 8.0, 10.0, 4.0, 14.0, 4.0, 9.0, 3.0, 6.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-13.258090019226074, -12.842058181762695, -12.426026344299316, -12.009994506835938, -11.593961715698242, -11.17793083190918, -10.761898040771484, -10.345866203308105, -9.929834365844727, -9.513802528381348, -9.097770690917969, -8.68173885345459, -8.265707015991211, -7.849674701690674, -7.433642387390137, -7.017610549926758, -6.601578712463379, -6.185546875, -5.769515037536621, -5.353482723236084, -4.937450885772705, -4.521419048309326, -4.105386734008789, -3.68935489654541, -3.2733230590820312, -2.8572912216186523, -2.4412591457366943, -2.0252270698547363, -1.6091952323913574, -1.1931633949279785, -0.7771313190460205, -0.3610992431640625, 0.05493354797363281, 0.47096550464630127, 0.8869974613189697, 1.3030294179916382, 1.7190613746643066, 2.1350932121276855, 2.5511252880096436, 2.9671573638916016, 3.3831892013549805, 3.7992210388183594, 4.215252876281738, 4.631285190582275, 5.047317028045654, 5.463348865509033, 5.87938117980957, 6.295413017272949, 6.711444854736328, 7.127476692199707, 7.543508529663086, 7.959540843963623, 8.375572204589844, 8.791604995727539, 9.207636833190918, 9.623668670654297, 10.039700508117676, 10.455732345581055, 10.871764183044434, 11.287796020507812, 11.703828811645508, 12.11985969543457, 12.535892486572266, 12.951924324035645, 13.367956161499023]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 2.0, 5.0, 7.0, 14.0, 10.0, 9.0, 7.0, 16.0, 19.0, 20.0, 23.0, 32.0, 29.0, 34.0, 39.0, 34.0, 35.0, 41.0, 40.0, 48.0, 36.0, 40.0, 41.0, 42.0, 44.0, 30.0, 33.0, 32.0, 32.0, 20.0, 28.0, 34.0, 19.0, 14.0, 18.0, 14.0, 9.0, 11.0, 8.0, 12.0, 8.0, 5.0, 3.0, 2.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.291322708129883, -16.76630401611328, -16.24128532409668, -15.716267585754395, -15.19124984741211, -14.666231155395508, -14.141212463378906, -13.616193771362305, -13.09117603302002, -12.566157341003418, -12.041139602661133, -11.516120910644531, -10.99110221862793, -10.466084480285645, -9.941065788269043, -9.416048049926758, -8.891029357910156, -8.366010665893555, -7.8409929275512695, -7.315974235534668, -6.790956020355225, -6.265937805175781, -5.74091911315918, -5.215900897979736, -4.690882682800293, -4.16586446762085, -3.640846014022827, -3.1158275604248047, -2.5908093452453613, -2.065791130065918, -1.5407726764678955, -1.015754222869873, -0.4907341003417969, 0.034284234046936035, 0.559302568435669, 1.0843209028244019, 1.6093392372131348, 2.134357452392578, 2.6593759059906006, 3.184394359588623, 3.7094125747680664, 4.23443078994751, 4.759449005126953, 5.284467697143555, 5.809485912322998, 6.334504127502441, 6.859522819519043, 7.384541034698486, 7.90955924987793, 8.434577941894531, 8.959595680236816, 9.484614372253418, 10.009632110595703, 10.534650802612305, 11.059669494628906, 11.584688186645508, 12.109705924987793, 12.634724617004395, 13.15974235534668, 13.684761047363281, 14.209779739379883, 14.734797477722168, 15.25981616973877, 15.784833908081055, 16.309852600097656]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 9.0, 13.0, 16.0, 31.0, 51.0, 80.0, 152.0, 276.0, 433.0, 752.0, 1155.0, 2019.0, 3200.0, 5238.0, 8559.0, 13725.0, 21975.0, 34273.0, 52779.0, 79661.0, 115385.0, 163294.0, 221825.0, 286427.0, 346657.0, 396866.0, 420381.0, 414759.0, 380040.0, 324291.0, 261537.0, 199834.0, 144823.0, 101632.0, 69022.0, 45499.0, 29265.0, 18749.0, 11620.0, 6982.0, 4385.0, 2683.0, 1605.0, 939.0, 609.0, 349.0, 193.0, 107.0, 77.0, 27.0, 13.0, 7.0, 9.0, 3.0, 2.0, 0.0, 3.0], "bins": [-11.703125, -11.3570556640625, -11.010986328125, -10.6649169921875, -10.31884765625, -9.9727783203125, -9.626708984375, -9.2806396484375, -8.9345703125, -8.5885009765625, -8.242431640625, -7.8963623046875, -7.55029296875, -7.2042236328125, -6.858154296875, -6.5120849609375, -6.166015625, -5.8199462890625, -5.473876953125, -5.1278076171875, -4.78173828125, -4.4356689453125, -4.089599609375, -3.7435302734375, -3.3974609375, -3.0513916015625, -2.705322265625, -2.3592529296875, -2.01318359375, -1.6671142578125, -1.321044921875, -0.9749755859375, -0.62890625, -0.2828369140625, 0.063232421875, 0.4093017578125, 0.75537109375, 1.1014404296875, 1.447509765625, 1.7935791015625, 2.1396484375, 2.4857177734375, 2.831787109375, 3.1778564453125, 3.52392578125, 3.8699951171875, 4.216064453125, 4.5621337890625, 4.908203125, 5.2542724609375, 5.600341796875, 5.9464111328125, 6.29248046875, 6.6385498046875, 6.984619140625, 7.3306884765625, 7.6767578125, 8.0228271484375, 8.368896484375, 8.7149658203125, 9.06103515625, 9.4071044921875, 9.753173828125, 10.0992431640625, 10.4453125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 1.0, 4.0, 5.0, 13.0, 10.0, 12.0, 9.0, 14.0, 17.0, 18.0, 26.0, 20.0, 33.0, 37.0, 36.0, 35.0, 41.0, 40.0, 36.0, 44.0, 37.0, 40.0, 40.0, 44.0, 43.0, 34.0, 29.0, 36.0, 28.0, 25.0, 29.0, 28.0, 25.0, 13.0, 21.0, 14.0, 9.0, 14.0, 9.0, 8.0, 11.0, 2.0, 6.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.640625, -16.1405029296875, -15.640380859375, -15.1402587890625, -14.64013671875, -14.1400146484375, -13.639892578125, -13.1397705078125, -12.6396484375, -12.1395263671875, -11.639404296875, -11.1392822265625, -10.63916015625, -10.1390380859375, -9.638916015625, -9.1387939453125, -8.638671875, -8.1385498046875, -7.638427734375, -7.1383056640625, -6.63818359375, -6.1380615234375, -5.637939453125, -5.1378173828125, -4.6376953125, -4.1375732421875, -3.637451171875, -3.1373291015625, -2.63720703125, -2.1370849609375, -1.636962890625, -1.1368408203125, -0.63671875, -0.1365966796875, 0.363525390625, 0.8636474609375, 1.36376953125, 1.8638916015625, 2.364013671875, 2.8641357421875, 3.3642578125, 3.8643798828125, 4.364501953125, 4.8646240234375, 5.36474609375, 5.8648681640625, 6.364990234375, 6.8651123046875, 7.365234375, 7.8653564453125, 8.365478515625, 8.8656005859375, 9.36572265625, 9.8658447265625, 10.365966796875, 10.8660888671875, 11.3662109375, 11.8663330078125, 12.366455078125, 12.8665771484375, 13.36669921875, 13.8668212890625, 14.366943359375, 14.8670654296875, 15.3671875]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 7.0, 7.0, 14.0, 25.0, 34.0, 53.0, 121.0, 191.0, 353.0, 655.0, 1203.0, 2167.0, 3832.0, 6636.0, 11559.0, 19142.0, 31728.0, 49772.0, 78039.0, 114268.0, 164527.0, 224435.0, 288965.0, 350191.0, 397964.0, 423063.0, 418344.0, 383523.0, 329341.0, 268393.0, 202582.0, 146636.0, 101859.0, 66578.0, 43006.0, 26696.0, 16006.0, 9711.0, 5518.0, 3104.0, 1828.0, 976.0, 576.0, 303.0, 162.0, 93.0, 48.0, 33.0, 16.0, 6.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4453125, -11.0616455078125, -10.677978515625, -10.2943115234375, -9.91064453125, -9.5269775390625, -9.143310546875, -8.7596435546875, -8.3759765625, -7.9923095703125, -7.608642578125, -7.2249755859375, -6.84130859375, -6.4576416015625, -6.073974609375, -5.6903076171875, -5.306640625, -4.9229736328125, -4.539306640625, -4.1556396484375, -3.77197265625, -3.3883056640625, -3.004638671875, -2.6209716796875, -2.2373046875, -1.8536376953125, -1.469970703125, -1.0863037109375, -0.70263671875, -0.3189697265625, 0.064697265625, 0.4483642578125, 0.83203125, 1.2156982421875, 1.599365234375, 1.9830322265625, 2.36669921875, 2.7503662109375, 3.134033203125, 3.5177001953125, 3.9013671875, 4.2850341796875, 4.668701171875, 5.0523681640625, 5.43603515625, 5.8197021484375, 6.203369140625, 6.5870361328125, 6.970703125, 7.3543701171875, 7.738037109375, 8.1217041015625, 8.50537109375, 8.8890380859375, 9.272705078125, 9.6563720703125, 10.0400390625, 10.4237060546875, 10.807373046875, 11.1910400390625, 11.57470703125, 11.9583740234375, 12.342041015625, 12.7257080078125, 13.109375]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 16.0, 15.0, 22.0, 27.0, 35.0, 34.0, 43.0, 61.0, 80.0, 76.0, 90.0, 100.0, 110.0, 162.0, 156.0, 133.0, 184.0, 193.0, 195.0, 190.0, 190.0, 213.0, 191.0, 201.0, 147.0, 175.0, 152.0, 126.0, 131.0, 124.0, 89.0, 72.0, 68.0, 52.0, 53.0, 29.0, 35.0, 29.0, 20.0, 16.0, 9.0, 7.0, 6.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.625, -6.41522216796875, -6.2054443359375, -5.99566650390625, -5.785888671875, -5.57611083984375, -5.3663330078125, -5.15655517578125, -4.94677734375, -4.73699951171875, -4.5272216796875, -4.31744384765625, -4.107666015625, -3.89788818359375, -3.6881103515625, -3.47833251953125, -3.2685546875, -3.05877685546875, -2.8489990234375, -2.63922119140625, -2.429443359375, -2.21966552734375, -2.0098876953125, -1.80010986328125, -1.59033203125, -1.38055419921875, -1.1707763671875, -0.96099853515625, -0.751220703125, -0.54144287109375, -0.3316650390625, -0.12188720703125, 0.087890625, 0.29766845703125, 0.5074462890625, 0.71722412109375, 0.927001953125, 1.13677978515625, 1.3465576171875, 1.55633544921875, 1.76611328125, 1.97589111328125, 2.1856689453125, 2.39544677734375, 2.605224609375, 2.81500244140625, 3.0247802734375, 3.23455810546875, 3.4443359375, 3.65411376953125, 3.8638916015625, 4.07366943359375, 4.283447265625, 4.49322509765625, 4.7030029296875, 4.91278076171875, 5.12255859375, 5.33233642578125, 5.5421142578125, 5.75189208984375, 5.961669921875, 6.17144775390625, 6.3812255859375, 6.59100341796875, 6.80078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 6.0, 5.0, 6.0, 8.0, 10.0, 12.0, 10.0, 13.0, 10.0, 18.0, 24.0, 35.0, 29.0, 31.0, 30.0, 32.0, 35.0, 32.0, 42.0, 47.0, 33.0, 39.0, 42.0, 49.0, 42.0, 33.0, 37.0, 36.0, 27.0, 40.0, 22.0, 21.0, 25.0, 15.0, 19.0, 15.0, 13.0, 15.0, 9.0, 7.0, 7.0, 4.0, 2.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.516847610473633, -13.0610933303833, -12.605339050292969, -12.149584770202637, -11.693830490112305, -11.238077163696289, -10.782322883605957, -10.326568603515625, -9.870814323425293, -9.415060043334961, -8.959305763244629, -8.503551483154297, -8.047798156738281, -7.592043399810791, -7.136289596557617, -6.680535316467285, -6.224781036376953, -5.769026756286621, -5.313272476196289, -4.857518672943115, -4.401764392852783, -3.946010112762451, -3.4902560710906982, -3.0345020294189453, -2.5787477493286133, -2.1229934692382812, -1.6672394275665283, -1.2114852666854858, -0.7557311058044434, -0.29997682571411133, 0.1557772159576416, 0.6115312576293945, 1.0672845840454102, 1.5230387449264526, 1.9787929058074951, 2.434546947479248, 2.89030122756958, 3.346055507659912, 3.801809549331665, 4.257563591003418, 4.71331787109375, 5.169072151184082, 5.624826431274414, 6.080580234527588, 6.53633451461792, 6.992088794708252, 7.447842597961426, 7.903596878051758, 8.35935115814209, 8.815105438232422, 9.270859718322754, 9.726613998413086, 10.182367324829102, 10.63812255859375, 11.093875885009766, 11.549630165100098, 12.00538444519043, 12.461138725280762, 12.916893005371094, 13.372647285461426, 13.828401565551758, 14.284154891967773, 14.739909172058105, 15.195663452148438, 15.65141773223877]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 4.0, 2.0, 7.0, 3.0, 8.0, 13.0, 7.0, 13.0, 11.0, 15.0, 9.0, 17.0, 18.0, 23.0, 23.0, 32.0, 24.0, 36.0, 33.0, 28.0, 27.0, 36.0, 33.0, 45.0, 32.0, 37.0, 36.0, 33.0, 41.0, 33.0, 34.0, 39.0, 33.0, 18.0, 29.0, 25.0, 26.0, 19.0, 14.0, 17.0, 9.0, 14.0, 12.0, 8.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-16.059412002563477, -15.555341720581055, -15.051271438598633, -14.547201156616211, -14.043130874633789, -13.539060592651367, -13.034990310668945, -12.530920028686523, -12.026849746704102, -11.52277946472168, -11.018709182739258, -10.514638900756836, -10.010568618774414, -9.506498336791992, -9.00242805480957, -8.498357772827148, -7.99428653717041, -7.490216255187988, -6.986145973205566, -6.4820756912231445, -5.978005409240723, -5.473935127258301, -4.969864368438721, -4.465794086456299, -3.961723804473877, -3.457653522491455, -2.953583240509033, -2.4495127201080322, -1.9454424381256104, -1.4413721561431885, -0.9373016357421875, -0.4332313537597656, 0.07083892822265625, 0.5749092698097229, 1.0789796113967896, 1.583050012588501, 2.087120294570923, 2.5911905765533447, 3.0952610969543457, 3.5993313789367676, 4.1034016609191895, 4.607471942901611, 5.111542224884033, 5.615612983703613, 6.119683265686035, 6.623753547668457, 7.127823829650879, 7.631894111633301, 8.135964393615723, 8.640034675598145, 9.144104957580566, 9.648175239562988, 10.15224552154541, 10.656315803527832, 11.16038703918457, 11.664457321166992, 12.168527603149414, 12.672597885131836, 13.176668167114258, 13.68073844909668, 14.184808731079102, 14.688879013061523, 15.192949295043945, 15.697019577026367, 16.20108985900879]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 9.0, 8.0, 15.0, 15.0, 33.0, 37.0, 58.0, 80.0, 100.0, 154.0, 224.0, 282.0, 488.0, 748.0, 1088.0, 1733.0, 2764.0, 4532.0, 7364.0, 12160.0, 21267.0, 37250.0, 66425.0, 113794.0, 176085.0, 203993.0, 160643.0, 100624.0, 57446.0, 32476.0, 18446.0, 10736.0, 6435.0, 3870.0, 2524.0, 1560.0, 990.0, 655.0, 480.0, 294.0, 205.0, 131.0, 109.0, 72.0, 46.0, 44.0, 29.0, 13.0, 12.0, 5.0, 4.0, 3.0, 5.0, 1.0, 2.0, 2.0], "bins": [-3.669921875, -3.559967041015625, -3.45001220703125, -3.340057373046875, -3.2301025390625, -3.120147705078125, -3.01019287109375, -2.900238037109375, -2.790283203125, -2.680328369140625, -2.57037353515625, -2.460418701171875, -2.3504638671875, -2.240509033203125, -2.13055419921875, -2.020599365234375, -1.91064453125, -1.800689697265625, -1.69073486328125, -1.580780029296875, -1.4708251953125, -1.360870361328125, -1.25091552734375, -1.140960693359375, -1.031005859375, -0.921051025390625, -0.81109619140625, -0.701141357421875, -0.5911865234375, -0.481231689453125, -0.37127685546875, -0.261322021484375, -0.1513671875, -0.041412353515625, 0.06854248046875, 0.178497314453125, 0.2884521484375, 0.398406982421875, 0.50836181640625, 0.618316650390625, 0.728271484375, 0.838226318359375, 0.94818115234375, 1.058135986328125, 1.1680908203125, 1.278045654296875, 1.38800048828125, 1.497955322265625, 1.60791015625, 1.717864990234375, 1.82781982421875, 1.937774658203125, 2.0477294921875, 2.157684326171875, 2.26763916015625, 2.377593994140625, 2.487548828125, 2.597503662109375, 2.70745849609375, 2.817413330078125, 2.9273681640625, 3.037322998046875, 3.14727783203125, 3.257232666015625, 3.3671875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 5.0, 1.0, 7.0, 3.0, 8.0, 13.0, 7.0, 13.0, 10.0, 16.0, 9.0, 18.0, 17.0, 22.0, 24.0, 32.0, 25.0, 38.0, 31.0, 30.0, 24.0, 36.0, 35.0, 43.0, 31.0, 37.0, 39.0, 31.0, 40.0, 38.0, 31.0, 41.0, 31.0, 18.0, 29.0, 24.0, 26.0, 19.0, 15.0, 16.0, 10.0, 13.0, 12.0, 7.0, 8.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-16.078125, -15.572509765625, -15.06689453125, -14.561279296875, -14.0556640625, -13.550048828125, -13.04443359375, -12.538818359375, -12.033203125, -11.527587890625, -11.02197265625, -10.516357421875, -10.0107421875, -9.505126953125, -8.99951171875, -8.493896484375, -7.98828125, -7.482666015625, -6.97705078125, -6.471435546875, -5.9658203125, -5.460205078125, -4.95458984375, -4.448974609375, -3.943359375, -3.437744140625, -2.93212890625, -2.426513671875, -1.9208984375, -1.415283203125, -0.90966796875, -0.404052734375, 0.1015625, 0.607177734375, 1.11279296875, 1.618408203125, 2.1240234375, 2.629638671875, 3.13525390625, 3.640869140625, 4.146484375, 4.652099609375, 5.15771484375, 5.663330078125, 6.1689453125, 6.674560546875, 7.18017578125, 7.685791015625, 8.19140625, 8.697021484375, 9.20263671875, 9.708251953125, 10.2138671875, 10.719482421875, 11.22509765625, 11.730712890625, 12.236328125, 12.741943359375, 13.24755859375, 13.753173828125, 14.2587890625, 14.764404296875, 15.27001953125, 15.775634765625, 16.28125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 9.0, 6.0, 14.0, 15.0, 23.0, 25.0, 45.0, 53.0, 75.0, 124.0, 161.0, 247.0, 381.0, 687.0, 901.0, 1527.0, 2620.0, 4680.0, 8401.0, 15799.0, 33677.0, 74048.0, 169845.0, 303917.0, 232557.0, 105170.0, 46619.0, 21855.0, 10915.0, 5788.0, 3292.0, 1906.0, 1108.0, 696.0, 458.0, 260.0, 178.0, 161.0, 102.0, 66.0, 47.0, 34.0, 23.0, 15.0, 16.0, 4.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.68359375, -4.535888671875, -4.38818359375, -4.240478515625, -4.0927734375, -3.945068359375, -3.79736328125, -3.649658203125, -3.501953125, -3.354248046875, -3.20654296875, -3.058837890625, -2.9111328125, -2.763427734375, -2.61572265625, -2.468017578125, -2.3203125, -2.172607421875, -2.02490234375, -1.877197265625, -1.7294921875, -1.581787109375, -1.43408203125, -1.286376953125, -1.138671875, -0.990966796875, -0.84326171875, -0.695556640625, -0.5478515625, -0.400146484375, -0.25244140625, -0.104736328125, 0.04296875, 0.190673828125, 0.33837890625, 0.486083984375, 0.6337890625, 0.781494140625, 0.92919921875, 1.076904296875, 1.224609375, 1.372314453125, 1.52001953125, 1.667724609375, 1.8154296875, 1.963134765625, 2.11083984375, 2.258544921875, 2.40625, 2.553955078125, 2.70166015625, 2.849365234375, 2.9970703125, 3.144775390625, 3.29248046875, 3.440185546875, 3.587890625, 3.735595703125, 3.88330078125, 4.031005859375, 4.1787109375, 4.326416015625, 4.47412109375, 4.621826171875, 4.76953125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 4.0, 4.0, 6.0, 1.0, 5.0, 6.0, 14.0, 9.0, 14.0, 19.0, 23.0, 20.0, 25.0, 25.0, 15.0, 36.0, 32.0, 38.0, 33.0, 42.0, 43.0, 37.0, 31.0, 50.0, 46.0, 38.0, 59.0, 37.0, 38.0, 28.0, 28.0, 28.0, 19.0, 18.0, 19.0, 23.0, 21.0, 8.0, 11.0, 15.0, 12.0, 7.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.8828125, -10.5333251953125, -10.183837890625, -9.8343505859375, -9.48486328125, -9.1353759765625, -8.785888671875, -8.4364013671875, -8.0869140625, -7.7374267578125, -7.387939453125, -7.0384521484375, -6.68896484375, -6.3394775390625, -5.989990234375, -5.6405029296875, -5.291015625, -4.9415283203125, -4.592041015625, -4.2425537109375, -3.89306640625, -3.5435791015625, -3.194091796875, -2.8446044921875, -2.4951171875, -2.1456298828125, -1.796142578125, -1.4466552734375, -1.09716796875, -0.7476806640625, -0.398193359375, -0.0487060546875, 0.30078125, 0.6502685546875, 0.999755859375, 1.3492431640625, 1.69873046875, 2.0482177734375, 2.397705078125, 2.7471923828125, 3.0966796875, 3.4461669921875, 3.795654296875, 4.1451416015625, 4.49462890625, 4.8441162109375, 5.193603515625, 5.5430908203125, 5.892578125, 6.2420654296875, 6.591552734375, 6.9410400390625, 7.29052734375, 7.6400146484375, 7.989501953125, 8.3389892578125, 8.6884765625, 9.0379638671875, 9.387451171875, 9.7369384765625, 10.08642578125, 10.4359130859375, 10.785400390625, 11.1348876953125, 11.484375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 7.0, 3.0, 5.0, 15.0, 17.0, 17.0, 31.0, 41.0, 86.0, 96.0, 154.0, 202.0, 289.0, 494.0, 665.0, 1122.0, 1645.0, 2625.0, 4492.0, 8051.0, 14747.0, 30062.0, 68083.0, 173504.0, 333660.0, 234452.0, 92744.0, 38989.0, 18578.0, 9717.0, 5375.0, 3116.0, 1929.0, 1198.0, 767.0, 497.0, 347.0, 242.0, 171.0, 109.0, 60.0, 45.0, 29.0, 32.0, 19.0, 11.0, 5.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1220703125, -1.0887451171875, -1.055419921875, -1.0220947265625, -0.98876953125, -0.9554443359375, -0.922119140625, -0.8887939453125, -0.85546875, -0.8221435546875, -0.788818359375, -0.7554931640625, -0.72216796875, -0.6888427734375, -0.655517578125, -0.6221923828125, -0.5888671875, -0.5555419921875, -0.522216796875, -0.4888916015625, -0.45556640625, -0.4222412109375, -0.388916015625, -0.3555908203125, -0.322265625, -0.2889404296875, -0.255615234375, -0.2222900390625, -0.18896484375, -0.1556396484375, -0.122314453125, -0.0889892578125, -0.0556640625, -0.0223388671875, 0.010986328125, 0.0443115234375, 0.07763671875, 0.1109619140625, 0.144287109375, 0.1776123046875, 0.2109375, 0.2442626953125, 0.277587890625, 0.3109130859375, 0.34423828125, 0.3775634765625, 0.410888671875, 0.4442138671875, 0.4775390625, 0.5108642578125, 0.544189453125, 0.5775146484375, 0.61083984375, 0.6441650390625, 0.677490234375, 0.7108154296875, 0.744140625, 0.7774658203125, 0.810791015625, 0.8441162109375, 0.87744140625, 0.9107666015625, 0.944091796875, 0.9774169921875, 1.0107421875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 5.0, 3.0, 0.0, 6.0, 1.0, 8.0, 4.0, 10.0, 10.0, 12.0, 14.0, 15.0, 29.0, 20.0, 24.0, 28.0, 24.0, 34.0, 48.0, 47.0, 42.0, 46.0, 59.0, 61.0, 62.0, 54.0, 51.0, 39.0, 34.0, 40.0, 26.0, 24.0, 30.0, 24.0, 15.0, 7.0, 11.0, 11.0, 7.0, 3.0, 7.0, 2.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.1552734375e-05, -8.82614403963089e-05, -8.49701464176178e-05, -8.16788524389267e-05, -7.83875584602356e-05, -7.50962644815445e-05, -7.18049705028534e-05, -6.851367652416229e-05, -6.522238254547119e-05, -6.193108856678009e-05, -5.863979458808899e-05, -5.534850060939789e-05, -5.205720663070679e-05, -4.8765912652015686e-05, -4.5474618673324585e-05, -4.2183324694633484e-05, -3.889203071594238e-05, -3.560073673725128e-05, -3.230944275856018e-05, -2.901814877986908e-05, -2.572685480117798e-05, -2.2435560822486877e-05, -1.9144266843795776e-05, -1.5852972865104675e-05, -1.2561678886413574e-05, -9.270384907722473e-06, -5.979090929031372e-06, -2.687796950340271e-06, 6.034970283508301e-07, 3.894791007041931e-06, 7.186084985733032e-06, 1.0477378964424133e-05, 1.3768672943115234e-05, 1.7059966921806335e-05, 2.0351260900497437e-05, 2.3642554879188538e-05, 2.693384885787964e-05, 3.022514283657074e-05, 3.351643681526184e-05, 3.680773079395294e-05, 4.009902477264404e-05, 4.3390318751335144e-05, 4.6681612730026245e-05, 4.9972906708717346e-05, 5.326420068740845e-05, 5.655549466609955e-05, 5.984678864479065e-05, 6.313808262348175e-05, 6.642937660217285e-05, 6.972067058086395e-05, 7.301196455955505e-05, 7.630325853824615e-05, 7.959455251693726e-05, 8.288584649562836e-05, 8.617714047431946e-05, 8.946843445301056e-05, 9.275972843170166e-05, 9.605102241039276e-05, 9.934231638908386e-05, 0.00010263361036777496, 0.00010592490434646606, 0.00010921619832515717, 0.00011250749230384827, 0.00011579878628253937, 0.00011909008026123047]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 7.0, 9.0, 9.0, 23.0, 28.0, 42.0, 56.0, 77.0, 101.0, 188.0, 294.0, 407.0, 609.0, 951.0, 1442.0, 2268.0, 3806.0, 6017.0, 10064.0, 16835.0, 28640.0, 49983.0, 84118.0, 133158.0, 179578.0, 181333.0, 136376.0, 86528.0, 51275.0, 29832.0, 17479.0, 10358.0, 6057.0, 3864.0, 2360.0, 1572.0, 916.0, 629.0, 400.0, 276.0, 197.0, 152.0, 80.0, 49.0, 42.0, 31.0, 15.0, 9.0, 8.0, 7.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1044921875, -1.07000732421875, -1.0355224609375, -1.00103759765625, -0.966552734375, -0.93206787109375, -0.8975830078125, -0.86309814453125, -0.82861328125, -0.79412841796875, -0.7596435546875, -0.72515869140625, -0.690673828125, -0.65618896484375, -0.6217041015625, -0.58721923828125, -0.552734375, -0.51824951171875, -0.4837646484375, -0.44927978515625, -0.414794921875, -0.38031005859375, -0.3458251953125, -0.31134033203125, -0.27685546875, -0.24237060546875, -0.2078857421875, -0.17340087890625, -0.138916015625, -0.10443115234375, -0.0699462890625, -0.03546142578125, -0.0009765625, 0.03350830078125, 0.0679931640625, 0.10247802734375, 0.136962890625, 0.17144775390625, 0.2059326171875, 0.24041748046875, 0.27490234375, 0.30938720703125, 0.3438720703125, 0.37835693359375, 0.412841796875, 0.44732666015625, 0.4818115234375, 0.51629638671875, 0.55078125, 0.58526611328125, 0.6197509765625, 0.65423583984375, 0.688720703125, 0.72320556640625, 0.7576904296875, 0.79217529296875, 0.82666015625, 0.86114501953125, 0.8956298828125, 0.93011474609375, 0.964599609375, 0.99908447265625, 1.0335693359375, 1.06805419921875, 1.1025390625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 3.0, 7.0, 0.0, 3.0, 4.0, 15.0, 10.0, 7.0, 19.0, 17.0, 22.0, 25.0, 33.0, 30.0, 24.0, 40.0, 35.0, 44.0, 35.0, 46.0, 41.0, 60.0, 48.0, 56.0, 40.0, 30.0, 33.0, 34.0, 34.0, 33.0, 23.0, 25.0, 23.0, 21.0, 16.0, 10.0, 8.0, 8.0, 5.0, 5.0, 10.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 5.0], "bins": [-0.3828125, -0.3716697692871094, -0.36052703857421875, -0.3493843078613281, -0.3382415771484375, -0.3270988464355469, -0.31595611572265625, -0.3048133850097656, -0.293670654296875, -0.2825279235839844, -0.27138519287109375, -0.2602424621582031, -0.2490997314453125, -0.23795700073242188, -0.22681427001953125, -0.21567153930664062, -0.20452880859375, -0.19338607788085938, -0.18224334716796875, -0.17110061645507812, -0.1599578857421875, -0.14881515502929688, -0.13767242431640625, -0.12652969360351562, -0.115386962890625, -0.10424423217773438, -0.09310150146484375, -0.08195877075195312, -0.0708160400390625, -0.059673309326171875, -0.04853057861328125, -0.037387847900390625, -0.0262451171875, -0.015102386474609375, -0.00395965576171875, 0.007183074951171875, 0.0183258056640625, 0.029468536376953125, 0.04061126708984375, 0.051753997802734375, 0.062896728515625, 0.07403945922851562, 0.08518218994140625, 0.09632492065429688, 0.1074676513671875, 0.11861038208007812, 0.12975311279296875, 0.14089584350585938, 0.15203857421875, 0.16318130493164062, 0.17432403564453125, 0.18546676635742188, 0.1966094970703125, 0.20775222778320312, 0.21889495849609375, 0.23003768920898438, 0.241180419921875, 0.2523231506347656, 0.26346588134765625, 0.2746086120605469, 0.2857513427734375, 0.2968940734863281, 0.30803680419921875, 0.3191795349121094, 0.330322265625]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 1.0, 2.0, 3.0, 7.0, 3.0, 9.0, 9.0, 10.0, 12.0, 12.0, 13.0, 15.0, 19.0, 32.0, 38.0, 27.0, 26.0, 32.0, 34.0, 33.0, 44.0, 45.0, 33.0, 37.0, 35.0, 44.0, 47.0, 39.0, 34.0, 42.0, 30.0, 27.0, 32.0, 22.0, 26.0, 16.0, 18.0, 17.0, 11.0, 15.0, 15.0, 8.0, 7.0, 4.0, 3.0, 3.0, 4.0, 4.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.597350120544434, -13.143797874450684, -12.690245628356934, -12.236693382263184, -11.783141136169434, -11.329588890075684, -10.876036643981934, -10.422484397888184, -9.968932151794434, -9.515379905700684, -9.061827659606934, -8.608275413513184, -8.154723167419434, -7.701170921325684, -7.247618675231934, -6.794066429138184, -6.340514183044434, -5.886961936950684, -5.433409690856934, -4.979857444763184, -4.526305198669434, -4.072752952575684, -3.6192007064819336, -3.1656484603881836, -2.7120962142944336, -2.2585439682006836, -1.8049917221069336, -1.3514394760131836, -0.8978872299194336, -0.4443349838256836, 0.009217262268066406, 0.4627695083618164, 0.9163227081298828, 1.3698749542236328, 1.8234272003173828, 2.276979446411133, 2.730531692504883, 3.184083938598633, 3.637636184692383, 4.091188430786133, 4.544740676879883, 4.998292922973633, 5.451845169067383, 5.905397415161133, 6.358949661254883, 6.812501907348633, 7.266054153442383, 7.719606399536133, 8.173158645629883, 8.626710891723633, 9.080263137817383, 9.533815383911133, 9.987367630004883, 10.440919876098633, 10.894472122192383, 11.348024368286133, 11.801576614379883, 12.255128860473633, 12.708681106567383, 13.162233352661133, 13.615785598754883, 14.069337844848633, 14.522890090942383, 14.976442337036133, 15.429994583129883]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 6.0, 6.0, 13.0, 9.0, 9.0, 14.0, 14.0, 9.0, 18.0, 15.0, 25.0, 25.0, 28.0, 24.0, 39.0, 31.0, 29.0, 27.0, 36.0, 33.0, 44.0, 31.0, 39.0, 35.0, 39.0, 35.0, 34.0, 35.0, 40.0, 37.0, 13.0, 33.0, 20.0, 23.0, 26.0, 11.0, 16.0, 11.0, 12.0, 13.0, 7.0, 7.0, 8.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-16.131114959716797, -15.624518394470215, -15.117921829223633, -14.61132526397705, -14.104728698730469, -13.598132133483887, -13.091535568237305, -12.584939002990723, -12.07834243774414, -11.571745872497559, -11.065149307250977, -10.558552742004395, -10.051956176757812, -9.54535961151123, -9.038763046264648, -8.532166481018066, -8.025569915771484, -7.518973350524902, -7.01237678527832, -6.505780220031738, -5.999183654785156, -5.492587089538574, -4.985990524291992, -4.47939395904541, -3.972797393798828, -3.466200828552246, -2.959604263305664, -2.453007698059082, -1.9464111328125, -1.439814567565918, -0.9332180023193359, -0.4266214370727539, 0.07997512817382812, 0.5865716934204102, 1.0931682586669922, 1.5997648239135742, 2.1063613891601562, 2.6129579544067383, 3.1195545196533203, 3.6261510848999023, 4.132747650146484, 4.639344215393066, 5.145940780639648, 5.6525373458862305, 6.1591339111328125, 6.6657304763793945, 7.172327041625977, 7.678923606872559, 8.18552017211914, 8.692116737365723, 9.198713302612305, 9.705309867858887, 10.211906433105469, 10.71850299835205, 11.225099563598633, 11.731696128845215, 12.238292694091797, 12.744889259338379, 13.251485824584961, 13.758082389831543, 14.264678955078125, 14.771275520324707, 15.277872085571289, 15.784468650817871, 16.291065216064453]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 5.0, 5.0, 14.0, 30.0, 37.0, 69.0, 145.0, 177.0, 288.0, 517.0, 804.0, 1194.0, 1931.0, 3012.0, 4610.0, 6921.0, 10405.0, 15245.0, 21502.0, 30131.0, 40429.0, 52256.0, 64851.0, 77060.0, 86591.0, 91808.0, 92679.0, 88595.0, 80077.0, 68792.0, 56325.0, 44145.0, 32757.0, 24368.0, 16679.0, 11575.0, 7925.0, 5203.0, 3441.0, 2160.0, 1430.0, 936.0, 504.0, 327.0, 241.0, 135.0, 93.0, 63.0, 27.0, 16.0, 15.0, 8.0, 4.0, 3.0, 3.0, 1.0, 2.0], "bins": [-11.015625, -10.683349609375, -10.35107421875, -10.018798828125, -9.6865234375, -9.354248046875, -9.02197265625, -8.689697265625, -8.357421875, -8.025146484375, -7.69287109375, -7.360595703125, -7.0283203125, -6.696044921875, -6.36376953125, -6.031494140625, -5.69921875, -5.366943359375, -5.03466796875, -4.702392578125, -4.3701171875, -4.037841796875, -3.70556640625, -3.373291015625, -3.041015625, -2.708740234375, -2.37646484375, -2.044189453125, -1.7119140625, -1.379638671875, -1.04736328125, -0.715087890625, -0.3828125, -0.050537109375, 0.28173828125, 0.614013671875, 0.9462890625, 1.278564453125, 1.61083984375, 1.943115234375, 2.275390625, 2.607666015625, 2.93994140625, 3.272216796875, 3.6044921875, 3.936767578125, 4.26904296875, 4.601318359375, 4.93359375, 5.265869140625, 5.59814453125, 5.930419921875, 6.2626953125, 6.594970703125, 6.92724609375, 7.259521484375, 7.591796875, 7.924072265625, 8.25634765625, 8.588623046875, 8.9208984375, 9.253173828125, 9.58544921875, 9.917724609375, 10.25]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 4.0, 3.0, 5.0, 4.0, 6.0, 14.0, 9.0, 11.0, 12.0, 16.0, 7.0, 16.0, 17.0, 25.0, 23.0, 30.0, 21.0, 42.0, 34.0, 28.0, 24.0, 38.0, 34.0, 40.0, 32.0, 38.0, 35.0, 38.0, 38.0, 31.0, 37.0, 42.0, 32.0, 22.0, 31.0, 17.0, 26.0, 23.0, 9.0, 19.0, 12.0, 11.0, 11.0, 9.0, 8.0, 7.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-16.296875, -15.785888671875, -15.27490234375, -14.763916015625, -14.2529296875, -13.741943359375, -13.23095703125, -12.719970703125, -12.208984375, -11.697998046875, -11.18701171875, -10.676025390625, -10.1650390625, -9.654052734375, -9.14306640625, -8.632080078125, -8.12109375, -7.610107421875, -7.09912109375, -6.588134765625, -6.0771484375, -5.566162109375, -5.05517578125, -4.544189453125, -4.033203125, -3.522216796875, -3.01123046875, -2.500244140625, -1.9892578125, -1.478271484375, -0.96728515625, -0.456298828125, 0.0546875, 0.565673828125, 1.07666015625, 1.587646484375, 2.0986328125, 2.609619140625, 3.12060546875, 3.631591796875, 4.142578125, 4.653564453125, 5.16455078125, 5.675537109375, 6.1865234375, 6.697509765625, 7.20849609375, 7.719482421875, 8.23046875, 8.741455078125, 9.25244140625, 9.763427734375, 10.2744140625, 10.785400390625, 11.29638671875, 11.807373046875, 12.318359375, 12.829345703125, 13.34033203125, 13.851318359375, 14.3623046875, 14.873291015625, 15.38427734375, 15.895263671875, 16.40625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 10.0, 2.0, 7.0, 14.0, 19.0, 31.0, 32.0, 76.0, 112.0, 179.0, 259.0, 367.0, 601.0, 1023.0, 1489.0, 2304.0, 3462.0, 5616.0, 8387.0, 12319.0, 18732.0, 27380.0, 38481.0, 52366.0, 67699.0, 84048.0, 96806.0, 103076.0, 103988.0, 96302.0, 83478.0, 67530.0, 52474.0, 38560.0, 26898.0, 18422.0, 12533.0, 8197.0, 5406.0, 3394.0, 2234.0, 1534.0, 917.0, 642.0, 411.0, 239.0, 171.0, 121.0, 71.0, 54.0, 29.0, 27.0, 14.0, 11.0, 6.0, 6.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.5546875, -13.1309814453125, -12.707275390625, -12.2835693359375, -11.85986328125, -11.4361572265625, -11.012451171875, -10.5887451171875, -10.1650390625, -9.7413330078125, -9.317626953125, -8.8939208984375, -8.47021484375, -8.0465087890625, -7.622802734375, -7.1990966796875, -6.775390625, -6.3516845703125, -5.927978515625, -5.5042724609375, -5.08056640625, -4.6568603515625, -4.233154296875, -3.8094482421875, -3.3857421875, -2.9620361328125, -2.538330078125, -2.1146240234375, -1.69091796875, -1.2672119140625, -0.843505859375, -0.4197998046875, 0.00390625, 0.4276123046875, 0.851318359375, 1.2750244140625, 1.69873046875, 2.1224365234375, 2.546142578125, 2.9698486328125, 3.3935546875, 3.8172607421875, 4.240966796875, 4.6646728515625, 5.08837890625, 5.5120849609375, 5.935791015625, 6.3594970703125, 6.783203125, 7.2069091796875, 7.630615234375, 8.0543212890625, 8.47802734375, 8.9017333984375, 9.325439453125, 9.7491455078125, 10.1728515625, 10.5965576171875, 11.020263671875, 11.4439697265625, 11.86767578125, 12.2913818359375, 12.715087890625, 13.1387939453125, 13.5625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 7.0, 4.0, 8.0, 11.0, 14.0, 15.0, 13.0, 20.0, 25.0, 25.0, 27.0, 39.0, 44.0, 32.0, 39.0, 49.0, 41.0, 52.0, 44.0, 51.0, 42.0, 43.0, 33.0, 55.0, 33.0, 32.0, 32.0, 26.0, 26.0, 23.0, 15.0, 10.0, 11.0, 13.0, 9.0, 8.0, 7.0, 6.0, 5.0, 6.0, 1.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.4140625, -14.009033203125, -13.60400390625, -13.198974609375, -12.7939453125, -12.388916015625, -11.98388671875, -11.578857421875, -11.173828125, -10.768798828125, -10.36376953125, -9.958740234375, -9.5537109375, -9.148681640625, -8.74365234375, -8.338623046875, -7.93359375, -7.528564453125, -7.12353515625, -6.718505859375, -6.3134765625, -5.908447265625, -5.50341796875, -5.098388671875, -4.693359375, -4.288330078125, -3.88330078125, -3.478271484375, -3.0732421875, -2.668212890625, -2.26318359375, -1.858154296875, -1.453125, -1.048095703125, -0.64306640625, -0.238037109375, 0.1669921875, 0.572021484375, 0.97705078125, 1.382080078125, 1.787109375, 2.192138671875, 2.59716796875, 3.002197265625, 3.4072265625, 3.812255859375, 4.21728515625, 4.622314453125, 5.02734375, 5.432373046875, 5.83740234375, 6.242431640625, 6.6474609375, 7.052490234375, 7.45751953125, 7.862548828125, 8.267578125, 8.672607421875, 9.07763671875, 9.482666015625, 9.8876953125, 10.292724609375, 10.69775390625, 11.102783203125, 11.5078125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 3.0, 10.0, 5.0, 15.0, 14.0, 36.0, 46.0, 82.0, 120.0, 195.0, 312.0, 495.0, 786.0, 1284.0, 2025.0, 3335.0, 5519.0, 8898.0, 13828.0, 21847.0, 33117.0, 48610.0, 68005.0, 88074.0, 106552.0, 117185.0, 117755.0, 107562.0, 89639.0, 68900.0, 49958.0, 33844.0, 22325.0, 14519.0, 9071.0, 5446.0, 3494.0, 2091.0, 1325.0, 821.0, 514.0, 327.0, 216.0, 128.0, 92.0, 46.0, 33.0, 23.0, 10.0, 8.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.30078125, -5.124267578125, -4.94775390625, -4.771240234375, -4.5947265625, -4.418212890625, -4.24169921875, -4.065185546875, -3.888671875, -3.712158203125, -3.53564453125, -3.359130859375, -3.1826171875, -3.006103515625, -2.82958984375, -2.653076171875, -2.4765625, -2.300048828125, -2.12353515625, -1.947021484375, -1.7705078125, -1.593994140625, -1.41748046875, -1.240966796875, -1.064453125, -0.887939453125, -0.71142578125, -0.534912109375, -0.3583984375, -0.181884765625, -0.00537109375, 0.171142578125, 0.34765625, 0.524169921875, 0.70068359375, 0.877197265625, 1.0537109375, 1.230224609375, 1.40673828125, 1.583251953125, 1.759765625, 1.936279296875, 2.11279296875, 2.289306640625, 2.4658203125, 2.642333984375, 2.81884765625, 2.995361328125, 3.171875, 3.348388671875, 3.52490234375, 3.701416015625, 3.8779296875, 4.054443359375, 4.23095703125, 4.407470703125, 4.583984375, 4.760498046875, 4.93701171875, 5.113525390625, 5.2900390625, 5.466552734375, 5.64306640625, 5.819580078125, 5.99609375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 4.0, 8.0, 5.0, 12.0, 8.0, 14.0, 16.0, 20.0, 31.0, 33.0, 35.0, 42.0, 52.0, 39.0, 51.0, 65.0, 61.0, 52.0, 59.0, 42.0, 44.0, 47.0, 50.0, 42.0, 23.0, 39.0, 23.0, 19.0, 16.0, 7.0, 13.0, 9.0, 7.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007200241088867188, -0.0006935149431228638, -0.0006670057773590088, -0.0006404966115951538, -0.0006139874458312988, -0.0005874782800674438, -0.0005609691143035889, -0.0005344599485397339, -0.0005079507827758789, -0.0004814416170120239, -0.00045493245124816895, -0.00042842328548431396, -0.000401914119720459, -0.000375404953956604, -0.000348895788192749, -0.00032238662242889404, -0.00029587745666503906, -0.0002693682909011841, -0.0002428591251373291, -0.00021634995937347412, -0.00018984079360961914, -0.00016333162784576416, -0.00013682246208190918, -0.0001103132963180542, -8.380413055419922e-05, -5.729496479034424e-05, -3.078579902648926e-05, -4.276633262634277e-06, 2.2232532501220703e-05, 4.8741698265075684e-05, 7.525086402893066e-05, 0.00010176002979278564, 0.00012826919555664062, 0.0001547783613204956, 0.00018128752708435059, 0.00020779669284820557, 0.00023430585861206055, 0.00026081502437591553, 0.0002873241901397705, 0.0003138333559036255, 0.00034034252166748047, 0.00036685168743133545, 0.00039336085319519043, 0.0004198700189590454, 0.0004463791847229004, 0.00047288835048675537, 0.0004993975162506104, 0.0005259066820144653, 0.0005524158477783203, 0.0005789250135421753, 0.0006054341793060303, 0.0006319433450698853, 0.0006584525108337402, 0.0006849616765975952, 0.0007114708423614502, 0.0007379800081253052, 0.0007644891738891602, 0.0007909983396530151, 0.0008175075054168701, 0.0008440166711807251, 0.0008705258369445801, 0.0008970350027084351, 0.00092354416847229, 0.000950053334236145, 0.0009765625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 9.0, 16.0, 16.0, 29.0, 36.0, 63.0, 103.0, 183.0, 302.0, 545.0, 845.0, 1346.0, 2356.0, 3731.0, 6174.0, 10013.0, 16206.0, 25110.0, 37892.0, 54871.0, 74617.0, 95134.0, 111656.0, 119401.0, 115745.0, 101948.0, 83032.0, 62704.0, 44275.0, 29627.0, 19206.0, 12196.0, 7528.0, 4610.0, 2778.0, 1646.0, 1072.0, 610.0, 352.0, 246.0, 117.0, 91.0, 49.0, 27.0, 19.0, 16.0, 5.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.56640625, -5.37896728515625, -5.1915283203125, -5.00408935546875, -4.816650390625, -4.62921142578125, -4.4417724609375, -4.25433349609375, -4.06689453125, -3.87945556640625, -3.6920166015625, -3.50457763671875, -3.317138671875, -3.12969970703125, -2.9422607421875, -2.75482177734375, -2.5673828125, -2.37994384765625, -2.1925048828125, -2.00506591796875, -1.817626953125, -1.63018798828125, -1.4427490234375, -1.25531005859375, -1.06787109375, -0.88043212890625, -0.6929931640625, -0.50555419921875, -0.318115234375, -0.13067626953125, 0.0567626953125, 0.24420166015625, 0.431640625, 0.61907958984375, 0.8065185546875, 0.99395751953125, 1.181396484375, 1.36883544921875, 1.5562744140625, 1.74371337890625, 1.93115234375, 2.11859130859375, 2.3060302734375, 2.49346923828125, 2.680908203125, 2.86834716796875, 3.0557861328125, 3.24322509765625, 3.4306640625, 3.61810302734375, 3.8055419921875, 3.99298095703125, 4.180419921875, 4.36785888671875, 4.5552978515625, 4.74273681640625, 4.93017578125, 5.11761474609375, 5.3050537109375, 5.49249267578125, 5.679931640625, 5.86737060546875, 6.0548095703125, 6.24224853515625, 6.4296875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 10.0, 11.0, 18.0, 10.0, 20.0, 21.0, 31.0, 38.0, 33.0, 46.0, 60.0, 66.0, 55.0, 68.0, 54.0, 59.0, 59.0, 60.0, 39.0, 26.0, 38.0, 34.0, 31.0, 24.0, 19.0, 16.0, 14.0, 5.0, 9.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3203125, -3.21319580078125, -3.1060791015625, -2.99896240234375, -2.891845703125, -2.78472900390625, -2.6776123046875, -2.57049560546875, -2.46337890625, -2.35626220703125, -2.2491455078125, -2.14202880859375, -2.034912109375, -1.92779541015625, -1.8206787109375, -1.71356201171875, -1.6064453125, -1.49932861328125, -1.3922119140625, -1.28509521484375, -1.177978515625, -1.07086181640625, -0.9637451171875, -0.85662841796875, -0.74951171875, -0.64239501953125, -0.5352783203125, -0.42816162109375, -0.321044921875, -0.21392822265625, -0.1068115234375, 0.00030517578125, 0.107421875, 0.21453857421875, 0.3216552734375, 0.42877197265625, 0.535888671875, 0.64300537109375, 0.7501220703125, 0.85723876953125, 0.96435546875, 1.07147216796875, 1.1785888671875, 1.28570556640625, 1.392822265625, 1.49993896484375, 1.6070556640625, 1.71417236328125, 1.8212890625, 1.92840576171875, 2.0355224609375, 2.14263916015625, 2.249755859375, 2.35687255859375, 2.4639892578125, 2.57110595703125, 2.67822265625, 2.78533935546875, 2.8924560546875, 2.99957275390625, 3.106689453125, 3.21380615234375, 3.3209228515625, 3.42803955078125, 3.53515625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 7.0, 7.0, 10.0, 17.0, 21.0, 22.0, 23.0, 25.0, 16.0, 29.0, 29.0, 40.0, 28.0, 52.0, 37.0, 43.0, 41.0, 36.0, 47.0, 35.0, 48.0, 41.0, 43.0, 39.0, 22.0, 43.0, 20.0, 17.0, 20.0, 24.0, 19.0, 13.0, 10.0, 13.0, 12.0, 7.0, 6.0, 8.0, 5.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.391257286071777, -13.896187782287598, -13.401119232177734, -12.906049728393555, -12.410980224609375, -11.915910720825195, -11.420842170715332, -10.925772666931152, -10.430704116821289, -9.93563461303711, -9.440566062927246, -8.945496559143066, -8.450427055358887, -7.955358028411865, -7.460289001464844, -6.965219497680664, -6.470149993896484, -5.975080966949463, -5.480011463165283, -4.984942436218262, -4.489872932434082, -3.9948039054870605, -3.499734878540039, -3.0046656131744385, -2.509596347808838, -2.0145270824432373, -1.5194579362869263, -1.0243887901306152, -0.5293195247650146, -0.03425025939941406, 0.4608187675476074, 0.955888032913208, 1.450958251953125, 1.9460275173187256, 2.441096782684326, 2.9361658096313477, 3.4312350749969482, 3.926304340362549, 4.42137336730957, 4.91644287109375, 5.4115118980407715, 5.906580924987793, 6.401650428771973, 6.896719455718994, 7.391788482666016, 7.886857986450195, 8.381927490234375, 8.876996040344238, 9.372065544128418, 9.867135047912598, 10.362203598022461, 10.85727310180664, 11.35234260559082, 11.847412109375, 12.342480659484863, 12.837550163269043, 13.332618713378906, 13.827688217163086, 14.32275676727295, 14.817826271057129, 15.312895774841309, 15.807964324951172, 16.30303382873535, 16.79810333251953, 17.29317283630371]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 3.0, 2.0, 3.0, 9.0, 15.0, 11.0, 4.0, 4.0, 14.0, 12.0, 23.0, 14.0, 25.0, 25.0, 22.0, 37.0, 31.0, 26.0, 35.0, 37.0, 37.0, 33.0, 29.0, 36.0, 31.0, 34.0, 32.0, 40.0, 32.0, 46.0, 36.0, 21.0, 37.0, 28.0, 27.0, 25.0, 12.0, 21.0, 17.0, 13.0, 13.0, 9.0, 7.0, 4.0, 7.0, 5.0, 9.0, 1.0, 1.0, 5.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.196800231933594, -17.611371994018555, -17.02594566345215, -16.44051742553711, -15.855091094970703, -15.269662857055664, -14.684235572814941, -14.098808288574219, -13.513381004333496, -12.927953720092773, -12.34252643585205, -11.757099151611328, -11.171670913696289, -10.586244583129883, -10.000816345214844, -9.415389060974121, -8.829961776733398, -8.244534492492676, -7.659107208251953, -7.073679447174072, -6.48825216293335, -5.902824878692627, -5.317397117614746, -4.731969833374023, -4.146542549133301, -3.561115264892578, -2.9756877422332764, -2.3902602195739746, -1.804832935333252, -1.2194056510925293, -0.6339781284332275, -0.04855060577392578, 0.5368747711181641, 1.1223021745681763, 1.7077295780181885, 2.2931571006774902, 2.878584384918213, 3.4640116691589355, 4.049439430236816, 4.634866714477539, 5.220293998718262, 5.805721282958984, 6.391148567199707, 6.976576328277588, 7.5620036125183105, 8.147430419921875, 8.732858657836914, 9.318285942077637, 9.90371322631836, 10.489140510559082, 11.074567794799805, 11.659995079040527, 12.24542236328125, 12.830850601196289, 13.416277885437012, 14.001705169677734, 14.587132453918457, 15.17255973815918, 15.757987022399902, 16.343414306640625, 16.928842544555664, 17.51426887512207, 18.09969711303711, 18.685123443603516, 19.270551681518555]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [2.0, 6.0, 0.0, 3.0, 3.0, 6.0, 6.0, 10.0, 9.0, 16.0, 18.0, 23.0, 39.0, 47.0, 49.0, 87.0, 99.0, 153.0, 163.0, 254.0, 301.0, 402.0, 512.0, 649.0, 791.0, 951.0, 1073.0, 1211.0, 1248.0, 1034512.0, 1184.0, 1146.0, 1043.0, 918.0, 761.0, 690.0, 501.0, 446.0, 309.0, 246.0, 183.0, 139.0, 108.0, 76.0, 63.0, 41.0, 33.0, 19.0, 21.0, 15.0, 8.0, 10.0, 2.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-204.1968231201172, -197.27210998535156, -190.34739685058594, -183.4226837158203, -176.49795532226562, -169.5732421875, -162.64852905273438, -155.72381591796875, -148.79910278320312, -141.8743896484375, -134.94967651367188, -128.02496337890625, -121.1002426147461, -114.17552947998047, -107.25080871582031, -100.32609558105469, -93.40138244628906, -86.47666931152344, -79.55195617675781, -72.62723541259766, -65.70252227783203, -58.777809143066406, -51.853092193603516, -44.928375244140625, -38.003662109375, -31.078947067260742, -24.154232025146484, -17.229516983032227, -10.304801940917969, -3.3800888061523438, 3.544628143310547, 10.469345092773438, 17.394058227539062, 24.31877326965332, 31.243488311767578, 38.16820526123047, 45.092918395996094, 52.01763153076172, 58.94234848022461, 65.8670654296875, 72.79177856445312, 79.71649169921875, 86.64120483398438, 93.56592559814453, 100.49063873291016, 107.41535186767578, 114.34007263183594, 121.26478576660156, 128.1894989013672, 135.1142120361328, 142.03892517089844, 148.96363830566406, 155.88836669921875, 162.81307983398438, 169.73779296875, 176.66250610351562, 183.58721923828125, 190.51193237304688, 197.4366455078125, 204.36135864257812, 211.28607177734375, 218.21078491210938, 225.13551330566406, 232.0602264404297, 238.9849395751953]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [3.0, 2.0, 6.0, 3.0, 7.0, 16.0, 15.0, 19.0, 30.0, 48.0, 57.0, 92.0, 111.0, 159.0, 264.0, 322.0, 419.0, 586.0, 769.0, 1035.0, 1391.0, 1827.0, 2400.0, 3012.0, 3687.0, 4751.0, 5840.0, 7760.0, 13664.0, 51321324.0, 59825.0, 10381.0, 6893.0, 5337.0, 4328.0, 3461.0, 2731.0, 2207.0, 1724.0, 1265.0, 957.0, 694.0, 529.0, 388.0, 294.0, 195.0, 153.0, 113.0, 95.0, 55.0, 33.0, 28.0, 22.0, 10.0, 8.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-128.9039306640625, -124.5826416015625, -120.26134490966797, -115.94005584716797, -111.61875915527344, -107.29747009277344, -102.97618103027344, -98.65489196777344, -94.3335952758789, -90.0123062133789, -85.69100952148438, -81.36972045898438, -77.04843139648438, -72.72713470458984, -68.40584564208984, -64.08454895019531, -59.76325988769531, -55.44196701049805, -51.12067413330078, -46.79938507080078, -42.478092193603516, -38.15679931640625, -33.83551025390625, -29.514217376708984, -25.19292449951172, -20.871631622314453, -16.55034065246582, -12.229048728942871, -7.907756805419922, -3.5864639282226562, 0.7348270416259766, 5.056118011474609, 9.377410888671875, 13.698702812194824, 18.019994735717773, 22.341285705566406, 26.662578582763672, 30.983871459960938, 35.30516052246094, 39.6264533996582, 43.94774627685547, 48.269039154052734, 52.59033203125, 56.91162109375, 61.232913970947266, 65.55420684814453, 69.87549591064453, 74.19679260253906, 78.51808166503906, 82.83937072753906, 87.1606674194336, 91.4819564819336, 95.80325317382812, 100.12454223632812, 104.44583129882812, 108.76712036132812, 113.08841705322266, 117.40970611572266, 121.73100280761719, 126.05229187011719, 130.3735809326172, 134.69488525390625, 139.01617431640625, 143.33746337890625, 147.65875244140625]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 3.0, 7.0, 5.0, 6.0, 11.0, 16.0, 31.0, 48.0, 67.0, 100.0, 160.0, 200.0, 276.0, 432.0, 672.0, 1040.0, 1528.0, 2596.0, 4377.0, 7818.0, 14250.0, 26420.0, 51916.0, 103574.0, 211711.0, 463547.0, 1692434.0, 2617698.0, 581561.0, 254270.0, 123366.0, 61446.0, 31153.0, 16528.0, 8996.0, 5033.0, 3002.0, 1739.0, 1159.0, 723.0, 459.0, 329.0, 192.0, 174.0, 103.0, 77.0, 63.0, 32.0, 21.0, 19.0, 18.0, 10.0, 10.0, 6.0, 3.0, 6.0, 0.0, 3.0], "bins": [-6.56640625, -6.3681640625, -6.169921875, -5.9716796875, -5.7734375, -5.5751953125, -5.376953125, -5.1787109375, -4.98046875, -4.7822265625, -4.583984375, -4.3857421875, -4.1875, -3.9892578125, -3.791015625, -3.5927734375, -3.39453125, -3.1962890625, -2.998046875, -2.7998046875, -2.6015625, -2.4033203125, -2.205078125, -2.0068359375, -1.80859375, -1.6103515625, -1.412109375, -1.2138671875, -1.015625, -0.8173828125, -0.619140625, -0.4208984375, -0.22265625, -0.0244140625, 0.173828125, 0.3720703125, 0.5703125, 0.7685546875, 0.966796875, 1.1650390625, 1.36328125, 1.5615234375, 1.759765625, 1.9580078125, 2.15625, 2.3544921875, 2.552734375, 2.7509765625, 2.94921875, 3.1474609375, 3.345703125, 3.5439453125, 3.7421875, 3.9404296875, 4.138671875, 4.3369140625, 4.53515625, 4.7333984375, 4.931640625, 5.1298828125, 5.328125, 5.5263671875, 5.724609375, 5.9228515625, 6.12109375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 6.0, 0.0, 5.0, 10.0, 9.0, 17.0, 16.0, 19.0, 20.0, 35.0, 39.0, 25.0, 45.0, 42.0, 49.0, 65.0, 99.0, 379.0, 513.0, 187.0, 88.0, 48.0, 54.0, 50.0, 27.0, 37.0, 33.0, 24.0, 20.0, 16.0, 11.0, 10.0, 6.0, 5.0, 7.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-15.3125, -14.920654296875, -14.52880859375, -14.136962890625, -13.7451171875, -13.353271484375, -12.96142578125, -12.569580078125, -12.177734375, -11.785888671875, -11.39404296875, -11.002197265625, -10.6103515625, -10.218505859375, -9.82666015625, -9.434814453125, -9.04296875, -8.651123046875, -8.25927734375, -7.867431640625, -7.4755859375, -7.083740234375, -6.69189453125, -6.300048828125, -5.908203125, -5.516357421875, -5.12451171875, -4.732666015625, -4.3408203125, -3.948974609375, -3.55712890625, -3.165283203125, -2.7734375, -2.381591796875, -1.98974609375, -1.597900390625, -1.2060546875, -0.814208984375, -0.42236328125, -0.030517578125, 0.361328125, 0.753173828125, 1.14501953125, 1.536865234375, 1.9287109375, 2.320556640625, 2.71240234375, 3.104248046875, 3.49609375, 3.887939453125, 4.27978515625, 4.671630859375, 5.0634765625, 5.455322265625, 5.84716796875, 6.239013671875, 6.630859375, 7.022705078125, 7.41455078125, 7.806396484375, 8.1982421875, 8.590087890625, 8.98193359375, 9.373779296875, 9.765625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 12.0, 5.0, 9.0, 7.0, 17.0, 22.0, 33.0, 39.0, 88.0, 110.0, 159.0, 249.0, 369.0, 616.0, 940.0, 1570.0, 2535.0, 4516.0, 7925.0, 15304.0, 30284.0, 62962.0, 137560.0, 308846.0, 824805.0, 3581663.0, 758175.0, 297395.0, 131891.0, 60290.0, 29071.0, 14658.0, 7940.0, 4494.0, 2592.0, 1600.0, 985.0, 557.0, 373.0, 265.0, 166.0, 117.0, 90.0, 40.0, 39.0, 24.0, 11.0, 8.0, 2.0, 8.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.7890625, -4.64599609375, -4.5029296875, -4.35986328125, -4.216796875, -4.07373046875, -3.9306640625, -3.78759765625, -3.64453125, -3.50146484375, -3.3583984375, -3.21533203125, -3.072265625, -2.92919921875, -2.7861328125, -2.64306640625, -2.5, -2.35693359375, -2.2138671875, -2.07080078125, -1.927734375, -1.78466796875, -1.6416015625, -1.49853515625, -1.35546875, -1.21240234375, -1.0693359375, -0.92626953125, -0.783203125, -0.64013671875, -0.4970703125, -0.35400390625, -0.2109375, -0.06787109375, 0.0751953125, 0.21826171875, 0.361328125, 0.50439453125, 0.6474609375, 0.79052734375, 0.93359375, 1.07666015625, 1.2197265625, 1.36279296875, 1.505859375, 1.64892578125, 1.7919921875, 1.93505859375, 2.078125, 2.22119140625, 2.3642578125, 2.50732421875, 2.650390625, 2.79345703125, 2.9365234375, 3.07958984375, 3.22265625, 3.36572265625, 3.5087890625, 3.65185546875, 3.794921875, 3.93798828125, 4.0810546875, 4.22412109375, 4.3671875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 10.0, 8.0, 6.0, 24.0, 21.0, 27.0, 33.0, 40.0, 50.0, 51.0, 36.0, 43.0, 49.0, 110.0, 457.0, 407.0, 171.0, 101.0, 71.0, 59.0, 50.0, 34.0, 34.0, 33.0, 23.0, 16.0, 10.0, 12.0, 8.0, 4.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7421875, -8.4183349609375, -8.094482421875, -7.7706298828125, -7.44677734375, -7.1229248046875, -6.799072265625, -6.4752197265625, -6.1513671875, -5.8275146484375, -5.503662109375, -5.1798095703125, -4.85595703125, -4.5321044921875, -4.208251953125, -3.8843994140625, -3.560546875, -3.2366943359375, -2.912841796875, -2.5889892578125, -2.26513671875, -1.9412841796875, -1.617431640625, -1.2935791015625, -0.9697265625, -0.6458740234375, -0.322021484375, 0.0018310546875, 0.32568359375, 0.6495361328125, 0.973388671875, 1.2972412109375, 1.62109375, 1.9449462890625, 2.268798828125, 2.5926513671875, 2.91650390625, 3.2403564453125, 3.564208984375, 3.8880615234375, 4.2119140625, 4.5357666015625, 4.859619140625, 5.1834716796875, 5.50732421875, 5.8311767578125, 6.155029296875, 6.4788818359375, 6.802734375, 7.1265869140625, 7.450439453125, 7.7742919921875, 8.09814453125, 8.4219970703125, 8.745849609375, 9.0697021484375, 9.3935546875, 9.7174072265625, 10.041259765625, 10.3651123046875, 10.68896484375, 11.0128173828125, 11.336669921875, 11.6605224609375, 11.984375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 10.0, 7.0, 13.0, 14.0, 35.0, 30.0, 36.0, 66.0, 65.0, 98.0, 119.0, 146.0, 205.0, 295.0, 461.0, 620.0, 1021.0, 1549.0, 3036.0, 6350.0, 15830.0, 54157.0, 5885631.0, 263414.0, 34886.0, 11741.0, 4959.0, 2499.0, 1333.0, 805.0, 522.0, 404.0, 226.0, 221.0, 145.0, 116.0, 105.0, 72.0, 40.0, 46.0, 10.0, 20.0, 14.0, 14.0, 16.0, 12.0, 3.0, 6.0, 4.0, 1.0, 0.0, 3.0, 5.0], "bins": [-35.75, -34.69384765625, -33.6376953125, -32.58154296875, -31.525390625, -30.46923828125, -29.4130859375, -28.35693359375, -27.30078125, -26.24462890625, -25.1884765625, -24.13232421875, -23.076171875, -22.02001953125, -20.9638671875, -19.90771484375, -18.8515625, -17.79541015625, -16.7392578125, -15.68310546875, -14.626953125, -13.57080078125, -12.5146484375, -11.45849609375, -10.40234375, -9.34619140625, -8.2900390625, -7.23388671875, -6.177734375, -5.12158203125, -4.0654296875, -3.00927734375, -1.953125, -0.89697265625, 0.1591796875, 1.21533203125, 2.271484375, 3.32763671875, 4.3837890625, 5.43994140625, 6.49609375, 7.55224609375, 8.6083984375, 9.66455078125, 10.720703125, 11.77685546875, 12.8330078125, 13.88916015625, 14.9453125, 16.00146484375, 17.0576171875, 18.11376953125, 19.169921875, 20.22607421875, 21.2822265625, 22.33837890625, 23.39453125, 24.45068359375, 25.5068359375, 26.56298828125, 27.619140625, 28.67529296875, 29.7314453125, 30.78759765625, 31.84375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 7.0, 2.0, 3.0, 7.0, 9.0, 8.0, 11.0, 15.0, 14.0, 16.0, 25.0, 39.0, 43.0, 52.0, 49.0, 89.0, 186.0, 549.0, 359.0, 170.0, 98.0, 75.0, 45.0, 34.0, 19.0, 16.0, 25.0, 15.0, 9.0, 8.0, 8.0, 6.0, 3.0, 7.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.6953125, -12.3404541015625, -11.985595703125, -11.6307373046875, -11.27587890625, -10.9210205078125, -10.566162109375, -10.2113037109375, -9.8564453125, -9.5015869140625, -9.146728515625, -8.7918701171875, -8.43701171875, -8.0821533203125, -7.727294921875, -7.3724365234375, -7.017578125, -6.6627197265625, -6.307861328125, -5.9530029296875, -5.59814453125, -5.2432861328125, -4.888427734375, -4.5335693359375, -4.1787109375, -3.8238525390625, -3.468994140625, -3.1141357421875, -2.75927734375, -2.4044189453125, -2.049560546875, -1.6947021484375, -1.33984375, -0.9849853515625, -0.630126953125, -0.2752685546875, 0.07958984375, 0.4344482421875, 0.789306640625, 1.1441650390625, 1.4990234375, 1.8538818359375, 2.208740234375, 2.5635986328125, 2.91845703125, 3.2733154296875, 3.628173828125, 3.9830322265625, 4.337890625, 4.6927490234375, 5.047607421875, 5.4024658203125, 5.75732421875, 6.1121826171875, 6.467041015625, 6.8218994140625, 7.1767578125, 7.5316162109375, 7.886474609375, 8.2413330078125, 8.59619140625, 8.9510498046875, 9.305908203125, 9.6607666015625, 10.015625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 9.0, 33.0, 221.0, 655.0, 59.0, 22.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-223.01712036132812, -212.94561767578125, -202.87411499023438, -192.80262756347656, -182.7311248779297, -172.6596221923828, -162.588134765625, -152.51663208007812, -142.44512939453125, -132.37362670898438, -122.30213165283203, -112.23063659667969, -102.15913391113281, -92.08763122558594, -82.0161361694336, -71.94464111328125, -61.873138427734375, -51.801639556884766, -41.730140686035156, -31.658641815185547, -21.587142944335938, -11.515644073486328, -1.4441452026367188, 8.627349853515625, 18.6988525390625, 28.77035140991211, 38.84185028076172, 48.91334915161133, 58.98484802246094, 69.05635070800781, 79.12784576416016, 89.1993408203125, 99.2708740234375, 109.34237670898438, 119.41387176513672, 129.48536682128906, 139.55686950683594, 149.6283721923828, 159.69985961914062, 169.7713623046875, 179.84286499023438, 189.91436767578125, 199.98587036132812, 210.05735778808594, 220.1288604736328, 230.2003631591797, 240.2718505859375, 250.34335327148438, 260.41485595703125, 270.4863586425781, 280.557861328125, 290.6293640136719, 300.70086669921875, 310.7723388671875, 320.8438415527344, 330.91534423828125, 340.9868469238281, 351.058349609375, 361.1298522949219, 371.20135498046875, 381.2728271484375, 391.3443298339844, 401.41583251953125, 411.4873352050781, 421.558837890625]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 8.0, 3.0, 6.0, 2.0, 7.0, 5.0, 11.0, 24.0, 37.0, 87.0, 262.0, 332.0, 108.0, 41.0, 22.0, 18.0, 8.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-122.6688232421875, -119.075927734375, -115.4830322265625, -111.89013671875, -108.29723358154297, -104.70433807373047, -101.11144256591797, -97.51854705810547, -93.92564392089844, -90.33274841308594, -86.73985290527344, -83.14695739746094, -79.5540542602539, -75.9611587524414, -72.3682632446289, -68.7753677368164, -65.1824722290039, -61.589576721191406, -57.99667739868164, -54.40378189086914, -50.810882568359375, -47.217987060546875, -43.625091552734375, -40.032196044921875, -36.43929672241211, -32.84640121459961, -29.253501892089844, -25.660606384277344, -22.06770896911621, -18.474811553955078, -14.881916046142578, -11.289018630981445, -7.6961212158203125, -4.103224277496338, -0.5103273391723633, 3.082569122314453, 6.675466537475586, 10.268363952636719, 13.861259460449219, 17.45415687561035, 21.047054290771484, 24.639951705932617, 28.23284912109375, 31.82574462890625, 35.41864013671875, 39.011539459228516, 42.604434967041016, 46.19733428955078, 49.79022979736328, 53.38312530517578, 56.97602462768555, 60.56892013549805, 64.16181945800781, 67.75471496582031, 71.34761047363281, 74.94050598144531, 78.53340148925781, 82.12629699707031, 85.71919250488281, 89.31208801269531, 92.90499114990234, 96.49788665771484, 100.09078216552734, 103.68367767333984, 107.27658081054688]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 7.0, 2.0, 6.0, 6.0, 7.0, 6.0, 10.0, 8.0, 14.0, 17.0, 25.0, 28.0, 35.0, 38.0, 59.0, 85.0, 96.0, 103.0, 151.0, 166.0, 266.0, 321.0, 414.0, 490.0, 734.0, 1051.0, 1546.0, 2382.0, 4039.0, 6707.0, 12374.0, 24987.0, 72851.0, 1048210.0, 2864738.0, 94704.0, 27795.0, 12622.0, 6513.0, 3808.0, 2475.0, 1611.0, 981.0, 646.0, 391.0, 261.0, 164.0, 129.0, 83.0, 50.0, 29.0, 18.0, 13.0, 10.0, 4.0, 6.0, 5.0], "bins": [-1.29296875, -1.2614898681640625, -1.230010986328125, -1.1985321044921875, -1.16705322265625, -1.1355743408203125, -1.104095458984375, -1.0726165771484375, -1.0411376953125, -1.0096588134765625, -0.978179931640625, -0.9467010498046875, -0.91522216796875, -0.8837432861328125, -0.852264404296875, -0.8207855224609375, -0.789306640625, -0.7578277587890625, -0.726348876953125, -0.6948699951171875, -0.66339111328125, -0.6319122314453125, -0.600433349609375, -0.5689544677734375, -0.5374755859375, -0.5059967041015625, -0.474517822265625, -0.4430389404296875, -0.41156005859375, -0.3800811767578125, -0.348602294921875, -0.3171234130859375, -0.28564453125, -0.2541656494140625, -0.222686767578125, -0.1912078857421875, -0.15972900390625, -0.1282501220703125, -0.096771240234375, -0.0652923583984375, -0.0338134765625, -0.0023345947265625, 0.029144287109375, 0.0606231689453125, 0.09210205078125, 0.1235809326171875, 0.155059814453125, 0.1865386962890625, 0.218017578125, 0.2494964599609375, 0.280975341796875, 0.3124542236328125, 0.34393310546875, 0.3754119873046875, 0.406890869140625, 0.4383697509765625, 0.4698486328125, 0.5013275146484375, 0.532806396484375, 0.5642852783203125, 0.59576416015625, 0.6272430419921875, 0.658721923828125, 0.6902008056640625, 0.7216796875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 2.0, 4.0, 8.0, 9.0, 18.0, 35.0, 199.0, 384.0, 231.0, 42.0, 16.0, 15.0, 9.0, 5.0, 4.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1619873046875, -0.157989501953125, -0.15399169921875, -0.149993896484375, -0.14599609375, -0.141998291015625, -0.13800048828125, -0.134002685546875, -0.1300048828125, -0.126007080078125, -0.12200927734375, -0.118011474609375, -0.114013671875, -0.110015869140625, -0.10601806640625, -0.102020263671875, -0.0980224609375, -0.094024658203125, -0.09002685546875, -0.086029052734375, -0.08203125, -0.078033447265625, -0.07403564453125, -0.070037841796875, -0.0660400390625, -0.062042236328125, -0.05804443359375, -0.054046630859375, -0.050048828125, -0.046051025390625, -0.04205322265625, -0.038055419921875, -0.0340576171875, -0.030059814453125, -0.02606201171875, -0.022064208984375, -0.01806640625, -0.014068603515625, -0.01007080078125, -0.006072998046875, -0.0020751953125, 0.001922607421875, 0.00592041015625, 0.009918212890625, 0.013916015625, 0.017913818359375, 0.02191162109375, 0.025909423828125, 0.0299072265625, 0.033905029296875, 0.03790283203125, 0.041900634765625, 0.0458984375, 0.049896240234375, 0.05389404296875, 0.057891845703125, 0.0618896484375, 0.065887451171875, 0.06988525390625, 0.073883056640625, 0.077880859375, 0.081878662109375, 0.08587646484375, 0.089874267578125, 0.0938720703125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 9.0, 9.0, 10.0, 19.0, 24.0, 20.0, 48.0, 63.0, 74.0, 118.0, 176.0, 240.0, 424.0, 593.0, 1125.0, 2133.0, 4698.0, 10864.0, 31460.0, 108809.0, 550931.0, 2781530.0, 548049.0, 103443.0, 29095.0, 10557.0, 4589.0, 2271.0, 1166.0, 690.0, 368.0, 229.0, 167.0, 85.0, 60.0, 36.0, 24.0, 22.0, 16.0, 15.0, 4.0, 4.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0390625, -1.0070953369140625, -0.975128173828125, -0.9431610107421875, -0.91119384765625, -0.8792266845703125, -0.847259521484375, -0.8152923583984375, -0.7833251953125, -0.7513580322265625, -0.719390869140625, -0.6874237060546875, -0.65545654296875, -0.6234893798828125, -0.591522216796875, -0.5595550537109375, -0.527587890625, -0.4956207275390625, -0.463653564453125, -0.4316864013671875, -0.39971923828125, -0.3677520751953125, -0.335784912109375, -0.3038177490234375, -0.2718505859375, -0.2398834228515625, -0.207916259765625, -0.1759490966796875, -0.14398193359375, -0.1120147705078125, -0.080047607421875, -0.0480804443359375, -0.01611328125, 0.0158538818359375, 0.047821044921875, 0.0797882080078125, 0.11175537109375, 0.1437225341796875, 0.175689697265625, 0.2076568603515625, 0.2396240234375, 0.2715911865234375, 0.303558349609375, 0.3355255126953125, 0.36749267578125, 0.3994598388671875, 0.431427001953125, 0.4633941650390625, 0.495361328125, 0.5273284912109375, 0.559295654296875, 0.5912628173828125, 0.62322998046875, 0.6551971435546875, 0.687164306640625, 0.7191314697265625, 0.7510986328125, 0.7830657958984375, 0.815032958984375, 0.8470001220703125, 0.87896728515625, 0.9109344482421875, 0.942901611328125, 0.9748687744140625, 1.0068359375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 4.0, 7.0, 4.0, 12.0, 14.0, 14.0, 22.0, 21.0, 25.0, 33.0, 38.0, 45.0, 61.0, 69.0, 98.0, 138.0, 144.0, 175.0, 215.0, 297.0, 396.0, 614.0, 404.0, 290.0, 206.0, 165.0, 146.0, 88.0, 94.0, 60.0, 44.0, 39.0, 27.0, 23.0, 8.0, 7.0, 10.0, 8.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2174072265625, -0.2105083465576172, -0.20360946655273438, -0.19671058654785156, -0.18981170654296875, -0.18291282653808594, -0.17601394653320312, -0.1691150665283203, -0.1622161865234375, -0.1553173065185547, -0.14841842651367188, -0.14151954650878906, -0.13462066650390625, -0.12772178649902344, -0.12082290649414062, -0.11392402648925781, -0.107025146484375, -0.10012626647949219, -0.09322738647460938, -0.08632850646972656, -0.07942962646484375, -0.07253074645996094, -0.06563186645507812, -0.05873298645019531, -0.0518341064453125, -0.04493522644042969, -0.038036346435546875, -0.031137466430664062, -0.02423858642578125, -0.017339706420898438, -0.010440826416015625, -0.0035419464111328125, 0.00335693359375, 0.010255813598632812, 0.017154693603515625, 0.024053573608398438, 0.03095245361328125, 0.03785133361816406, 0.044750213623046875, 0.05164909362792969, 0.0585479736328125, 0.06544685363769531, 0.07234573364257812, 0.07924461364746094, 0.08614349365234375, 0.09304237365722656, 0.09994125366210938, 0.10684013366699219, 0.113739013671875, 0.12063789367675781, 0.12753677368164062, 0.13443565368652344, 0.14133453369140625, 0.14823341369628906, 0.15513229370117188, 0.1620311737060547, 0.1689300537109375, 0.1758289337158203, 0.18272781372070312, 0.18962669372558594, 0.19652557373046875, 0.20342445373535156, 0.21032333374023438, 0.2172222137451172, 0.22412109375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 9.0, 12.0, 8.0, 17.0, 19.0, 24.0, 42.0, 49.0, 63.0, 78.0, 102.0, 142.0, 123.0, 90.0, 65.0, 41.0, 34.0, 26.0, 11.0, 12.0, 5.0, 4.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-3.8650496006011963, -3.777703046798706, -3.690356731414795, -3.6030101776123047, -3.5156636238098145, -3.428317070007324, -3.340970754623413, -3.253624200820923, -3.1662778854370117, -3.0789313316345215, -2.9915850162506104, -2.90423846244812, -2.81689190864563, -2.7295455932617188, -2.6421990394592285, -2.5548524856567383, -2.467505931854248, -2.380159378051758, -2.2928130626678467, -2.2054665088653564, -2.118119955062866, -2.030773639678955, -1.9434270858764648, -1.8560805320739746, -1.768734097480774, -1.6813876628875732, -1.594041109085083, -1.5066946744918823, -1.4193482398986816, -1.3320016860961914, -1.2446552515029907, -1.15730881690979, -1.0699620246887207, -0.9826155304908752, -0.8952690362930298, -0.8079226016998291, -0.7205761075019836, -0.6332296133041382, -0.5458831787109375, -0.45853668451309204, -0.3711901903152466, -0.2838436961174011, -0.19649723172187805, -0.10915076732635498, -0.02180427312850952, 0.06554222106933594, 0.15288865566253662, 0.24023514986038208, 0.32758164405822754, 0.414928138256073, 0.5022746324539185, 0.5896210670471191, 0.6769675612449646, 0.7643140554428101, 0.8516604900360107, 0.9390069842338562, 1.0263534784317017, 1.1136999130249023, 1.2010464668273926, 1.2883929014205933, 1.375739336013794, 1.4630858898162842, 1.5504323244094849, 1.6377787590026855, 1.7251253128051758]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 2.0, 6.0, 10.0, 8.0, 6.0, 9.0, 13.0, 12.0, 13.0, 14.0, 22.0, 20.0, 20.0, 35.0, 33.0, 37.0, 29.0, 49.0, 50.0, 47.0, 38.0, 33.0, 31.0, 36.0, 51.0, 53.0, 28.0, 44.0, 38.0, 27.0, 25.0, 17.0, 30.0, 22.0, 15.0, 15.0, 15.0, 9.0, 4.0, 7.0, 10.0, 5.0, 1.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.650987148284912, -1.5945276021957397, -1.5380679368972778, -1.4816083908081055, -1.425148844718933, -1.3686892986297607, -1.3122296333312988, -1.2557700872421265, -1.199310541152954, -1.1428509950637817, -1.0863913297653198, -1.0299317836761475, -0.9734722375869751, -0.917012631893158, -0.8605530261993408, -0.8040934801101685, -0.7476338148117065, -0.6911742091178894, -0.634714663028717, -0.5782550573348999, -0.5217955112457275, -0.4653359055519104, -0.40887629985809326, -0.3524167239665985, -0.29595714807510376, -0.239497572183609, -0.18303798139095306, -0.12657839059829712, -0.07011881470680237, -0.013659238815307617, 0.04280036687850952, 0.09925994277000427, 0.15571951866149902, 0.21217909455299377, 0.2686386704444885, 0.32509827613830566, 0.3815578520298004, 0.43801742792129517, 0.4944770336151123, 0.5509365797042847, 0.6073961853981018, 0.663855791091919, 0.7203153371810913, 0.7767749428749084, 0.8332345485687256, 0.889694094657898, 0.9461537003517151, 1.0026133060455322, 1.0590728521347046, 1.115532398223877, 1.1719920635223389, 1.2284516096115112, 1.2849111557006836, 1.3413708209991455, 1.3978303670883179, 1.4542899131774902, 1.5107495784759521, 1.5672091245651245, 1.6236687898635864, 1.6801283359527588, 1.7365878820419312, 1.7930474281311035, 1.8495070934295654, 1.9059666395187378, 1.9624261856079102]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 8.0, 15.0, 18.0, 19.0, 40.0, 67.0, 111.0, 165.0, 276.0, 605.0, 1181.0, 2585.0, 7520.0, 34849.0, 530043.0, 429170.0, 30072.0, 6936.0, 2507.0, 1123.0, 538.0, 274.0, 156.0, 91.0, 53.0, 36.0, 38.0, 16.0, 14.0, 5.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.416015625, -1.3687591552734375, -1.321502685546875, -1.2742462158203125, -1.22698974609375, -1.1797332763671875, -1.132476806640625, -1.0852203369140625, -1.0379638671875, -0.9907073974609375, -0.943450927734375, -0.8961944580078125, -0.84893798828125, -0.8016815185546875, -0.754425048828125, -0.7071685791015625, -0.659912109375, -0.6126556396484375, -0.565399169921875, -0.5181427001953125, -0.47088623046875, -0.4236297607421875, -0.376373291015625, -0.3291168212890625, -0.2818603515625, -0.2346038818359375, -0.187347412109375, -0.1400909423828125, -0.09283447265625, -0.0455780029296875, 0.001678466796875, 0.0489349365234375, 0.09619140625, 0.1434478759765625, 0.190704345703125, 0.2379608154296875, 0.28521728515625, 0.3324737548828125, 0.379730224609375, 0.4269866943359375, 0.4742431640625, 0.5214996337890625, 0.568756103515625, 0.6160125732421875, 0.66326904296875, 0.7105255126953125, 0.757781982421875, 0.8050384521484375, 0.852294921875, 0.8995513916015625, 0.946807861328125, 0.9940643310546875, 1.04132080078125, 1.0885772705078125, 1.135833740234375, 1.1830902099609375, 1.2303466796875, 1.2776031494140625, 1.324859619140625, 1.3721160888671875, 1.41937255859375, 1.4666290283203125, 1.513885498046875, 1.5611419677734375, 1.6083984375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 1.0, 4.0, 6.0, 9.0, 5.0, 17.0, 23.0, 36.0, 72.0, 103.0, 110.0, 155.0, 134.0, 111.0, 76.0, 53.0, 29.0, 18.0, 15.0, 7.0, 3.0, 2.0, 3.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15234375, -0.1483001708984375, -0.144256591796875, -0.1402130126953125, -0.13616943359375, -0.1321258544921875, -0.128082275390625, -0.1240386962890625, -0.1199951171875, -0.1159515380859375, -0.111907958984375, -0.1078643798828125, -0.10382080078125, -0.0997772216796875, -0.095733642578125, -0.0916900634765625, -0.087646484375, -0.0836029052734375, -0.079559326171875, -0.0755157470703125, -0.07147216796875, -0.0674285888671875, -0.063385009765625, -0.0593414306640625, -0.0552978515625, -0.0512542724609375, -0.047210693359375, -0.0431671142578125, -0.03912353515625, -0.0350799560546875, -0.031036376953125, -0.0269927978515625, -0.02294921875, -0.0189056396484375, -0.014862060546875, -0.0108184814453125, -0.00677490234375, -0.0027313232421875, 0.001312255859375, 0.0053558349609375, 0.0093994140625, 0.0134429931640625, 0.017486572265625, 0.0215301513671875, 0.02557373046875, 0.0296173095703125, 0.033660888671875, 0.0377044677734375, 0.041748046875, 0.0457916259765625, 0.049835205078125, 0.0538787841796875, 0.05792236328125, 0.0619659423828125, 0.066009521484375, 0.0700531005859375, 0.0740966796875, 0.0781402587890625, 0.082183837890625, 0.0862274169921875, 0.09027099609375, 0.0943145751953125, 0.098358154296875, 0.1024017333984375, 0.1064453125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 7.0, 7.0, 13.0, 10.0, 24.0, 28.0, 30.0, 51.0, 68.0, 121.0, 162.0, 242.0, 435.0, 790.0, 1367.0, 2757.0, 6370.0, 19016.0, 89622.0, 625242.0, 246932.0, 36441.0, 10342.0, 4067.0, 1909.0, 995.0, 537.0, 310.0, 187.0, 135.0, 115.0, 67.0, 37.0, 41.0, 18.0, 17.0, 9.0, 8.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1181640625, -1.08056640625, -1.04296875, -1.00537109375, -0.9677734375, -0.93017578125, -0.892578125, -0.85498046875, -0.8173828125, -0.77978515625, -0.7421875, -0.70458984375, -0.6669921875, -0.62939453125, -0.591796875, -0.55419921875, -0.5166015625, -0.47900390625, -0.44140625, -0.40380859375, -0.3662109375, -0.32861328125, -0.291015625, -0.25341796875, -0.2158203125, -0.17822265625, -0.140625, -0.10302734375, -0.0654296875, -0.02783203125, 0.009765625, 0.04736328125, 0.0849609375, 0.12255859375, 0.16015625, 0.19775390625, 0.2353515625, 0.27294921875, 0.310546875, 0.34814453125, 0.3857421875, 0.42333984375, 0.4609375, 0.49853515625, 0.5361328125, 0.57373046875, 0.611328125, 0.64892578125, 0.6865234375, 0.72412109375, 0.76171875, 0.79931640625, 0.8369140625, 0.87451171875, 0.912109375, 0.94970703125, 0.9873046875, 1.02490234375, 1.0625, 1.10009765625, 1.1376953125, 1.17529296875, 1.212890625, 1.25048828125, 1.2880859375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 7.0, 9.0, 6.0, 17.0, 11.0, 21.0, 16.0, 21.0, 27.0, 36.0, 30.0, 29.0, 43.0, 47.0, 48.0, 56.0, 45.0, 53.0, 51.0, 55.0, 42.0, 28.0, 44.0, 43.0, 36.0, 24.0, 31.0, 16.0, 25.0, 16.0, 15.0, 17.0, 7.0, 9.0, 4.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.6533203125, -0.6349334716796875, -0.616546630859375, -0.5981597900390625, -0.57977294921875, -0.5613861083984375, -0.542999267578125, -0.5246124267578125, -0.5062255859375, -0.4878387451171875, -0.469451904296875, -0.4510650634765625, -0.43267822265625, -0.4142913818359375, -0.395904541015625, -0.3775177001953125, -0.359130859375, -0.3407440185546875, -0.322357177734375, -0.3039703369140625, -0.28558349609375, -0.2671966552734375, -0.248809814453125, -0.2304229736328125, -0.2120361328125, -0.1936492919921875, -0.175262451171875, -0.1568756103515625, -0.13848876953125, -0.1201019287109375, -0.101715087890625, -0.0833282470703125, -0.06494140625, -0.0465545654296875, -0.028167724609375, -0.0097808837890625, 0.00860595703125, 0.0269927978515625, 0.045379638671875, 0.0637664794921875, 0.0821533203125, 0.1005401611328125, 0.118927001953125, 0.1373138427734375, 0.15570068359375, 0.1740875244140625, 0.192474365234375, 0.2108612060546875, 0.229248046875, 0.2476348876953125, 0.266021728515625, 0.2844085693359375, 0.30279541015625, 0.3211822509765625, 0.339569091796875, 0.3579559326171875, 0.3763427734375, 0.3947296142578125, 0.413116455078125, 0.4315032958984375, 0.44989013671875, 0.4682769775390625, 0.486663818359375, 0.5050506591796875, 0.5234375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 8.0, 5.0, 15.0, 18.0, 29.0, 59.0, 66.0, 152.0, 318.0, 969.0, 5229.0, 950711.0, 86874.0, 2881.0, 648.0, 243.0, 130.0, 67.0, 47.0, 19.0, 18.0, 15.0, 10.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.90625, -7.66558837890625, -7.4249267578125, -7.18426513671875, -6.943603515625, -6.70294189453125, -6.4622802734375, -6.22161865234375, -5.98095703125, -5.74029541015625, -5.4996337890625, -5.25897216796875, -5.018310546875, -4.77764892578125, -4.5369873046875, -4.29632568359375, -4.0556640625, -3.81500244140625, -3.5743408203125, -3.33367919921875, -3.093017578125, -2.85235595703125, -2.6116943359375, -2.37103271484375, -2.13037109375, -1.88970947265625, -1.6490478515625, -1.40838623046875, -1.167724609375, -0.92706298828125, -0.6864013671875, -0.44573974609375, -0.205078125, 0.03558349609375, 0.2762451171875, 0.51690673828125, 0.757568359375, 0.99822998046875, 1.2388916015625, 1.47955322265625, 1.72021484375, 1.96087646484375, 2.2015380859375, 2.44219970703125, 2.682861328125, 2.92352294921875, 3.1641845703125, 3.40484619140625, 3.6455078125, 3.88616943359375, 4.1268310546875, 4.36749267578125, 4.608154296875, 4.84881591796875, 5.0894775390625, 5.33013916015625, 5.57080078125, 5.81146240234375, 6.0521240234375, 6.29278564453125, 6.533447265625, 6.77410888671875, 7.0147705078125, 7.25543212890625, 7.49609375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 9.0, 7.0, 8.0, 10.0, 18.0, 21.0, 43.0, 73.0, 86.0, 125.0, 169.0, 149.0, 114.0, 64.0, 47.0, 31.0, 17.0, 11.0, 4.0, 2.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00023925304412841797, -0.00023365672677755356, -0.00022806040942668915, -0.00022246409207582474, -0.00021686777472496033, -0.00021127145737409592, -0.0002056751400232315, -0.0002000788226723671, -0.00019448250532150269, -0.00018888618797063828, -0.00018328987061977386, -0.00017769355326890945, -0.00017209723591804504, -0.00016650091856718063, -0.00016090460121631622, -0.0001553082838654518, -0.0001497119665145874, -0.000144115649163723, -0.00013851933181285858, -0.00013292301446199417, -0.00012732669711112976, -0.00012173037976026535, -0.00011613406240940094, -0.00011053774505853653, -0.00010494142770767212, -9.934511035680771e-05, -9.37487930059433e-05, -8.815247565507889e-05, -8.255615830421448e-05, -7.695984095335007e-05, -7.136352360248566e-05, -6.576720625162125e-05, -6.0170888900756836e-05, -5.4574571549892426e-05, -4.8978254199028015e-05, -4.3381936848163605e-05, -3.7785619497299194e-05, -3.2189302146434784e-05, -2.6592984795570374e-05, -2.0996667444705963e-05, -1.5400350093841553e-05, -9.804032742977142e-06, -4.207715392112732e-06, 1.3886019587516785e-06, 6.984919309616089e-06, 1.25812366604805e-05, 1.817755401134491e-05, 2.377387136220932e-05, 2.937018871307373e-05, 3.496650606393814e-05, 4.056282341480255e-05, 4.615914076566696e-05, 5.175545811653137e-05, 5.735177546739578e-05, 6.294809281826019e-05, 6.85444101691246e-05, 7.414072751998901e-05, 7.973704487085342e-05, 8.533336222171783e-05, 9.092967957258224e-05, 9.652599692344666e-05, 0.00010212231427431107, 0.00010771863162517548, 0.00011331494897603989, 0.0001189112663269043]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 8.0, 5.0, 1.0, 7.0, 3.0, 14.0, 9.0, 17.0, 19.0, 36.0, 61.0, 90.0, 122.0, 184.0, 319.0, 613.0, 1388.0, 4038.0, 18102.0, 595399.0, 405461.0, 16147.0, 3714.0, 1396.0, 580.0, 302.0, 200.0, 106.0, 60.0, 56.0, 24.0, 16.0, 16.0, 16.0, 11.0, 9.0, 5.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.2734375, -3.17413330078125, -3.0748291015625, -2.97552490234375, -2.876220703125, -2.77691650390625, -2.6776123046875, -2.57830810546875, -2.47900390625, -2.37969970703125, -2.2803955078125, -2.18109130859375, -2.081787109375, -1.98248291015625, -1.8831787109375, -1.78387451171875, -1.6845703125, -1.58526611328125, -1.4859619140625, -1.38665771484375, -1.287353515625, -1.18804931640625, -1.0887451171875, -0.98944091796875, -0.89013671875, -0.79083251953125, -0.6915283203125, -0.59222412109375, -0.492919921875, -0.39361572265625, -0.2943115234375, -0.19500732421875, -0.095703125, 0.00360107421875, 0.1029052734375, 0.20220947265625, 0.301513671875, 0.40081787109375, 0.5001220703125, 0.59942626953125, 0.69873046875, 0.79803466796875, 0.8973388671875, 0.99664306640625, 1.095947265625, 1.19525146484375, 1.2945556640625, 1.39385986328125, 1.4931640625, 1.59246826171875, 1.6917724609375, 1.79107666015625, 1.890380859375, 1.98968505859375, 2.0889892578125, 2.18829345703125, 2.28759765625, 2.38690185546875, 2.4862060546875, 2.58551025390625, 2.684814453125, 2.78411865234375, 2.8834228515625, 2.98272705078125, 3.08203125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 6.0, 1.0, 6.0, 10.0, 26.0, 33.0, 100.0, 195.0, 260.0, 214.0, 85.0, 39.0, 11.0, 4.0, 2.0, 1.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.84375, -1.77386474609375, -1.7039794921875, -1.63409423828125, -1.564208984375, -1.49432373046875, -1.4244384765625, -1.35455322265625, -1.28466796875, -1.21478271484375, -1.1448974609375, -1.07501220703125, -1.005126953125, -0.93524169921875, -0.8653564453125, -0.79547119140625, -0.7255859375, -0.65570068359375, -0.5858154296875, -0.51593017578125, -0.446044921875, -0.37615966796875, -0.3062744140625, -0.23638916015625, -0.16650390625, -0.09661865234375, -0.0267333984375, 0.04315185546875, 0.113037109375, 0.18292236328125, 0.2528076171875, 0.32269287109375, 0.392578125, 0.46246337890625, 0.5323486328125, 0.60223388671875, 0.672119140625, 0.74200439453125, 0.8118896484375, 0.88177490234375, 0.95166015625, 1.02154541015625, 1.0914306640625, 1.16131591796875, 1.231201171875, 1.30108642578125, 1.3709716796875, 1.44085693359375, 1.5107421875, 1.58062744140625, 1.6505126953125, 1.72039794921875, 1.790283203125, 1.86016845703125, 1.9300537109375, 1.99993896484375, 2.06982421875, 2.13970947265625, 2.2095947265625, 2.27947998046875, 2.349365234375, 2.41925048828125, 2.4891357421875, 2.55902099609375, 2.62890625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 2.0, 3.0, 5.0, 4.0, 8.0, 16.0, 55.0, 156.0, 338.0, 245.0, 98.0, 39.0, 14.0, 9.0, 10.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.008712768554688, -17.489585876464844, -16.970458984375, -16.451332092285156, -15.932205200195312, -15.413078308105469, -14.893951416015625, -14.374824523925781, -13.855697631835938, -13.336570739746094, -12.81744384765625, -12.298316955566406, -11.779190063476562, -11.260063171386719, -10.740936279296875, -10.221809387207031, -9.702681541442871, -9.183554649353027, -8.664427757263184, -8.14530086517334, -7.626173973083496, -7.107047080993652, -6.58791971206665, -6.068792819976807, -5.549665927886963, -5.030539035797119, -4.511412143707275, -3.9922850131988525, -3.473158121109009, -2.954031229019165, -2.434904098510742, -1.9157772064208984, -1.3966503143310547, -0.8775233626365662, -0.35839641094207764, 0.16073060035705566, 0.6798574924468994, 1.1989843845367432, 1.718111515045166, 2.2372384071350098, 2.7563652992248535, 3.2754921913146973, 3.794619083404541, 4.313746452331543, 4.832873344421387, 5.3520002365112305, 5.871127128601074, 6.390254020690918, 6.909380912780762, 7.4285078048706055, 7.947634696960449, 8.466761589050293, 8.985888481140137, 9.50501537322998, 10.02414321899414, 10.543270111083984, 11.062397003173828, 11.581523895263672, 12.100650787353516, 12.61977767944336, 13.138904571533203, 13.658031463623047, 14.17715835571289, 14.696285247802734, 15.215412139892578]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 11.0, 5.0, 5.0, 9.0, 16.0, 39.0, 54.0, 76.0, 159.0, 158.0, 158.0, 113.0, 80.0, 52.0, 27.0, 14.0, 10.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.976655006408691, -13.551311492919922, -13.125967025756836, -12.700623512268066, -12.275279998779297, -11.849935531616211, -11.424592018127441, -10.999248504638672, -10.573904037475586, -10.148560523986816, -9.72321605682373, -9.297872543334961, -8.872528076171875, -8.447184562683105, -8.021841049194336, -7.596497058868408, -7.1711530685424805, -6.745809078216553, -6.320465087890625, -5.8951215744018555, -5.469777584075928, -5.04443359375, -4.6190900802612305, -4.193746089935303, -3.768402099609375, -3.3430581092834473, -2.9177143573760986, -2.49237060546875, -2.0670266151428223, -1.6416826248168945, -1.216338872909546, -0.7909951210021973, -0.36565208435058594, 0.059691786766052246, 0.48503565788269043, 0.9103795289993286, 1.3357234001159668, 1.7610673904418945, 2.186411142349243, 2.611754894256592, 3.0370988845825195, 3.4624428749084473, 3.887786626815796, 4.3131303787231445, 4.738474369049072, 5.163818359375, 5.5891618728637695, 6.014505863189697, 6.439849853515625, 6.865193843841553, 7.2905378341674805, 7.71588134765625, 8.141225814819336, 8.566569328308105, 8.991912841796875, 9.417257308959961, 9.84260082244873, 10.2679443359375, 10.693288803100586, 11.118632316589355, 11.543975830078125, 11.969320297241211, 12.39466381072998, 12.82000732421875, 13.245351791381836]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 9.0, 26.0, 44.0, 171.0, 1411.0, 133270.0, 4055506.0, 3380.0, 294.0, 76.0, 31.0, 18.0, 8.0, 9.0, 3.0, 8.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.296875, -7.83984375, -7.3828125, -6.92578125, -6.46875, -6.01171875, -5.5546875, -5.09765625, -4.640625, -4.18359375, -3.7265625, -3.26953125, -2.8125, -2.35546875, -1.8984375, -1.44140625, -0.984375, -0.52734375, -0.0703125, 0.38671875, 0.84375, 1.30078125, 1.7578125, 2.21484375, 2.671875, 3.12890625, 3.5859375, 4.04296875, 4.5, 4.95703125, 5.4140625, 5.87109375, 6.328125, 6.78515625, 7.2421875, 7.69921875, 8.15625, 8.61328125, 9.0703125, 9.52734375, 9.984375, 10.44140625, 10.8984375, 11.35546875, 11.8125, 12.26953125, 12.7265625, 13.18359375, 13.640625, 14.09765625, 14.5546875, 15.01171875, 15.46875, 15.92578125, 16.3828125, 16.83984375, 17.296875, 17.75390625, 18.2109375, 18.66796875, 19.125, 19.58203125, 20.0390625, 20.49609375, 20.953125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 11.0, 2.0, 5.0, 3.0, 13.0, 19.0, 17.0, 32.0, 49.0, 50.0, 86.0, 99.0, 117.0, 99.0, 82.0, 85.0, 69.0, 51.0, 37.0, 26.0, 11.0, 9.0, 10.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1285400390625, -0.12523555755615234, -0.12193107604980469, -0.11862659454345703, -0.11532211303710938, -0.11201763153076172, -0.10871315002441406, -0.1054086685180664, -0.10210418701171875, -0.0987997055053711, -0.09549522399902344, -0.09219074249267578, -0.08888626098632812, -0.08558177947998047, -0.08227729797363281, -0.07897281646728516, -0.0756683349609375, -0.07236385345458984, -0.06905937194824219, -0.06575489044189453, -0.062450408935546875, -0.05914592742919922, -0.05584144592285156, -0.052536964416503906, -0.04923248291015625, -0.045928001403808594, -0.04262351989746094, -0.03931903839111328, -0.036014556884765625, -0.03271007537841797, -0.029405593872070312, -0.026101112365722656, -0.022796630859375, -0.019492149353027344, -0.016187667846679688, -0.012883186340332031, -0.009578704833984375, -0.006274223327636719, -0.0029697418212890625, 0.00033473968505859375, 0.00363922119140625, 0.006943702697753906, 0.010248184204101562, 0.013552665710449219, 0.016857147216796875, 0.02016162872314453, 0.023466110229492188, 0.026770591735839844, 0.0300750732421875, 0.033379554748535156, 0.03668403625488281, 0.03998851776123047, 0.043292999267578125, 0.04659748077392578, 0.04990196228027344, 0.053206443786621094, 0.05651092529296875, 0.059815406799316406, 0.06311988830566406, 0.06642436981201172, 0.06972885131835938, 0.07303333282470703, 0.07633781433105469, 0.07964229583740234, 0.08294677734375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 17.0, 22.0, 54.0, 90.0, 216.0, 508.0, 2311.0, 34531.0, 3841955.0, 304917.0, 8651.0, 795.0, 155.0, 30.0, 16.0, 9.0, 7.0, 2.0, 0.0, 2.0], "bins": [-11.3203125, -11.105804443359375, -10.89129638671875, -10.676788330078125, -10.4622802734375, -10.247772216796875, -10.03326416015625, -9.818756103515625, -9.604248046875, -9.389739990234375, -9.17523193359375, -8.960723876953125, -8.7462158203125, -8.531707763671875, -8.31719970703125, -8.102691650390625, -7.88818359375, -7.673675537109375, -7.45916748046875, -7.244659423828125, -7.0301513671875, -6.815643310546875, -6.60113525390625, -6.386627197265625, -6.172119140625, -5.957611083984375, -5.74310302734375, -5.528594970703125, -5.3140869140625, -5.099578857421875, -4.88507080078125, -4.670562744140625, -4.4560546875, -4.241546630859375, -4.02703857421875, -3.812530517578125, -3.5980224609375, -3.383514404296875, -3.16900634765625, -2.954498291015625, -2.739990234375, -2.525482177734375, -2.31097412109375, -2.096466064453125, -1.8819580078125, -1.667449951171875, -1.45294189453125, -1.238433837890625, -1.02392578125, -0.809417724609375, -0.59490966796875, -0.380401611328125, -0.1658935546875, 0.048614501953125, 0.26312255859375, 0.477630615234375, 0.692138671875, 0.906646728515625, 1.12115478515625, 1.335662841796875, 1.5501708984375, 1.764678955078125, 1.97918701171875, 2.193695068359375, 2.408203125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 10.0, 8.0, 8.0, 10.0, 11.0, 9.0, 17.0, 29.0, 26.0, 29.0, 36.0, 61.0, 91.0, 111.0, 142.0, 259.0, 691.0, 1229.0, 411.0, 211.0, 163.0, 117.0, 86.0, 62.0, 56.0, 38.0, 30.0, 26.0, 16.0, 18.0, 14.0, 12.0, 9.0, 4.0, 4.0, 8.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2376708984375, -0.23098182678222656, -0.22429275512695312, -0.2176036834716797, -0.21091461181640625, -0.2042255401611328, -0.19753646850585938, -0.19084739685058594, -0.1841583251953125, -0.17746925354003906, -0.17078018188476562, -0.1640911102294922, -0.15740203857421875, -0.1507129669189453, -0.14402389526367188, -0.13733482360839844, -0.130645751953125, -0.12395668029785156, -0.11726760864257812, -0.11057853698730469, -0.10388946533203125, -0.09720039367675781, -0.09051132202148438, -0.08382225036621094, -0.0771331787109375, -0.07044410705566406, -0.06375503540039062, -0.05706596374511719, -0.05037689208984375, -0.04368782043457031, -0.036998748779296875, -0.030309677124023438, -0.02362060546875, -0.016931533813476562, -0.010242462158203125, -0.0035533905029296875, 0.00313568115234375, 0.009824752807617188, 0.016513824462890625, 0.023202896118164062, 0.0298919677734375, 0.03658103942871094, 0.043270111083984375, 0.04995918273925781, 0.05664825439453125, 0.06333732604980469, 0.07002639770507812, 0.07671546936035156, 0.083404541015625, 0.09009361267089844, 0.09678268432617188, 0.10347175598144531, 0.11016082763671875, 0.11684989929199219, 0.12353897094726562, 0.13022804260253906, 0.1369171142578125, 0.14360618591308594, 0.15029525756835938, 0.1569843292236328, 0.16367340087890625, 0.1703624725341797, 0.17705154418945312, 0.18374061584472656, 0.1904296875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 11.0, 135.0, 804.0, 64.0, 1.0, 2.0, 1.0, 1.0], "bins": [-49.348167419433594, -48.50278854370117, -47.65740966796875, -46.81203079223633, -45.966651916503906, -45.12126922607422, -44.2758903503418, -43.430511474609375, -42.58513259887695, -41.73975372314453, -40.89437484741211, -40.04899597167969, -39.20361328125, -38.35823440551758, -37.512855529785156, -36.667476654052734, -35.82209777832031, -34.97671890258789, -34.13134002685547, -33.28596115112305, -32.440582275390625, -31.59520149230957, -30.749820709228516, -29.904441833496094, -29.059062957763672, -28.21368408203125, -27.368305206298828, -26.522924423217773, -25.67754554748535, -24.83216667175293, -23.986785888671875, -23.141407012939453, -22.29602813720703, -21.45064926147461, -20.605270385742188, -19.759889602661133, -18.91451072692871, -18.06913185119629, -17.223751068115234, -16.378372192382812, -15.532992362976074, -14.687612533569336, -13.842233657836914, -12.996854782104492, -12.151474952697754, -11.306095123291016, -10.460716247558594, -9.615337371826172, -8.769957542419434, -7.9245781898498535, -7.079198837280273, -6.233819484710693, -5.388440132141113, -4.543060779571533, -3.697681427001953, -2.852302074432373, -2.006922721862793, -1.161543369293213, -0.3161640167236328, 0.5292153358459473, 1.3745946884155273, 2.2199740409851074, 3.0653533935546875, 3.9107327461242676, 4.756112098693848]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 6.0, 9.0, 9.0, 6.0, 7.0, 22.0, 31.0, 31.0, 57.0, 60.0, 71.0, 64.0, 94.0, 79.0, 70.0, 87.0, 66.0, 55.0, 47.0, 42.0, 26.0, 24.0, 17.0, 10.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.5356924533843994, -2.4734723567962646, -2.411252021789551, -2.349031925201416, -2.2868118286132812, -2.2245917320251465, -2.1623713970184326, -2.100151300430298, -2.037930965423584, -1.9757107496261597, -1.913490653038025, -1.8512704372406006, -1.7890503406524658, -1.7268301248550415, -1.6646099090576172, -1.6023898124694824, -1.5401697158813477, -1.4779495000839233, -1.4157294034957886, -1.3535091876983643, -1.2912890911102295, -1.2290688753128052, -1.1668486595153809, -1.104628562927246, -1.0424083471298218, -0.9801881909370422, -0.9179680347442627, -0.8557478189468384, -0.7935276627540588, -0.7313075065612793, -0.669087290763855, -0.6068671345710754, -0.5446470975875854, -0.4824269413948059, -0.420206755399704, -0.35798656940460205, -0.2957664132118225, -0.23354625701904297, -0.17132607102394104, -0.10910588502883911, -0.04688572883605957, 0.015334442257881165, 0.0775546133518219, 0.13977478444576263, 0.20199495553970337, 0.2642151117324829, 0.32643529772758484, 0.38865548372268677, 0.4508756399154663, 0.5130957961082458, 0.5753159523010254, 0.6375361680984497, 0.6997563242912292, 0.7619764804840088, 0.8241966962814331, 0.8864168524742126, 0.9486370086669922, 1.0108572244644165, 1.0730773210525513, 1.1352975368499756, 1.1975176334381104, 1.2597378492355347, 1.321958065032959, 1.3841781616210938, 1.446398377418518]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 0.0, 2.0, 2.0, 4.0, 0.0, 7.0, 13.0, 9.0, 15.0, 15.0, 29.0, 41.0, 39.0, 70.0, 97.0, 145.0, 232.0, 418.0, 589.0, 1076.0, 1951.0, 3748.0, 7787.0, 17549.0, 43447.0, 121715.0, 372033.0, 311783.0, 99785.0, 36574.0, 15138.0, 6667.0, 3375.0, 1697.0, 922.0, 542.0, 367.0, 218.0, 124.0, 104.0, 67.0, 42.0, 34.0, 24.0, 19.0, 18.0, 9.0, 7.0, 2.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.103515625, -1.066619873046875, -1.02972412109375, -0.992828369140625, -0.9559326171875, -0.919036865234375, -0.88214111328125, -0.845245361328125, -0.808349609375, -0.771453857421875, -0.73455810546875, -0.697662353515625, -0.6607666015625, -0.623870849609375, -0.58697509765625, -0.550079345703125, -0.51318359375, -0.476287841796875, -0.43939208984375, -0.402496337890625, -0.3656005859375, -0.328704833984375, -0.29180908203125, -0.254913330078125, -0.218017578125, -0.181121826171875, -0.14422607421875, -0.107330322265625, -0.0704345703125, -0.033538818359375, 0.00335693359375, 0.040252685546875, 0.0771484375, 0.114044189453125, 0.15093994140625, 0.187835693359375, 0.2247314453125, 0.261627197265625, 0.29852294921875, 0.335418701171875, 0.372314453125, 0.409210205078125, 0.44610595703125, 0.483001708984375, 0.5198974609375, 0.556793212890625, 0.59368896484375, 0.630584716796875, 0.66748046875, 0.704376220703125, 0.74127197265625, 0.778167724609375, 0.8150634765625, 0.851959228515625, 0.88885498046875, 0.925750732421875, 0.962646484375, 0.999542236328125, 1.03643798828125, 1.073333740234375, 1.1102294921875, 1.147125244140625, 1.18402099609375, 1.220916748046875, 1.2578125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 11.0, 6.0, 8.0, 16.0, 17.0, 23.0, 29.0, 43.0, 44.0, 61.0, 58.0, 61.0, 88.0, 64.0, 78.0, 69.0, 60.0, 38.0, 47.0, 42.0, 37.0, 26.0, 22.0, 10.0, 7.0, 13.0, 5.0, 2.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0870361328125, -0.08407211303710938, -0.08110809326171875, -0.07814407348632812, -0.0751800537109375, -0.07221603393554688, -0.06925201416015625, -0.06628799438476562, -0.063323974609375, -0.060359954833984375, -0.05739593505859375, -0.054431915283203125, -0.0514678955078125, -0.048503875732421875, -0.04553985595703125, -0.042575836181640625, -0.03961181640625, -0.036647796630859375, -0.03368377685546875, -0.030719757080078125, -0.0277557373046875, -0.024791717529296875, -0.02182769775390625, -0.018863677978515625, -0.015899658203125, -0.012935638427734375, -0.00997161865234375, -0.007007598876953125, -0.0040435791015625, -0.001079559326171875, 0.00188446044921875, 0.004848480224609375, 0.0078125, 0.010776519775390625, 0.01374053955078125, 0.016704559326171875, 0.0196685791015625, 0.022632598876953125, 0.02559661865234375, 0.028560638427734375, 0.031524658203125, 0.034488677978515625, 0.03745269775390625, 0.040416717529296875, 0.0433807373046875, 0.046344757080078125, 0.04930877685546875, 0.052272796630859375, 0.05523681640625, 0.058200836181640625, 0.06116485595703125, 0.06412887573242188, 0.0670928955078125, 0.07005691528320312, 0.07302093505859375, 0.07598495483398438, 0.078948974609375, 0.08191299438476562, 0.08487701416015625, 0.08784103393554688, 0.0908050537109375, 0.09376907348632812, 0.09673309326171875, 0.09969711303710938, 0.1026611328125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 1.0, 8.0, 1.0, 9.0, 7.0, 6.0, 9.0, 11.0, 18.0, 19.0, 28.0, 31.0, 52.0, 94.0, 633.0, 12169.0, 993302.0, 40843.0, 987.0, 106.0, 53.0, 34.0, 37.0, 24.0, 11.0, 15.0, 10.0, 7.0, 10.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0390625, -5.85394287109375, -5.6688232421875, -5.48370361328125, -5.298583984375, -5.11346435546875, -4.9283447265625, -4.74322509765625, -4.55810546875, -4.37298583984375, -4.1878662109375, -4.00274658203125, -3.817626953125, -3.63250732421875, -3.4473876953125, -3.26226806640625, -3.0771484375, -2.89202880859375, -2.7069091796875, -2.52178955078125, -2.336669921875, -2.15155029296875, -1.9664306640625, -1.78131103515625, -1.59619140625, -1.41107177734375, -1.2259521484375, -1.04083251953125, -0.855712890625, -0.67059326171875, -0.4854736328125, -0.30035400390625, -0.115234375, 0.06988525390625, 0.2550048828125, 0.44012451171875, 0.625244140625, 0.81036376953125, 0.9954833984375, 1.18060302734375, 1.36572265625, 1.55084228515625, 1.7359619140625, 1.92108154296875, 2.106201171875, 2.29132080078125, 2.4764404296875, 2.66156005859375, 2.8466796875, 3.03179931640625, 3.2169189453125, 3.40203857421875, 3.587158203125, 3.77227783203125, 3.9573974609375, 4.14251708984375, 4.32763671875, 4.51275634765625, 4.6978759765625, 4.88299560546875, 5.068115234375, 5.25323486328125, 5.4383544921875, 5.62347412109375, 5.80859375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 6.0, 3.0, 6.0, 7.0, 7.0, 9.0, 11.0, 17.0, 21.0, 24.0, 24.0, 26.0, 33.0, 42.0, 52.0, 36.0, 45.0, 49.0, 51.0, 53.0, 56.0, 44.0, 33.0, 46.0, 48.0, 43.0, 35.0, 25.0, 18.0, 26.0, 22.0, 26.0, 10.0, 13.0, 8.0, 8.0, 8.0, 8.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.394775390625, -0.3811302185058594, -0.36748504638671875, -0.3538398742675781, -0.3401947021484375, -0.3265495300292969, -0.31290435791015625, -0.2992591857910156, -0.285614013671875, -0.2719688415527344, -0.25832366943359375, -0.24467849731445312, -0.2310333251953125, -0.21738815307617188, -0.20374298095703125, -0.19009780883789062, -0.17645263671875, -0.16280746459960938, -0.14916229248046875, -0.13551712036132812, -0.1218719482421875, -0.10822677612304688, -0.09458160400390625, -0.08093643188476562, -0.067291259765625, -0.053646087646484375, -0.04000091552734375, -0.026355743408203125, -0.0127105712890625, 0.000934600830078125, 0.01457977294921875, 0.028224945068359375, 0.0418701171875, 0.055515289306640625, 0.06916046142578125, 0.08280563354492188, 0.0964508056640625, 0.11009597778320312, 0.12374114990234375, 0.13738632202148438, 0.151031494140625, 0.16467666625976562, 0.17832183837890625, 0.19196701049804688, 0.2056121826171875, 0.21925735473632812, 0.23290252685546875, 0.24654769897460938, 0.26019287109375, 0.2738380432128906, 0.28748321533203125, 0.3011283874511719, 0.3147735595703125, 0.3284187316894531, 0.34206390380859375, 0.3557090759277344, 0.369354248046875, 0.3829994201660156, 0.39664459228515625, 0.4102897644042969, 0.4239349365234375, 0.4375801086425781, 0.45122528076171875, 0.4648704528808594, 0.478515625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 4.0, 4.0, 12.0, 10.0, 12.0, 25.0, 27.0, 70.0, 152.0, 1478.0, 966717.0, 79038.0, 709.0, 115.0, 65.0, 27.0, 28.0, 16.0, 7.0, 12.0, 7.0, 2.0, 8.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.34375, -16.799560546875, -16.25537109375, -15.711181640625, -15.1669921875, -14.622802734375, -14.07861328125, -13.534423828125, -12.990234375, -12.446044921875, -11.90185546875, -11.357666015625, -10.8134765625, -10.269287109375, -9.72509765625, -9.180908203125, -8.63671875, -8.092529296875, -7.54833984375, -7.004150390625, -6.4599609375, -5.915771484375, -5.37158203125, -4.827392578125, -4.283203125, -3.739013671875, -3.19482421875, -2.650634765625, -2.1064453125, -1.562255859375, -1.01806640625, -0.473876953125, 0.0703125, 0.614501953125, 1.15869140625, 1.702880859375, 2.2470703125, 2.791259765625, 3.33544921875, 3.879638671875, 4.423828125, 4.968017578125, 5.51220703125, 6.056396484375, 6.6005859375, 7.144775390625, 7.68896484375, 8.233154296875, 8.77734375, 9.321533203125, 9.86572265625, 10.409912109375, 10.9541015625, 11.498291015625, 12.04248046875, 12.586669921875, 13.130859375, 13.675048828125, 14.21923828125, 14.763427734375, 15.3076171875, 15.851806640625, 16.39599609375, 16.940185546875, 17.484375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 7.0, 6.0, 15.0, 19.0, 49.0, 101.0, 271.0, 280.0, 115.0, 46.0, 24.0, 20.0, 12.0, 8.0, 10.0, 5.0, 6.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0005211830139160156, -0.0005038455128669739, -0.00048650801181793213, -0.0004691705107688904, -0.00045183300971984863, -0.0004344955086708069, -0.00041715800762176514, -0.0003998205065727234, -0.00038248300552368164, -0.0003651455044746399, -0.00034780800342559814, -0.0003304705023765564, -0.00031313300132751465, -0.0002957955002784729, -0.00027845799922943115, -0.0002611204981803894, -0.00024378299713134766, -0.0002264454960823059, -0.00020910799503326416, -0.0001917704939842224, -0.00017443299293518066, -0.00015709549188613892, -0.00013975799083709717, -0.00012242048978805542, -0.00010508298873901367, -8.774548768997192e-05, -7.040798664093018e-05, -5.307048559188843e-05, -3.573298454284668e-05, -1.839548349380493e-05, -1.0579824447631836e-06, 1.6279518604278564e-05, 3.361701965332031e-05, 5.095452070236206e-05, 6.829202175140381e-05, 8.562952280044556e-05, 0.0001029670238494873, 0.00012030452489852905, 0.0001376420259475708, 0.00015497952699661255, 0.0001723170280456543, 0.00018965452909469604, 0.0002069920301437378, 0.00022432953119277954, 0.0002416670322418213, 0.00025900453329086304, 0.0002763420343399048, 0.00029367953538894653, 0.0003110170364379883, 0.00032835453748703003, 0.0003456920385360718, 0.0003630295395851135, 0.0003803670406341553, 0.000397704541683197, 0.00041504204273223877, 0.0004323795437812805, 0.00044971704483032227, 0.000467054545879364, 0.00048439204692840576, 0.0005017295479774475, 0.0005190670490264893, 0.000536404550075531, 0.0005537420511245728, 0.0005710795521736145, 0.0005884170532226562]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 8.0, 8.0, 13.0, 24.0, 37.0, 34.0, 63.0, 88.0, 136.0, 224.0, 322.0, 507.0, 859.0, 1583.0, 3035.0, 7240.0, 18806.0, 68627.0, 677885.0, 210570.0, 36169.0, 12133.0, 4898.0, 2345.0, 1163.0, 677.0, 394.0, 225.0, 161.0, 105.0, 80.0, 33.0, 24.0, 18.0, 20.0, 8.0, 5.0, 3.0, 3.0, 5.0, 5.0, 5.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.09765625, -3.96868896484375, -3.8397216796875, -3.71075439453125, -3.581787109375, -3.45281982421875, -3.3238525390625, -3.19488525390625, -3.06591796875, -2.93695068359375, -2.8079833984375, -2.67901611328125, -2.550048828125, -2.42108154296875, -2.2921142578125, -2.16314697265625, -2.0341796875, -1.90521240234375, -1.7762451171875, -1.64727783203125, -1.518310546875, -1.38934326171875, -1.2603759765625, -1.13140869140625, -1.00244140625, -0.87347412109375, -0.7445068359375, -0.61553955078125, -0.486572265625, -0.35760498046875, -0.2286376953125, -0.09967041015625, 0.029296875, 0.15826416015625, 0.2872314453125, 0.41619873046875, 0.545166015625, 0.67413330078125, 0.8031005859375, 0.93206787109375, 1.06103515625, 1.19000244140625, 1.3189697265625, 1.44793701171875, 1.576904296875, 1.70587158203125, 1.8348388671875, 1.96380615234375, 2.0927734375, 2.22174072265625, 2.3507080078125, 2.47967529296875, 2.608642578125, 2.73760986328125, 2.8665771484375, 2.99554443359375, 3.12451171875, 3.25347900390625, 3.3824462890625, 3.51141357421875, 3.640380859375, 3.76934814453125, 3.8983154296875, 4.02728271484375, 4.15625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 6.0, 6.0, 5.0, 9.0, 14.0, 15.0, 29.0, 55.0, 98.0, 185.0, 236.0, 140.0, 76.0, 31.0, 25.0, 23.0, 16.0, 11.0, 6.0, 9.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.490234375, -2.413116455078125, -2.33599853515625, -2.258880615234375, -2.1817626953125, -2.104644775390625, -2.02752685546875, -1.950408935546875, -1.873291015625, -1.796173095703125, -1.71905517578125, -1.641937255859375, -1.5648193359375, -1.487701416015625, -1.41058349609375, -1.333465576171875, -1.25634765625, -1.179229736328125, -1.10211181640625, -1.024993896484375, -0.9478759765625, -0.870758056640625, -0.79364013671875, -0.716522216796875, -0.639404296875, -0.562286376953125, -0.48516845703125, -0.408050537109375, -0.3309326171875, -0.253814697265625, -0.17669677734375, -0.099578857421875, -0.0224609375, 0.054656982421875, 0.13177490234375, 0.208892822265625, 0.2860107421875, 0.363128662109375, 0.44024658203125, 0.517364501953125, 0.594482421875, 0.671600341796875, 0.74871826171875, 0.825836181640625, 0.9029541015625, 0.980072021484375, 1.05718994140625, 1.134307861328125, 1.21142578125, 1.288543701171875, 1.36566162109375, 1.442779541015625, 1.5198974609375, 1.597015380859375, 1.67413330078125, 1.751251220703125, 1.828369140625, 1.905487060546875, 1.98260498046875, 2.059722900390625, 2.1368408203125, 2.213958740234375, 2.29107666015625, 2.368194580078125, 2.4453125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 30.0, 78.0, 191.0, 295.0, 251.0, 102.0, 25.0, 18.0, 4.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.916030883789062, -16.365196228027344, -15.814361572265625, -15.263526916503906, -14.712692260742188, -14.161857604980469, -13.61102294921875, -13.060188293457031, -12.509353637695312, -11.958518981933594, -11.407684326171875, -10.856849670410156, -10.306015014648438, -9.755180358886719, -9.204345703125, -8.653511047363281, -8.102676391601562, -7.551841735839844, -7.001007080078125, -6.450172424316406, -5.8993377685546875, -5.348503112792969, -4.79766845703125, -4.246833801269531, -3.6959991455078125, -3.1451644897460938, -2.594329833984375, -2.0434951782226562, -1.4926605224609375, -0.9418258666992188, -0.3909912109375, 0.15984344482421875, 0.7106781005859375, 1.2615127563476562, 1.812347412109375, 2.3631820678710938, 2.9140167236328125, 3.4648513793945312, 4.01568603515625, 4.566520690917969, 5.1173553466796875, 5.668190002441406, 6.219024658203125, 6.769859313964844, 7.3206939697265625, 7.871528625488281, 8.42236328125, 8.973197937011719, 9.524032592773438, 10.074867248535156, 10.625701904296875, 11.176536560058594, 11.727371215820312, 12.278205871582031, 12.82904052734375, 13.379875183105469, 13.930709838867188, 14.481544494628906, 15.032379150390625, 15.583213806152344, 16.134048461914062, 16.68488311767578, 17.2357177734375, 17.78655242919922, 18.337387084960938]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 6.0, 10.0, 13.0, 14.0, 23.0, 31.0, 36.0, 49.0, 66.0, 94.0, 70.0, 81.0, 85.0, 68.0, 67.0, 68.0, 50.0, 36.0, 31.0, 26.0, 26.0, 11.0, 15.0, 5.0, 4.0, 6.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.705593109130859, -5.540289878845215, -5.3749871253967285, -5.209684371948242, -5.044381141662598, -4.879077911376953, -4.713775157928467, -4.5484724044799805, -4.383169174194336, -4.217865943908691, -4.052563190460205, -3.8872601985931396, -3.721957206726074, -3.556654214859009, -3.3913512229919434, -3.226048231124878, -3.0607452392578125, -2.895442247390747, -2.7301392555236816, -2.564836263656616, -2.399533271789551, -2.2342302799224854, -2.06892728805542, -1.9036242961883545, -1.738321304321289, -1.5730183124542236, -1.4077153205871582, -1.2424123287200928, -1.0771093368530273, -0.9118063449859619, -0.7465033531188965, -0.581200361251831, -0.41589784622192383, -0.2505948543548584, -0.08529186248779297, 0.08001112937927246, 0.2453141212463379, 0.4106171131134033, 0.5759201049804688, 0.7412230968475342, 0.9065260887145996, 1.071829080581665, 1.2371320724487305, 1.402435064315796, 1.5677380561828613, 1.7330410480499268, 1.8983440399169922, 2.0636470317840576, 2.228950023651123, 2.3942530155181885, 2.559556007385254, 2.7248589992523193, 2.8901619911193848, 3.05546498298645, 3.2207679748535156, 3.386070966720581, 3.5513739585876465, 3.716676950454712, 3.8819799423217773, 4.047283172607422, 4.212585926055908, 4.3778886795043945, 4.543191909790039, 4.708495140075684, 4.87379789352417]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 8.0, 8.0, 6.0, 0.0, 10.0, 14.0, 6.0, 11.0, 15.0, 14.0, 34.0, 72.0, 178.0, 661.0, 3294.0, 33259.0, 3856183.0, 287459.0, 10807.0, 1370.0, 322.0, 146.0, 82.0, 41.0, 40.0, 43.0, 40.0, 29.0, 20.0, 19.0, 13.0, 6.0, 9.0, 15.0, 6.0, 10.0, 6.0, 4.0, 7.0, 2.0, 4.0, 1.0, 2.0, 3.0, 5.0], "bins": [-7.90625, -7.68536376953125, -7.4644775390625, -7.24359130859375, -7.022705078125, -6.80181884765625, -6.5809326171875, -6.36004638671875, -6.13916015625, -5.91827392578125, -5.6973876953125, -5.47650146484375, -5.255615234375, -5.03472900390625, -4.8138427734375, -4.59295654296875, -4.3720703125, -4.15118408203125, -3.9302978515625, -3.70941162109375, -3.488525390625, -3.26763916015625, -3.0467529296875, -2.82586669921875, -2.60498046875, -2.38409423828125, -2.1632080078125, -1.94232177734375, -1.721435546875, -1.50054931640625, -1.2796630859375, -1.05877685546875, -0.837890625, -0.61700439453125, -0.3961181640625, -0.17523193359375, 0.045654296875, 0.26654052734375, 0.4874267578125, 0.70831298828125, 0.92919921875, 1.15008544921875, 1.3709716796875, 1.59185791015625, 1.812744140625, 2.03363037109375, 2.2545166015625, 2.47540283203125, 2.6962890625, 2.91717529296875, 3.1380615234375, 3.35894775390625, 3.579833984375, 3.80072021484375, 4.0216064453125, 4.24249267578125, 4.46337890625, 4.68426513671875, 4.9051513671875, 5.12603759765625, 5.346923828125, 5.56781005859375, 5.7886962890625, 6.00958251953125, 6.23046875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 7.0, 17.0, 21.0, 23.0, 39.0, 82.0, 85.0, 111.0, 110.0, 105.0, 113.0, 91.0, 67.0, 51.0, 31.0, 18.0, 16.0, 9.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0809326171875, -0.07589149475097656, -0.07085037231445312, -0.06580924987792969, -0.06076812744140625, -0.05572700500488281, -0.050685882568359375, -0.04564476013183594, -0.0406036376953125, -0.03556251525878906, -0.030521392822265625, -0.025480270385742188, -0.02043914794921875, -0.015398025512695312, -0.010356903076171875, -0.0053157806396484375, -0.000274658203125, 0.0047664642333984375, 0.009807586669921875, 0.014848709106445312, 0.01988983154296875, 0.024930953979492188, 0.029972076416015625, 0.03501319885253906, 0.0400543212890625, 0.04509544372558594, 0.050136566162109375, 0.05517768859863281, 0.06021881103515625, 0.06525993347167969, 0.07030105590820312, 0.07534217834472656, 0.08038330078125, 0.08542442321777344, 0.09046554565429688, 0.09550666809082031, 0.10054779052734375, 0.10558891296386719, 0.11063003540039062, 0.11567115783691406, 0.1207122802734375, 0.12575340270996094, 0.13079452514648438, 0.1358356475830078, 0.14087677001953125, 0.1459178924560547, 0.15095901489257812, 0.15600013732910156, 0.161041259765625, 0.16608238220214844, 0.17112350463867188, 0.1761646270751953, 0.18120574951171875, 0.1862468719482422, 0.19128799438476562, 0.19632911682128906, 0.2013702392578125, 0.20641136169433594, 0.21145248413085938, 0.2164936065673828, 0.22153472900390625, 0.2265758514404297, 0.23161697387695312, 0.23665809631347656, 0.24169921875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 7.0, 14.0, 44.0, 72.0, 180.0, 630.0, 50751.0, 4136869.0, 4962.0, 436.0, 149.0, 95.0, 34.0, 18.0, 10.0, 7.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.75, -7.208251953125, -6.66650390625, -6.124755859375, -5.5830078125, -5.041259765625, -4.49951171875, -3.957763671875, -3.416015625, -2.874267578125, -2.33251953125, -1.790771484375, -1.2490234375, -0.707275390625, -0.16552734375, 0.376220703125, 0.91796875, 1.459716796875, 2.00146484375, 2.543212890625, 3.0849609375, 3.626708984375, 4.16845703125, 4.710205078125, 5.251953125, 5.793701171875, 6.33544921875, 6.877197265625, 7.4189453125, 7.960693359375, 8.50244140625, 9.044189453125, 9.5859375, 10.127685546875, 10.66943359375, 11.211181640625, 11.7529296875, 12.294677734375, 12.83642578125, 13.378173828125, 13.919921875, 14.461669921875, 15.00341796875, 15.545166015625, 16.0869140625, 16.628662109375, 17.17041015625, 17.712158203125, 18.25390625, 18.795654296875, 19.33740234375, 19.879150390625, 20.4208984375, 20.962646484375, 21.50439453125, 22.046142578125, 22.587890625, 23.129638671875, 23.67138671875, 24.213134765625, 24.7548828125, 25.296630859375, 25.83837890625, 26.380126953125, 26.921875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 9.0, 10.0, 28.0, 31.0, 44.0, 73.0, 133.0, 223.0, 437.0, 1593.0, 783.0, 297.0, 150.0, 111.0, 53.0, 42.0, 26.0, 14.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.67626953125, -0.6611366271972656, -0.6460037231445312, -0.6308708190917969, -0.6157379150390625, -0.6006050109863281, -0.5854721069335938, -0.5703392028808594, -0.555206298828125, -0.5400733947753906, -0.5249404907226562, -0.5098075866699219, -0.4946746826171875, -0.4795417785644531, -0.46440887451171875, -0.4492759704589844, -0.43414306640625, -0.4190101623535156, -0.40387725830078125, -0.3887443542480469, -0.3736114501953125, -0.3584785461425781, -0.34334564208984375, -0.3282127380371094, -0.313079833984375, -0.2979469299316406, -0.28281402587890625, -0.2676811218261719, -0.2525482177734375, -0.23741531372070312, -0.22228240966796875, -0.20714950561523438, -0.1920166015625, -0.17688369750976562, -0.16175079345703125, -0.14661788940429688, -0.1314849853515625, -0.11635208129882812, -0.10121917724609375, -0.08608627319335938, -0.070953369140625, -0.055820465087890625, -0.04068756103515625, -0.025554656982421875, -0.0104217529296875, 0.004711151123046875, 0.01984405517578125, 0.034976959228515625, 0.05010986328125, 0.06524276733398438, 0.08037567138671875, 0.09550857543945312, 0.1106414794921875, 0.12577438354492188, 0.14090728759765625, 0.15604019165039062, 0.171173095703125, 0.18630599975585938, 0.20143890380859375, 0.21657180786132812, 0.2317047119140625, 0.24683761596679688, 0.26197052001953125, 0.2771034240722656, 0.292236328125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [7.0, 264.0, 728.0, 21.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3375675678253174, -1.2624499797821045, -0.1873323917388916, 0.8877851963043213, 1.9629027843475342, 3.038020372390747, 4.113138198852539, 5.188255310058594, 6.263373374938965, 7.338490962982178, 8.41360855102539, 9.488725662231445, 10.563843727111816, 11.638961791992188, 12.714078903198242, 13.789196014404297, 14.864314079284668, 15.939432144165039, 17.014549255371094, 18.08966636657715, 19.164783477783203, 20.23990249633789, 21.315019607543945, 22.39013671875, 23.465253829956055, 24.54037094116211, 25.615489959716797, 26.69060707092285, 27.765724182128906, 28.84084129333496, 29.915958404541016, 30.991077423095703, 32.066192626953125, 33.14131164550781, 34.216426849365234, 35.29154586791992, 36.366661071777344, 37.44178009033203, 38.51689910888672, 39.59201431274414, 40.66713333129883, 41.742252349853516, 42.81736755371094, 43.892486572265625, 44.96760559082031, 46.042720794677734, 47.11783981323242, 48.192955017089844, 49.26807403564453, 50.34319305419922, 51.41830825805664, 52.49342727661133, 53.56854248046875, 54.64366149902344, 55.718780517578125, 56.79389572143555, 57.869014739990234, 58.94413375854492, 60.019248962402344, 61.09436798095703, 62.16948699951172, 63.24460220336914, 64.31971740722656, 65.39483642578125, 66.46995544433594]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 4.0, 9.0, 17.0, 18.0, 24.0, 39.0, 44.0, 57.0, 49.0, 68.0, 84.0, 77.0, 73.0, 74.0, 77.0, 64.0, 62.0, 50.0, 33.0, 28.0, 21.0, 7.0, 10.0, 12.0, 5.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7874598503112793, -2.7095694541931152, -2.631679058074951, -2.553788661956787, -2.475898265838623, -2.398008108139038, -2.320117712020874, -2.24222731590271, -2.164336919784546, -2.086446523666382, -2.0085561275482178, -1.9306658506393433, -1.8527754545211792, -1.7748850584030151, -1.6969947814941406, -1.6191043853759766, -1.5412139892578125, -1.4633235931396484, -1.3854331970214844, -1.3075429201126099, -1.2296525239944458, -1.1517621278762817, -1.0738718509674072, -0.9959814548492432, -0.9180910587310791, -0.840200662612915, -0.7623103260993958, -0.6844199895858765, -0.6065295934677124, -0.5286391973495483, -0.45074886083602905, -0.37285852432250977, -0.2949681282043457, -0.21707776188850403, -0.13918739557266235, -0.06129702925682068, 0.016593337059020996, 0.09448370337486267, 0.17237406969070435, 0.25026440620422363, 0.3281548023223877, 0.40604516863822937, 0.48393553495407104, 0.5618258714675903, 0.6397162675857544, 0.7176066637039185, 0.7954970002174377, 0.873387336730957, 0.9512777328491211, 1.0291681289672852, 1.1070585250854492, 1.1849488019943237, 1.2628391981124878, 1.3407295942306519, 1.4186198711395264, 1.4965102672576904, 1.5744006633758545, 1.6522910594940186, 1.7301814556121826, 1.8080717325210571, 1.8859621286392212, 1.9638525247573853, 2.0417428016662598, 2.119633197784424, 2.197523593902588]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 0.0, 3.0, 10.0, 4.0, 10.0, 10.0, 15.0, 11.0, 20.0, 13.0, 28.0, 34.0, 23.0, 22.0, 41.0, 42.0, 84.0, 281.0, 1930.0, 20877.0, 287481.0, 658859.0, 71798.0, 5801.0, 645.0, 158.0, 62.0, 42.0, 26.0, 25.0, 29.0, 29.0, 15.0, 22.0, 22.0, 16.0, 10.0, 15.0, 10.0, 11.0, 4.0, 6.0, 5.0, 4.0, 0.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.84765625, -2.74310302734375, -2.6385498046875, -2.53399658203125, -2.429443359375, -2.32489013671875, -2.2203369140625, -2.11578369140625, -2.01123046875, -1.90667724609375, -1.8021240234375, -1.69757080078125, -1.593017578125, -1.48846435546875, -1.3839111328125, -1.27935791015625, -1.1748046875, -1.07025146484375, -0.9656982421875, -0.86114501953125, -0.756591796875, -0.65203857421875, -0.5474853515625, -0.44293212890625, -0.33837890625, -0.23382568359375, -0.1292724609375, -0.02471923828125, 0.079833984375, 0.18438720703125, 0.2889404296875, 0.39349365234375, 0.498046875, 0.60260009765625, 0.7071533203125, 0.81170654296875, 0.916259765625, 1.02081298828125, 1.1253662109375, 1.22991943359375, 1.33447265625, 1.43902587890625, 1.5435791015625, 1.64813232421875, 1.752685546875, 1.85723876953125, 1.9617919921875, 2.06634521484375, 2.1708984375, 2.27545166015625, 2.3800048828125, 2.48455810546875, 2.589111328125, 2.69366455078125, 2.7982177734375, 2.90277099609375, 3.00732421875, 3.11187744140625, 3.2164306640625, 3.32098388671875, 3.425537109375, 3.53009033203125, 3.6346435546875, 3.73919677734375, 3.84375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 6.0, 6.0, 8.0, 9.0, 14.0, 34.0, 27.0, 39.0, 50.0, 47.0, 49.0, 61.0, 65.0, 68.0, 68.0, 71.0, 61.0, 59.0, 51.0, 57.0, 41.0, 30.0, 25.0, 20.0, 10.0, 8.0, 7.0, 8.0, 3.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11407470703125, -0.1097249984741211, -0.10537528991699219, -0.10102558135986328, -0.09667587280273438, -0.09232616424560547, -0.08797645568847656, -0.08362674713134766, -0.07927703857421875, -0.07492733001708984, -0.07057762145996094, -0.06622791290283203, -0.061878204345703125, -0.05752849578857422, -0.05317878723144531, -0.048829078674316406, -0.0444793701171875, -0.040129661560058594, -0.03577995300292969, -0.03143024444580078, -0.027080535888671875, -0.02273082733154297, -0.018381118774414062, -0.014031410217285156, -0.00968170166015625, -0.005331993103027344, -0.0009822845458984375, 0.0033674240112304688, 0.007717132568359375, 0.012066841125488281, 0.016416549682617188, 0.020766258239746094, 0.025115966796875, 0.029465675354003906, 0.03381538391113281, 0.03816509246826172, 0.042514801025390625, 0.04686450958251953, 0.05121421813964844, 0.055563926696777344, 0.05991363525390625, 0.06426334381103516, 0.06861305236816406, 0.07296276092529297, 0.07731246948242188, 0.08166217803955078, 0.08601188659667969, 0.0903615951538086, 0.0947113037109375, 0.0990610122680664, 0.10341072082519531, 0.10776042938232422, 0.11211013793945312, 0.11645984649658203, 0.12080955505371094, 0.12515926361083984, 0.12950897216796875, 0.13385868072509766, 0.13820838928222656, 0.14255809783935547, 0.14690780639648438, 0.15125751495361328, 0.1556072235107422, 0.1599569320678711, 0.164306640625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 9.0, 4.0, 12.0, 14.0, 19.0, 32.0, 42.0, 61.0, 123.0, 223.0, 449.0, 952.0, 2595.0, 8238.0, 31951.0, 154113.0, 490573.0, 278891.0, 59699.0, 13931.0, 3924.0, 1436.0, 582.0, 276.0, 152.0, 91.0, 53.0, 31.0, 22.0, 17.0, 17.0, 4.0, 6.0, 6.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.62890625, -2.56268310546875, -2.4964599609375, -2.43023681640625, -2.364013671875, -2.29779052734375, -2.2315673828125, -2.16534423828125, -2.09912109375, -2.03289794921875, -1.9666748046875, -1.90045166015625, -1.834228515625, -1.76800537109375, -1.7017822265625, -1.63555908203125, -1.5693359375, -1.50311279296875, -1.4368896484375, -1.37066650390625, -1.304443359375, -1.23822021484375, -1.1719970703125, -1.10577392578125, -1.03955078125, -0.97332763671875, -0.9071044921875, -0.84088134765625, -0.774658203125, -0.70843505859375, -0.6422119140625, -0.57598876953125, -0.509765625, -0.44354248046875, -0.3773193359375, -0.31109619140625, -0.244873046875, -0.17864990234375, -0.1124267578125, -0.04620361328125, 0.02001953125, 0.08624267578125, 0.1524658203125, 0.21868896484375, 0.284912109375, 0.35113525390625, 0.4173583984375, 0.48358154296875, 0.5498046875, 0.61602783203125, 0.6822509765625, 0.74847412109375, 0.814697265625, 0.88092041015625, 0.9471435546875, 1.01336669921875, 1.07958984375, 1.14581298828125, 1.2120361328125, 1.27825927734375, 1.344482421875, 1.41070556640625, 1.4769287109375, 1.54315185546875, 1.609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 3.0, 5.0, 2.0, 7.0, 6.0, 11.0, 17.0, 18.0, 18.0, 19.0, 21.0, 16.0, 22.0, 31.0, 28.0, 40.0, 35.0, 38.0, 46.0, 36.0, 45.0, 41.0, 34.0, 52.0, 35.0, 34.0, 35.0, 32.0, 37.0, 33.0, 17.0, 30.0, 25.0, 16.0, 13.0, 21.0, 13.0, 17.0, 7.0, 12.0, 6.0, 5.0, 4.0, 4.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.57421875, -0.5565643310546875, -0.538909912109375, -0.5212554931640625, -0.50360107421875, -0.4859466552734375, -0.468292236328125, -0.4506378173828125, -0.4329833984375, -0.4153289794921875, -0.397674560546875, -0.3800201416015625, -0.36236572265625, -0.3447113037109375, -0.327056884765625, -0.3094024658203125, -0.291748046875, -0.2740936279296875, -0.256439208984375, -0.2387847900390625, -0.22113037109375, -0.2034759521484375, -0.185821533203125, -0.1681671142578125, -0.1505126953125, -0.1328582763671875, -0.115203857421875, -0.0975494384765625, -0.07989501953125, -0.0622406005859375, -0.044586181640625, -0.0269317626953125, -0.00927734375, 0.0083770751953125, 0.026031494140625, 0.0436859130859375, 0.06134033203125, 0.0789947509765625, 0.096649169921875, 0.1143035888671875, 0.1319580078125, 0.1496124267578125, 0.167266845703125, 0.1849212646484375, 0.20257568359375, 0.2202301025390625, 0.237884521484375, 0.2555389404296875, 0.273193359375, 0.2908477783203125, 0.308502197265625, 0.3261566162109375, 0.34381103515625, 0.3614654541015625, 0.379119873046875, 0.3967742919921875, 0.4144287109375, 0.4320831298828125, 0.449737548828125, 0.4673919677734375, 0.48504638671875, 0.5027008056640625, 0.520355224609375, 0.5380096435546875, 0.5556640625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 7.0, 15.0, 25.0, 32.0, 43.0, 70.0, 116.0, 188.0, 330.0, 686.0, 1804.0, 5425.0, 20949.0, 118015.0, 560332.0, 281354.0, 44659.0, 9591.0, 2811.0, 1021.0, 442.0, 239.0, 139.0, 71.0, 40.0, 37.0, 31.0, 22.0, 7.0, 12.0, 8.0, 10.0, 2.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.669921875, -2.59722900390625, -2.5245361328125, -2.45184326171875, -2.379150390625, -2.30645751953125, -2.2337646484375, -2.16107177734375, -2.08837890625, -2.01568603515625, -1.9429931640625, -1.87030029296875, -1.797607421875, -1.72491455078125, -1.6522216796875, -1.57952880859375, -1.5068359375, -1.43414306640625, -1.3614501953125, -1.28875732421875, -1.216064453125, -1.14337158203125, -1.0706787109375, -0.99798583984375, -0.92529296875, -0.85260009765625, -0.7799072265625, -0.70721435546875, -0.634521484375, -0.56182861328125, -0.4891357421875, -0.41644287109375, -0.34375, -0.27105712890625, -0.1983642578125, -0.12567138671875, -0.052978515625, 0.01971435546875, 0.0924072265625, 0.16510009765625, 0.23779296875, 0.31048583984375, 0.3831787109375, 0.45587158203125, 0.528564453125, 0.60125732421875, 0.6739501953125, 0.74664306640625, 0.8193359375, 0.89202880859375, 0.9647216796875, 1.03741455078125, 1.110107421875, 1.18280029296875, 1.2554931640625, 1.32818603515625, 1.40087890625, 1.47357177734375, 1.5462646484375, 1.61895751953125, 1.691650390625, 1.76434326171875, 1.8370361328125, 1.90972900390625, 1.982421875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 6.0, 8.0, 13.0, 12.0, 20.0, 24.0, 34.0, 53.0, 58.0, 95.0, 93.0, 110.0, 108.0, 97.0, 77.0, 52.0, 45.0, 19.0, 20.0, 14.0, 14.0, 9.0, 10.0, 3.0, 2.0, 2.0, 0.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00027680397033691406, -0.0002678297460079193, -0.00025885552167892456, -0.0002498812973499298, -0.00024090707302093506, -0.0002319328486919403, -0.00022295862436294556, -0.0002139844000339508, -0.00020501017570495605, -0.0001960359513759613, -0.00018706172704696655, -0.0001780875027179718, -0.00016911327838897705, -0.0001601390540599823, -0.00015116482973098755, -0.0001421906054019928, -0.00013321638107299805, -0.0001242421567440033, -0.00011526793241500854, -0.0001062937080860138, -9.731948375701904e-05, -8.834525942802429e-05, -7.937103509902954e-05, -7.039681077003479e-05, -6.142258644104004e-05, -5.244836211204529e-05, -4.347413778305054e-05, -3.4499913454055786e-05, -2.5525689125061035e-05, -1.6551464796066284e-05, -7.577240467071533e-06, 1.3969838619232178e-06, 1.0371208190917969e-05, 1.934543251991272e-05, 2.831965684890747e-05, 3.729388117790222e-05, 4.626810550689697e-05, 5.5242329835891724e-05, 6.421655416488647e-05, 7.319077849388123e-05, 8.216500282287598e-05, 9.113922715187073e-05, 0.00010011345148086548, 0.00010908767580986023, 0.00011806190013885498, 0.00012703612446784973, 0.00013601034879684448, 0.00014498457312583923, 0.00015395879745483398, 0.00016293302178382874, 0.00017190724611282349, 0.00018088147044181824, 0.000189855694770813, 0.00019882991909980774, 0.0002078041434288025, 0.00021677836775779724, 0.000225752592086792, 0.00023472681641578674, 0.0002437010407447815, 0.00025267526507377625, 0.000261649489402771, 0.00027062371373176575, 0.0002795979380607605, 0.00028857216238975525, 0.00029754638671875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 10.0, 5.0, 8.0, 4.0, 10.0, 9.0, 22.0, 10.0, 36.0, 52.0, 76.0, 111.0, 199.0, 356.0, 707.0, 1616.0, 5069.0, 20402.0, 144151.0, 652984.0, 188471.0, 25108.0, 5668.0, 1819.0, 739.0, 323.0, 208.0, 117.0, 82.0, 53.0, 37.0, 20.0, 19.0, 13.0, 12.0, 8.0, 5.0, 3.0, 1.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0], "bins": [-2.583984375, -2.506988525390625, -2.42999267578125, -2.352996826171875, -2.2760009765625, -2.199005126953125, -2.12200927734375, -2.045013427734375, -1.968017578125, -1.891021728515625, -1.81402587890625, -1.737030029296875, -1.6600341796875, -1.583038330078125, -1.50604248046875, -1.429046630859375, -1.35205078125, -1.275054931640625, -1.19805908203125, -1.121063232421875, -1.0440673828125, -0.967071533203125, -0.89007568359375, -0.813079833984375, -0.736083984375, -0.659088134765625, -0.58209228515625, -0.505096435546875, -0.4281005859375, -0.351104736328125, -0.27410888671875, -0.197113037109375, -0.1201171875, -0.043121337890625, 0.03387451171875, 0.110870361328125, 0.1878662109375, 0.264862060546875, 0.34185791015625, 0.418853759765625, 0.495849609375, 0.572845458984375, 0.64984130859375, 0.726837158203125, 0.8038330078125, 0.880828857421875, 0.95782470703125, 1.034820556640625, 1.11181640625, 1.188812255859375, 1.26580810546875, 1.342803955078125, 1.4197998046875, 1.496795654296875, 1.57379150390625, 1.650787353515625, 1.727783203125, 1.804779052734375, 1.88177490234375, 1.958770751953125, 2.0357666015625, 2.112762451171875, 2.18975830078125, 2.266754150390625, 2.34375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 10.0, 17.0, 15.0, 19.0, 31.0, 58.0, 82.0, 101.0, 99.0, 111.0, 100.0, 93.0, 80.0, 60.0, 42.0, 28.0, 14.0, 14.0, 10.0, 7.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1123046875, -1.075897216796875, -1.03948974609375, -1.003082275390625, -0.9666748046875, -0.930267333984375, -0.89385986328125, -0.857452392578125, -0.821044921875, -0.784637451171875, -0.74822998046875, -0.711822509765625, -0.6754150390625, -0.639007568359375, -0.60260009765625, -0.566192626953125, -0.52978515625, -0.493377685546875, -0.45697021484375, -0.420562744140625, -0.3841552734375, -0.347747802734375, -0.31134033203125, -0.274932861328125, -0.238525390625, -0.202117919921875, -0.16571044921875, -0.129302978515625, -0.0928955078125, -0.056488037109375, -0.02008056640625, 0.016326904296875, 0.052734375, 0.089141845703125, 0.12554931640625, 0.161956787109375, 0.1983642578125, 0.234771728515625, 0.27117919921875, 0.307586669921875, 0.343994140625, 0.380401611328125, 0.41680908203125, 0.453216552734375, 0.4896240234375, 0.526031494140625, 0.56243896484375, 0.598846435546875, 0.63525390625, 0.671661376953125, 0.70806884765625, 0.744476318359375, 0.7808837890625, 0.817291259765625, 0.85369873046875, 0.890106201171875, 0.926513671875, 0.962921142578125, 0.99932861328125, 1.035736083984375, 1.0721435546875, 1.108551025390625, 1.14495849609375, 1.181365966796875, 1.2177734375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 12.0, 68.0, 390.0, 436.0, 83.0, 18.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.533979415893555, -8.197861671447754, -6.861743927001953, -5.5256266593933105, -4.18950891494751, -2.853391170501709, -1.5172739028930664, -0.18115615844726562, 1.1549615859985352, 2.491079330444336, 3.8271968364715576, 5.163314342498779, 6.49943208694458, 7.835549831390381, 9.171667098999023, 10.507784843444824, 11.843902587890625, 13.180020332336426, 14.516138076782227, 15.852254867553711, 17.188373565673828, 18.524490356445312, 19.860607147216797, 21.196725845336914, 22.53284454345703, 23.868961334228516, 25.205080032348633, 26.541196823120117, 27.877315521240234, 29.21343231201172, 30.549549102783203, 31.88566780090332, 33.22178268432617, 34.557899475097656, 35.89401626586914, 37.23013687133789, 38.566253662109375, 39.90237045288086, 41.238487243652344, 42.574607849121094, 43.91072463989258, 45.24684143066406, 46.58295822143555, 47.9190788269043, 49.25519561767578, 50.591312408447266, 51.92742919921875, 53.2635498046875, 54.59966278076172, 55.9357795715332, 57.27189636230469, 58.60801696777344, 59.94413375854492, 61.280250549316406, 62.61636734008789, 63.952484130859375, 65.28860473632812, 66.62472534179688, 67.9608383178711, 69.29695892333984, 70.63307189941406, 71.96919250488281, 73.30531311035156, 74.64142608642578, 75.97754669189453]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 5.0, 4.0, 2.0, 2.0, 8.0, 5.0, 6.0, 13.0, 14.0, 19.0, 31.0, 28.0, 41.0, 44.0, 59.0, 57.0, 68.0, 73.0, 57.0, 72.0, 64.0, 58.0, 56.0, 57.0, 38.0, 29.0, 21.0, 26.0, 14.0, 9.0, 13.0, 2.0, 6.0, 3.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.645059585571289, -4.440197944641113, -4.235335826873779, -4.030473709106445, -3.8256120681762695, -3.6207501888275146, -3.4158883094787598, -3.211026430130005, -3.00616455078125, -2.801302671432495, -2.5964407920837402, -2.3915789127349854, -2.1867170333862305, -1.9818551540374756, -1.7769932746887207, -1.5721313953399658, -1.367269515991211, -1.162407636642456, -0.9575457572937012, -0.7526838779449463, -0.5478219985961914, -0.3429601192474365, -0.13809823989868164, 0.06676363945007324, 0.2716255187988281, 0.476487398147583, 0.6813492774963379, 0.8862111568450928, 1.0910730361938477, 1.2959349155426025, 1.5007967948913574, 1.7056586742401123, 1.9105205535888672, 2.115382432937622, 2.320244312286377, 2.525106191635132, 2.7299680709838867, 2.9348299503326416, 3.1396918296813965, 3.3445537090301514, 3.5494155883789062, 3.754277467727661, 3.959139347076416, 4.16400146484375, 4.368863105773926, 4.573724746704102, 4.7785868644714355, 4.9834489822387695, 5.188310623168945, 5.393172264099121, 5.598034381866455, 5.802896499633789, 6.007758140563965, 6.212619781494141, 6.417481899261475, 6.622344017028809, 6.827205657958984, 7.03206729888916, 7.236929416656494, 7.441791534423828, 7.646653175354004, 7.85151481628418, 8.056377410888672, 8.261239051818848, 8.466100692749023]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 8.0, 15.0, 24.0, 37.0, 90.0, 279.0, 1109.0, 14584.0, 4038357.0, 135510.0, 3389.0, 550.0, 185.0, 79.0, 46.0, 14.0, 10.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1796875, -3.7913818359375, -3.403076171875, -3.0147705078125, -2.62646484375, -2.2381591796875, -1.849853515625, -1.4615478515625, -1.0732421875, -0.6849365234375, -0.296630859375, 0.0916748046875, 0.47998046875, 0.8682861328125, 1.256591796875, 1.6448974609375, 2.033203125, 2.4215087890625, 2.809814453125, 3.1981201171875, 3.58642578125, 3.9747314453125, 4.363037109375, 4.7513427734375, 5.1396484375, 5.5279541015625, 5.916259765625, 6.3045654296875, 6.69287109375, 7.0811767578125, 7.469482421875, 7.8577880859375, 8.24609375, 8.6343994140625, 9.022705078125, 9.4110107421875, 9.79931640625, 10.1876220703125, 10.575927734375, 10.9642333984375, 11.3525390625, 11.7408447265625, 12.129150390625, 12.5174560546875, 12.90576171875, 13.2940673828125, 13.682373046875, 14.0706787109375, 14.458984375, 14.8472900390625, 15.235595703125, 15.6239013671875, 16.01220703125, 16.4005126953125, 16.788818359375, 17.1771240234375, 17.5654296875, 17.9537353515625, 18.342041015625, 18.7303466796875, 19.11865234375, 19.5069580078125, 19.895263671875, 20.2835693359375, 20.671875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 1.0, 5.0, 5.0, 5.0, 14.0, 18.0, 20.0, 26.0, 42.0, 40.0, 50.0, 62.0, 62.0, 49.0, 64.0, 76.0, 71.0, 56.0, 65.0, 52.0, 40.0, 39.0, 36.0, 23.0, 20.0, 20.0, 11.0, 12.0, 8.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1353759765625, -0.13004112243652344, -0.12470626831054688, -0.11937141418457031, -0.11403656005859375, -0.10870170593261719, -0.10336685180664062, -0.09803199768066406, -0.0926971435546875, -0.08736228942871094, -0.08202743530273438, -0.07669258117675781, -0.07135772705078125, -0.06602287292480469, -0.060688018798828125, -0.05535316467285156, -0.050018310546875, -0.04468345642089844, -0.039348602294921875, -0.03401374816894531, -0.02867889404296875, -0.023344039916992188, -0.018009185791015625, -0.012674331665039062, -0.0073394775390625, -0.0020046234130859375, 0.003330230712890625, 0.008665084838867188, 0.01399993896484375, 0.019334793090820312, 0.024669647216796875, 0.030004501342773438, 0.03533935546875, 0.04067420959472656, 0.046009063720703125, 0.05134391784667969, 0.05667877197265625, 0.06201362609863281, 0.06734848022460938, 0.07268333435058594, 0.0780181884765625, 0.08335304260253906, 0.08868789672851562, 0.09402275085449219, 0.09935760498046875, 0.10469245910644531, 0.11002731323242188, 0.11536216735839844, 0.120697021484375, 0.12603187561035156, 0.13136672973632812, 0.1367015838623047, 0.14203643798828125, 0.1473712921142578, 0.15270614624023438, 0.15804100036621094, 0.1633758544921875, 0.16871070861816406, 0.17404556274414062, 0.1793804168701172, 0.18471527099609375, 0.1900501251220703, 0.19538497924804688, 0.20071983337402344, 0.2060546875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 11.0, 31.0, 54.0, 90.0, 127.0, 244.0, 486.0, 84251.0, 4107435.0, 885.0, 260.0, 187.0, 109.0, 68.0, 29.0, 16.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.625, -14.71435546875, -13.8037109375, -12.89306640625, -11.982421875, -11.07177734375, -10.1611328125, -9.25048828125, -8.33984375, -7.42919921875, -6.5185546875, -5.60791015625, -4.697265625, -3.78662109375, -2.8759765625, -1.96533203125, -1.0546875, -0.14404296875, 0.7666015625, 1.67724609375, 2.587890625, 3.49853515625, 4.4091796875, 5.31982421875, 6.23046875, 7.14111328125, 8.0517578125, 8.96240234375, 9.873046875, 10.78369140625, 11.6943359375, 12.60498046875, 13.515625, 14.42626953125, 15.3369140625, 16.24755859375, 17.158203125, 18.06884765625, 18.9794921875, 19.89013671875, 20.80078125, 21.71142578125, 22.6220703125, 23.53271484375, 24.443359375, 25.35400390625, 26.2646484375, 27.17529296875, 28.0859375, 28.99658203125, 29.9072265625, 30.81787109375, 31.728515625, 32.63916015625, 33.5498046875, 34.46044921875, 35.37109375, 36.28173828125, 37.1923828125, 38.10302734375, 39.013671875, 39.92431640625, 40.8349609375, 41.74560546875, 42.65625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 9.0, 32.0, 69.0, 195.0, 643.0, 2448.0, 468.0, 137.0, 38.0, 23.0, 12.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.029296875, -0.98333740234375, -0.9373779296875, -0.89141845703125, -0.845458984375, -0.79949951171875, -0.7535400390625, -0.70758056640625, -0.66162109375, -0.61566162109375, -0.5697021484375, -0.52374267578125, -0.477783203125, -0.43182373046875, -0.3858642578125, -0.33990478515625, -0.2939453125, -0.24798583984375, -0.2020263671875, -0.15606689453125, -0.110107421875, -0.06414794921875, -0.0181884765625, 0.02777099609375, 0.07373046875, 0.11968994140625, 0.1656494140625, 0.21160888671875, 0.257568359375, 0.30352783203125, 0.3494873046875, 0.39544677734375, 0.44140625, 0.48736572265625, 0.5333251953125, 0.57928466796875, 0.625244140625, 0.67120361328125, 0.7171630859375, 0.76312255859375, 0.80908203125, 0.85504150390625, 0.9010009765625, 0.94696044921875, 0.992919921875, 1.03887939453125, 1.0848388671875, 1.13079833984375, 1.1767578125, 1.22271728515625, 1.2686767578125, 1.31463623046875, 1.360595703125, 1.40655517578125, 1.4525146484375, 1.49847412109375, 1.54443359375, 1.59039306640625, 1.6363525390625, 1.68231201171875, 1.728271484375, 1.77423095703125, 1.8201904296875, 1.86614990234375, 1.912109375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 13.0, 88.0, 768.0, 124.0, 14.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.58824157714844, -42.15888595581055, -40.729530334472656, -39.3001708984375, -37.87081527709961, -36.44145965576172, -35.01210403442383, -33.58274841308594, -32.15338897705078, -30.72403335571289, -29.294675827026367, -27.865320205688477, -26.435962677001953, -25.006607055664062, -23.577251434326172, -22.14789390563965, -20.718538284301758, -19.289182662963867, -17.859825134277344, -16.430469512939453, -15.00111198425293, -13.571756362915039, -12.142399787902832, -10.713043212890625, -9.283686637878418, -7.854330062866211, -6.424973487854004, -4.995617389678955, -3.566260814666748, -2.136904239654541, -0.7075481414794922, 0.7218084335327148, 2.151165008544922, 3.580521583557129, 5.009878158569336, 6.439234256744385, 7.868590831756592, 9.29794692993164, 10.727303504943848, 12.156660079956055, 13.586016654968262, 15.015373229980469, 16.44472885131836, 17.874086380004883, 19.303442001342773, 20.732799530029297, 22.162155151367188, 23.591510772705078, 25.0208683013916, 26.450223922729492, 27.879581451416016, 29.308937072753906, 30.73829460144043, 32.16765213012695, 33.597007751464844, 35.026363372802734, 36.455718994140625, 37.885074615478516, 39.314430236816406, 40.74378967285156, 42.17314529418945, 43.602500915527344, 45.031856536865234, 46.461212158203125, 47.89057159423828]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 6.0, 9.0, 16.0, 17.0, 30.0, 35.0, 45.0, 52.0, 66.0, 69.0, 87.0, 84.0, 93.0, 79.0, 61.0, 70.0, 53.0, 34.0, 36.0, 17.0, 17.0, 8.0, 6.0, 3.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.00689172744751, -3.8794171810150146, -3.7519426345825195, -3.6244678497314453, -3.49699330329895, -3.369518756866455, -3.242043972015381, -3.1145694255828857, -2.9870948791503906, -2.8596203327178955, -2.7321457862854004, -2.604671001434326, -2.477196455001831, -2.349721908569336, -2.2222471237182617, -2.0947725772857666, -1.9672980308532715, -1.8398234844207764, -1.7123488187789917, -1.584874153137207, -1.457399606704712, -1.3299250602722168, -1.2024503946304321, -1.0749757289886475, -0.9475011825561523, -0.8200265765190125, -0.6925519704818726, -0.5650773644447327, -0.4376027584075928, -0.3101281523704529, -0.182653546333313, -0.055178940296173096, 0.072296142578125, 0.1997707486152649, 0.3272453546524048, 0.4547199606895447, 0.5821945667266846, 0.7096691727638245, 0.8371437788009644, 0.9646183848381042, 1.0920929908752441, 1.2195675373077393, 1.347042202949524, 1.4745168685913086, 1.6019914150238037, 1.7294659614562988, 1.8569406270980835, 1.9844152927398682, 2.1118898391723633, 2.2393643856048584, 2.3668389320373535, 2.4943137168884277, 2.621788263320923, 2.749262809753418, 2.876737594604492, 3.0042121410369873, 3.1316866874694824, 3.2591612339019775, 3.3866357803344727, 3.514110565185547, 3.641585111618042, 3.769059658050537, 3.8965344429016113, 4.024008750915527, 4.151483535766602]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 7.0, 7.0, 8.0, 10.0, 9.0, 20.0, 10.0, 16.0, 29.0, 26.0, 37.0, 48.0, 87.0, 130.0, 285.0, 504.0, 1084.0, 2649.0, 10690.0, 73798.0, 516290.0, 383521.0, 47618.0, 7587.0, 2143.0, 817.0, 445.0, 259.0, 117.0, 85.0, 47.0, 28.0, 26.0, 17.0, 15.0, 15.0, 23.0, 13.0, 12.0, 4.0, 9.0, 4.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.841796875, -3.713287353515625, -3.58477783203125, -3.456268310546875, -3.3277587890625, -3.199249267578125, -3.07073974609375, -2.942230224609375, -2.813720703125, -2.685211181640625, -2.55670166015625, -2.428192138671875, -2.2996826171875, -2.171173095703125, -2.04266357421875, -1.914154052734375, -1.78564453125, -1.657135009765625, -1.52862548828125, -1.400115966796875, -1.2716064453125, -1.143096923828125, -1.01458740234375, -0.886077880859375, -0.757568359375, -0.629058837890625, -0.50054931640625, -0.372039794921875, -0.2435302734375, -0.115020751953125, 0.01348876953125, 0.141998291015625, 0.2705078125, 0.399017333984375, 0.52752685546875, 0.656036376953125, 0.7845458984375, 0.913055419921875, 1.04156494140625, 1.170074462890625, 1.298583984375, 1.427093505859375, 1.55560302734375, 1.684112548828125, 1.8126220703125, 1.941131591796875, 2.06964111328125, 2.198150634765625, 2.32666015625, 2.455169677734375, 2.58367919921875, 2.712188720703125, 2.8406982421875, 2.969207763671875, 3.09771728515625, 3.226226806640625, 3.354736328125, 3.483245849609375, 3.61175537109375, 3.740264892578125, 3.8687744140625, 3.997283935546875, 4.12579345703125, 4.254302978515625, 4.3828125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 8.0, 17.0, 25.0, 34.0, 39.0, 47.0, 55.0, 64.0, 84.0, 97.0, 81.0, 83.0, 76.0, 63.0, 61.0, 53.0, 36.0, 26.0, 20.0, 11.0, 6.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.266845703125, -0.258087158203125, -0.24932861328125, -0.240570068359375, -0.2318115234375, -0.223052978515625, -0.21429443359375, -0.205535888671875, -0.19677734375, -0.188018798828125, -0.17926025390625, -0.170501708984375, -0.1617431640625, -0.152984619140625, -0.14422607421875, -0.135467529296875, -0.126708984375, -0.117950439453125, -0.10919189453125, -0.100433349609375, -0.0916748046875, -0.082916259765625, -0.07415771484375, -0.065399169921875, -0.056640625, -0.047882080078125, -0.03912353515625, -0.030364990234375, -0.0216064453125, -0.012847900390625, -0.00408935546875, 0.004669189453125, 0.013427734375, 0.022186279296875, 0.03094482421875, 0.039703369140625, 0.0484619140625, 0.057220458984375, 0.06597900390625, 0.074737548828125, 0.08349609375, 0.092254638671875, 0.10101318359375, 0.109771728515625, 0.1185302734375, 0.127288818359375, 0.13604736328125, 0.144805908203125, 0.153564453125, 0.162322998046875, 0.17108154296875, 0.179840087890625, 0.1885986328125, 0.197357177734375, 0.20611572265625, 0.214874267578125, 0.2236328125, 0.232391357421875, 0.24114990234375, 0.249908447265625, 0.2586669921875, 0.267425537109375, 0.27618408203125, 0.284942626953125, 0.293701171875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 8.0, 14.0, 10.0, 15.0, 17.0, 26.0, 39.0, 52.0, 94.0, 203.0, 533.0, 1590.0, 5334.0, 24171.0, 164001.0, 604320.0, 208113.0, 30630.0, 6434.0, 1782.0, 614.0, 245.0, 104.0, 54.0, 24.0, 26.0, 18.0, 18.0, 15.0, 8.0, 8.0, 12.0, 3.0, 2.0, 6.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.109375, -3.00762939453125, -2.9058837890625, -2.80413818359375, -2.702392578125, -2.60064697265625, -2.4989013671875, -2.39715576171875, -2.29541015625, -2.19366455078125, -2.0919189453125, -1.99017333984375, -1.888427734375, -1.78668212890625, -1.6849365234375, -1.58319091796875, -1.4814453125, -1.37969970703125, -1.2779541015625, -1.17620849609375, -1.074462890625, -0.97271728515625, -0.8709716796875, -0.76922607421875, -0.66748046875, -0.56573486328125, -0.4639892578125, -0.36224365234375, -0.260498046875, -0.15875244140625, -0.0570068359375, 0.04473876953125, 0.146484375, 0.24822998046875, 0.3499755859375, 0.45172119140625, 0.553466796875, 0.65521240234375, 0.7569580078125, 0.85870361328125, 0.96044921875, 1.06219482421875, 1.1639404296875, 1.26568603515625, 1.367431640625, 1.46917724609375, 1.5709228515625, 1.67266845703125, 1.7744140625, 1.87615966796875, 1.9779052734375, 2.07965087890625, 2.181396484375, 2.28314208984375, 2.3848876953125, 2.48663330078125, 2.58837890625, 2.69012451171875, 2.7918701171875, 2.89361572265625, 2.995361328125, 3.09710693359375, 3.1988525390625, 3.30059814453125, 3.40234375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 8.0, 11.0, 11.0, 16.0, 16.0, 25.0, 27.0, 22.0, 21.0, 29.0, 29.0, 31.0, 42.0, 35.0, 47.0, 33.0, 45.0, 38.0, 47.0, 32.0, 40.0, 44.0, 41.0, 34.0, 31.0, 31.0, 35.0, 16.0, 24.0, 20.0, 20.0, 14.0, 12.0, 11.0, 10.0, 16.0, 10.0, 3.0, 8.0, 6.0, 1.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.83642578125, -0.8103103637695312, -0.7841949462890625, -0.7580795288085938, -0.731964111328125, -0.7058486938476562, -0.6797332763671875, -0.6536178588867188, -0.62750244140625, -0.6013870239257812, -0.5752716064453125, -0.5491561889648438, -0.523040771484375, -0.49692535400390625, -0.4708099365234375, -0.44469451904296875, -0.4185791015625, -0.39246368408203125, -0.3663482666015625, -0.34023284912109375, -0.314117431640625, -0.28800201416015625, -0.2618865966796875, -0.23577117919921875, -0.20965576171875, -0.18354034423828125, -0.1574249267578125, -0.13130950927734375, -0.105194091796875, -0.07907867431640625, -0.0529632568359375, -0.02684783935546875, -0.000732421875, 0.02538299560546875, 0.0514984130859375, 0.07761383056640625, 0.103729248046875, 0.12984466552734375, 0.1559600830078125, 0.18207550048828125, 0.20819091796875, 0.23430633544921875, 0.2604217529296875, 0.28653717041015625, 0.312652587890625, 0.33876800537109375, 0.3648834228515625, 0.39099884033203125, 0.4171142578125, 0.44322967529296875, 0.4693450927734375, 0.49546051025390625, 0.521575927734375, 0.5476913452148438, 0.5738067626953125, 0.5999221801757812, 0.62603759765625, 0.6521530151367188, 0.6782684326171875, 0.7043838500976562, 0.730499267578125, 0.7566146850585938, 0.7827301025390625, 0.8088455200195312, 0.8349609375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 5.0, 4.0, 9.0, 17.0, 30.0, 48.0, 87.0, 135.0, 269.0, 553.0, 1254.0, 3308.0, 11445.0, 76354.0, 632188.0, 284546.0, 28573.0, 5986.0, 2079.0, 802.0, 356.0, 220.0, 107.0, 68.0, 46.0, 19.0, 12.0, 8.0, 8.0, 6.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.435546875, -3.34210205078125, -3.2486572265625, -3.15521240234375, -3.061767578125, -2.96832275390625, -2.8748779296875, -2.78143310546875, -2.68798828125, -2.59454345703125, -2.5010986328125, -2.40765380859375, -2.314208984375, -2.22076416015625, -2.1273193359375, -2.03387451171875, -1.9404296875, -1.84698486328125, -1.7535400390625, -1.66009521484375, -1.566650390625, -1.47320556640625, -1.3797607421875, -1.28631591796875, -1.19287109375, -1.09942626953125, -1.0059814453125, -0.91253662109375, -0.819091796875, -0.72564697265625, -0.6322021484375, -0.53875732421875, -0.4453125, -0.35186767578125, -0.2584228515625, -0.16497802734375, -0.071533203125, 0.02191162109375, 0.1153564453125, 0.20880126953125, 0.30224609375, 0.39569091796875, 0.4891357421875, 0.58258056640625, 0.676025390625, 0.76947021484375, 0.8629150390625, 0.95635986328125, 1.0498046875, 1.14324951171875, 1.2366943359375, 1.33013916015625, 1.423583984375, 1.51702880859375, 1.6104736328125, 1.70391845703125, 1.79736328125, 1.89080810546875, 1.9842529296875, 2.07769775390625, 2.171142578125, 2.26458740234375, 2.3580322265625, 2.45147705078125, 2.544921875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 10.0, 24.0, 16.0, 31.0, 61.0, 74.0, 103.0, 137.0, 158.0, 119.0, 85.0, 59.0, 48.0, 22.0, 16.0, 14.0, 8.0, 9.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003528594970703125, -0.0003422647714614868, -0.00033167004585266113, -0.00032107532024383545, -0.00031048059463500977, -0.0002998858690261841, -0.0002892911434173584, -0.0002786964178085327, -0.00026810169219970703, -0.00025750696659088135, -0.00024691224098205566, -0.00023631751537322998, -0.0002257227897644043, -0.0002151280641555786, -0.00020453333854675293, -0.00019393861293792725, -0.00018334388732910156, -0.00017274916172027588, -0.0001621544361114502, -0.0001515597105026245, -0.00014096498489379883, -0.00013037025928497314, -0.00011977553367614746, -0.00010918080806732178, -9.85860824584961e-05, -8.799135684967041e-05, -7.739663124084473e-05, -6.680190563201904e-05, -5.620718002319336e-05, -4.5612454414367676e-05, -3.501772880554199e-05, -2.442300319671631e-05, -1.3828277587890625e-05, -3.2335519790649414e-06, 7.361173629760742e-06, 1.7955899238586426e-05, 2.855062484741211e-05, 3.914535045623779e-05, 4.9740076065063477e-05, 6.033480167388916e-05, 7.092952728271484e-05, 8.152425289154053e-05, 9.211897850036621e-05, 0.0001027137041091919, 0.00011330842971801758, 0.00012390315532684326, 0.00013449788093566895, 0.00014509260654449463, 0.0001556873321533203, 0.000166282057762146, 0.00017687678337097168, 0.00018747150897979736, 0.00019806623458862305, 0.00020866096019744873, 0.00021925568580627441, 0.0002298504114151001, 0.00024044513702392578, 0.00025103986263275146, 0.00026163458824157715, 0.00027222931385040283, 0.0002828240394592285, 0.0002934187650680542, 0.0003040134906768799, 0.00031460821628570557, 0.00032520294189453125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 3.0, 5.0, 3.0, 5.0, 12.0, 17.0, 16.0, 34.0, 46.0, 77.0, 167.0, 344.0, 707.0, 2084.0, 8328.0, 69633.0, 644571.0, 292141.0, 24166.0, 4037.0, 1148.0, 476.0, 189.0, 132.0, 77.0, 51.0, 19.0, 22.0, 7.0, 10.0, 9.0, 9.0, 8.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-4.2421875, -4.14300537109375, -4.0438232421875, -3.94464111328125, -3.845458984375, -3.74627685546875, -3.6470947265625, -3.54791259765625, -3.44873046875, -3.34954833984375, -3.2503662109375, -3.15118408203125, -3.052001953125, -2.95281982421875, -2.8536376953125, -2.75445556640625, -2.6552734375, -2.55609130859375, -2.4569091796875, -2.35772705078125, -2.258544921875, -2.15936279296875, -2.0601806640625, -1.96099853515625, -1.86181640625, -1.76263427734375, -1.6634521484375, -1.56427001953125, -1.465087890625, -1.36590576171875, -1.2667236328125, -1.16754150390625, -1.068359375, -0.96917724609375, -0.8699951171875, -0.77081298828125, -0.671630859375, -0.57244873046875, -0.4732666015625, -0.37408447265625, -0.27490234375, -0.17572021484375, -0.0765380859375, 0.02264404296875, 0.121826171875, 0.22100830078125, 0.3201904296875, 0.41937255859375, 0.5185546875, 0.61773681640625, 0.7169189453125, 0.81610107421875, 0.915283203125, 1.01446533203125, 1.1136474609375, 1.21282958984375, 1.31201171875, 1.41119384765625, 1.5103759765625, 1.60955810546875, 1.708740234375, 1.80792236328125, 1.9071044921875, 2.00628662109375, 2.10546875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 4.0, 6.0, 4.0, 10.0, 15.0, 24.0, 26.0, 38.0, 44.0, 86.0, 73.0, 96.0, 94.0, 82.0, 77.0, 80.0, 61.0, 47.0, 35.0, 27.0, 17.0, 13.0, 6.0, 9.0, 4.0, 8.0, 4.0, 2.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.7080078125, -1.6679000854492188, -1.6277923583984375, -1.5876846313476562, -1.547576904296875, -1.5074691772460938, -1.4673614501953125, -1.4272537231445312, -1.38714599609375, -1.3470382690429688, -1.3069305419921875, -1.2668228149414062, -1.226715087890625, -1.1866073608398438, -1.1464996337890625, -1.1063919067382812, -1.0662841796875, -1.0261764526367188, -0.9860687255859375, -0.9459609985351562, -0.905853271484375, -0.8657455444335938, -0.8256378173828125, -0.7855300903320312, -0.74542236328125, -0.7053146362304688, -0.6652069091796875, -0.6250991821289062, -0.584991455078125, -0.5448837280273438, -0.5047760009765625, -0.46466827392578125, -0.424560546875, -0.38445281982421875, -0.3443450927734375, -0.30423736572265625, -0.264129638671875, -0.22402191162109375, -0.1839141845703125, -0.14380645751953125, -0.10369873046875, -0.06359100341796875, -0.0234832763671875, 0.01662445068359375, 0.056732177734375, 0.09683990478515625, 0.1369476318359375, 0.17705535888671875, 0.2171630859375, 0.25727081298828125, 0.2973785400390625, 0.33748626708984375, 0.377593994140625, 0.41770172119140625, 0.4578094482421875, 0.49791717529296875, 0.53802490234375, 0.5781326293945312, 0.6182403564453125, 0.6583480834960938, 0.698455810546875, 0.7385635375976562, 0.7786712646484375, 0.8187789916992188, 0.85888671875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 8.0, 34.0, 141.0, 436.0, 318.0, 57.0, 8.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.23845672607422, -17.749343872070312, -16.260231018066406, -14.7711181640625, -13.282005310058594, -11.792892456054688, -10.303780555725098, -8.814667701721191, -7.325554847717285, -5.836441993713379, -4.347329139709473, -2.8582167625427246, -1.3691039085388184, 0.12000894546508789, 1.609121322631836, 3.098234176635742, 4.587347030639648, 6.076459884643555, 7.565572738647461, 9.054685592651367, 10.543798446655273, 12.03291130065918, 13.52202320098877, 15.011136054992676, 16.500247955322266, 17.989360809326172, 19.478473663330078, 20.967586517333984, 22.45669937133789, 23.945812225341797, 25.434925079345703, 26.92403793334961, 28.413150787353516, 29.902263641357422, 31.391376495361328, 32.880489349365234, 34.36960220336914, 35.85871505737305, 37.34782791137695, 38.83694076538086, 40.326053619384766, 41.81516647338867, 43.30427932739258, 44.793392181396484, 46.28250503540039, 47.7716178894043, 49.2607307434082, 50.74984359741211, 52.23895263671875, 53.728065490722656, 55.21717834472656, 56.70629119873047, 58.195404052734375, 59.68451690673828, 61.17362976074219, 62.662742614746094, 64.15185546875, 65.6409683227539, 67.13008117675781, 68.61919403076172, 70.10830688476562, 71.59741973876953, 73.08653259277344, 74.57564544677734, 76.06475830078125]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 3.0, 5.0, 5.0, 7.0, 11.0, 12.0, 23.0, 10.0, 21.0, 20.0, 23.0, 33.0, 40.0, 34.0, 50.0, 48.0, 42.0, 62.0, 49.0, 41.0, 38.0, 54.0, 54.0, 34.0, 42.0, 35.0, 32.0, 33.0, 26.0, 23.0, 14.0, 15.0, 18.0, 7.0, 10.0, 8.0, 2.0, 5.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.494129180908203, -6.2764458656311035, -6.058763027191162, -5.8410797119140625, -5.623396396636963, -5.405713081359863, -5.188030242919922, -4.970346927642822, -4.752663612365723, -4.534980297088623, -4.317297458648682, -4.099614143371582, -3.8819308280944824, -3.664247751235962, -3.4465646743774414, -3.228881359100342, -3.0111982822418213, -2.793515205383301, -2.575831890106201, -2.3581488132476807, -2.140465497970581, -1.9227824211120605, -1.7050992250442505, -1.4874160289764404, -1.2697328329086304, -1.0520496368408203, -0.8343664407730103, -0.616683304309845, -0.3990001082420349, -0.18131697177886963, 0.03636622428894043, 0.2540494203567505, 0.47173261642456055, 0.6894158124923706, 0.9070990085601807, 1.1247820854187012, 1.3424654006958008, 1.5601484775543213, 1.7778316736221313, 1.9955148696899414, 2.213198184967041, 2.4308812618255615, 2.648564577102661, 2.8662476539611816, 3.0839309692382812, 3.3016140460968018, 3.5192971229553223, 3.736980438232422, 3.9546635150909424, 4.172346591949463, 4.3900299072265625, 4.607713222503662, 4.8253960609436035, 5.043079376220703, 5.260762691497803, 5.478446006774902, 5.696128845214844, 5.913812160491943, 6.131494998931885, 6.349178314208984, 6.566861629486084, 6.784544944763184, 7.002227783203125, 7.219911098480225, 7.437594413757324]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 3.0, 4.0, 8.0, 13.0, 29.0, 73.0, 150.0, 392.0, 1635.0, 12219.0, 594274.0, 3559695.0, 22443.0, 2367.0, 547.0, 204.0, 89.0, 52.0, 25.0, 26.0, 14.0, 8.0, 8.0, 5.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.443359375, -3.199371337890625, -2.95538330078125, -2.711395263671875, -2.4674072265625, -2.223419189453125, -1.97943115234375, -1.735443115234375, -1.491455078125, -1.247467041015625, -1.00347900390625, -0.759490966796875, -0.5155029296875, -0.271514892578125, -0.02752685546875, 0.216461181640625, 0.46044921875, 0.704437255859375, 0.94842529296875, 1.192413330078125, 1.4364013671875, 1.680389404296875, 1.92437744140625, 2.168365478515625, 2.412353515625, 2.656341552734375, 2.90032958984375, 3.144317626953125, 3.3883056640625, 3.632293701171875, 3.87628173828125, 4.120269775390625, 4.3642578125, 4.608245849609375, 4.85223388671875, 5.096221923828125, 5.3402099609375, 5.584197998046875, 5.82818603515625, 6.072174072265625, 6.316162109375, 6.560150146484375, 6.80413818359375, 7.048126220703125, 7.2921142578125, 7.536102294921875, 7.78009033203125, 8.024078369140625, 8.26806640625, 8.512054443359375, 8.75604248046875, 9.000030517578125, 9.2440185546875, 9.488006591796875, 9.73199462890625, 9.975982666015625, 10.219970703125, 10.463958740234375, 10.70794677734375, 10.951934814453125, 11.1959228515625, 11.439910888671875, 11.68389892578125, 11.927886962890625, 12.171875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 7.0, 6.0, 9.0, 20.0, 19.0, 30.0, 36.0, 39.0, 63.0, 73.0, 64.0, 80.0, 68.0, 79.0, 86.0, 56.0, 56.0, 50.0, 45.0, 34.0, 34.0, 9.0, 12.0, 10.0, 5.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2349853515625, -0.2261943817138672, -0.21740341186523438, -0.20861244201660156, -0.19982147216796875, -0.19103050231933594, -0.18223953247070312, -0.1734485626220703, -0.1646575927734375, -0.1558666229248047, -0.14707565307617188, -0.13828468322753906, -0.12949371337890625, -0.12070274353027344, -0.11191177368164062, -0.10312080383300781, -0.094329833984375, -0.08553886413574219, -0.07674789428710938, -0.06795692443847656, -0.05916595458984375, -0.05037498474121094, -0.041584014892578125, -0.03279304504394531, -0.0240020751953125, -0.015211105346679688, -0.006420135498046875, 0.0023708343505859375, 0.01116180419921875, 0.019952774047851562, 0.028743743896484375, 0.03753471374511719, 0.04632568359375, 0.05511665344238281, 0.06390762329101562, 0.07269859313964844, 0.08148956298828125, 0.09028053283691406, 0.09907150268554688, 0.10786247253417969, 0.1166534423828125, 0.1254444122314453, 0.13423538208007812, 0.14302635192871094, 0.15181732177734375, 0.16060829162597656, 0.16939926147460938, 0.1781902313232422, 0.186981201171875, 0.1957721710205078, 0.20456314086914062, 0.21335411071777344, 0.22214508056640625, 0.23093605041503906, 0.23972702026367188, 0.2485179901123047, 0.2573089599609375, 0.2660999298095703, 0.2748908996582031, 0.28368186950683594, 0.29247283935546875, 0.30126380920410156, 0.3100547790527344, 0.3188457489013672, 0.32763671875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 7.0, 12.0, 15.0, 47.0, 79.0, 186.0, 579.0, 5342.0, 4168900.0, 17522.0, 1020.0, 317.0, 114.0, 71.0, 34.0, 25.0, 3.0, 10.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2734375, -10.6331787109375, -9.992919921875, -9.3526611328125, -8.71240234375, -8.0721435546875, -7.431884765625, -6.7916259765625, -6.1513671875, -5.5111083984375, -4.870849609375, -4.2305908203125, -3.59033203125, -2.9500732421875, -2.309814453125, -1.6695556640625, -1.029296875, -0.3890380859375, 0.251220703125, 0.8914794921875, 1.53173828125, 2.1719970703125, 2.812255859375, 3.4525146484375, 4.0927734375, 4.7330322265625, 5.373291015625, 6.0135498046875, 6.65380859375, 7.2940673828125, 7.934326171875, 8.5745849609375, 9.21484375, 9.8551025390625, 10.495361328125, 11.1356201171875, 11.77587890625, 12.4161376953125, 13.056396484375, 13.6966552734375, 14.3369140625, 14.9771728515625, 15.617431640625, 16.2576904296875, 16.89794921875, 17.5382080078125, 18.178466796875, 18.8187255859375, 19.458984375, 20.0992431640625, 20.739501953125, 21.3797607421875, 22.02001953125, 22.6602783203125, 23.300537109375, 23.9407958984375, 24.5810546875, 25.2213134765625, 25.861572265625, 26.5018310546875, 27.14208984375, 27.7823486328125, 28.422607421875, 29.0628662109375, 29.703125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 7.0, 19.0, 24.0, 45.0, 90.0, 208.0, 506.0, 1739.0, 856.0, 320.0, 126.0, 55.0, 41.0, 19.0, 7.0, 2.0, 5.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52978515625, -0.49378204345703125, -0.4577789306640625, -0.42177581787109375, -0.385772705078125, -0.34976959228515625, -0.3137664794921875, -0.27776336669921875, -0.24176025390625, -0.20575714111328125, -0.1697540283203125, -0.13375091552734375, -0.097747802734375, -0.06174468994140625, -0.0257415771484375, 0.01026153564453125, 0.0462646484375, 0.08226776123046875, 0.1182708740234375, 0.15427398681640625, 0.190277099609375, 0.22628021240234375, 0.2622833251953125, 0.29828643798828125, 0.33428955078125, 0.37029266357421875, 0.4062957763671875, 0.44229888916015625, 0.478302001953125, 0.5143051147460938, 0.5503082275390625, 0.5863113403320312, 0.622314453125, 0.6583175659179688, 0.6943206787109375, 0.7303237915039062, 0.766326904296875, 0.8023300170898438, 0.8383331298828125, 0.8743362426757812, 0.91033935546875, 0.9463424682617188, 0.9823455810546875, 1.0183486938476562, 1.054351806640625, 1.0903549194335938, 1.1263580322265625, 1.1623611450195312, 1.1983642578125, 1.2343673706054688, 1.2703704833984375, 1.3063735961914062, 1.342376708984375, 1.3783798217773438, 1.4143829345703125, 1.4503860473632812, 1.48638916015625, 1.5223922729492188, 1.5583953857421875, 1.5943984985351562, 1.630401611328125, 1.6664047241210938, 1.7024078369140625, 1.7384109497070312, 1.7744140625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 38.0, 511.0, 406.0, 36.0, 9.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.10993194580078, -51.952728271484375, -50.795528411865234, -49.638328552246094, -48.48112487792969, -47.32392120361328, -46.16672134399414, -45.009521484375, -43.852317810058594, -42.69511413574219, -41.53791427612305, -40.380714416503906, -39.2235107421875, -38.066307067871094, -36.90910720825195, -35.75190734863281, -34.594703674316406, -33.4375, -32.28030014038086, -31.123098373413086, -29.965896606445312, -28.80869483947754, -27.651493072509766, -26.494291305541992, -25.33708953857422, -24.179887771606445, -23.022686004638672, -21.8654842376709, -20.708282470703125, -19.55108070373535, -18.393878936767578, -17.236677169799805, -16.079479217529297, -14.922277450561523, -13.76507568359375, -12.607873916625977, -11.450672149658203, -10.29347038269043, -9.136268615722656, -7.979066848754883, -6.821865081787109, -5.664663314819336, -4.5074615478515625, -3.350259780883789, -2.1930580139160156, -1.0358562469482422, 0.12134552001953125, 1.2785472869873047, 2.435749053955078, 3.5929508209228516, 4.750152587890625, 5.907354354858398, 7.064556121826172, 8.221757888793945, 9.378959655761719, 10.536161422729492, 11.693363189697266, 12.850564956665039, 14.007766723632812, 15.164968490600586, 16.32217025756836, 17.479372024536133, 18.636573791503906, 19.79377555847168, 20.950977325439453]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 8.0, 13.0, 9.0, 8.0, 22.0, 24.0, 35.0, 33.0, 50.0, 66.0, 57.0, 73.0, 71.0, 69.0, 70.0, 65.0, 65.0, 69.0, 43.0, 32.0, 30.0, 26.0, 21.0, 10.0, 13.0, 7.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.728523254394531, -4.588433742523193, -4.4483442306518555, -4.308254718780518, -4.16816520690918, -4.028076171875, -3.887986660003662, -3.747897148132324, -3.6078076362609863, -3.4677181243896484, -3.3276286125183105, -3.1875393390655518, -3.047449827194214, -2.907360315322876, -2.767271041870117, -2.6271815299987793, -2.4870920181274414, -2.3470025062561035, -2.2069129943847656, -2.066823720932007, -1.926734209060669, -1.786644697189331, -1.6465553045272827, -1.5064659118652344, -1.3663763999938965, -1.2262868881225586, -1.0861974954605103, -0.9461080431938171, -0.806018590927124, -0.6659291386604309, -0.5258396863937378, -0.3857502341270447, -0.24566125869750977, -0.10557180643081665, 0.034517645835876465, 0.17460709810256958, 0.3146965503692627, 0.4547860026359558, 0.5948754549026489, 0.734964907169342, 0.8750543594360352, 1.015143871307373, 1.1552332639694214, 1.2953226566314697, 1.4354121685028076, 1.5755016803741455, 1.7155910730361938, 1.8556804656982422, 1.99576997756958, 2.135859489440918, 2.275949001312256, 2.4160382747650146, 2.5561277866363525, 2.6962172985076904, 2.836306571960449, 2.976396083831787, 3.116485595703125, 3.256575107574463, 3.396664619445801, 3.5367538928985596, 3.6768434047698975, 3.8169329166412354, 3.957022190093994, 4.097111701965332, 4.23720121383667]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 6.0, 4.0, 8.0, 7.0, 15.0, 16.0, 19.0, 26.0, 41.0, 41.0, 55.0, 91.0, 104.0, 173.0, 253.0, 404.0, 721.0, 1509.0, 3935.0, 13462.0, 58796.0, 305040.0, 504920.0, 121870.0, 25635.0, 6619.0, 2269.0, 961.0, 515.0, 291.0, 218.0, 134.0, 101.0, 55.0, 67.0, 41.0, 27.0, 33.0, 19.0, 13.0, 10.0, 10.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.6875, -3.576507568359375, -3.46551513671875, -3.354522705078125, -3.2435302734375, -3.132537841796875, -3.02154541015625, -2.910552978515625, -2.799560546875, -2.688568115234375, -2.57757568359375, -2.466583251953125, -2.3555908203125, -2.244598388671875, -2.13360595703125, -2.022613525390625, -1.91162109375, -1.800628662109375, -1.68963623046875, -1.578643798828125, -1.4676513671875, -1.356658935546875, -1.24566650390625, -1.134674072265625, -1.023681640625, -0.912689208984375, -0.80169677734375, -0.690704345703125, -0.5797119140625, -0.468719482421875, -0.35772705078125, -0.246734619140625, -0.1357421875, -0.024749755859375, 0.08624267578125, 0.197235107421875, 0.3082275390625, 0.419219970703125, 0.53021240234375, 0.641204833984375, 0.752197265625, 0.863189697265625, 0.97418212890625, 1.085174560546875, 1.1961669921875, 1.307159423828125, 1.41815185546875, 1.529144287109375, 1.64013671875, 1.751129150390625, 1.86212158203125, 1.973114013671875, 2.0841064453125, 2.195098876953125, 2.30609130859375, 2.417083740234375, 2.528076171875, 2.639068603515625, 2.75006103515625, 2.861053466796875, 2.9720458984375, 3.083038330078125, 3.19403076171875, 3.305023193359375, 3.416015625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 9.0, 8.0, 12.0, 19.0, 23.0, 27.0, 38.0, 37.0, 45.0, 46.0, 51.0, 74.0, 59.0, 63.0, 63.0, 69.0, 77.0, 54.0, 36.0, 31.0, 38.0, 41.0, 28.0, 15.0, 13.0, 8.0, 3.0, 2.0, 3.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.33203125, -0.3219032287597656, -0.31177520751953125, -0.3016471862792969, -0.2915191650390625, -0.2813911437988281, -0.27126312255859375, -0.2611351013183594, -0.251007080078125, -0.24087905883789062, -0.23075103759765625, -0.22062301635742188, -0.2104949951171875, -0.20036697387695312, -0.19023895263671875, -0.18011093139648438, -0.16998291015625, -0.15985488891601562, -0.14972686767578125, -0.13959884643554688, -0.1294708251953125, -0.11934280395507812, -0.10921478271484375, -0.09908676147460938, -0.088958740234375, -0.07883071899414062, -0.06870269775390625, -0.058574676513671875, -0.0484466552734375, -0.038318634033203125, -0.02819061279296875, -0.018062591552734375, -0.0079345703125, 0.002193450927734375, 0.01232147216796875, 0.022449493408203125, 0.0325775146484375, 0.042705535888671875, 0.05283355712890625, 0.06296157836914062, 0.073089599609375, 0.08321762084960938, 0.09334564208984375, 0.10347366333007812, 0.1136016845703125, 0.12372970581054688, 0.13385772705078125, 0.14398574829101562, 0.15411376953125, 0.16424179077148438, 0.17436981201171875, 0.18449783325195312, 0.1946258544921875, 0.20475387573242188, 0.21488189697265625, 0.22500991821289062, 0.235137939453125, 0.24526596069335938, 0.25539398193359375, 0.2655220031738281, 0.2756500244140625, 0.2857780456542969, 0.29590606689453125, 0.3060340881347656, 0.316162109375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 8.0, 13.0, 12.0, 27.0, 24.0, 66.0, 79.0, 130.0, 255.0, 455.0, 899.0, 1938.0, 4481.0, 11624.0, 37228.0, 138482.0, 420735.0, 309941.0, 83977.0, 23938.0, 8064.0, 3188.0, 1374.0, 718.0, 367.0, 168.0, 135.0, 77.0, 49.0, 37.0, 18.0, 12.0, 10.0, 2.0, 6.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.630859375, -2.557403564453125, -2.48394775390625, -2.410491943359375, -2.3370361328125, -2.263580322265625, -2.19012451171875, -2.116668701171875, -2.043212890625, -1.969757080078125, -1.89630126953125, -1.822845458984375, -1.7493896484375, -1.675933837890625, -1.60247802734375, -1.529022216796875, -1.45556640625, -1.382110595703125, -1.30865478515625, -1.235198974609375, -1.1617431640625, -1.088287353515625, -1.01483154296875, -0.941375732421875, -0.867919921875, -0.794464111328125, -0.72100830078125, -0.647552490234375, -0.5740966796875, -0.500640869140625, -0.42718505859375, -0.353729248046875, -0.2802734375, -0.206817626953125, -0.13336181640625, -0.059906005859375, 0.0135498046875, 0.087005615234375, 0.16046142578125, 0.233917236328125, 0.307373046875, 0.380828857421875, 0.45428466796875, 0.527740478515625, 0.6011962890625, 0.674652099609375, 0.74810791015625, 0.821563720703125, 0.89501953125, 0.968475341796875, 1.04193115234375, 1.115386962890625, 1.1888427734375, 1.262298583984375, 1.33575439453125, 1.409210205078125, 1.482666015625, 1.556121826171875, 1.62957763671875, 1.703033447265625, 1.7764892578125, 1.849945068359375, 1.92340087890625, 1.996856689453125, 2.0703125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 3.0, 8.0, 4.0, 6.0, 9.0, 11.0, 11.0, 10.0, 14.0, 20.0, 19.0, 25.0, 21.0, 29.0, 35.0, 36.0, 49.0, 35.0, 48.0, 40.0, 50.0, 37.0, 39.0, 36.0, 41.0, 29.0, 41.0, 26.0, 37.0, 35.0, 35.0, 32.0, 15.0, 30.0, 18.0, 14.0, 16.0, 12.0, 2.0, 1.0, 7.0, 3.0, 5.0, 5.0, 2.0, 3.0, 2.0, 4.0], "bins": [-1.3037109375, -1.2694625854492188, -1.2352142333984375, -1.2009658813476562, -1.166717529296875, -1.1324691772460938, -1.0982208251953125, -1.0639724731445312, -1.02972412109375, -0.9954757690429688, -0.9612274169921875, -0.9269790649414062, -0.892730712890625, -0.8584823608398438, -0.8242340087890625, -0.7899856567382812, -0.7557373046875, -0.7214889526367188, -0.6872406005859375, -0.6529922485351562, -0.618743896484375, -0.5844955444335938, -0.5502471923828125, -0.5159988403320312, -0.48175048828125, -0.44750213623046875, -0.4132537841796875, -0.37900543212890625, -0.344757080078125, -0.31050872802734375, -0.2762603759765625, -0.24201202392578125, -0.207763671875, -0.17351531982421875, -0.1392669677734375, -0.10501861572265625, -0.070770263671875, -0.03652191162109375, -0.0022735595703125, 0.03197479248046875, 0.06622314453125, 0.10047149658203125, 0.1347198486328125, 0.16896820068359375, 0.203216552734375, 0.23746490478515625, 0.2717132568359375, 0.30596160888671875, 0.3402099609375, 0.37445831298828125, 0.4087066650390625, 0.44295501708984375, 0.477203369140625, 0.5114517211914062, 0.5457000732421875, 0.5799484252929688, 0.61419677734375, 0.6484451293945312, 0.6826934814453125, 0.7169418334960938, 0.751190185546875, 0.7854385375976562, 0.8196868896484375, 0.8539352416992188, 0.88818359375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 10.0, 7.0, 14.0, 10.0, 18.0, 31.0, 46.0, 52.0, 97.0, 136.0, 175.0, 282.0, 436.0, 680.0, 1216.0, 2215.0, 4767.0, 11350.0, 33002.0, 119041.0, 385624.0, 343644.0, 98618.0, 27857.0, 9964.0, 4172.0, 2111.0, 1100.0, 668.0, 394.0, 253.0, 159.0, 141.0, 81.0, 48.0, 34.0, 20.0, 29.0, 21.0, 5.0, 7.0, 7.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3408203125, -1.2974700927734375, -1.254119873046875, -1.2107696533203125, -1.16741943359375, -1.1240692138671875, -1.080718994140625, -1.0373687744140625, -0.9940185546875, -0.9506683349609375, -0.907318115234375, -0.8639678955078125, -0.82061767578125, -0.7772674560546875, -0.733917236328125, -0.6905670166015625, -0.647216796875, -0.6038665771484375, -0.560516357421875, -0.5171661376953125, -0.47381591796875, -0.4304656982421875, -0.387115478515625, -0.3437652587890625, -0.3004150390625, -0.2570648193359375, -0.213714599609375, -0.1703643798828125, -0.12701416015625, -0.0836639404296875, -0.040313720703125, 0.0030364990234375, 0.04638671875, 0.0897369384765625, 0.133087158203125, 0.1764373779296875, 0.21978759765625, 0.2631378173828125, 0.306488037109375, 0.3498382568359375, 0.3931884765625, 0.4365386962890625, 0.479888916015625, 0.5232391357421875, 0.56658935546875, 0.6099395751953125, 0.653289794921875, 0.6966400146484375, 0.739990234375, 0.7833404541015625, 0.826690673828125, 0.8700408935546875, 0.91339111328125, 0.9567413330078125, 1.000091552734375, 1.0434417724609375, 1.0867919921875, 1.1301422119140625, 1.173492431640625, 1.2168426513671875, 1.26019287109375, 1.3035430908203125, 1.346893310546875, 1.3902435302734375, 1.43359375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 5.0, 7.0, 13.0, 11.0, 13.0, 15.0, 26.0, 29.0, 32.0, 44.0, 54.0, 58.0, 82.0, 100.0, 69.0, 66.0, 66.0, 54.0, 70.0, 42.0, 19.0, 24.0, 17.0, 21.0, 12.0, 10.0, 5.0, 10.0, 1.0, 1.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.00017642974853515625, -0.0001715049147605896, -0.00016658008098602295, -0.0001616552472114563, -0.00015673041343688965, -0.000151805579662323, -0.00014688074588775635, -0.0001419559121131897, -0.00013703107833862305, -0.0001321062445640564, -0.00012718141078948975, -0.0001222565770149231, -0.00011733174324035645, -0.0001124069094657898, -0.00010748207569122314, -0.0001025572419166565, -9.763240814208984e-05, -9.27075743675232e-05, -8.778274059295654e-05, -8.285790681838989e-05, -7.793307304382324e-05, -7.300823926925659e-05, -6.808340549468994e-05, -6.315857172012329e-05, -5.823373794555664e-05, -5.330890417098999e-05, -4.838407039642334e-05, -4.345923662185669e-05, -3.853440284729004e-05, -3.360956907272339e-05, -2.8684735298156738e-05, -2.3759901523590088e-05, -1.8835067749023438e-05, -1.3910233974456787e-05, -8.985400199890137e-06, -4.060566425323486e-06, 8.642673492431641e-07, 5.7891011238098145e-06, 1.0713934898376465e-05, 1.5638768672943115e-05, 2.0563602447509766e-05, 2.5488436222076416e-05, 3.0413269996643066e-05, 3.533810377120972e-05, 4.026293754577637e-05, 4.518777132034302e-05, 5.011260509490967e-05, 5.503743886947632e-05, 5.996227264404297e-05, 6.488710641860962e-05, 6.981194019317627e-05, 7.473677396774292e-05, 7.966160774230957e-05, 8.458644151687622e-05, 8.951127529144287e-05, 9.443610906600952e-05, 9.936094284057617e-05, 0.00010428577661514282, 0.00010921061038970947, 0.00011413544416427612, 0.00011906027793884277, 0.00012398511171340942, 0.00012890994548797607, 0.00013383477926254272, 0.00013875961303710938]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 0.0, 10.0, 7.0, 13.0, 16.0, 24.0, 48.0, 115.0, 226.0, 565.0, 1499.0, 4737.0, 20282.0, 144192.0, 650952.0, 192130.0, 25379.0, 5441.0, 1723.0, 615.0, 314.0, 121.0, 62.0, 30.0, 17.0, 14.0, 7.0, 4.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.408203125, -2.336456298828125, -2.26470947265625, -2.192962646484375, -2.1212158203125, -2.049468994140625, -1.97772216796875, -1.905975341796875, -1.834228515625, -1.762481689453125, -1.69073486328125, -1.618988037109375, -1.5472412109375, -1.475494384765625, -1.40374755859375, -1.332000732421875, -1.26025390625, -1.188507080078125, -1.11676025390625, -1.045013427734375, -0.9732666015625, -0.901519775390625, -0.82977294921875, -0.758026123046875, -0.686279296875, -0.614532470703125, -0.54278564453125, -0.471038818359375, -0.3992919921875, -0.327545166015625, -0.25579833984375, -0.184051513671875, -0.1123046875, -0.040557861328125, 0.03118896484375, 0.102935791015625, 0.1746826171875, 0.246429443359375, 0.31817626953125, 0.389923095703125, 0.461669921875, 0.533416748046875, 0.60516357421875, 0.676910400390625, 0.7486572265625, 0.820404052734375, 0.89215087890625, 0.963897705078125, 1.03564453125, 1.107391357421875, 1.17913818359375, 1.250885009765625, 1.3226318359375, 1.394378662109375, 1.46612548828125, 1.537872314453125, 1.609619140625, 1.681365966796875, 1.75311279296875, 1.824859619140625, 1.8966064453125, 1.968353271484375, 2.04010009765625, 2.111846923828125, 2.18359375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 3.0, 7.0, 20.0, 23.0, 33.0, 38.0, 49.0, 81.0, 86.0, 107.0, 97.0, 88.0, 85.0, 62.0, 50.0, 39.0, 27.0, 25.0, 24.0, 9.0, 10.0, 9.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5302734375, -1.48486328125, -1.439453125, -1.39404296875, -1.3486328125, -1.30322265625, -1.2578125, -1.21240234375, -1.1669921875, -1.12158203125, -1.076171875, -1.03076171875, -0.9853515625, -0.93994140625, -0.89453125, -0.84912109375, -0.8037109375, -0.75830078125, -0.712890625, -0.66748046875, -0.6220703125, -0.57666015625, -0.53125, -0.48583984375, -0.4404296875, -0.39501953125, -0.349609375, -0.30419921875, -0.2587890625, -0.21337890625, -0.16796875, -0.12255859375, -0.0771484375, -0.03173828125, 0.013671875, 0.05908203125, 0.1044921875, 0.14990234375, 0.1953125, 0.24072265625, 0.2861328125, 0.33154296875, 0.376953125, 0.42236328125, 0.4677734375, 0.51318359375, 0.55859375, 0.60400390625, 0.6494140625, 0.69482421875, 0.740234375, 0.78564453125, 0.8310546875, 0.87646484375, 0.921875, 0.96728515625, 1.0126953125, 1.05810546875, 1.103515625, 1.14892578125, 1.1943359375, 1.23974609375, 1.28515625, 1.33056640625, 1.3759765625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 7.0, 11.0, 31.0, 94.0, 238.0, 339.0, 191.0, 63.0, 17.0, 5.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.248069763183594, -48.1144905090332, -46.98091125488281, -45.84733200073242, -44.71375274658203, -43.58017349243164, -42.44659423828125, -41.313018798828125, -40.17943572998047, -39.04585647583008, -37.91227722167969, -36.7786979675293, -35.645118713378906, -34.511539459228516, -33.377960205078125, -32.244384765625, -31.11080551147461, -29.97722625732422, -28.843647003173828, -27.710067749023438, -26.576488494873047, -25.442909240722656, -24.3093318939209, -23.175752639770508, -22.042173385620117, -20.908594131469727, -19.775014877319336, -18.641435623168945, -17.507858276367188, -16.374279022216797, -15.240699768066406, -14.107120513916016, -12.97354507446289, -11.8399658203125, -10.70638656616211, -9.572808265686035, -8.439229011535645, -7.305649757385254, -6.1720709800720215, -5.038492202758789, -3.9049129486083984, -2.771333932876587, -1.6377549171447754, -0.5041759014129639, 0.6294031143188477, 1.7629823684692383, 2.8965611457824707, 4.030139923095703, 5.163719177246094, 6.297298431396484, 7.430877208709717, 8.56445598602295, 9.69803524017334, 10.83161449432373, 11.965192794799805, 13.098772048950195, 14.232351303100586, 15.365930557250977, 16.499509811401367, 17.633089065551758, 18.766666412353516, 19.900245666503906, 21.033824920654297, 22.167404174804688, 23.300983428955078]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 6.0, 4.0, 9.0, 10.0, 11.0, 22.0, 14.0, 19.0, 36.0, 36.0, 38.0, 33.0, 43.0, 57.0, 41.0, 48.0, 47.0, 59.0, 52.0, 57.0, 44.0, 55.0, 40.0, 40.0, 33.0, 24.0, 20.0, 26.0, 20.0, 12.0, 11.0, 9.0, 2.0, 9.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-9.185792922973633, -8.92286205291748, -8.659931182861328, -8.397000312805176, -8.134069442749023, -7.871138095855713, -7.608206748962402, -7.34527587890625, -7.082345008850098, -6.819414138793945, -6.556483268737793, -6.293551921844482, -6.03062105178833, -5.767690181732178, -5.504758834838867, -5.241827964782715, -4.9788970947265625, -4.71596622467041, -4.453035354614258, -4.190104007720947, -3.927173137664795, -3.6642422676086426, -3.401311159133911, -3.1383800506591797, -2.8754491806030273, -2.612518310546875, -2.3495872020721436, -2.086656093597412, -1.8237252235412598, -1.5607942342758179, -1.297863245010376, -1.034932255744934, -0.7720017433166504, -0.5090707540512085, -0.2461397647857666, 0.016791224479675293, 0.2797222137451172, 0.5426532030105591, 0.805584192276001, 1.0685151815414429, 1.3314461708068848, 1.5943771600723267, 1.8573081493377686, 2.1202392578125, 2.3831701278686523, 2.6461009979248047, 2.909032106399536, 3.1719632148742676, 3.43489408493042, 3.6978249549865723, 3.9607560634613037, 4.223687171936035, 4.4866180419921875, 4.74954891204834, 5.012479782104492, 5.275411128997803, 5.538341999053955, 5.801272869110107, 6.064204216003418, 6.32713508605957, 6.590065956115723, 6.852996826171875, 7.115927696228027, 7.378859043121338, 7.64178991317749]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 7.0, 12.0, 16.0, 26.0, 52.0, 91.0, 159.0, 297.0, 688.0, 1755.0, 5959.0, 33002.0, 855233.0, 3233293.0, 51661.0, 7903.0, 2235.0, 875.0, 442.0, 205.0, 128.0, 79.0, 57.0, 30.0, 22.0, 10.0, 13.0, 8.0, 8.0, 5.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.037109375, -2.886016845703125, -2.73492431640625, -2.583831787109375, -2.4327392578125, -2.281646728515625, -2.13055419921875, -1.979461669921875, -1.828369140625, -1.677276611328125, -1.52618408203125, -1.375091552734375, -1.2239990234375, -1.072906494140625, -0.92181396484375, -0.770721435546875, -0.61962890625, -0.468536376953125, -0.31744384765625, -0.166351318359375, -0.0152587890625, 0.135833740234375, 0.28692626953125, 0.438018798828125, 0.589111328125, 0.740203857421875, 0.89129638671875, 1.042388916015625, 1.1934814453125, 1.344573974609375, 1.49566650390625, 1.646759033203125, 1.7978515625, 1.948944091796875, 2.10003662109375, 2.251129150390625, 2.4022216796875, 2.553314208984375, 2.70440673828125, 2.855499267578125, 3.006591796875, 3.157684326171875, 3.30877685546875, 3.459869384765625, 3.6109619140625, 3.762054443359375, 3.91314697265625, 4.064239501953125, 4.21533203125, 4.366424560546875, 4.51751708984375, 4.668609619140625, 4.8197021484375, 4.970794677734375, 5.12188720703125, 5.272979736328125, 5.424072265625, 5.575164794921875, 5.72625732421875, 5.877349853515625, 6.0284423828125, 6.179534912109375, 6.33062744140625, 6.481719970703125, 6.6328125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 7.0, 7.0, 5.0, 11.0, 20.0, 23.0, 27.0, 37.0, 46.0, 48.0, 44.0, 53.0, 59.0, 56.0, 65.0, 59.0, 57.0, 49.0, 68.0, 50.0, 49.0, 31.0, 31.0, 25.0, 14.0, 15.0, 12.0, 6.0, 6.0, 6.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.320068359375, -0.3100318908691406, -0.29999542236328125, -0.2899589538574219, -0.2799224853515625, -0.2698860168457031, -0.25984954833984375, -0.24981307983398438, -0.239776611328125, -0.22974014282226562, -0.21970367431640625, -0.20966720581054688, -0.1996307373046875, -0.18959426879882812, -0.17955780029296875, -0.16952133178710938, -0.15948486328125, -0.14944839477539062, -0.13941192626953125, -0.12937545776367188, -0.1193389892578125, -0.10930252075195312, -0.09926605224609375, -0.08922958374023438, -0.079193115234375, -0.06915664672851562, -0.05912017822265625, -0.049083709716796875, -0.0390472412109375, -0.029010772705078125, -0.01897430419921875, -0.008937835693359375, 0.0010986328125, 0.011135101318359375, 0.02117156982421875, 0.031208038330078125, 0.0412445068359375, 0.051280975341796875, 0.06131744384765625, 0.07135391235351562, 0.081390380859375, 0.09142684936523438, 0.10146331787109375, 0.11149978637695312, 0.1215362548828125, 0.13157272338867188, 0.14160919189453125, 0.15164566040039062, 0.16168212890625, 0.17171859741210938, 0.18175506591796875, 0.19179153442382812, 0.2018280029296875, 0.21186447143554688, 0.22190093994140625, 0.23193740844726562, 0.241973876953125, 0.2520103454589844, 0.26204681396484375, 0.2720832824707031, 0.2821197509765625, 0.2921562194824219, 0.30219268798828125, 0.3122291564941406, 0.322265625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 11.0, 15.0, 23.0, 27.0, 33.0, 51.0, 56.0, 90.0, 150.0, 689.0, 4163884.0, 28595.0, 313.0, 122.0, 75.0, 46.0, 34.0, 28.0, 18.0, 6.0, 9.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.6875, -45.645751953125, -44.60400390625, -43.562255859375, -42.5205078125, -41.478759765625, -40.43701171875, -39.395263671875, -38.353515625, -37.311767578125, -36.27001953125, -35.228271484375, -34.1865234375, -33.144775390625, -32.10302734375, -31.061279296875, -30.01953125, -28.977783203125, -27.93603515625, -26.894287109375, -25.8525390625, -24.810791015625, -23.76904296875, -22.727294921875, -21.685546875, -20.643798828125, -19.60205078125, -18.560302734375, -17.5185546875, -16.476806640625, -15.43505859375, -14.393310546875, -13.3515625, -12.309814453125, -11.26806640625, -10.226318359375, -9.1845703125, -8.142822265625, -7.10107421875, -6.059326171875, -5.017578125, -3.975830078125, -2.93408203125, -1.892333984375, -0.8505859375, 0.191162109375, 1.23291015625, 2.274658203125, 3.31640625, 4.358154296875, 5.39990234375, 6.441650390625, 7.4833984375, 8.525146484375, 9.56689453125, 10.608642578125, 11.650390625, 12.692138671875, 13.73388671875, 14.775634765625, 15.8173828125, 16.859130859375, 17.90087890625, 18.942626953125, 19.984375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 10.0, 40.0, 333.0, 3221.0, 434.0, 41.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.125, -5.99334716796875, -5.8616943359375, -5.73004150390625, -5.598388671875, -5.46673583984375, -5.3350830078125, -5.20343017578125, -5.07177734375, -4.94012451171875, -4.8084716796875, -4.67681884765625, -4.545166015625, -4.41351318359375, -4.2818603515625, -4.15020751953125, -4.0185546875, -3.88690185546875, -3.7552490234375, -3.62359619140625, -3.491943359375, -3.36029052734375, -3.2286376953125, -3.09698486328125, -2.96533203125, -2.83367919921875, -2.7020263671875, -2.57037353515625, -2.438720703125, -2.30706787109375, -2.1754150390625, -2.04376220703125, -1.912109375, -1.78045654296875, -1.6488037109375, -1.51715087890625, -1.385498046875, -1.25384521484375, -1.1221923828125, -0.99053955078125, -0.85888671875, -0.72723388671875, -0.5955810546875, -0.46392822265625, -0.332275390625, -0.20062255859375, -0.0689697265625, 0.06268310546875, 0.1943359375, 0.32598876953125, 0.4576416015625, 0.58929443359375, 0.720947265625, 0.85260009765625, 0.9842529296875, 1.11590576171875, 1.24755859375, 1.37921142578125, 1.5108642578125, 1.64251708984375, 1.774169921875, 1.90582275390625, 2.0374755859375, 2.16912841796875, 2.30078125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 23.0, 777.0, 204.0, 9.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.78047561645508, -38.81562423706055, -36.85077667236328, -34.88592529296875, -32.92107391357422, -30.956226348876953, -28.991374969482422, -27.026525497436523, -25.061676025390625, -23.096826553344727, -21.131977081298828, -19.167125701904297, -17.2022762298584, -15.2374267578125, -13.272576332092285, -11.30772590637207, -9.342876434326172, -7.378026485443115, -5.413176536560059, -3.448326587677002, -1.4834766387939453, 0.4813728332519531, 2.446223258972168, 4.411073684692383, 6.375923156738281, 8.34077262878418, 10.305623054504395, 12.27047348022461, 14.235322952270508, 16.200172424316406, 18.165023803710938, 20.129873275756836, 22.09471893310547, 24.059568405151367, 26.024417877197266, 27.989269256591797, 29.954118728637695, 31.918968200683594, 33.883819580078125, 35.848670959472656, 37.81351852416992, 39.77836990356445, 41.74321746826172, 43.70806884765625, 45.67292022705078, 47.63776779174805, 49.60261917114258, 51.567466735839844, 53.532318115234375, 55.497169494628906, 57.46201705932617, 59.4268684387207, 61.39171600341797, 63.3565673828125, 65.32141876220703, 67.28627014160156, 69.25111389160156, 71.2159652709961, 73.18081665039062, 75.14566040039062, 77.11051177978516, 79.07536315917969, 81.04021453857422, 83.00506591796875, 84.96991729736328]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 9.0, 6.0, 19.0, 26.0, 47.0, 76.0, 94.0, 108.0, 117.0, 109.0, 115.0, 111.0, 70.0, 38.0, 33.0, 17.0, 8.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.464579105377197, -7.1965651512146, -6.928551197052002, -6.660537242889404, -6.392522811889648, -6.124508857727051, -5.856494903564453, -5.5884809494018555, -5.320466995239258, -5.05245304107666, -4.7844390869140625, -4.516425132751465, -4.248411178588867, -3.9803969860076904, -3.7123827934265137, -3.444368839263916, -3.1763548851013184, -2.9083409309387207, -2.640326976776123, -2.3723127841949463, -2.1042988300323486, -1.836284875869751, -1.5682708024978638, -1.3002567291259766, -1.032242774963379, -0.7642287611961365, -0.49621474742889404, -0.2282007336616516, 0.03981328010559082, 0.3078272342681885, 0.5758413076400757, 0.8438553810119629, 1.1118698120117188, 1.3798837661743164, 1.6478978395462036, 1.9159119129180908, 2.1839258670806885, 2.451939821243286, 2.719954013824463, 2.9879679679870605, 3.255981922149658, 3.523995876312256, 3.7920098304748535, 4.060023784637451, 4.328038215637207, 4.596052169799805, 4.864066123962402, 5.132080078125, 5.400094032287598, 5.668107986450195, 5.936121940612793, 6.204135894775391, 6.472149848937988, 6.740163803100586, 7.008178234100342, 7.2761921882629395, 7.544206142425537, 7.812220096588135, 8.08023452758789, 8.348248481750488, 8.616262435913086, 8.884276390075684, 9.152290344238281, 9.420304298400879, 9.688318252563477]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 2.0, 2.0, 4.0, 8.0, 17.0, 17.0, 23.0, 44.0, 60.0, 57.0, 104.0, 192.0, 280.0, 571.0, 1105.0, 2150.0, 5284.0, 14483.0, 46043.0, 156196.0, 391562.0, 292564.0, 93300.0, 28131.0, 9198.0, 3573.0, 1636.0, 814.0, 421.0, 233.0, 163.0, 80.0, 72.0, 38.0, 29.0, 24.0, 19.0, 22.0, 11.0, 3.0, 5.0, 1.0, 9.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.224609375, -2.1473388671875, -2.070068359375, -1.9927978515625, -1.91552734375, -1.8382568359375, -1.760986328125, -1.6837158203125, -1.6064453125, -1.5291748046875, -1.451904296875, -1.3746337890625, -1.29736328125, -1.2200927734375, -1.142822265625, -1.0655517578125, -0.98828125, -0.9110107421875, -0.833740234375, -0.7564697265625, -0.67919921875, -0.6019287109375, -0.524658203125, -0.4473876953125, -0.3701171875, -0.2928466796875, -0.215576171875, -0.1383056640625, -0.06103515625, 0.0162353515625, 0.093505859375, 0.1707763671875, 0.248046875, 0.3253173828125, 0.402587890625, 0.4798583984375, 0.55712890625, 0.6343994140625, 0.711669921875, 0.7889404296875, 0.8662109375, 0.9434814453125, 1.020751953125, 1.0980224609375, 1.17529296875, 1.2525634765625, 1.329833984375, 1.4071044921875, 1.484375, 1.5616455078125, 1.638916015625, 1.7161865234375, 1.79345703125, 1.8707275390625, 1.947998046875, 2.0252685546875, 2.1025390625, 2.1798095703125, 2.257080078125, 2.3343505859375, 2.41162109375, 2.4888916015625, 2.566162109375, 2.6434326171875, 2.720703125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 2.0, 4.0, 10.0, 17.0, 17.0, 11.0, 22.0, 30.0, 25.0, 47.0, 34.0, 44.0, 44.0, 64.0, 63.0, 53.0, 51.0, 46.0, 56.0, 45.0, 50.0, 47.0, 40.0, 33.0, 33.0, 30.0, 23.0, 14.0, 14.0, 9.0, 6.0, 6.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.323486328125, -0.3138389587402344, -0.30419158935546875, -0.2945442199707031, -0.2848968505859375, -0.2752494812011719, -0.26560211181640625, -0.2559547424316406, -0.246307373046875, -0.23666000366210938, -0.22701263427734375, -0.21736526489257812, -0.2077178955078125, -0.19807052612304688, -0.18842315673828125, -0.17877578735351562, -0.16912841796875, -0.15948104858398438, -0.14983367919921875, -0.14018630981445312, -0.1305389404296875, -0.12089157104492188, -0.11124420166015625, -0.10159683227539062, -0.091949462890625, -0.08230209350585938, -0.07265472412109375, -0.06300735473632812, -0.0533599853515625, -0.043712615966796875, -0.03406524658203125, -0.024417877197265625, -0.0147705078125, -0.005123138427734375, 0.00452423095703125, 0.014171600341796875, 0.0238189697265625, 0.033466339111328125, 0.04311370849609375, 0.052761077880859375, 0.062408447265625, 0.07205581665039062, 0.08170318603515625, 0.09135055541992188, 0.1009979248046875, 0.11064529418945312, 0.12029266357421875, 0.12994003295898438, 0.13958740234375, 0.14923477172851562, 0.15888214111328125, 0.16852951049804688, 0.1781768798828125, 0.18782424926757812, 0.19747161865234375, 0.20711898803710938, 0.216766357421875, 0.22641372680664062, 0.23606109619140625, 0.24570846557617188, 0.2553558349609375, 0.2650032043457031, 0.27465057373046875, 0.2842979431152344, 0.2939453125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 7.0, 8.0, 15.0, 23.0, 29.0, 46.0, 60.0, 79.0, 138.0, 181.0, 313.0, 505.0, 904.0, 1534.0, 2817.0, 5728.0, 12716.0, 32199.0, 92354.0, 250438.0, 357888.0, 184006.0, 63696.0, 23190.0, 9596.0, 4618.0, 2349.0, 1203.0, 674.0, 429.0, 253.0, 192.0, 120.0, 78.0, 48.0, 34.0, 22.0, 12.0, 13.0, 8.0, 10.0, 7.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.087890625, -2.0287933349609375, -1.969696044921875, -1.9105987548828125, -1.85150146484375, -1.7924041748046875, -1.733306884765625, -1.6742095947265625, -1.6151123046875, -1.5560150146484375, -1.496917724609375, -1.4378204345703125, -1.37872314453125, -1.3196258544921875, -1.260528564453125, -1.2014312744140625, -1.142333984375, -1.0832366943359375, -1.024139404296875, -0.9650421142578125, -0.90594482421875, -0.8468475341796875, -0.787750244140625, -0.7286529541015625, -0.6695556640625, -0.6104583740234375, -0.551361083984375, -0.4922637939453125, -0.43316650390625, -0.3740692138671875, -0.314971923828125, -0.2558746337890625, -0.19677734375, -0.1376800537109375, -0.078582763671875, -0.0194854736328125, 0.03961181640625, 0.0987091064453125, 0.157806396484375, 0.2169036865234375, 0.2760009765625, 0.3350982666015625, 0.394195556640625, 0.4532928466796875, 0.51239013671875, 0.5714874267578125, 0.630584716796875, 0.6896820068359375, 0.748779296875, 0.8078765869140625, 0.866973876953125, 0.9260711669921875, 0.98516845703125, 1.0442657470703125, 1.103363037109375, 1.1624603271484375, 1.2215576171875, 1.2806549072265625, 1.339752197265625, 1.3988494873046875, 1.45794677734375, 1.5170440673828125, 1.576141357421875, 1.6352386474609375, 1.6943359375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 6.0, 10.0, 10.0, 12.0, 15.0, 15.0, 17.0, 18.0, 29.0, 14.0, 25.0, 28.0, 27.0, 39.0, 42.0, 41.0, 40.0, 41.0, 44.0, 52.0, 48.0, 48.0, 40.0, 43.0, 28.0, 31.0, 30.0, 30.0, 27.0, 21.0, 29.0, 16.0, 16.0, 12.0, 4.0, 10.0, 6.0, 6.0, 4.0, 6.0, 6.0, 3.0, 2.0, 1.0, 3.0, 3.0], "bins": [-1.443359375, -1.404510498046875, -1.36566162109375, -1.326812744140625, -1.2879638671875, -1.249114990234375, -1.21026611328125, -1.171417236328125, -1.132568359375, -1.093719482421875, -1.05487060546875, -1.016021728515625, -0.9771728515625, -0.938323974609375, -0.89947509765625, -0.860626220703125, -0.82177734375, -0.782928466796875, -0.74407958984375, -0.705230712890625, -0.6663818359375, -0.627532958984375, -0.58868408203125, -0.549835205078125, -0.510986328125, -0.472137451171875, -0.43328857421875, -0.394439697265625, -0.3555908203125, -0.316741943359375, -0.27789306640625, -0.239044189453125, -0.2001953125, -0.161346435546875, -0.12249755859375, -0.083648681640625, -0.0447998046875, -0.005950927734375, 0.03289794921875, 0.071746826171875, 0.110595703125, 0.149444580078125, 0.18829345703125, 0.227142333984375, 0.2659912109375, 0.304840087890625, 0.34368896484375, 0.382537841796875, 0.42138671875, 0.460235595703125, 0.49908447265625, 0.537933349609375, 0.5767822265625, 0.615631103515625, 0.65447998046875, 0.693328857421875, 0.732177734375, 0.771026611328125, 0.80987548828125, 0.848724365234375, 0.8875732421875, 0.926422119140625, 0.96527099609375, 1.004119873046875, 1.04296875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 10.0, 7.0, 9.0, 17.0, 17.0, 26.0, 34.0, 66.0, 95.0, 142.0, 273.0, 438.0, 800.0, 1617.0, 3267.0, 8462.0, 27569.0, 127179.0, 512353.0, 286607.0, 55127.0, 14527.0, 5113.0, 2259.0, 1065.0, 592.0, 320.0, 193.0, 129.0, 77.0, 54.0, 43.0, 19.0, 13.0, 16.0, 5.0, 4.0, 3.0, 2.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.564453125, -1.515167236328125, -1.46588134765625, -1.416595458984375, -1.3673095703125, -1.318023681640625, -1.26873779296875, -1.219451904296875, -1.170166015625, -1.120880126953125, -1.07159423828125, -1.022308349609375, -0.9730224609375, -0.923736572265625, -0.87445068359375, -0.825164794921875, -0.77587890625, -0.726593017578125, -0.67730712890625, -0.628021240234375, -0.5787353515625, -0.529449462890625, -0.48016357421875, -0.430877685546875, -0.381591796875, -0.332305908203125, -0.28302001953125, -0.233734130859375, -0.1844482421875, -0.135162353515625, -0.08587646484375, -0.036590576171875, 0.0126953125, 0.061981201171875, 0.11126708984375, 0.160552978515625, 0.2098388671875, 0.259124755859375, 0.30841064453125, 0.357696533203125, 0.406982421875, 0.456268310546875, 0.50555419921875, 0.554840087890625, 0.6041259765625, 0.653411865234375, 0.70269775390625, 0.751983642578125, 0.80126953125, 0.850555419921875, 0.89984130859375, 0.949127197265625, 0.9984130859375, 1.047698974609375, 1.09698486328125, 1.146270751953125, 1.195556640625, 1.244842529296875, 1.29412841796875, 1.343414306640625, 1.3927001953125, 1.441986083984375, 1.49127197265625, 1.540557861328125, 1.58984375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 4.0, 8.0, 9.0, 3.0, 19.0, 16.0, 20.0, 15.0, 26.0, 42.0, 35.0, 46.0, 54.0, 60.0, 57.0, 63.0, 64.0, 61.0, 68.0, 51.0, 51.0, 48.0, 27.0, 24.0, 22.0, 21.0, 24.0, 9.0, 19.0, 5.0, 6.0, 6.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013589859008789062, -0.00013170763850212097, -0.00012751668691635132, -0.00012332573533058167, -0.00011913478374481201, -0.00011494383215904236, -0.0001107528805732727, -0.00010656192898750305, -0.0001023709774017334, -9.818002581596375e-05, -9.398907423019409e-05, -8.979812264442444e-05, -8.560717105865479e-05, -8.141621947288513e-05, -7.722526788711548e-05, -7.303431630134583e-05, -6.884336471557617e-05, -6.465241312980652e-05, -6.0461461544036865e-05, -5.627050995826721e-05, -5.207955837249756e-05, -4.7888606786727905e-05, -4.369765520095825e-05, -3.95067036151886e-05, -3.5315752029418945e-05, -3.112480044364929e-05, -2.693384885787964e-05, -2.2742897272109985e-05, -1.8551945686340332e-05, -1.4360994100570679e-05, -1.0170042514801025e-05, -5.979090929031372e-06, -1.7881393432617188e-06, 2.4028122425079346e-06, 6.593763828277588e-06, 1.0784715414047241e-05, 1.4975666999816895e-05, 1.9166618585586548e-05, 2.33575701713562e-05, 2.7548521757125854e-05, 3.173947334289551e-05, 3.593042492866516e-05, 4.0121376514434814e-05, 4.431232810020447e-05, 4.850327968597412e-05, 5.2694231271743774e-05, 5.688518285751343e-05, 6.107613444328308e-05, 6.526708602905273e-05, 6.945803761482239e-05, 7.364898920059204e-05, 7.78399407863617e-05, 8.203089237213135e-05, 8.6221843957901e-05, 9.041279554367065e-05, 9.460374712944031e-05, 9.879469871520996e-05, 0.00010298565030097961, 0.00010717660188674927, 0.00011136755347251892, 0.00011555850505828857, 0.00011974945664405823, 0.00012394040822982788, 0.00012813135981559753, 0.0001323223114013672]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 4.0, 9.0, 20.0, 24.0, 42.0, 58.0, 123.0, 193.0, 356.0, 606.0, 1277.0, 3165.0, 8865.0, 33537.0, 185904.0, 567272.0, 196334.0, 35535.0, 9183.0, 3235.0, 1382.0, 654.0, 343.0, 173.0, 85.0, 64.0, 44.0, 22.0, 16.0, 9.0, 3.0, 3.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4619140625, -1.412384033203125, -1.36285400390625, -1.313323974609375, -1.2637939453125, -1.214263916015625, -1.16473388671875, -1.115203857421875, -1.065673828125, -1.016143798828125, -0.96661376953125, -0.917083740234375, -0.8675537109375, -0.818023681640625, -0.76849365234375, -0.718963623046875, -0.66943359375, -0.619903564453125, -0.57037353515625, -0.520843505859375, -0.4713134765625, -0.421783447265625, -0.37225341796875, -0.322723388671875, -0.273193359375, -0.223663330078125, -0.17413330078125, -0.124603271484375, -0.0750732421875, -0.025543212890625, 0.02398681640625, 0.073516845703125, 0.123046875, 0.172576904296875, 0.22210693359375, 0.271636962890625, 0.3211669921875, 0.370697021484375, 0.42022705078125, 0.469757080078125, 0.519287109375, 0.568817138671875, 0.61834716796875, 0.667877197265625, 0.7174072265625, 0.766937255859375, 0.81646728515625, 0.865997314453125, 0.91552734375, 0.965057373046875, 1.01458740234375, 1.064117431640625, 1.1136474609375, 1.163177490234375, 1.21270751953125, 1.262237548828125, 1.311767578125, 1.361297607421875, 1.41082763671875, 1.460357666015625, 1.5098876953125, 1.559417724609375, 1.60894775390625, 1.658477783203125, 1.7080078125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 3.0, 4.0, 7.0, 10.0, 14.0, 10.0, 19.0, 22.0, 31.0, 46.0, 65.0, 77.0, 83.0, 102.0, 84.0, 87.0, 79.0, 71.0, 49.0, 35.0, 30.0, 21.0, 11.0, 7.0, 7.0, 11.0, 1.0, 10.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.16796875, -1.130401611328125, -1.09283447265625, -1.055267333984375, -1.0177001953125, -0.980133056640625, -0.94256591796875, -0.904998779296875, -0.867431640625, -0.829864501953125, -0.79229736328125, -0.754730224609375, -0.7171630859375, -0.679595947265625, -0.64202880859375, -0.604461669921875, -0.56689453125, -0.529327392578125, -0.49176025390625, -0.454193115234375, -0.4166259765625, -0.379058837890625, -0.34149169921875, -0.303924560546875, -0.266357421875, -0.228790283203125, -0.19122314453125, -0.153656005859375, -0.1160888671875, -0.078521728515625, -0.04095458984375, -0.003387451171875, 0.0341796875, 0.071746826171875, 0.10931396484375, 0.146881103515625, 0.1844482421875, 0.222015380859375, 0.25958251953125, 0.297149658203125, 0.334716796875, 0.372283935546875, 0.40985107421875, 0.447418212890625, 0.4849853515625, 0.522552490234375, 0.56011962890625, 0.597686767578125, 0.63525390625, 0.672821044921875, 0.71038818359375, 0.747955322265625, 0.7855224609375, 0.823089599609375, 0.86065673828125, 0.898223876953125, 0.935791015625, 0.973358154296875, 1.01092529296875, 1.048492431640625, 1.0860595703125, 1.123626708984375, 1.16119384765625, 1.198760986328125, 1.236328125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 10.0, 7.0, 18.0, 22.0, 23.0, 59.0, 105.0, 160.0, 180.0, 166.0, 106.0, 63.0, 41.0, 19.0, 11.0, 1.0, 3.0, 0.0, 1.0, 4.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.532722473144531, -9.853334426879883, -9.173946380615234, -8.49455738067627, -7.815169334411621, -7.135781288146973, -6.456392765045166, -5.777004241943359, -5.097616195678711, -4.4182281494140625, -3.738839626312256, -3.0594513416290283, -2.380063056945801, -1.7006747722625732, -1.0212864875793457, -0.34189796447753906, 0.3374900817871094, 1.016878366470337, 1.6962666511535645, 2.375654935836792, 3.0550432205200195, 3.734431505203247, 4.413819789886475, 5.093208312988281, 5.77259635925293, 6.451984405517578, 7.131372928619385, 7.810761451721191, 8.49014949798584, 9.169537544250488, 9.848926544189453, 10.528314590454102, 11.20770263671875, 11.887090682983398, 12.566478729248047, 13.245867729187012, 13.92525577545166, 14.604643821716309, 15.284032821655273, 15.963420867919922, 16.64280891418457, 17.32219696044922, 18.001585006713867, 18.680973052978516, 19.360363006591797, 20.039751052856445, 20.719139099121094, 21.398527145385742, 22.07791519165039, 22.75730323791504, 23.436691284179688, 24.116079330444336, 24.795467376708984, 25.474857330322266, 26.154245376586914, 26.833633422851562, 27.51302146911621, 28.19240951538086, 28.871797561645508, 29.551185607910156, 30.230575561523438, 30.909963607788086, 31.589351654052734, 32.26873779296875, 32.94812774658203]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 10.0, 11.0, 13.0, 18.0, 14.0, 17.0, 22.0, 38.0, 38.0, 50.0, 52.0, 60.0, 65.0, 62.0, 57.0, 71.0, 56.0, 61.0, 44.0, 47.0, 51.0, 26.0, 36.0, 19.0, 14.0, 11.0, 11.0, 6.0, 4.0, 3.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.445122718811035, -13.076869010925293, -12.70861530303955, -12.340361595153809, -11.972107887268066, -11.603854179382324, -11.235601425170898, -10.867347717285156, -10.499094009399414, -10.130840301513672, -9.76258659362793, -9.394332885742188, -9.026079177856445, -8.657825469970703, -8.289571762084961, -7.921318531036377, -7.553064346313477, -7.184810638427734, -6.816556930541992, -6.44830322265625, -6.080049514770508, -5.711795806884766, -5.343542575836182, -4.9752888679504395, -4.607035160064697, -4.238781452178955, -3.870527744293213, -3.50227427482605, -3.1340205669403076, -2.7657668590545654, -2.3975133895874023, -2.02925968170166, -1.6610050201416016, -1.2927513122558594, -0.9244977235794067, -0.5562441349029541, -0.18799042701721191, 0.18026328086853027, 0.5485167503356934, 0.9167704582214355, 1.2850241661071777, 1.65327787399292, 2.021531581878662, 2.389785051345825, 2.7580387592315674, 3.1262924671173096, 3.4945459365844727, 3.862799644470215, 4.231053352355957, 4.599307060241699, 4.967560768127441, 5.335814476013184, 5.704068183898926, 6.072321891784668, 6.440575122833252, 6.808828830718994, 7.177082538604736, 7.5453362464904785, 7.913589954376221, 8.281843185424805, 8.650096893310547, 9.018350601196289, 9.386604309082031, 9.754858016967773, 10.123111724853516]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 6.0, 9.0, 12.0, 12.0, 24.0, 26.0, 52.0, 84.0, 127.0, 202.0, 356.0, 764.0, 1467.0, 3427.0, 8914.0, 30042.0, 142838.0, 2256700.0, 1581739.0, 124418.0, 27712.0, 8718.0, 3439.0, 1537.0, 679.0, 411.0, 197.0, 143.0, 78.0, 46.0, 24.0, 22.0, 15.0, 10.0, 7.0, 8.0, 5.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.44921875, -2.36163330078125, -2.2740478515625, -2.18646240234375, -2.098876953125, -2.01129150390625, -1.9237060546875, -1.83612060546875, -1.74853515625, -1.66094970703125, -1.5733642578125, -1.48577880859375, -1.398193359375, -1.31060791015625, -1.2230224609375, -1.13543701171875, -1.0478515625, -0.96026611328125, -0.8726806640625, -0.78509521484375, -0.697509765625, -0.60992431640625, -0.5223388671875, -0.43475341796875, -0.34716796875, -0.25958251953125, -0.1719970703125, -0.08441162109375, 0.003173828125, 0.09075927734375, 0.1783447265625, 0.26593017578125, 0.353515625, 0.44110107421875, 0.5286865234375, 0.61627197265625, 0.703857421875, 0.79144287109375, 0.8790283203125, 0.96661376953125, 1.05419921875, 1.14178466796875, 1.2293701171875, 1.31695556640625, 1.404541015625, 1.49212646484375, 1.5797119140625, 1.66729736328125, 1.7548828125, 1.84246826171875, 1.9300537109375, 2.01763916015625, 2.105224609375, 2.19281005859375, 2.2803955078125, 2.36798095703125, 2.45556640625, 2.54315185546875, 2.6307373046875, 2.71832275390625, 2.805908203125, 2.89349365234375, 2.9810791015625, 3.06866455078125, 3.15625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 11.0, 20.0, 30.0, 39.0, 40.0, 43.0, 55.0, 81.0, 57.0, 73.0, 84.0, 63.0, 69.0, 61.0, 58.0, 49.0, 45.0, 37.0, 26.0, 16.0, 17.0, 7.0, 5.0, 5.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.333251953125, -0.3203010559082031, -0.30735015869140625, -0.2943992614746094, -0.2814483642578125, -0.2684974670410156, -0.25554656982421875, -0.24259567260742188, -0.229644775390625, -0.21669387817382812, -0.20374298095703125, -0.19079208374023438, -0.1778411865234375, -0.16489028930664062, -0.15193939208984375, -0.13898849487304688, -0.12603759765625, -0.11308670043945312, -0.10013580322265625, -0.08718490600585938, -0.0742340087890625, -0.061283111572265625, -0.04833221435546875, -0.035381317138671875, -0.022430419921875, -0.009479522705078125, 0.00347137451171875, 0.016422271728515625, 0.0293731689453125, 0.042324066162109375, 0.05527496337890625, 0.06822586059570312, 0.0811767578125, 0.09412765502929688, 0.10707855224609375, 0.12002944946289062, 0.1329803466796875, 0.14593124389648438, 0.15888214111328125, 0.17183303833007812, 0.184783935546875, 0.19773483276367188, 0.21068572998046875, 0.22363662719726562, 0.2365875244140625, 0.24953842163085938, 0.26248931884765625, 0.2754402160644531, 0.28839111328125, 0.3013420104980469, 0.31429290771484375, 0.3272438049316406, 0.3401947021484375, 0.3531455993652344, 0.36609649658203125, 0.3790473937988281, 0.391998291015625, 0.4049491882324219, 0.41790008544921875, 0.4308509826660156, 0.4438018798828125, 0.4567527770996094, 0.46970367431640625, 0.4826545715332031, 0.49560546875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 9.0, 7.0, 13.0, 27.0, 37.0, 65.0, 83.0, 148.0, 232.0, 485.0, 1014.0, 2737.0, 12114.0, 173691.0, 3822331.0, 166236.0, 11097.0, 2371.0, 807.0, 339.0, 171.0, 88.0, 65.0, 39.0, 39.0, 11.0, 9.0, 7.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.60546875, -6.41937255859375, -6.2332763671875, -6.04718017578125, -5.861083984375, -5.67498779296875, -5.4888916015625, -5.30279541015625, -5.11669921875, -4.93060302734375, -4.7445068359375, -4.55841064453125, -4.372314453125, -4.18621826171875, -4.0001220703125, -3.81402587890625, -3.6279296875, -3.44183349609375, -3.2557373046875, -3.06964111328125, -2.883544921875, -2.69744873046875, -2.5113525390625, -2.32525634765625, -2.13916015625, -1.95306396484375, -1.7669677734375, -1.58087158203125, -1.394775390625, -1.20867919921875, -1.0225830078125, -0.83648681640625, -0.650390625, -0.46429443359375, -0.2781982421875, -0.09210205078125, 0.093994140625, 0.28009033203125, 0.4661865234375, 0.65228271484375, 0.83837890625, 1.02447509765625, 1.2105712890625, 1.39666748046875, 1.582763671875, 1.76885986328125, 1.9549560546875, 2.14105224609375, 2.3271484375, 2.51324462890625, 2.6993408203125, 2.88543701171875, 3.071533203125, 3.25762939453125, 3.4437255859375, 3.62982177734375, 3.81591796875, 4.00201416015625, 4.1881103515625, 4.37420654296875, 4.560302734375, 4.74639892578125, 4.9324951171875, 5.11859130859375, 5.3046875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 1.0, 2.0, 6.0, 4.0, 10.0, 13.0, 29.0, 41.0, 104.0, 154.0, 336.0, 752.0, 1324.0, 704.0, 297.0, 145.0, 65.0, 38.0, 22.0, 4.0, 10.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.099609375, -2.0489349365234375, -1.998260498046875, -1.9475860595703125, -1.89691162109375, -1.8462371826171875, -1.795562744140625, -1.7448883056640625, -1.6942138671875, -1.6435394287109375, -1.592864990234375, -1.5421905517578125, -1.49151611328125, -1.4408416748046875, -1.390167236328125, -1.3394927978515625, -1.288818359375, -1.2381439208984375, -1.187469482421875, -1.1367950439453125, -1.08612060546875, -1.0354461669921875, -0.984771728515625, -0.9340972900390625, -0.8834228515625, -0.8327484130859375, -0.782073974609375, -0.7313995361328125, -0.68072509765625, -0.6300506591796875, -0.579376220703125, -0.5287017822265625, -0.47802734375, -0.4273529052734375, -0.376678466796875, -0.3260040283203125, -0.27532958984375, -0.2246551513671875, -0.173980712890625, -0.1233062744140625, -0.0726318359375, -0.0219573974609375, 0.028717041015625, 0.0793914794921875, 0.13006591796875, 0.1807403564453125, 0.231414794921875, 0.2820892333984375, 0.332763671875, 0.3834381103515625, 0.434112548828125, 0.4847869873046875, 0.53546142578125, 0.5861358642578125, 0.636810302734375, 0.6874847412109375, 0.7381591796875, 0.7888336181640625, 0.839508056640625, 0.8901824951171875, 0.94085693359375, 0.9915313720703125, 1.042205810546875, 1.0928802490234375, 1.1435546875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 11.0, 13.0, 16.0, 33.0, 60.0, 89.0, 136.0, 141.0, 145.0, 124.0, 83.0, 56.0, 39.0, 14.0, 17.0, 4.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-15.631415367126465, -15.313575744628906, -14.995736122131348, -14.677896499633789, -14.36005687713623, -14.042217254638672, -13.724377632141113, -13.406538009643555, -13.08869743347168, -12.770857810974121, -12.453018188476562, -12.135178565979004, -11.817338943481445, -11.499499320983887, -11.181659698486328, -10.863819122314453, -10.545980453491211, -10.228140830993652, -9.910301208496094, -9.592461585998535, -9.274621963500977, -8.956782341003418, -8.63894271850586, -8.321102142333984, -8.003263473510742, -7.685423851013184, -7.367584228515625, -7.049744606018066, -6.731904983520508, -6.414065361022949, -6.096225261688232, -5.778385639190674, -5.460546493530273, -5.142706871032715, -4.824867248535156, -4.507027626037598, -4.189188003540039, -3.8713481426239014, -3.5535082817077637, -3.235668659210205, -2.9178290367126465, -2.599989414215088, -2.2821497917175293, -1.9643099308013916, -1.646470308303833, -1.3286306858062744, -1.0107909440994263, -0.6929512023925781, -0.37511157989501953, -0.05727189779281616, 0.2605677843093872, 0.5784074664115906, 0.896247148513794, 1.2140867710113525, 1.5319265127182007, 1.8497662544250488, 2.1676058769226074, 2.485445499420166, 2.8032851219177246, 3.1211249828338623, 3.438964605331421, 3.7568042278289795, 4.074644088745117, 4.392483711242676, 4.710323333740234]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 6.0, 6.0, 7.0, 13.0, 14.0, 20.0, 28.0, 34.0, 44.0, 54.0, 62.0, 86.0, 91.0, 77.0, 78.0, 58.0, 61.0, 69.0, 54.0, 41.0, 24.0, 30.0, 14.0, 14.0, 6.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.696931838989258, -9.44190502166748, -9.186878204345703, -8.931851387023926, -8.676824569702148, -8.421797752380371, -8.166770935058594, -7.911744117736816, -7.656717300415039, -7.401690483093262, -7.146663665771484, -6.891636848449707, -6.63661003112793, -6.381583213806152, -6.126556396484375, -5.871529579162598, -5.61650276184082, -5.361475944519043, -5.106449127197266, -4.851422309875488, -4.596395492553711, -4.341368675231934, -4.086341857910156, -3.831315040588379, -3.5762882232666016, -3.321261405944824, -3.066234588623047, -2.8112077713012695, -2.556180953979492, -2.301154136657715, -2.0461273193359375, -1.7911005020141602, -1.536074161529541, -1.2810473442077637, -1.0260205268859863, -0.770993709564209, -0.5159668922424316, -0.2609400749206543, -0.005913257598876953, 0.2491135597229004, 0.5041403770446777, 0.7591671943664551, 1.0141940116882324, 1.2692208290100098, 1.524247646331787, 1.7792744636535645, 2.034301280975342, 2.289328098297119, 2.5443549156188965, 2.799381732940674, 3.054408550262451, 3.3094353675842285, 3.564462184906006, 3.819489002227783, 4.0745158195495605, 4.329542636871338, 4.584569454193115, 4.839596271514893, 5.09462308883667, 5.349649906158447, 5.604676723480225, 5.859703540802002, 6.114730358123779, 6.369757175445557, 6.624783992767334]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 3.0, 9.0, 11.0, 15.0, 16.0, 20.0, 35.0, 64.0, 73.0, 114.0, 147.0, 248.0, 427.0, 669.0, 1242.0, 2491.0, 5493.0, 13280.0, 37827.0, 113530.0, 296981.0, 346574.0, 149074.0, 49645.0, 17109.0, 6837.0, 2980.0, 1524.0, 819.0, 460.0, 260.0, 184.0, 136.0, 68.0, 44.0, 32.0, 16.0, 28.0, 19.0, 12.0, 15.0, 6.0, 4.0, 7.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.0390625, -1.96905517578125, -1.8990478515625, -1.82904052734375, -1.759033203125, -1.68902587890625, -1.6190185546875, -1.54901123046875, -1.47900390625, -1.40899658203125, -1.3389892578125, -1.26898193359375, -1.198974609375, -1.12896728515625, -1.0589599609375, -0.98895263671875, -0.9189453125, -0.84893798828125, -0.7789306640625, -0.70892333984375, -0.638916015625, -0.56890869140625, -0.4989013671875, -0.42889404296875, -0.35888671875, -0.28887939453125, -0.2188720703125, -0.14886474609375, -0.078857421875, -0.00885009765625, 0.0611572265625, 0.13116455078125, 0.201171875, 0.27117919921875, 0.3411865234375, 0.41119384765625, 0.481201171875, 0.55120849609375, 0.6212158203125, 0.69122314453125, 0.76123046875, 0.83123779296875, 0.9012451171875, 0.97125244140625, 1.041259765625, 1.11126708984375, 1.1812744140625, 1.25128173828125, 1.3212890625, 1.39129638671875, 1.4613037109375, 1.53131103515625, 1.601318359375, 1.67132568359375, 1.7413330078125, 1.81134033203125, 1.88134765625, 1.95135498046875, 2.0213623046875, 2.09136962890625, 2.161376953125, 2.23138427734375, 2.3013916015625, 2.37139892578125, 2.44140625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 8.0, 13.0, 15.0, 32.0, 25.0, 44.0, 67.0, 59.0, 85.0, 88.0, 82.0, 80.0, 73.0, 82.0, 65.0, 55.0, 39.0, 29.0, 23.0, 17.0, 8.0, 2.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51953125, -0.5037345886230469, -0.48793792724609375, -0.4721412658691406, -0.4563446044921875, -0.4405479431152344, -0.42475128173828125, -0.4089546203613281, -0.393157958984375, -0.3773612976074219, -0.36156463623046875, -0.3457679748535156, -0.3299713134765625, -0.3141746520996094, -0.29837799072265625, -0.2825813293457031, -0.26678466796875, -0.2509880065917969, -0.23519134521484375, -0.21939468383789062, -0.2035980224609375, -0.18780136108398438, -0.17200469970703125, -0.15620803833007812, -0.140411376953125, -0.12461471557617188, -0.10881805419921875, -0.09302139282226562, -0.0772247314453125, -0.061428070068359375, -0.04563140869140625, -0.029834747314453125, -0.0140380859375, 0.001758575439453125, 0.01755523681640625, 0.033351898193359375, 0.0491485595703125, 0.06494522094726562, 0.08074188232421875, 0.09653854370117188, 0.112335205078125, 0.12813186645507812, 0.14392852783203125, 0.15972518920898438, 0.1755218505859375, 0.19131851196289062, 0.20711517333984375, 0.22291183471679688, 0.23870849609375, 0.2545051574707031, 0.27030181884765625, 0.2860984802246094, 0.3018951416015625, 0.3176918029785156, 0.33348846435546875, 0.3492851257324219, 0.365081787109375, 0.3808784484863281, 0.39667510986328125, 0.4124717712402344, 0.4282684326171875, 0.4440650939941406, 0.45986175537109375, 0.4756584167480469, 0.491455078125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 9.0, 8.0, 15.0, 23.0, 27.0, 44.0, 48.0, 81.0, 118.0, 200.0, 268.0, 431.0, 657.0, 1040.0, 1738.0, 2787.0, 4897.0, 9023.0, 16691.0, 32682.0, 63450.0, 118172.0, 192613.0, 228218.0, 167949.0, 97679.0, 51768.0, 26565.0, 13593.0, 7217.0, 4097.0, 2376.0, 1441.0, 895.0, 570.0, 384.0, 244.0, 175.0, 104.0, 76.0, 59.0, 33.0, 27.0, 24.0, 13.0, 9.0, 8.0, 3.0, 5.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0], "bins": [-1.1142578125, -1.079803466796875, -1.04534912109375, -1.010894775390625, -0.9764404296875, -0.941986083984375, -0.90753173828125, -0.873077392578125, -0.838623046875, -0.804168701171875, -0.76971435546875, -0.735260009765625, -0.7008056640625, -0.666351318359375, -0.63189697265625, -0.597442626953125, -0.56298828125, -0.528533935546875, -0.49407958984375, -0.459625244140625, -0.4251708984375, -0.390716552734375, -0.35626220703125, -0.321807861328125, -0.287353515625, -0.252899169921875, -0.21844482421875, -0.183990478515625, -0.1495361328125, -0.115081787109375, -0.08062744140625, -0.046173095703125, -0.01171875, 0.022735595703125, 0.05718994140625, 0.091644287109375, 0.1260986328125, 0.160552978515625, 0.19500732421875, 0.229461669921875, 0.263916015625, 0.298370361328125, 0.33282470703125, 0.367279052734375, 0.4017333984375, 0.436187744140625, 0.47064208984375, 0.505096435546875, 0.53955078125, 0.574005126953125, 0.60845947265625, 0.642913818359375, 0.6773681640625, 0.711822509765625, 0.74627685546875, 0.780731201171875, 0.815185546875, 0.849639892578125, 0.88409423828125, 0.918548583984375, 0.9530029296875, 0.987457275390625, 1.02191162109375, 1.056365966796875, 1.0908203125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 4.0, 8.0, 6.0, 4.0, 8.0, 7.0, 11.0, 8.0, 10.0, 17.0, 17.0, 24.0, 33.0, 21.0, 36.0, 30.0, 28.0, 38.0, 42.0, 41.0, 43.0, 45.0, 31.0, 42.0, 47.0, 42.0, 46.0, 26.0, 46.0, 22.0, 28.0, 29.0, 22.0, 29.0, 18.0, 14.0, 11.0, 18.0, 12.0, 7.0, 7.0, 8.0, 7.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0], "bins": [-1.3076171875, -1.270782470703125, -1.23394775390625, -1.197113037109375, -1.1602783203125, -1.123443603515625, -1.08660888671875, -1.049774169921875, -1.012939453125, -0.976104736328125, -0.93927001953125, -0.902435302734375, -0.8656005859375, -0.828765869140625, -0.79193115234375, -0.755096435546875, -0.71826171875, -0.681427001953125, -0.64459228515625, -0.607757568359375, -0.5709228515625, -0.534088134765625, -0.49725341796875, -0.460418701171875, -0.423583984375, -0.386749267578125, -0.34991455078125, -0.313079833984375, -0.2762451171875, -0.239410400390625, -0.20257568359375, -0.165740966796875, -0.12890625, -0.092071533203125, -0.05523681640625, -0.018402099609375, 0.0184326171875, 0.055267333984375, 0.09210205078125, 0.128936767578125, 0.165771484375, 0.202606201171875, 0.23944091796875, 0.276275634765625, 0.3131103515625, 0.349945068359375, 0.38677978515625, 0.423614501953125, 0.46044921875, 0.497283935546875, 0.53411865234375, 0.570953369140625, 0.6077880859375, 0.644622802734375, 0.68145751953125, 0.718292236328125, 0.755126953125, 0.791961669921875, 0.82879638671875, 0.865631103515625, 0.9024658203125, 0.939300537109375, 0.97613525390625, 1.012969970703125, 1.0498046875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 18.0, 8.0, 10.0, 23.0, 29.0, 49.0, 103.0, 114.0, 223.0, 402.0, 785.0, 1653.0, 3413.0, 8342.0, 22631.0, 75497.0, 324114.0, 443153.0, 116761.0, 31539.0, 11081.0, 4455.0, 2021.0, 958.0, 470.0, 287.0, 158.0, 91.0, 65.0, 31.0, 19.0, 18.0, 14.0, 8.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.5634765625, -1.521392822265625, -1.47930908203125, -1.437225341796875, -1.3951416015625, -1.353057861328125, -1.31097412109375, -1.268890380859375, -1.226806640625, -1.184722900390625, -1.14263916015625, -1.100555419921875, -1.0584716796875, -1.016387939453125, -0.97430419921875, -0.932220458984375, -0.89013671875, -0.848052978515625, -0.80596923828125, -0.763885498046875, -0.7218017578125, -0.679718017578125, -0.63763427734375, -0.595550537109375, -0.553466796875, -0.511383056640625, -0.46929931640625, -0.427215576171875, -0.3851318359375, -0.343048095703125, -0.30096435546875, -0.258880615234375, -0.216796875, -0.174713134765625, -0.13262939453125, -0.090545654296875, -0.0484619140625, -0.006378173828125, 0.03570556640625, 0.077789306640625, 0.119873046875, 0.161956787109375, 0.20404052734375, 0.246124267578125, 0.2882080078125, 0.330291748046875, 0.37237548828125, 0.414459228515625, 0.45654296875, 0.498626708984375, 0.54071044921875, 0.582794189453125, 0.6248779296875, 0.666961669921875, 0.70904541015625, 0.751129150390625, 0.793212890625, 0.835296630859375, 0.87738037109375, 0.919464111328125, 0.9615478515625, 1.003631591796875, 1.04571533203125, 1.087799072265625, 1.1298828125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 6.0, 7.0, 7.0, 10.0, 14.0, 18.0, 23.0, 25.0, 28.0, 49.0, 61.0, 69.0, 82.0, 101.0, 113.0, 81.0, 69.0, 59.0, 43.0, 35.0, 22.0, 18.0, 16.0, 10.0, 10.0, 10.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00019884109497070312, -0.0001934543251991272, -0.00018806755542755127, -0.00018268078565597534, -0.00017729401588439941, -0.00017190724611282349, -0.00016652047634124756, -0.00016113370656967163, -0.0001557469367980957, -0.00015036016702651978, -0.00014497339725494385, -0.00013958662748336792, -0.000134199857711792, -0.00012881308794021606, -0.00012342631816864014, -0.00011803954839706421, -0.00011265277862548828, -0.00010726600885391235, -0.00010187923908233643, -9.64924693107605e-05, -9.110569953918457e-05, -8.571892976760864e-05, -8.033215999603271e-05, -7.494539022445679e-05, -6.955862045288086e-05, -6.417185068130493e-05, -5.8785080909729004e-05, -5.3398311138153076e-05, -4.801154136657715e-05, -4.262477159500122e-05, -3.723800182342529e-05, -3.1851232051849365e-05, -2.6464462280273438e-05, -2.107769250869751e-05, -1.5690922737121582e-05, -1.0304152965545654e-05, -4.9173831939697266e-06, 4.6938657760620117e-07, 5.856156349182129e-06, 1.1242926120758057e-05, 1.6629695892333984e-05, 2.2016465663909912e-05, 2.740323543548584e-05, 3.279000520706177e-05, 3.8176774978637695e-05, 4.356354475021362e-05, 4.895031452178955e-05, 5.433708429336548e-05, 5.9723854064941406e-05, 6.511062383651733e-05, 7.049739360809326e-05, 7.588416337966919e-05, 8.127093315124512e-05, 8.665770292282104e-05, 9.204447269439697e-05, 9.74312424659729e-05, 0.00010281801223754883, 0.00010820478200912476, 0.00011359155178070068, 0.00011897832155227661, 0.00012436509132385254, 0.00012975186109542847, 0.0001351386308670044, 0.00014052540063858032, 0.00014591217041015625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 7.0, 11.0, 9.0, 11.0, 31.0, 45.0, 73.0, 142.0, 210.0, 450.0, 983.0, 2365.0, 6885.0, 25708.0, 168935.0, 674096.0, 136034.0, 22393.0, 6204.0, 2106.0, 893.0, 430.0, 222.0, 136.0, 74.0, 53.0, 20.0, 13.0, 7.0, 7.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8349609375, -1.7726593017578125, -1.710357666015625, -1.6480560302734375, -1.58575439453125, -1.5234527587890625, -1.461151123046875, -1.3988494873046875, -1.3365478515625, -1.2742462158203125, -1.211944580078125, -1.1496429443359375, -1.08734130859375, -1.0250396728515625, -0.962738037109375, -0.9004364013671875, -0.838134765625, -0.7758331298828125, -0.713531494140625, -0.6512298583984375, -0.58892822265625, -0.5266265869140625, -0.464324951171875, -0.4020233154296875, -0.3397216796875, -0.2774200439453125, -0.215118408203125, -0.1528167724609375, -0.09051513671875, -0.0282135009765625, 0.034088134765625, 0.0963897705078125, 0.15869140625, 0.2209930419921875, 0.283294677734375, 0.3455963134765625, 0.40789794921875, 0.4701995849609375, 0.532501220703125, 0.5948028564453125, 0.6571044921875, 0.7194061279296875, 0.781707763671875, 0.8440093994140625, 0.90631103515625, 0.9686126708984375, 1.030914306640625, 1.0932159423828125, 1.155517578125, 1.2178192138671875, 1.280120849609375, 1.3424224853515625, 1.40472412109375, 1.4670257568359375, 1.529327392578125, 1.5916290283203125, 1.6539306640625, 1.7162322998046875, 1.778533935546875, 1.8408355712890625, 1.90313720703125, 1.9654388427734375, 2.027740478515625, 2.0900421142578125, 2.15234375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 2.0, 8.0, 4.0, 4.0, 15.0, 13.0, 15.0, 39.0, 46.0, 36.0, 53.0, 73.0, 93.0, 93.0, 90.0, 98.0, 75.0, 52.0, 45.0, 27.0, 25.0, 22.0, 18.0, 8.0, 9.0, 6.0, 7.0, 5.0, 5.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96484375, -0.932525634765625, -0.90020751953125, -0.867889404296875, -0.8355712890625, -0.803253173828125, -0.77093505859375, -0.738616943359375, -0.706298828125, -0.673980712890625, -0.64166259765625, -0.609344482421875, -0.5770263671875, -0.544708251953125, -0.51239013671875, -0.480072021484375, -0.44775390625, -0.415435791015625, -0.38311767578125, -0.350799560546875, -0.3184814453125, -0.286163330078125, -0.25384521484375, -0.221527099609375, -0.189208984375, -0.156890869140625, -0.12457275390625, -0.092254638671875, -0.0599365234375, -0.027618408203125, 0.00469970703125, 0.037017822265625, 0.0693359375, 0.101654052734375, 0.13397216796875, 0.166290283203125, 0.1986083984375, 0.230926513671875, 0.26324462890625, 0.295562744140625, 0.327880859375, 0.360198974609375, 0.39251708984375, 0.424835205078125, 0.4571533203125, 0.489471435546875, 0.52178955078125, 0.554107666015625, 0.58642578125, 0.618743896484375, 0.65106201171875, 0.683380126953125, 0.7156982421875, 0.748016357421875, 0.78033447265625, 0.812652587890625, 0.844970703125, 0.877288818359375, 0.90960693359375, 0.941925048828125, 0.9742431640625, 1.006561279296875, 1.03887939453125, 1.071197509765625, 1.103515625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 16.0, 17.0, 50.0, 81.0, 99.0, 153.0, 135.0, 134.0, 111.0, 79.0, 40.0, 32.0, 18.0, 12.0, 6.0, 3.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.92098045349121, -18.316871643066406, -17.7127628326416, -17.108654022216797, -16.50454330444336, -15.900434494018555, -15.29632568359375, -14.692216873168945, -14.08810806274414, -13.483999252319336, -12.879889488220215, -12.27578067779541, -11.671671867370605, -11.067562103271484, -10.46345329284668, -9.859344482421875, -9.255234718322754, -8.65112590789795, -8.047016143798828, -7.442907333374023, -6.838798522949219, -6.234689235687256, -5.630579948425293, -5.026471138000488, -4.422361850738525, -3.8182528018951416, -3.214143753051758, -2.610034465789795, -2.005925416946411, -1.4018163681030273, -0.7977070808410645, -0.19359827041625977, 0.4105110168457031, 1.014620065689087, 1.6187292337417603, 2.2228384017944336, 2.8269474506378174, 3.431056499481201, 4.035165786743164, 4.639274597167969, 5.243383884429932, 5.8474931716918945, 6.451601982116699, 7.055711269378662, 7.659820556640625, 8.26392936706543, 8.868038177490234, 9.472146987915039, 10.07625675201416, 10.680365562438965, 11.284475326538086, 11.88858413696289, 12.492692947387695, 13.0968017578125, 13.700911521911621, 14.305020332336426, 14.909130096435547, 15.513238906860352, 16.117347717285156, 16.721458435058594, 17.3255672454834, 17.929676055908203, 18.533784866333008, 19.137893676757812, 19.742002487182617]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 7.0, 10.0, 6.0, 9.0, 15.0, 18.0, 19.0, 27.0, 35.0, 38.0, 49.0, 56.0, 50.0, 66.0, 61.0, 60.0, 55.0, 47.0, 62.0, 50.0, 47.0, 44.0, 43.0, 22.0, 27.0, 15.0, 20.0, 11.0, 12.0, 4.0, 9.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.667394638061523, -12.328136444091797, -11.988879203796387, -11.64962100982666, -11.31036376953125, -10.971105575561523, -10.631847381591797, -10.29258918762207, -9.95333194732666, -9.614073753356934, -9.274816513061523, -8.935558319091797, -8.59630012512207, -8.25704288482666, -7.917784690856934, -7.578526973724365, -7.239269256591797, -6.9000115394592285, -6.56075382232666, -6.221495628356934, -5.882237911224365, -5.542980194091797, -5.20372200012207, -4.864464282989502, -4.525206565856934, -4.185948848724365, -3.8466908931732178, -3.5074329376220703, -3.168175220489502, -2.8289175033569336, -2.489659547805786, -2.1504015922546387, -1.8111438751220703, -1.4718860387802124, -1.1326282024383545, -0.7933703660964966, -0.45411252975463867, -0.11485469341278076, 0.22440314292907715, 0.5636610984802246, 0.902918815612793, 1.2421766519546509, 1.5814344882965088, 1.9206923246383667, 2.2599501609802246, 2.599207878112793, 2.9384658336639404, 3.277723789215088, 3.6169815063476562, 3.9562392234802246, 4.295496940612793, 4.6347551345825195, 4.974012851715088, 5.313270568847656, 5.652528762817383, 5.991786479949951, 6.3310441970825195, 6.670301914215088, 7.009559631347656, 7.348817825317383, 7.688075542449951, 8.02733325958252, 8.366591453552246, 8.705848693847656, 9.045106887817383]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 7.0, 2.0, 8.0, 9.0, 18.0, 24.0, 26.0, 39.0, 52.0, 63.0, 86.0, 136.0, 230.0, 404.0, 672.0, 1393.0, 3037.0, 7505.0, 23949.0, 117181.0, 3215739.0, 732902.0, 64265.0, 16228.0, 5575.0, 2246.0, 1118.0, 520.0, 318.0, 213.0, 106.0, 79.0, 52.0, 25.0, 20.0, 10.0, 10.0, 2.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-3.375, -3.285797119140625, -3.19659423828125, -3.107391357421875, -3.0181884765625, -2.928985595703125, -2.83978271484375, -2.750579833984375, -2.661376953125, -2.572174072265625, -2.48297119140625, -2.393768310546875, -2.3045654296875, -2.215362548828125, -2.12615966796875, -2.036956787109375, -1.94775390625, -1.858551025390625, -1.76934814453125, -1.680145263671875, -1.5909423828125, -1.501739501953125, -1.41253662109375, -1.323333740234375, -1.234130859375, -1.144927978515625, -1.05572509765625, -0.966522216796875, -0.8773193359375, -0.788116455078125, -0.69891357421875, -0.609710693359375, -0.5205078125, -0.431304931640625, -0.34210205078125, -0.252899169921875, -0.1636962890625, -0.074493408203125, 0.01470947265625, 0.103912353515625, 0.193115234375, 0.282318115234375, 0.37152099609375, 0.460723876953125, 0.5499267578125, 0.639129638671875, 0.72833251953125, 0.817535400390625, 0.90673828125, 0.995941162109375, 1.08514404296875, 1.174346923828125, 1.2635498046875, 1.352752685546875, 1.44195556640625, 1.531158447265625, 1.620361328125, 1.709564208984375, 1.79876708984375, 1.887969970703125, 1.9771728515625, 2.066375732421875, 2.15557861328125, 2.244781494140625, 2.333984375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 8.0, 9.0, 6.0, 21.0, 34.0, 38.0, 38.0, 52.0, 64.0, 67.0, 70.0, 70.0, 85.0, 78.0, 78.0, 54.0, 52.0, 47.0, 37.0, 33.0, 18.0, 14.0, 9.0, 2.0, 6.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.490234375, -0.47586822509765625, -0.4615020751953125, -0.44713592529296875, -0.432769775390625, -0.41840362548828125, -0.4040374755859375, -0.38967132568359375, -0.37530517578125, -0.36093902587890625, -0.3465728759765625, -0.33220672607421875, -0.317840576171875, -0.30347442626953125, -0.2891082763671875, -0.27474212646484375, -0.2603759765625, -0.24600982666015625, -0.2316436767578125, -0.21727752685546875, -0.202911376953125, -0.18854522705078125, -0.1741790771484375, -0.15981292724609375, -0.14544677734375, -0.13108062744140625, -0.1167144775390625, -0.10234832763671875, -0.087982177734375, -0.07361602783203125, -0.0592498779296875, -0.04488372802734375, -0.030517578125, -0.01615142822265625, -0.0017852783203125, 0.01258087158203125, 0.026947021484375, 0.04131317138671875, 0.0556793212890625, 0.07004547119140625, 0.08441162109375, 0.09877777099609375, 0.1131439208984375, 0.12751007080078125, 0.141876220703125, 0.15624237060546875, 0.1706085205078125, 0.18497467041015625, 0.1993408203125, 0.21370697021484375, 0.2280731201171875, 0.24243927001953125, 0.256805419921875, 0.27117156982421875, 0.2855377197265625, 0.29990386962890625, 0.31427001953125, 0.32863616943359375, 0.3430023193359375, 0.35736846923828125, 0.371734619140625, 0.38610076904296875, 0.4004669189453125, 0.41483306884765625, 0.42919921875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 11.0, 7.0, 23.0, 17.0, 21.0, 26.0, 54.0, 80.0, 114.0, 206.0, 300.0, 557.0, 1050.0, 2172.0, 5095.0, 13876.0, 45858.0, 222062.0, 2680775.0, 1048272.0, 125629.0, 30697.0, 9817.0, 3752.0, 1719.0, 844.0, 449.0, 273.0, 140.0, 127.0, 72.0, 49.0, 37.0, 26.0, 19.0, 14.0, 13.0, 7.0, 6.0, 5.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.4609375, -2.39227294921875, -2.3236083984375, -2.25494384765625, -2.186279296875, -2.11761474609375, -2.0489501953125, -1.98028564453125, -1.91162109375, -1.84295654296875, -1.7742919921875, -1.70562744140625, -1.636962890625, -1.56829833984375, -1.4996337890625, -1.43096923828125, -1.3623046875, -1.29364013671875, -1.2249755859375, -1.15631103515625, -1.087646484375, -1.01898193359375, -0.9503173828125, -0.88165283203125, -0.81298828125, -0.74432373046875, -0.6756591796875, -0.60699462890625, -0.538330078125, -0.46966552734375, -0.4010009765625, -0.33233642578125, -0.263671875, -0.19500732421875, -0.1263427734375, -0.05767822265625, 0.010986328125, 0.07965087890625, 0.1483154296875, 0.21697998046875, 0.28564453125, 0.35430908203125, 0.4229736328125, 0.49163818359375, 0.560302734375, 0.62896728515625, 0.6976318359375, 0.76629638671875, 0.8349609375, 0.90362548828125, 0.9722900390625, 1.04095458984375, 1.109619140625, 1.17828369140625, 1.2469482421875, 1.31561279296875, 1.38427734375, 1.45294189453125, 1.5216064453125, 1.59027099609375, 1.658935546875, 1.72760009765625, 1.7962646484375, 1.86492919921875, 1.93359375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 6.0, 9.0, 13.0, 9.0, 18.0, 26.0, 48.0, 44.0, 79.0, 127.0, 199.0, 360.0, 591.0, 1129.0, 583.0, 275.0, 177.0, 129.0, 79.0, 51.0, 29.0, 21.0, 18.0, 13.0, 14.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58056640625, -0.5568389892578125, -0.533111572265625, -0.5093841552734375, -0.48565673828125, -0.4619293212890625, -0.438201904296875, -0.4144744873046875, -0.3907470703125, -0.3670196533203125, -0.343292236328125, -0.3195648193359375, -0.29583740234375, -0.2721099853515625, -0.248382568359375, -0.2246551513671875, -0.200927734375, -0.1772003173828125, -0.153472900390625, -0.1297454833984375, -0.10601806640625, -0.0822906494140625, -0.058563232421875, -0.0348358154296875, -0.0111083984375, 0.0126190185546875, 0.036346435546875, 0.0600738525390625, 0.08380126953125, 0.1075286865234375, 0.131256103515625, 0.1549835205078125, 0.1787109375, 0.2024383544921875, 0.226165771484375, 0.2498931884765625, 0.27362060546875, 0.2973480224609375, 0.321075439453125, 0.3448028564453125, 0.3685302734375, 0.3922576904296875, 0.415985107421875, 0.4397125244140625, 0.46343994140625, 0.4871673583984375, 0.510894775390625, 0.5346221923828125, 0.558349609375, 0.5820770263671875, 0.605804443359375, 0.6295318603515625, 0.65325927734375, 0.6769866943359375, 0.700714111328125, 0.7244415283203125, 0.7481689453125, 0.7718963623046875, 0.795623779296875, 0.8193511962890625, 0.84307861328125, 0.8668060302734375, 0.890533447265625, 0.9142608642578125, 0.93798828125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 18.0, 45.0, 116.0, 210.0, 274.0, 196.0, 94.0, 32.0, 16.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.535314559936523, -21.100561141967773, -20.665809631347656, -20.231056213378906, -19.79630470275879, -19.36155128479004, -18.926799774169922, -18.492046356201172, -18.057292938232422, -17.622539520263672, -17.187788009643555, -16.753034591674805, -16.318283081054688, -15.883529663085938, -15.448777198791504, -15.01402473449707, -14.579273223876953, -14.14452075958252, -13.709768295288086, -13.275014877319336, -12.840262413024902, -12.405509948730469, -11.970757484436035, -11.536005020141602, -11.101251602172852, -10.666499137878418, -10.231746673583984, -9.796993255615234, -9.3622407913208, -8.927488327026367, -8.492735862731934, -8.0579833984375, -7.623230934143066, -7.188478469848633, -6.753725528717041, -6.318973064422607, -5.884220600128174, -5.449467658996582, -5.014715194702148, -4.579962730407715, -4.145210266113281, -3.7104575634002686, -3.275705099105835, -2.8409523963928223, -2.4061999320983887, -1.971447229385376, -1.5366945266723633, -1.1019420623779297, -0.6671891212463379, -0.23243650794029236, 0.20231610536575317, 0.6370687484741211, 1.0718213319778442, 1.5065739154815674, 1.94132661819458, 2.3760790824890137, 2.8108317852020264, 3.245584487915039, 3.6803369522094727, 4.115089416503906, 4.549842357635498, 4.984594821929932, 5.419347763061523, 5.854100227355957, 6.288852691650391]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 6.0, 6.0, 8.0, 9.0, 8.0, 10.0, 16.0, 13.0, 17.0, 25.0, 27.0, 30.0, 26.0, 42.0, 39.0, 43.0, 40.0, 49.0, 43.0, 53.0, 50.0, 39.0, 55.0, 44.0, 45.0, 39.0, 27.0, 28.0, 32.0, 18.0, 23.0, 19.0, 19.0, 11.0, 12.0, 11.0, 9.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1007704734802246, -3.01249098777771, -2.9242117404937744, -2.8359322547912598, -2.747653007507324, -2.6593735218048096, -2.571094036102295, -2.4828147888183594, -2.394535541534424, -2.306256055831909, -2.2179768085479736, -2.129697322845459, -2.0414180755615234, -1.9531385898590088, -1.8648592233657837, -1.7765798568725586, -1.688300371170044, -1.6000210046768188, -1.5117416381835938, -1.423462152481079, -1.3351829051971436, -1.246903419494629, -1.1586240530014038, -1.0703446865081787, -0.9820653200149536, -0.8937859535217285, -0.8055065870285034, -0.7172271609306335, -0.6289477944374084, -0.5406684279441833, -0.4523890018463135, -0.3641096353530884, -0.2758302688598633, -0.187550887465477, -0.0992715060710907, -0.010992109775543213, 0.07728725671768188, 0.16556662321090698, 0.25384604930877686, 0.34212541580200195, 0.43040478229522705, 0.5186841487884521, 0.6069635152816772, 0.6952429413795471, 0.7835223078727722, 0.8718016743659973, 0.9600811004638672, 1.0483604669570923, 1.1366398334503174, 1.2249191999435425, 1.3131985664367676, 1.4014780521392822, 1.4897572994232178, 1.5780367851257324, 1.6663161516189575, 1.7545955181121826, 1.8428748846054077, 1.9311542510986328, 2.0194337368011475, 2.107712984085083, 2.1959924697875977, 2.284271717071533, 2.372551202774048, 2.4608306884765625, 2.549109935760498]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 9.0, 6.0, 12.0, 21.0, 30.0, 30.0, 45.0, 72.0, 84.0, 156.0, 217.0, 343.0, 636.0, 991.0, 1786.0, 3444.0, 6692.0, 14665.0, 33751.0, 82159.0, 187305.0, 302116.0, 227786.0, 106095.0, 43556.0, 18653.0, 8358.0, 4220.0, 2169.0, 1231.0, 678.0, 407.0, 253.0, 158.0, 128.0, 80.0, 54.0, 42.0, 28.0, 23.0, 20.0, 10.0, 11.0, 5.0, 4.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.01953125, -1.957672119140625, -1.89581298828125, -1.833953857421875, -1.7720947265625, -1.710235595703125, -1.64837646484375, -1.586517333984375, -1.524658203125, -1.462799072265625, -1.40093994140625, -1.339080810546875, -1.2772216796875, -1.215362548828125, -1.15350341796875, -1.091644287109375, -1.02978515625, -0.967926025390625, -0.90606689453125, -0.844207763671875, -0.7823486328125, -0.720489501953125, -0.65863037109375, -0.596771240234375, -0.534912109375, -0.473052978515625, -0.41119384765625, -0.349334716796875, -0.2874755859375, -0.225616455078125, -0.16375732421875, -0.101898193359375, -0.0400390625, 0.021820068359375, 0.08367919921875, 0.145538330078125, 0.2073974609375, 0.269256591796875, 0.33111572265625, 0.392974853515625, 0.454833984375, 0.516693115234375, 0.57855224609375, 0.640411376953125, 0.7022705078125, 0.764129638671875, 0.82598876953125, 0.887847900390625, 0.94970703125, 1.011566162109375, 1.07342529296875, 1.135284423828125, 1.1971435546875, 1.259002685546875, 1.32086181640625, 1.382720947265625, 1.444580078125, 1.506439208984375, 1.56829833984375, 1.630157470703125, 1.6920166015625, 1.753875732421875, 1.81573486328125, 1.877593994140625, 1.939453125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 4.0, 7.0, 11.0, 16.0, 22.0, 34.0, 38.0, 43.0, 51.0, 69.0, 60.0, 71.0, 71.0, 72.0, 80.0, 60.0, 61.0, 47.0, 49.0, 33.0, 31.0, 30.0, 9.0, 4.0, 9.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.456298828125, -0.4423942565917969, -0.42848968505859375, -0.4145851135253906, -0.4006805419921875, -0.3867759704589844, -0.37287139892578125, -0.3589668273925781, -0.345062255859375, -0.3311576843261719, -0.31725311279296875, -0.3033485412597656, -0.2894439697265625, -0.2755393981933594, -0.26163482666015625, -0.24773025512695312, -0.23382568359375, -0.21992111206054688, -0.20601654052734375, -0.19211196899414062, -0.1782073974609375, -0.16430282592773438, -0.15039825439453125, -0.13649368286132812, -0.122589111328125, -0.10868453979492188, -0.09477996826171875, -0.08087539672851562, -0.0669708251953125, -0.053066253662109375, -0.03916168212890625, -0.025257110595703125, -0.0113525390625, 0.002552032470703125, 0.01645660400390625, 0.030361175537109375, 0.0442657470703125, 0.058170318603515625, 0.07207489013671875, 0.08597946166992188, 0.099884033203125, 0.11378860473632812, 0.12769317626953125, 0.14159774780273438, 0.1555023193359375, 0.16940689086914062, 0.18331146240234375, 0.19721603393554688, 0.21112060546875, 0.22502517700195312, 0.23892974853515625, 0.2528343200683594, 0.2667388916015625, 0.2806434631347656, 0.29454803466796875, 0.3084526062011719, 0.322357177734375, 0.3362617492675781, 0.35016632080078125, 0.3640708923339844, 0.3779754638671875, 0.3918800354003906, 0.40578460693359375, 0.4196891784667969, 0.43359375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 10.0, 6.0, 8.0, 11.0, 21.0, 41.0, 53.0, 67.0, 88.0, 134.0, 203.0, 308.0, 524.0, 902.0, 1406.0, 2471.0, 4534.0, 8628.0, 16862.0, 33800.0, 68506.0, 127343.0, 205084.0, 231005.0, 161833.0, 90576.0, 46028.0, 22808.0, 11513.0, 5987.0, 3101.0, 1829.0, 1043.0, 655.0, 391.0, 233.0, 172.0, 138.0, 72.0, 50.0, 34.0, 29.0, 13.0, 15.0, 7.0, 4.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.154296875, -1.11846923828125, -1.0826416015625, -1.04681396484375, -1.010986328125, -0.97515869140625, -0.9393310546875, -0.90350341796875, -0.86767578125, -0.83184814453125, -0.7960205078125, -0.76019287109375, -0.724365234375, -0.68853759765625, -0.6527099609375, -0.61688232421875, -0.5810546875, -0.54522705078125, -0.5093994140625, -0.47357177734375, -0.437744140625, -0.40191650390625, -0.3660888671875, -0.33026123046875, -0.29443359375, -0.25860595703125, -0.2227783203125, -0.18695068359375, -0.151123046875, -0.11529541015625, -0.0794677734375, -0.04364013671875, -0.0078125, 0.02801513671875, 0.0638427734375, 0.09967041015625, 0.135498046875, 0.17132568359375, 0.2071533203125, 0.24298095703125, 0.27880859375, 0.31463623046875, 0.3504638671875, 0.38629150390625, 0.422119140625, 0.45794677734375, 0.4937744140625, 0.52960205078125, 0.5654296875, 0.60125732421875, 0.6370849609375, 0.67291259765625, 0.708740234375, 0.74456787109375, 0.7803955078125, 0.81622314453125, 0.85205078125, 0.88787841796875, 0.9237060546875, 0.95953369140625, 0.995361328125, 1.03118896484375, 1.0670166015625, 1.10284423828125, 1.138671875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 4.0, 10.0, 11.0, 13.0, 9.0, 6.0, 14.0, 14.0, 16.0, 15.0, 26.0, 30.0, 34.0, 32.0, 33.0, 34.0, 26.0, 49.0, 43.0, 39.0, 38.0, 46.0, 38.0, 41.0, 37.0, 39.0, 30.0, 39.0, 22.0, 29.0, 21.0, 23.0, 18.0, 36.0, 13.0, 16.0, 6.0, 6.0, 9.0, 10.0, 2.0, 7.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0], "bins": [-1.1728515625, -1.1381683349609375, -1.103485107421875, -1.0688018798828125, -1.03411865234375, -0.9994354248046875, -0.964752197265625, -0.9300689697265625, -0.8953857421875, -0.8607025146484375, -0.826019287109375, -0.7913360595703125, -0.75665283203125, -0.7219696044921875, -0.687286376953125, -0.6526031494140625, -0.617919921875, -0.5832366943359375, -0.548553466796875, -0.5138702392578125, -0.47918701171875, -0.4445037841796875, -0.409820556640625, -0.3751373291015625, -0.3404541015625, -0.3057708740234375, -0.271087646484375, -0.2364044189453125, -0.20172119140625, -0.1670379638671875, -0.132354736328125, -0.0976715087890625, -0.06298828125, -0.0283050537109375, 0.006378173828125, 0.0410614013671875, 0.07574462890625, 0.1104278564453125, 0.145111083984375, 0.1797943115234375, 0.2144775390625, 0.2491607666015625, 0.283843994140625, 0.3185272216796875, 0.35321044921875, 0.3878936767578125, 0.422576904296875, 0.4572601318359375, 0.491943359375, 0.5266265869140625, 0.561309814453125, 0.5959930419921875, 0.63067626953125, 0.6653594970703125, 0.700042724609375, 0.7347259521484375, 0.7694091796875, 0.8040924072265625, 0.838775634765625, 0.8734588623046875, 0.90814208984375, 0.9428253173828125, 0.977508544921875, 1.0121917724609375, 1.046875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 9.0, 6.0, 17.0, 30.0, 63.0, 108.0, 233.0, 470.0, 1008.0, 2745.0, 8236.0, 30890.0, 187458.0, 640891.0, 140018.0, 25278.0, 6907.0, 2405.0, 951.0, 392.0, 199.0, 103.0, 54.0, 37.0, 15.0, 14.0, 6.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1796875, -2.1144866943359375, -2.049285888671875, -1.9840850830078125, -1.91888427734375, -1.8536834716796875, -1.788482666015625, -1.7232818603515625, -1.6580810546875, -1.5928802490234375, -1.527679443359375, -1.4624786376953125, -1.39727783203125, -1.3320770263671875, -1.266876220703125, -1.2016754150390625, -1.136474609375, -1.0712738037109375, -1.006072998046875, -0.9408721923828125, -0.87567138671875, -0.8104705810546875, -0.745269775390625, -0.6800689697265625, -0.6148681640625, -0.5496673583984375, -0.484466552734375, -0.4192657470703125, -0.35406494140625, -0.2888641357421875, -0.223663330078125, -0.1584625244140625, -0.09326171875, -0.0280609130859375, 0.037139892578125, 0.1023406982421875, 0.16754150390625, 0.2327423095703125, 0.297943115234375, 0.3631439208984375, 0.4283447265625, 0.4935455322265625, 0.558746337890625, 0.6239471435546875, 0.68914794921875, 0.7543487548828125, 0.819549560546875, 0.8847503662109375, 0.949951171875, 1.0151519775390625, 1.080352783203125, 1.1455535888671875, 1.21075439453125, 1.2759552001953125, 1.341156005859375, 1.4063568115234375, 1.4715576171875, 1.5367584228515625, 1.601959228515625, 1.6671600341796875, 1.73236083984375, 1.7975616455078125, 1.862762451171875, 1.9279632568359375, 1.9931640625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 4.0, 5.0, 12.0, 8.0, 7.0, 9.0, 14.0, 30.0, 30.0, 47.0, 51.0, 55.0, 86.0, 101.0, 104.0, 88.0, 75.0, 71.0, 50.0, 31.0, 24.0, 19.0, 15.0, 13.0, 7.0, 7.0, 5.0, 4.0, 6.0, 3.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00019347667694091797, -0.00018615461885929108, -0.00017883256077766418, -0.0001715105026960373, -0.0001641884446144104, -0.0001568663865327835, -0.00014954432845115662, -0.00014222227036952972, -0.00013490021228790283, -0.00012757815420627594, -0.00012025609612464905, -0.00011293403804302216, -0.00010561197996139526, -9.828992187976837e-05, -9.096786379814148e-05, -8.364580571651459e-05, -7.63237476348877e-05, -6.90016895532608e-05, -6.167963147163391e-05, -5.435757339000702e-05, -4.703551530838013e-05, -3.9713457226753235e-05, -3.239139914512634e-05, -2.506934106349945e-05, -1.774728298187256e-05, -1.0425224900245667e-05, -3.1031668186187744e-06, 4.218891263008118e-06, 1.154094934463501e-05, 1.8863007426261902e-05, 2.6185065507888794e-05, 3.3507123589515686e-05, 4.082918167114258e-05, 4.815123975276947e-05, 5.547329783439636e-05, 6.279535591602325e-05, 7.011741399765015e-05, 7.743947207927704e-05, 8.476153016090393e-05, 9.208358824253082e-05, 9.940564632415771e-05, 0.00010672770440578461, 0.0001140497624874115, 0.00012137182056903839, 0.00012869387865066528, 0.00013601593673229218, 0.00014333799481391907, 0.00015066005289554596, 0.00015798211097717285, 0.00016530416905879974, 0.00017262622714042664, 0.00017994828522205353, 0.00018727034330368042, 0.0001945924013853073, 0.0002019144594669342, 0.0002092365175485611, 0.000216558575630188, 0.00022388063371181488, 0.00023120269179344177, 0.00023852474987506866, 0.00024584680795669556, 0.00025316886603832245, 0.00026049092411994934, 0.00026781298220157623, 0.0002751350402832031]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 4.0, 9.0, 8.0, 17.0, 11.0, 31.0, 44.0, 56.0, 89.0, 116.0, 202.0, 335.0, 645.0, 1219.0, 2611.0, 5583.0, 14043.0, 39785.0, 145121.0, 479978.0, 258531.0, 64058.0, 20863.0, 8030.0, 3520.0, 1586.0, 878.0, 447.0, 268.0, 159.0, 106.0, 72.0, 33.0, 22.0, 25.0, 14.0, 9.0, 7.0, 10.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.259765625, -1.21734619140625, -1.1749267578125, -1.13250732421875, -1.090087890625, -1.04766845703125, -1.0052490234375, -0.96282958984375, -0.92041015625, -0.87799072265625, -0.8355712890625, -0.79315185546875, -0.750732421875, -0.70831298828125, -0.6658935546875, -0.62347412109375, -0.5810546875, -0.53863525390625, -0.4962158203125, -0.45379638671875, -0.411376953125, -0.36895751953125, -0.3265380859375, -0.28411865234375, -0.24169921875, -0.19927978515625, -0.1568603515625, -0.11444091796875, -0.072021484375, -0.02960205078125, 0.0128173828125, 0.05523681640625, 0.09765625, 0.14007568359375, 0.1824951171875, 0.22491455078125, 0.267333984375, 0.30975341796875, 0.3521728515625, 0.39459228515625, 0.43701171875, 0.47943115234375, 0.5218505859375, 0.56427001953125, 0.606689453125, 0.64910888671875, 0.6915283203125, 0.73394775390625, 0.7763671875, 0.81878662109375, 0.8612060546875, 0.90362548828125, 0.946044921875, 0.98846435546875, 1.0308837890625, 1.07330322265625, 1.11572265625, 1.15814208984375, 1.2005615234375, 1.24298095703125, 1.285400390625, 1.32781982421875, 1.3702392578125, 1.41265869140625, 1.455078125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 6.0, 2.0, 7.0, 5.0, 5.0, 14.0, 18.0, 20.0, 22.0, 29.0, 40.0, 56.0, 66.0, 101.0, 102.0, 108.0, 88.0, 80.0, 64.0, 45.0, 31.0, 18.0, 17.0, 11.0, 10.0, 8.0, 6.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.185546875, -1.1433258056640625, -1.101104736328125, -1.0588836669921875, -1.01666259765625, -0.9744415283203125, -0.932220458984375, -0.8899993896484375, -0.8477783203125, -0.8055572509765625, -0.763336181640625, -0.7211151123046875, -0.67889404296875, -0.6366729736328125, -0.594451904296875, -0.5522308349609375, -0.510009765625, -0.4677886962890625, -0.425567626953125, -0.3833465576171875, -0.34112548828125, -0.2989044189453125, -0.256683349609375, -0.2144622802734375, -0.1722412109375, -0.1300201416015625, -0.087799072265625, -0.0455780029296875, -0.00335693359375, 0.0388641357421875, 0.081085205078125, 0.1233062744140625, 0.16552734375, 0.2077484130859375, 0.249969482421875, 0.2921905517578125, 0.33441162109375, 0.3766326904296875, 0.418853759765625, 0.4610748291015625, 0.5032958984375, 0.5455169677734375, 0.587738037109375, 0.6299591064453125, 0.67218017578125, 0.7144012451171875, 0.756622314453125, 0.7988433837890625, 0.841064453125, 0.8832855224609375, 0.925506591796875, 0.9677276611328125, 1.00994873046875, 1.0521697998046875, 1.094390869140625, 1.1366119384765625, 1.1788330078125, 1.2210540771484375, 1.263275146484375, 1.3054962158203125, 1.34771728515625, 1.3899383544921875, 1.432159423828125, 1.4743804931640625, 1.5166015625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 19.0, 50.0, 113.0, 198.0, 216.0, 191.0, 109.0, 48.0, 19.0, 15.0, 8.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.15909194946289, -18.298742294311523, -17.438390731811523, -16.578041076660156, -15.717690467834473, -14.857339859008789, -13.996990203857422, -13.136639595031738, -12.276288986206055, -11.415938377380371, -10.555588722229004, -9.69523811340332, -8.834887504577637, -7.974537372589111, -7.114187240600586, -6.253836631774902, -5.393486976623535, -4.53313684463501, -3.672786235809326, -2.812436103820801, -1.9520857334136963, -1.0917353630065918, -0.2313852310180664, 0.6289653778076172, 1.4893155097961426, 2.349665880203247, 3.2100162506103516, 4.070366382598877, 4.930716514587402, 5.791067123413086, 6.651417255401611, 7.511767864227295, 8.37211799621582, 9.232468605041504, 10.092818260192871, 10.953168869018555, 11.813519477844238, 12.673870086669922, 13.534219741821289, 14.394570350646973, 15.254920959472656, 16.115270614624023, 16.975622177124023, 17.83597183227539, 18.696321487426758, 19.556673049926758, 20.417022705078125, 21.277374267578125, 22.13772201538086, 22.998071670532227, 23.858423233032227, 24.718772888183594, 25.57912254333496, 26.43947410583496, 27.299823760986328, 28.160175323486328, 29.020524978637695, 29.880874633789062, 30.741226196289062, 31.60157585144043, 32.4619255065918, 33.3222770690918, 34.18262481689453, 35.04297637939453, 35.90332794189453]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 4.0, 2.0, 7.0, 6.0, 11.0, 9.0, 15.0, 13.0, 21.0, 28.0, 25.0, 20.0, 27.0, 41.0, 42.0, 43.0, 52.0, 44.0, 54.0, 43.0, 46.0, 42.0, 44.0, 40.0, 42.0, 34.0, 29.0, 29.0, 26.0, 24.0, 25.0, 28.0, 23.0, 9.0, 15.0, 8.0, 7.0, 2.0, 3.0, 7.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.809619903564453, -7.565699100494385, -7.321778297424316, -7.077857494354248, -6.83393669128418, -6.590015888214111, -6.346095085144043, -6.102173805236816, -5.858253479003906, -5.614332675933838, -5.3704118728637695, -5.126491069793701, -4.882570266723633, -4.6386494636535645, -4.394728660583496, -4.1508073806762695, -3.906886577606201, -3.662965774536133, -3.4190449714660645, -3.175124168395996, -2.9312033653259277, -2.6872825622558594, -2.443361520767212, -2.1994407176971436, -1.9555199146270752, -1.7115991115570068, -1.4676783084869385, -1.2237573862075806, -0.9798365831375122, -0.7359157800674438, -0.49199485778808594, -0.24807405471801758, -0.004152774810791016, 0.23976805806159973, 0.4836888909339905, 0.7276097536087036, 0.971530556678772, 1.2154513597488403, 1.4593722820281982, 1.7032930850982666, 1.947213888168335, 2.1911346912384033, 2.4350554943084717, 2.678976535797119, 2.9228973388671875, 3.166818141937256, 3.410738945007324, 3.6546597480773926, 3.898580551147461, 4.142501354217529, 4.386422157287598, 4.630342960357666, 4.874263763427734, 5.118184566497803, 5.362105369567871, 5.606026649475098, 5.849946975708008, 6.093867778778076, 6.3377885818481445, 6.581709384918213, 6.825630187988281, 7.06955099105835, 7.313471794128418, 7.5573930740356445, 7.801313877105713]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 11.0, 5.0, 6.0, 9.0, 23.0, 19.0, 22.0, 39.0, 73.0, 82.0, 111.0, 165.0, 244.0, 425.0, 710.0, 1232.0, 2357.0, 4910.0, 11667.0, 35918.0, 168183.0, 2980113.0, 854387.0, 93992.0, 23971.0, 8313.0, 3447.0, 1730.0, 878.0, 486.0, 263.0, 155.0, 110.0, 65.0, 39.0, 35.0, 25.0, 14.0, 15.0, 14.0, 5.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.873046875, -2.788116455078125, -2.70318603515625, -2.618255615234375, -2.5333251953125, -2.448394775390625, -2.36346435546875, -2.278533935546875, -2.193603515625, -2.108673095703125, -2.02374267578125, -1.938812255859375, -1.8538818359375, -1.768951416015625, -1.68402099609375, -1.599090576171875, -1.51416015625, -1.429229736328125, -1.34429931640625, -1.259368896484375, -1.1744384765625, -1.089508056640625, -1.00457763671875, -0.919647216796875, -0.834716796875, -0.749786376953125, -0.66485595703125, -0.579925537109375, -0.4949951171875, -0.410064697265625, -0.32513427734375, -0.240203857421875, -0.1552734375, -0.070343017578125, 0.01458740234375, 0.099517822265625, 0.1844482421875, 0.269378662109375, 0.35430908203125, 0.439239501953125, 0.524169921875, 0.609100341796875, 0.69403076171875, 0.778961181640625, 0.8638916015625, 0.948822021484375, 1.03375244140625, 1.118682861328125, 1.20361328125, 1.288543701171875, 1.37347412109375, 1.458404541015625, 1.5433349609375, 1.628265380859375, 1.71319580078125, 1.798126220703125, 1.883056640625, 1.967987060546875, 2.05291748046875, 2.137847900390625, 2.2227783203125, 2.307708740234375, 2.39263916015625, 2.477569580078125, 2.5625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 1.0, 4.0, 11.0, 10.0, 12.0, 13.0, 16.0, 20.0, 33.0, 42.0, 52.0, 58.0, 61.0, 72.0, 84.0, 71.0, 72.0, 58.0, 61.0, 52.0, 35.0, 39.0, 40.0, 22.0, 23.0, 11.0, 7.0, 5.0, 4.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.439697265625, -0.4260101318359375, -0.412322998046875, -0.3986358642578125, -0.38494873046875, -0.3712615966796875, -0.357574462890625, -0.3438873291015625, -0.3302001953125, -0.3165130615234375, -0.302825927734375, -0.2891387939453125, -0.27545166015625, -0.2617645263671875, -0.248077392578125, -0.2343902587890625, -0.220703125, -0.2070159912109375, -0.193328857421875, -0.1796417236328125, -0.16595458984375, -0.1522674560546875, -0.138580322265625, -0.1248931884765625, -0.1112060546875, -0.0975189208984375, -0.083831787109375, -0.0701446533203125, -0.05645751953125, -0.0427703857421875, -0.029083251953125, -0.0153961181640625, -0.001708984375, 0.0119781494140625, 0.025665283203125, 0.0393524169921875, 0.05303955078125, 0.0667266845703125, 0.080413818359375, 0.0941009521484375, 0.1077880859375, 0.1214752197265625, 0.135162353515625, 0.1488494873046875, 0.16253662109375, 0.1762237548828125, 0.189910888671875, 0.2035980224609375, 0.21728515625, 0.2309722900390625, 0.244659423828125, 0.2583465576171875, 0.27203369140625, 0.2857208251953125, 0.299407958984375, 0.3130950927734375, 0.3267822265625, 0.3404693603515625, 0.354156494140625, 0.3678436279296875, 0.38153076171875, 0.3952178955078125, 0.408905029296875, 0.4225921630859375, 0.436279296875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 5.0, 9.0, 8.0, 14.0, 16.0, 27.0, 35.0, 57.0, 98.0, 153.0, 273.0, 531.0, 1042.0, 2374.0, 5871.0, 16451.0, 52858.0, 222127.0, 1991800.0, 1625616.0, 200845.0, 48931.0, 15146.0, 5596.0, 2220.0, 1012.0, 521.0, 244.0, 149.0, 86.0, 59.0, 38.0, 17.0, 15.0, 13.0, 18.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7890625, -1.72509765625, -1.6611328125, -1.59716796875, -1.533203125, -1.46923828125, -1.4052734375, -1.34130859375, -1.27734375, -1.21337890625, -1.1494140625, -1.08544921875, -1.021484375, -0.95751953125, -0.8935546875, -0.82958984375, -0.765625, -0.70166015625, -0.6376953125, -0.57373046875, -0.509765625, -0.44580078125, -0.3818359375, -0.31787109375, -0.25390625, -0.18994140625, -0.1259765625, -0.06201171875, 0.001953125, 0.06591796875, 0.1298828125, 0.19384765625, 0.2578125, 0.32177734375, 0.3857421875, 0.44970703125, 0.513671875, 0.57763671875, 0.6416015625, 0.70556640625, 0.76953125, 0.83349609375, 0.8974609375, 0.96142578125, 1.025390625, 1.08935546875, 1.1533203125, 1.21728515625, 1.28125, 1.34521484375, 1.4091796875, 1.47314453125, 1.537109375, 1.60107421875, 1.6650390625, 1.72900390625, 1.79296875, 1.85693359375, 1.9208984375, 1.98486328125, 2.048828125, 2.11279296875, 2.1767578125, 2.24072265625, 2.3046875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 6.0, 1.0, 0.0, 4.0, 7.0, 5.0, 10.0, 20.0, 26.0, 40.0, 39.0, 72.0, 114.0, 151.0, 279.0, 462.0, 841.0, 829.0, 439.0, 251.0, 155.0, 108.0, 67.0, 50.0, 34.0, 24.0, 12.0, 11.0, 10.0, 6.0, 4.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.09765625, -1.0687332153320312, -1.0398101806640625, -1.0108871459960938, -0.981964111328125, -0.9530410766601562, -0.9241180419921875, -0.8951950073242188, -0.86627197265625, -0.8373489379882812, -0.8084259033203125, -0.7795028686523438, -0.750579833984375, -0.7216567993164062, -0.6927337646484375, -0.6638107299804688, -0.6348876953125, -0.6059646606445312, -0.5770416259765625, -0.5481185913085938, -0.519195556640625, -0.49027252197265625, -0.4613494873046875, -0.43242645263671875, -0.40350341796875, -0.37458038330078125, -0.3456573486328125, -0.31673431396484375, -0.287811279296875, -0.25888824462890625, -0.2299652099609375, -0.20104217529296875, -0.172119140625, -0.14319610595703125, -0.1142730712890625, -0.08535003662109375, -0.056427001953125, -0.02750396728515625, 0.0014190673828125, 0.03034210205078125, 0.05926513671875, 0.08818817138671875, 0.1171112060546875, 0.14603424072265625, 0.174957275390625, 0.20388031005859375, 0.2328033447265625, 0.26172637939453125, 0.2906494140625, 0.31957244873046875, 0.3484954833984375, 0.37741851806640625, 0.406341552734375, 0.43526458740234375, 0.4641876220703125, 0.49311065673828125, 0.52203369140625, 0.5509567260742188, 0.5798797607421875, 0.6088027954101562, 0.637725830078125, 0.6666488647460938, 0.6955718994140625, 0.7244949340820312, 0.75341796875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 6.0, 8.0, 24.0, 28.0, 57.0, 115.0, 147.0, 191.0, 150.0, 122.0, 63.0, 43.0, 20.0, 16.0, 6.0, 4.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.450633525848389, -4.122186660766602, -3.7937397956848145, -3.4652931690216064, -3.1368463039398193, -2.8083994388580322, -2.479952812194824, -2.151505947113037, -1.82305908203125, -1.494612216949463, -1.1661654710769653, -0.837718665599823, -0.5092718601226807, -0.18082499504089355, 0.147621750831604, 0.47606849670410156, 0.8045153617858887, 1.1329622268676758, 1.4614089727401733, 1.789855718612671, 2.118302583694458, 2.446749448776245, 2.775196075439453, 3.1036429405212402, 3.4320898056030273, 3.7605366706848145, 4.088983535766602, 4.417430400848389, 4.745877265930176, 5.074323654174805, 5.402770519256592, 5.731217384338379, 6.059663772583008, 6.388110637664795, 6.716557502746582, 7.045004367828369, 7.373451232910156, 7.701897621154785, 8.03034496307373, 8.35879135131836, 8.687238693237305, 9.015685081481934, 9.344132423400879, 9.672578811645508, 10.001026153564453, 10.329472541809082, 10.657919883728027, 10.986366271972656, 11.314812660217285, 11.643259048461914, 11.97170639038086, 12.300152778625488, 12.628600120544434, 12.957046508789062, 13.285493850708008, 13.613940238952637, 13.942386627197266, 14.270833015441895, 14.59928035736084, 14.927726745605469, 15.256174087524414, 15.584620475769043, 15.913067817687988, 16.241514205932617, 16.569961547851562]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 8.0, 6.0, 7.0, 13.0, 10.0, 18.0, 15.0, 18.0, 23.0, 27.0, 29.0, 27.0, 32.0, 44.0, 39.0, 41.0, 52.0, 53.0, 63.0, 53.0, 45.0, 50.0, 40.0, 37.0, 34.0, 42.0, 25.0, 35.0, 21.0, 17.0, 14.0, 21.0, 12.0, 8.0, 8.0, 7.0, 4.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7309255599975586, -2.617586851119995, -2.5042481422424316, -2.390909433364868, -2.2775707244873047, -2.164232015609741, -2.0508933067321777, -1.9375545978546143, -1.8242158889770508, -1.7108771800994873, -1.5975384712219238, -1.4841997623443604, -1.3708610534667969, -1.2575223445892334, -1.14418363571167, -1.0308449268341064, -0.917506217956543, -0.8041675090789795, -0.690828800201416, -0.5774900913238525, -0.46415138244628906, -0.3508126735687256, -0.2374739646911621, -0.12413525581359863, -0.010796546936035156, 0.10254216194152832, 0.2158808708190918, 0.3292195796966553, 0.44255828857421875, 0.5558969974517822, 0.6692357063293457, 0.7825744152069092, 0.8959131240844727, 1.0092518329620361, 1.1225905418395996, 1.235929250717163, 1.3492679595947266, 1.46260666847229, 1.5759453773498535, 1.689284086227417, 1.8026227951049805, 1.915961503982544, 2.0293002128601074, 2.142638921737671, 2.2559776306152344, 2.369316339492798, 2.4826550483703613, 2.595993757247925, 2.7093324661254883, 2.8226711750030518, 2.9360098838806152, 3.0493485927581787, 3.162687301635742, 3.2760260105133057, 3.389364719390869, 3.5027034282684326, 3.616042137145996, 3.7293808460235596, 3.842719554901123, 3.9560582637786865, 4.06939697265625, 4.182735443115234, 4.296074390411377, 4.4094133377075195, 4.522751808166504]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 2.0, 5.0, 4.0, 9.0, 8.0, 16.0, 14.0, 21.0, 37.0, 37.0, 49.0, 88.0, 126.0, 190.0, 313.0, 456.0, 744.0, 1337.0, 2624.0, 5546.0, 12234.0, 29000.0, 73541.0, 207259.0, 403534.0, 192265.0, 69257.0, 27172.0, 11572.0, 5246.0, 2528.0, 1328.0, 765.0, 429.0, 268.0, 144.0, 129.0, 65.0, 55.0, 39.0, 30.0, 21.0, 17.0, 10.0, 9.0, 3.0, 4.0, 6.0, 1.0, 2.0, 3.0, 1.0], "bins": [-2.30078125, -2.2376861572265625, -2.174591064453125, -2.1114959716796875, -2.04840087890625, -1.9853057861328125, -1.922210693359375, -1.8591156005859375, -1.7960205078125, -1.7329254150390625, -1.669830322265625, -1.6067352294921875, -1.54364013671875, -1.4805450439453125, -1.417449951171875, -1.3543548583984375, -1.291259765625, -1.2281646728515625, -1.165069580078125, -1.1019744873046875, -1.03887939453125, -0.9757843017578125, -0.912689208984375, -0.8495941162109375, -0.7864990234375, -0.7234039306640625, -0.660308837890625, -0.5972137451171875, -0.53411865234375, -0.4710235595703125, -0.407928466796875, -0.3448333740234375, -0.28173828125, -0.2186431884765625, -0.155548095703125, -0.0924530029296875, -0.02935791015625, 0.0337371826171875, 0.096832275390625, 0.1599273681640625, 0.2230224609375, 0.2861175537109375, 0.349212646484375, 0.4123077392578125, 0.47540283203125, 0.5384979248046875, 0.601593017578125, 0.6646881103515625, 0.727783203125, 0.7908782958984375, 0.853973388671875, 0.9170684814453125, 0.98016357421875, 1.0432586669921875, 1.106353759765625, 1.1694488525390625, 1.2325439453125, 1.2956390380859375, 1.358734130859375, 1.4218292236328125, 1.48492431640625, 1.5480194091796875, 1.611114501953125, 1.6742095947265625, 1.7373046875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 13.0, 8.0, 3.0, 11.0, 8.0, 19.0, 30.0, 30.0, 36.0, 48.0, 52.0, 67.0, 70.0, 71.0, 88.0, 56.0, 58.0, 67.0, 73.0, 51.0, 39.0, 24.0, 20.0, 24.0, 9.0, 9.0, 7.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4912109375, -0.4764671325683594, -0.46172332763671875, -0.4469795227050781, -0.4322357177734375, -0.4174919128417969, -0.40274810791015625, -0.3880043029785156, -0.373260498046875, -0.3585166931152344, -0.34377288818359375, -0.3290290832519531, -0.3142852783203125, -0.2995414733886719, -0.28479766845703125, -0.2700538635253906, -0.25531005859375, -0.24056625366210938, -0.22582244873046875, -0.21107864379882812, -0.1963348388671875, -0.18159103393554688, -0.16684722900390625, -0.15210342407226562, -0.137359619140625, -0.12261581420898438, -0.10787200927734375, -0.09312820434570312, -0.0783843994140625, -0.06364059448242188, -0.04889678955078125, -0.034152984619140625, -0.0194091796875, -0.004665374755859375, 0.01007843017578125, 0.024822235107421875, 0.0395660400390625, 0.054309844970703125, 0.06905364990234375, 0.08379745483398438, 0.098541259765625, 0.11328506469726562, 0.12802886962890625, 0.14277267456054688, 0.1575164794921875, 0.17226028442382812, 0.18700408935546875, 0.20174789428710938, 0.21649169921875, 0.23123550415039062, 0.24597930908203125, 0.2607231140136719, 0.2754669189453125, 0.2902107238769531, 0.30495452880859375, 0.3196983337402344, 0.334442138671875, 0.3491859436035156, 0.36392974853515625, 0.3786735534667969, 0.3934173583984375, 0.4081611633300781, 0.42290496826171875, 0.4376487731933594, 0.452392578125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 7.0, 9.0, 11.0, 14.0, 20.0, 25.0, 31.0, 42.0, 64.0, 98.0, 131.0, 204.0, 303.0, 495.0, 816.0, 1371.0, 2524.0, 4912.0, 10110.0, 21264.0, 46294.0, 102770.0, 225322.0, 310893.0, 174170.0, 77723.0, 35481.0, 16516.0, 7833.0, 3944.0, 2058.0, 1145.0, 680.0, 402.0, 267.0, 192.0, 100.0, 76.0, 64.0, 49.0, 41.0, 19.0, 19.0, 8.0, 13.0, 6.0, 4.0, 2.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.25, -1.2087860107421875, -1.167572021484375, -1.1263580322265625, -1.08514404296875, -1.0439300537109375, -1.002716064453125, -0.9615020751953125, -0.9202880859375, -0.8790740966796875, -0.837860107421875, -0.7966461181640625, -0.75543212890625, -0.7142181396484375, -0.673004150390625, -0.6317901611328125, -0.590576171875, -0.5493621826171875, -0.508148193359375, -0.4669342041015625, -0.42572021484375, -0.3845062255859375, -0.343292236328125, -0.3020782470703125, -0.2608642578125, -0.2196502685546875, -0.178436279296875, -0.1372222900390625, -0.09600830078125, -0.0547943115234375, -0.013580322265625, 0.0276336669921875, 0.06884765625, 0.1100616455078125, 0.151275634765625, 0.1924896240234375, 0.23370361328125, 0.2749176025390625, 0.316131591796875, 0.3573455810546875, 0.3985595703125, 0.4397735595703125, 0.480987548828125, 0.5222015380859375, 0.56341552734375, 0.6046295166015625, 0.645843505859375, 0.6870574951171875, 0.728271484375, 0.7694854736328125, 0.810699462890625, 0.8519134521484375, 0.89312744140625, 0.9343414306640625, 0.975555419921875, 1.0167694091796875, 1.0579833984375, 1.0991973876953125, 1.140411376953125, 1.1816253662109375, 1.22283935546875, 1.2640533447265625, 1.305267333984375, 1.3464813232421875, 1.3876953125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 4.0, 3.0, 13.0, 10.0, 7.0, 17.0, 23.0, 14.0, 28.0, 22.0, 25.0, 37.0, 35.0, 29.0, 40.0, 41.0, 41.0, 43.0, 48.0, 45.0, 53.0, 40.0, 35.0, 45.0, 43.0, 33.0, 33.0, 32.0, 23.0, 21.0, 14.0, 21.0, 12.0, 17.0, 14.0, 11.0, 10.0, 5.0, 7.0, 1.0, 3.0, 3.0, 1.0, 1.0, 5.0, 1.0, 2.0], "bins": [-1.5, -1.459075927734375, -1.41815185546875, -1.377227783203125, -1.3363037109375, -1.295379638671875, -1.25445556640625, -1.213531494140625, -1.172607421875, -1.131683349609375, -1.09075927734375, -1.049835205078125, -1.0089111328125, -0.967987060546875, -0.92706298828125, -0.886138916015625, -0.84521484375, -0.804290771484375, -0.76336669921875, -0.722442626953125, -0.6815185546875, -0.640594482421875, -0.59967041015625, -0.558746337890625, -0.517822265625, -0.476898193359375, -0.43597412109375, -0.395050048828125, -0.3541259765625, -0.313201904296875, -0.27227783203125, -0.231353759765625, -0.1904296875, -0.149505615234375, -0.10858154296875, -0.067657470703125, -0.0267333984375, 0.014190673828125, 0.05511474609375, 0.096038818359375, 0.136962890625, 0.177886962890625, 0.21881103515625, 0.259735107421875, 0.3006591796875, 0.341583251953125, 0.38250732421875, 0.423431396484375, 0.46435546875, 0.505279541015625, 0.54620361328125, 0.587127685546875, 0.6280517578125, 0.668975830078125, 0.70989990234375, 0.750823974609375, 0.791748046875, 0.832672119140625, 0.87359619140625, 0.914520263671875, 0.9554443359375, 0.996368408203125, 1.03729248046875, 1.078216552734375, 1.119140625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 10.0, 9.0, 16.0, 22.0, 17.0, 43.0, 62.0, 89.0, 133.0, 295.0, 609.0, 1436.0, 4383.0, 15176.0, 67284.0, 487993.0, 397428.0, 54190.0, 12928.0, 3895.0, 1354.0, 508.0, 266.0, 130.0, 76.0, 51.0, 37.0, 41.0, 14.0, 16.0, 10.0, 7.0, 5.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.755859375, -1.7008819580078125, -1.645904541015625, -1.5909271240234375, -1.53594970703125, -1.4809722900390625, -1.425994873046875, -1.3710174560546875, -1.3160400390625, -1.2610626220703125, -1.206085205078125, -1.1511077880859375, -1.09613037109375, -1.0411529541015625, -0.986175537109375, -0.9311981201171875, -0.876220703125, -0.8212432861328125, -0.766265869140625, -0.7112884521484375, -0.65631103515625, -0.6013336181640625, -0.546356201171875, -0.4913787841796875, -0.4364013671875, -0.3814239501953125, -0.326446533203125, -0.2714691162109375, -0.21649169921875, -0.1615142822265625, -0.106536865234375, -0.0515594482421875, 0.00341796875, 0.0583953857421875, 0.113372802734375, 0.1683502197265625, 0.22332763671875, 0.2783050537109375, 0.333282470703125, 0.3882598876953125, 0.4432373046875, 0.4982147216796875, 0.553192138671875, 0.6081695556640625, 0.66314697265625, 0.7181243896484375, 0.773101806640625, 0.8280792236328125, 0.883056640625, 0.9380340576171875, 0.993011474609375, 1.0479888916015625, 1.10296630859375, 1.1579437255859375, 1.212921142578125, 1.2678985595703125, 1.3228759765625, 1.3778533935546875, 1.432830810546875, 1.4878082275390625, 1.54278564453125, 1.5977630615234375, 1.652740478515625, 1.7077178955078125, 1.7626953125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 5.0, 3.0, 8.0, 9.0, 14.0, 34.0, 22.0, 26.0, 42.0, 117.0, 178.0, 207.0, 138.0, 61.0, 36.0, 35.0, 11.0, 17.0, 9.0, 2.0, 7.0, 6.0, 8.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0004563331604003906, -0.000445537269115448, -0.00043474137783050537, -0.00042394548654556274, -0.0004131495952606201, -0.0004023537039756775, -0.00039155781269073486, -0.00038076192140579224, -0.0003699660301208496, -0.000359170138835907, -0.00034837424755096436, -0.00033757835626602173, -0.0003267824649810791, -0.0003159865736961365, -0.00030519068241119385, -0.0002943947911262512, -0.0002835988998413086, -0.00027280300855636597, -0.00026200711727142334, -0.0002512112259864807, -0.00024041533470153809, -0.00022961944341659546, -0.00021882355213165283, -0.0002080276608467102, -0.00019723176956176758, -0.00018643587827682495, -0.00017563998699188232, -0.0001648440957069397, -0.00015404820442199707, -0.00014325231313705444, -0.00013245642185211182, -0.00012166053056716919, -0.00011086463928222656, -0.00010006874799728394, -8.927285671234131e-05, -7.847696542739868e-05, -6.768107414245605e-05, -5.688518285751343e-05, -4.60892915725708e-05, -3.5293400287628174e-05, -2.4497509002685547e-05, -1.370161771774292e-05, -2.905726432800293e-06, 7.890164852142334e-06, 1.868605613708496e-05, 2.9481947422027588e-05, 4.0277838706970215e-05, 5.107372999191284e-05, 6.186962127685547e-05, 7.26655125617981e-05, 8.346140384674072e-05, 9.425729513168335e-05, 0.00010505318641662598, 0.0001158490777015686, 0.00012664496898651123, 0.00013744086027145386, 0.00014823675155639648, 0.0001590326428413391, 0.00016982853412628174, 0.00018062442541122437, 0.000191420316696167, 0.00020221620798110962, 0.00021301209926605225, 0.00022380799055099487, 0.0002346038818359375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 7.0, 10.0, 24.0, 21.0, 41.0, 92.0, 129.0, 268.0, 461.0, 1329.0, 6136.0, 42884.0, 696117.0, 274231.0, 21603.0, 3475.0, 912.0, 364.0, 168.0, 94.0, 65.0, 33.0, 25.0, 21.0, 12.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.578125, -2.499603271484375, -2.42108154296875, -2.342559814453125, -2.2640380859375, -2.185516357421875, -2.10699462890625, -2.028472900390625, -1.949951171875, -1.871429443359375, -1.79290771484375, -1.714385986328125, -1.6358642578125, -1.557342529296875, -1.47882080078125, -1.400299072265625, -1.32177734375, -1.243255615234375, -1.16473388671875, -1.086212158203125, -1.0076904296875, -0.929168701171875, -0.85064697265625, -0.772125244140625, -0.693603515625, -0.615081787109375, -0.53656005859375, -0.458038330078125, -0.3795166015625, -0.300994873046875, -0.22247314453125, -0.143951416015625, -0.0654296875, 0.013092041015625, 0.09161376953125, 0.170135498046875, 0.2486572265625, 0.327178955078125, 0.40570068359375, 0.484222412109375, 0.562744140625, 0.641265869140625, 0.71978759765625, 0.798309326171875, 0.8768310546875, 0.955352783203125, 1.03387451171875, 1.112396240234375, 1.19091796875, 1.269439697265625, 1.34796142578125, 1.426483154296875, 1.5050048828125, 1.583526611328125, 1.66204833984375, 1.740570068359375, 1.819091796875, 1.897613525390625, 1.97613525390625, 2.054656982421875, 2.1331787109375, 2.211700439453125, 2.29022216796875, 2.368743896484375, 2.447265625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 6.0, 7.0, 10.0, 20.0, 18.0, 29.0, 33.0, 64.0, 87.0, 115.0, 122.0, 151.0, 103.0, 79.0, 44.0, 34.0, 15.0, 18.0, 5.0, 7.0, 8.0, 7.0, 5.0, 2.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.8994140625, -1.854949951171875, -1.81048583984375, -1.766021728515625, -1.7215576171875, -1.677093505859375, -1.63262939453125, -1.588165283203125, -1.543701171875, -1.499237060546875, -1.45477294921875, -1.410308837890625, -1.3658447265625, -1.321380615234375, -1.27691650390625, -1.232452392578125, -1.18798828125, -1.143524169921875, -1.09906005859375, -1.054595947265625, -1.0101318359375, -0.965667724609375, -0.92120361328125, -0.876739501953125, -0.832275390625, -0.787811279296875, -0.74334716796875, -0.698883056640625, -0.6544189453125, -0.609954833984375, -0.56549072265625, -0.521026611328125, -0.4765625, -0.432098388671875, -0.38763427734375, -0.343170166015625, -0.2987060546875, -0.254241943359375, -0.20977783203125, -0.165313720703125, -0.120849609375, -0.076385498046875, -0.03192138671875, 0.012542724609375, 0.0570068359375, 0.101470947265625, 0.14593505859375, 0.190399169921875, 0.23486328125, 0.279327392578125, 0.32379150390625, 0.368255615234375, 0.4127197265625, 0.457183837890625, 0.50164794921875, 0.546112060546875, 0.590576171875, 0.635040283203125, 0.67950439453125, 0.723968505859375, 0.7684326171875, 0.812896728515625, 0.85736083984375, 0.901824951171875, 0.9462890625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 15.0, 25.0, 47.0, 71.0, 117.0, 143.0, 169.0, 142.0, 105.0, 70.0, 44.0, 24.0, 20.0, 3.0, 5.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.369895935058594, -26.734100341796875, -26.098304748535156, -25.462509155273438, -24.82671356201172, -24.19091796875, -23.55512237548828, -22.919326782226562, -22.283531188964844, -21.647735595703125, -21.011940002441406, -20.376144409179688, -19.74034881591797, -19.10455322265625, -18.46875762939453, -17.832962036132812, -17.19716453552246, -16.561368942260742, -15.925573348999023, -15.289777755737305, -14.653982162475586, -14.018186569213867, -13.382390022277832, -12.746594429016113, -12.110798835754395, -11.475003242492676, -10.839207649230957, -10.203412055969238, -9.567615509033203, -8.931819915771484, -8.296024322509766, -7.660228729248047, -7.0244340896606445, -6.388638496398926, -5.752842903137207, -5.11704683303833, -4.481251239776611, -3.8454556465148926, -3.2096598148345947, -2.573863983154297, -1.9380683898925781, -1.3022726774215698, -0.6664769649505615, -0.030681252479553223, 0.6051144599914551, 1.2409100532531738, 1.8767058849334717, 2.5125017166137695, 3.1482973098754883, 3.784092903137207, 4.419888496398926, 5.055684566497803, 5.6914801597595215, 6.32727575302124, 6.963071823120117, 7.598867416381836, 8.234663009643555, 8.870458602905273, 9.506254196166992, 10.142049789428711, 10.77784538269043, 11.413640975952148, 12.049437522888184, 12.685233116149902, 13.321028709411621]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 6.0, 8.0, 3.0, 5.0, 19.0, 9.0, 13.0, 9.0, 15.0, 22.0, 10.0, 18.0, 14.0, 22.0, 31.0, 26.0, 35.0, 33.0, 30.0, 47.0, 44.0, 40.0, 34.0, 45.0, 39.0, 41.0, 32.0, 36.0, 24.0, 38.0, 26.0, 31.0, 26.0, 19.0, 19.0, 22.0, 17.0, 18.0, 16.0, 17.0, 6.0, 6.0, 5.0, 7.0, 4.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.17392635345459, -5.970163345336914, -5.7664008140563965, -5.562637805938721, -5.358874797821045, -5.155112266540527, -4.951349258422852, -4.747586250305176, -4.5438232421875, -4.340060234069824, -4.136297702789307, -3.932534694671631, -3.728771686553955, -3.5250089168548584, -3.3212461471557617, -3.117483139038086, -2.9137206077575684, -2.7099578380584717, -2.506194829940796, -2.302432060241699, -2.0986690521240234, -1.8949062824249268, -1.69114351272583, -1.4873806238174438, -1.2836177349090576, -1.0798548460006714, -0.8760920166969299, -0.6723291873931885, -0.46856629848480225, -0.264803409576416, -0.061040639877319336, 0.1427222490310669, 0.3464846611022949, 0.5502475500106812, 0.7540103793144226, 0.9577732086181641, 1.1615360975265503, 1.3652989864349365, 1.5690617561340332, 1.7728246450424194, 1.9765875339508057, 2.1803503036499023, 2.384113311767578, 2.587876081466675, 2.7916388511657715, 2.9954018592834473, 3.199164628982544, 3.4029273986816406, 3.6066904067993164, 3.810453176498413, 4.01421594619751, 4.2179789543151855, 4.421741962432861, 4.625504493713379, 4.829267501831055, 5.0330305099487305, 5.236793518066406, 5.440556526184082, 5.6443190574646, 5.848082065582275, 6.051845073699951, 6.255607604980469, 6.4593706130981445, 6.66313362121582, 6.866896152496338]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 5.0, 6.0, 7.0, 8.0, 13.0, 14.0, 25.0, 39.0, 66.0, 80.0, 141.0, 243.0, 383.0, 741.0, 1548.0, 3406.0, 9453.0, 34924.0, 258512.0, 3643064.0, 196889.0, 30180.0, 8583.0, 3078.0, 1322.0, 640.0, 363.0, 210.0, 104.0, 76.0, 48.0, 32.0, 24.0, 19.0, 7.0, 11.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0], "bins": [-4.20703125, -4.088348388671875, -3.96966552734375, -3.850982666015625, -3.7322998046875, -3.613616943359375, -3.49493408203125, -3.376251220703125, -3.257568359375, -3.138885498046875, -3.02020263671875, -2.901519775390625, -2.7828369140625, -2.664154052734375, -2.54547119140625, -2.426788330078125, -2.30810546875, -2.189422607421875, -2.07073974609375, -1.952056884765625, -1.8333740234375, -1.714691162109375, -1.59600830078125, -1.477325439453125, -1.358642578125, -1.239959716796875, -1.12127685546875, -1.002593994140625, -0.8839111328125, -0.765228271484375, -0.64654541015625, -0.527862548828125, -0.4091796875, -0.290496826171875, -0.17181396484375, -0.053131103515625, 0.0655517578125, 0.184234619140625, 0.30291748046875, 0.421600341796875, 0.540283203125, 0.658966064453125, 0.77764892578125, 0.896331787109375, 1.0150146484375, 1.133697509765625, 1.25238037109375, 1.371063232421875, 1.48974609375, 1.608428955078125, 1.72711181640625, 1.845794677734375, 1.9644775390625, 2.083160400390625, 2.20184326171875, 2.320526123046875, 2.439208984375, 2.557891845703125, 2.67657470703125, 2.795257568359375, 2.9139404296875, 3.032623291015625, 3.15130615234375, 3.269989013671875, 3.388671875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 7.0, 9.0, 6.0, 8.0, 11.0, 33.0, 38.0, 30.0, 35.0, 57.0, 68.0, 72.0, 61.0, 74.0, 80.0, 59.0, 61.0, 77.0, 54.0, 35.0, 27.0, 26.0, 23.0, 13.0, 16.0, 6.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53076171875, -0.51544189453125, -0.5001220703125, -0.48480224609375, -0.469482421875, -0.45416259765625, -0.4388427734375, -0.42352294921875, -0.408203125, -0.39288330078125, -0.3775634765625, -0.36224365234375, -0.346923828125, -0.33160400390625, -0.3162841796875, -0.30096435546875, -0.28564453125, -0.27032470703125, -0.2550048828125, -0.23968505859375, -0.224365234375, -0.20904541015625, -0.1937255859375, -0.17840576171875, -0.1630859375, -0.14776611328125, -0.1324462890625, -0.11712646484375, -0.101806640625, -0.08648681640625, -0.0711669921875, -0.05584716796875, -0.04052734375, -0.02520751953125, -0.0098876953125, 0.00543212890625, 0.020751953125, 0.03607177734375, 0.0513916015625, 0.06671142578125, 0.08203125, 0.09735107421875, 0.1126708984375, 0.12799072265625, 0.143310546875, 0.15863037109375, 0.1739501953125, 0.18927001953125, 0.20458984375, 0.21990966796875, 0.2352294921875, 0.25054931640625, 0.265869140625, 0.28118896484375, 0.2965087890625, 0.31182861328125, 0.3271484375, 0.34246826171875, 0.3577880859375, 0.37310791015625, 0.388427734375, 0.40374755859375, 0.4190673828125, 0.43438720703125, 0.44970703125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 6.0, 5.0, 4.0, 5.0, 6.0, 9.0, 6.0, 11.0, 13.0, 15.0, 20.0, 29.0, 28.0, 26.0, 28.0, 45.0, 53.0, 86.0, 231.0, 727.0, 4510.0, 45975.0, 3290573.0, 822809.0, 25267.0, 2822.0, 468.0, 154.0, 75.0, 38.0, 32.0, 32.0, 22.0, 20.0, 24.0, 16.0, 20.0, 14.0, 10.0, 6.0, 9.0, 8.0, 6.0, 4.0, 2.0, 3.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0], "bins": [-5.92578125, -5.75592041015625, -5.5860595703125, -5.41619873046875, -5.246337890625, -5.07647705078125, -4.9066162109375, -4.73675537109375, -4.56689453125, -4.39703369140625, -4.2271728515625, -4.05731201171875, -3.887451171875, -3.71759033203125, -3.5477294921875, -3.37786865234375, -3.2080078125, -3.03814697265625, -2.8682861328125, -2.69842529296875, -2.528564453125, -2.35870361328125, -2.1888427734375, -2.01898193359375, -1.84912109375, -1.67926025390625, -1.5093994140625, -1.33953857421875, -1.169677734375, -0.99981689453125, -0.8299560546875, -0.66009521484375, -0.490234375, -0.32037353515625, -0.1505126953125, 0.01934814453125, 0.189208984375, 0.35906982421875, 0.5289306640625, 0.69879150390625, 0.86865234375, 1.03851318359375, 1.2083740234375, 1.37823486328125, 1.548095703125, 1.71795654296875, 1.8878173828125, 2.05767822265625, 2.2275390625, 2.39739990234375, 2.5672607421875, 2.73712158203125, 2.906982421875, 3.07684326171875, 3.2467041015625, 3.41656494140625, 3.58642578125, 3.75628662109375, 3.9261474609375, 4.09600830078125, 4.265869140625, 4.43572998046875, 4.6055908203125, 4.77545166015625, 4.9453125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 6.0, 14.0, 32.0, 33.0, 66.0, 117.0, 262.0, 727.0, 1822.0, 538.0, 238.0, 105.0, 46.0, 27.0, 18.0, 8.0, 10.0, 8.0, 1.0, 0.0, 2.0], "bins": [-2.46484375, -2.4168853759765625, -2.368927001953125, -2.3209686279296875, -2.27301025390625, -2.2250518798828125, -2.177093505859375, -2.1291351318359375, -2.0811767578125, -2.0332183837890625, -1.985260009765625, -1.9373016357421875, -1.88934326171875, -1.8413848876953125, -1.793426513671875, -1.7454681396484375, -1.697509765625, -1.6495513916015625, -1.601593017578125, -1.5536346435546875, -1.50567626953125, -1.4577178955078125, -1.409759521484375, -1.3618011474609375, -1.3138427734375, -1.2658843994140625, -1.217926025390625, -1.1699676513671875, -1.12200927734375, -1.0740509033203125, -1.026092529296875, -0.9781341552734375, -0.93017578125, -0.8822174072265625, -0.834259033203125, -0.7863006591796875, -0.73834228515625, -0.6903839111328125, -0.642425537109375, -0.5944671630859375, -0.5465087890625, -0.4985504150390625, -0.450592041015625, -0.4026336669921875, -0.35467529296875, -0.3067169189453125, -0.258758544921875, -0.2108001708984375, -0.162841796875, -0.1148834228515625, -0.066925048828125, -0.0189666748046875, 0.02899169921875, 0.0769500732421875, 0.124908447265625, 0.1728668212890625, 0.2208251953125, 0.2687835693359375, 0.316741943359375, 0.3647003173828125, 0.41265869140625, 0.4606170654296875, 0.508575439453125, 0.5565338134765625, 0.6044921875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 8.0, 2.0, 15.0, 7.0, 31.0, 48.0, 73.0, 121.0, 161.0, 163.0, 141.0, 113.0, 58.0, 30.0, 21.0, 8.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.662063598632812, -12.372052192687988, -12.08204174041748, -11.792030334472656, -11.502018928527832, -11.212007522583008, -10.9219970703125, -10.631985664367676, -10.341974258422852, -10.051962852478027, -9.76195240020752, -9.471940994262695, -9.181929588317871, -8.891918182373047, -8.601907730102539, -8.311896324157715, -8.021885871887207, -7.731874942779541, -7.441863536834717, -7.151852607727051, -6.861841201782227, -6.5718302726745605, -6.2818193435668945, -5.99180793762207, -5.701797008514404, -5.411786079406738, -5.121774673461914, -4.831763744354248, -4.541752815246582, -4.251741409301758, -3.961730480194092, -3.6717193126678467, -3.3817081451416016, -3.0916969776153564, -2.8016858100891113, -2.5116748809814453, -2.2216637134552, -1.931652545928955, -1.6416414976119995, -1.351630449295044, -1.0616192817687988, -0.7716081738471985, -0.48159706592559814, -0.1915859580039978, 0.09842514991760254, 0.38843631744384766, 0.6784473657608032, 0.9684584140777588, 1.258469581604004, 1.548480749130249, 1.8384917974472046, 2.12850284576416, 2.4185140132904053, 2.7085251808166504, 2.9985361099243164, 3.2885472774505615, 3.5785584449768066, 3.8685696125030518, 4.158580780029297, 4.448591709136963, 4.738602638244629, 5.028614044189453, 5.318624973297119, 5.608635902404785, 5.898647308349609]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 0.0, 3.0, 2.0, 9.0, 11.0, 8.0, 12.0, 17.0, 21.0, 24.0, 32.0, 30.0, 26.0, 34.0, 33.0, 34.0, 33.0, 35.0, 54.0, 45.0, 50.0, 35.0, 47.0, 57.0, 43.0, 41.0, 33.0, 28.0, 28.0, 33.0, 33.0, 22.0, 15.0, 13.0, 14.0, 12.0, 14.0, 5.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-3.935969829559326, -3.825162410736084, -3.714354991912842, -3.6035475730895996, -3.4927401542663574, -3.3819327354431152, -3.271125078201294, -3.1603176593780518, -3.0495102405548096, -2.9387028217315674, -2.827895402908325, -2.717087984085083, -2.6062803268432617, -2.4954729080200195, -2.3846654891967773, -2.273858070373535, -2.163050651550293, -2.052243232727051, -1.9414358139038086, -1.8306282758712769, -1.7198208570480347, -1.6090134382247925, -1.4982059001922607, -1.3873984813690186, -1.2765910625457764, -1.1657836437225342, -1.054976224899292, -0.9441686868667603, -0.8333612680435181, -0.7225538492202759, -0.6117463707923889, -0.500938892364502, -0.39013147354125977, -0.2793240249156952, -0.16851657629013062, -0.05770912766456604, 0.053098320960998535, 0.16390573978424072, 0.2747132182121277, 0.38552069664001465, 0.49632811546325684, 0.607135534286499, 0.717943012714386, 0.828750491142273, 0.9395579099655151, 1.0503653287887573, 1.161172866821289, 1.2719802856445312, 1.3827877044677734, 1.4935951232910156, 1.6044025421142578, 1.7152100801467896, 1.8260174989700317, 1.936824917793274, 2.0476324558258057, 2.158439874649048, 2.26924729347229, 2.3800547122955322, 2.4908621311187744, 2.6016695499420166, 2.712477207183838, 2.82328462600708, 2.9340920448303223, 3.0448994636535645, 3.1557068824768066]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 7.0, 4.0, 7.0, 11.0, 21.0, 17.0, 26.0, 36.0, 43.0, 76.0, 118.0, 178.0, 321.0, 540.0, 941.0, 2047.0, 4734.0, 12182.0, 34836.0, 107722.0, 388895.0, 349741.0, 94927.0, 31430.0, 11225.0, 4371.0, 1867.0, 863.0, 553.0, 283.0, 192.0, 109.0, 67.0, 49.0, 26.0, 23.0, 26.0, 9.0, 12.0, 4.0, 2.0, 4.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.505859375, -2.4298095703125, -2.353759765625, -2.2777099609375, -2.20166015625, -2.1256103515625, -2.049560546875, -1.9735107421875, -1.8974609375, -1.8214111328125, -1.745361328125, -1.6693115234375, -1.59326171875, -1.5172119140625, -1.441162109375, -1.3651123046875, -1.2890625, -1.2130126953125, -1.136962890625, -1.0609130859375, -0.98486328125, -0.9088134765625, -0.832763671875, -0.7567138671875, -0.6806640625, -0.6046142578125, -0.528564453125, -0.4525146484375, -0.37646484375, -0.3004150390625, -0.224365234375, -0.1483154296875, -0.072265625, 0.0037841796875, 0.079833984375, 0.1558837890625, 0.23193359375, 0.3079833984375, 0.384033203125, 0.4600830078125, 0.5361328125, 0.6121826171875, 0.688232421875, 0.7642822265625, 0.84033203125, 0.9163818359375, 0.992431640625, 1.0684814453125, 1.14453125, 1.2205810546875, 1.296630859375, 1.3726806640625, 1.44873046875, 1.5247802734375, 1.600830078125, 1.6768798828125, 1.7529296875, 1.8289794921875, 1.905029296875, 1.9810791015625, 2.05712890625, 2.1331787109375, 2.209228515625, 2.2852783203125, 2.361328125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 5.0, 6.0, 8.0, 10.0, 11.0, 16.0, 12.0, 28.0, 36.0, 36.0, 70.0, 54.0, 81.0, 72.0, 63.0, 86.0, 60.0, 67.0, 61.0, 54.0, 34.0, 34.0, 25.0, 24.0, 8.0, 9.0, 9.0, 6.0, 3.0, 5.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5986328125, -0.5823287963867188, -0.5660247802734375, -0.5497207641601562, -0.533416748046875, -0.5171127319335938, -0.5008087158203125, -0.48450469970703125, -0.46820068359375, -0.45189666748046875, -0.4355926513671875, -0.41928863525390625, -0.402984619140625, -0.38668060302734375, -0.3703765869140625, -0.35407257080078125, -0.3377685546875, -0.32146453857421875, -0.3051605224609375, -0.28885650634765625, -0.272552490234375, -0.25624847412109375, -0.2399444580078125, -0.22364044189453125, -0.20733642578125, -0.19103240966796875, -0.1747283935546875, -0.15842437744140625, -0.142120361328125, -0.12581634521484375, -0.1095123291015625, -0.09320831298828125, -0.076904296875, -0.06060028076171875, -0.0442962646484375, -0.02799224853515625, -0.011688232421875, 0.00461578369140625, 0.0209197998046875, 0.03722381591796875, 0.05352783203125, 0.06983184814453125, 0.0861358642578125, 0.10243988037109375, 0.118743896484375, 0.13504791259765625, 0.1513519287109375, 0.16765594482421875, 0.1839599609375, 0.20026397705078125, 0.2165679931640625, 0.23287200927734375, 0.249176025390625, 0.26548004150390625, 0.2817840576171875, 0.29808807373046875, 0.31439208984375, 0.33069610595703125, 0.3470001220703125, 0.36330413818359375, 0.379608154296875, 0.39591217041015625, 0.4122161865234375, 0.42852020263671875, 0.44482421875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 10.0, 14.0, 26.0, 31.0, 46.0, 92.0, 124.0, 202.0, 324.0, 603.0, 1144.0, 2413.0, 5610.0, 13783.0, 35362.0, 95742.0, 289261.0, 382076.0, 139466.0, 49143.0, 18930.0, 7713.0, 3242.0, 1451.0, 727.0, 366.0, 226.0, 148.0, 64.0, 58.0, 45.0, 28.0, 29.0, 19.0, 12.0, 9.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5234375, -1.4693603515625, -1.415283203125, -1.3612060546875, -1.30712890625, -1.2530517578125, -1.198974609375, -1.1448974609375, -1.0908203125, -1.0367431640625, -0.982666015625, -0.9285888671875, -0.87451171875, -0.8204345703125, -0.766357421875, -0.7122802734375, -0.658203125, -0.6041259765625, -0.550048828125, -0.4959716796875, -0.44189453125, -0.3878173828125, -0.333740234375, -0.2796630859375, -0.2255859375, -0.1715087890625, -0.117431640625, -0.0633544921875, -0.00927734375, 0.0447998046875, 0.098876953125, 0.1529541015625, 0.20703125, 0.2611083984375, 0.315185546875, 0.3692626953125, 0.42333984375, 0.4774169921875, 0.531494140625, 0.5855712890625, 0.6396484375, 0.6937255859375, 0.747802734375, 0.8018798828125, 0.85595703125, 0.9100341796875, 0.964111328125, 1.0181884765625, 1.072265625, 1.1263427734375, 1.180419921875, 1.2344970703125, 1.28857421875, 1.3426513671875, 1.396728515625, 1.4508056640625, 1.5048828125, 1.5589599609375, 1.613037109375, 1.6671142578125, 1.72119140625, 1.7752685546875, 1.829345703125, 1.8834228515625, 1.9375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 7.0, 8.0, 8.0, 21.0, 9.0, 17.0, 28.0, 20.0, 18.0, 23.0, 34.0, 43.0, 43.0, 43.0, 48.0, 52.0, 52.0, 38.0, 40.0, 42.0, 51.0, 38.0, 44.0, 43.0, 33.0, 29.0, 25.0, 23.0, 19.0, 17.0, 20.0, 12.0, 11.0, 10.0, 12.0, 6.0, 5.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.505859375, -1.4579315185546875, -1.410003662109375, -1.3620758056640625, -1.31414794921875, -1.2662200927734375, -1.218292236328125, -1.1703643798828125, -1.1224365234375, -1.0745086669921875, -1.026580810546875, -0.9786529541015625, -0.93072509765625, -0.8827972412109375, -0.834869384765625, -0.7869415283203125, -0.739013671875, -0.6910858154296875, -0.643157958984375, -0.5952301025390625, -0.54730224609375, -0.4993743896484375, -0.451446533203125, -0.4035186767578125, -0.3555908203125, -0.3076629638671875, -0.259735107421875, -0.2118072509765625, -0.16387939453125, -0.1159515380859375, -0.068023681640625, -0.0200958251953125, 0.02783203125, 0.0757598876953125, 0.123687744140625, 0.1716156005859375, 0.21954345703125, 0.2674713134765625, 0.315399169921875, 0.3633270263671875, 0.4112548828125, 0.4591827392578125, 0.507110595703125, 0.5550384521484375, 0.60296630859375, 0.6508941650390625, 0.698822021484375, 0.7467498779296875, 0.794677734375, 0.8426055908203125, 0.890533447265625, 0.9384613037109375, 0.98638916015625, 1.0343170166015625, 1.082244873046875, 1.1301727294921875, 1.1781005859375, 1.2260284423828125, 1.273956298828125, 1.3218841552734375, 1.36981201171875, 1.4177398681640625, 1.465667724609375, 1.5135955810546875, 1.5615234375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 6.0, 6.0, 9.0, 11.0, 22.0, 28.0, 56.0, 88.0, 140.0, 243.0, 441.0, 929.0, 2020.0, 4903.0, 14086.0, 45783.0, 173559.0, 496786.0, 224076.0, 57417.0, 17354.0, 5918.0, 2374.0, 1037.0, 559.0, 314.0, 156.0, 76.0, 53.0, 29.0, 27.0, 15.0, 12.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75732421875, -0.7277297973632812, -0.6981353759765625, -0.6685409545898438, -0.638946533203125, -0.6093521118164062, -0.5797576904296875, -0.5501632690429688, -0.52056884765625, -0.49097442626953125, -0.4613800048828125, -0.43178558349609375, -0.402191162109375, -0.37259674072265625, -0.3430023193359375, -0.31340789794921875, -0.2838134765625, -0.25421905517578125, -0.2246246337890625, -0.19503021240234375, -0.165435791015625, -0.13584136962890625, -0.1062469482421875, -0.07665252685546875, -0.04705810546875, -0.01746368408203125, 0.0121307373046875, 0.04172515869140625, 0.071319580078125, 0.10091400146484375, 0.1305084228515625, 0.16010284423828125, 0.189697265625, 0.21929168701171875, 0.2488861083984375, 0.27848052978515625, 0.308074951171875, 0.33766937255859375, 0.3672637939453125, 0.39685821533203125, 0.42645263671875, 0.45604705810546875, 0.4856414794921875, 0.5152359008789062, 0.544830322265625, 0.5744247436523438, 0.6040191650390625, 0.6336135864257812, 0.6632080078125, 0.6928024291992188, 0.7223968505859375, 0.7519912719726562, 0.781585693359375, 0.8111801147460938, 0.8407745361328125, 0.8703689575195312, 0.89996337890625, 0.9295578002929688, 0.9591522216796875, 0.9887466430664062, 1.018341064453125, 1.0479354858398438, 1.0775299072265625, 1.1071243286132812, 1.13671875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 2.0, 4.0, 4.0, 7.0, 8.0, 8.0, 16.0, 20.0, 27.0, 34.0, 45.0, 83.0, 113.0, 163.0, 138.0, 94.0, 69.0, 42.0, 31.0, 28.0, 16.0, 9.0, 11.0, 6.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022649765014648438, -0.00022001191973686218, -0.00021352618932724, -0.0002070404589176178, -0.0002005547285079956, -0.0001940689980983734, -0.00018758326768875122, -0.00018109753727912903, -0.00017461180686950684, -0.00016812607645988464, -0.00016164034605026245, -0.00015515461564064026, -0.00014866888523101807, -0.00014218315482139587, -0.00013569742441177368, -0.0001292116940021515, -0.0001227259635925293, -0.0001162402331829071, -0.00010975450277328491, -0.00010326877236366272, -9.678304195404053e-05, -9.029731154441833e-05, -8.381158113479614e-05, -7.732585072517395e-05, -7.084012031555176e-05, -6.435438990592957e-05, -5.786865949630737e-05, -5.138292908668518e-05, -4.489719867706299e-05, -3.8411468267440796e-05, -3.1925737857818604e-05, -2.544000744819641e-05, -1.895427703857422e-05, -1.2468546628952026e-05, -5.982816219329834e-06, 5.029141902923584e-07, 6.988644599914551e-06, 1.3474375009536743e-05, 1.9960105419158936e-05, 2.6445835828781128e-05, 3.293156623840332e-05, 3.941729664802551e-05, 4.5903027057647705e-05, 5.23887574672699e-05, 5.887448787689209e-05, 6.536021828651428e-05, 7.184594869613647e-05, 7.833167910575867e-05, 8.481740951538086e-05, 9.130313992500305e-05, 9.778887033462524e-05, 0.00010427460074424744, 0.00011076033115386963, 0.00011724606156349182, 0.00012373179197311401, 0.0001302175223827362, 0.0001367032527923584, 0.0001431889832019806, 0.00014967471361160278, 0.00015616044402122498, 0.00016264617443084717, 0.00016913190484046936, 0.00017561763525009155, 0.00018210336565971375, 0.00018858909606933594]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 8.0, 4.0, 6.0, 17.0, 29.0, 40.0, 81.0, 108.0, 162.0, 305.0, 701.0, 1574.0, 3824.0, 10978.0, 34643.0, 141150.0, 570746.0, 214763.0, 46778.0, 14119.0, 4871.0, 1891.0, 813.0, 402.0, 231.0, 118.0, 82.0, 39.0, 18.0, 22.0, 12.0, 8.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99462890625, -0.9631729125976562, -0.9317169189453125, -0.9002609252929688, -0.868804931640625, -0.8373489379882812, -0.8058929443359375, -0.7744369506835938, -0.74298095703125, -0.7115249633789062, -0.6800689697265625, -0.6486129760742188, -0.617156982421875, -0.5857009887695312, -0.5542449951171875, -0.5227890014648438, -0.4913330078125, -0.45987701416015625, -0.4284210205078125, -0.39696502685546875, -0.365509033203125, -0.33405303955078125, -0.3025970458984375, -0.27114105224609375, -0.23968505859375, -0.20822906494140625, -0.1767730712890625, -0.14531707763671875, -0.113861083984375, -0.08240509033203125, -0.0509490966796875, -0.01949310302734375, 0.011962890625, 0.04341888427734375, 0.0748748779296875, 0.10633087158203125, 0.137786865234375, 0.16924285888671875, 0.2006988525390625, 0.23215484619140625, 0.26361083984375, 0.29506683349609375, 0.3265228271484375, 0.35797882080078125, 0.389434814453125, 0.42089080810546875, 0.4523468017578125, 0.48380279541015625, 0.5152587890625, 0.5467147827148438, 0.5781707763671875, 0.6096267700195312, 0.641082763671875, 0.6725387573242188, 0.7039947509765625, 0.7354507446289062, 0.76690673828125, 0.7983627319335938, 0.8298187255859375, 0.8612747192382812, 0.892730712890625, 0.9241867065429688, 0.9556427001953125, 0.9870986938476562, 1.0185546875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 0.0, 2.0, 4.0, 3.0, 8.0, 5.0, 10.0, 8.0, 9.0, 9.0, 13.0, 20.0, 26.0, 23.0, 45.0, 41.0, 63.0, 70.0, 80.0, 80.0, 82.0, 70.0, 68.0, 45.0, 44.0, 26.0, 32.0, 22.0, 17.0, 21.0, 16.0, 9.0, 9.0, 3.0, 4.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.666015625, -0.6442184448242188, -0.6224212646484375, -0.6006240844726562, -0.578826904296875, -0.5570297241210938, -0.5352325439453125, -0.5134353637695312, -0.49163818359375, -0.46984100341796875, -0.4480438232421875, -0.42624664306640625, -0.404449462890625, -0.38265228271484375, -0.3608551025390625, -0.33905792236328125, -0.3172607421875, -0.29546356201171875, -0.2736663818359375, -0.25186920166015625, -0.230072021484375, -0.20827484130859375, -0.1864776611328125, -0.16468048095703125, -0.14288330078125, -0.12108612060546875, -0.0992889404296875, -0.07749176025390625, -0.055694580078125, -0.03389739990234375, -0.0121002197265625, 0.00969696044921875, 0.031494140625, 0.05329132080078125, 0.0750885009765625, 0.09688568115234375, 0.118682861328125, 0.14048004150390625, 0.1622772216796875, 0.18407440185546875, 0.20587158203125, 0.22766876220703125, 0.2494659423828125, 0.27126312255859375, 0.293060302734375, 0.31485748291015625, 0.3366546630859375, 0.35845184326171875, 0.3802490234375, 0.40204620361328125, 0.4238433837890625, 0.44564056396484375, 0.467437744140625, 0.48923492431640625, 0.5110321044921875, 0.5328292846679688, 0.55462646484375, 0.5764236450195312, 0.5982208251953125, 0.6200180053710938, 0.641815185546875, 0.6636123657226562, 0.6854095458984375, 0.7072067260742188, 0.72900390625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 15.0, 34.0, 99.0, 149.0, 205.0, 183.0, 165.0, 76.0, 41.0, 22.0, 10.0, 5.0, 2.0, 2.0, 1.0, 1.0], "bins": [-40.049278259277344, -39.290897369384766, -38.53251647949219, -37.77413558959961, -37.01575469970703, -36.25736999511719, -35.498992919921875, -34.74060821533203, -33.98222732543945, -33.223846435546875, -32.4654655456543, -31.70708465576172, -30.948701858520508, -30.19032096862793, -29.43194007873535, -28.673559188842773, -27.915178298950195, -27.156797409057617, -26.39841651916504, -25.640033721923828, -24.88165283203125, -24.123271942138672, -23.364891052246094, -22.606510162353516, -21.848129272460938, -21.08974838256836, -20.33136749267578, -19.572986602783203, -18.814603805541992, -18.056222915649414, -17.297842025756836, -16.539461135864258, -15.781079292297363, -15.022698402404785, -14.26431655883789, -13.505935668945312, -12.747554779052734, -11.98917293548584, -11.230792045593262, -10.472410202026367, -9.714029312133789, -8.955648422241211, -8.197266578674316, -7.438885688781738, -6.680504322052002, -5.922122955322266, -5.1637420654296875, -4.405360698699951, -3.646979331970215, -2.8885979652404785, -2.1302168369293213, -1.371835708618164, -0.6134543418884277, 0.1449270248413086, 0.9033079147338867, 1.661689281463623, 2.4200706481933594, 3.1784520149230957, 3.936833143234253, 4.69521427154541, 5.4535956382751465, 6.211977005004883, 6.970357894897461, 7.728739261627197, 8.487120628356934]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 5.0, 6.0, 5.0, 9.0, 13.0, 16.0, 15.0, 20.0, 18.0, 18.0, 34.0, 48.0, 41.0, 31.0, 39.0, 40.0, 50.0, 58.0, 45.0, 23.0, 50.0, 44.0, 33.0, 45.0, 33.0, 41.0, 41.0, 38.0, 24.0, 19.0, 21.0, 14.0, 14.0, 9.0, 10.0, 11.0, 7.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.520538330078125, -7.292177200317383, -7.063816070556641, -6.83545446395874, -6.607093334197998, -6.378732204437256, -6.1503705978393555, -5.922009468078613, -5.693648338317871, -5.465287208557129, -5.236926078796387, -5.008564472198486, -4.780203342437744, -4.551842212677002, -4.323480606079102, -4.095119476318359, -3.866758346557617, -3.638397216796875, -3.4100358486175537, -3.1816744804382324, -2.9533133506774902, -2.724952220916748, -2.4965908527374268, -2.2682294845581055, -2.0398683547973633, -1.8115071058273315, -1.5831458568572998, -1.354784607887268, -1.1264233589172363, -0.8980621099472046, -0.6697008609771729, -0.4413396120071411, -0.21297836303710938, 0.015382885932922363, 0.2437441349029541, 0.47210538387298584, 0.7004666328430176, 0.9288278818130493, 1.157189130783081, 1.3855503797531128, 1.6139116287231445, 1.8422728776931763, 2.070634126663208, 2.2989954948425293, 2.5273566246032715, 2.7557177543640137, 2.984079122543335, 3.2124404907226562, 3.4408016204833984, 3.6691627502441406, 3.897524118423462, 4.125885486602783, 4.354246616363525, 4.582607746124268, 4.810969352722168, 5.03933048248291, 5.267691612243652, 5.4960527420043945, 5.724413871765137, 5.952775478363037, 6.181136608123779, 6.4094977378845215, 6.637859344482422, 6.866220474243164, 7.094581604003906]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 11.0, 6.0, 10.0, 24.0, 52.0, 76.0, 172.0, 366.0, 858.0, 2900.0, 12156.0, 99685.0, 3930266.0, 129171.0, 13966.0, 3004.0, 888.0, 320.0, 148.0, 88.0, 48.0, 26.0, 20.0, 8.0, 6.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3203125, -6.098876953125, -5.87744140625, -5.656005859375, -5.4345703125, -5.213134765625, -4.99169921875, -4.770263671875, -4.548828125, -4.327392578125, -4.10595703125, -3.884521484375, -3.6630859375, -3.441650390625, -3.22021484375, -2.998779296875, -2.77734375, -2.555908203125, -2.33447265625, -2.113037109375, -1.8916015625, -1.670166015625, -1.44873046875, -1.227294921875, -1.005859375, -0.784423828125, -0.56298828125, -0.341552734375, -0.1201171875, 0.101318359375, 0.32275390625, 0.544189453125, 0.765625, 0.987060546875, 1.20849609375, 1.429931640625, 1.6513671875, 1.872802734375, 2.09423828125, 2.315673828125, 2.537109375, 2.758544921875, 2.97998046875, 3.201416015625, 3.4228515625, 3.644287109375, 3.86572265625, 4.087158203125, 4.30859375, 4.530029296875, 4.75146484375, 4.972900390625, 5.1943359375, 5.415771484375, 5.63720703125, 5.858642578125, 6.080078125, 6.301513671875, 6.52294921875, 6.744384765625, 6.9658203125, 7.187255859375, 7.40869140625, 7.630126953125, 7.8515625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 6.0, 7.0, 4.0, 8.0, 19.0, 16.0, 17.0, 26.0, 41.0, 45.0, 56.0, 56.0, 61.0, 78.0, 72.0, 78.0, 60.0, 63.0, 61.0, 55.0, 50.0, 34.0, 17.0, 26.0, 11.0, 9.0, 4.0, 12.0, 2.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.60791015625, -0.5913581848144531, -0.5748062133789062, -0.5582542419433594, -0.5417022705078125, -0.5251502990722656, -0.5085983276367188, -0.4920463562011719, -0.475494384765625, -0.4589424133300781, -0.44239044189453125, -0.4258384704589844, -0.4092864990234375, -0.3927345275878906, -0.37618255615234375, -0.3596305847167969, -0.34307861328125, -0.3265266418457031, -0.30997467041015625, -0.2934226989746094, -0.2768707275390625, -0.2603187561035156, -0.24376678466796875, -0.22721481323242188, -0.210662841796875, -0.19411087036132812, -0.17755889892578125, -0.16100692749023438, -0.1444549560546875, -0.12790298461914062, -0.11135101318359375, -0.09479904174804688, -0.0782470703125, -0.061695098876953125, -0.04514312744140625, -0.028591156005859375, -0.0120391845703125, 0.004512786865234375, 0.02106475830078125, 0.037616729736328125, 0.054168701171875, 0.07072067260742188, 0.08727264404296875, 0.10382461547851562, 0.1203765869140625, 0.13692855834960938, 0.15348052978515625, 0.17003250122070312, 0.18658447265625, 0.20313644409179688, 0.21968841552734375, 0.23624038696289062, 0.2527923583984375, 0.2693443298339844, 0.28589630126953125, 0.3024482727050781, 0.319000244140625, 0.3355522155761719, 0.35210418701171875, 0.3686561584472656, 0.3852081298828125, 0.4017601013183594, 0.41831207275390625, 0.4348640441894531, 0.451416015625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 1.0, 4.0, 9.0, 9.0, 16.0, 23.0, 55.0, 76.0, 100.0, 188.0, 290.0, 495.0, 780.0, 1518.0, 3254.0, 7749.0, 19926.0, 61692.0, 301845.0, 3375942.0, 321164.0, 63879.0, 20497.0, 7840.0, 3347.0, 1637.0, 770.0, 429.0, 260.0, 181.0, 111.0, 79.0, 44.0, 23.0, 16.0, 14.0, 9.0, 7.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.771484375, -2.686248779296875, -2.60101318359375, -2.515777587890625, -2.4305419921875, -2.345306396484375, -2.26007080078125, -2.174835205078125, -2.089599609375, -2.004364013671875, -1.91912841796875, -1.833892822265625, -1.7486572265625, -1.663421630859375, -1.57818603515625, -1.492950439453125, -1.40771484375, -1.322479248046875, -1.23724365234375, -1.152008056640625, -1.0667724609375, -0.981536865234375, -0.89630126953125, -0.811065673828125, -0.725830078125, -0.640594482421875, -0.55535888671875, -0.470123291015625, -0.3848876953125, -0.299652099609375, -0.21441650390625, -0.129180908203125, -0.0439453125, 0.041290283203125, 0.12652587890625, 0.211761474609375, 0.2969970703125, 0.382232666015625, 0.46746826171875, 0.552703857421875, 0.637939453125, 0.723175048828125, 0.80841064453125, 0.893646240234375, 0.9788818359375, 1.064117431640625, 1.14935302734375, 1.234588623046875, 1.31982421875, 1.405059814453125, 1.49029541015625, 1.575531005859375, 1.6607666015625, 1.746002197265625, 1.83123779296875, 1.916473388671875, 2.001708984375, 2.086944580078125, 2.17218017578125, 2.257415771484375, 2.3426513671875, 2.427886962890625, 2.51312255859375, 2.598358154296875, 2.68359375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 9.0, 10.0, 17.0, 22.0, 32.0, 52.0, 79.0, 148.0, 314.0, 1108.0, 1650.0, 295.0, 120.0, 91.0, 45.0, 22.0, 18.0, 10.0, 17.0, 7.0, 5.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.171875, -1.126861572265625, -1.08184814453125, -1.036834716796875, -0.9918212890625, -0.946807861328125, -0.90179443359375, -0.856781005859375, -0.811767578125, -0.766754150390625, -0.72174072265625, -0.676727294921875, -0.6317138671875, -0.586700439453125, -0.54168701171875, -0.496673583984375, -0.45166015625, -0.406646728515625, -0.36163330078125, -0.316619873046875, -0.2716064453125, -0.226593017578125, -0.18157958984375, -0.136566162109375, -0.091552734375, -0.046539306640625, -0.00152587890625, 0.043487548828125, 0.0885009765625, 0.133514404296875, 0.17852783203125, 0.223541259765625, 0.2685546875, 0.313568115234375, 0.35858154296875, 0.403594970703125, 0.4486083984375, 0.493621826171875, 0.53863525390625, 0.583648681640625, 0.628662109375, 0.673675537109375, 0.71868896484375, 0.763702392578125, 0.8087158203125, 0.853729248046875, 0.89874267578125, 0.943756103515625, 0.98876953125, 1.033782958984375, 1.07879638671875, 1.123809814453125, 1.1688232421875, 1.213836669921875, 1.25885009765625, 1.303863525390625, 1.348876953125, 1.393890380859375, 1.43890380859375, 1.483917236328125, 1.5289306640625, 1.573944091796875, 1.61895751953125, 1.663970947265625, 1.708984375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 4.0, 4.0, 5.0, 13.0, 23.0, 51.0, 120.0, 174.0, 226.0, 196.0, 91.0, 53.0, 20.0, 12.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.02601146697998, -9.665599822998047, -9.30518913269043, -8.944777488708496, -8.584366798400879, -8.223955154418945, -7.86354398727417, -7.5031328201293945, -7.142721652984619, -6.782310485839844, -6.421899318695068, -6.061488151550293, -5.701076507568359, -5.340665817260742, -4.980254173278809, -4.619843006134033, -4.259431838989258, -3.8990206718444824, -3.538609504699707, -3.1781980991363525, -2.817786931991577, -2.4573757648468018, -2.0969643592834473, -1.7365531921386719, -1.3761420249938965, -1.015730857849121, -0.6553195714950562, -0.2949082851409912, 0.06550288200378418, 0.42591404914855957, 0.7863254547119141, 1.1467366218566895, 1.5071487426757812, 1.8675599098205566, 2.227971076965332, 2.5883824825286865, 2.948793649673462, 3.3092048168182373, 3.669616222381592, 4.030027389526367, 4.390438556671143, 4.750849723815918, 5.111260890960693, 5.471672058105469, 5.832083702087402, 6.1924943923950195, 6.552906036376953, 6.9133172035217285, 7.273728370666504, 7.634139537811279, 7.994550704956055, 8.354962348937988, 8.715373039245605, 9.075784683227539, 9.436195373535156, 9.79660701751709, 10.157018661499023, 10.517430305480957, 10.877840995788574, 11.238252639770508, 11.598663330078125, 11.959074974060059, 12.319486618041992, 12.67989730834961, 13.040307998657227]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 9.0, 8.0, 7.0, 8.0, 7.0, 15.0, 11.0, 15.0, 18.0, 22.0, 25.0, 28.0, 29.0, 39.0, 31.0, 48.0, 36.0, 35.0, 41.0, 47.0, 46.0, 42.0, 47.0, 42.0, 43.0, 43.0, 24.0, 25.0, 17.0, 29.0, 22.0, 27.0, 23.0, 17.0, 13.0, 6.0, 12.0, 9.0, 14.0, 6.0, 4.0, 5.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.227794885635376, -3.1318273544311523, -3.0358598232269287, -2.939892292022705, -2.8439247608184814, -2.747957229614258, -2.651989459991455, -2.5560219287872314, -2.460054397583008, -2.364086866378784, -2.2681193351745605, -2.172151803970337, -2.0761842727661133, -1.9802166223526, -1.8842490911483765, -1.7882814407348633, -1.6923140287399292, -1.5963464975357056, -1.500378966331482, -1.4044113159179688, -1.3084437847137451, -1.2124762535095215, -1.1165087223052979, -1.0205411911010742, -0.9245736002922058, -0.8286060690879822, -0.7326384782791138, -0.6366709470748901, -0.5407034158706665, -0.4447358250617981, -0.34876829385757446, -0.25280070304870605, -0.15683317184448242, -0.060865618288517, 0.035101935267448425, 0.13106948137283325, 0.22703704237937927, 0.3230046033859253, 0.4189721345901489, 0.5149397253990173, 0.610907256603241, 0.7068747878074646, 0.802842378616333, 0.8988099098205566, 0.9947774410247803, 1.090744972229004, 1.1867125034332275, 1.2826801538467407, 1.3786476850509644, 1.474615216255188, 1.5705827474594116, 1.6665503978729248, 1.7625179290771484, 1.858485460281372, 1.9544529914855957, 2.0504205226898193, 2.146388053894043, 2.2423555850982666, 2.3383231163024902, 2.434290647506714, 2.5302581787109375, 2.6262259483337402, 2.7221932411193848, 2.8181610107421875, 2.914128541946411]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 5.0, 3.0, 2.0, 9.0, 8.0, 13.0, 13.0, 20.0, 22.0, 30.0, 47.0, 43.0, 89.0, 109.0, 146.0, 215.0, 292.0, 476.0, 726.0, 1090.0, 1920.0, 3274.0, 5830.0, 11290.0, 22226.0, 45082.0, 92241.0, 188168.0, 300845.0, 188161.0, 92546.0, 45677.0, 22348.0, 11227.0, 5831.0, 3271.0, 1832.0, 1141.0, 698.0, 482.0, 333.0, 209.0, 176.0, 110.0, 82.0, 54.0, 47.0, 30.0, 18.0, 19.0, 10.0, 12.0, 5.0, 4.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.82421875, -1.7663116455078125, -1.708404541015625, -1.6504974365234375, -1.59259033203125, -1.5346832275390625, -1.476776123046875, -1.4188690185546875, -1.3609619140625, -1.3030548095703125, -1.245147705078125, -1.1872406005859375, -1.12933349609375, -1.0714263916015625, -1.013519287109375, -0.9556121826171875, -0.897705078125, -0.8397979736328125, -0.781890869140625, -0.7239837646484375, -0.66607666015625, -0.6081695556640625, -0.550262451171875, -0.4923553466796875, -0.4344482421875, -0.3765411376953125, -0.318634033203125, -0.2607269287109375, -0.20281982421875, -0.1449127197265625, -0.087005615234375, -0.0290985107421875, 0.02880859375, 0.0867156982421875, 0.144622802734375, 0.2025299072265625, 0.26043701171875, 0.3183441162109375, 0.376251220703125, 0.4341583251953125, 0.4920654296875, 0.5499725341796875, 0.607879638671875, 0.6657867431640625, 0.72369384765625, 0.7816009521484375, 0.839508056640625, 0.8974151611328125, 0.955322265625, 1.0132293701171875, 1.071136474609375, 1.1290435791015625, 1.18695068359375, 1.2448577880859375, 1.302764892578125, 1.3606719970703125, 1.4185791015625, 1.4764862060546875, 1.534393310546875, 1.5923004150390625, 1.65020751953125, 1.7081146240234375, 1.766021728515625, 1.8239288330078125, 1.8818359375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 11.0, 2.0, 9.0, 13.0, 21.0, 22.0, 24.0, 31.0, 47.0, 46.0, 59.0, 62.0, 68.0, 59.0, 54.0, 66.0, 70.0, 58.0, 61.0, 46.0, 31.0, 34.0, 22.0, 25.0, 20.0, 11.0, 6.0, 5.0, 7.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.63427734375, -0.6172523498535156, -0.6002273559570312, -0.5832023620605469, -0.5661773681640625, -0.5491523742675781, -0.5321273803710938, -0.5151023864746094, -0.498077392578125, -0.4810523986816406, -0.46402740478515625, -0.4470024108886719, -0.4299774169921875, -0.4129524230957031, -0.39592742919921875, -0.3789024353027344, -0.36187744140625, -0.3448524475097656, -0.32782745361328125, -0.3108024597167969, -0.2937774658203125, -0.2767524719238281, -0.25972747802734375, -0.24270248413085938, -0.225677490234375, -0.20865249633789062, -0.19162750244140625, -0.17460250854492188, -0.1575775146484375, -0.14055252075195312, -0.12352752685546875, -0.10650253295898438, -0.0894775390625, -0.07245254516601562, -0.05542755126953125, -0.038402557373046875, -0.0213775634765625, -0.004352569580078125, 0.01267242431640625, 0.029697418212890625, 0.046722412109375, 0.06374740600585938, 0.08077239990234375, 0.09779739379882812, 0.1148223876953125, 0.13184738159179688, 0.14887237548828125, 0.16589736938476562, 0.18292236328125, 0.19994735717773438, 0.21697235107421875, 0.23399734497070312, 0.2510223388671875, 0.2680473327636719, 0.28507232666015625, 0.3020973205566406, 0.319122314453125, 0.3361473083496094, 0.35317230224609375, 0.3701972961425781, 0.3872222900390625, 0.4042472839355469, 0.42127227783203125, 0.4382972717285156, 0.455322265625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 11.0, 11.0, 11.0, 20.0, 19.0, 42.0, 42.0, 75.0, 108.0, 150.0, 247.0, 403.0, 606.0, 1106.0, 2001.0, 4078.0, 9055.0, 21076.0, 51187.0, 124818.0, 293059.0, 310063.0, 133358.0, 55032.0, 22878.0, 9643.0, 4334.0, 2139.0, 1084.0, 642.0, 450.0, 253.0, 170.0, 111.0, 79.0, 62.0, 38.0, 34.0, 14.0, 14.0, 11.0, 13.0, 4.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.796875, -1.74249267578125, -1.6881103515625, -1.63372802734375, -1.579345703125, -1.52496337890625, -1.4705810546875, -1.41619873046875, -1.36181640625, -1.30743408203125, -1.2530517578125, -1.19866943359375, -1.144287109375, -1.08990478515625, -1.0355224609375, -0.98114013671875, -0.9267578125, -0.87237548828125, -0.8179931640625, -0.76361083984375, -0.709228515625, -0.65484619140625, -0.6004638671875, -0.54608154296875, -0.49169921875, -0.43731689453125, -0.3829345703125, -0.32855224609375, -0.274169921875, -0.21978759765625, -0.1654052734375, -0.11102294921875, -0.056640625, -0.00225830078125, 0.0521240234375, 0.10650634765625, 0.160888671875, 0.21527099609375, 0.2696533203125, 0.32403564453125, 0.37841796875, 0.43280029296875, 0.4871826171875, 0.54156494140625, 0.595947265625, 0.65032958984375, 0.7047119140625, 0.75909423828125, 0.8134765625, 0.86785888671875, 0.9222412109375, 0.97662353515625, 1.031005859375, 1.08538818359375, 1.1397705078125, 1.19415283203125, 1.24853515625, 1.30291748046875, 1.3572998046875, 1.41168212890625, 1.466064453125, 1.52044677734375, 1.5748291015625, 1.62921142578125, 1.68359375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 1.0, 4.0, 4.0, 13.0, 8.0, 14.0, 14.0, 18.0, 12.0, 34.0, 36.0, 33.0, 31.0, 36.0, 47.0, 44.0, 43.0, 53.0, 50.0, 62.0, 42.0, 42.0, 37.0, 50.0, 43.0, 27.0, 31.0, 31.0, 27.0, 11.0, 23.0, 15.0, 16.0, 17.0, 9.0, 6.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8349609375, -1.7741241455078125, -1.713287353515625, -1.6524505615234375, -1.59161376953125, -1.5307769775390625, -1.469940185546875, -1.4091033935546875, -1.3482666015625, -1.2874298095703125, -1.226593017578125, -1.1657562255859375, -1.10491943359375, -1.0440826416015625, -0.983245849609375, -0.9224090576171875, -0.861572265625, -0.8007354736328125, -0.739898681640625, -0.6790618896484375, -0.61822509765625, -0.5573883056640625, -0.496551513671875, -0.4357147216796875, -0.3748779296875, -0.3140411376953125, -0.253204345703125, -0.1923675537109375, -0.13153076171875, -0.0706939697265625, -0.009857177734375, 0.0509796142578125, 0.11181640625, 0.1726531982421875, 0.233489990234375, 0.2943267822265625, 0.35516357421875, 0.4160003662109375, 0.476837158203125, 0.5376739501953125, 0.5985107421875, 0.6593475341796875, 0.720184326171875, 0.7810211181640625, 0.84185791015625, 0.9026947021484375, 0.963531494140625, 1.0243682861328125, 1.085205078125, 1.1460418701171875, 1.206878662109375, 1.2677154541015625, 1.32855224609375, 1.3893890380859375, 1.450225830078125, 1.5110626220703125, 1.5718994140625, 1.6327362060546875, 1.693572998046875, 1.7544097900390625, 1.81524658203125, 1.8760833740234375, 1.936920166015625, 1.9977569580078125, 2.05859375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 8.0, 3.0, 8.0, 15.0, 24.0, 24.0, 44.0, 99.0, 136.0, 242.0, 451.0, 891.0, 2075.0, 4965.0, 14126.0, 52277.0, 307486.0, 555447.0, 79226.0, 19711.0, 6461.0, 2480.0, 1106.0, 522.0, 284.0, 165.0, 103.0, 60.0, 36.0, 23.0, 22.0, 9.0, 4.0, 5.0, 6.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.81640625, -1.756134033203125, -1.69586181640625, -1.635589599609375, -1.5753173828125, -1.515045166015625, -1.45477294921875, -1.394500732421875, -1.334228515625, -1.273956298828125, -1.21368408203125, -1.153411865234375, -1.0931396484375, -1.032867431640625, -0.97259521484375, -0.912322998046875, -0.85205078125, -0.791778564453125, -0.73150634765625, -0.671234130859375, -0.6109619140625, -0.550689697265625, -0.49041748046875, -0.430145263671875, -0.369873046875, -0.309600830078125, -0.24932861328125, -0.189056396484375, -0.1287841796875, -0.068511962890625, -0.00823974609375, 0.052032470703125, 0.1123046875, 0.172576904296875, 0.23284912109375, 0.293121337890625, 0.3533935546875, 0.413665771484375, 0.47393798828125, 0.534210205078125, 0.594482421875, 0.654754638671875, 0.71502685546875, 0.775299072265625, 0.8355712890625, 0.895843505859375, 0.95611572265625, 1.016387939453125, 1.07666015625, 1.136932373046875, 1.19720458984375, 1.257476806640625, 1.3177490234375, 1.378021240234375, 1.43829345703125, 1.498565673828125, 1.558837890625, 1.619110107421875, 1.67938232421875, 1.739654541015625, 1.7999267578125, 1.860198974609375, 1.92047119140625, 1.980743408203125, 2.041015625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 8.0, 6.0, 14.0, 13.0, 29.0, 34.0, 38.0, 40.0, 72.0, 114.0, 170.0, 153.0, 98.0, 64.0, 48.0, 36.0, 24.0, 19.0, 17.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00030159950256347656, -0.0002921484410762787, -0.0002826973795890808, -0.00027324631810188293, -0.00026379525661468506, -0.0002543441951274872, -0.0002448931336402893, -0.00023544207215309143, -0.00022599101066589355, -0.00021653994917869568, -0.0002070888876914978, -0.00019763782620429993, -0.00018818676471710205, -0.00017873570322990417, -0.0001692846417427063, -0.00015983358025550842, -0.00015038251876831055, -0.00014093145728111267, -0.0001314803957939148, -0.00012202933430671692, -0.00011257827281951904, -0.00010312721133232117, -9.367614984512329e-05, -8.422508835792542e-05, -7.477402687072754e-05, -6.532296538352966e-05, -5.587190389633179e-05, -4.642084240913391e-05, -3.6969780921936035e-05, -2.751871943473816e-05, -1.8067657947540283e-05, -8.616596460342407e-06, 8.344650268554688e-07, 1.0285526514053345e-05, 1.973658800125122e-05, 2.9187649488449097e-05, 3.863871097564697e-05, 4.808977246284485e-05, 5.7540833950042725e-05, 6.69918954372406e-05, 7.644295692443848e-05, 8.589401841163635e-05, 9.534507989883423e-05, 0.0001047961413860321, 0.00011424720287322998, 0.00012369826436042786, 0.00013314932584762573, 0.0001426003873348236, 0.00015205144882202148, 0.00016150251030921936, 0.00017095357179641724, 0.0001804046332836151, 0.000189855694770813, 0.00019930675625801086, 0.00020875781774520874, 0.00021820887923240662, 0.0002276599407196045, 0.00023711100220680237, 0.00024656206369400024, 0.0002560131251811981, 0.000265464186668396, 0.00027491524815559387, 0.00028436630964279175, 0.0002938173711299896, 0.0003032684326171875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 7.0, 10.0, 13.0, 26.0, 43.0, 67.0, 122.0, 233.0, 460.0, 1047.0, 3189.0, 12579.0, 77701.0, 737772.0, 183402.0, 23905.0, 5156.0, 1576.0, 626.0, 261.0, 121.0, 96.0, 51.0, 23.0, 17.0, 17.0, 9.0, 4.0, 8.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.97265625, -2.886962890625, -2.80126953125, -2.715576171875, -2.6298828125, -2.544189453125, -2.45849609375, -2.372802734375, -2.287109375, -2.201416015625, -2.11572265625, -2.030029296875, -1.9443359375, -1.858642578125, -1.77294921875, -1.687255859375, -1.6015625, -1.515869140625, -1.43017578125, -1.344482421875, -1.2587890625, -1.173095703125, -1.08740234375, -1.001708984375, -0.916015625, -0.830322265625, -0.74462890625, -0.658935546875, -0.5732421875, -0.487548828125, -0.40185546875, -0.316162109375, -0.23046875, -0.144775390625, -0.05908203125, 0.026611328125, 0.1123046875, 0.197998046875, 0.28369140625, 0.369384765625, 0.455078125, 0.540771484375, 0.62646484375, 0.712158203125, 0.7978515625, 0.883544921875, 0.96923828125, 1.054931640625, 1.140625, 1.226318359375, 1.31201171875, 1.397705078125, 1.4833984375, 1.569091796875, 1.65478515625, 1.740478515625, 1.826171875, 1.911865234375, 1.99755859375, 2.083251953125, 2.1689453125, 2.254638671875, 2.34033203125, 2.426025390625, 2.51171875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 6.0, 18.0, 12.0, 18.0, 18.0, 32.0, 65.0, 97.0, 156.0, 229.0, 102.0, 82.0, 44.0, 41.0, 18.0, 17.0, 9.0, 9.0, 6.0, 10.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3359375, -2.261383056640625, -2.18682861328125, -2.112274169921875, -2.0377197265625, -1.963165283203125, -1.88861083984375, -1.814056396484375, -1.739501953125, -1.664947509765625, -1.59039306640625, -1.515838623046875, -1.4412841796875, -1.366729736328125, -1.29217529296875, -1.217620849609375, -1.14306640625, -1.068511962890625, -0.99395751953125, -0.919403076171875, -0.8448486328125, -0.770294189453125, -0.69573974609375, -0.621185302734375, -0.546630859375, -0.472076416015625, -0.39752197265625, -0.322967529296875, -0.2484130859375, -0.173858642578125, -0.09930419921875, -0.024749755859375, 0.0498046875, 0.124359130859375, 0.19891357421875, 0.273468017578125, 0.3480224609375, 0.422576904296875, 0.49713134765625, 0.571685791015625, 0.646240234375, 0.720794677734375, 0.79534912109375, 0.869903564453125, 0.9444580078125, 1.019012451171875, 1.09356689453125, 1.168121337890625, 1.24267578125, 1.317230224609375, 1.39178466796875, 1.466339111328125, 1.5408935546875, 1.615447998046875, 1.69000244140625, 1.764556884765625, 1.839111328125, 1.913665771484375, 1.98822021484375, 2.062774658203125, 2.1373291015625, 2.211883544921875, 2.28643798828125, 2.360992431640625, 2.435546875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 13.0, 6.0, 24.0, 20.0, 47.0, 62.0, 74.0, 103.0, 109.0, 112.0, 87.0, 97.0, 67.0, 55.0, 46.0, 26.0, 16.0, 13.0, 7.0, 6.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-26.143619537353516, -25.552173614501953, -24.96072769165039, -24.369281768798828, -23.777835845947266, -23.186389923095703, -22.59494400024414, -22.003498077392578, -21.412052154541016, -20.820606231689453, -20.22916030883789, -19.637714385986328, -19.046268463134766, -18.454822540283203, -17.86337661743164, -17.271930694580078, -16.680484771728516, -16.089038848876953, -15.49759292602539, -14.906147003173828, -14.314701080322266, -13.723255157470703, -13.13180923461914, -12.540363311767578, -11.948917388916016, -11.357471466064453, -10.76602554321289, -10.174579620361328, -9.583133697509766, -8.991687774658203, -8.40024185180664, -7.808795928955078, -7.217350006103516, -6.625904083251953, -6.034458160400391, -5.443012237548828, -4.851566314697266, -4.260120391845703, -3.6686744689941406, -3.077228546142578, -2.4857826232910156, -1.8943367004394531, -1.3028907775878906, -0.7114448547363281, -0.11999893188476562, 0.4714469909667969, 1.0628929138183594, 1.6543388366699219, 2.2457847595214844, 2.837230682373047, 3.4286766052246094, 4.020122528076172, 4.611568450927734, 5.203014373779297, 5.794460296630859, 6.385906219482422, 6.977352142333984, 7.568798065185547, 8.16024398803711, 8.751689910888672, 9.343135833740234, 9.934581756591797, 10.52602767944336, 11.117473602294922, 11.708919525146484]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 7.0, 8.0, 9.0, 13.0, 12.0, 15.0, 19.0, 24.0, 25.0, 26.0, 28.0, 30.0, 27.0, 34.0, 33.0, 38.0, 42.0, 63.0, 44.0, 48.0, 42.0, 35.0, 35.0, 37.0, 35.0, 36.0, 33.0, 40.0, 34.0, 21.0, 23.0, 15.0, 16.0, 13.0, 11.0, 3.0, 6.0, 12.0, 5.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.034894943237305, -10.70212173461914, -10.369349479675293, -10.036576271057129, -9.703804016113281, -9.371030807495117, -9.038257598876953, -8.705484390258789, -8.372712135314941, -8.039938926696777, -7.70716667175293, -7.374393463134766, -7.04162073135376, -6.708847999572754, -6.37607479095459, -6.043302059173584, -5.710529327392578, -5.377756595611572, -5.044983863830566, -4.712210655212402, -4.3794379234313965, -4.046665191650391, -3.7138922214508057, -3.3811192512512207, -3.048346519470215, -2.715573787689209, -2.382800817489624, -2.050027847290039, -1.7172551155090332, -1.3844822645187378, -1.0517094135284424, -0.7189364433288574, -0.38616275787353516, -0.053389906883239746, 0.27938294410705566, 0.6121557950973511, 0.9449286460876465, 1.277701497077942, 1.6104743480682373, 1.9432473182678223, 2.276020050048828, 2.608792781829834, 2.941565752029419, 3.274338722229004, 3.6071114540100098, 3.9398841857910156, 4.27265739440918, 4.6054301261901855, 4.938202857971191, 5.270975589752197, 5.603748321533203, 5.936521530151367, 6.269294261932373, 6.602066993713379, 6.934840202331543, 7.267612934112549, 7.600385665893555, 7.9331583976745605, 8.265931129455566, 8.59870433807373, 8.931476593017578, 9.264249801635742, 9.597023010253906, 9.92979621887207, 10.262568473815918]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 6.0, 7.0, 6.0, 10.0, 14.0, 9.0, 25.0, 29.0, 43.0, 66.0, 104.0, 147.0, 246.0, 461.0, 738.0, 1326.0, 2726.0, 5492.0, 12816.0, 35309.0, 146460.0, 3331152.0, 545262.0, 73342.0, 21973.0, 8444.0, 3854.0, 1873.0, 974.0, 529.0, 307.0, 178.0, 111.0, 74.0, 54.0, 30.0, 20.0, 13.0, 11.0, 14.0, 7.0, 7.0, 7.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.783203125, -2.683013916015625, -2.58282470703125, -2.482635498046875, -2.3824462890625, -2.282257080078125, -2.18206787109375, -2.081878662109375, -1.981689453125, -1.881500244140625, -1.78131103515625, -1.681121826171875, -1.5809326171875, -1.480743408203125, -1.38055419921875, -1.280364990234375, -1.18017578125, -1.079986572265625, -0.97979736328125, -0.879608154296875, -0.7794189453125, -0.679229736328125, -0.57904052734375, -0.478851318359375, -0.378662109375, -0.278472900390625, -0.17828369140625, -0.078094482421875, 0.0220947265625, 0.122283935546875, 0.22247314453125, 0.322662353515625, 0.4228515625, 0.523040771484375, 0.62322998046875, 0.723419189453125, 0.8236083984375, 0.923797607421875, 1.02398681640625, 1.124176025390625, 1.224365234375, 1.324554443359375, 1.42474365234375, 1.524932861328125, 1.6251220703125, 1.725311279296875, 1.82550048828125, 1.925689697265625, 2.02587890625, 2.126068115234375, 2.22625732421875, 2.326446533203125, 2.4266357421875, 2.526824951171875, 2.62701416015625, 2.727203369140625, 2.827392578125, 2.927581787109375, 3.02777099609375, 3.127960205078125, 3.2281494140625, 3.328338623046875, 3.42852783203125, 3.528717041015625, 3.62890625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 11.0, 5.0, 13.0, 19.0, 14.0, 25.0, 31.0, 23.0, 35.0, 38.0, 47.0, 44.0, 69.0, 51.0, 59.0, 56.0, 81.0, 56.0, 57.0, 49.0, 45.0, 37.0, 28.0, 27.0, 32.0, 14.0, 6.0, 5.0, 7.0, 4.0, 4.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65966796875, -0.6422653198242188, -0.6248626708984375, -0.6074600219726562, -0.590057373046875, -0.5726547241210938, -0.5552520751953125, -0.5378494262695312, -0.52044677734375, -0.5030441284179688, -0.4856414794921875, -0.46823883056640625, -0.450836181640625, -0.43343353271484375, -0.4160308837890625, -0.39862823486328125, -0.3812255859375, -0.36382293701171875, -0.3464202880859375, -0.32901763916015625, -0.311614990234375, -0.29421234130859375, -0.2768096923828125, -0.25940704345703125, -0.24200439453125, -0.22460174560546875, -0.2071990966796875, -0.18979644775390625, -0.172393798828125, -0.15499114990234375, -0.1375885009765625, -0.12018585205078125, -0.102783203125, -0.08538055419921875, -0.0679779052734375, -0.05057525634765625, -0.033172607421875, -0.01576995849609375, 0.0016326904296875, 0.01903533935546875, 0.03643798828125, 0.05384063720703125, 0.0712432861328125, 0.08864593505859375, 0.106048583984375, 0.12345123291015625, 0.1408538818359375, 0.15825653076171875, 0.1756591796875, 0.19306182861328125, 0.2104644775390625, 0.22786712646484375, 0.245269775390625, 0.26267242431640625, 0.2800750732421875, 0.29747772216796875, 0.31488037109375, 0.33228302001953125, 0.3496856689453125, 0.36708831787109375, 0.384490966796875, 0.40189361572265625, 0.4192962646484375, 0.43669891357421875, 0.4541015625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 6.0, 4.0, 4.0, 6.0, 14.0, 17.0, 26.0, 46.0, 65.0, 115.0, 147.0, 249.0, 422.0, 699.0, 1320.0, 2384.0, 4364.0, 9138.0, 20351.0, 50988.0, 160383.0, 1266590.0, 2383202.0, 192581.0, 57768.0, 22712.0, 10082.0, 4766.0, 2497.0, 1379.0, 759.0, 462.0, 250.0, 178.0, 101.0, 72.0, 38.0, 33.0, 19.0, 8.0, 12.0, 8.0, 5.0, 5.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.341796875, -2.2750091552734375, -2.208221435546875, -2.1414337158203125, -2.07464599609375, -2.0078582763671875, -1.941070556640625, -1.8742828369140625, -1.8074951171875, -1.7407073974609375, -1.673919677734375, -1.6071319580078125, -1.54034423828125, -1.4735565185546875, -1.406768798828125, -1.3399810791015625, -1.273193359375, -1.2064056396484375, -1.139617919921875, -1.0728302001953125, -1.00604248046875, -0.9392547607421875, -0.872467041015625, -0.8056793212890625, -0.7388916015625, -0.6721038818359375, -0.605316162109375, -0.5385284423828125, -0.47174072265625, -0.4049530029296875, -0.338165283203125, -0.2713775634765625, -0.20458984375, -0.1378021240234375, -0.071014404296875, -0.0042266845703125, 0.06256103515625, 0.1293487548828125, 0.196136474609375, 0.2629241943359375, 0.3297119140625, 0.3964996337890625, 0.463287353515625, 0.5300750732421875, 0.59686279296875, 0.6636505126953125, 0.730438232421875, 0.7972259521484375, 0.864013671875, 0.9308013916015625, 0.997589111328125, 1.0643768310546875, 1.13116455078125, 1.1979522705078125, 1.264739990234375, 1.3315277099609375, 1.3983154296875, 1.4651031494140625, 1.531890869140625, 1.5986785888671875, 1.66546630859375, 1.7322540283203125, 1.799041748046875, 1.8658294677734375, 1.9326171875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 9.0, 9.0, 10.0, 17.0, 17.0, 19.0, 31.0, 63.0, 69.0, 139.0, 230.0, 595.0, 1724.0, 524.0, 239.0, 133.0, 80.0, 54.0, 32.0, 28.0, 18.0, 8.0, 9.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3056640625, -1.258087158203125, -1.21051025390625, -1.162933349609375, -1.1153564453125, -1.067779541015625, -1.02020263671875, -0.972625732421875, -0.925048828125, -0.877471923828125, -0.82989501953125, -0.782318115234375, -0.7347412109375, -0.687164306640625, -0.63958740234375, -0.592010498046875, -0.54443359375, -0.496856689453125, -0.44927978515625, -0.401702880859375, -0.3541259765625, -0.306549072265625, -0.25897216796875, -0.211395263671875, -0.163818359375, -0.116241455078125, -0.06866455078125, -0.021087646484375, 0.0264892578125, 0.074066162109375, 0.12164306640625, 0.169219970703125, 0.216796875, 0.264373779296875, 0.31195068359375, 0.359527587890625, 0.4071044921875, 0.454681396484375, 0.50225830078125, 0.549835205078125, 0.597412109375, 0.644989013671875, 0.69256591796875, 0.740142822265625, 0.7877197265625, 0.835296630859375, 0.88287353515625, 0.930450439453125, 0.97802734375, 1.025604248046875, 1.07318115234375, 1.120758056640625, 1.1683349609375, 1.215911865234375, 1.26348876953125, 1.311065673828125, 1.358642578125, 1.406219482421875, 1.45379638671875, 1.501373291015625, 1.5489501953125, 1.596527099609375, 1.64410400390625, 1.691680908203125, 1.7392578125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 6.0, 23.0, 72.0, 246.0, 323.0, 223.0, 79.0, 24.0, 10.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.864779472351074, -5.06349515914917, -4.262210369110107, -3.460926055908203, -2.6596415042877197, -1.8583569526672363, -1.057072639465332, -0.25578784942626953, 0.5454964637756348, 1.3467810153961182, 2.1480655670166016, 2.949349880218506, 3.7506344318389893, 4.551918983459473, 5.353203296661377, 6.1544880867004395, 6.955772399902344, 7.757056713104248, 8.558341026306152, 9.359625816345215, 10.160910606384277, 10.962194442749023, 11.763479232788086, 12.564764022827148, 13.366048812866211, 14.167333602905273, 14.96861743927002, 15.769902229309082, 16.571186065673828, 17.37247085571289, 18.173755645751953, 18.975040435791016, 19.776323318481445, 20.577608108520508, 21.37889289855957, 22.18017578125, 22.981460571289062, 23.782745361328125, 24.584030151367188, 25.38531494140625, 26.186599731445312, 26.987884521484375, 27.789169311523438, 28.5904541015625, 29.39173698425293, 30.193021774291992, 30.994306564331055, 31.795591354370117, 32.59687423706055, 33.39815902709961, 34.19944381713867, 35.000728607177734, 35.8020133972168, 36.60329818725586, 37.404579162597656, 38.20586395263672, 39.00715255737305, 39.80843734741211, 40.60972213745117, 41.411006927490234, 42.2122917175293, 43.01357650756836, 43.814857482910156, 44.61614227294922, 45.41742706298828]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 4.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 7.0, 6.0, 12.0, 12.0, 17.0, 12.0, 11.0, 14.0, 18.0, 18.0, 19.0, 27.0, 31.0, 28.0, 33.0, 27.0, 30.0, 34.0, 28.0, 41.0, 49.0, 49.0, 22.0, 39.0, 46.0, 25.0, 31.0, 27.0, 23.0, 33.0, 29.0, 27.0, 19.0, 15.0, 19.0, 10.0, 14.0, 15.0, 15.0, 13.0, 10.0, 9.0, 5.0, 8.0, 8.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.676394462585449, -3.5574376583099365, -3.4384806156158447, -3.319523811340332, -3.2005670070648193, -3.0816102027893066, -2.962653160095215, -2.843696355819702, -2.7247395515441895, -2.6057827472686768, -2.486825704574585, -2.3678689002990723, -2.2489120960235596, -2.129955291748047, -2.010998249053955, -1.8920414447784424, -1.7730844020843506, -1.6541274785995483, -1.5351706743240356, -1.4162137508392334, -1.2972569465637207, -1.1783000230789185, -1.0593430995941162, -0.9403862357139587, -0.8214293718338013, -0.7024725079536438, -0.5835156440734863, -0.4645587205886841, -0.3456018567085266, -0.22664499282836914, -0.1076880693435669, 0.011268794536590576, 0.13022565841674805, 0.2491825371980667, 0.3681394159793854, 0.48709630966186523, 0.6060531735420227, 0.7250100374221802, 0.8439669609069824, 0.9629238247871399, 1.0818806886672974, 1.2008376121520996, 1.3197944164276123, 1.4387513399124146, 1.5577082633972168, 1.6766650676727295, 1.7956219911575317, 1.914578914642334, 2.0335357189178467, 2.1524925231933594, 2.271449565887451, 2.390406370162964, 2.5093631744384766, 2.6283202171325684, 2.747277021408081, 2.8662338256835938, 2.9851908683776855, 3.1041476726531982, 3.22310471534729, 3.3420615196228027, 3.4610183238983154, 3.579975128173828, 3.69893217086792, 3.8178889751434326, 3.9368457794189453]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 7.0, 8.0, 8.0, 18.0, 17.0, 28.0, 37.0, 87.0, 118.0, 170.0, 300.0, 484.0, 830.0, 1477.0, 2739.0, 5395.0, 11117.0, 24479.0, 55576.0, 121637.0, 224591.0, 263886.0, 176835.0, 86428.0, 38324.0, 17140.0, 8023.0, 4028.0, 1994.0, 1092.0, 622.0, 360.0, 252.0, 139.0, 94.0, 63.0, 48.0, 23.0, 25.0, 14.0, 10.0, 6.0, 8.0, 7.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8896484375, -1.8311004638671875, -1.772552490234375, -1.7140045166015625, -1.65545654296875, -1.5969085693359375, -1.538360595703125, -1.4798126220703125, -1.4212646484375, -1.3627166748046875, -1.304168701171875, -1.2456207275390625, -1.18707275390625, -1.1285247802734375, -1.069976806640625, -1.0114288330078125, -0.952880859375, -0.8943328857421875, -0.835784912109375, -0.7772369384765625, -0.71868896484375, -0.6601409912109375, -0.601593017578125, -0.5430450439453125, -0.4844970703125, -0.4259490966796875, -0.367401123046875, -0.3088531494140625, -0.25030517578125, -0.1917572021484375, -0.133209228515625, -0.0746612548828125, -0.01611328125, 0.0424346923828125, 0.100982666015625, 0.1595306396484375, 0.21807861328125, 0.2766265869140625, 0.335174560546875, 0.3937225341796875, 0.4522705078125, 0.5108184814453125, 0.569366455078125, 0.6279144287109375, 0.68646240234375, 0.7450103759765625, 0.803558349609375, 0.8621063232421875, 0.920654296875, 0.9792022705078125, 1.037750244140625, 1.0962982177734375, 1.15484619140625, 1.2133941650390625, 1.271942138671875, 1.3304901123046875, 1.3890380859375, 1.4475860595703125, 1.506134033203125, 1.5646820068359375, 1.62322998046875, 1.6817779541015625, 1.740325927734375, 1.7988739013671875, 1.857421875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 6.0, 4.0, 7.0, 12.0, 18.0, 10.0, 25.0, 21.0, 32.0, 38.0, 48.0, 42.0, 54.0, 40.0, 55.0, 66.0, 66.0, 67.0, 59.0, 43.0, 46.0, 46.0, 54.0, 29.0, 30.0, 26.0, 14.0, 15.0, 6.0, 12.0, 8.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.716796875, -0.6980705261230469, -0.6793441772460938, -0.6606178283691406, -0.6418914794921875, -0.6231651306152344, -0.6044387817382812, -0.5857124328613281, -0.566986083984375, -0.5482597351074219, -0.5295333862304688, -0.5108070373535156, -0.4920806884765625, -0.4733543395996094, -0.45462799072265625, -0.4359016418457031, -0.41717529296875, -0.3984489440917969, -0.37972259521484375, -0.3609962463378906, -0.3422698974609375, -0.3235435485839844, -0.30481719970703125, -0.2860908508300781, -0.267364501953125, -0.24863815307617188, -0.22991180419921875, -0.21118545532226562, -0.1924591064453125, -0.17373275756835938, -0.15500640869140625, -0.13628005981445312, -0.1175537109375, -0.09882736206054688, -0.08010101318359375, -0.061374664306640625, -0.0426483154296875, -0.023921966552734375, -0.00519561767578125, 0.013530731201171875, 0.032257080078125, 0.050983428955078125, 0.06970977783203125, 0.08843612670898438, 0.1071624755859375, 0.12588882446289062, 0.14461517333984375, 0.16334152221679688, 0.18206787109375, 0.20079421997070312, 0.21952056884765625, 0.23824691772460938, 0.2569732666015625, 0.2756996154785156, 0.29442596435546875, 0.3131523132324219, 0.331878662109375, 0.3506050109863281, 0.36933135986328125, 0.3880577087402344, 0.4067840576171875, 0.4255104064941406, 0.44423675537109375, 0.4629631042480469, 0.481689453125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 2.0, 10.0, 8.0, 14.0, 21.0, 26.0, 33.0, 51.0, 85.0, 108.0, 165.0, 248.0, 382.0, 671.0, 1208.0, 2385.0, 4634.0, 10688.0, 25039.0, 61169.0, 141743.0, 263465.0, 272060.0, 149739.0, 65706.0, 26865.0, 11480.0, 4992.0, 2395.0, 1258.0, 687.0, 407.0, 244.0, 190.0, 118.0, 78.0, 51.0, 36.0, 30.0, 21.0, 22.0, 6.0, 3.0, 5.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.80078125, -1.7478790283203125, -1.694976806640625, -1.6420745849609375, -1.58917236328125, -1.5362701416015625, -1.483367919921875, -1.4304656982421875, -1.3775634765625, -1.3246612548828125, -1.271759033203125, -1.2188568115234375, -1.16595458984375, -1.1130523681640625, -1.060150146484375, -1.0072479248046875, -0.954345703125, -0.9014434814453125, -0.848541259765625, -0.7956390380859375, -0.74273681640625, -0.6898345947265625, -0.636932373046875, -0.5840301513671875, -0.5311279296875, -0.4782257080078125, -0.425323486328125, -0.3724212646484375, -0.31951904296875, -0.2666168212890625, -0.213714599609375, -0.1608123779296875, -0.10791015625, -0.0550079345703125, -0.002105712890625, 0.0507965087890625, 0.10369873046875, 0.1566009521484375, 0.209503173828125, 0.2624053955078125, 0.3153076171875, 0.3682098388671875, 0.421112060546875, 0.4740142822265625, 0.52691650390625, 0.5798187255859375, 0.632720947265625, 0.6856231689453125, 0.738525390625, 0.7914276123046875, 0.844329833984375, 0.8972320556640625, 0.95013427734375, 1.0030364990234375, 1.055938720703125, 1.1088409423828125, 1.1617431640625, 1.2146453857421875, 1.267547607421875, 1.3204498291015625, 1.37335205078125, 1.4262542724609375, 1.479156494140625, 1.5320587158203125, 1.5849609375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 0.0, 3.0, 7.0, 3.0, 3.0, 9.0, 9.0, 8.0, 23.0, 23.0, 15.0, 30.0, 29.0, 36.0, 41.0, 47.0, 45.0, 42.0, 40.0, 45.0, 50.0, 64.0, 40.0, 48.0, 44.0, 33.0, 36.0, 42.0, 25.0, 25.0, 27.0, 31.0, 12.0, 8.0, 9.0, 8.0, 12.0, 10.0, 7.0, 9.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.732421875, -2.65924072265625, -2.5860595703125, -2.51287841796875, -2.439697265625, -2.36651611328125, -2.2933349609375, -2.22015380859375, -2.14697265625, -2.07379150390625, -2.0006103515625, -1.92742919921875, -1.854248046875, -1.78106689453125, -1.7078857421875, -1.63470458984375, -1.5615234375, -1.48834228515625, -1.4151611328125, -1.34197998046875, -1.268798828125, -1.19561767578125, -1.1224365234375, -1.04925537109375, -0.97607421875, -0.90289306640625, -0.8297119140625, -0.75653076171875, -0.683349609375, -0.61016845703125, -0.5369873046875, -0.46380615234375, -0.390625, -0.31744384765625, -0.2442626953125, -0.17108154296875, -0.097900390625, -0.02471923828125, 0.0484619140625, 0.12164306640625, 0.19482421875, 0.26800537109375, 0.3411865234375, 0.41436767578125, 0.487548828125, 0.56072998046875, 0.6339111328125, 0.70709228515625, 0.7802734375, 0.85345458984375, 0.9266357421875, 0.99981689453125, 1.072998046875, 1.14617919921875, 1.2193603515625, 1.29254150390625, 1.36572265625, 1.43890380859375, 1.5120849609375, 1.58526611328125, 1.658447265625, 1.73162841796875, 1.8048095703125, 1.87799072265625, 1.951171875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 8.0, 4.0, 3.0, 11.0, 19.0, 24.0, 34.0, 28.0, 56.0, 96.0, 146.0, 231.0, 402.0, 788.0, 1383.0, 3050.0, 6800.0, 17478.0, 52700.0, 166783.0, 393050.0, 267486.0, 90144.0, 28926.0, 10290.0, 4237.0, 2032.0, 1038.0, 528.0, 291.0, 163.0, 105.0, 86.0, 44.0, 18.0, 32.0, 19.0, 9.0, 5.0, 3.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81640625, -0.780487060546875, -0.74456787109375, -0.708648681640625, -0.6727294921875, -0.636810302734375, -0.60089111328125, -0.564971923828125, -0.529052734375, -0.493133544921875, -0.45721435546875, -0.421295166015625, -0.3853759765625, -0.349456787109375, -0.31353759765625, -0.277618408203125, -0.24169921875, -0.205780029296875, -0.16986083984375, -0.133941650390625, -0.0980224609375, -0.062103271484375, -0.02618408203125, 0.009735107421875, 0.045654296875, 0.081573486328125, 0.11749267578125, 0.153411865234375, 0.1893310546875, 0.225250244140625, 0.26116943359375, 0.297088623046875, 0.3330078125, 0.368927001953125, 0.40484619140625, 0.440765380859375, 0.4766845703125, 0.512603759765625, 0.54852294921875, 0.584442138671875, 0.620361328125, 0.656280517578125, 0.69219970703125, 0.728118896484375, 0.7640380859375, 0.799957275390625, 0.83587646484375, 0.871795654296875, 0.90771484375, 0.943634033203125, 0.97955322265625, 1.015472412109375, 1.0513916015625, 1.087310791015625, 1.12322998046875, 1.159149169921875, 1.195068359375, 1.230987548828125, 1.26690673828125, 1.302825927734375, 1.3387451171875, 1.374664306640625, 1.41058349609375, 1.446502685546875, 1.482421875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 7.0, 4.0, 4.0, 6.0, 4.0, 11.0, 3.0, 16.0, 18.0, 23.0, 24.0, 35.0, 43.0, 61.0, 64.0, 72.0, 72.0, 76.0, 65.0, 67.0, 67.0, 56.0, 39.0, 34.0, 32.0, 27.0, 16.0, 19.0, 9.0, 11.0, 4.0, 4.0, 0.0, 5.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018477439880371094, -0.00017854012548923492, -0.0001723058521747589, -0.0001660715788602829, -0.00015983730554580688, -0.00015360303223133087, -0.00014736875891685486, -0.00014113448560237885, -0.00013490021228790283, -0.00012866593897342682, -0.0001224316656589508, -0.00011619739234447479, -0.00010996311902999878, -0.00010372884571552277, -9.749457240104675e-05, -9.126029908657074e-05, -8.502602577209473e-05, -7.879175245761871e-05, -7.25574791431427e-05, -6.632320582866669e-05, -6.0088932514190674e-05, -5.385465919971466e-05, -4.762038588523865e-05, -4.1386112570762634e-05, -3.515183925628662e-05, -2.8917565941810608e-05, -2.2683292627334595e-05, -1.644901931285858e-05, -1.0214745998382568e-05, -3.980472683906555e-06, 2.253800630569458e-06, 8.488073945045471e-06, 1.4722347259521484e-05, 2.0956620573997498e-05, 2.719089388847351e-05, 3.3425167202949524e-05, 3.965944051742554e-05, 4.589371383190155e-05, 5.2127987146377563e-05, 5.836226046085358e-05, 6.459653377532959e-05, 7.08308070898056e-05, 7.706508040428162e-05, 8.329935371875763e-05, 8.953362703323364e-05, 9.576790034770966e-05, 0.00010200217366218567, 0.00010823644697666168, 0.0001144707202911377, 0.00012070499360561371, 0.00012693926692008972, 0.00013317354023456573, 0.00013940781354904175, 0.00014564208686351776, 0.00015187636017799377, 0.0001581106334924698, 0.0001643449068069458, 0.00017057918012142181, 0.00017681345343589783, 0.00018304772675037384, 0.00018928200006484985, 0.00019551627337932587, 0.00020175054669380188, 0.0002079848200082779, 0.0002142190933227539]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 7.0, 6.0, 14.0, 18.0, 26.0, 45.0, 111.0, 205.0, 473.0, 1256.0, 4063.0, 19787.0, 144421.0, 619526.0, 220953.0, 29298.0, 5567.0, 1662.0, 585.0, 279.0, 125.0, 48.0, 25.0, 17.0, 23.0, 11.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5009765625, -1.4373931884765625, -1.373809814453125, -1.3102264404296875, -1.24664306640625, -1.1830596923828125, -1.119476318359375, -1.0558929443359375, -0.9923095703125, -0.9287261962890625, -0.865142822265625, -0.8015594482421875, -0.73797607421875, -0.6743927001953125, -0.610809326171875, -0.5472259521484375, -0.483642578125, -0.4200592041015625, -0.356475830078125, -0.2928924560546875, -0.22930908203125, -0.1657257080078125, -0.102142333984375, -0.0385589599609375, 0.0250244140625, 0.0886077880859375, 0.152191162109375, 0.2157745361328125, 0.27935791015625, 0.3429412841796875, 0.406524658203125, 0.4701080322265625, 0.53369140625, 0.5972747802734375, 0.660858154296875, 0.7244415283203125, 0.78802490234375, 0.8516082763671875, 0.915191650390625, 0.9787750244140625, 1.0423583984375, 1.1059417724609375, 1.169525146484375, 1.2331085205078125, 1.29669189453125, 1.3602752685546875, 1.423858642578125, 1.4874420166015625, 1.551025390625, 1.6146087646484375, 1.678192138671875, 1.7417755126953125, 1.80535888671875, 1.8689422607421875, 1.932525634765625, 1.9961090087890625, 2.0596923828125, 2.1232757568359375, 2.186859130859375, 2.2504425048828125, 2.31402587890625, 2.3776092529296875, 2.441192626953125, 2.5047760009765625, 2.568359375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 3.0, 3.0, 6.0, 8.0, 7.0, 11.0, 25.0, 29.0, 41.0, 54.0, 61.0, 83.0, 100.0, 112.0, 102.0, 81.0, 68.0, 62.0, 30.0, 33.0, 30.0, 18.0, 13.0, 6.0, 3.0, 4.0, 5.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6904296875, -1.6334686279296875, -1.576507568359375, -1.5195465087890625, -1.46258544921875, -1.4056243896484375, -1.348663330078125, -1.2917022705078125, -1.2347412109375, -1.1777801513671875, -1.120819091796875, -1.0638580322265625, -1.00689697265625, -0.9499359130859375, -0.892974853515625, -0.8360137939453125, -0.779052734375, -0.7220916748046875, -0.665130615234375, -0.6081695556640625, -0.55120849609375, -0.4942474365234375, -0.437286376953125, -0.3803253173828125, -0.3233642578125, -0.2664031982421875, -0.209442138671875, -0.1524810791015625, -0.09552001953125, -0.0385589599609375, 0.018402099609375, 0.0753631591796875, 0.13232421875, 0.1892852783203125, 0.246246337890625, 0.3032073974609375, 0.36016845703125, 0.4171295166015625, 0.474090576171875, 0.5310516357421875, 0.5880126953125, 0.6449737548828125, 0.701934814453125, 0.7588958740234375, 0.81585693359375, 0.8728179931640625, 0.929779052734375, 0.9867401123046875, 1.043701171875, 1.1006622314453125, 1.157623291015625, 1.2145843505859375, 1.27154541015625, 1.3285064697265625, 1.385467529296875, 1.4424285888671875, 1.4993896484375, 1.5563507080078125, 1.613311767578125, 1.6702728271484375, 1.72723388671875, 1.7841949462890625, 1.841156005859375, 1.8981170654296875, 1.955078125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 26.0, 52.0, 131.0, 221.0, 241.0, 186.0, 82.0, 37.0, 19.0, 9.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-64.51769256591797, -63.180030822753906, -61.842369079589844, -60.50471115112305, -59.167049407958984, -57.82938766479492, -56.491729736328125, -55.15406799316406, -53.81640625, -52.47874450683594, -51.141082763671875, -49.80342483520508, -48.465763092041016, -47.12810134887695, -45.790443420410156, -44.452781677246094, -43.11511993408203, -41.77745819091797, -40.439796447753906, -39.10213851928711, -37.76447677612305, -36.426815032958984, -35.08915710449219, -33.751495361328125, -32.41383361816406, -31.076171875, -29.73851203918457, -28.40085220336914, -27.063190460205078, -25.725528717041016, -24.387868881225586, -23.050209045410156, -21.712547302246094, -20.37488555908203, -19.0372257232666, -17.699565887451172, -16.36190414428711, -15.024243354797363, -13.686582565307617, -12.348921775817871, -11.011260986328125, -9.673600196838379, -8.335939407348633, -6.998278617858887, -5.660617828369141, -4.3229570388793945, -2.9852962493896484, -1.6476354598999023, -0.30997467041015625, 1.0276861190795898, 2.365346908569336, 3.703007698059082, 5.040668487548828, 6.378329277038574, 7.71599006652832, 9.053650856018066, 10.391311645507812, 11.728972434997559, 13.066633224487305, 14.40429401397705, 15.741954803466797, 17.07961654663086, 18.41727638244629, 19.75493621826172, 21.09259796142578]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 7.0, 4.0, 9.0, 14.0, 18.0, 7.0, 19.0, 14.0, 29.0, 27.0, 30.0, 29.0, 30.0, 48.0, 42.0, 43.0, 50.0, 40.0, 59.0, 48.0, 34.0, 48.0, 56.0, 33.0, 47.0, 25.0, 39.0, 25.0, 16.0, 21.0, 26.0, 9.0, 11.0, 8.0, 10.0, 10.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.099786758422852, -11.729218482971191, -11.358649253845215, -10.988080978393555, -10.617511749267578, -10.246943473815918, -9.876375198364258, -9.505805969238281, -9.135237693786621, -8.764669418334961, -8.394100189208984, -8.023531913757324, -7.652963161468506, -7.2823944091796875, -6.911826133728027, -6.541257381439209, -6.170688629150391, -5.800119876861572, -5.429551124572754, -5.058982849121094, -4.688414096832275, -4.317845344543457, -3.9472768306732178, -3.5767083168029785, -3.20613956451416, -2.835570812225342, -2.4650022983551025, -2.0944337844848633, -1.723865032196045, -1.3532963991165161, -0.9827277660369873, -0.612159252166748, -0.24158954620361328, 0.12897908687591553, 0.49954771995544434, 0.8701163530349731, 1.240684986114502, 1.6112536191940308, 1.9818222522735596, 2.352390766143799, 2.722959518432617, 3.0935282707214355, 3.464096784591675, 3.834665298461914, 4.205234050750732, 4.575802803039551, 4.946371078491211, 5.316939830780029, 5.687508583068848, 6.058077335357666, 6.428646087646484, 6.7992143630981445, 7.169783115386963, 7.540351867675781, 7.910920143127441, 8.281488418579102, 8.652057647705078, 9.022625923156738, 9.393195152282715, 9.763763427734375, 10.134332656860352, 10.504900932312012, 10.875469207763672, 11.246038436889648, 11.616606712341309]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 3.0, 11.0, 7.0, 17.0, 21.0, 29.0, 46.0, 64.0, 87.0, 165.0, 272.0, 539.0, 992.0, 2293.0, 6382.0, 28523.0, 4006648.0, 126739.0, 14105.0, 4050.0, 1549.0, 745.0, 362.0, 221.0, 127.0, 94.0, 44.0, 39.0, 28.0, 17.0, 13.0, 11.0, 5.0, 6.0, 2.0, 3.0, 3.0, 7.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.703125, -5.52374267578125, -5.3443603515625, -5.16497802734375, -4.985595703125, -4.80621337890625, -4.6268310546875, -4.44744873046875, -4.26806640625, -4.08868408203125, -3.9093017578125, -3.72991943359375, -3.550537109375, -3.37115478515625, -3.1917724609375, -3.01239013671875, -2.8330078125, -2.65362548828125, -2.4742431640625, -2.29486083984375, -2.115478515625, -1.93609619140625, -1.7567138671875, -1.57733154296875, -1.39794921875, -1.21856689453125, -1.0391845703125, -0.85980224609375, -0.680419921875, -0.50103759765625, -0.3216552734375, -0.14227294921875, 0.037109375, 0.21649169921875, 0.3958740234375, 0.57525634765625, 0.754638671875, 0.93402099609375, 1.1134033203125, 1.29278564453125, 1.47216796875, 1.65155029296875, 1.8309326171875, 2.01031494140625, 2.189697265625, 2.36907958984375, 2.5484619140625, 2.72784423828125, 2.9072265625, 3.08660888671875, 3.2659912109375, 3.44537353515625, 3.624755859375, 3.80413818359375, 3.9835205078125, 4.16290283203125, 4.34228515625, 4.52166748046875, 4.7010498046875, 4.88043212890625, 5.059814453125, 5.23919677734375, 5.4185791015625, 5.59796142578125, 5.77734375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 6.0, 6.0, 8.0, 10.0, 16.0, 13.0, 15.0, 27.0, 31.0, 23.0, 33.0, 33.0, 51.0, 63.0, 38.0, 40.0, 42.0, 54.0, 45.0, 51.0, 54.0, 53.0, 29.0, 35.0, 36.0, 33.0, 29.0, 25.0, 14.0, 20.0, 10.0, 16.0, 8.0, 4.0, 6.0, 4.0, 5.0, 1.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.61279296875, -0.5956153869628906, -0.5784378051757812, -0.5612602233886719, -0.5440826416015625, -0.5269050598144531, -0.5097274780273438, -0.4925498962402344, -0.475372314453125, -0.4581947326660156, -0.44101715087890625, -0.4238395690917969, -0.4066619873046875, -0.3894844055175781, -0.37230682373046875, -0.3551292419433594, -0.33795166015625, -0.3207740783691406, -0.30359649658203125, -0.2864189147949219, -0.2692413330078125, -0.2520637512207031, -0.23488616943359375, -0.21770858764648438, -0.200531005859375, -0.18335342407226562, -0.16617584228515625, -0.14899826049804688, -0.1318206787109375, -0.11464309692382812, -0.09746551513671875, -0.08028793334960938, -0.0631103515625, -0.045932769775390625, -0.02875518798828125, -0.011577606201171875, 0.0055999755859375, 0.022777557373046875, 0.03995513916015625, 0.057132720947265625, 0.074310302734375, 0.09148788452148438, 0.10866546630859375, 0.12584304809570312, 0.1430206298828125, 0.16019821166992188, 0.17737579345703125, 0.19455337524414062, 0.21173095703125, 0.22890853881835938, 0.24608612060546875, 0.2632637023925781, 0.2804412841796875, 0.2976188659667969, 0.31479644775390625, 0.3319740295410156, 0.349151611328125, 0.3663291931152344, 0.38350677490234375, 0.4006843566894531, 0.4178619384765625, 0.4350395202636719, 0.45221710205078125, 0.4693946838378906, 0.486572265625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 7.0, 17.0, 28.0, 49.0, 90.0, 154.0, 244.0, 443.0, 906.0, 2038.0, 5004.0, 14438.0, 61843.0, 3882280.0, 186196.0, 26989.0, 8038.0, 2861.0, 1333.0, 566.0, 329.0, 182.0, 109.0, 60.0, 37.0, 26.0, 12.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.30859375, -3.204345703125, -3.10009765625, -2.995849609375, -2.8916015625, -2.787353515625, -2.68310546875, -2.578857421875, -2.474609375, -2.370361328125, -2.26611328125, -2.161865234375, -2.0576171875, -1.953369140625, -1.84912109375, -1.744873046875, -1.640625, -1.536376953125, -1.43212890625, -1.327880859375, -1.2236328125, -1.119384765625, -1.01513671875, -0.910888671875, -0.806640625, -0.702392578125, -0.59814453125, -0.493896484375, -0.3896484375, -0.285400390625, -0.18115234375, -0.076904296875, 0.02734375, 0.131591796875, 0.23583984375, 0.340087890625, 0.4443359375, 0.548583984375, 0.65283203125, 0.757080078125, 0.861328125, 0.965576171875, 1.06982421875, 1.174072265625, 1.2783203125, 1.382568359375, 1.48681640625, 1.591064453125, 1.6953125, 1.799560546875, 1.90380859375, 2.008056640625, 2.1123046875, 2.216552734375, 2.32080078125, 2.425048828125, 2.529296875, 2.633544921875, 2.73779296875, 2.842041015625, 2.9462890625, 3.050537109375, 3.15478515625, 3.259033203125, 3.36328125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 2.0, 3.0, 3.0, 4.0, 5.0, 4.0, 3.0, 9.0, 10.0, 9.0, 15.0, 27.0, 45.0, 57.0, 80.0, 239.0, 3115.0, 179.0, 82.0, 51.0, 36.0, 25.0, 19.0, 11.0, 10.0, 4.0, 3.0, 6.0, 3.0, 1.0, 7.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3857421875, -0.3711090087890625, -0.356475830078125, -0.3418426513671875, -0.32720947265625, -0.3125762939453125, -0.297943115234375, -0.2833099365234375, -0.2686767578125, -0.2540435791015625, -0.239410400390625, -0.2247772216796875, -0.21014404296875, -0.1955108642578125, -0.180877685546875, -0.1662445068359375, -0.151611328125, -0.1369781494140625, -0.122344970703125, -0.1077117919921875, -0.09307861328125, -0.0784454345703125, -0.063812255859375, -0.0491790771484375, -0.0345458984375, -0.0199127197265625, -0.005279541015625, 0.0093536376953125, 0.02398681640625, 0.0386199951171875, 0.053253173828125, 0.0678863525390625, 0.08251953125, 0.0971527099609375, 0.111785888671875, 0.1264190673828125, 0.14105224609375, 0.1556854248046875, 0.170318603515625, 0.1849517822265625, 0.1995849609375, 0.2142181396484375, 0.228851318359375, 0.2434844970703125, 0.25811767578125, 0.2727508544921875, 0.287384033203125, 0.3020172119140625, 0.316650390625, 0.3312835693359375, 0.345916748046875, 0.3605499267578125, 0.37518310546875, 0.3898162841796875, 0.404449462890625, 0.4190826416015625, 0.4337158203125, 0.4483489990234375, 0.462982177734375, 0.4776153564453125, 0.49224853515625, 0.5068817138671875, 0.521514892578125, 0.5361480712890625, 0.55078125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 15.0, 33.0, 34.0, 59.0, 94.0, 114.0, 134.0, 132.0, 126.0, 79.0, 69.0, 47.0, 26.0, 18.0, 4.0, 5.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.540987968444824, -2.4557275772094727, -2.370467185974121, -2.2852065563201904, -2.199946165084839, -2.1146857738494873, -2.0294251441955566, -1.944164752960205, -1.8589043617248535, -1.773643970489502, -1.6883834600448608, -1.6031229496002197, -1.5178625583648682, -1.4326021671295166, -1.3473416566848755, -1.2620811462402344, -1.1768207550048828, -1.0915603637695312, -1.0062998533248901, -0.9210394024848938, -0.8357789516448975, -0.7505185008049011, -0.6652580499649048, -0.5799975991249084, -0.4947371482849121, -0.40947669744491577, -0.32421624660491943, -0.2389557957649231, -0.15369534492492676, -0.06843489408493042, 0.016825556755065918, 0.10208600759506226, 0.1873464584350586, 0.27260690927505493, 0.35786736011505127, 0.4431278109550476, 0.528388261795044, 0.6136487126350403, 0.6989091634750366, 0.784169614315033, 0.8694300651550293, 0.9546905159950256, 1.039950966835022, 1.125211477279663, 1.2104718685150146, 1.2957322597503662, 1.3809927701950073, 1.4662532806396484, 1.551513671875, 1.6367740631103516, 1.7220345735549927, 1.8072950839996338, 1.8925554752349854, 1.977815866470337, 2.0630764961242676, 2.148336887359619, 2.2335972785949707, 2.3188576698303223, 2.404118061065674, 2.4893786907196045, 2.574639081954956, 2.6598994731903076, 2.7451601028442383, 2.83042049407959, 2.9156808853149414]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 6.0, 10.0, 8.0, 6.0, 12.0, 22.0, 25.0, 29.0, 34.0, 27.0, 33.0, 40.0, 42.0, 41.0, 42.0, 43.0, 46.0, 40.0, 46.0, 49.0, 37.0, 41.0, 41.0, 35.0, 46.0, 28.0, 21.0, 28.0, 23.0, 18.0, 16.0, 17.0, 13.0, 9.0, 6.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4903054237365723, -1.4488273859024048, -1.4073494672775269, -1.3658714294433594, -1.3243935108184814, -1.282915472984314, -1.241437554359436, -1.1999595165252686, -1.1584815979003906, -1.1170035600662231, -1.0755256414413452, -1.0340476036071777, -0.9925696849822998, -0.9510917067527771, -0.9096137285232544, -0.8681356906890869, -0.8266577124595642, -0.7851797342300415, -0.7437017560005188, -0.7022237777709961, -0.6607457995414734, -0.6192678213119507, -0.5777897834777832, -0.5363118648529053, -0.4948338568210602, -0.4533558785915375, -0.41187790036201477, -0.3703998923301697, -0.328921914100647, -0.28744393587112427, -0.24596595764160156, -0.20448797941207886, -0.16301000118255615, -0.12153202295303345, -0.08005403727293015, -0.03857605159282684, 0.002901926636695862, 0.04437990486621857, 0.08585789799690247, 0.12733587622642517, 0.16881385445594788, 0.21029183268547058, 0.2517698109149933, 0.2932478189468384, 0.3347257971763611, 0.3762037754058838, 0.4176817536354065, 0.4591597318649292, 0.5006377100944519, 0.5421156883239746, 0.5835936665534973, 0.62507164478302, 0.6665496230125427, 0.7080276012420654, 0.7495056390762329, 0.7909835577011108, 0.8324615955352783, 0.873939573764801, 0.9154175519943237, 0.9568955302238464, 0.9983735084533691, 1.0398515462875366, 1.0813294649124146, 1.122807502746582, 1.16428542137146]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 13.0, 9.0, 10.0, 18.0, 27.0, 39.0, 47.0, 89.0, 146.0, 229.0, 408.0, 724.0, 1327.0, 2547.0, 5141.0, 10535.0, 22116.0, 45527.0, 90616.0, 167172.0, 237988.0, 210620.0, 125781.0, 64931.0, 32028.0, 15341.0, 7469.0, 3599.0, 1742.0, 992.0, 493.0, 304.0, 201.0, 114.0, 70.0, 51.0, 26.0, 13.0, 17.0, 12.0, 5.0, 7.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.5693359375, -1.5228424072265625, -1.476348876953125, -1.4298553466796875, -1.38336181640625, -1.3368682861328125, -1.290374755859375, -1.2438812255859375, -1.1973876953125, -1.1508941650390625, -1.104400634765625, -1.0579071044921875, -1.01141357421875, -0.9649200439453125, -0.918426513671875, -0.8719329833984375, -0.825439453125, -0.7789459228515625, -0.732452392578125, -0.6859588623046875, -0.63946533203125, -0.5929718017578125, -0.546478271484375, -0.4999847412109375, -0.4534912109375, -0.4069976806640625, -0.360504150390625, -0.3140106201171875, -0.26751708984375, -0.2210235595703125, -0.174530029296875, -0.1280364990234375, -0.08154296875, -0.0350494384765625, 0.011444091796875, 0.0579376220703125, 0.10443115234375, 0.1509246826171875, 0.197418212890625, 0.2439117431640625, 0.2904052734375, 0.3368988037109375, 0.383392333984375, 0.4298858642578125, 0.47637939453125, 0.5228729248046875, 0.569366455078125, 0.6158599853515625, 0.662353515625, 0.7088470458984375, 0.755340576171875, 0.8018341064453125, 0.84832763671875, 0.8948211669921875, 0.941314697265625, 0.9878082275390625, 1.0343017578125, 1.0807952880859375, 1.127288818359375, 1.1737823486328125, 1.22027587890625, 1.2667694091796875, 1.313262939453125, 1.3597564697265625, 1.40625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 7.0, 9.0, 12.0, 10.0, 13.0, 15.0, 25.0, 27.0, 29.0, 32.0, 39.0, 30.0, 42.0, 56.0, 38.0, 66.0, 49.0, 57.0, 56.0, 40.0, 54.0, 53.0, 36.0, 36.0, 29.0, 23.0, 26.0, 24.0, 13.0, 20.0, 7.0, 15.0, 2.0, 3.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69189453125, -0.6720809936523438, -0.6522674560546875, -0.6324539184570312, -0.612640380859375, -0.5928268432617188, -0.5730133056640625, -0.5531997680664062, -0.53338623046875, -0.5135726928710938, -0.4937591552734375, -0.47394561767578125, -0.454132080078125, -0.43431854248046875, -0.4145050048828125, -0.39469146728515625, -0.3748779296875, -0.35506439208984375, -0.3352508544921875, -0.31543731689453125, -0.295623779296875, -0.27581024169921875, -0.2559967041015625, -0.23618316650390625, -0.21636962890625, -0.19655609130859375, -0.1767425537109375, -0.15692901611328125, -0.137115478515625, -0.11730194091796875, -0.0974884033203125, -0.07767486572265625, -0.057861328125, -0.03804779052734375, -0.0182342529296875, 0.00157928466796875, 0.021392822265625, 0.04120635986328125, 0.0610198974609375, 0.08083343505859375, 0.10064697265625, 0.12046051025390625, 0.1402740478515625, 0.16008758544921875, 0.179901123046875, 0.19971466064453125, 0.2195281982421875, 0.23934173583984375, 0.2591552734375, 0.27896881103515625, 0.2987823486328125, 0.31859588623046875, 0.338409423828125, 0.35822296142578125, 0.3780364990234375, 0.39785003662109375, 0.41766357421875, 0.43747711181640625, 0.4572906494140625, 0.47710418701171875, 0.496917724609375, 0.5167312622070312, 0.5365447998046875, 0.5563583374023438, 0.576171875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 9.0, 13.0, 17.0, 26.0, 35.0, 50.0, 72.0, 86.0, 129.0, 192.0, 252.0, 416.0, 647.0, 1169.0, 2246.0, 4939.0, 12002.0, 30297.0, 79565.0, 199751.0, 357159.0, 215740.0, 86419.0, 33144.0, 12983.0, 5462.0, 2421.0, 1269.0, 698.0, 405.0, 276.0, 192.0, 137.0, 95.0, 59.0, 40.0, 42.0, 30.0, 14.0, 11.0, 12.0, 12.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5390625, -1.486968994140625, -1.43487548828125, -1.382781982421875, -1.3306884765625, -1.278594970703125, -1.22650146484375, -1.174407958984375, -1.122314453125, -1.070220947265625, -1.01812744140625, -0.966033935546875, -0.9139404296875, -0.861846923828125, -0.80975341796875, -0.757659912109375, -0.70556640625, -0.653472900390625, -0.60137939453125, -0.549285888671875, -0.4971923828125, -0.445098876953125, -0.39300537109375, -0.340911865234375, -0.288818359375, -0.236724853515625, -0.18463134765625, -0.132537841796875, -0.0804443359375, -0.028350830078125, 0.02374267578125, 0.075836181640625, 0.1279296875, 0.180023193359375, 0.23211669921875, 0.284210205078125, 0.3363037109375, 0.388397216796875, 0.44049072265625, 0.492584228515625, 0.544677734375, 0.596771240234375, 0.64886474609375, 0.700958251953125, 0.7530517578125, 0.805145263671875, 0.85723876953125, 0.909332275390625, 0.96142578125, 1.013519287109375, 1.06561279296875, 1.117706298828125, 1.1697998046875, 1.221893310546875, 1.27398681640625, 1.326080322265625, 1.378173828125, 1.430267333984375, 1.48236083984375, 1.534454345703125, 1.5865478515625, 1.638641357421875, 1.69073486328125, 1.742828369140625, 1.794921875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 8.0, 3.0, 5.0, 8.0, 7.0, 15.0, 12.0, 19.0, 16.0, 17.0, 24.0, 18.0, 26.0, 31.0, 39.0, 45.0, 34.0, 32.0, 36.0, 41.0, 38.0, 48.0, 39.0, 52.0, 44.0, 39.0, 48.0, 39.0, 33.0, 33.0, 23.0, 19.0, 18.0, 15.0, 14.0, 9.0, 7.0, 7.0, 10.0, 5.0, 10.0, 4.0, 6.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-2.5078125, -2.432098388671875, -2.35638427734375, -2.280670166015625, -2.2049560546875, -2.129241943359375, -2.05352783203125, -1.977813720703125, -1.902099609375, -1.826385498046875, -1.75067138671875, -1.674957275390625, -1.5992431640625, -1.523529052734375, -1.44781494140625, -1.372100830078125, -1.29638671875, -1.220672607421875, -1.14495849609375, -1.069244384765625, -0.9935302734375, -0.917816162109375, -0.84210205078125, -0.766387939453125, -0.690673828125, -0.614959716796875, -0.53924560546875, -0.463531494140625, -0.3878173828125, -0.312103271484375, -0.23638916015625, -0.160675048828125, -0.0849609375, -0.009246826171875, 0.06646728515625, 0.142181396484375, 0.2178955078125, 0.293609619140625, 0.36932373046875, 0.445037841796875, 0.520751953125, 0.596466064453125, 0.67218017578125, 0.747894287109375, 0.8236083984375, 0.899322509765625, 0.97503662109375, 1.050750732421875, 1.12646484375, 1.202178955078125, 1.27789306640625, 1.353607177734375, 1.4293212890625, 1.505035400390625, 1.58074951171875, 1.656463623046875, 1.732177734375, 1.807891845703125, 1.88360595703125, 1.959320068359375, 2.0350341796875, 2.110748291015625, 2.18646240234375, 2.262176513671875, 2.337890625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 6.0, 6.0, 10.0, 12.0, 20.0, 36.0, 48.0, 71.0, 135.0, 244.0, 451.0, 906.0, 1873.0, 4507.0, 13006.0, 45117.0, 181906.0, 495198.0, 224754.0, 55257.0, 15506.0, 5218.0, 2122.0, 1001.0, 467.0, 286.0, 162.0, 89.0, 57.0, 30.0, 26.0, 13.0, 9.0, 8.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.05859375, -1.0239715576171875, -0.989349365234375, -0.9547271728515625, -0.92010498046875, -0.8854827880859375, -0.850860595703125, -0.8162384033203125, -0.7816162109375, -0.7469940185546875, -0.712371826171875, -0.6777496337890625, -0.64312744140625, -0.6085052490234375, -0.573883056640625, -0.5392608642578125, -0.504638671875, -0.4700164794921875, -0.435394287109375, -0.4007720947265625, -0.36614990234375, -0.3315277099609375, -0.296905517578125, -0.2622833251953125, -0.2276611328125, -0.1930389404296875, -0.158416748046875, -0.1237945556640625, -0.08917236328125, -0.0545501708984375, -0.019927978515625, 0.0146942138671875, 0.04931640625, 0.0839385986328125, 0.118560791015625, 0.1531829833984375, 0.18780517578125, 0.2224273681640625, 0.257049560546875, 0.2916717529296875, 0.3262939453125, 0.3609161376953125, 0.395538330078125, 0.4301605224609375, 0.46478271484375, 0.4994049072265625, 0.534027099609375, 0.5686492919921875, 0.603271484375, 0.6378936767578125, 0.672515869140625, 0.7071380615234375, 0.74176025390625, 0.7763824462890625, 0.811004638671875, 0.8456268310546875, 0.8802490234375, 0.9148712158203125, 0.949493408203125, 0.9841156005859375, 1.01873779296875, 1.0533599853515625, 1.087982177734375, 1.1226043701171875, 1.1572265625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 7.0, 7.0, 4.0, 8.0, 16.0, 23.0, 16.0, 28.0, 30.0, 31.0, 30.0, 42.0, 44.0, 44.0, 54.0, 58.0, 54.0, 66.0, 73.0, 55.0, 53.0, 40.0, 46.0, 32.0, 24.0, 18.0, 16.0, 10.0, 19.0, 11.0, 5.0, 7.0, 5.0, 9.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.00014901161193847656, -0.0001446940004825592, -0.00014037638902664185, -0.0001360587775707245, -0.00013174116611480713, -0.00012742355465888977, -0.0001231059432029724, -0.00011878833174705505, -0.0001144707202911377, -0.00011015310883522034, -0.00010583549737930298, -0.00010151788592338562, -9.720027446746826e-05, -9.28826630115509e-05, -8.856505155563354e-05, -8.424744009971619e-05, -7.992982864379883e-05, -7.561221718788147e-05, -7.129460573196411e-05, -6.697699427604675e-05, -6.26593828201294e-05, -5.8341771364212036e-05, -5.402415990829468e-05, -4.970654845237732e-05, -4.538893699645996e-05, -4.10713255405426e-05, -3.6753714084625244e-05, -3.2436102628707886e-05, -2.8118491172790527e-05, -2.380087971687317e-05, -1.948326826095581e-05, -1.5165656805038452e-05, -1.0848045349121094e-05, -6.530433893203735e-06, -2.212822437286377e-06, 2.1047890186309814e-06, 6.42240047454834e-06, 1.0740011930465698e-05, 1.5057623386383057e-05, 1.9375234842300415e-05, 2.3692846298217773e-05, 2.8010457754135132e-05, 3.232806921005249e-05, 3.664568066596985e-05, 4.096329212188721e-05, 4.5280903577804565e-05, 4.9598515033721924e-05, 5.391612648963928e-05, 5.823373794555664e-05, 6.2551349401474e-05, 6.686896085739136e-05, 7.118657231330872e-05, 7.550418376922607e-05, 7.982179522514343e-05, 8.413940668106079e-05, 8.845701813697815e-05, 9.277462959289551e-05, 9.709224104881287e-05, 0.00010140985250473022, 0.00010572746396064758, 0.00011004507541656494, 0.0001143626868724823, 0.00011868029832839966, 0.00012299790978431702, 0.00012731552124023438]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 8.0, 9.0, 15.0, 30.0, 53.0, 72.0, 167.0, 247.0, 465.0, 909.0, 2019.0, 5143.0, 18872.0, 102770.0, 529731.0, 318931.0, 51602.0, 10936.0, 3529.0, 1445.0, 712.0, 366.0, 204.0, 118.0, 64.0, 45.0, 28.0, 21.0, 14.0, 8.0, 9.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3017578125, -1.2565765380859375, -1.211395263671875, -1.1662139892578125, -1.12103271484375, -1.0758514404296875, -1.030670166015625, -0.9854888916015625, -0.9403076171875, -0.8951263427734375, -0.849945068359375, -0.8047637939453125, -0.75958251953125, -0.7144012451171875, -0.669219970703125, -0.6240386962890625, -0.578857421875, -0.5336761474609375, -0.488494873046875, -0.4433135986328125, -0.39813232421875, -0.3529510498046875, -0.307769775390625, -0.2625885009765625, -0.2174072265625, -0.1722259521484375, -0.127044677734375, -0.0818634033203125, -0.03668212890625, 0.0084991455078125, 0.053680419921875, 0.0988616943359375, 0.14404296875, 0.1892242431640625, 0.234405517578125, 0.2795867919921875, 0.32476806640625, 0.3699493408203125, 0.415130615234375, 0.4603118896484375, 0.5054931640625, 0.5506744384765625, 0.595855712890625, 0.6410369873046875, 0.68621826171875, 0.7313995361328125, 0.776580810546875, 0.8217620849609375, 0.866943359375, 0.9121246337890625, 0.957305908203125, 1.0024871826171875, 1.04766845703125, 1.0928497314453125, 1.138031005859375, 1.1832122802734375, 1.2283935546875, 1.2735748291015625, 1.318756103515625, 1.3639373779296875, 1.40911865234375, 1.4542999267578125, 1.499481201171875, 1.5446624755859375, 1.58984375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 8.0, 2.0, 4.0, 4.0, 7.0, 8.0, 15.0, 21.0, 36.0, 42.0, 57.0, 93.0, 101.0, 113.0, 123.0, 93.0, 78.0, 51.0, 49.0, 36.0, 21.0, 11.0, 15.0, 9.0, 8.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.5703125, -2.5142364501953125, -2.458160400390625, -2.4020843505859375, -2.34600830078125, -2.2899322509765625, -2.233856201171875, -2.1777801513671875, -2.1217041015625, -2.0656280517578125, -2.009552001953125, -1.9534759521484375, -1.89739990234375, -1.8413238525390625, -1.785247802734375, -1.7291717529296875, -1.673095703125, -1.6170196533203125, -1.560943603515625, -1.5048675537109375, -1.44879150390625, -1.3927154541015625, -1.336639404296875, -1.2805633544921875, -1.2244873046875, -1.1684112548828125, -1.112335205078125, -1.0562591552734375, -1.00018310546875, -0.9441070556640625, -0.888031005859375, -0.8319549560546875, -0.77587890625, -0.7198028564453125, -0.663726806640625, -0.6076507568359375, -0.55157470703125, -0.4954986572265625, -0.439422607421875, -0.3833465576171875, -0.3272705078125, -0.2711944580078125, -0.215118408203125, -0.1590423583984375, -0.10296630859375, -0.0468902587890625, 0.009185791015625, 0.0652618408203125, 0.121337890625, 0.1774139404296875, 0.233489990234375, 0.2895660400390625, 0.34564208984375, 0.4017181396484375, 0.457794189453125, 0.5138702392578125, 0.5699462890625, 0.6260223388671875, 0.682098388671875, 0.7381744384765625, 0.79425048828125, 0.8503265380859375, 0.906402587890625, 0.9624786376953125, 1.0185546875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 10.0, 9.0, 31.0, 77.0, 171.0, 282.0, 222.0, 113.0, 61.0, 22.0, 9.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.69205093383789, -27.388267517089844, -26.084484100341797, -24.78070068359375, -23.476917266845703, -22.173133850097656, -20.86935043334961, -19.565567016601562, -18.261783599853516, -16.95800018310547, -15.654216766357422, -14.350433349609375, -13.046649932861328, -11.742866516113281, -10.439083099365234, -9.135299682617188, -7.831516265869141, -6.527732849121094, -5.223949432373047, -3.920166015625, -2.616382598876953, -1.3125991821289062, -0.008815765380859375, 1.2949676513671875, 2.5987510681152344, 3.9025344848632812, 5.206317901611328, 6.510101318359375, 7.813884735107422, 9.117668151855469, 10.421451568603516, 11.725234985351562, 13.02901840209961, 14.332801818847656, 15.636585235595703, 16.94036865234375, 18.244152069091797, 19.547935485839844, 20.85171890258789, 22.155502319335938, 23.459285736083984, 24.76306915283203, 26.066852569580078, 27.370635986328125, 28.674419403076172, 29.97820281982422, 31.281986236572266, 32.58576965332031, 33.88955307006836, 35.193336486816406, 36.49711990356445, 37.8009033203125, 39.10468673706055, 40.408470153808594, 41.71225357055664, 43.01603698730469, 44.319820404052734, 45.62360382080078, 46.92738723754883, 48.231170654296875, 49.53495407104492, 50.83873748779297, 52.142520904541016, 53.44630432128906, 54.75008773803711]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 7.0, 6.0, 1.0, 5.0, 4.0, 8.0, 3.0, 11.0, 13.0, 12.0, 28.0, 21.0, 25.0, 28.0, 40.0, 39.0, 40.0, 47.0, 47.0, 60.0, 47.0, 61.0, 64.0, 48.0, 53.0, 38.0, 45.0, 51.0, 28.0, 24.0, 31.0, 15.0, 18.0, 7.0, 13.0, 3.0, 5.0, 6.0, 6.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.377784729003906, -15.882405281066895, -15.387025833129883, -14.891645431518555, -14.396265983581543, -13.900886535644531, -13.40550708770752, -12.910127639770508, -12.41474723815918, -11.919367790222168, -11.423988342285156, -10.928607940673828, -10.433228492736816, -9.937849044799805, -9.442469596862793, -8.947090148925781, -8.45171070098877, -7.956331253051758, -7.460951328277588, -6.965571880340576, -6.470191955566406, -5.9748125076293945, -5.479433059692383, -4.984053611755371, -4.488673686981201, -3.9932940006256104, -3.4979143142700195, -3.002534866333008, -2.507155179977417, -2.011775493621826, -1.5163960456848145, -1.0210163593292236, -0.5256366729736328, -0.030257046222686768, 0.4651225805282593, 0.9605021476745605, 1.4558818340301514, 1.9512615203857422, 2.446640968322754, 2.9420206546783447, 3.4374003410339355, 3.9327800273895264, 4.428159713745117, 4.923539161682129, 5.418918609619141, 5.9142985343933105, 6.409677982330322, 6.905057907104492, 7.400437355041504, 7.895816802978516, 8.391196250915527, 8.886575698852539, 9.381956100463867, 9.877335548400879, 10.37271499633789, 10.868094444274902, 11.363473892211914, 11.858853340148926, 12.354232788085938, 12.849613189697266, 13.344992637634277, 13.840372085571289, 14.3357515335083, 14.831130981445312, 15.32651138305664]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 8.0, 8.0, 13.0, 20.0, 22.0, 23.0, 57.0, 85.0, 120.0, 179.0, 302.0, 517.0, 907.0, 1833.0, 4536.0, 14778.0, 93687.0, 4015426.0, 45460.0, 9596.0, 3306.0, 1521.0, 736.0, 413.0, 246.0, 162.0, 117.0, 67.0, 28.0, 36.0, 19.0, 8.0, 7.0, 5.0, 9.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.9921875, -2.88275146484375, -2.7733154296875, -2.66387939453125, -2.554443359375, -2.44500732421875, -2.3355712890625, -2.22613525390625, -2.11669921875, -2.00726318359375, -1.8978271484375, -1.78839111328125, -1.678955078125, -1.56951904296875, -1.4600830078125, -1.35064697265625, -1.2412109375, -1.13177490234375, -1.0223388671875, -0.91290283203125, -0.803466796875, -0.69403076171875, -0.5845947265625, -0.47515869140625, -0.36572265625, -0.25628662109375, -0.1468505859375, -0.03741455078125, 0.072021484375, 0.18145751953125, 0.2908935546875, 0.40032958984375, 0.509765625, 0.61920166015625, 0.7286376953125, 0.83807373046875, 0.947509765625, 1.05694580078125, 1.1663818359375, 1.27581787109375, 1.38525390625, 1.49468994140625, 1.6041259765625, 1.71356201171875, 1.822998046875, 1.93243408203125, 2.0418701171875, 2.15130615234375, 2.2607421875, 2.37017822265625, 2.4796142578125, 2.58905029296875, 2.698486328125, 2.80792236328125, 2.9173583984375, 3.02679443359375, 3.13623046875, 3.24566650390625, 3.3551025390625, 3.46453857421875, 3.573974609375, 3.68341064453125, 3.7928466796875, 3.90228271484375, 4.01171875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 5.0, 6.0, 9.0, 11.0, 12.0, 12.0, 19.0, 23.0, 32.0, 28.0, 25.0, 41.0, 46.0, 49.0, 55.0, 64.0, 46.0, 64.0, 47.0, 54.0, 55.0, 42.0, 33.0, 34.0, 43.0, 28.0, 26.0, 23.0, 15.0, 14.0, 5.0, 13.0, 9.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.76513671875, -0.7455863952636719, -0.7260360717773438, -0.7064857482910156, -0.6869354248046875, -0.6673851013183594, -0.6478347778320312, -0.6282844543457031, -0.608734130859375, -0.5891838073730469, -0.5696334838867188, -0.5500831604003906, -0.5305328369140625, -0.5109825134277344, -0.49143218994140625, -0.4718818664550781, -0.45233154296875, -0.4327812194824219, -0.41323089599609375, -0.3936805725097656, -0.3741302490234375, -0.3545799255371094, -0.33502960205078125, -0.3154792785644531, -0.295928955078125, -0.2763786315917969, -0.25682830810546875, -0.23727798461914062, -0.2177276611328125, -0.19817733764648438, -0.17862701416015625, -0.15907669067382812, -0.1395263671875, -0.11997604370117188, -0.10042572021484375, -0.08087539672851562, -0.0613250732421875, -0.041774749755859375, -0.02222442626953125, -0.002674102783203125, 0.016876220703125, 0.036426544189453125, 0.05597686767578125, 0.07552719116210938, 0.0950775146484375, 0.11462783813476562, 0.13417816162109375, 0.15372848510742188, 0.17327880859375, 0.19282913208007812, 0.21237945556640625, 0.23192977905273438, 0.2514801025390625, 0.2710304260253906, 0.29058074951171875, 0.3101310729980469, 0.329681396484375, 0.3492317199707031, 0.36878204345703125, 0.3883323669433594, 0.4078826904296875, 0.4274330139160156, 0.44698333740234375, 0.4665336608886719, 0.486083984375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 11.0, 7.0, 17.0, 18.0, 35.0, 34.0, 48.0, 80.0, 105.0, 174.0, 299.0, 450.0, 756.0, 1373.0, 2686.0, 5724.0, 13922.0, 42034.0, 223618.0, 3779433.0, 83179.0, 23263.0, 8784.0, 3755.0, 1812.0, 1011.0, 596.0, 370.0, 238.0, 162.0, 89.0, 54.0, 45.0, 25.0, 24.0, 12.0, 15.0, 9.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1796875, -2.1178436279296875, -2.055999755859375, -1.9941558837890625, -1.93231201171875, -1.8704681396484375, -1.808624267578125, -1.7467803955078125, -1.6849365234375, -1.6230926513671875, -1.561248779296875, -1.4994049072265625, -1.43756103515625, -1.3757171630859375, -1.313873291015625, -1.2520294189453125, -1.190185546875, -1.1283416748046875, -1.066497802734375, -1.0046539306640625, -0.94281005859375, -0.8809661865234375, -0.819122314453125, -0.7572784423828125, -0.6954345703125, -0.6335906982421875, -0.571746826171875, -0.5099029541015625, -0.44805908203125, -0.3862152099609375, -0.324371337890625, -0.2625274658203125, -0.20068359375, -0.1388397216796875, -0.076995849609375, -0.0151519775390625, 0.04669189453125, 0.1085357666015625, 0.170379638671875, 0.2322235107421875, 0.2940673828125, 0.3559112548828125, 0.417755126953125, 0.4795989990234375, 0.54144287109375, 0.6032867431640625, 0.665130615234375, 0.7269744873046875, 0.788818359375, 0.8506622314453125, 0.912506103515625, 0.9743499755859375, 1.03619384765625, 1.0980377197265625, 1.159881591796875, 1.2217254638671875, 1.2835693359375, 1.3454132080078125, 1.407257080078125, 1.4691009521484375, 1.53094482421875, 1.5927886962890625, 1.654632568359375, 1.7164764404296875, 1.7783203125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 6.0, 10.0, 22.0, 19.0, 54.0, 87.0, 235.0, 3332.0, 151.0, 66.0, 31.0, 26.0, 12.0, 7.0, 6.0, 7.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95263671875, -0.9256362915039062, -0.8986358642578125, -0.8716354370117188, -0.844635009765625, -0.8176345825195312, -0.7906341552734375, -0.7636337280273438, -0.73663330078125, -0.7096328735351562, -0.6826324462890625, -0.6556320190429688, -0.628631591796875, -0.6016311645507812, -0.5746307373046875, -0.5476303100585938, -0.5206298828125, -0.49362945556640625, -0.4666290283203125, -0.43962860107421875, -0.412628173828125, -0.38562774658203125, -0.3586273193359375, -0.33162689208984375, -0.30462646484375, -0.27762603759765625, -0.2506256103515625, -0.22362518310546875, -0.196624755859375, -0.16962432861328125, -0.1426239013671875, -0.11562347412109375, -0.088623046875, -0.06162261962890625, -0.0346221923828125, -0.00762176513671875, 0.019378662109375, 0.04637908935546875, 0.0733795166015625, 0.10037994384765625, 0.12738037109375, 0.15438079833984375, 0.1813812255859375, 0.20838165283203125, 0.235382080078125, 0.26238250732421875, 0.2893829345703125, 0.31638336181640625, 0.3433837890625, 0.37038421630859375, 0.3973846435546875, 0.42438507080078125, 0.451385498046875, 0.47838592529296875, 0.5053863525390625, 0.5323867797851562, 0.55938720703125, 0.5863876342773438, 0.6133880615234375, 0.6403884887695312, 0.667388916015625, 0.6943893432617188, 0.7213897705078125, 0.7483901977539062, 0.775390625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 8.0, 25.0, 28.0, 45.0, 94.0, 129.0, 173.0, 153.0, 145.0, 81.0, 63.0, 28.0, 15.0, 4.0, 8.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7443273067474365, -2.642873525619507, -2.541419744491577, -2.4399657249450684, -2.3385119438171387, -2.237058162689209, -2.1356043815612793, -2.0341506004333496, -1.9326967000961304, -1.8312429189682007, -1.7297890186309814, -1.6283352375030518, -1.526881456375122, -1.4254275560379028, -1.3239737749099731, -1.222519874572754, -1.1210660934448242, -1.0196123123168945, -0.9181584119796753, -0.8167046308517456, -0.7152507901191711, -0.6137969493865967, -0.512343168258667, -0.41088932752609253, -0.30943548679351807, -0.2079816609621048, -0.10652783513069153, -0.005074024200439453, 0.09637981653213501, 0.19783365726470947, 0.29928743839263916, 0.4007412791252136, 0.5021953582763672, 0.6036491990089417, 0.7051030397415161, 0.8065568208694458, 0.9080106616020203, 1.0094645023345947, 1.1109182834625244, 1.212372064590454, 1.3138259649276733, 1.415279746055603, 1.5167336463928223, 1.618187427520752, 1.7196412086486816, 1.8210951089859009, 1.9225488901138306, 2.02400279045105, 2.1254565715789795, 2.226910352706909, 2.328364133834839, 2.4298181533813477, 2.5312719345092773, 2.632725715637207, 2.7341794967651367, 2.8356332778930664, 2.937087059020996, 3.038540840148926, 3.1399946212768555, 3.241448402404785, 3.342902421951294, 3.4443562030792236, 3.5458099842071533, 3.647263765335083, 3.748717784881592]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 3.0, 4.0, 5.0, 8.0, 5.0, 13.0, 10.0, 12.0, 19.0, 17.0, 16.0, 27.0, 28.0, 17.0, 41.0, 35.0, 43.0, 39.0, 57.0, 46.0, 59.0, 57.0, 43.0, 42.0, 47.0, 37.0, 38.0, 37.0, 28.0, 30.0, 30.0, 17.0, 13.0, 17.0, 12.0, 11.0, 5.0, 6.0, 3.0, 8.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1311805248260498, -1.0932921171188354, -1.055403709411621, -1.0175151824951172, -0.9796267747879028, -0.9417383670806885, -0.9038499593734741, -0.865961492061615, -0.8280730247497559, -0.7901846170425415, -0.7522961497306824, -0.714407742023468, -0.6765192747116089, -0.6386308670043945, -0.6007424592971802, -0.562853991985321, -0.5249655842781067, -0.48707714676856995, -0.4491887092590332, -0.41130030155181885, -0.3734118342399597, -0.33552342653274536, -0.2976349890232086, -0.2597465515136719, -0.22185811400413513, -0.1839696764945984, -0.14608123898506165, -0.1081928163766861, -0.07030437886714935, -0.03241594135761261, 0.0054724812507629395, 0.04336091876029968, 0.08124935626983643, 0.11913779377937317, 0.1570262312889099, 0.19491465389728546, 0.2328030914068222, 0.27069151401519775, 0.3085799515247345, 0.34646838903427124, 0.384356826543808, 0.4222452640533447, 0.46013370156288147, 0.4980221390724182, 0.5359105467796326, 0.5737990140914917, 0.611687421798706, 0.6495758295059204, 0.6874642968177795, 0.7253527045249939, 0.763241171836853, 0.8011295795440674, 0.8390180468559265, 0.8769064545631409, 0.914794921875, 0.9526833295822144, 0.9905717372894287, 1.028460144996643, 1.0663485527038574, 1.1042370796203613, 1.1421254873275757, 1.18001389503479, 1.2179023027420044, 1.2557907104492188, 1.2936792373657227]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 2.0, 8.0, 2.0, 13.0, 9.0, 19.0, 33.0, 58.0, 55.0, 122.0, 204.0, 324.0, 654.0, 1328.0, 2836.0, 6337.0, 14975.0, 36284.0, 89451.0, 196438.0, 293281.0, 223604.0, 106461.0, 44176.0, 17950.0, 7487.0, 3266.0, 1443.0, 748.0, 392.0, 223.0, 132.0, 89.0, 55.0, 36.0, 20.0, 14.0, 11.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.9697265625, -1.918701171875, -1.86767578125, -1.816650390625, -1.765625, -1.714599609375, -1.66357421875, -1.612548828125, -1.5615234375, -1.510498046875, -1.45947265625, -1.408447265625, -1.357421875, -1.306396484375, -1.25537109375, -1.204345703125, -1.1533203125, -1.102294921875, -1.05126953125, -1.000244140625, -0.94921875, -0.898193359375, -0.84716796875, -0.796142578125, -0.7451171875, -0.694091796875, -0.64306640625, -0.592041015625, -0.541015625, -0.489990234375, -0.43896484375, -0.387939453125, -0.3369140625, -0.285888671875, -0.23486328125, -0.183837890625, -0.1328125, -0.081787109375, -0.03076171875, 0.020263671875, 0.0712890625, 0.122314453125, 0.17333984375, 0.224365234375, 0.275390625, 0.326416015625, 0.37744140625, 0.428466796875, 0.4794921875, 0.530517578125, 0.58154296875, 0.632568359375, 0.68359375, 0.734619140625, 0.78564453125, 0.836669921875, 0.8876953125, 0.938720703125, 0.98974609375, 1.040771484375, 1.091796875, 1.142822265625, 1.19384765625, 1.244873046875, 1.2958984375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 8.0, 8.0, 9.0, 17.0, 18.0, 16.0, 15.0, 34.0, 24.0, 28.0, 38.0, 43.0, 55.0, 53.0, 50.0, 60.0, 45.0, 45.0, 47.0, 52.0, 48.0, 43.0, 39.0, 33.0, 34.0, 24.0, 18.0, 17.0, 18.0, 14.0, 12.0, 8.0, 5.0, 7.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.72021484375, -0.7009048461914062, -0.6815948486328125, -0.6622848510742188, -0.642974853515625, -0.6236648559570312, -0.6043548583984375, -0.5850448608398438, -0.56573486328125, -0.5464248657226562, -0.5271148681640625, -0.5078048706054688, -0.488494873046875, -0.46918487548828125, -0.4498748779296875, -0.43056488037109375, -0.4112548828125, -0.39194488525390625, -0.3726348876953125, -0.35332489013671875, -0.334014892578125, -0.31470489501953125, -0.2953948974609375, -0.27608489990234375, -0.25677490234375, -0.23746490478515625, -0.2181549072265625, -0.19884490966796875, -0.179534912109375, -0.16022491455078125, -0.1409149169921875, -0.12160491943359375, -0.102294921875, -0.08298492431640625, -0.0636749267578125, -0.04436492919921875, -0.025054931640625, -0.00574493408203125, 0.0135650634765625, 0.03287506103515625, 0.05218505859375, 0.07149505615234375, 0.0908050537109375, 0.11011505126953125, 0.129425048828125, 0.14873504638671875, 0.1680450439453125, 0.18735504150390625, 0.2066650390625, 0.22597503662109375, 0.2452850341796875, 0.26459503173828125, 0.283905029296875, 0.30321502685546875, 0.3225250244140625, 0.34183502197265625, 0.36114501953125, 0.38045501708984375, 0.3997650146484375, 0.41907501220703125, 0.438385009765625, 0.45769500732421875, 0.4770050048828125, 0.49631500244140625, 0.515625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 8.0, 17.0, 16.0, 43.0, 45.0, 110.0, 222.0, 447.0, 1038.0, 2920.0, 12028.0, 87388.0, 622433.0, 282201.0, 31018.0, 5652.0, 1669.0, 657.0, 296.0, 140.0, 85.0, 47.0, 32.0, 24.0, 9.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.646484375, -2.539581298828125, -2.43267822265625, -2.325775146484375, -2.2188720703125, -2.111968994140625, -2.00506591796875, -1.898162841796875, -1.791259765625, -1.684356689453125, -1.57745361328125, -1.470550537109375, -1.3636474609375, -1.256744384765625, -1.14984130859375, -1.042938232421875, -0.93603515625, -0.829132080078125, -0.72222900390625, -0.615325927734375, -0.5084228515625, -0.401519775390625, -0.29461669921875, -0.187713623046875, -0.080810546875, 0.026092529296875, 0.13299560546875, 0.239898681640625, 0.3468017578125, 0.453704833984375, 0.56060791015625, 0.667510986328125, 0.7744140625, 0.881317138671875, 0.98822021484375, 1.095123291015625, 1.2020263671875, 1.308929443359375, 1.41583251953125, 1.522735595703125, 1.629638671875, 1.736541748046875, 1.84344482421875, 1.950347900390625, 2.0572509765625, 2.164154052734375, 2.27105712890625, 2.377960205078125, 2.48486328125, 2.591766357421875, 2.69866943359375, 2.805572509765625, 2.9124755859375, 3.019378662109375, 3.12628173828125, 3.233184814453125, 3.340087890625, 3.446990966796875, 3.55389404296875, 3.660797119140625, 3.7677001953125, 3.874603271484375, 3.98150634765625, 4.088409423828125, 4.1953125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 6.0, 1.0, 2.0, 0.0, 4.0, 2.0, 5.0, 3.0, 11.0, 5.0, 9.0, 11.0, 11.0, 15.0, 14.0, 11.0, 24.0, 20.0, 16.0, 22.0, 26.0, 25.0, 33.0, 27.0, 36.0, 30.0, 23.0, 37.0, 37.0, 33.0, 33.0, 41.0, 41.0, 31.0, 32.0, 35.0, 32.0, 36.0, 30.0, 23.0, 23.0, 30.0, 27.0, 18.0, 7.0, 13.0, 10.0, 16.0, 9.0, 7.0, 2.0, 5.0, 5.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0], "bins": [-2.22265625, -2.1578369140625, -2.093017578125, -2.0281982421875, -1.96337890625, -1.8985595703125, -1.833740234375, -1.7689208984375, -1.7041015625, -1.6392822265625, -1.574462890625, -1.5096435546875, -1.44482421875, -1.3800048828125, -1.315185546875, -1.2503662109375, -1.185546875, -1.1207275390625, -1.055908203125, -0.9910888671875, -0.92626953125, -0.8614501953125, -0.796630859375, -0.7318115234375, -0.6669921875, -0.6021728515625, -0.537353515625, -0.4725341796875, -0.40771484375, -0.3428955078125, -0.278076171875, -0.2132568359375, -0.1484375, -0.0836181640625, -0.018798828125, 0.0460205078125, 0.11083984375, 0.1756591796875, 0.240478515625, 0.3052978515625, 0.3701171875, 0.4349365234375, 0.499755859375, 0.5645751953125, 0.62939453125, 0.6942138671875, 0.759033203125, 0.8238525390625, 0.888671875, 0.9534912109375, 1.018310546875, 1.0831298828125, 1.14794921875, 1.2127685546875, 1.277587890625, 1.3424072265625, 1.4072265625, 1.4720458984375, 1.536865234375, 1.6016845703125, 1.66650390625, 1.7313232421875, 1.796142578125, 1.8609619140625, 1.92578125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 6.0, 6.0, 13.0, 28.0, 40.0, 66.0, 110.0, 301.0, 708.0, 2649.0, 19660.0, 433037.0, 563109.0, 24426.0, 3024.0, 781.0, 300.0, 132.0, 71.0, 32.0, 26.0, 14.0, 6.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.03515625, -2.9629669189453125, -2.890777587890625, -2.8185882568359375, -2.74639892578125, -2.6742095947265625, -2.602020263671875, -2.5298309326171875, -2.4576416015625, -2.3854522705078125, -2.313262939453125, -2.2410736083984375, -2.16888427734375, -2.0966949462890625, -2.024505615234375, -1.9523162841796875, -1.880126953125, -1.8079376220703125, -1.735748291015625, -1.6635589599609375, -1.59136962890625, -1.5191802978515625, -1.446990966796875, -1.3748016357421875, -1.3026123046875, -1.2304229736328125, -1.158233642578125, -1.0860443115234375, -1.01385498046875, -0.9416656494140625, -0.869476318359375, -0.7972869873046875, -0.72509765625, -0.6529083251953125, -0.580718994140625, -0.5085296630859375, -0.43634033203125, -0.3641510009765625, -0.291961669921875, -0.2197723388671875, -0.1475830078125, -0.0753936767578125, -0.003204345703125, 0.0689849853515625, 0.14117431640625, 0.2133636474609375, 0.285552978515625, 0.3577423095703125, 0.429931640625, 0.5021209716796875, 0.574310302734375, 0.6464996337890625, 0.71868896484375, 0.7908782958984375, 0.863067626953125, 0.9352569580078125, 1.0074462890625, 1.0796356201171875, 1.151824951171875, 1.2240142822265625, 1.29620361328125, 1.3683929443359375, 1.440582275390625, 1.5127716064453125, 1.5849609375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 2.0, 2.0, 3.0, 6.0, 7.0, 13.0, 23.0, 25.0, 41.0, 49.0, 67.0, 93.0, 125.0, 116.0, 111.0, 108.0, 68.0, 46.0, 27.0, 20.0, 24.0, 7.0, 9.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00021719932556152344, -0.0002092607319355011, -0.00020132213830947876, -0.00019338354468345642, -0.00018544495105743408, -0.00017750635743141174, -0.0001695677638053894, -0.00016162917017936707, -0.00015369057655334473, -0.0001457519829273224, -0.00013781338930130005, -0.0001298747956752777, -0.00012193620204925537, -0.00011399760842323303, -0.0001060590147972107, -9.812042117118835e-05, -9.018182754516602e-05, -8.224323391914368e-05, -7.430464029312134e-05, -6.6366046667099e-05, -5.842745304107666e-05, -5.048885941505432e-05, -4.255026578903198e-05, -3.4611672163009644e-05, -2.6673078536987305e-05, -1.8734484910964966e-05, -1.0795891284942627e-05, -2.857297658920288e-06, 5.081295967102051e-06, 1.301988959312439e-05, 2.095848321914673e-05, 2.8897076845169067e-05, 3.6835670471191406e-05, 4.4774264097213745e-05, 5.2712857723236084e-05, 6.065145134925842e-05, 6.859004497528076e-05, 7.65286386013031e-05, 8.446723222732544e-05, 9.240582585334778e-05, 0.00010034441947937012, 0.00010828301310539246, 0.0001162216067314148, 0.00012416020035743713, 0.00013209879398345947, 0.0001400373876094818, 0.00014797598123550415, 0.0001559145748615265, 0.00016385316848754883, 0.00017179176211357117, 0.0001797303557395935, 0.00018766894936561584, 0.00019560754299163818, 0.00020354613661766052, 0.00021148473024368286, 0.0002194233238697052, 0.00022736191749572754, 0.00023530051112174988, 0.00024323910474777222, 0.00025117769837379456, 0.0002591162919998169, 0.00026705488562583923, 0.00027499347925186157, 0.0002829320728778839, 0.00029087066650390625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 4.0, 13.0, 7.0, 7.0, 12.0, 26.0, 41.0, 78.0, 132.0, 311.0, 665.0, 1994.0, 8965.0, 100852.0, 802014.0, 119700.0, 10106.0, 2189.0, 782.0, 299.0, 135.0, 78.0, 49.0, 37.0, 14.0, 13.0, 8.0, 6.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.1953125, -2.1298370361328125, -2.064361572265625, -1.9988861083984375, -1.93341064453125, -1.8679351806640625, -1.802459716796875, -1.7369842529296875, -1.6715087890625, -1.6060333251953125, -1.540557861328125, -1.4750823974609375, -1.40960693359375, -1.3441314697265625, -1.278656005859375, -1.2131805419921875, -1.147705078125, -1.0822296142578125, -1.016754150390625, -0.9512786865234375, -0.88580322265625, -0.8203277587890625, -0.754852294921875, -0.6893768310546875, -0.6239013671875, -0.5584259033203125, -0.492950439453125, -0.4274749755859375, -0.36199951171875, -0.2965240478515625, -0.231048583984375, -0.1655731201171875, -0.10009765625, -0.0346221923828125, 0.030853271484375, 0.0963287353515625, 0.16180419921875, 0.2272796630859375, 0.292755126953125, 0.3582305908203125, 0.4237060546875, 0.4891815185546875, 0.554656982421875, 0.6201324462890625, 0.68560791015625, 0.7510833740234375, 0.816558837890625, 0.8820343017578125, 0.947509765625, 1.0129852294921875, 1.078460693359375, 1.1439361572265625, 1.20941162109375, 1.2748870849609375, 1.340362548828125, 1.4058380126953125, 1.4713134765625, 1.5367889404296875, 1.602264404296875, 1.6677398681640625, 1.73321533203125, 1.7986907958984375, 1.864166259765625, 1.9296417236328125, 1.9951171875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 3.0, 8.0, 10.0, 18.0, 28.0, 47.0, 61.0, 106.0, 119.0, 141.0, 151.0, 89.0, 76.0, 57.0, 37.0, 13.0, 13.0, 16.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.029296875, -2.9669570922851562, -2.9046173095703125, -2.8422775268554688, -2.779937744140625, -2.7175979614257812, -2.6552581787109375, -2.5929183959960938, -2.53057861328125, -2.4682388305664062, -2.4058990478515625, -2.3435592651367188, -2.281219482421875, -2.2188796997070312, -2.1565399169921875, -2.0942001342773438, -2.0318603515625, -1.9695205688476562, -1.9071807861328125, -1.8448410034179688, -1.782501220703125, -1.7201614379882812, -1.6578216552734375, -1.5954818725585938, -1.53314208984375, -1.4708023071289062, -1.4084625244140625, -1.3461227416992188, -1.283782958984375, -1.2214431762695312, -1.1591033935546875, -1.0967636108398438, -1.034423828125, -0.9720840454101562, -0.9097442626953125, -0.8474044799804688, -0.785064697265625, -0.7227249145507812, -0.6603851318359375, -0.5980453491210938, -0.53570556640625, -0.47336578369140625, -0.4110260009765625, -0.34868621826171875, -0.286346435546875, -0.22400665283203125, -0.1616668701171875, -0.09932708740234375, -0.0369873046875, 0.02535247802734375, 0.0876922607421875, 0.15003204345703125, 0.212371826171875, 0.27471160888671875, 0.3370513916015625, 0.39939117431640625, 0.46173095703125, 0.5240707397460938, 0.5864105224609375, 0.6487503051757812, 0.711090087890625, 0.7734298706054688, 0.8357696533203125, 0.8981094360351562, 0.96044921875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 15.0, 34.0, 87.0, 140.0, 190.0, 218.0, 144.0, 91.0, 43.0, 18.0, 7.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.71631622314453, -28.68522834777832, -27.65414047241211, -26.6230525970459, -25.591964721679688, -24.56087875366211, -23.5297908782959, -22.498703002929688, -21.467615127563477, -20.436527252197266, -19.405439376831055, -18.374351501464844, -17.343265533447266, -16.312175750732422, -15.281089782714844, -14.250001907348633, -13.218914031982422, -12.187826156616211, -11.15673828125, -10.125651359558105, -9.094563484191895, -8.063475608825684, -7.032388210296631, -6.001300811767578, -4.970212936401367, -3.9391252994537354, -2.9080376625061035, -1.8769500255584717, -0.8458623886108398, 0.1852254867553711, 1.2163128852844238, 2.2474002838134766, 3.2784881591796875, 4.309576034545898, 5.340663433074951, 6.371750831604004, 7.402838706970215, 8.433926582336426, 9.46501350402832, 10.496101379394531, 11.527189254760742, 12.558277130126953, 13.589365005493164, 14.620451927185059, 15.65153980255127, 16.682628631591797, 17.713714599609375, 18.744802474975586, 19.775890350341797, 20.806978225708008, 21.83806610107422, 22.86915397644043, 23.90024185180664, 24.93132781982422, 25.96241569519043, 26.99350357055664, 28.02459144592285, 29.055679321289062, 30.086767196655273, 31.117855072021484, 32.14894104003906, 33.180030822753906, 34.211116790771484, 35.24220275878906, 36.273292541503906]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 8.0, 8.0, 10.0, 15.0, 16.0, 18.0, 32.0, 22.0, 27.0, 23.0, 39.0, 34.0, 35.0, 37.0, 30.0, 44.0, 40.0, 59.0, 47.0, 53.0, 38.0, 50.0, 39.0, 33.0, 30.0, 41.0, 26.0, 23.0, 22.0, 10.0, 17.0, 7.0, 11.0, 16.0, 8.0, 3.0, 4.0, 7.0, 0.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.212970733642578, -11.826147079467773, -11.439323425292969, -11.052499771118164, -10.665675163269043, -10.278851509094238, -9.892027854919434, -9.505204200744629, -9.118379592895508, -8.731555938720703, -8.344732284545898, -7.9579081535339355, -7.571084022521973, -7.184260368347168, -6.797436714172363, -6.410613059997559, -6.023789405822754, -5.636965751647949, -5.250141620635986, -4.863317966461182, -4.476493835449219, -4.089670181274414, -3.7028465270996094, -3.3160226345062256, -2.929198741912842, -2.542374849319458, -2.155550956726074, -1.7687273025512695, -1.3819034099578857, -0.995079517364502, -0.6082558631896973, -0.22143197059631348, 0.1653909683227539, 0.5522148013114929, 0.9390386343002319, 1.3258624076843262, 1.71268630027771, 2.0995101928710938, 2.4863338470458984, 2.8731577396392822, 3.259981632232666, 3.64680552482605, 4.033629417419434, 4.420453071594238, 4.807276725769043, 5.194100856781006, 5.5809245109558105, 5.967748641967773, 6.354572296142578, 6.741395950317383, 7.128220081329346, 7.51504373550415, 7.901867866516113, 8.288691520690918, 8.675515174865723, 9.062338829040527, 9.449163436889648, 9.835987091064453, 10.222810745239258, 10.609634399414062, 10.996459007263184, 11.383282661437988, 11.770106315612793, 12.156929969787598, 12.543753623962402]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 4.0, 5.0, 8.0, 11.0, 14.0, 24.0, 21.0, 40.0, 45.0, 79.0, 99.0, 184.0, 266.0, 470.0, 748.0, 1323.0, 2562.0, 5082.0, 11871.0, 38376.0, 4010575.0, 88000.0, 19337.0, 7319.0, 3486.0, 1828.0, 963.0, 550.0, 363.0, 203.0, 126.0, 91.0, 55.0, 54.0, 23.0, 15.0, 13.0, 12.0, 12.0, 4.0, 9.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.466796875, -2.383819580078125, -2.30084228515625, -2.217864990234375, -2.1348876953125, -2.051910400390625, -1.96893310546875, -1.885955810546875, -1.802978515625, -1.720001220703125, -1.63702392578125, -1.554046630859375, -1.4710693359375, -1.388092041015625, -1.30511474609375, -1.222137451171875, -1.13916015625, -1.056182861328125, -0.97320556640625, -0.890228271484375, -0.8072509765625, -0.724273681640625, -0.64129638671875, -0.558319091796875, -0.475341796875, -0.392364501953125, -0.30938720703125, -0.226409912109375, -0.1434326171875, -0.060455322265625, 0.02252197265625, 0.105499267578125, 0.1884765625, 0.271453857421875, 0.35443115234375, 0.437408447265625, 0.5203857421875, 0.603363037109375, 0.68634033203125, 0.769317626953125, 0.852294921875, 0.935272216796875, 1.01824951171875, 1.101226806640625, 1.1842041015625, 1.267181396484375, 1.35015869140625, 1.433135986328125, 1.51611328125, 1.599090576171875, 1.68206787109375, 1.765045166015625, 1.8480224609375, 1.930999755859375, 2.01397705078125, 2.096954345703125, 2.179931640625, 2.262908935546875, 2.34588623046875, 2.428863525390625, 2.5118408203125, 2.594818115234375, 2.67779541015625, 2.760772705078125, 2.84375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 6.0, 6.0, 9.0, 18.0, 15.0, 13.0, 19.0, 23.0, 25.0, 35.0, 41.0, 52.0, 59.0, 55.0, 46.0, 53.0, 59.0, 69.0, 51.0, 58.0, 42.0, 45.0, 42.0, 32.0, 26.0, 24.0, 23.0, 12.0, 15.0, 8.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.8935546875, -0.8707275390625, -0.847900390625, -0.8250732421875, -0.80224609375, -0.7794189453125, -0.756591796875, -0.7337646484375, -0.7109375, -0.6881103515625, -0.665283203125, -0.6424560546875, -0.61962890625, -0.5968017578125, -0.573974609375, -0.5511474609375, -0.5283203125, -0.5054931640625, -0.482666015625, -0.4598388671875, -0.43701171875, -0.4141845703125, -0.391357421875, -0.3685302734375, -0.345703125, -0.3228759765625, -0.300048828125, -0.2772216796875, -0.25439453125, -0.2315673828125, -0.208740234375, -0.1859130859375, -0.1630859375, -0.1402587890625, -0.117431640625, -0.0946044921875, -0.07177734375, -0.0489501953125, -0.026123046875, -0.0032958984375, 0.01953125, 0.0423583984375, 0.065185546875, 0.0880126953125, 0.11083984375, 0.1336669921875, 0.156494140625, 0.1793212890625, 0.2021484375, 0.2249755859375, 0.247802734375, 0.2706298828125, 0.29345703125, 0.3162841796875, 0.339111328125, 0.3619384765625, 0.384765625, 0.4075927734375, 0.430419921875, 0.4532470703125, 0.47607421875, 0.4989013671875, 0.521728515625, 0.5445556640625, 0.5673828125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 2.0, 6.0, 5.0, 6.0, 3.0, 3.0, 16.0, 24.0, 24.0, 25.0, 47.0, 37.0, 62.0, 89.0, 154.0, 255.0, 407.0, 828.0, 1852.0, 4677.0, 15771.0, 80506.0, 4007072.0, 61840.0, 12861.0, 4151.0, 1646.0, 788.0, 415.0, 227.0, 139.0, 74.0, 65.0, 56.0, 30.0, 23.0, 17.0, 13.0, 16.0, 7.0, 14.0, 10.0, 6.0, 2.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.38671875, -2.305633544921875, -2.22454833984375, -2.143463134765625, -2.0623779296875, -1.981292724609375, -1.90020751953125, -1.819122314453125, -1.738037109375, -1.656951904296875, -1.57586669921875, -1.494781494140625, -1.4136962890625, -1.332611083984375, -1.25152587890625, -1.170440673828125, -1.08935546875, -1.008270263671875, -0.92718505859375, -0.846099853515625, -0.7650146484375, -0.683929443359375, -0.60284423828125, -0.521759033203125, -0.440673828125, -0.359588623046875, -0.27850341796875, -0.197418212890625, -0.1163330078125, -0.035247802734375, 0.04583740234375, 0.126922607421875, 0.2080078125, 0.289093017578125, 0.37017822265625, 0.451263427734375, 0.5323486328125, 0.613433837890625, 0.69451904296875, 0.775604248046875, 0.856689453125, 0.937774658203125, 1.01885986328125, 1.099945068359375, 1.1810302734375, 1.262115478515625, 1.34320068359375, 1.424285888671875, 1.50537109375, 1.586456298828125, 1.66754150390625, 1.748626708984375, 1.8297119140625, 1.910797119140625, 1.99188232421875, 2.072967529296875, 2.154052734375, 2.235137939453125, 2.31622314453125, 2.397308349609375, 2.4783935546875, 2.559478759765625, 2.64056396484375, 2.721649169921875, 2.802734375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 9.0, 17.0, 21.0, 38.0, 73.0, 3436.0, 307.0, 72.0, 39.0, 21.0, 14.0, 9.0, 10.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80615234375, -0.7823944091796875, -0.758636474609375, -0.7348785400390625, -0.71112060546875, -0.6873626708984375, -0.663604736328125, -0.6398468017578125, -0.6160888671875, -0.5923309326171875, -0.568572998046875, -0.5448150634765625, -0.52105712890625, -0.4972991943359375, -0.473541259765625, -0.4497833251953125, -0.426025390625, -0.4022674560546875, -0.378509521484375, -0.3547515869140625, -0.33099365234375, -0.3072357177734375, -0.283477783203125, -0.2597198486328125, -0.2359619140625, -0.2122039794921875, -0.188446044921875, -0.1646881103515625, -0.14093017578125, -0.1171722412109375, -0.093414306640625, -0.0696563720703125, -0.0458984375, -0.0221405029296875, 0.001617431640625, 0.0253753662109375, 0.04913330078125, 0.0728912353515625, 0.096649169921875, 0.1204071044921875, 0.1441650390625, 0.1679229736328125, 0.191680908203125, 0.2154388427734375, 0.23919677734375, 0.2629547119140625, 0.286712646484375, 0.3104705810546875, 0.334228515625, 0.3579864501953125, 0.381744384765625, 0.4055023193359375, 0.42926025390625, 0.4530181884765625, 0.476776123046875, 0.5005340576171875, 0.5242919921875, 0.5480499267578125, 0.571807861328125, 0.5955657958984375, 0.61932373046875, 0.6430816650390625, 0.666839599609375, 0.6905975341796875, 0.71435546875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 22.0, 37.0, 83.0, 154.0, 207.0, 173.0, 143.0, 94.0, 32.0, 16.0, 14.0, 6.0, 7.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5912890434265137, -3.4899652004241943, -3.388641119003296, -3.2873172760009766, -3.1859934329986572, -3.084669589996338, -2.9833455085754395, -2.88202166557312, -2.780697822570801, -2.6793739795684814, -2.578049898147583, -2.4767260551452637, -2.3754022121429443, -2.274078369140625, -2.1727542877197266, -2.0714304447174072, -1.9701064825057983, -1.8687825202941895, -1.7674586772918701, -1.6661347150802612, -1.564810872077942, -1.463486909866333, -1.3621630668640137, -1.2608391046524048, -1.159515142440796, -1.058191180229187, -0.9568673372268677, -0.8555433750152588, -0.7542195320129395, -0.6528955698013306, -0.5515716671943665, -0.45024776458740234, -0.348923921585083, -0.2476000189781189, -0.1462761014699936, -0.044952183961868286, 0.056371718645095825, 0.15769565105438232, 0.25901955366134644, 0.36034345626831055, 0.46166735887527466, 0.5629912614822388, 0.6643151640892029, 0.765639066696167, 0.8669630289077759, 0.96828693151474, 1.069610834121704, 1.1709346771240234, 1.2722586393356323, 1.3735826015472412, 1.4749064445495605, 1.5762304067611694, 1.6775542497634888, 1.7788782119750977, 1.880202054977417, 1.9815260171890259, 2.0828499794006348, 2.184173822402954, 2.2854979038238525, 2.386821746826172, 2.488145589828491, 2.5894694328308105, 2.690793514251709, 2.7921173572540283, 2.8934412002563477]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 4.0, 13.0, 6.0, 28.0, 22.0, 28.0, 35.0, 40.0, 51.0, 49.0, 66.0, 84.0, 62.0, 70.0, 72.0, 54.0, 56.0, 54.0, 36.0, 43.0, 33.0, 24.0, 17.0, 15.0, 16.0, 12.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8931628465652466, -1.8450496196746826, -1.7969363927841187, -1.7488231658935547, -1.7007099390029907, -1.6525967121124268, -1.6044834852218628, -1.5563702583312988, -1.5082570314407349, -1.460143804550171, -1.412030577659607, -1.363917350769043, -1.315804123878479, -1.267690896987915, -1.219577670097351, -1.171464443206787, -1.1233513355255127, -1.0752381086349487, -1.0271248817443848, -0.9790116548538208, -0.9308984279632568, -0.8827852010726929, -0.8346719741821289, -0.7865587472915649, -0.738445520401001, -0.690332293510437, -0.642219066619873, -0.5941058397293091, -0.5459926128387451, -0.49787938594818115, -0.4497661888599396, -0.4016529619693756, -0.35353970527648926, -0.3054264783859253, -0.25731325149536133, -0.20920003950595856, -0.1610868126153946, -0.11297358572483063, -0.06486037373542786, -0.01674714684486389, 0.03136608004570007, 0.07947930693626404, 0.127592533826828, 0.17570574581623077, 0.22381897270679474, 0.2719321846961975, 0.3200454115867615, 0.36815863847732544, 0.4162718653678894, 0.46438509225845337, 0.5124983191490173, 0.5606115460395813, 0.6087247729301453, 0.6568379998207092, 0.7049511671066284, 0.7530643939971924, 0.8011776208877563, 0.8492908477783203, 0.8974040746688843, 0.9455173015594482, 0.9936305284500122, 1.0417437553405762, 1.0898569822311401, 1.137970209121704, 1.186083436012268]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 5.0, 12.0, 12.0, 13.0, 31.0, 41.0, 50.0, 91.0, 134.0, 208.0, 349.0, 666.0, 1111.0, 2119.0, 4069.0, 8125.0, 16840.0, 35536.0, 75053.0, 149863.0, 241385.0, 236329.0, 141347.0, 69723.0, 33442.0, 15836.0, 7681.0, 3955.0, 1969.0, 1051.0, 589.0, 329.0, 196.0, 119.0, 89.0, 57.0, 42.0, 29.0, 16.0, 14.0, 7.0, 7.0, 4.0, 2.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.142578125, -1.103118896484375, -1.06365966796875, -1.024200439453125, -0.9847412109375, -0.945281982421875, -0.90582275390625, -0.866363525390625, -0.826904296875, -0.787445068359375, -0.74798583984375, -0.708526611328125, -0.6690673828125, -0.629608154296875, -0.59014892578125, -0.550689697265625, -0.51123046875, -0.471771240234375, -0.43231201171875, -0.392852783203125, -0.3533935546875, -0.313934326171875, -0.27447509765625, -0.235015869140625, -0.195556640625, -0.156097412109375, -0.11663818359375, -0.077178955078125, -0.0377197265625, 0.001739501953125, 0.04119873046875, 0.080657958984375, 0.1201171875, 0.159576416015625, 0.19903564453125, 0.238494873046875, 0.2779541015625, 0.317413330078125, 0.35687255859375, 0.396331787109375, 0.435791015625, 0.475250244140625, 0.51470947265625, 0.554168701171875, 0.5936279296875, 0.633087158203125, 0.67254638671875, 0.712005615234375, 0.75146484375, 0.790924072265625, 0.83038330078125, 0.869842529296875, 0.9093017578125, 0.948760986328125, 0.98822021484375, 1.027679443359375, 1.067138671875, 1.106597900390625, 1.14605712890625, 1.185516357421875, 1.2249755859375, 1.264434814453125, 1.30389404296875, 1.343353271484375, 1.3828125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 9.0, 4.0, 5.0, 9.0, 11.0, 15.0, 15.0, 14.0, 24.0, 35.0, 31.0, 34.0, 53.0, 56.0, 43.0, 55.0, 49.0, 53.0, 59.0, 57.0, 51.0, 38.0, 50.0, 43.0, 40.0, 41.0, 23.0, 21.0, 12.0, 16.0, 13.0, 10.0, 2.0, 3.0, 6.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90869140625, -0.8851470947265625, -0.861602783203125, -0.8380584716796875, -0.81451416015625, -0.7909698486328125, -0.767425537109375, -0.7438812255859375, -0.7203369140625, -0.6967926025390625, -0.673248291015625, -0.6497039794921875, -0.62615966796875, -0.6026153564453125, -0.579071044921875, -0.5555267333984375, -0.531982421875, -0.5084381103515625, -0.484893798828125, -0.4613494873046875, -0.43780517578125, -0.4142608642578125, -0.390716552734375, -0.3671722412109375, -0.3436279296875, -0.3200836181640625, -0.296539306640625, -0.2729949951171875, -0.24945068359375, -0.2259063720703125, -0.202362060546875, -0.1788177490234375, -0.1552734375, -0.1317291259765625, -0.108184814453125, -0.0846405029296875, -0.06109619140625, -0.0375518798828125, -0.014007568359375, 0.0095367431640625, 0.0330810546875, 0.0566253662109375, 0.080169677734375, 0.1037139892578125, 0.12725830078125, 0.1508026123046875, 0.174346923828125, 0.1978912353515625, 0.221435546875, 0.2449798583984375, 0.268524169921875, 0.2920684814453125, 0.31561279296875, 0.3391571044921875, 0.362701416015625, 0.3862457275390625, 0.4097900390625, 0.4333343505859375, 0.456878662109375, 0.4804229736328125, 0.50396728515625, 0.5275115966796875, 0.551055908203125, 0.5746002197265625, 0.59814453125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 5.0, 4.0, 7.0, 14.0, 18.0, 26.0, 31.0, 49.0, 70.0, 89.0, 129.0, 170.0, 278.0, 398.0, 688.0, 1099.0, 2245.0, 5502.0, 18040.0, 71089.0, 307893.0, 472317.0, 123746.0, 29335.0, 8415.0, 3117.0, 1472.0, 794.0, 472.0, 332.0, 202.0, 129.0, 112.0, 86.0, 46.0, 40.0, 36.0, 11.0, 14.0, 12.0, 3.0, 5.0, 3.0, 1.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.775390625, -1.71240234375, -1.6494140625, -1.58642578125, -1.5234375, -1.46044921875, -1.3974609375, -1.33447265625, -1.271484375, -1.20849609375, -1.1455078125, -1.08251953125, -1.01953125, -0.95654296875, -0.8935546875, -0.83056640625, -0.767578125, -0.70458984375, -0.6416015625, -0.57861328125, -0.515625, -0.45263671875, -0.3896484375, -0.32666015625, -0.263671875, -0.20068359375, -0.1376953125, -0.07470703125, -0.01171875, 0.05126953125, 0.1142578125, 0.17724609375, 0.240234375, 0.30322265625, 0.3662109375, 0.42919921875, 0.4921875, 0.55517578125, 0.6181640625, 0.68115234375, 0.744140625, 0.80712890625, 0.8701171875, 0.93310546875, 0.99609375, 1.05908203125, 1.1220703125, 1.18505859375, 1.248046875, 1.31103515625, 1.3740234375, 1.43701171875, 1.5, 1.56298828125, 1.6259765625, 1.68896484375, 1.751953125, 1.81494140625, 1.8779296875, 1.94091796875, 2.00390625, 2.06689453125, 2.1298828125, 2.19287109375, 2.255859375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 7.0, 8.0, 4.0, 10.0, 13.0, 10.0, 13.0, 16.0, 26.0, 20.0, 25.0, 24.0, 27.0, 34.0, 38.0, 35.0, 39.0, 39.0, 38.0, 46.0, 53.0, 39.0, 48.0, 51.0, 50.0, 51.0, 32.0, 27.0, 27.0, 24.0, 22.0, 23.0, 10.0, 15.0, 13.0, 9.0, 6.0, 7.0, 6.0, 6.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.703125, -2.6201171875, -2.537109375, -2.4541015625, -2.37109375, -2.2880859375, -2.205078125, -2.1220703125, -2.0390625, -1.9560546875, -1.873046875, -1.7900390625, -1.70703125, -1.6240234375, -1.541015625, -1.4580078125, -1.375, -1.2919921875, -1.208984375, -1.1259765625, -1.04296875, -0.9599609375, -0.876953125, -0.7939453125, -0.7109375, -0.6279296875, -0.544921875, -0.4619140625, -0.37890625, -0.2958984375, -0.212890625, -0.1298828125, -0.046875, 0.0361328125, 0.119140625, 0.2021484375, 0.28515625, 0.3681640625, 0.451171875, 0.5341796875, 0.6171875, 0.7001953125, 0.783203125, 0.8662109375, 0.94921875, 1.0322265625, 1.115234375, 1.1982421875, 1.28125, 1.3642578125, 1.447265625, 1.5302734375, 1.61328125, 1.6962890625, 1.779296875, 1.8623046875, 1.9453125, 2.0283203125, 2.111328125, 2.1943359375, 2.27734375, 2.3603515625, 2.443359375, 2.5263671875, 2.609375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 8.0, 6.0, 11.0, 9.0, 12.0, 20.0, 34.0, 49.0, 67.0, 94.0, 170.0, 294.0, 629.0, 1763.0, 6585.0, 43354.0, 620711.0, 341967.0, 25436.0, 4663.0, 1422.0, 574.0, 257.0, 151.0, 82.0, 59.0, 30.0, 27.0, 18.0, 13.0, 11.0, 8.0, 6.0, 5.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.87890625, -1.8217620849609375, -1.764617919921875, -1.7074737548828125, -1.65032958984375, -1.5931854248046875, -1.536041259765625, -1.4788970947265625, -1.4217529296875, -1.3646087646484375, -1.307464599609375, -1.2503204345703125, -1.19317626953125, -1.1360321044921875, -1.078887939453125, -1.0217437744140625, -0.964599609375, -0.9074554443359375, -0.850311279296875, -0.7931671142578125, -0.73602294921875, -0.6788787841796875, -0.621734619140625, -0.5645904541015625, -0.5074462890625, -0.4503021240234375, -0.393157958984375, -0.3360137939453125, -0.27886962890625, -0.2217254638671875, -0.164581298828125, -0.1074371337890625, -0.05029296875, 0.0068511962890625, 0.063995361328125, 0.1211395263671875, 0.17828369140625, 0.2354278564453125, 0.292572021484375, 0.3497161865234375, 0.4068603515625, 0.4640045166015625, 0.521148681640625, 0.5782928466796875, 0.63543701171875, 0.6925811767578125, 0.749725341796875, 0.8068695068359375, 0.864013671875, 0.9211578369140625, 0.978302001953125, 1.0354461669921875, 1.09259033203125, 1.1497344970703125, 1.206878662109375, 1.2640228271484375, 1.3211669921875, 1.3783111572265625, 1.435455322265625, 1.4925994873046875, 1.54974365234375, 1.6068878173828125, 1.664031982421875, 1.7211761474609375, 1.7783203125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 6.0, 4.0, 6.0, 6.0, 11.0, 15.0, 13.0, 24.0, 26.0, 31.0, 32.0, 61.0, 55.0, 61.0, 92.0, 89.0, 100.0, 68.0, 57.0, 49.0, 40.0, 26.0, 30.0, 21.0, 28.0, 14.0, 10.0, 5.0, 6.0, 2.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00018846988677978516, -0.00018289871513843536, -0.00017732754349708557, -0.00017175637185573578, -0.00016618520021438599, -0.0001606140285730362, -0.0001550428569316864, -0.0001494716852903366, -0.00014390051364898682, -0.00013832934200763702, -0.00013275817036628723, -0.00012718699872493744, -0.00012161582708358765, -0.00011604465544223785, -0.00011047348380088806, -0.00010490231215953827, -9.933114051818848e-05, -9.375996887683868e-05, -8.818879723548889e-05, -8.26176255941391e-05, -7.70464539527893e-05, -7.147528231143951e-05, -6.590411067008972e-05, -6.033293902873993e-05, -5.476176738739014e-05, -4.9190595746040344e-05, -4.361942410469055e-05, -3.804825246334076e-05, -3.247708082199097e-05, -2.6905909180641174e-05, -2.1334737539291382e-05, -1.576356589794159e-05, -1.0192394256591797e-05, -4.621222615242004e-06, 9.499490261077881e-07, 6.5211206674575806e-06, 1.2092292308807373e-05, 1.7663463950157166e-05, 2.3234635591506958e-05, 2.880580723285675e-05, 3.437697887420654e-05, 3.9948150515556335e-05, 4.551932215690613e-05, 5.109049379825592e-05, 5.666166543960571e-05, 6.22328370809555e-05, 6.78040087223053e-05, 7.337518036365509e-05, 7.894635200500488e-05, 8.451752364635468e-05, 9.008869528770447e-05, 9.565986692905426e-05, 0.00010123103857040405, 0.00010680221021175385, 0.00011237338185310364, 0.00011794455349445343, 0.00012351572513580322, 0.00012908689677715302, 0.0001346580684185028, 0.0001402292400598526, 0.0001458004117012024, 0.00015137158334255219, 0.00015694275498390198, 0.00016251392662525177, 0.00016808509826660156]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 5.0, 8.0, 6.0, 3.0, 14.0, 21.0, 36.0, 63.0, 114.0, 223.0, 463.0, 1307.0, 4500.0, 25316.0, 501983.0, 483393.0, 24400.0, 4375.0, 1321.0, 535.0, 210.0, 104.0, 55.0, 31.0, 21.0, 15.0, 13.0, 2.0, 3.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6904296875, -1.6199798583984375, -1.549530029296875, -1.4790802001953125, -1.40863037109375, -1.3381805419921875, -1.267730712890625, -1.1972808837890625, -1.1268310546875, -1.0563812255859375, -0.985931396484375, -0.9154815673828125, -0.84503173828125, -0.7745819091796875, -0.704132080078125, -0.6336822509765625, -0.563232421875, -0.4927825927734375, -0.422332763671875, -0.3518829345703125, -0.28143310546875, -0.2109832763671875, -0.140533447265625, -0.0700836181640625, 0.0003662109375, 0.0708160400390625, 0.141265869140625, 0.2117156982421875, 0.28216552734375, 0.3526153564453125, 0.423065185546875, 0.4935150146484375, 0.56396484375, 0.6344146728515625, 0.704864501953125, 0.7753143310546875, 0.84576416015625, 0.9162139892578125, 0.986663818359375, 1.0571136474609375, 1.1275634765625, 1.1980133056640625, 1.268463134765625, 1.3389129638671875, 1.40936279296875, 1.4798126220703125, 1.550262451171875, 1.6207122802734375, 1.691162109375, 1.7616119384765625, 1.832061767578125, 1.9025115966796875, 1.97296142578125, 2.0434112548828125, 2.113861083984375, 2.1843109130859375, 2.2547607421875, 2.3252105712890625, 2.395660400390625, 2.4661102294921875, 2.53656005859375, 2.6070098876953125, 2.677459716796875, 2.7479095458984375, 2.818359375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 6.0, 4.0, 1.0, 5.0, 2.0, 6.0, 6.0, 10.0, 23.0, 29.0, 45.0, 77.0, 96.0, 116.0, 113.0, 127.0, 99.0, 75.0, 49.0, 36.0, 20.0, 16.0, 16.0, 12.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.150390625, -2.0916900634765625, -2.032989501953125, -1.9742889404296875, -1.91558837890625, -1.8568878173828125, -1.798187255859375, -1.7394866943359375, -1.6807861328125, -1.6220855712890625, -1.563385009765625, -1.5046844482421875, -1.44598388671875, -1.3872833251953125, -1.328582763671875, -1.2698822021484375, -1.211181640625, -1.1524810791015625, -1.093780517578125, -1.0350799560546875, -0.97637939453125, -0.9176788330078125, -0.858978271484375, -0.8002777099609375, -0.7415771484375, -0.6828765869140625, -0.624176025390625, -0.5654754638671875, -0.50677490234375, -0.4480743408203125, -0.389373779296875, -0.3306732177734375, -0.27197265625, -0.2132720947265625, -0.154571533203125, -0.0958709716796875, -0.03717041015625, 0.0215301513671875, 0.080230712890625, 0.1389312744140625, 0.1976318359375, 0.2563323974609375, 0.315032958984375, 0.3737335205078125, 0.43243408203125, 0.4911346435546875, 0.549835205078125, 0.6085357666015625, 0.667236328125, 0.7259368896484375, 0.784637451171875, 0.8433380126953125, 0.90203857421875, 0.9607391357421875, 1.019439697265625, 1.0781402587890625, 1.1368408203125, 1.1955413818359375, 1.254241943359375, 1.3129425048828125, 1.37164306640625, 1.4303436279296875, 1.489044189453125, 1.5477447509765625, 1.6064453125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 26.0, 53.0, 157.0, 341.0, 265.0, 116.0, 35.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.659332275390625, -33.06303024291992, -31.466724395751953, -29.87042236328125, -28.27411651611328, -26.677814483642578, -25.081510543823242, -23.485206604003906, -21.88890266418457, -20.292598724365234, -18.6962947845459, -17.099990844726562, -15.503687858581543, -13.907383918762207, -12.311080932617188, -10.714776992797852, -9.118473052978516, -7.52216911315918, -5.925865650177002, -4.329562187194824, -2.7332582473754883, -1.1369543075561523, 0.4593486785888672, 2.055652618408203, 3.651956558227539, 5.248260498046875, 6.844563961029053, 8.44086742401123, 10.037171363830566, 11.633475303649902, 13.229778289794922, 14.826082229614258, 16.422386169433594, 18.01869010925293, 19.614994049072266, 21.21129608154297, 22.807601928710938, 24.40390396118164, 26.000207901000977, 27.596511840820312, 29.19281578063965, 30.789119720458984, 32.38542175292969, 33.981727600097656, 35.57802963256836, 37.17433547973633, 38.77063751220703, 40.366943359375, 41.9632453918457, 43.559547424316406, 45.155853271484375, 46.75215530395508, 48.34846115112305, 49.94476318359375, 51.54106903076172, 53.13737106323242, 54.733673095703125, 56.32997512817383, 57.9262809753418, 59.5225830078125, 61.11888885498047, 62.71519088745117, 64.31149291992188, 65.90779876708984, 67.50410461425781]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 3.0, 6.0, 7.0, 8.0, 10.0, 25.0, 15.0, 16.0, 25.0, 21.0, 32.0, 39.0, 41.0, 45.0, 53.0, 51.0, 52.0, 46.0, 58.0, 48.0, 51.0, 53.0, 52.0, 38.0, 31.0, 35.0, 15.0, 18.0, 17.0, 12.0, 23.0, 9.0, 13.0, 11.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-15.073604583740234, -14.643697738647461, -14.213790893554688, -13.783884048461914, -13.353976249694824, -12.92406940460205, -12.494162559509277, -12.064255714416504, -11.634347915649414, -11.20444107055664, -10.774534225463867, -10.344627380371094, -9.914719581604004, -9.48481273651123, -9.054905891418457, -8.624999046325684, -8.19509220123291, -7.765185356140137, -7.335278034210205, -6.905371189117432, -6.4754638671875, -6.045557022094727, -5.615650177001953, -5.18574333190918, -4.755836009979248, -4.325929164886475, -3.896021842956543, -3.4661149978637695, -3.036207914352417, -2.6063008308410645, -2.176393985748291, -1.7464869022369385, -1.3165807723999023, -0.8866737484931946, -0.4567667245864868, -0.026859760284423828, 0.4030473232269287, 0.8329544067382812, 1.2628612518310547, 1.6927683353424072, 2.1226754188537598, 2.5525825023651123, 2.982489585876465, 3.4123964309692383, 3.842303514480591, 4.272210597991943, 4.702117443084717, 5.132024765014648, 5.561931610107422, 5.991838455200195, 6.421745777130127, 6.8516526222229, 7.281559944152832, 7.7114667892456055, 8.141373634338379, 8.571280479431152, 9.001188278198242, 9.431095123291016, 9.861001968383789, 10.290908813476562, 10.720816612243652, 11.150723457336426, 11.5806303024292, 12.010537147521973, 12.440443992614746]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 6.0, 10.0, 3.0, 9.0, 15.0, 15.0, 20.0, 30.0, 38.0, 57.0, 71.0, 111.0, 212.0, 317.0, 533.0, 980.0, 1919.0, 4132.0, 10943.0, 40741.0, 3676199.0, 405380.0, 34870.0, 9985.0, 3660.0, 1704.0, 895.0, 511.0, 299.0, 192.0, 122.0, 81.0, 63.0, 37.0, 29.0, 26.0, 21.0, 9.0, 9.0, 11.0, 7.0, 7.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.26953125, -2.196197509765625, -2.12286376953125, -2.049530029296875, -1.9761962890625, -1.902862548828125, -1.82952880859375, -1.756195068359375, -1.682861328125, -1.609527587890625, -1.53619384765625, -1.462860107421875, -1.3895263671875, -1.316192626953125, -1.24285888671875, -1.169525146484375, -1.09619140625, -1.022857666015625, -0.94952392578125, -0.876190185546875, -0.8028564453125, -0.729522705078125, -0.65618896484375, -0.582855224609375, -0.509521484375, -0.436187744140625, -0.36285400390625, -0.289520263671875, -0.2161865234375, -0.142852783203125, -0.06951904296875, 0.003814697265625, 0.0771484375, 0.150482177734375, 0.22381591796875, 0.297149658203125, 0.3704833984375, 0.443817138671875, 0.51715087890625, 0.590484619140625, 0.663818359375, 0.737152099609375, 0.81048583984375, 0.883819580078125, 0.9571533203125, 1.030487060546875, 1.10382080078125, 1.177154541015625, 1.25048828125, 1.323822021484375, 1.39715576171875, 1.470489501953125, 1.5438232421875, 1.617156982421875, 1.69049072265625, 1.763824462890625, 1.837158203125, 1.910491943359375, 1.98382568359375, 2.057159423828125, 2.1304931640625, 2.203826904296875, 2.27716064453125, 2.350494384765625, 2.423828125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 6.0, 4.0, 9.0, 11.0, 11.0, 18.0, 16.0, 20.0, 30.0, 28.0, 27.0, 44.0, 47.0, 54.0, 52.0, 55.0, 56.0, 61.0, 55.0, 58.0, 49.0, 50.0, 48.0, 32.0, 32.0, 27.0, 16.0, 20.0, 16.0, 15.0, 8.0, 8.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.703125, -0.67877197265625, -0.6544189453125, -0.63006591796875, -0.605712890625, -0.58135986328125, -0.5570068359375, -0.53265380859375, -0.50830078125, -0.48394775390625, -0.4595947265625, -0.43524169921875, -0.410888671875, -0.38653564453125, -0.3621826171875, -0.33782958984375, -0.3134765625, -0.28912353515625, -0.2647705078125, -0.24041748046875, -0.216064453125, -0.19171142578125, -0.1673583984375, -0.14300537109375, -0.11865234375, -0.09429931640625, -0.0699462890625, -0.04559326171875, -0.021240234375, 0.00311279296875, 0.0274658203125, 0.05181884765625, 0.076171875, 0.10052490234375, 0.1248779296875, 0.14923095703125, 0.173583984375, 0.19793701171875, 0.2222900390625, 0.24664306640625, 0.27099609375, 0.29534912109375, 0.3197021484375, 0.34405517578125, 0.368408203125, 0.39276123046875, 0.4171142578125, 0.44146728515625, 0.4658203125, 0.49017333984375, 0.5145263671875, 0.53887939453125, 0.563232421875, 0.58758544921875, 0.6119384765625, 0.63629150390625, 0.66064453125, 0.68499755859375, 0.7093505859375, 0.73370361328125, 0.758056640625, 0.78240966796875, 0.8067626953125, 0.83111572265625, 0.85546875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 8.0, 8.0, 18.0, 13.0, 18.0, 31.0, 29.0, 43.0, 54.0, 71.0, 83.0, 108.0, 144.0, 274.0, 1352.0, 20971.0, 4126387.0, 41596.0, 2033.0, 355.0, 159.0, 121.0, 77.0, 81.0, 64.0, 48.0, 33.0, 24.0, 16.0, 16.0, 9.0, 12.0, 7.0, 4.0, 4.0, 4.0, 2.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.828125, -6.61859130859375, -6.4090576171875, -6.19952392578125, -5.989990234375, -5.78045654296875, -5.5709228515625, -5.36138916015625, -5.15185546875, -4.94232177734375, -4.7327880859375, -4.52325439453125, -4.313720703125, -4.10418701171875, -3.8946533203125, -3.68511962890625, -3.4755859375, -3.26605224609375, -3.0565185546875, -2.84698486328125, -2.637451171875, -2.42791748046875, -2.2183837890625, -2.00885009765625, -1.79931640625, -1.58978271484375, -1.3802490234375, -1.17071533203125, -0.961181640625, -0.75164794921875, -0.5421142578125, -0.33258056640625, -0.123046875, 0.08648681640625, 0.2960205078125, 0.50555419921875, 0.715087890625, 0.92462158203125, 1.1341552734375, 1.34368896484375, 1.55322265625, 1.76275634765625, 1.9722900390625, 2.18182373046875, 2.391357421875, 2.60089111328125, 2.8104248046875, 3.01995849609375, 3.2294921875, 3.43902587890625, 3.6485595703125, 3.85809326171875, 4.067626953125, 4.27716064453125, 4.4866943359375, 4.69622802734375, 4.90576171875, 5.11529541015625, 5.3248291015625, 5.53436279296875, 5.743896484375, 5.95343017578125, 6.1629638671875, 6.37249755859375, 6.58203125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 8.0, 16.0, 32.0, 160.0, 3305.0, 437.0, 73.0, 28.0, 14.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0205078125, -0.9409637451171875, -0.861419677734375, -0.7818756103515625, -0.70233154296875, -0.6227874755859375, -0.543243408203125, -0.4636993408203125, -0.3841552734375, -0.3046112060546875, -0.225067138671875, -0.1455230712890625, -0.06597900390625, 0.0135650634765625, 0.093109130859375, 0.1726531982421875, 0.252197265625, 0.3317413330078125, 0.411285400390625, 0.4908294677734375, 0.57037353515625, 0.6499176025390625, 0.729461669921875, 0.8090057373046875, 0.8885498046875, 0.9680938720703125, 1.047637939453125, 1.1271820068359375, 1.20672607421875, 1.2862701416015625, 1.365814208984375, 1.4453582763671875, 1.52490234375, 1.6044464111328125, 1.683990478515625, 1.7635345458984375, 1.84307861328125, 1.9226226806640625, 2.002166748046875, 2.0817108154296875, 2.1612548828125, 2.2407989501953125, 2.320343017578125, 2.3998870849609375, 2.47943115234375, 2.5589752197265625, 2.638519287109375, 2.7180633544921875, 2.797607421875, 2.8771514892578125, 2.956695556640625, 3.0362396240234375, 3.11578369140625, 3.1953277587890625, 3.274871826171875, 3.3544158935546875, 3.4339599609375, 3.5135040283203125, 3.593048095703125, 3.6725921630859375, 3.75213623046875, 3.8316802978515625, 3.911224365234375, 3.9907684326171875, 4.0703125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 32.0, 77.0, 169.0, 324.0, 231.0, 90.0, 43.0, 15.0, 10.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.60890007019043, -7.257029056549072, -6.905158519744873, -6.553287506103516, -6.201416492462158, -5.849545478820801, -5.497674942016602, -5.145803928375244, -4.793932914733887, -4.442061901092529, -4.09019136428833, -3.7383203506469727, -3.3864493370056152, -3.034578561782837, -2.6827077865600586, -2.330836772918701, -1.978966236114502, -1.627095341682434, -1.2752244472503662, -0.9233536720275879, -0.57148277759552, -0.21961188316345215, 0.13225889205932617, 0.4841299057006836, 0.8360006809234619, 1.1878715753555298, 1.5397424697875977, 1.891613245010376, 2.2434840202331543, 2.5953550338745117, 2.94722580909729, 3.2990968227386475, 3.650967597961426, 4.002838611602783, 4.354709148406982, 4.70658016204834, 5.058451175689697, 5.410322189331055, 5.762192726135254, 6.114063739776611, 6.465934753417969, 6.817805767059326, 7.169676303863525, 7.521547317504883, 7.87341833114624, 8.225289344787598, 8.577159881591797, 8.929031372070312, 9.280900955200195, 9.632771492004395, 9.98464298248291, 10.33651351928711, 10.688384056091309, 11.040255546569824, 11.392126083374023, 11.743997573852539, 12.095868110656738, 12.447738647460938, 12.799610137939453, 13.151480674743652, 13.503351211547852, 13.855222702026367, 14.207093238830566, 14.558963775634766, 14.910835266113281]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 8.0, 9.0, 15.0, 17.0, 18.0, 25.0, 37.0, 51.0, 66.0, 86.0, 77.0, 103.0, 98.0, 79.0, 74.0, 66.0, 50.0, 38.0, 21.0, 20.0, 10.0, 6.0, 6.0, 8.0, 6.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.232107162475586, -6.0413594245910645, -5.850611686706543, -5.6598639488220215, -5.4691162109375, -5.2783684730529785, -5.087620735168457, -4.8968729972839355, -4.706125259399414, -4.515377521514893, -4.324629783630371, -4.13388204574585, -3.943134307861328, -3.7523865699768066, -3.561638832092285, -3.3708910942077637, -3.180143356323242, -2.9893956184387207, -2.798647880554199, -2.6079001426696777, -2.4171524047851562, -2.2264046669006348, -2.0356569290161133, -1.8449091911315918, -1.6541614532470703, -1.4634137153625488, -1.2726659774780273, -1.0819182395935059, -0.8911705017089844, -0.7004227638244629, -0.5096750259399414, -0.3189272880554199, -0.12818002700805664, 0.06256771087646484, 0.25331544876098633, 0.4440631866455078, 0.6348109245300293, 0.8255586624145508, 1.0163064002990723, 1.2070541381835938, 1.3978018760681152, 1.5885496139526367, 1.7792973518371582, 1.9700450897216797, 2.160792827606201, 2.3515405654907227, 2.542288303375244, 2.7330360412597656, 2.923783779144287, 3.1145315170288086, 3.30527925491333, 3.4960269927978516, 3.686774730682373, 3.8775224685668945, 4.068270206451416, 4.2590179443359375, 4.449765682220459, 4.6405134201049805, 4.831261157989502, 5.022008895874023, 5.212756633758545, 5.403504371643066, 5.594252109527588, 5.784999847412109, 5.975747585296631]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 4.0, 5.0, 14.0, 15.0, 23.0, 22.0, 68.0, 82.0, 136.0, 250.0, 393.0, 837.0, 1676.0, 3677.0, 8558.0, 22374.0, 62300.0, 173289.0, 343815.0, 264897.0, 104686.0, 37200.0, 13769.0, 5452.0, 2409.0, 1199.0, 599.0, 306.0, 197.0, 107.0, 80.0, 43.0, 22.0, 19.0, 7.0, 11.0, 5.0, 0.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.640625, -1.58355712890625, -1.5264892578125, -1.46942138671875, -1.412353515625, -1.35528564453125, -1.2982177734375, -1.24114990234375, -1.18408203125, -1.12701416015625, -1.0699462890625, -1.01287841796875, -0.955810546875, -0.89874267578125, -0.8416748046875, -0.78460693359375, -0.7275390625, -0.67047119140625, -0.6134033203125, -0.55633544921875, -0.499267578125, -0.44219970703125, -0.3851318359375, -0.32806396484375, -0.27099609375, -0.21392822265625, -0.1568603515625, -0.09979248046875, -0.042724609375, 0.01434326171875, 0.0714111328125, 0.12847900390625, 0.185546875, 0.24261474609375, 0.2996826171875, 0.35675048828125, 0.413818359375, 0.47088623046875, 0.5279541015625, 0.58502197265625, 0.64208984375, 0.69915771484375, 0.7562255859375, 0.81329345703125, 0.870361328125, 0.92742919921875, 0.9844970703125, 1.04156494140625, 1.0986328125, 1.15570068359375, 1.2127685546875, 1.26983642578125, 1.326904296875, 1.38397216796875, 1.4410400390625, 1.49810791015625, 1.55517578125, 1.61224365234375, 1.6693115234375, 1.72637939453125, 1.783447265625, 1.84051513671875, 1.8975830078125, 1.95465087890625, 2.01171875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 6.0, 14.0, 10.0, 21.0, 22.0, 17.0, 30.0, 33.0, 49.0, 67.0, 56.0, 82.0, 81.0, 74.0, 73.0, 83.0, 57.0, 58.0, 33.0, 36.0, 22.0, 16.0, 20.0, 10.0, 5.0, 7.0, 5.0, 1.0, 4.0, 2.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1201171875, -1.085174560546875, -1.05023193359375, -1.015289306640625, -0.9803466796875, -0.945404052734375, -0.91046142578125, -0.875518798828125, -0.840576171875, -0.805633544921875, -0.77069091796875, -0.735748291015625, -0.7008056640625, -0.665863037109375, -0.63092041015625, -0.595977783203125, -0.56103515625, -0.526092529296875, -0.49114990234375, -0.456207275390625, -0.4212646484375, -0.386322021484375, -0.35137939453125, -0.316436767578125, -0.281494140625, -0.246551513671875, -0.21160888671875, -0.176666259765625, -0.1417236328125, -0.106781005859375, -0.07183837890625, -0.036895751953125, -0.001953125, 0.032989501953125, 0.06793212890625, 0.102874755859375, 0.1378173828125, 0.172760009765625, 0.20770263671875, 0.242645263671875, 0.277587890625, 0.312530517578125, 0.34747314453125, 0.382415771484375, 0.4173583984375, 0.452301025390625, 0.48724365234375, 0.522186279296875, 0.55712890625, 0.592071533203125, 0.62701416015625, 0.661956787109375, 0.6968994140625, 0.731842041015625, 0.76678466796875, 0.801727294921875, 0.836669921875, 0.871612548828125, 0.90655517578125, 0.941497802734375, 0.9764404296875, 1.011383056640625, 1.04632568359375, 1.081268310546875, 1.1162109375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 7.0, 9.0, 17.0, 19.0, 38.0, 35.0, 80.0, 127.0, 205.0, 361.0, 753.0, 1628.0, 4797.0, 26692.0, 495410.0, 483969.0, 26391.0, 4729.0, 1655.0, 711.0, 394.0, 210.0, 126.0, 62.0, 34.0, 31.0, 24.0, 10.0, 8.0, 7.0, 3.0, 2.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.20703125, -5.0623779296875, -4.917724609375, -4.7730712890625, -4.62841796875, -4.4837646484375, -4.339111328125, -4.1944580078125, -4.0498046875, -3.9051513671875, -3.760498046875, -3.6158447265625, -3.47119140625, -3.3265380859375, -3.181884765625, -3.0372314453125, -2.892578125, -2.7479248046875, -2.603271484375, -2.4586181640625, -2.31396484375, -2.1693115234375, -2.024658203125, -1.8800048828125, -1.7353515625, -1.5906982421875, -1.446044921875, -1.3013916015625, -1.15673828125, -1.0120849609375, -0.867431640625, -0.7227783203125, -0.578125, -0.4334716796875, -0.288818359375, -0.1441650390625, 0.00048828125, 0.1451416015625, 0.289794921875, 0.4344482421875, 0.5791015625, 0.7237548828125, 0.868408203125, 1.0130615234375, 1.15771484375, 1.3023681640625, 1.447021484375, 1.5916748046875, 1.736328125, 1.8809814453125, 2.025634765625, 2.1702880859375, 2.31494140625, 2.4595947265625, 2.604248046875, 2.7489013671875, 2.8935546875, 3.0382080078125, 3.182861328125, 3.3275146484375, 3.47216796875, 3.6168212890625, 3.761474609375, 3.9061279296875, 4.05078125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 9.0, 3.0, 5.0, 8.0, 18.0, 24.0, 33.0, 47.0, 72.0, 77.0, 101.0, 86.0, 97.0, 95.0, 83.0, 65.0, 58.0, 37.0, 28.0, 16.0, 17.0, 11.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9609375, -4.7655029296875, -4.570068359375, -4.3746337890625, -4.17919921875, -3.9837646484375, -3.788330078125, -3.5928955078125, -3.3974609375, -3.2020263671875, -3.006591796875, -2.8111572265625, -2.61572265625, -2.4202880859375, -2.224853515625, -2.0294189453125, -1.833984375, -1.6385498046875, -1.443115234375, -1.2476806640625, -1.05224609375, -0.8568115234375, -0.661376953125, -0.4659423828125, -0.2705078125, -0.0750732421875, 0.120361328125, 0.3157958984375, 0.51123046875, 0.7066650390625, 0.902099609375, 1.0975341796875, 1.29296875, 1.4884033203125, 1.683837890625, 1.8792724609375, 2.07470703125, 2.2701416015625, 2.465576171875, 2.6610107421875, 2.8564453125, 3.0518798828125, 3.247314453125, 3.4427490234375, 3.63818359375, 3.8336181640625, 4.029052734375, 4.2244873046875, 4.419921875, 4.6153564453125, 4.810791015625, 5.0062255859375, 5.20166015625, 5.3970947265625, 5.592529296875, 5.7879638671875, 5.9833984375, 6.1788330078125, 6.374267578125, 6.5697021484375, 6.76513671875, 6.9605712890625, 7.156005859375, 7.3514404296875, 7.546875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 1.0, 8.0, 9.0, 8.0, 22.0, 23.0, 37.0, 54.0, 149.0, 280.0, 811.0, 3745.0, 56106.0, 913943.0, 67662.0, 4180.0, 891.0, 313.0, 121.0, 67.0, 47.0, 19.0, 12.0, 18.0, 5.0, 8.0, 3.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.947265625, -1.878997802734375, -1.81072998046875, -1.742462158203125, -1.6741943359375, -1.605926513671875, -1.53765869140625, -1.469390869140625, -1.401123046875, -1.332855224609375, -1.26458740234375, -1.196319580078125, -1.1280517578125, -1.059783935546875, -0.99151611328125, -0.923248291015625, -0.85498046875, -0.786712646484375, -0.71844482421875, -0.650177001953125, -0.5819091796875, -0.513641357421875, -0.44537353515625, -0.377105712890625, -0.308837890625, -0.240570068359375, -0.17230224609375, -0.104034423828125, -0.0357666015625, 0.032501220703125, 0.10076904296875, 0.169036865234375, 0.2373046875, 0.305572509765625, 0.37384033203125, 0.442108154296875, 0.5103759765625, 0.578643798828125, 0.64691162109375, 0.715179443359375, 0.783447265625, 0.851715087890625, 0.91998291015625, 0.988250732421875, 1.0565185546875, 1.124786376953125, 1.19305419921875, 1.261322021484375, 1.32958984375, 1.397857666015625, 1.46612548828125, 1.534393310546875, 1.6026611328125, 1.670928955078125, 1.73919677734375, 1.807464599609375, 1.875732421875, 1.944000244140625, 2.01226806640625, 2.080535888671875, 2.1488037109375, 2.217071533203125, 2.28533935546875, 2.353607177734375, 2.421875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 11.0, 15.0, 12.0, 10.0, 25.0, 30.0, 39.0, 36.0, 46.0, 77.0, 83.0, 96.0, 94.0, 77.0, 67.0, 58.0, 43.0, 43.0, 27.0, 20.0, 19.0, 12.0, 12.0, 9.0, 9.0, 6.0, 6.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0002117156982421875, -0.00020596943795681, -0.0002002231776714325, -0.000194476917386055, -0.0001887306571006775, -0.0001829843968153, -0.00017723813652992249, -0.00017149187624454498, -0.00016574561595916748, -0.00015999935567378998, -0.00015425309538841248, -0.00014850683510303497, -0.00014276057481765747, -0.00013701431453227997, -0.00013126805424690247, -0.00012552179396152496, -0.00011977553367614746, -0.00011402927339076996, -0.00010828301310539246, -0.00010253675282001495, -9.679049253463745e-05, -9.104423224925995e-05, -8.529797196388245e-05, -7.955171167850494e-05, -7.380545139312744e-05, -6.805919110774994e-05, -6.231293082237244e-05, -5.6566670536994934e-05, -5.082041025161743e-05, -4.507414996623993e-05, -3.932788968086243e-05, -3.3581629395484924e-05, -2.7835369110107422e-05, -2.208910882472992e-05, -1.6342848539352417e-05, -1.0596588253974915e-05, -4.850327968597412e-06, 8.959323167800903e-07, 6.642192602157593e-06, 1.2388452887535095e-05, 1.8134713172912598e-05, 2.38809734582901e-05, 2.9627233743667603e-05, 3.5373494029045105e-05, 4.111975431442261e-05, 4.686601459980011e-05, 5.261227488517761e-05, 5.8358535170555115e-05, 6.410479545593262e-05, 6.985105574131012e-05, 7.559731602668762e-05, 8.134357631206512e-05, 8.708983659744263e-05, 9.283609688282013e-05, 9.858235716819763e-05, 0.00010432861745357513, 0.00011007487773895264, 0.00011582113802433014, 0.00012156739830970764, 0.00012731365859508514, 0.00013305991888046265, 0.00013880617916584015, 0.00014455243945121765, 0.00015029869973659515, 0.00015604496002197266]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 9.0, 0.0, 4.0, 9.0, 16.0, 13.0, 33.0, 43.0, 82.0, 124.0, 223.0, 497.0, 1094.0, 3360.0, 14695.0, 176689.0, 760497.0, 77903.0, 9183.0, 2359.0, 902.0, 367.0, 170.0, 116.0, 64.0, 37.0, 24.0, 13.0, 12.0, 4.0, 8.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.28515625, -1.239837646484375, -1.19451904296875, -1.149200439453125, -1.1038818359375, -1.058563232421875, -1.01324462890625, -0.967926025390625, -0.922607421875, -0.877288818359375, -0.83197021484375, -0.786651611328125, -0.7413330078125, -0.696014404296875, -0.65069580078125, -0.605377197265625, -0.56005859375, -0.514739990234375, -0.46942138671875, -0.424102783203125, -0.3787841796875, -0.333465576171875, -0.28814697265625, -0.242828369140625, -0.197509765625, -0.152191162109375, -0.10687255859375, -0.061553955078125, -0.0162353515625, 0.029083251953125, 0.07440185546875, 0.119720458984375, 0.1650390625, 0.210357666015625, 0.25567626953125, 0.300994873046875, 0.3463134765625, 0.391632080078125, 0.43695068359375, 0.482269287109375, 0.527587890625, 0.572906494140625, 0.61822509765625, 0.663543701171875, 0.7088623046875, 0.754180908203125, 0.79949951171875, 0.844818115234375, 0.89013671875, 0.935455322265625, 0.98077392578125, 1.026092529296875, 1.0714111328125, 1.116729736328125, 1.16204833984375, 1.207366943359375, 1.252685546875, 1.298004150390625, 1.34332275390625, 1.388641357421875, 1.4339599609375, 1.479278564453125, 1.52459716796875, 1.569915771484375, 1.615234375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 18.0, 19.0, 32.0, 47.0, 56.0, 84.0, 93.0, 121.0, 128.0, 107.0, 85.0, 71.0, 47.0, 25.0, 20.0, 11.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.57421875, -1.5253143310546875, -1.476409912109375, -1.4275054931640625, -1.37860107421875, -1.3296966552734375, -1.280792236328125, -1.2318878173828125, -1.1829833984375, -1.1340789794921875, -1.085174560546875, -1.0362701416015625, -0.98736572265625, -0.9384613037109375, -0.889556884765625, -0.8406524658203125, -0.791748046875, -0.7428436279296875, -0.693939208984375, -0.6450347900390625, -0.59613037109375, -0.5472259521484375, -0.498321533203125, -0.4494171142578125, -0.4005126953125, -0.3516082763671875, -0.302703857421875, -0.2537994384765625, -0.20489501953125, -0.1559906005859375, -0.107086181640625, -0.0581817626953125, -0.00927734375, 0.0396270751953125, 0.088531494140625, 0.1374359130859375, 0.18634033203125, 0.2352447509765625, 0.284149169921875, 0.3330535888671875, 0.3819580078125, 0.4308624267578125, 0.479766845703125, 0.5286712646484375, 0.57757568359375, 0.6264801025390625, 0.675384521484375, 0.7242889404296875, 0.773193359375, 0.8220977783203125, 0.871002197265625, 0.9199066162109375, 0.96881103515625, 1.0177154541015625, 1.066619873046875, 1.1155242919921875, 1.1644287109375, 1.2133331298828125, 1.262237548828125, 1.3111419677734375, 1.36004638671875, 1.4089508056640625, 1.457855224609375, 1.5067596435546875, 1.5556640625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 6.0, 8.0, 6.0, 20.0, 16.0, 61.0, 88.0, 96.0, 157.0, 150.0, 150.0, 82.0, 68.0, 42.0, 25.0, 13.0, 8.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.493077278137207, -12.710075378417969, -11.927074432373047, -11.144072532653809, -10.36107063293457, -9.578068733215332, -8.795066833496094, -8.012065887451172, -7.229063987731934, -6.446062088012695, -5.663060665130615, -4.880059242248535, -4.097057342529297, -3.3140556812286377, -2.5310540199279785, -1.7480525970458984, -0.9650506973266602, -0.18204903602600098, 0.6009526252746582, 1.3839542865753174, 2.1669559478759766, 2.9499576091766357, 3.732959270477295, 4.515960693359375, 5.298962593078613, 6.081964492797852, 6.864965915679932, 7.647967338562012, 8.43096923828125, 9.213971138000488, 9.996973037719727, 10.779973983764648, 11.562976837158203, 12.345978736877441, 13.12898063659668, 13.911981582641602, 14.69498348236084, 15.477985382080078, 16.260986328125, 17.043987274169922, 17.826990127563477, 18.6099910736084, 19.392993927001953, 20.175994873046875, 20.958995819091797, 21.74199867248535, 22.524999618530273, 23.308002471923828, 24.09100341796875, 24.874004364013672, 25.657007217407227, 26.44000816345215, 27.223011016845703, 28.006011962890625, 28.789012908935547, 29.57201385498047, 30.355016708374023, 31.138017654418945, 31.9210205078125, 32.70402145385742, 33.487022399902344, 34.270023345947266, 35.05302810668945, 35.836029052734375, 36.6190299987793]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 7.0, 7.0, 7.0, 17.0, 9.0, 14.0, 17.0, 15.0, 23.0, 28.0, 22.0, 35.0, 38.0, 52.0, 48.0, 56.0, 57.0, 47.0, 61.0, 51.0, 53.0, 35.0, 44.0, 40.0, 33.0, 28.0, 20.0, 22.0, 16.0, 20.0, 15.0, 15.0, 6.0, 8.0, 6.0, 10.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-19.971073150634766, -19.428203582763672, -18.885332107543945, -18.34246253967285, -17.799591064453125, -17.25672149658203, -16.713850021362305, -16.17098045349121, -15.6281099319458, -15.08523941040039, -14.54236888885498, -13.99949836730957, -13.456628799438477, -12.91375732421875, -12.370887756347656, -11.828017234802246, -11.285146713256836, -10.742276191711426, -10.199405670166016, -9.656535148620605, -9.113664627075195, -8.570795059204102, -8.027924537658691, -7.485054016113281, -6.942183494567871, -6.399312973022461, -5.856442451477051, -5.313572406768799, -4.770701885223389, -4.2278313636779785, -3.6849610805511475, -3.1420907974243164, -2.59921932220459, -2.0563488006591797, -1.5134785175323486, -0.970608115196228, -0.4277377128601074, 0.11513280868530273, 0.6580030918121338, 1.2008733749389648, 1.743743896484375, 2.286614418029785, 2.829484701156616, 3.3723549842834473, 3.9152255058288574, 4.458096027374268, 5.0009660720825195, 5.54383659362793, 6.08670711517334, 6.62957763671875, 7.17244815826416, 7.715318202972412, 8.258188247680664, 8.80105972290039, 9.343929290771484, 9.886799812316895, 10.429670333862305, 10.972540855407715, 11.515411376953125, 12.058281898498535, 12.601152420043945, 13.144021987915039, 13.68689250946045, 14.22976303100586, 14.77263355255127]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 4.0, 5.0, 9.0, 13.0, 20.0, 28.0, 45.0, 40.0, 76.0, 96.0, 171.0, 225.0, 385.0, 549.0, 958.0, 1603.0, 3143.0, 6553.0, 16224.0, 52841.0, 381845.0, 3438502.0, 224179.0, 41242.0, 13433.0, 5646.0, 2698.0, 1412.0, 843.0, 514.0, 321.0, 202.0, 138.0, 86.0, 74.0, 46.0, 29.0, 27.0, 20.0, 10.0, 8.0, 5.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6015625, -1.547088623046875, -1.49261474609375, -1.438140869140625, -1.3836669921875, -1.329193115234375, -1.27471923828125, -1.220245361328125, -1.165771484375, -1.111297607421875, -1.05682373046875, -1.002349853515625, -0.9478759765625, -0.893402099609375, -0.83892822265625, -0.784454345703125, -0.72998046875, -0.675506591796875, -0.62103271484375, -0.566558837890625, -0.5120849609375, -0.457611083984375, -0.40313720703125, -0.348663330078125, -0.294189453125, -0.239715576171875, -0.18524169921875, -0.130767822265625, -0.0762939453125, -0.021820068359375, 0.03265380859375, 0.087127685546875, 0.1416015625, 0.196075439453125, 0.25054931640625, 0.305023193359375, 0.3594970703125, 0.413970947265625, 0.46844482421875, 0.522918701171875, 0.577392578125, 0.631866455078125, 0.68634033203125, 0.740814208984375, 0.7952880859375, 0.849761962890625, 0.90423583984375, 0.958709716796875, 1.01318359375, 1.067657470703125, 1.12213134765625, 1.176605224609375, 1.2310791015625, 1.285552978515625, 1.34002685546875, 1.394500732421875, 1.448974609375, 1.503448486328125, 1.55792236328125, 1.612396240234375, 1.6668701171875, 1.721343994140625, 1.77581787109375, 1.830291748046875, 1.884765625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 7.0, 11.0, 21.0, 25.0, 33.0, 36.0, 51.0, 60.0, 55.0, 89.0, 94.0, 92.0, 80.0, 70.0, 48.0, 48.0, 38.0, 40.0, 28.0, 25.0, 16.0, 12.0, 9.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.458984375, -1.425994873046875, -1.39300537109375, -1.360015869140625, -1.3270263671875, -1.294036865234375, -1.26104736328125, -1.228057861328125, -1.195068359375, -1.162078857421875, -1.12908935546875, -1.096099853515625, -1.0631103515625, -1.030120849609375, -0.99713134765625, -0.964141845703125, -0.93115234375, -0.898162841796875, -0.86517333984375, -0.832183837890625, -0.7991943359375, -0.766204833984375, -0.73321533203125, -0.700225830078125, -0.667236328125, -0.634246826171875, -0.60125732421875, -0.568267822265625, -0.5352783203125, -0.502288818359375, -0.46929931640625, -0.436309814453125, -0.4033203125, -0.370330810546875, -0.33734130859375, -0.304351806640625, -0.2713623046875, -0.238372802734375, -0.20538330078125, -0.172393798828125, -0.139404296875, -0.106414794921875, -0.07342529296875, -0.040435791015625, -0.0074462890625, 0.025543212890625, 0.05853271484375, 0.091522216796875, 0.12451171875, 0.157501220703125, 0.19049072265625, 0.223480224609375, 0.2564697265625, 0.289459228515625, 0.32244873046875, 0.355438232421875, 0.388427734375, 0.421417236328125, 0.45440673828125, 0.487396240234375, 0.5203857421875, 0.553375244140625, 0.58636474609375, 0.619354248046875, 0.65234375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 4.0, 7.0, 11.0, 15.0, 18.0, 26.0, 47.0, 77.0, 177.0, 422.0, 1103.0, 4306.0, 24159.0, 313242.0, 3743988.0, 91562.0, 11545.0, 2374.0, 644.0, 261.0, 127.0, 56.0, 32.0, 22.0, 21.0, 11.0, 11.0, 10.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.068359375, -2.96710205078125, -2.8658447265625, -2.76458740234375, -2.663330078125, -2.56207275390625, -2.4608154296875, -2.35955810546875, -2.25830078125, -2.15704345703125, -2.0557861328125, -1.95452880859375, -1.853271484375, -1.75201416015625, -1.6507568359375, -1.54949951171875, -1.4482421875, -1.34698486328125, -1.2457275390625, -1.14447021484375, -1.043212890625, -0.94195556640625, -0.8406982421875, -0.73944091796875, -0.63818359375, -0.53692626953125, -0.4356689453125, -0.33441162109375, -0.233154296875, -0.13189697265625, -0.0306396484375, 0.07061767578125, 0.171875, 0.27313232421875, 0.3743896484375, 0.47564697265625, 0.576904296875, 0.67816162109375, 0.7794189453125, 0.88067626953125, 0.98193359375, 1.08319091796875, 1.1844482421875, 1.28570556640625, 1.386962890625, 1.48822021484375, 1.5894775390625, 1.69073486328125, 1.7919921875, 1.89324951171875, 1.9945068359375, 2.09576416015625, 2.197021484375, 2.29827880859375, 2.3995361328125, 2.50079345703125, 2.60205078125, 2.70330810546875, 2.8045654296875, 2.90582275390625, 3.007080078125, 3.10833740234375, 3.2095947265625, 3.31085205078125, 3.412109375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 12.0, 12.0, 14.0, 27.0, 31.0, 66.0, 90.0, 182.0, 461.0, 1615.0, 944.0, 291.0, 126.0, 67.0, 46.0, 23.0, 15.0, 16.0, 6.0, 4.0, 6.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.486328125, -3.396331787109375, -3.30633544921875, -3.216339111328125, -3.1263427734375, -3.036346435546875, -2.94635009765625, -2.856353759765625, -2.766357421875, -2.676361083984375, -2.58636474609375, -2.496368408203125, -2.4063720703125, -2.316375732421875, -2.22637939453125, -2.136383056640625, -2.04638671875, -1.956390380859375, -1.86639404296875, -1.776397705078125, -1.6864013671875, -1.596405029296875, -1.50640869140625, -1.416412353515625, -1.326416015625, -1.236419677734375, -1.14642333984375, -1.056427001953125, -0.9664306640625, -0.876434326171875, -0.78643798828125, -0.696441650390625, -0.6064453125, -0.516448974609375, -0.42645263671875, -0.336456298828125, -0.2464599609375, -0.156463623046875, -0.06646728515625, 0.023529052734375, 0.113525390625, 0.203521728515625, 0.29351806640625, 0.383514404296875, 0.4735107421875, 0.563507080078125, 0.65350341796875, 0.743499755859375, 0.83349609375, 0.923492431640625, 1.01348876953125, 1.103485107421875, 1.1934814453125, 1.283477783203125, 1.37347412109375, 1.463470458984375, 1.553466796875, 1.643463134765625, 1.73345947265625, 1.823455810546875, 1.9134521484375, 2.003448486328125, 2.09344482421875, 2.183441162109375, 2.2734375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 12.0, 15.0, 35.0, 62.0, 118.0, 170.0, 202.0, 147.0, 96.0, 67.0, 35.0, 12.0, 10.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.216615676879883, -22.61217498779297, -22.007732391357422, -21.403291702270508, -20.798851013183594, -20.194408416748047, -19.589967727661133, -18.98552703857422, -18.381084442138672, -17.776643753051758, -17.17220115661621, -16.567760467529297, -15.963318824768066, -15.358877182006836, -14.754436492919922, -14.149994850158691, -13.545553207397461, -12.94111156463623, -12.336669921875, -11.732229232788086, -11.127787590026855, -10.523345947265625, -9.918905258178711, -9.31446361541748, -8.71002197265625, -8.10558032989502, -7.501139163970947, -6.896697998046875, -6.2922563552856445, -5.687814712524414, -5.083373546600342, -4.4789323806762695, -3.8744897842407227, -3.2700483798980713, -2.66560697555542, -2.0611655712127686, -1.4567241668701172, -0.8522827625274658, -0.24784135818481445, 0.3565998077392578, 0.9610414505004883, 1.5654828548431396, 2.169924259185791, 2.7743656635284424, 3.3788070678710938, 3.983248472213745, 4.5876898765563965, 5.192131042480469, 5.796572685241699, 6.40101432800293, 7.005455493927002, 7.609896659851074, 8.214338302612305, 8.818779945373535, 9.423221588134766, 10.02766227722168, 10.63210391998291, 11.23654556274414, 11.840986251831055, 12.445427894592285, 13.049869537353516, 13.654311180114746, 14.258752822875977, 14.86319351196289, 15.467635154724121]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 7.0, 2.0, 13.0, 7.0, 10.0, 25.0, 32.0, 21.0, 39.0, 41.0, 49.0, 48.0, 37.0, 57.0, 65.0, 68.0, 57.0, 59.0, 51.0, 44.0, 38.0, 38.0, 38.0, 33.0, 25.0, 19.0, 15.0, 15.0, 15.0, 8.0, 8.0, 7.0, 5.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.658726692199707, -8.326745986938477, -7.994765758514404, -7.662785053253174, -7.330804824829102, -6.998824119567871, -6.666843414306641, -6.33486270904541, -6.002882480621338, -5.670901775360107, -5.338921546936035, -5.006940841674805, -4.674960136413574, -4.342979907989502, -4.0109992027282715, -3.67901873588562, -3.3470382690429688, -3.0150578022003174, -2.683077335357666, -2.3510966300964355, -2.019116163253784, -1.6871356964111328, -1.355155110359192, -1.023174524307251, -0.6911940574645996, -0.35921353101730347, -0.027233004570007324, 0.3047475218772888, 0.636728048324585, 0.9687085151672363, 1.3006891012191772, 1.6326696872711182, 1.964651107788086, 2.2966315746307373, 2.6286120414733887, 2.960592746734619, 3.2925732135772705, 3.624553680419922, 3.9565343856811523, 4.288515090942383, 4.620495319366455, 4.9524760246276855, 5.284456253051758, 5.616436958312988, 5.948417663574219, 6.280397891998291, 6.6123785972595215, 6.944358825683594, 7.276339530944824, 7.608320236206055, 7.940300464630127, 8.2722806930542, 8.60426139831543, 8.93624210357666, 9.26822280883789, 9.600203514099121, 9.932184219360352, 10.264164924621582, 10.596145629882812, 10.928125381469727, 11.260106086730957, 11.592086791992188, 11.924067497253418, 12.256048202514648, 12.588027954101562]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 9.0, 6.0, 8.0, 19.0, 24.0, 32.0, 50.0, 70.0, 119.0, 173.0, 261.0, 517.0, 832.0, 1553.0, 3109.0, 6451.0, 14397.0, 31671.0, 74086.0, 168985.0, 304422.0, 241089.0, 112237.0, 48518.0, 21053.0, 9507.0, 4425.0, 2195.0, 1169.0, 629.0, 338.0, 210.0, 147.0, 76.0, 56.0, 42.0, 28.0, 14.0, 13.0, 7.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.341796875, -1.29815673828125, -1.2545166015625, -1.21087646484375, -1.167236328125, -1.12359619140625, -1.0799560546875, -1.03631591796875, -0.99267578125, -0.94903564453125, -0.9053955078125, -0.86175537109375, -0.818115234375, -0.77447509765625, -0.7308349609375, -0.68719482421875, -0.6435546875, -0.59991455078125, -0.5562744140625, -0.51263427734375, -0.468994140625, -0.42535400390625, -0.3817138671875, -0.33807373046875, -0.29443359375, -0.25079345703125, -0.2071533203125, -0.16351318359375, -0.119873046875, -0.07623291015625, -0.0325927734375, 0.01104736328125, 0.0546875, 0.09832763671875, 0.1419677734375, 0.18560791015625, 0.229248046875, 0.27288818359375, 0.3165283203125, 0.36016845703125, 0.40380859375, 0.44744873046875, 0.4910888671875, 0.53472900390625, 0.578369140625, 0.62200927734375, 0.6656494140625, 0.70928955078125, 0.7529296875, 0.79656982421875, 0.8402099609375, 0.88385009765625, 0.927490234375, 0.97113037109375, 1.0147705078125, 1.05841064453125, 1.10205078125, 1.14569091796875, 1.1893310546875, 1.23297119140625, 1.276611328125, 1.32025146484375, 1.3638916015625, 1.40753173828125, 1.451171875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 7.0, 6.0, 7.0, 11.0, 9.0, 13.0, 10.0, 29.0, 16.0, 35.0, 28.0, 28.0, 44.0, 56.0, 68.0, 48.0, 58.0, 62.0, 50.0, 49.0, 34.0, 53.0, 32.0, 41.0, 31.0, 32.0, 33.0, 26.0, 21.0, 16.0, 10.0, 11.0, 9.0, 10.0, 6.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69091796875, -0.6677703857421875, -0.644622802734375, -0.6214752197265625, -0.59832763671875, -0.5751800537109375, -0.552032470703125, -0.5288848876953125, -0.5057373046875, -0.4825897216796875, -0.459442138671875, -0.4362945556640625, -0.41314697265625, -0.3899993896484375, -0.366851806640625, -0.3437042236328125, -0.320556640625, -0.2974090576171875, -0.274261474609375, -0.2511138916015625, -0.22796630859375, -0.2048187255859375, -0.181671142578125, -0.1585235595703125, -0.1353759765625, -0.1122283935546875, -0.089080810546875, -0.0659332275390625, -0.04278564453125, -0.0196380615234375, 0.003509521484375, 0.0266571044921875, 0.0498046875, 0.0729522705078125, 0.096099853515625, 0.1192474365234375, 0.14239501953125, 0.1655426025390625, 0.188690185546875, 0.2118377685546875, 0.2349853515625, 0.2581329345703125, 0.281280517578125, 0.3044281005859375, 0.32757568359375, 0.3507232666015625, 0.373870849609375, 0.3970184326171875, 0.420166015625, 0.4433135986328125, 0.466461181640625, 0.4896087646484375, 0.51275634765625, 0.5359039306640625, 0.559051513671875, 0.5821990966796875, 0.6053466796875, 0.6284942626953125, 0.651641845703125, 0.6747894287109375, 0.69793701171875, 0.7210845947265625, 0.744232177734375, 0.7673797607421875, 0.79052734375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 4.0, 5.0, 6.0, 6.0, 9.0, 19.0, 13.0, 22.0, 47.0, 64.0, 65.0, 126.0, 172.0, 277.0, 543.0, 918.0, 1874.0, 4862.0, 20427.0, 177775.0, 719470.0, 100769.0, 13769.0, 3823.0, 1513.0, 776.0, 426.0, 273.0, 172.0, 105.0, 64.0, 54.0, 41.0, 20.0, 18.0, 14.0, 7.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.40234375, -3.3004150390625, -3.198486328125, -3.0965576171875, -2.99462890625, -2.8927001953125, -2.790771484375, -2.6888427734375, -2.5869140625, -2.4849853515625, -2.383056640625, -2.2811279296875, -2.17919921875, -2.0772705078125, -1.975341796875, -1.8734130859375, -1.771484375, -1.6695556640625, -1.567626953125, -1.4656982421875, -1.36376953125, -1.2618408203125, -1.159912109375, -1.0579833984375, -0.9560546875, -0.8541259765625, -0.752197265625, -0.6502685546875, -0.54833984375, -0.4464111328125, -0.344482421875, -0.2425537109375, -0.140625, -0.0386962890625, 0.063232421875, 0.1651611328125, 0.26708984375, 0.3690185546875, 0.470947265625, 0.5728759765625, 0.6748046875, 0.7767333984375, 0.878662109375, 0.9805908203125, 1.08251953125, 1.1844482421875, 1.286376953125, 1.3883056640625, 1.490234375, 1.5921630859375, 1.694091796875, 1.7960205078125, 1.89794921875, 1.9998779296875, 2.101806640625, 2.2037353515625, 2.3056640625, 2.4075927734375, 2.509521484375, 2.6114501953125, 2.71337890625, 2.8153076171875, 2.917236328125, 3.0191650390625, 3.12109375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 8.0, 5.0, 12.0, 10.0, 21.0, 9.0, 18.0, 21.0, 22.0, 33.0, 26.0, 28.0, 21.0, 33.0, 34.0, 34.0, 50.0, 48.0, 43.0, 43.0, 51.0, 48.0, 49.0, 36.0, 48.0, 33.0, 32.0, 26.0, 25.0, 23.0, 18.0, 13.0, 15.0, 19.0, 10.0, 8.0, 6.0, 1.0, 1.0, 5.0, 4.0, 2.0, 7.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.484375, -2.395294189453125, -2.30621337890625, -2.217132568359375, -2.1280517578125, -2.038970947265625, -1.94989013671875, -1.860809326171875, -1.771728515625, -1.682647705078125, -1.59356689453125, -1.504486083984375, -1.4154052734375, -1.326324462890625, -1.23724365234375, -1.148162841796875, -1.05908203125, -0.970001220703125, -0.88092041015625, -0.791839599609375, -0.7027587890625, -0.613677978515625, -0.52459716796875, -0.435516357421875, -0.346435546875, -0.257354736328125, -0.16827392578125, -0.079193115234375, 0.0098876953125, 0.098968505859375, 0.18804931640625, 0.277130126953125, 0.3662109375, 0.455291748046875, 0.54437255859375, 0.633453369140625, 0.7225341796875, 0.811614990234375, 0.90069580078125, 0.989776611328125, 1.078857421875, 1.167938232421875, 1.25701904296875, 1.346099853515625, 1.4351806640625, 1.524261474609375, 1.61334228515625, 1.702423095703125, 1.79150390625, 1.880584716796875, 1.96966552734375, 2.058746337890625, 2.1478271484375, 2.236907958984375, 2.32598876953125, 2.415069580078125, 2.504150390625, 2.593231201171875, 2.68231201171875, 2.771392822265625, 2.8604736328125, 2.949554443359375, 3.03863525390625, 3.127716064453125, 3.216796875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 2.0, 14.0, 11.0, 17.0, 30.0, 49.0, 74.0, 113.0, 170.0, 272.0, 558.0, 1235.0, 3172.0, 11951.0, 80550.0, 772863.0, 152236.0, 17895.0, 4224.0, 1483.0, 715.0, 362.0, 200.0, 118.0, 64.0, 45.0, 35.0, 16.0, 22.0, 12.0, 11.0, 11.0, 4.0, 6.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.6689453125, -1.6245880126953125, -1.580230712890625, -1.5358734130859375, -1.49151611328125, -1.4471588134765625, -1.402801513671875, -1.3584442138671875, -1.3140869140625, -1.2697296142578125, -1.225372314453125, -1.1810150146484375, -1.13665771484375, -1.0923004150390625, -1.047943115234375, -1.0035858154296875, -0.959228515625, -0.9148712158203125, -0.870513916015625, -0.8261566162109375, -0.78179931640625, -0.7374420166015625, -0.693084716796875, -0.6487274169921875, -0.6043701171875, -0.5600128173828125, -0.515655517578125, -0.4712982177734375, -0.42694091796875, -0.3825836181640625, -0.338226318359375, -0.2938690185546875, -0.24951171875, -0.2051544189453125, -0.160797119140625, -0.1164398193359375, -0.07208251953125, -0.0277252197265625, 0.016632080078125, 0.0609893798828125, 0.1053466796875, 0.1497039794921875, 0.194061279296875, 0.2384185791015625, 0.28277587890625, 0.3271331787109375, 0.371490478515625, 0.4158477783203125, 0.460205078125, 0.5045623779296875, 0.548919677734375, 0.5932769775390625, 0.63763427734375, 0.6819915771484375, 0.726348876953125, 0.7707061767578125, 0.8150634765625, 0.8594207763671875, 0.903778076171875, 0.9481353759765625, 0.99249267578125, 1.0368499755859375, 1.081207275390625, 1.1255645751953125, 1.169921875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 10.0, 9.0, 10.0, 13.0, 16.0, 13.0, 24.0, 36.0, 29.0, 46.0, 47.0, 74.0, 69.0, 102.0, 85.0, 89.0, 65.0, 37.0, 38.0, 30.0, 28.0, 24.0, 22.0, 11.0, 10.0, 13.0, 5.0, 6.0, 8.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015103816986083984, -0.00014526955783367157, -0.0001395009458065033, -0.00013373233377933502, -0.00012796372175216675, -0.00012219510972499847, -0.0001164264976978302, -0.00011065788567066193, -0.00010488927364349365, -9.912066161632538e-05, -9.33520495891571e-05, -8.758343756198883e-05, -8.181482553482056e-05, -7.604621350765228e-05, -7.027760148048401e-05, -6.450898945331573e-05, -5.874037742614746e-05, -5.297176539897919e-05, -4.720315337181091e-05, -4.143454134464264e-05, -3.5665929317474365e-05, -2.989731729030609e-05, -2.4128705263137817e-05, -1.8360093235969543e-05, -1.259148120880127e-05, -6.822869181632996e-06, -1.0542571544647217e-06, 4.714354872703552e-06, 1.0482966899871826e-05, 1.62515789270401e-05, 2.2020190954208374e-05, 2.7788802981376648e-05, 3.355741500854492e-05, 3.9326027035713196e-05, 4.509463906288147e-05, 5.0863251090049744e-05, 5.663186311721802e-05, 6.240047514438629e-05, 6.816908717155457e-05, 7.393769919872284e-05, 7.970631122589111e-05, 8.547492325305939e-05, 9.124353528022766e-05, 9.701214730739594e-05, 0.00010278075933456421, 0.00010854937136173248, 0.00011431798338890076, 0.00012008659541606903, 0.0001258552074432373, 0.00013162381947040558, 0.00013739243149757385, 0.00014316104352474213, 0.0001489296555519104, 0.00015469826757907867, 0.00016046687960624695, 0.00016623549163341522, 0.0001720041036605835, 0.00017777271568775177, 0.00018354132771492004, 0.00018930993974208832, 0.0001950785517692566, 0.00020084716379642487, 0.00020661577582359314, 0.00021238438785076141, 0.0002181529998779297]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 9.0, 4.0, 9.0, 27.0, 24.0, 48.0, 74.0, 88.0, 187.0, 326.0, 746.0, 1652.0, 5338.0, 29599.0, 409100.0, 557193.0, 34714.0, 5974.0, 1790.0, 786.0, 380.0, 213.0, 108.0, 63.0, 34.0, 22.0, 18.0, 11.0, 5.0, 5.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2802734375, -1.2329254150390625, -1.185577392578125, -1.1382293701171875, -1.09088134765625, -1.0435333251953125, -0.996185302734375, -0.9488372802734375, -0.9014892578125, -0.8541412353515625, -0.806793212890625, -0.7594451904296875, -0.71209716796875, -0.6647491455078125, -0.617401123046875, -0.5700531005859375, -0.522705078125, -0.4753570556640625, -0.428009033203125, -0.3806610107421875, -0.33331298828125, -0.2859649658203125, -0.238616943359375, -0.1912689208984375, -0.1439208984375, -0.0965728759765625, -0.049224853515625, -0.0018768310546875, 0.04547119140625, 0.0928192138671875, 0.140167236328125, 0.1875152587890625, 0.23486328125, 0.2822113037109375, 0.329559326171875, 0.3769073486328125, 0.42425537109375, 0.4716033935546875, 0.518951416015625, 0.5662994384765625, 0.6136474609375, 0.6609954833984375, 0.708343505859375, 0.7556915283203125, 0.80303955078125, 0.8503875732421875, 0.897735595703125, 0.9450836181640625, 0.992431640625, 1.0397796630859375, 1.087127685546875, 1.1344757080078125, 1.18182373046875, 1.2291717529296875, 1.276519775390625, 1.3238677978515625, 1.3712158203125, 1.4185638427734375, 1.465911865234375, 1.5132598876953125, 1.56060791015625, 1.6079559326171875, 1.655303955078125, 1.7026519775390625, 1.75]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 5.0, 6.0, 5.0, 7.0, 13.0, 16.0, 19.0, 22.0, 42.0, 41.0, 54.0, 81.0, 80.0, 108.0, 104.0, 74.0, 72.0, 62.0, 42.0, 25.0, 19.0, 25.0, 21.0, 14.0, 8.0, 7.0, 9.0, 6.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.62109375, -1.5816268920898438, -1.5421600341796875, -1.5026931762695312, -1.463226318359375, -1.4237594604492188, -1.3842926025390625, -1.3448257446289062, -1.30535888671875, -1.2658920288085938, -1.2264251708984375, -1.1869583129882812, -1.147491455078125, -1.1080245971679688, -1.0685577392578125, -1.0290908813476562, -0.9896240234375, -0.9501571655273438, -0.9106903076171875, -0.8712234497070312, -0.831756591796875, -0.7922897338867188, -0.7528228759765625, -0.7133560180664062, -0.67388916015625, -0.6344223022460938, -0.5949554443359375, -0.5554885864257812, -0.516021728515625, -0.47655487060546875, -0.4370880126953125, -0.39762115478515625, -0.358154296875, -0.31868743896484375, -0.2792205810546875, -0.23975372314453125, -0.200286865234375, -0.16082000732421875, -0.1213531494140625, -0.08188629150390625, -0.04241943359375, -0.00295257568359375, 0.0365142822265625, 0.07598114013671875, 0.115447998046875, 0.15491485595703125, 0.1943817138671875, 0.23384857177734375, 0.2733154296875, 0.31278228759765625, 0.3522491455078125, 0.39171600341796875, 0.431182861328125, 0.47064971923828125, 0.5101165771484375, 0.5495834350585938, 0.58905029296875, 0.6285171508789062, 0.6679840087890625, 0.7074508666992188, 0.746917724609375, 0.7863845825195312, 0.8258514404296875, 0.8653182983398438, 0.90478515625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 18.0, 56.0, 137.0, 323.0, 264.0, 134.0, 33.0, 20.0, 9.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.43658447265625, -13.213057518005371, -11.989530563354492, -10.766002655029297, -9.542476654052734, -8.318948745727539, -7.09542179107666, -5.871894836425781, -4.648367881774902, -3.4248409271240234, -2.2013137340545654, -0.9777865409851074, 0.24574041366577148, 1.4692673683166504, 2.6927947998046875, 3.9163217544555664, 5.139848709106445, 6.363375663757324, 7.586902618408203, 8.810430526733398, 10.033956527709961, 11.257484436035156, 12.481011390686035, 13.704538345336914, 14.928065299987793, 16.151592254638672, 17.375120162963867, 18.59864616394043, 19.822174072265625, 21.045700073242188, 22.269227981567383, 23.492755889892578, 24.71628189086914, 25.939809799194336, 27.1633358001709, 28.386863708496094, 29.610389709472656, 30.83391761779785, 32.05744552612305, 33.28097152709961, 34.50449752807617, 35.728023529052734, 36.95155334472656, 38.175079345703125, 39.39860534667969, 40.62213134765625, 41.84566116333008, 43.06918716430664, 44.29271697998047, 45.51624298095703, 46.73977279663086, 47.96329879760742, 49.186824798583984, 50.41035079956055, 51.633880615234375, 52.85740661621094, 54.0809326171875, 55.30445861816406, 56.52798843383789, 57.75151443481445, 58.975040435791016, 60.19856643676758, 61.422096252441406, 62.64562225341797, 63.86914825439453]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 8.0, 6.0, 4.0, 7.0, 11.0, 8.0, 11.0, 21.0, 46.0, 39.0, 33.0, 53.0, 65.0, 69.0, 80.0, 89.0, 71.0, 58.0, 46.0, 38.0, 37.0, 46.0, 34.0, 22.0, 24.0, 16.0, 14.0, 13.0, 11.0, 6.0, 5.0, 6.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.751739501953125, -11.231823921203613, -10.711908340454102, -10.19199275970459, -9.672077178955078, -9.152161598205566, -8.632246017456055, -8.112329483032227, -7.592414379119873, -7.072498798370361, -6.55258321762085, -6.03266716003418, -5.512751579284668, -4.992835998535156, -4.4729204177856445, -3.953004837036133, -3.433089256286621, -2.9131736755371094, -2.3932580947875977, -1.8733422756195068, -1.3534266948699951, -0.8335111141204834, -0.3135952949523926, 0.20632028579711914, 0.7262358665466309, 1.2461514472961426, 1.7660671472549438, 2.285982847213745, 2.805898427963257, 3.3258140087127686, 3.8457298278808594, 4.365645408630371, 4.885560989379883, 5.4054765701293945, 5.925392150878906, 6.445307731628418, 6.96522331237793, 7.485138893127441, 8.005054473876953, 8.524971008300781, 9.044885635375977, 9.564801216125488, 10.084716796875, 10.604632377624512, 11.124547958374023, 11.644463539123535, 12.164379119873047, 12.684295654296875, 13.204211235046387, 13.724126815795898, 14.24404239654541, 14.763957977294922, 15.283873558044434, 15.803789138793945, 16.323705673217773, 16.84362030029297, 17.363536834716797, 17.883453369140625, 18.40336799621582, 18.92328453063965, 19.443199157714844, 19.963115692138672, 20.483030319213867, 21.002946853637695, 21.52286148071289]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 12.0, 15.0, 11.0, 16.0, 19.0, 19.0, 47.0, 38.0, 66.0, 83.0, 116.0, 151.0, 283.0, 678.0, 2367.0, 11775.0, 127311.0, 3897709.0, 137602.0, 11780.0, 2342.0, 784.0, 344.0, 205.0, 104.0, 84.0, 70.0, 53.0, 37.0, 37.0, 22.0, 19.0, 23.0, 11.0, 11.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.927734375, -2.831787109375, -2.73583984375, -2.639892578125, -2.5439453125, -2.447998046875, -2.35205078125, -2.256103515625, -2.16015625, -2.064208984375, -1.96826171875, -1.872314453125, -1.7763671875, -1.680419921875, -1.58447265625, -1.488525390625, -1.392578125, -1.296630859375, -1.20068359375, -1.104736328125, -1.0087890625, -0.912841796875, -0.81689453125, -0.720947265625, -0.625, -0.529052734375, -0.43310546875, -0.337158203125, -0.2412109375, -0.145263671875, -0.04931640625, 0.046630859375, 0.142578125, 0.238525390625, 0.33447265625, 0.430419921875, 0.5263671875, 0.622314453125, 0.71826171875, 0.814208984375, 0.91015625, 1.006103515625, 1.10205078125, 1.197998046875, 1.2939453125, 1.389892578125, 1.48583984375, 1.581787109375, 1.677734375, 1.773681640625, 1.86962890625, 1.965576171875, 2.0615234375, 2.157470703125, 2.25341796875, 2.349365234375, 2.4453125, 2.541259765625, 2.63720703125, 2.733154296875, 2.8291015625, 2.925048828125, 3.02099609375, 3.116943359375, 3.212890625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 13.0, 27.0, 44.0, 44.0, 70.0, 99.0, 108.0, 111.0, 117.0, 88.0, 85.0, 66.0, 51.0, 33.0, 17.0, 9.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83251953125, -0.7859725952148438, -0.7394256591796875, -0.6928787231445312, -0.646331787109375, -0.5997848510742188, -0.5532379150390625, -0.5066909790039062, -0.46014404296875, -0.41359710693359375, -0.3670501708984375, -0.32050323486328125, -0.273956298828125, -0.22740936279296875, -0.1808624267578125, -0.13431549072265625, -0.0877685546875, -0.04122161865234375, 0.0053253173828125, 0.05187225341796875, 0.098419189453125, 0.14496612548828125, 0.1915130615234375, 0.23805999755859375, 0.28460693359375, 0.33115386962890625, 0.3777008056640625, 0.42424774169921875, 0.470794677734375, 0.5173416137695312, 0.5638885498046875, 0.6104354858398438, 0.656982421875, 0.7035293579101562, 0.7500762939453125, 0.7966232299804688, 0.843170166015625, 0.8897171020507812, 0.9362640380859375, 0.9828109741210938, 1.02935791015625, 1.0759048461914062, 1.1224517822265625, 1.1689987182617188, 1.215545654296875, 1.2620925903320312, 1.3086395263671875, 1.3551864624023438, 1.4017333984375, 1.4482803344726562, 1.4948272705078125, 1.5413742065429688, 1.587921142578125, 1.6344680786132812, 1.6810150146484375, 1.7275619506835938, 1.77410888671875, 1.8206558227539062, 1.8672027587890625, 1.9137496948242188, 1.960296630859375, 2.0068435668945312, 2.0533905029296875, 2.0999374389648438, 2.146484375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 0.0, 7.0, 7.0, 7.0, 11.0, 14.0, 22.0, 45.0, 96.0, 196.0, 478.0, 1216.0, 3835.0, 12734.0, 54186.0, 584974.0, 3351725.0, 150708.0, 24559.0, 6208.0, 1979.0, 753.0, 279.0, 116.0, 61.0, 33.0, 14.0, 8.0, 7.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.39453125, -2.3266448974609375, -2.258758544921875, -2.1908721923828125, -2.12298583984375, -2.0550994873046875, -1.987213134765625, -1.9193267822265625, -1.8514404296875, -1.7835540771484375, -1.715667724609375, -1.6477813720703125, -1.57989501953125, -1.5120086669921875, -1.444122314453125, -1.3762359619140625, -1.308349609375, -1.2404632568359375, -1.172576904296875, -1.1046905517578125, -1.03680419921875, -0.9689178466796875, -0.901031494140625, -0.8331451416015625, -0.7652587890625, -0.6973724365234375, -0.629486083984375, -0.5615997314453125, -0.49371337890625, -0.4258270263671875, -0.357940673828125, -0.2900543212890625, -0.22216796875, -0.1542816162109375, -0.086395263671875, -0.0185089111328125, 0.04937744140625, 0.1172637939453125, 0.185150146484375, 0.2530364990234375, 0.3209228515625, 0.3888092041015625, 0.456695556640625, 0.5245819091796875, 0.59246826171875, 0.6603546142578125, 0.728240966796875, 0.7961273193359375, 0.864013671875, 0.9319000244140625, 0.999786376953125, 1.0676727294921875, 1.13555908203125, 1.2034454345703125, 1.271331787109375, 1.3392181396484375, 1.4071044921875, 1.4749908447265625, 1.542877197265625, 1.6107635498046875, 1.67864990234375, 1.7465362548828125, 1.814422607421875, 1.8823089599609375, 1.9501953125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 8.0, 6.0, 8.0, 11.0, 22.0, 30.0, 32.0, 44.0, 69.0, 114.0, 191.0, 357.0, 753.0, 1146.0, 631.0, 287.0, 129.0, 94.0, 35.0, 34.0, 13.0, 17.0, 10.0, 6.0, 9.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.328125, -2.2656402587890625, -2.203155517578125, -2.1406707763671875, -2.07818603515625, -2.0157012939453125, -1.953216552734375, -1.8907318115234375, -1.8282470703125, -1.7657623291015625, -1.703277587890625, -1.6407928466796875, -1.57830810546875, -1.5158233642578125, -1.453338623046875, -1.3908538818359375, -1.328369140625, -1.2658843994140625, -1.203399658203125, -1.1409149169921875, -1.07843017578125, -1.0159454345703125, -0.953460693359375, -0.8909759521484375, -0.8284912109375, -0.7660064697265625, -0.703521728515625, -0.6410369873046875, -0.57855224609375, -0.5160675048828125, -0.453582763671875, -0.3910980224609375, -0.32861328125, -0.2661285400390625, -0.203643798828125, -0.1411590576171875, -0.07867431640625, -0.0161895751953125, 0.046295166015625, 0.1087799072265625, 0.1712646484375, 0.2337493896484375, 0.296234130859375, 0.3587188720703125, 0.42120361328125, 0.4836883544921875, 0.546173095703125, 0.6086578369140625, 0.671142578125, 0.7336273193359375, 0.796112060546875, 0.8585968017578125, 0.92108154296875, 0.9835662841796875, 1.046051025390625, 1.1085357666015625, 1.1710205078125, 1.2335052490234375, 1.295989990234375, 1.3584747314453125, 1.42095947265625, 1.4834442138671875, 1.545928955078125, 1.6084136962890625, 1.6708984375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 5.0, 5.0, 13.0, 17.0, 47.0, 192.0, 378.0, 262.0, 68.0, 9.0, 8.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.10574722290039, -25.055419921875, -24.00509262084961, -22.95476531982422, -21.904438018798828, -20.854110717773438, -19.80378532409668, -18.75345802307129, -17.7031307220459, -16.652803421020508, -15.602476119995117, -14.552149772644043, -13.501822471618652, -12.451495170593262, -11.401168823242188, -10.350841522216797, -9.300514221191406, -8.250186920166016, -7.199860095977783, -6.149533271789551, -5.09920597076416, -4.0488786697387695, -2.998551845550537, -1.9482250213623047, -0.8978977203369141, 0.15242934226989746, 1.202756404876709, 2.2530834674835205, 3.303410530090332, 4.353737831115723, 5.404064655303955, 6.4543914794921875, 7.504722595214844, 8.555049896240234, 9.605377197265625, 10.6557035446167, 11.70603084564209, 12.75635814666748, 13.806684494018555, 14.857011795043945, 15.907339096069336, 16.957666397094727, 18.007993698120117, 19.058320999145508, 20.108646392822266, 21.158973693847656, 22.209300994873047, 23.259628295898438, 24.309955596923828, 25.36028289794922, 26.41061019897461, 27.4609375, 28.51126480102539, 29.56159210205078, 30.61191749572754, 31.66224479675293, 32.71257019042969, 33.76289749145508, 34.81322479248047, 35.86355209350586, 36.91387939453125, 37.96420669555664, 39.01453399658203, 40.064857482910156, 41.11518859863281]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 10.0, 8.0, 18.0, 24.0, 25.0, 32.0, 23.0, 35.0, 42.0, 37.0, 42.0, 49.0, 42.0, 63.0, 54.0, 57.0, 64.0, 46.0, 41.0, 45.0, 42.0, 34.0, 27.0, 27.0, 24.0, 14.0, 16.0, 12.0, 8.0, 11.0, 3.0, 8.0, 4.0, 4.0, 0.0, 3.0], "bins": [-10.711135864257812, -10.457696914672852, -10.204257011413574, -9.950818061828613, -9.697378158569336, -9.443939208984375, -9.190499305725098, -8.937060356140137, -8.68362045288086, -8.430181503295898, -8.176741600036621, -7.923302173614502, -7.669862747192383, -7.416423797607422, -7.162984371185303, -6.909544944763184, -6.656105995178223, -6.4026665687561035, -6.149227142333984, -5.895787715911865, -5.642348289489746, -5.388909339904785, -5.135469913482666, -4.882030487060547, -4.628591060638428, -4.375151634216309, -4.1217122077941895, -3.8682730197906494, -3.6148335933685303, -3.361394166946411, -3.107954978942871, -2.854515552520752, -2.601077079772949, -2.34763765335083, -2.094198226928711, -1.840759038925171, -1.5873196125030518, -1.3338801860809326, -1.080440878868103, -0.8270015716552734, -0.5735621452331543, -0.32012277841567993, -0.06668341159820557, 0.1867559552192688, 0.44019532203674316, 0.6936347484588623, 0.9470740556716919, 1.2005133628845215, 1.4539527893066406, 1.7073922157287598, 1.9608315229415894, 2.214270830154419, 2.467710256576538, 2.7211496829986572, 2.9745888710021973, 3.2280282974243164, 3.4814677238464355, 3.7349071502685547, 3.988346576690674, 4.241786003112793, 4.495224952697754, 4.748664855957031, 5.002103805541992, 5.255543231964111, 5.5089826583862305]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 5.0, 5.0, 13.0, 13.0, 9.0, 35.0, 47.0, 61.0, 106.0, 172.0, 288.0, 445.0, 816.0, 1507.0, 2882.0, 5551.0, 11118.0, 23821.0, 53453.0, 127223.0, 285567.0, 294750.0, 134754.0, 56726.0, 25182.0, 11806.0, 5649.0, 2898.0, 1573.0, 898.0, 443.0, 296.0, 180.0, 99.0, 59.0, 37.0, 26.0, 17.0, 12.0, 10.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.134765625, -1.0942840576171875, -1.053802490234375, -1.0133209228515625, -0.97283935546875, -0.9323577880859375, -0.891876220703125, -0.8513946533203125, -0.8109130859375, -0.7704315185546875, -0.729949951171875, -0.6894683837890625, -0.64898681640625, -0.6085052490234375, -0.568023681640625, -0.5275421142578125, -0.487060546875, -0.4465789794921875, -0.406097412109375, -0.3656158447265625, -0.32513427734375, -0.2846527099609375, -0.244171142578125, -0.2036895751953125, -0.1632080078125, -0.1227264404296875, -0.082244873046875, -0.0417633056640625, -0.00128173828125, 0.0391998291015625, 0.079681396484375, 0.1201629638671875, 0.16064453125, 0.2011260986328125, 0.241607666015625, 0.2820892333984375, 0.32257080078125, 0.3630523681640625, 0.403533935546875, 0.4440155029296875, 0.4844970703125, 0.5249786376953125, 0.565460205078125, 0.6059417724609375, 0.64642333984375, 0.6869049072265625, 0.727386474609375, 0.7678680419921875, 0.808349609375, 0.8488311767578125, 0.889312744140625, 0.9297943115234375, 0.97027587890625, 1.0107574462890625, 1.051239013671875, 1.0917205810546875, 1.1322021484375, 1.1726837158203125, 1.213165283203125, 1.2536468505859375, 1.29412841796875, 1.3346099853515625, 1.375091552734375, 1.4155731201171875, 1.4560546875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 8.0, 3.0, 5.0, 5.0, 9.0, 19.0, 25.0, 19.0, 31.0, 33.0, 42.0, 40.0, 40.0, 44.0, 50.0, 59.0, 51.0, 56.0, 47.0, 56.0, 46.0, 55.0, 41.0, 41.0, 30.0, 29.0, 33.0, 23.0, 11.0, 11.0, 9.0, 8.0, 9.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.658203125, -0.6350555419921875, -0.611907958984375, -0.5887603759765625, -0.56561279296875, -0.5424652099609375, -0.519317626953125, -0.4961700439453125, -0.4730224609375, -0.4498748779296875, -0.426727294921875, -0.4035797119140625, -0.38043212890625, -0.3572845458984375, -0.334136962890625, -0.3109893798828125, -0.287841796875, -0.2646942138671875, -0.241546630859375, -0.2183990478515625, -0.19525146484375, -0.1721038818359375, -0.148956298828125, -0.1258087158203125, -0.1026611328125, -0.0795135498046875, -0.056365966796875, -0.0332183837890625, -0.01007080078125, 0.0130767822265625, 0.036224365234375, 0.0593719482421875, 0.08251953125, 0.1056671142578125, 0.128814697265625, 0.1519622802734375, 0.17510986328125, 0.1982574462890625, 0.221405029296875, 0.2445526123046875, 0.2677001953125, 0.2908477783203125, 0.313995361328125, 0.3371429443359375, 0.36029052734375, 0.3834381103515625, 0.406585693359375, 0.4297332763671875, 0.452880859375, 0.4760284423828125, 0.499176025390625, 0.5223236083984375, 0.54547119140625, 0.5686187744140625, 0.591766357421875, 0.6149139404296875, 0.6380615234375, 0.6612091064453125, 0.684356689453125, 0.7075042724609375, 0.73065185546875, 0.7537994384765625, 0.776947021484375, 0.8000946044921875, 0.8232421875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 6.0, 10.0, 4.0, 10.0, 13.0, 24.0, 17.0, 38.0, 44.0, 62.0, 74.0, 137.0, 173.0, 250.0, 415.0, 619.0, 1048.0, 2073.0, 4542.0, 12419.0, 40258.0, 154658.0, 550894.0, 203435.0, 50745.0, 15429.0, 5493.0, 2410.0, 1250.0, 662.0, 448.0, 270.0, 184.0, 121.0, 100.0, 55.0, 34.0, 30.0, 21.0, 22.0, 16.0, 11.0, 5.0, 4.0, 6.0, 7.0, 5.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.8623046875, -1.8033599853515625, -1.744415283203125, -1.6854705810546875, -1.62652587890625, -1.5675811767578125, -1.508636474609375, -1.4496917724609375, -1.3907470703125, -1.3318023681640625, -1.272857666015625, -1.2139129638671875, -1.15496826171875, -1.0960235595703125, -1.037078857421875, -0.9781341552734375, -0.919189453125, -0.8602447509765625, -0.801300048828125, -0.7423553466796875, -0.68341064453125, -0.6244659423828125, -0.565521240234375, -0.5065765380859375, -0.4476318359375, -0.3886871337890625, -0.329742431640625, -0.2707977294921875, -0.21185302734375, -0.1529083251953125, -0.093963623046875, -0.0350189208984375, 0.02392578125, 0.0828704833984375, 0.141815185546875, 0.2007598876953125, 0.25970458984375, 0.3186492919921875, 0.377593994140625, 0.4365386962890625, 0.4954833984375, 0.5544281005859375, 0.613372802734375, 0.6723175048828125, 0.73126220703125, 0.7902069091796875, 0.849151611328125, 0.9080963134765625, 0.967041015625, 1.0259857177734375, 1.084930419921875, 1.1438751220703125, 1.20281982421875, 1.2617645263671875, 1.320709228515625, 1.3796539306640625, 1.4385986328125, 1.4975433349609375, 1.556488037109375, 1.6154327392578125, 1.67437744140625, 1.7333221435546875, 1.792266845703125, 1.8512115478515625, 1.91015625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 2.0, 6.0, 8.0, 3.0, 11.0, 11.0, 16.0, 18.0, 14.0, 20.0, 22.0, 27.0, 37.0, 37.0, 33.0, 33.0, 28.0, 24.0, 41.0, 45.0, 34.0, 43.0, 43.0, 35.0, 39.0, 34.0, 30.0, 34.0, 38.0, 24.0, 29.0, 19.0, 24.0, 23.0, 14.0, 20.0, 11.0, 11.0, 10.0, 5.0, 16.0, 7.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.0234375, -1.95928955078125, -1.8951416015625, -1.83099365234375, -1.766845703125, -1.70269775390625, -1.6385498046875, -1.57440185546875, -1.51025390625, -1.44610595703125, -1.3819580078125, -1.31781005859375, -1.253662109375, -1.18951416015625, -1.1253662109375, -1.06121826171875, -0.9970703125, -0.93292236328125, -0.8687744140625, -0.80462646484375, -0.740478515625, -0.67633056640625, -0.6121826171875, -0.54803466796875, -0.48388671875, -0.41973876953125, -0.3555908203125, -0.29144287109375, -0.227294921875, -0.16314697265625, -0.0989990234375, -0.03485107421875, 0.029296875, 0.09344482421875, 0.1575927734375, 0.22174072265625, 0.285888671875, 0.35003662109375, 0.4141845703125, 0.47833251953125, 0.54248046875, 0.60662841796875, 0.6707763671875, 0.73492431640625, 0.799072265625, 0.86322021484375, 0.9273681640625, 0.99151611328125, 1.0556640625, 1.11981201171875, 1.1839599609375, 1.24810791015625, 1.312255859375, 1.37640380859375, 1.4405517578125, 1.50469970703125, 1.56884765625, 1.63299560546875, 1.6971435546875, 1.76129150390625, 1.825439453125, 1.88958740234375, 1.9537353515625, 2.01788330078125, 2.08203125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 12.0, 15.0, 17.0, 27.0, 36.0, 49.0, 84.0, 157.0, 336.0, 775.0, 2115.0, 9312.0, 91134.0, 817017.0, 112861.0, 10738.0, 2321.0, 772.0, 344.0, 155.0, 96.0, 55.0, 38.0, 29.0, 17.0, 11.0, 9.0, 9.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.408203125, -1.358856201171875, -1.30950927734375, -1.260162353515625, -1.2108154296875, -1.161468505859375, -1.11212158203125, -1.062774658203125, -1.013427734375, -0.964080810546875, -0.91473388671875, -0.865386962890625, -0.8160400390625, -0.766693115234375, -0.71734619140625, -0.667999267578125, -0.61865234375, -0.569305419921875, -0.51995849609375, -0.470611572265625, -0.4212646484375, -0.371917724609375, -0.32257080078125, -0.273223876953125, -0.223876953125, -0.174530029296875, -0.12518310546875, -0.075836181640625, -0.0264892578125, 0.022857666015625, 0.07220458984375, 0.121551513671875, 0.1708984375, 0.220245361328125, 0.26959228515625, 0.318939208984375, 0.3682861328125, 0.417633056640625, 0.46697998046875, 0.516326904296875, 0.565673828125, 0.615020751953125, 0.66436767578125, 0.713714599609375, 0.7630615234375, 0.812408447265625, 0.86175537109375, 0.911102294921875, 0.96044921875, 1.009796142578125, 1.05914306640625, 1.108489990234375, 1.1578369140625, 1.207183837890625, 1.25653076171875, 1.305877685546875, 1.355224609375, 1.404571533203125, 1.45391845703125, 1.503265380859375, 1.5526123046875, 1.601959228515625, 1.65130615234375, 1.700653076171875, 1.75]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 8.0, 6.0, 13.0, 26.0, 46.0, 92.0, 194.0, 238.0, 191.0, 87.0, 42.0, 23.0, 11.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000377655029296875, -0.00036153942346572876, -0.0003454238176345825, -0.0003293082118034363, -0.00031319260597229004, -0.0002970770001411438, -0.00028096139430999756, -0.0002648457884788513, -0.0002487301826477051, -0.00023261457681655884, -0.0002164989709854126, -0.00020038336515426636, -0.00018426775932312012, -0.00016815215349197388, -0.00015203654766082764, -0.0001359209418296814, -0.00011980533599853516, -0.00010368973016738892, -8.757412433624268e-05, -7.145851850509644e-05, -5.5342912673950195e-05, -3.9227306842803955e-05, -2.3111701011657715e-05, -6.996095180511475e-06, 9.119510650634766e-06, 2.5235116481781006e-05, 4.1350722312927246e-05, 5.7466328144073486e-05, 7.358193397521973e-05, 8.969753980636597e-05, 0.00010581314563751221, 0.00012192875146865845, 0.0001380443572998047, 0.00015415996313095093, 0.00017027556896209717, 0.0001863911747932434, 0.00020250678062438965, 0.0002186223864555359, 0.00023473799228668213, 0.00025085359811782837, 0.0002669692039489746, 0.00028308480978012085, 0.0002992004156112671, 0.00031531602144241333, 0.00033143162727355957, 0.0003475472331047058, 0.00036366283893585205, 0.0003797784447669983, 0.00039589405059814453, 0.00041200965642929077, 0.000428125262260437, 0.00044424086809158325, 0.0004603564739227295, 0.00047647207975387573, 0.000492587685585022, 0.0005087032914161682, 0.0005248188972473145, 0.0005409345030784607, 0.0005570501089096069, 0.0005731657147407532, 0.0005892813205718994, 0.0006053969264030457, 0.0006215125322341919, 0.0006376281380653381, 0.0006537437438964844]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 7.0, 5.0, 5.0, 8.0, 12.0, 27.0, 25.0, 39.0, 59.0, 87.0, 114.0, 206.0, 332.0, 606.0, 1262.0, 2951.0, 8537.0, 35387.0, 229789.0, 630006.0, 109721.0, 19550.0, 5557.0, 2104.0, 926.0, 445.0, 277.0, 152.0, 101.0, 71.0, 56.0, 44.0, 26.0, 16.0, 9.0, 15.0, 7.0, 4.0, 3.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.99267578125, -0.9628753662109375, -0.933074951171875, -0.9032745361328125, -0.87347412109375, -0.8436737060546875, -0.813873291015625, -0.7840728759765625, -0.7542724609375, -0.7244720458984375, -0.694671630859375, -0.6648712158203125, -0.63507080078125, -0.6052703857421875, -0.575469970703125, -0.5456695556640625, -0.515869140625, -0.4860687255859375, -0.456268310546875, -0.4264678955078125, -0.39666748046875, -0.3668670654296875, -0.337066650390625, -0.3072662353515625, -0.2774658203125, -0.2476654052734375, -0.217864990234375, -0.1880645751953125, -0.15826416015625, -0.1284637451171875, -0.098663330078125, -0.0688629150390625, -0.0390625, -0.0092620849609375, 0.020538330078125, 0.0503387451171875, 0.08013916015625, 0.1099395751953125, 0.139739990234375, 0.1695404052734375, 0.1993408203125, 0.2291412353515625, 0.258941650390625, 0.2887420654296875, 0.31854248046875, 0.3483428955078125, 0.378143310546875, 0.4079437255859375, 0.437744140625, 0.4675445556640625, 0.497344970703125, 0.5271453857421875, 0.55694580078125, 0.5867462158203125, 0.616546630859375, 0.6463470458984375, 0.6761474609375, 0.7059478759765625, 0.735748291015625, 0.7655487060546875, 0.79534912109375, 0.8251495361328125, 0.854949951171875, 0.8847503662109375, 0.91455078125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 2.0, 6.0, 6.0, 3.0, 8.0, 14.0, 11.0, 18.0, 13.0, 25.0, 32.0, 32.0, 40.0, 50.0, 52.0, 58.0, 70.0, 64.0, 85.0, 65.0, 64.0, 44.0, 40.0, 37.0, 27.0, 27.0, 23.0, 14.0, 13.0, 11.0, 9.0, 8.0, 7.0, 7.0, 4.0, 2.0, 1.0, 1.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5595703125, -0.5370025634765625, -0.514434814453125, -0.4918670654296875, -0.46929931640625, -0.4467315673828125, -0.424163818359375, -0.4015960693359375, -0.3790283203125, -0.3564605712890625, -0.333892822265625, -0.3113250732421875, -0.28875732421875, -0.2661895751953125, -0.243621826171875, -0.2210540771484375, -0.198486328125, -0.1759185791015625, -0.153350830078125, -0.1307830810546875, -0.10821533203125, -0.0856475830078125, -0.063079833984375, -0.0405120849609375, -0.0179443359375, 0.0046234130859375, 0.027191162109375, 0.0497589111328125, 0.07232666015625, 0.0948944091796875, 0.117462158203125, 0.1400299072265625, 0.16259765625, 0.1851654052734375, 0.207733154296875, 0.2303009033203125, 0.25286865234375, 0.2754364013671875, 0.298004150390625, 0.3205718994140625, 0.3431396484375, 0.3657073974609375, 0.388275146484375, 0.4108428955078125, 0.43341064453125, 0.4559783935546875, 0.478546142578125, 0.5011138916015625, 0.523681640625, 0.5462493896484375, 0.568817138671875, 0.5913848876953125, 0.61395263671875, 0.6365203857421875, 0.659088134765625, 0.6816558837890625, 0.7042236328125, 0.7267913818359375, 0.749359130859375, 0.7719268798828125, 0.79449462890625, 0.8170623779296875, 0.839630126953125, 0.8621978759765625, 0.884765625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 2.0, 5.0, 8.0, 21.0, 51.0, 129.0, 244.0, 279.0, 137.0, 67.0, 31.0, 12.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.25227165222168, -27.34659767150879, -26.4409236907959, -25.535247802734375, -24.629573822021484, -23.723899841308594, -22.818225860595703, -21.912551879882812, -21.006877899169922, -20.10120391845703, -19.19552993774414, -18.28985595703125, -17.384180068969727, -16.478506088256836, -15.572832107543945, -14.667158126831055, -13.761483192443848, -12.855809211730957, -11.95013427734375, -11.04446029663086, -10.138786315917969, -9.233112335205078, -8.327437400817871, -7.4217634201049805, -6.516088962554932, -5.610414505004883, -4.704740524291992, -3.7990660667419434, -2.8933918476104736, -1.987717628479004, -1.082043170928955, -0.17636919021606445, 0.7293052673339844, 1.634979486465454, 2.540653705596924, 3.4463281631469727, 4.352002143859863, 5.257676601409912, 6.163351058959961, 7.069025039672852, 7.9746994972229, 8.88037395477295, 9.78604793548584, 10.691722869873047, 11.597396850585938, 12.503070831298828, 13.408744812011719, 14.31441879272461, 15.220093727111816, 16.125768661499023, 17.031442642211914, 17.937116622924805, 18.842790603637695, 19.748464584350586, 20.65414047241211, 21.559814453125, 22.46548843383789, 23.37116241455078, 24.276836395263672, 25.182510375976562, 26.088186264038086, 26.993860244750977, 27.899534225463867, 28.805208206176758, 29.71088218688965]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 7.0, 7.0, 4.0, 6.0, 9.0, 17.0, 11.0, 10.0, 14.0, 25.0, 20.0, 29.0, 29.0, 32.0, 38.0, 35.0, 41.0, 51.0, 70.0, 61.0, 57.0, 55.0, 48.0, 47.0, 38.0, 38.0, 40.0, 25.0, 32.0, 20.0, 15.0, 13.0, 8.0, 12.0, 10.0, 9.0, 7.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.498224258422852, -12.157544136047363, -11.816864967346191, -11.476184844970703, -11.135505676269531, -10.794825553894043, -10.454146385192871, -10.113466262817383, -9.772787094116211, -9.432106971740723, -9.09142780303955, -8.750747680664062, -8.41006851196289, -8.069388389587402, -7.7287092208862305, -7.388029098510742, -7.047349452972412, -6.706669807434082, -6.365990161895752, -6.025310516357422, -5.684630870819092, -5.343951225280762, -5.003271102905273, -4.662591934204102, -4.321911811828613, -3.981232166290283, -3.640552520751953, -3.299872875213623, -2.959193229675293, -2.618513584136963, -2.2778337001800537, -1.9371540546417236, -1.5964746475219727, -1.2557950019836426, -0.9151152968406677, -0.5744355916976929, -0.2337559461593628, 0.10692369937896729, 0.4476034641265869, 0.788283109664917, 1.128962755203247, 1.4696424007415771, 1.8103220462799072, 2.1510019302368164, 2.4916815757751465, 2.8323612213134766, 3.1730408668518066, 3.5137205123901367, 3.854400157928467, 4.195079803466797, 4.535759449005127, 4.876439094543457, 5.217118740081787, 5.557798385620117, 5.8984785079956055, 6.239157676696777, 6.579837799072266, 6.920517444610596, 7.261197090148926, 7.601876735687256, 7.942556381225586, 8.283236503601074, 8.623915672302246, 8.964595794677734, 9.305274963378906]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 5.0, 5.0, 4.0, 8.0, 6.0, 7.0, 15.0, 36.0, 31.0, 47.0, 82.0, 128.0, 258.0, 556.0, 1492.0, 4192.0, 13673.0, 53873.0, 323976.0, 2676048.0, 972448.0, 111423.0, 24484.0, 7242.0, 2403.0, 955.0, 406.0, 202.0, 113.0, 58.0, 29.0, 24.0, 14.0, 18.0, 6.0, 7.0, 8.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.7373046875, -1.6956710815429688, -1.6540374755859375, -1.6124038696289062, -1.570770263671875, -1.5291366577148438, -1.4875030517578125, -1.4458694458007812, -1.40423583984375, -1.3626022338867188, -1.3209686279296875, -1.2793350219726562, -1.237701416015625, -1.1960678100585938, -1.1544342041015625, -1.1128005981445312, -1.0711669921875, -1.0295333862304688, -0.9878997802734375, -0.9462661743164062, -0.904632568359375, -0.8629989624023438, -0.8213653564453125, -0.7797317504882812, -0.73809814453125, -0.6964645385742188, -0.6548309326171875, -0.6131973266601562, -0.571563720703125, -0.5299301147460938, -0.4882965087890625, -0.44666290283203125, -0.405029296875, -0.36339569091796875, -0.3217620849609375, -0.28012847900390625, -0.238494873046875, -0.19686126708984375, -0.1552276611328125, -0.11359405517578125, -0.07196044921875, -0.03032684326171875, 0.0113067626953125, 0.05294036865234375, 0.094573974609375, 0.13620758056640625, 0.1778411865234375, 0.21947479248046875, 0.2611083984375, 0.30274200439453125, 0.3443756103515625, 0.38600921630859375, 0.427642822265625, 0.46927642822265625, 0.5109100341796875, 0.5525436401367188, 0.59417724609375, 0.6358108520507812, 0.6774444580078125, 0.7190780639648438, 0.760711669921875, 0.8023452758789062, 0.8439788818359375, 0.8856124877929688, 0.92724609375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 8.0, 5.0, 11.0, 7.0, 17.0, 21.0, 17.0, 24.0, 41.0, 30.0, 52.0, 43.0, 40.0, 60.0, 55.0, 56.0, 69.0, 45.0, 48.0, 54.0, 42.0, 35.0, 36.0, 34.0, 30.0, 23.0, 24.0, 23.0, 12.0, 11.0, 10.0, 10.0, 5.0, 3.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73681640625, -0.7147216796875, -0.692626953125, -0.6705322265625, -0.6484375, -0.6263427734375, -0.604248046875, -0.5821533203125, -0.56005859375, -0.5379638671875, -0.515869140625, -0.4937744140625, -0.4716796875, -0.4495849609375, -0.427490234375, -0.4053955078125, -0.38330078125, -0.3612060546875, -0.339111328125, -0.3170166015625, -0.294921875, -0.2728271484375, -0.250732421875, -0.2286376953125, -0.20654296875, -0.1844482421875, -0.162353515625, -0.1402587890625, -0.1181640625, -0.0960693359375, -0.073974609375, -0.0518798828125, -0.02978515625, -0.0076904296875, 0.014404296875, 0.0364990234375, 0.05859375, 0.0806884765625, 0.102783203125, 0.1248779296875, 0.14697265625, 0.1690673828125, 0.191162109375, 0.2132568359375, 0.2353515625, 0.2574462890625, 0.279541015625, 0.3016357421875, 0.32373046875, 0.3458251953125, 0.367919921875, 0.3900146484375, 0.412109375, 0.4342041015625, 0.456298828125, 0.4783935546875, 0.50048828125, 0.5225830078125, 0.544677734375, 0.5667724609375, 0.5888671875, 0.6109619140625, 0.633056640625, 0.6551513671875, 0.67724609375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 5.0, 2.0, 12.0, 19.0, 23.0, 30.0, 40.0, 85.0, 194.0, 444.0, 1163.0, 3794.0, 17310.0, 131148.0, 2880317.0, 1076710.0, 67455.0, 11192.0, 2654.0, 906.0, 375.0, 154.0, 103.0, 54.0, 26.0, 17.0, 21.0, 16.0, 6.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.662109375, -2.5935821533203125, -2.525054931640625, -2.4565277099609375, -2.38800048828125, -2.3194732666015625, -2.250946044921875, -2.1824188232421875, -2.1138916015625, -2.0453643798828125, -1.976837158203125, -1.9083099365234375, -1.83978271484375, -1.7712554931640625, -1.702728271484375, -1.6342010498046875, -1.565673828125, -1.4971466064453125, -1.428619384765625, -1.3600921630859375, -1.29156494140625, -1.2230377197265625, -1.154510498046875, -1.0859832763671875, -1.0174560546875, -0.9489288330078125, -0.880401611328125, -0.8118743896484375, -0.74334716796875, -0.6748199462890625, -0.606292724609375, -0.5377655029296875, -0.46923828125, -0.4007110595703125, -0.332183837890625, -0.2636566162109375, -0.19512939453125, -0.1266021728515625, -0.058074951171875, 0.0104522705078125, 0.0789794921875, 0.1475067138671875, 0.216033935546875, 0.2845611572265625, 0.35308837890625, 0.4216156005859375, 0.490142822265625, 0.5586700439453125, 0.627197265625, 0.6957244873046875, 0.764251708984375, 0.8327789306640625, 0.90130615234375, 0.9698333740234375, 1.038360595703125, 1.1068878173828125, 1.1754150390625, 1.2439422607421875, 1.312469482421875, 1.3809967041015625, 1.44952392578125, 1.5180511474609375, 1.586578369140625, 1.6551055908203125, 1.7236328125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 7.0, 7.0, 8.0, 12.0, 19.0, 25.0, 38.0, 50.0, 63.0, 80.0, 130.0, 173.0, 342.0, 495.0, 729.0, 666.0, 412.0, 255.0, 155.0, 119.0, 70.0, 54.0, 33.0, 36.0, 26.0, 15.0, 16.0, 12.0, 7.0, 7.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5400390625, -1.4846649169921875, -1.429290771484375, -1.3739166259765625, -1.31854248046875, -1.2631683349609375, -1.207794189453125, -1.1524200439453125, -1.0970458984375, -1.0416717529296875, -0.986297607421875, -0.9309234619140625, -0.87554931640625, -0.8201751708984375, -0.764801025390625, -0.7094268798828125, -0.654052734375, -0.5986785888671875, -0.543304443359375, -0.4879302978515625, -0.43255615234375, -0.3771820068359375, -0.321807861328125, -0.2664337158203125, -0.2110595703125, -0.1556854248046875, -0.100311279296875, -0.0449371337890625, 0.01043701171875, 0.0658111572265625, 0.121185302734375, 0.1765594482421875, 0.23193359375, 0.2873077392578125, 0.342681884765625, 0.3980560302734375, 0.45343017578125, 0.5088043212890625, 0.564178466796875, 0.6195526123046875, 0.6749267578125, 0.7303009033203125, 0.785675048828125, 0.8410491943359375, 0.89642333984375, 0.9517974853515625, 1.007171630859375, 1.0625457763671875, 1.117919921875, 1.1732940673828125, 1.228668212890625, 1.2840423583984375, 1.33941650390625, 1.3947906494140625, 1.450164794921875, 1.5055389404296875, 1.5609130859375, 1.6162872314453125, 1.671661376953125, 1.7270355224609375, 1.78240966796875, 1.8377838134765625, 1.893157958984375, 1.9485321044921875, 2.00390625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 6.0, 10.0, 29.0, 81.0, 255.0, 330.0, 201.0, 64.0, 20.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.90439224243164, -53.773372650146484, -52.64234924316406, -51.511329650878906, -50.380306243896484, -49.24928665161133, -48.118263244628906, -46.98724365234375, -45.856224060058594, -44.72520446777344, -43.594181060791016, -42.46316146850586, -41.33213806152344, -40.20111846923828, -39.07009506225586, -37.9390754699707, -36.80805206298828, -35.677032470703125, -34.5460090637207, -33.41498947143555, -32.283966064453125, -31.15294647216797, -30.02192497253418, -28.89090347290039, -27.7598819732666, -26.628860473632812, -25.497838973999023, -24.366817474365234, -23.235797882080078, -22.104774475097656, -20.9737548828125, -19.84273338317871, -18.711713790893555, -17.580692291259766, -16.449670791625977, -15.318650245666504, -14.187628746032715, -13.056607246398926, -11.925586700439453, -10.794565200805664, -9.663543701171875, -8.532522201538086, -7.401501178741455, -6.270480155944824, -5.139458656311035, -4.008437156677246, -2.8774161338806152, -1.7463951110839844, -0.6153736114501953, 0.5156476497650146, 1.6466689109802246, 2.7776901721954346, 3.9087114334106445, 5.039732933044434, 6.1707539558410645, 7.301774978637695, 8.432796478271484, 9.563817977905273, 10.694839477539062, 11.825860023498535, 12.956881523132324, 14.087903022766113, 15.218923568725586, 16.349945068359375, 17.480966567993164]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 5.0, 1.0, 4.0, 1.0, 6.0, 9.0, 8.0, 15.0, 12.0, 15.0, 20.0, 24.0, 25.0, 23.0, 27.0, 30.0, 31.0, 45.0, 44.0, 50.0, 51.0, 39.0, 54.0, 27.0, 46.0, 40.0, 45.0, 39.0, 30.0, 44.0, 21.0, 25.0, 20.0, 20.0, 23.0, 12.0, 12.0, 9.0, 12.0, 6.0, 11.0, 2.0, 7.0, 2.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-8.35908031463623, -8.098928451538086, -7.838776111602783, -7.578624248504639, -7.318471908569336, -7.058320045471191, -6.798168182373047, -6.538016319274902, -6.2778639793396, -6.017712116241455, -5.757559776306152, -5.497407913208008, -5.237256050109863, -4.9771037101745605, -4.716951847076416, -4.456799507141113, -4.196647644042969, -3.936495542526245, -3.6763434410095215, -3.416191577911377, -3.1560394763946533, -2.8958873748779297, -2.635735511779785, -2.3755834102630615, -2.115431308746338, -1.8552792072296143, -1.5951272249221802, -1.334975242614746, -1.0748231410980225, -0.8146710395812988, -0.5545190572738647, -0.29436707496643066, -0.03421592712402344, 0.22593611478805542, 0.4860881567001343, 0.7462401986122131, 1.006392240524292, 1.2665443420410156, 1.5266963243484497, 1.7868483066558838, 2.0470004081726074, 2.307152509689331, 2.5673046112060547, 2.827456474304199, 3.087608575820923, 3.3477606773376465, 3.607912540435791, 3.8680646419525146, 4.128216743469238, 4.388368606567383, 4.6485209465026855, 4.90867280960083, 5.168825149536133, 5.428977012634277, 5.689128875732422, 5.949280738830566, 6.209433078765869, 6.469584941864014, 6.729737281799316, 6.989889144897461, 7.2500410079956055, 7.510193347930908, 7.770345211029053, 8.030497550964355, 8.2906494140625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 7.0, 8.0, 12.0, 15.0, 16.0, 49.0, 78.0, 125.0, 239.0, 431.0, 927.0, 2036.0, 4847.0, 12062.0, 31841.0, 82588.0, 203607.0, 344478.0, 218392.0, 89557.0, 34546.0, 13095.0, 5298.0, 2217.0, 1003.0, 478.0, 269.0, 137.0, 77.0, 51.0, 23.0, 18.0, 15.0, 7.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1513671875, -1.106292724609375, -1.06121826171875, -1.016143798828125, -0.9710693359375, -0.925994873046875, -0.88092041015625, -0.835845947265625, -0.790771484375, -0.745697021484375, -0.70062255859375, -0.655548095703125, -0.6104736328125, -0.565399169921875, -0.52032470703125, -0.475250244140625, -0.43017578125, -0.385101318359375, -0.34002685546875, -0.294952392578125, -0.2498779296875, -0.204803466796875, -0.15972900390625, -0.114654541015625, -0.069580078125, -0.024505615234375, 0.02056884765625, 0.065643310546875, 0.1107177734375, 0.155792236328125, 0.20086669921875, 0.245941162109375, 0.291015625, 0.336090087890625, 0.38116455078125, 0.426239013671875, 0.4713134765625, 0.516387939453125, 0.56146240234375, 0.606536865234375, 0.651611328125, 0.696685791015625, 0.74176025390625, 0.786834716796875, 0.8319091796875, 0.876983642578125, 0.92205810546875, 0.967132568359375, 1.01220703125, 1.057281494140625, 1.10235595703125, 1.147430419921875, 1.1925048828125, 1.237579345703125, 1.28265380859375, 1.327728271484375, 1.372802734375, 1.417877197265625, 1.46295166015625, 1.508026123046875, 1.5531005859375, 1.598175048828125, 1.64324951171875, 1.688323974609375, 1.7333984375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 4.0, 5.0, 7.0, 13.0, 8.0, 7.0, 13.0, 10.0, 16.0, 17.0, 17.0, 28.0, 29.0, 27.0, 33.0, 29.0, 30.0, 28.0, 29.0, 23.0, 36.0, 34.0, 49.0, 43.0, 46.0, 42.0, 32.0, 33.0, 38.0, 29.0, 31.0, 31.0, 28.0, 22.0, 20.0, 16.0, 18.0, 17.0, 13.0, 5.0, 6.0, 5.0, 8.0, 6.0, 4.0, 9.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.515625, -0.4998435974121094, -0.48406219482421875, -0.4682807922363281, -0.4524993896484375, -0.4367179870605469, -0.42093658447265625, -0.4051551818847656, -0.389373779296875, -0.3735923767089844, -0.35781097412109375, -0.3420295715332031, -0.3262481689453125, -0.3104667663574219, -0.29468536376953125, -0.2789039611816406, -0.26312255859375, -0.24734115600585938, -0.23155975341796875, -0.21577835083007812, -0.1999969482421875, -0.18421554565429688, -0.16843414306640625, -0.15265274047851562, -0.136871337890625, -0.12108993530273438, -0.10530853271484375, -0.08952713012695312, -0.0737457275390625, -0.057964324951171875, -0.04218292236328125, -0.026401519775390625, -0.0106201171875, 0.005161285400390625, 0.02094268798828125, 0.036724090576171875, 0.0525054931640625, 0.06828689575195312, 0.08406829833984375, 0.09984970092773438, 0.115631103515625, 0.13141250610351562, 0.14719390869140625, 0.16297531127929688, 0.1787567138671875, 0.19453811645507812, 0.21031951904296875, 0.22610092163085938, 0.24188232421875, 0.2576637268066406, 0.27344512939453125, 0.2892265319824219, 0.3050079345703125, 0.3207893371582031, 0.33657073974609375, 0.3523521423339844, 0.368133544921875, 0.3839149475097656, 0.39969635009765625, 0.4154777526855469, 0.4312591552734375, 0.4470405578613281, 0.46282196044921875, 0.4786033630371094, 0.494384765625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 1.0, 5.0, 12.0, 7.0, 13.0, 11.0, 24.0, 36.0, 39.0, 57.0, 68.0, 105.0, 166.0, 230.0, 348.0, 526.0, 732.0, 1217.0, 2170.0, 4676.0, 14292.0, 65677.0, 391515.0, 472778.0, 68178.0, 14930.0, 4936.0, 2194.0, 1222.0, 755.0, 484.0, 379.0, 219.0, 153.0, 134.0, 77.0, 59.0, 42.0, 28.0, 22.0, 16.0, 9.0, 6.0, 5.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0], "bins": [-2.689453125, -2.616790771484375, -2.54412841796875, -2.471466064453125, -2.3988037109375, -2.326141357421875, -2.25347900390625, -2.180816650390625, -2.108154296875, -2.035491943359375, -1.96282958984375, -1.890167236328125, -1.8175048828125, -1.744842529296875, -1.67218017578125, -1.599517822265625, -1.52685546875, -1.454193115234375, -1.38153076171875, -1.308868408203125, -1.2362060546875, -1.163543701171875, -1.09088134765625, -1.018218994140625, -0.945556640625, -0.872894287109375, -0.80023193359375, -0.727569580078125, -0.6549072265625, -0.582244873046875, -0.50958251953125, -0.436920166015625, -0.3642578125, -0.291595458984375, -0.21893310546875, -0.146270751953125, -0.0736083984375, -0.000946044921875, 0.07171630859375, 0.144378662109375, 0.217041015625, 0.289703369140625, 0.36236572265625, 0.435028076171875, 0.5076904296875, 0.580352783203125, 0.65301513671875, 0.725677490234375, 0.79833984375, 0.871002197265625, 0.94366455078125, 1.016326904296875, 1.0889892578125, 1.161651611328125, 1.23431396484375, 1.306976318359375, 1.379638671875, 1.452301025390625, 1.52496337890625, 1.597625732421875, 1.6702880859375, 1.742950439453125, 1.81561279296875, 1.888275146484375, 1.9609375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 8.0, 7.0, 7.0, 9.0, 17.0, 9.0, 29.0, 33.0, 28.0, 38.0, 34.0, 29.0, 51.0, 41.0, 52.0, 55.0, 63.0, 69.0, 51.0, 56.0, 44.0, 51.0, 37.0, 45.0, 25.0, 21.0, 19.0, 21.0, 10.0, 11.0, 10.0, 5.0, 8.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.7890625, -3.689208984375, -3.58935546875, -3.489501953125, -3.3896484375, -3.289794921875, -3.18994140625, -3.090087890625, -2.990234375, -2.890380859375, -2.79052734375, -2.690673828125, -2.5908203125, -2.490966796875, -2.39111328125, -2.291259765625, -2.19140625, -2.091552734375, -1.99169921875, -1.891845703125, -1.7919921875, -1.692138671875, -1.59228515625, -1.492431640625, -1.392578125, -1.292724609375, -1.19287109375, -1.093017578125, -0.9931640625, -0.893310546875, -0.79345703125, -0.693603515625, -0.59375, -0.493896484375, -0.39404296875, -0.294189453125, -0.1943359375, -0.094482421875, 0.00537109375, 0.105224609375, 0.205078125, 0.304931640625, 0.40478515625, 0.504638671875, 0.6044921875, 0.704345703125, 0.80419921875, 0.904052734375, 1.00390625, 1.103759765625, 1.20361328125, 1.303466796875, 1.4033203125, 1.503173828125, 1.60302734375, 1.702880859375, 1.802734375, 1.902587890625, 2.00244140625, 2.102294921875, 2.2021484375, 2.302001953125, 2.40185546875, 2.501708984375, 2.6015625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 6.0, 7.0, 11.0, 19.0, 16.0, 33.0, 29.0, 38.0, 76.0, 135.0, 235.0, 524.0, 1445.0, 5552.0, 42367.0, 720266.0, 252519.0, 20027.0, 3400.0, 973.0, 374.0, 178.0, 100.0, 63.0, 54.0, 27.0, 21.0, 18.0, 15.0, 6.0, 2.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3046875, -1.263702392578125, -1.22271728515625, -1.181732177734375, -1.1407470703125, -1.099761962890625, -1.05877685546875, -1.017791748046875, -0.976806640625, -0.935821533203125, -0.89483642578125, -0.853851318359375, -0.8128662109375, -0.771881103515625, -0.73089599609375, -0.689910888671875, -0.64892578125, -0.607940673828125, -0.56695556640625, -0.525970458984375, -0.4849853515625, -0.444000244140625, -0.40301513671875, -0.362030029296875, -0.321044921875, -0.280059814453125, -0.23907470703125, -0.198089599609375, -0.1571044921875, -0.116119384765625, -0.07513427734375, -0.034149169921875, 0.0068359375, 0.047821044921875, 0.08880615234375, 0.129791259765625, 0.1707763671875, 0.211761474609375, 0.25274658203125, 0.293731689453125, 0.334716796875, 0.375701904296875, 0.41668701171875, 0.457672119140625, 0.4986572265625, 0.539642333984375, 0.58062744140625, 0.621612548828125, 0.66259765625, 0.703582763671875, 0.74456787109375, 0.785552978515625, 0.8265380859375, 0.867523193359375, 0.90850830078125, 0.949493408203125, 0.990478515625, 1.031463623046875, 1.07244873046875, 1.113433837890625, 1.1544189453125, 1.195404052734375, 1.23638916015625, 1.277374267578125, 1.318359375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 5.0, 8.0, 7.0, 8.0, 14.0, 7.0, 14.0, 16.0, 18.0, 23.0, 25.0, 39.0, 35.0, 53.0, 75.0, 93.0, 105.0, 101.0, 66.0, 62.0, 45.0, 34.0, 31.0, 21.0, 14.0, 11.0, 9.0, 9.0, 13.0, 7.0, 6.0, 3.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023496150970458984, -0.0002283584326505661, -0.00022175535559654236, -0.00021515227854251862, -0.00020854920148849487, -0.00020194612443447113, -0.0001953430473804474, -0.00018873997032642365, -0.0001821368932723999, -0.00017553381621837616, -0.00016893073916435242, -0.00016232766211032867, -0.00015572458505630493, -0.0001491215080022812, -0.00014251843094825745, -0.0001359153538942337, -0.00012931227684020996, -0.00012270919978618622, -0.00011610612273216248, -0.00010950304567813873, -0.00010289996862411499, -9.629689157009125e-05, -8.96938145160675e-05, -8.309073746204376e-05, -7.648766040802002e-05, -6.988458335399628e-05, -6.328150629997253e-05, -5.667842924594879e-05, -5.007535219192505e-05, -4.3472275137901306e-05, -3.6869198083877563e-05, -3.026612102985382e-05, -2.3663043975830078e-05, -1.7059966921806335e-05, -1.0456889867782593e-05, -3.85381281375885e-06, 2.7492642402648926e-06, 9.352341294288635e-06, 1.5955418348312378e-05, 2.255849540233612e-05, 2.9161572456359863e-05, 3.5764649510383606e-05, 4.236772656440735e-05, 4.897080361843109e-05, 5.5573880672454834e-05, 6.217695772647858e-05, 6.878003478050232e-05, 7.538311183452606e-05, 8.19861888885498e-05, 8.858926594257355e-05, 9.519234299659729e-05, 0.00010179542005062103, 0.00010839849710464478, 0.00011500157415866852, 0.00012160465121269226, 0.000128207728266716, 0.00013481080532073975, 0.0001414138823747635, 0.00014801695942878723, 0.00015462003648281097, 0.00016122311353683472, 0.00016782619059085846, 0.0001744292676448822, 0.00018103234469890594, 0.0001876354217529297]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 5.0, 5.0, 6.0, 9.0, 11.0, 16.0, 18.0, 27.0, 56.0, 114.0, 167.0, 353.0, 786.0, 2018.0, 7340.0, 61731.0, 859465.0, 102354.0, 9918.0, 2437.0, 890.0, 371.0, 188.0, 103.0, 54.0, 40.0, 23.0, 15.0, 14.0, 8.0, 5.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3154296875, -1.2694091796875, -1.223388671875, -1.1773681640625, -1.13134765625, -1.0853271484375, -1.039306640625, -0.9932861328125, -0.947265625, -0.9012451171875, -0.855224609375, -0.8092041015625, -0.76318359375, -0.7171630859375, -0.671142578125, -0.6251220703125, -0.5791015625, -0.5330810546875, -0.487060546875, -0.4410400390625, -0.39501953125, -0.3489990234375, -0.302978515625, -0.2569580078125, -0.2109375, -0.1649169921875, -0.118896484375, -0.0728759765625, -0.02685546875, 0.0191650390625, 0.065185546875, 0.1112060546875, 0.1572265625, 0.2032470703125, 0.249267578125, 0.2952880859375, 0.34130859375, 0.3873291015625, 0.433349609375, 0.4793701171875, 0.525390625, 0.5714111328125, 0.617431640625, 0.6634521484375, 0.70947265625, 0.7554931640625, 0.801513671875, 0.8475341796875, 0.8935546875, 0.9395751953125, 0.985595703125, 1.0316162109375, 1.07763671875, 1.1236572265625, 1.169677734375, 1.2156982421875, 1.26171875, 1.3077392578125, 1.353759765625, 1.3997802734375, 1.44580078125, 1.4918212890625, 1.537841796875, 1.5838623046875, 1.6298828125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 5.0, 1.0, 4.0, 0.0, 5.0, 2.0, 6.0, 5.0, 4.0, 8.0, 9.0, 12.0, 14.0, 10.0, 26.0, 22.0, 18.0, 44.0, 44.0, 62.0, 60.0, 64.0, 78.0, 77.0, 65.0, 69.0, 53.0, 50.0, 36.0, 20.0, 29.0, 24.0, 20.0, 16.0, 12.0, 7.0, 6.0, 3.0, 3.0, 6.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60107421875, -0.578155517578125, -0.55523681640625, -0.532318115234375, -0.5093994140625, -0.486480712890625, -0.46356201171875, -0.440643310546875, -0.417724609375, -0.394805908203125, -0.37188720703125, -0.348968505859375, -0.3260498046875, -0.303131103515625, -0.28021240234375, -0.257293701171875, -0.234375, -0.211456298828125, -0.18853759765625, -0.165618896484375, -0.1427001953125, -0.119781494140625, -0.09686279296875, -0.073944091796875, -0.051025390625, -0.028106689453125, -0.00518798828125, 0.017730712890625, 0.0406494140625, 0.063568115234375, 0.08648681640625, 0.109405517578125, 0.13232421875, 0.155242919921875, 0.17816162109375, 0.201080322265625, 0.2239990234375, 0.246917724609375, 0.26983642578125, 0.292755126953125, 0.315673828125, 0.338592529296875, 0.36151123046875, 0.384429931640625, 0.4073486328125, 0.430267333984375, 0.45318603515625, 0.476104736328125, 0.4990234375, 0.521942138671875, 0.54486083984375, 0.567779541015625, 0.5906982421875, 0.613616943359375, 0.63653564453125, 0.659454345703125, 0.682373046875, 0.705291748046875, 0.72821044921875, 0.751129150390625, 0.7740478515625, 0.796966552734375, 0.81988525390625, 0.842803955078125, 0.86572265625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 11.0, 26.0, 63.0, 113.0, 180.0, 270.0, 154.0, 87.0, 41.0, 15.0, 9.0, 6.0, 6.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.599945068359375, -23.90130043029785, -23.202655792236328, -22.504009246826172, -21.80536460876465, -21.106719970703125, -20.4080753326416, -19.709430694580078, -19.010784149169922, -18.3121395111084, -17.613494873046875, -16.91484832763672, -16.216203689575195, -15.517559051513672, -14.818914413452148, -14.120268821716309, -13.421624183654785, -12.722979545593262, -12.024333953857422, -11.325689315795898, -10.627043724060059, -9.928399085998535, -9.229753494262695, -8.531108856201172, -7.83246374130249, -7.133818626403809, -6.435173511505127, -5.736528396606445, -5.037883758544922, -4.339238166809082, -3.6405935287475586, -2.941948413848877, -2.2433032989501953, -1.5446581840515137, -0.8460131883621216, -0.1473681926727295, 0.5512769222259521, 1.2499220371246338, 1.9485669136047363, 2.647212028503418, 3.3458571434020996, 4.044502258300781, 4.743147373199463, 5.4417924880981445, 6.140437126159668, 6.839082717895508, 7.537727355957031, 8.236371994018555, 8.935017585754395, 9.633662223815918, 10.332307815551758, 11.030952453613281, 11.729598045349121, 12.428242683410645, 13.126888275146484, 13.825532913208008, 14.524177551269531, 15.222822189331055, 15.921467781066895, 16.620113372802734, 17.318758010864258, 18.01740264892578, 18.716047286987305, 19.414691925048828, 20.113338470458984]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 1.0, 5.0, 6.0, 13.0, 14.0, 9.0, 18.0, 16.0, 26.0, 30.0, 41.0, 50.0, 60.0, 73.0, 99.0, 117.0, 91.0, 74.0, 55.0, 57.0, 30.0, 35.0, 23.0, 23.0, 14.0, 13.0, 9.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.525236129760742, -9.979242324829102, -9.433248519897461, -8.88725471496582, -8.341261863708496, -7.7952680587768555, -7.249274253845215, -6.703280448913574, -6.157287120819092, -5.611293315887451, -5.065299987792969, -4.519306182861328, -3.9733126163482666, -3.427319049835205, -2.8813252449035645, -2.335331678390503, -1.7893381118774414, -1.2433445453643799, -0.6973508596420288, -0.15135717391967773, 0.3946363925933838, 0.9406299591064453, 1.486623764038086, 2.0326173305511475, 2.578610897064209, 3.1246044635772705, 3.670598030090332, 4.216591835021973, 4.762585639953613, 5.308578968048096, 5.854572772979736, 6.400566101074219, 6.946559906005859, 7.4925537109375, 8.03854751586914, 8.584541320800781, 9.130534172058105, 9.676527976989746, 10.222521781921387, 10.768515586853027, 11.314508438110352, 11.860502243041992, 12.406496047973633, 12.952489852905273, 13.498482704162598, 14.044476509094238, 14.590470314025879, 15.13646411895752, 15.68245792388916, 16.228450775146484, 16.774444580078125, 17.320438385009766, 17.866432189941406, 18.412425994873047, 18.958419799804688, 19.504413604736328, 20.05040740966797, 20.59640121459961, 21.14239501953125, 21.68838882446289, 22.23438262939453, 22.780376434326172, 23.326370239257812, 23.87236213684082, 24.41835594177246]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 7.0, 15.0, 55.0, 257.0, 1042.0, 4667.0, 46949.0, 2914864.0, 1198761.0, 24539.0, 2457.0, 436.0, 117.0, 45.0, 20.0, 14.0, 14.0, 8.0, 3.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.623046875, -3.5423431396484375, -3.461639404296875, -3.3809356689453125, -3.30023193359375, -3.2195281982421875, -3.138824462890625, -3.0581207275390625, -2.9774169921875, -2.8967132568359375, -2.816009521484375, -2.7353057861328125, -2.65460205078125, -2.5738983154296875, -2.493194580078125, -2.4124908447265625, -2.331787109375, -2.2510833740234375, -2.170379638671875, -2.0896759033203125, -2.00897216796875, -1.9282684326171875, -1.847564697265625, -1.7668609619140625, -1.6861572265625, -1.6054534912109375, -1.524749755859375, -1.4440460205078125, -1.36334228515625, -1.2826385498046875, -1.201934814453125, -1.1212310791015625, -1.04052734375, -0.9598236083984375, -0.879119873046875, -0.7984161376953125, -0.71771240234375, -0.6370086669921875, -0.556304931640625, -0.4756011962890625, -0.3948974609375, -0.3141937255859375, -0.233489990234375, -0.1527862548828125, -0.07208251953125, 0.0086212158203125, 0.089324951171875, 0.1700286865234375, 0.250732421875, 0.3314361572265625, 0.412139892578125, 0.4928436279296875, 0.57354736328125, 0.6542510986328125, 0.734954833984375, 0.8156585693359375, 0.8963623046875, 0.9770660400390625, 1.057769775390625, 1.1384735107421875, 1.21917724609375, 1.2998809814453125, 1.380584716796875, 1.4612884521484375, 1.5419921875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 15.0, 29.0, 64.0, 83.0, 118.0, 155.0, 181.0, 145.0, 99.0, 68.0, 32.0, 17.0, 8.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7421875, -0.675811767578125, -0.60943603515625, -0.543060302734375, -0.4766845703125, -0.410308837890625, -0.34393310546875, -0.277557373046875, -0.211181640625, -0.144805908203125, -0.07843017578125, -0.012054443359375, 0.0543212890625, 0.120697021484375, 0.18707275390625, 0.253448486328125, 0.31982421875, 0.386199951171875, 0.45257568359375, 0.518951416015625, 0.5853271484375, 0.651702880859375, 0.71807861328125, 0.784454345703125, 0.850830078125, 0.917205810546875, 0.98358154296875, 1.049957275390625, 1.1163330078125, 1.182708740234375, 1.24908447265625, 1.315460205078125, 1.3818359375, 1.448211669921875, 1.51458740234375, 1.580963134765625, 1.6473388671875, 1.713714599609375, 1.78009033203125, 1.846466064453125, 1.912841796875, 1.979217529296875, 2.04559326171875, 2.111968994140625, 2.1783447265625, 2.244720458984375, 2.31109619140625, 2.377471923828125, 2.44384765625, 2.510223388671875, 2.57659912109375, 2.642974853515625, 2.7093505859375, 2.775726318359375, 2.84210205078125, 2.908477783203125, 2.974853515625, 3.041229248046875, 3.10760498046875, 3.173980712890625, 3.2403564453125, 3.306732177734375, 3.37310791015625, 3.439483642578125, 3.505859375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 8.0, 8.0, 20.0, 48.0, 102.0, 174.0, 487.0, 1607.0, 7692.0, 73917.0, 3426148.0, 653429.0, 25689.0, 3623.0, 870.0, 269.0, 97.0, 48.0, 21.0, 14.0, 8.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.078125, -3.98907470703125, -3.9000244140625, -3.81097412109375, -3.721923828125, -3.63287353515625, -3.5438232421875, -3.45477294921875, -3.36572265625, -3.27667236328125, -3.1876220703125, -3.09857177734375, -3.009521484375, -2.92047119140625, -2.8314208984375, -2.74237060546875, -2.6533203125, -2.56427001953125, -2.4752197265625, -2.38616943359375, -2.297119140625, -2.20806884765625, -2.1190185546875, -2.02996826171875, -1.94091796875, -1.85186767578125, -1.7628173828125, -1.67376708984375, -1.584716796875, -1.49566650390625, -1.4066162109375, -1.31756591796875, -1.228515625, -1.13946533203125, -1.0504150390625, -0.96136474609375, -0.872314453125, -0.78326416015625, -0.6942138671875, -0.60516357421875, -0.51611328125, -0.42706298828125, -0.3380126953125, -0.24896240234375, -0.159912109375, -0.07086181640625, 0.0181884765625, 0.10723876953125, 0.1962890625, 0.28533935546875, 0.3743896484375, 0.46343994140625, 0.552490234375, 0.64154052734375, 0.7305908203125, 0.81964111328125, 0.90869140625, 0.99774169921875, 1.0867919921875, 1.17584228515625, 1.264892578125, 1.35394287109375, 1.4429931640625, 1.53204345703125, 1.62109375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 7.0, 7.0, 9.0, 12.0, 12.0, 10.0, 21.0, 21.0, 27.0, 41.0, 55.0, 97.0, 126.0, 217.0, 397.0, 595.0, 732.0, 627.0, 386.0, 231.0, 133.0, 82.0, 55.0, 49.0, 25.0, 25.0, 20.0, 15.0, 6.0, 7.0, 5.0, 4.0, 2.0, 5.0, 1.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7431640625, -1.6910247802734375, -1.638885498046875, -1.5867462158203125, -1.53460693359375, -1.4824676513671875, -1.430328369140625, -1.3781890869140625, -1.3260498046875, -1.2739105224609375, -1.221771240234375, -1.1696319580078125, -1.11749267578125, -1.0653533935546875, -1.013214111328125, -0.9610748291015625, -0.908935546875, -0.8567962646484375, -0.804656982421875, -0.7525177001953125, -0.70037841796875, -0.6482391357421875, -0.596099853515625, -0.5439605712890625, -0.4918212890625, -0.4396820068359375, -0.387542724609375, -0.3354034423828125, -0.28326416015625, -0.2311248779296875, -0.178985595703125, -0.1268463134765625, -0.07470703125, -0.0225677490234375, 0.029571533203125, 0.0817108154296875, 0.13385009765625, 0.1859893798828125, 0.238128662109375, 0.2902679443359375, 0.3424072265625, 0.3945465087890625, 0.446685791015625, 0.4988250732421875, 0.55096435546875, 0.6031036376953125, 0.655242919921875, 0.7073822021484375, 0.759521484375, 0.8116607666015625, 0.863800048828125, 0.9159393310546875, 0.96807861328125, 1.0202178955078125, 1.072357177734375, 1.1244964599609375, 1.1766357421875, 1.2287750244140625, 1.280914306640625, 1.3330535888671875, 1.38519287109375, 1.4373321533203125, 1.489471435546875, 1.5416107177734375, 1.59375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 7.0, 13.0, 16.0, 53.0, 111.0, 170.0, 193.0, 175.0, 122.0, 63.0, 23.0, 25.0, 7.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.957542419433594, -14.393253326416016, -13.828963279724121, -13.264674186706543, -12.700385093688965, -12.13609504699707, -11.571805953979492, -11.007516860961914, -10.443227767944336, -9.878938674926758, -9.314648628234863, -8.750359535217285, -8.186070442199707, -7.621780872344971, -7.057491302490234, -6.493202209472656, -5.928912162780762, -5.364622592926025, -4.800333499908447, -4.236043930053711, -3.6717545986175537, -3.1074652671813965, -2.54317569732666, -1.978886365890503, -1.4145970344543457, -0.8503076434135437, -0.2860182523727417, 0.2782711982727051, 0.8425605297088623, 1.4068498611450195, 1.9711394309997559, 2.535428762435913, 3.0997180938720703, 3.6640074253082275, 4.228296756744385, 4.792586326599121, 5.356875419616699, 5.9211649894714355, 6.485454559326172, 7.04974365234375, 7.614033222198486, 8.178322792053223, 8.7426118850708, 9.306901931762695, 9.871191024780273, 10.435480117797852, 10.99976921081543, 11.564059257507324, 12.128348350524902, 12.69263744354248, 13.256927490234375, 13.821216583251953, 14.385505676269531, 14.94979476928711, 15.514084815979004, 16.0783748626709, 16.642663955688477, 17.206953048706055, 17.771242141723633, 18.335533142089844, 18.899822235107422, 19.464111328125, 20.028400421142578, 20.592689514160156, 21.156978607177734]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 5.0, 5.0, 8.0, 14.0, 10.0, 11.0, 22.0, 33.0, 40.0, 61.0, 56.0, 85.0, 71.0, 79.0, 82.0, 65.0, 72.0, 57.0, 62.0, 45.0, 29.0, 26.0, 20.0, 18.0, 7.0, 10.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.44374656677246, -16.060718536376953, -15.677689552307129, -15.294661521911621, -14.911632537841797, -14.528604507446289, -14.145576477050781, -13.762548446655273, -13.37951946258545, -12.996491432189941, -12.613462448120117, -12.23043441772461, -11.847406387329102, -11.464377403259277, -11.08134937286377, -10.698320388793945, -10.315292358398438, -9.93226432800293, -9.549235343933105, -9.166207313537598, -8.783178329467773, -8.400150299072266, -8.017122268676758, -7.634093761444092, -7.251065254211426, -6.86803674697876, -6.485008239746094, -6.101980209350586, -5.71895170211792, -5.335923194885254, -4.952895164489746, -4.56986665725708, -4.186838150024414, -3.803809642791748, -3.420781373977661, -3.037753105163574, -2.654724597930908, -2.271696090698242, -1.8886678218841553, -1.5056395530700684, -1.1226110458374023, -0.7395826578140259, -0.3565542697906494, 0.02647411823272705, 0.4095025062561035, 0.79253089427948, 1.1755592823028564, 1.5585875511169434, 1.9416160583496094, 2.3246445655822754, 2.7076728343963623, 3.090701103210449, 3.4737296104431152, 3.8567581176757812, 4.239786148071289, 4.622814655303955, 5.005843162536621, 5.388871669769287, 5.771900177001953, 6.154928207397461, 6.537956714630127, 6.920985221862793, 7.304013252258301, 7.687041759490967, 8.070070266723633]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 8.0, 11.0, 19.0, 23.0, 42.0, 74.0, 118.0, 205.0, 378.0, 718.0, 1452.0, 2901.0, 7281.0, 18523.0, 53303.0, 164197.0, 408276.0, 260752.0, 83273.0, 28320.0, 10423.0, 4313.0, 1918.0, 911.0, 474.0, 264.0, 147.0, 88.0, 53.0, 30.0, 21.0, 12.0, 9.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.419921875, -1.370452880859375, -1.32098388671875, -1.271514892578125, -1.2220458984375, -1.172576904296875, -1.12310791015625, -1.073638916015625, -1.024169921875, -0.974700927734375, -0.92523193359375, -0.875762939453125, -0.8262939453125, -0.776824951171875, -0.72735595703125, -0.677886962890625, -0.62841796875, -0.578948974609375, -0.52947998046875, -0.480010986328125, -0.4305419921875, -0.381072998046875, -0.33160400390625, -0.282135009765625, -0.232666015625, -0.183197021484375, -0.13372802734375, -0.084259033203125, -0.0347900390625, 0.014678955078125, 0.06414794921875, 0.113616943359375, 0.1630859375, 0.212554931640625, 0.26202392578125, 0.311492919921875, 0.3609619140625, 0.410430908203125, 0.45989990234375, 0.509368896484375, 0.558837890625, 0.608306884765625, 0.65777587890625, 0.707244873046875, 0.7567138671875, 0.806182861328125, 0.85565185546875, 0.905120849609375, 0.95458984375, 1.004058837890625, 1.05352783203125, 1.102996826171875, 1.1524658203125, 1.201934814453125, 1.25140380859375, 1.300872802734375, 1.350341796875, 1.399810791015625, 1.44927978515625, 1.498748779296875, 1.5482177734375, 1.597686767578125, 1.64715576171875, 1.696624755859375, 1.74609375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 3.0, 9.0, 11.0, 15.0, 29.0, 30.0, 45.0, 58.0, 58.0, 70.0, 80.0, 82.0, 89.0, 87.0, 68.0, 71.0, 49.0, 29.0, 39.0, 29.0, 18.0, 17.0, 14.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56298828125, -0.5282058715820312, -0.4934234619140625, -0.45864105224609375, -0.423858642578125, -0.38907623291015625, -0.3542938232421875, -0.31951141357421875, -0.28472900390625, -0.24994659423828125, -0.2151641845703125, -0.18038177490234375, -0.145599365234375, -0.11081695556640625, -0.0760345458984375, -0.04125213623046875, -0.0064697265625, 0.02831268310546875, 0.0630950927734375, 0.09787750244140625, 0.132659912109375, 0.16744232177734375, 0.2022247314453125, 0.23700714111328125, 0.27178955078125, 0.30657196044921875, 0.3413543701171875, 0.37613677978515625, 0.410919189453125, 0.44570159912109375, 0.4804840087890625, 0.5152664184570312, 0.550048828125, 0.5848312377929688, 0.6196136474609375, 0.6543960571289062, 0.689178466796875, 0.7239608764648438, 0.7587432861328125, 0.7935256958007812, 0.82830810546875, 0.8630905151367188, 0.8978729248046875, 0.9326553344726562, 0.967437744140625, 1.0022201538085938, 1.0370025634765625, 1.0717849731445312, 1.1065673828125, 1.1413497924804688, 1.1761322021484375, 1.2109146118164062, 1.245697021484375, 1.2804794311523438, 1.3152618408203125, 1.3500442504882812, 1.38482666015625, 1.4196090698242188, 1.4543914794921875, 1.4891738891601562, 1.523956298828125, 1.5587387084960938, 1.5935211181640625, 1.6283035278320312, 1.6630859375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 1.0, 6.0, 7.0, 7.0, 18.0, 19.0, 21.0, 25.0, 33.0, 60.0, 76.0, 135.0, 167.0, 294.0, 454.0, 716.0, 1255.0, 2922.0, 8322.0, 38360.0, 280128.0, 625771.0, 69217.0, 12745.0, 3829.0, 1613.0, 886.0, 491.0, 325.0, 199.0, 140.0, 101.0, 54.0, 41.0, 38.0, 26.0, 14.0, 10.0, 7.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.376953125, -2.29254150390625, -2.2081298828125, -2.12371826171875, -2.039306640625, -1.95489501953125, -1.8704833984375, -1.78607177734375, -1.70166015625, -1.61724853515625, -1.5328369140625, -1.44842529296875, -1.364013671875, -1.27960205078125, -1.1951904296875, -1.11077880859375, -1.0263671875, -0.94195556640625, -0.8575439453125, -0.77313232421875, -0.688720703125, -0.60430908203125, -0.5198974609375, -0.43548583984375, -0.35107421875, -0.26666259765625, -0.1822509765625, -0.09783935546875, -0.013427734375, 0.07098388671875, 0.1553955078125, 0.23980712890625, 0.32421875, 0.40863037109375, 0.4930419921875, 0.57745361328125, 0.661865234375, 0.74627685546875, 0.8306884765625, 0.91510009765625, 0.99951171875, 1.08392333984375, 1.1683349609375, 1.25274658203125, 1.337158203125, 1.42156982421875, 1.5059814453125, 1.59039306640625, 1.6748046875, 1.75921630859375, 1.8436279296875, 1.92803955078125, 2.012451171875, 2.09686279296875, 2.1812744140625, 2.26568603515625, 2.35009765625, 2.43450927734375, 2.5189208984375, 2.60333251953125, 2.687744140625, 2.77215576171875, 2.8565673828125, 2.94097900390625, 3.025390625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 6.0, 6.0, 11.0, 11.0, 21.0, 18.0, 27.0, 22.0, 46.0, 34.0, 47.0, 49.0, 50.0, 68.0, 56.0, 76.0, 70.0, 65.0, 58.0, 49.0, 42.0, 36.0, 30.0, 23.0, 20.0, 24.0, 14.0, 8.0, 6.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.251953125, -3.14373779296875, -3.0355224609375, -2.92730712890625, -2.819091796875, -2.71087646484375, -2.6026611328125, -2.49444580078125, -2.38623046875, -2.27801513671875, -2.1697998046875, -2.06158447265625, -1.953369140625, -1.84515380859375, -1.7369384765625, -1.62872314453125, -1.5205078125, -1.41229248046875, -1.3040771484375, -1.19586181640625, -1.087646484375, -0.97943115234375, -0.8712158203125, -0.76300048828125, -0.65478515625, -0.54656982421875, -0.4383544921875, -0.33013916015625, -0.221923828125, -0.11370849609375, -0.0054931640625, 0.10272216796875, 0.2109375, 0.31915283203125, 0.4273681640625, 0.53558349609375, 0.643798828125, 0.75201416015625, 0.8602294921875, 0.96844482421875, 1.07666015625, 1.18487548828125, 1.2930908203125, 1.40130615234375, 1.509521484375, 1.61773681640625, 1.7259521484375, 1.83416748046875, 1.9423828125, 2.05059814453125, 2.1588134765625, 2.26702880859375, 2.375244140625, 2.48345947265625, 2.5916748046875, 2.69989013671875, 2.80810546875, 2.91632080078125, 3.0245361328125, 3.13275146484375, 3.240966796875, 3.34918212890625, 3.4573974609375, 3.56561279296875, 3.673828125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 1.0, 6.0, 9.0, 15.0, 10.0, 14.0, 20.0, 33.0, 47.0, 53.0, 97.0, 121.0, 190.0, 301.0, 586.0, 1281.0, 3112.0, 9623.0, 38005.0, 218747.0, 645597.0, 99831.0, 20830.0, 5848.0, 2073.0, 945.0, 445.0, 239.0, 137.0, 97.0, 54.0, 51.0, 31.0, 24.0, 17.0, 14.0, 15.0, 13.0, 8.0, 5.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.81591796875, -0.794036865234375, -0.77215576171875, -0.750274658203125, -0.7283935546875, -0.706512451171875, -0.68463134765625, -0.662750244140625, -0.640869140625, -0.618988037109375, -0.59710693359375, -0.575225830078125, -0.5533447265625, -0.531463623046875, -0.50958251953125, -0.487701416015625, -0.4658203125, -0.443939208984375, -0.42205810546875, -0.400177001953125, -0.3782958984375, -0.356414794921875, -0.33453369140625, -0.312652587890625, -0.290771484375, -0.268890380859375, -0.24700927734375, -0.225128173828125, -0.2032470703125, -0.181365966796875, -0.15948486328125, -0.137603759765625, -0.11572265625, -0.093841552734375, -0.07196044921875, -0.050079345703125, -0.0281982421875, -0.006317138671875, 0.01556396484375, 0.037445068359375, 0.059326171875, 0.081207275390625, 0.10308837890625, 0.124969482421875, 0.1468505859375, 0.168731689453125, 0.19061279296875, 0.212493896484375, 0.234375, 0.256256103515625, 0.27813720703125, 0.300018310546875, 0.3218994140625, 0.343780517578125, 0.36566162109375, 0.387542724609375, 0.409423828125, 0.431304931640625, 0.45318603515625, 0.475067138671875, 0.4969482421875, 0.518829345703125, 0.54071044921875, 0.562591552734375, 0.58447265625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 6.0, 3.0, 3.0, 5.0, 4.0, 8.0, 11.0, 20.0, 21.0, 23.0, 28.0, 38.0, 34.0, 59.0, 97.0, 118.0, 104.0, 109.0, 68.0, 61.0, 42.0, 31.0, 14.0, 15.0, 12.0, 13.0, 10.0, 8.0, 5.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001690387725830078, -0.0001623295247554779, -0.000155620276927948, -0.0001489110291004181, -0.00014220178127288818, -0.00013549253344535828, -0.00012878328561782837, -0.00012207403779029846, -0.00011536478996276855, -0.00010865554213523865, -0.00010194629430770874, -9.523704648017883e-05, -8.852779865264893e-05, -8.181855082511902e-05, -7.510930299758911e-05, -6.84000551700592e-05, -6.16908073425293e-05, -5.498155951499939e-05, -4.827231168746948e-05, -4.1563063859939575e-05, -3.485381603240967e-05, -2.814456820487976e-05, -2.1435320377349854e-05, -1.4726072549819946e-05, -8.016824722290039e-06, -1.3075768947601318e-06, 5.401670932769775e-06, 1.2110918760299683e-05, 1.882016658782959e-05, 2.5529414415359497e-05, 3.2238662242889404e-05, 3.894791007041931e-05, 4.565715789794922e-05, 5.2366405725479126e-05, 5.907565355300903e-05, 6.578490138053894e-05, 7.249414920806885e-05, 7.920339703559875e-05, 8.591264486312866e-05, 9.262189269065857e-05, 9.933114051818848e-05, 0.00010604038834571838, 0.00011274963617324829, 0.0001194588840007782, 0.0001261681318283081, 0.000132877379655838, 0.00013958662748336792, 0.00014629587531089783, 0.00015300512313842773, 0.00015971437096595764, 0.00016642361879348755, 0.00017313286662101746, 0.00017984211444854736, 0.00018655136227607727, 0.00019326061010360718, 0.00019996985793113708, 0.000206679105758667, 0.0002133883535861969, 0.0002200976014137268, 0.00022680684924125671, 0.00023351609706878662, 0.00024022534489631653, 0.00024693459272384644, 0.00025364384055137634, 0.00026035308837890625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 3.0, 10.0, 10.0, 14.0, 18.0, 24.0, 31.0, 38.0, 50.0, 79.0, 114.0, 162.0, 262.0, 385.0, 634.0, 1290.0, 2538.0, 5771.0, 17482.0, 71620.0, 500067.0, 354282.0, 65996.0, 16461.0, 5707.0, 2487.0, 1156.0, 651.0, 382.0, 257.0, 182.0, 97.0, 69.0, 50.0, 54.0, 28.0, 17.0, 15.0, 13.0, 15.0, 7.0, 7.0, 7.0, 2.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.58251953125, -0.5637130737304688, -0.5449066162109375, -0.5261001586914062, -0.507293701171875, -0.48848724365234375, -0.4696807861328125, -0.45087432861328125, -0.43206787109375, -0.41326141357421875, -0.3944549560546875, -0.37564849853515625, -0.356842041015625, -0.33803558349609375, -0.3192291259765625, -0.30042266845703125, -0.2816162109375, -0.26280975341796875, -0.2440032958984375, -0.22519683837890625, -0.206390380859375, -0.18758392333984375, -0.1687774658203125, -0.14997100830078125, -0.13116455078125, -0.11235809326171875, -0.0935516357421875, -0.07474517822265625, -0.055938720703125, -0.03713226318359375, -0.0183258056640625, 0.00048065185546875, 0.019287109375, 0.03809356689453125, 0.0569000244140625, 0.07570648193359375, 0.094512939453125, 0.11331939697265625, 0.1321258544921875, 0.15093231201171875, 0.16973876953125, 0.18854522705078125, 0.2073516845703125, 0.22615814208984375, 0.244964599609375, 0.26377105712890625, 0.2825775146484375, 0.30138397216796875, 0.3201904296875, 0.33899688720703125, 0.3578033447265625, 0.37660980224609375, 0.395416259765625, 0.41422271728515625, 0.4330291748046875, 0.45183563232421875, 0.47064208984375, 0.48944854736328125, 0.5082550048828125, 0.5270614624023438, 0.545867919921875, 0.5646743774414062, 0.5834808349609375, 0.6022872924804688, 0.62109375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 8.0, 9.0, 4.0, 15.0, 12.0, 19.0, 25.0, 19.0, 35.0, 45.0, 58.0, 57.0, 90.0, 73.0, 91.0, 86.0, 85.0, 49.0, 49.0, 33.0, 31.0, 37.0, 23.0, 10.0, 12.0, 9.0, 6.0, 5.0, 0.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60498046875, -0.5829315185546875, -0.560882568359375, -0.5388336181640625, -0.51678466796875, -0.4947357177734375, -0.472686767578125, -0.4506378173828125, -0.4285888671875, -0.4065399169921875, -0.384490966796875, -0.3624420166015625, -0.34039306640625, -0.3183441162109375, -0.296295166015625, -0.2742462158203125, -0.252197265625, -0.2301483154296875, -0.208099365234375, -0.1860504150390625, -0.16400146484375, -0.1419525146484375, -0.119903564453125, -0.0978546142578125, -0.0758056640625, -0.0537567138671875, -0.031707763671875, -0.0096588134765625, 0.01239013671875, 0.0344390869140625, 0.056488037109375, 0.0785369873046875, 0.1005859375, 0.1226348876953125, 0.144683837890625, 0.1667327880859375, 0.18878173828125, 0.2108306884765625, 0.232879638671875, 0.2549285888671875, 0.2769775390625, 0.2990264892578125, 0.321075439453125, 0.3431243896484375, 0.36517333984375, 0.3872222900390625, 0.409271240234375, 0.4313201904296875, 0.453369140625, 0.4754180908203125, 0.497467041015625, 0.5195159912109375, 0.54156494140625, 0.5636138916015625, 0.585662841796875, 0.6077117919921875, 0.6297607421875, 0.6518096923828125, 0.673858642578125, 0.6959075927734375, 0.71795654296875, 0.7400054931640625, 0.762054443359375, 0.7841033935546875, 0.80615234375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 16.0, 23.0, 46.0, 74.0, 151.0, 277.0, 181.0, 122.0, 43.0, 22.0, 10.0, 8.0, 4.0, 5.0, 1.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.37348747253418, -19.767303466796875, -19.161121368408203, -18.5549373626709, -17.948753356933594, -17.342571258544922, -16.736387252807617, -16.130203247070312, -15.524020195007324, -14.917837142944336, -14.311653137207031, -13.705470085144043, -13.099287033081055, -12.49310302734375, -11.886919975280762, -11.280736923217773, -10.674552917480469, -10.06836986541748, -9.462185859680176, -8.856002807617188, -8.249818801879883, -7.6436357498168945, -7.037452697753906, -6.43126916885376, -5.825085639953613, -5.218902111053467, -4.61271858215332, -4.006535530090332, -3.4003520011901855, -2.794168472290039, -2.1879851818084717, -1.5818018913269043, -0.9756202697753906, -0.3694368600845337, 0.23674654960632324, 0.8429299592971802, 1.449113368988037, 2.0552968978881836, 2.661480188369751, 3.2676634788513184, 3.873847007751465, 4.480030536651611, 5.086214065551758, 5.692397117614746, 6.298580646514893, 6.904764175415039, 7.510947227478027, 8.117130279541016, 8.72331428527832, 9.329497337341309, 9.935681343078613, 10.541864395141602, 11.148048400878906, 11.754231452941895, 12.360414505004883, 12.966598510742188, 13.572781562805176, 14.178964614868164, 14.785148620605469, 15.391331672668457, 15.997514724731445, 16.60369873046875, 17.209882736206055, 17.816064834594727, 18.42224884033203]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 3.0, 10.0, 12.0, 8.0, 22.0, 18.0, 25.0, 28.0, 31.0, 36.0, 33.0, 54.0, 62.0, 77.0, 92.0, 83.0, 70.0, 50.0, 49.0, 44.0, 29.0, 21.0, 27.0, 22.0, 15.0, 26.0, 16.0, 12.0, 6.0, 5.0, 3.0, 6.0, 3.0, 5.0], "bins": [-17.341094970703125, -16.954734802246094, -16.568374633789062, -16.1820125579834, -15.795652389526367, -15.409292221069336, -15.022931098937988, -14.63656997680664, -14.25020980834961, -13.863849639892578, -13.47748851776123, -13.091127395629883, -12.704767227172852, -12.31840705871582, -11.932045936584473, -11.545684814453125, -11.159324645996094, -10.772964477539062, -10.386603355407715, -10.000242233276367, -9.613882064819336, -9.227521896362305, -8.841160774230957, -8.45479965209961, -8.068439483642578, -7.682078838348389, -7.295718193054199, -6.90935754776001, -6.52299690246582, -6.136636257171631, -5.750275611877441, -5.363914966583252, -4.9775543212890625, -4.591193675994873, -4.204833030700684, -3.818472385406494, -3.4321117401123047, -3.0457510948181152, -2.659390449523926, -2.2730298042297363, -1.8866691589355469, -1.5003085136413574, -1.113947868347168, -0.7275872230529785, -0.34122657775878906, 0.04513406753540039, 0.43149471282958984, 0.8178553581237793, 1.2042160034179688, 1.5905766487121582, 1.9769372940063477, 2.363297939300537, 2.7496585845947266, 3.136019229888916, 3.5223798751831055, 3.908740520477295, 4.295101165771484, 4.681461811065674, 5.067822456359863, 5.454183101654053, 5.840543746948242, 6.226904392242432, 6.613265037536621, 6.9996256828308105, 7.385986328125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 9.0, 19.0, 29.0, 57.0, 102.0, 189.0, 392.0, 861.0, 2279.0, 7320.0, 30377.0, 260644.0, 3068399.0, 748603.0, 57948.0, 11458.0, 3393.0, 1216.0, 511.0, 225.0, 115.0, 61.0, 30.0, 23.0, 8.0, 8.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.654296875, -1.6155319213867188, -1.5767669677734375, -1.5380020141601562, -1.499237060546875, -1.4604721069335938, -1.4217071533203125, -1.3829421997070312, -1.34417724609375, -1.3054122924804688, -1.2666473388671875, -1.2278823852539062, -1.189117431640625, -1.1503524780273438, -1.1115875244140625, -1.0728225708007812, -1.0340576171875, -0.9952926635742188, -0.9565277099609375, -0.9177627563476562, -0.878997802734375, -0.8402328491210938, -0.8014678955078125, -0.7627029418945312, -0.72393798828125, -0.6851730346679688, -0.6464080810546875, -0.6076431274414062, -0.568878173828125, -0.5301132202148438, -0.4913482666015625, -0.45258331298828125, -0.413818359375, -0.37505340576171875, -0.3362884521484375, -0.29752349853515625, -0.258758544921875, -0.21999359130859375, -0.1812286376953125, -0.14246368408203125, -0.10369873046875, -0.06493377685546875, -0.0261688232421875, 0.01259613037109375, 0.051361083984375, 0.09012603759765625, 0.1288909912109375, 0.16765594482421875, 0.2064208984375, 0.24518585205078125, 0.2839508056640625, 0.32271575927734375, 0.361480712890625, 0.40024566650390625, 0.4390106201171875, 0.47777557373046875, 0.51654052734375, 0.5553054809570312, 0.5940704345703125, 0.6328353881835938, 0.671600341796875, 0.7103652954101562, 0.7491302490234375, 0.7878952026367188, 0.82666015625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 5.0, 6.0, 8.0, 6.0, 8.0, 10.0, 18.0, 13.0, 20.0, 23.0, 18.0, 26.0, 21.0, 34.0, 45.0, 33.0, 42.0, 41.0, 49.0, 45.0, 40.0, 55.0, 37.0, 52.0, 31.0, 42.0, 41.0, 29.0, 36.0, 31.0, 12.0, 19.0, 17.0, 19.0, 19.0, 14.0, 8.0, 7.0, 7.0, 3.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5634765625, -0.546112060546875, -0.52874755859375, -0.511383056640625, -0.4940185546875, -0.476654052734375, -0.45928955078125, -0.441925048828125, -0.424560546875, -0.407196044921875, -0.38983154296875, -0.372467041015625, -0.3551025390625, -0.337738037109375, -0.32037353515625, -0.303009033203125, -0.28564453125, -0.268280029296875, -0.25091552734375, -0.233551025390625, -0.2161865234375, -0.198822021484375, -0.18145751953125, -0.164093017578125, -0.146728515625, -0.129364013671875, -0.11199951171875, -0.094635009765625, -0.0772705078125, -0.059906005859375, -0.04254150390625, -0.025177001953125, -0.0078125, 0.009552001953125, 0.02691650390625, 0.044281005859375, 0.0616455078125, 0.079010009765625, 0.09637451171875, 0.113739013671875, 0.131103515625, 0.148468017578125, 0.16583251953125, 0.183197021484375, 0.2005615234375, 0.217926025390625, 0.23529052734375, 0.252655029296875, 0.27001953125, 0.287384033203125, 0.30474853515625, 0.322113037109375, 0.3394775390625, 0.356842041015625, 0.37420654296875, 0.391571044921875, 0.408935546875, 0.426300048828125, 0.44366455078125, 0.461029052734375, 0.4783935546875, 0.495758056640625, 0.51312255859375, 0.530487060546875, 0.5478515625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 7.0, 9.0, 12.0, 22.0, 32.0, 46.0, 64.0, 137.0, 227.0, 442.0, 1129.0, 3310.0, 16194.0, 193549.0, 3803599.0, 158031.0, 13113.0, 2586.0, 870.0, 370.0, 202.0, 106.0, 67.0, 51.0, 31.0, 26.0, 14.0, 8.0, 8.0, 7.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0], "bins": [-2.880859375, -2.8078765869140625, -2.734893798828125, -2.6619110107421875, -2.58892822265625, -2.5159454345703125, -2.442962646484375, -2.3699798583984375, -2.2969970703125, -2.2240142822265625, -2.151031494140625, -2.0780487060546875, -2.00506591796875, -1.9320831298828125, -1.859100341796875, -1.7861175537109375, -1.713134765625, -1.6401519775390625, -1.567169189453125, -1.4941864013671875, -1.42120361328125, -1.3482208251953125, -1.275238037109375, -1.2022552490234375, -1.1292724609375, -1.0562896728515625, -0.983306884765625, -0.9103240966796875, -0.83734130859375, -0.7643585205078125, -0.691375732421875, -0.6183929443359375, -0.54541015625, -0.4724273681640625, -0.399444580078125, -0.3264617919921875, -0.25347900390625, -0.1804962158203125, -0.107513427734375, -0.0345306396484375, 0.0384521484375, 0.1114349365234375, 0.184417724609375, 0.2574005126953125, 0.33038330078125, 0.4033660888671875, 0.476348876953125, 0.5493316650390625, 0.622314453125, 0.6952972412109375, 0.768280029296875, 0.8412628173828125, 0.91424560546875, 0.9872283935546875, 1.060211181640625, 1.1331939697265625, 1.2061767578125, 1.2791595458984375, 1.352142333984375, 1.4251251220703125, 1.49810791015625, 1.5710906982421875, 1.644073486328125, 1.7170562744140625, 1.7900390625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 8.0, 13.0, 12.0, 14.0, 12.0, 24.0, 39.0, 40.0, 50.0, 98.0, 160.0, 272.0, 532.0, 835.0, 789.0, 492.0, 271.0, 135.0, 97.0, 54.0, 38.0, 23.0, 16.0, 17.0, 10.0, 10.0, 2.0, 0.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5224609375, -1.473175048828125, -1.42388916015625, -1.374603271484375, -1.3253173828125, -1.276031494140625, -1.22674560546875, -1.177459716796875, -1.128173828125, -1.078887939453125, -1.02960205078125, -0.980316162109375, -0.9310302734375, -0.881744384765625, -0.83245849609375, -0.783172607421875, -0.73388671875, -0.684600830078125, -0.63531494140625, -0.586029052734375, -0.5367431640625, -0.487457275390625, -0.43817138671875, -0.388885498046875, -0.339599609375, -0.290313720703125, -0.24102783203125, -0.191741943359375, -0.1424560546875, -0.093170166015625, -0.04388427734375, 0.005401611328125, 0.0546875, 0.103973388671875, 0.15325927734375, 0.202545166015625, 0.2518310546875, 0.301116943359375, 0.35040283203125, 0.399688720703125, 0.448974609375, 0.498260498046875, 0.54754638671875, 0.596832275390625, 0.6461181640625, 0.695404052734375, 0.74468994140625, 0.793975830078125, 0.84326171875, 0.892547607421875, 0.94183349609375, 0.991119384765625, 1.0404052734375, 1.089691162109375, 1.13897705078125, 1.188262939453125, 1.237548828125, 1.286834716796875, 1.33612060546875, 1.385406494140625, 1.4346923828125, 1.483978271484375, 1.53326416015625, 1.582550048828125, 1.6318359375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 7.0, 5.0, 14.0, 40.0, 82.0, 140.0, 212.0, 206.0, 155.0, 75.0, 26.0, 12.0, 4.0, 7.0, 1.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.668704986572266, -20.125930786132812, -19.58315658569336, -19.040382385253906, -18.497608184814453, -17.954833984375, -17.412059783935547, -16.869287490844727, -16.326513290405273, -15.78373908996582, -15.240964889526367, -14.698190689086914, -14.155417442321777, -13.612643241882324, -13.069869041442871, -12.527094841003418, -11.984320640563965, -11.441546440124512, -10.898772239685059, -10.355998992919922, -9.813224792480469, -9.270450592041016, -8.727676391601562, -8.18490219116211, -7.6421284675598145, -7.099354267120361, -6.556580543518066, -6.013806343078613, -5.47103214263916, -4.928258419036865, -4.385484218597412, -3.842710256576538, -3.2999353408813477, -2.7571613788604736, -2.2143874168395996, -1.6716132164001465, -1.1288392543792725, -0.5860652923583984, -0.04329109191894531, 0.4994828701019287, 1.0422568321228027, 1.5850307941436768, 2.127804756164551, 2.670578956604004, 3.213352918624878, 3.756126880645752, 4.298901081085205, 4.8416748046875, 5.384449005126953, 5.927223205566406, 6.469996929168701, 7.012771129608154, 7.555544853210449, 8.098319053649902, 8.641093254089355, 9.183867454528809, 9.726640701293945, 10.269414901733398, 10.812189102172852, 11.354963302612305, 11.897736549377441, 12.440510749816895, 12.983284950256348, 13.5260591506958, 14.068833351135254]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 6.0, 5.0, 5.0, 11.0, 12.0, 15.0, 11.0, 21.0, 18.0, 24.0, 27.0, 20.0, 25.0, 43.0, 51.0, 39.0, 38.0, 58.0, 37.0, 58.0, 58.0, 43.0, 35.0, 43.0, 43.0, 39.0, 30.0, 31.0, 20.0, 26.0, 21.0, 23.0, 18.0, 5.0, 10.0, 10.0, 6.0, 6.0, 4.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-6.182754039764404, -5.995802879333496, -5.80885124206543, -5.6219000816345215, -5.434948921203613, -5.247997283935547, -5.061046123504639, -4.8740949630737305, -4.687143325805664, -4.500192165374756, -4.3132405281066895, -4.126289367675781, -3.939337968826294, -3.7523865699768066, -3.5654354095458984, -3.378484010696411, -3.191532850265503, -3.0045814514160156, -2.8176302909851074, -2.63067889213562, -2.443727493286133, -2.2567763328552246, -2.0698249340057373, -1.88287353515625, -1.6959222555160522, -1.5089709758758545, -1.3220195770263672, -1.1350682973861694, -0.9481169581413269, -0.7611656188964844, -0.5742143392562866, -0.3872629404067993, -0.20031166076660156, -0.013360336422920227, 0.1735909879207611, 0.36054229736328125, 0.5474936366081238, 0.7344449758529663, 0.9213962554931641, 1.1083476543426514, 1.2952989339828491, 1.4822502136230469, 1.6692016124725342, 1.856152892112732, 2.0431041717529297, 2.230055570602417, 2.4170069694519043, 2.6039581298828125, 2.7909095287323, 2.977860927581787, 3.1648120880126953, 3.3517634868621826, 3.53871488571167, 3.725666046142578, 3.9126174449920654, 4.099568843841553, 4.286520004272461, 4.473471164703369, 4.6604228019714355, 4.847373962402344, 5.034325122833252, 5.221276760101318, 5.408227920532227, 5.595179557800293, 5.782130718231201]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 8.0, 7.0, 11.0, 14.0, 21.0, 29.0, 36.0, 54.0, 86.0, 135.0, 214.0, 368.0, 592.0, 1016.0, 1940.0, 3553.0, 7141.0, 14957.0, 31964.0, 71876.0, 153282.0, 260911.0, 245957.0, 136652.0, 62580.0, 28179.0, 13134.0, 6379.0, 3248.0, 1785.0, 937.0, 563.0, 350.0, 213.0, 117.0, 72.0, 56.0, 31.0, 21.0, 13.0, 12.0, 8.0, 7.0, 6.0, 1.0, 3.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.84375, -0.8164596557617188, -0.7891693115234375, -0.7618789672851562, -0.734588623046875, -0.7072982788085938, -0.6800079345703125, -0.6527175903320312, -0.62542724609375, -0.5981369018554688, -0.5708465576171875, -0.5435562133789062, -0.516265869140625, -0.48897552490234375, -0.4616851806640625, -0.43439483642578125, -0.4071044921875, -0.37981414794921875, -0.3525238037109375, -0.32523345947265625, -0.297943115234375, -0.27065277099609375, -0.2433624267578125, -0.21607208251953125, -0.18878173828125, -0.16149139404296875, -0.1342010498046875, -0.10691070556640625, -0.079620361328125, -0.05233001708984375, -0.0250396728515625, 0.00225067138671875, 0.029541015625, 0.05683135986328125, 0.0841217041015625, 0.11141204833984375, 0.138702392578125, 0.16599273681640625, 0.1932830810546875, 0.22057342529296875, 0.24786376953125, 0.27515411376953125, 0.3024444580078125, 0.32973480224609375, 0.357025146484375, 0.38431549072265625, 0.4116058349609375, 0.43889617919921875, 0.4661865234375, 0.49347686767578125, 0.5207672119140625, 0.5480575561523438, 0.575347900390625, 0.6026382446289062, 0.6299285888671875, 0.6572189331054688, 0.68450927734375, 0.7117996215820312, 0.7390899658203125, 0.7663803100585938, 0.793670654296875, 0.8209609985351562, 0.8482513427734375, 0.8755416870117188, 0.90283203125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 4.0, 3.0, 6.0, 6.0, 11.0, 8.0, 4.0, 13.0, 16.0, 15.0, 14.0, 18.0, 25.0, 17.0, 29.0, 28.0, 29.0, 31.0, 36.0, 36.0, 37.0, 37.0, 39.0, 40.0, 42.0, 39.0, 34.0, 36.0, 41.0, 35.0, 30.0, 36.0, 29.0, 21.0, 27.0, 22.0, 26.0, 16.0, 11.0, 9.0, 12.0, 13.0, 7.0, 4.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50390625, -0.48802947998046875, -0.4721527099609375, -0.45627593994140625, -0.440399169921875, -0.42452239990234375, -0.4086456298828125, -0.39276885986328125, -0.37689208984375, -0.36101531982421875, -0.3451385498046875, -0.32926177978515625, -0.313385009765625, -0.29750823974609375, -0.2816314697265625, -0.26575469970703125, -0.2498779296875, -0.23400115966796875, -0.2181243896484375, -0.20224761962890625, -0.186370849609375, -0.17049407958984375, -0.1546173095703125, -0.13874053955078125, -0.12286376953125, -0.10698699951171875, -0.0911102294921875, -0.07523345947265625, -0.059356689453125, -0.04347991943359375, -0.0276031494140625, -0.01172637939453125, 0.004150390625, 0.02002716064453125, 0.0359039306640625, 0.05178070068359375, 0.067657470703125, 0.08353424072265625, 0.0994110107421875, 0.11528778076171875, 0.13116455078125, 0.14704132080078125, 0.1629180908203125, 0.17879486083984375, 0.194671630859375, 0.21054840087890625, 0.2264251708984375, 0.24230194091796875, 0.2581787109375, 0.27405548095703125, 0.2899322509765625, 0.30580902099609375, 0.321685791015625, 0.33756256103515625, 0.3534393310546875, 0.36931610107421875, 0.38519287109375, 0.40106964111328125, 0.4169464111328125, 0.43282318115234375, 0.448699951171875, 0.46457672119140625, 0.4804534912109375, 0.49633026123046875, 0.51220703125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 8.0, 4.0, 6.0, 8.0, 8.0, 13.0, 15.0, 26.0, 29.0, 49.0, 60.0, 68.0, 143.0, 254.0, 390.0, 712.0, 1400.0, 3386.0, 8985.0, 30838.0, 133240.0, 576979.0, 219317.0, 50567.0, 13230.0, 4678.0, 1975.0, 964.0, 473.0, 244.0, 152.0, 87.0, 73.0, 38.0, 45.0, 25.0, 16.0, 8.0, 14.0, 5.0, 8.0, 2.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5634765625, -1.5141143798828125, -1.464752197265625, -1.4153900146484375, -1.36602783203125, -1.3166656494140625, -1.267303466796875, -1.2179412841796875, -1.1685791015625, -1.1192169189453125, -1.069854736328125, -1.0204925537109375, -0.97113037109375, -0.9217681884765625, -0.872406005859375, -0.8230438232421875, -0.773681640625, -0.7243194580078125, -0.674957275390625, -0.6255950927734375, -0.57623291015625, -0.5268707275390625, -0.477508544921875, -0.4281463623046875, -0.3787841796875, -0.3294219970703125, -0.280059814453125, -0.2306976318359375, -0.18133544921875, -0.1319732666015625, -0.082611083984375, -0.0332489013671875, 0.01611328125, 0.0654754638671875, 0.114837646484375, 0.1641998291015625, 0.21356201171875, 0.2629241943359375, 0.312286376953125, 0.3616485595703125, 0.4110107421875, 0.4603729248046875, 0.509735107421875, 0.5590972900390625, 0.60845947265625, 0.6578216552734375, 0.707183837890625, 0.7565460205078125, 0.805908203125, 0.8552703857421875, 0.904632568359375, 0.9539947509765625, 1.00335693359375, 1.0527191162109375, 1.102081298828125, 1.1514434814453125, 1.2008056640625, 1.2501678466796875, 1.299530029296875, 1.3488922119140625, 1.39825439453125, 1.4476165771484375, 1.496978759765625, 1.5463409423828125, 1.595703125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 3.0, 8.0, 11.0, 13.0, 8.0, 24.0, 22.0, 34.0, 39.0, 36.0, 40.0, 28.0, 58.0, 56.0, 50.0, 61.0, 51.0, 53.0, 51.0, 57.0, 38.0, 47.0, 30.0, 35.0, 29.0, 22.0, 21.0, 12.0, 19.0, 10.0, 5.0, 5.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.818359375, -2.7443695068359375, -2.670379638671875, -2.5963897705078125, -2.52239990234375, -2.4484100341796875, -2.374420166015625, -2.3004302978515625, -2.2264404296875, -2.1524505615234375, -2.078460693359375, -2.0044708251953125, -1.93048095703125, -1.8564910888671875, -1.782501220703125, -1.7085113525390625, -1.634521484375, -1.5605316162109375, -1.486541748046875, -1.4125518798828125, -1.33856201171875, -1.2645721435546875, -1.190582275390625, -1.1165924072265625, -1.0426025390625, -0.9686126708984375, -0.894622802734375, -0.8206329345703125, -0.74664306640625, -0.6726531982421875, -0.598663330078125, -0.5246734619140625, -0.45068359375, -0.3766937255859375, -0.302703857421875, -0.2287139892578125, -0.15472412109375, -0.0807342529296875, -0.006744384765625, 0.0672454833984375, 0.1412353515625, 0.2152252197265625, 0.289215087890625, 0.3632049560546875, 0.43719482421875, 0.5111846923828125, 0.585174560546875, 0.6591644287109375, 0.733154296875, 0.8071441650390625, 0.881134033203125, 0.9551239013671875, 1.02911376953125, 1.1031036376953125, 1.177093505859375, 1.2510833740234375, 1.3250732421875, 1.3990631103515625, 1.473052978515625, 1.5470428466796875, 1.62103271484375, 1.6950225830078125, 1.769012451171875, 1.8430023193359375, 1.9169921875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 4.0, 5.0, 13.0, 12.0, 29.0, 34.0, 72.0, 105.0, 170.0, 360.0, 728.0, 1881.0, 5074.0, 16057.0, 56837.0, 214863.0, 568301.0, 132209.0, 35339.0, 10410.0, 3527.0, 1307.0, 604.0, 257.0, 127.0, 85.0, 52.0, 31.0, 28.0, 12.0, 8.0, 2.0, 4.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37353515625, -0.3587799072265625, -0.344024658203125, -0.3292694091796875, -0.31451416015625, -0.2997589111328125, -0.285003662109375, -0.2702484130859375, -0.2554931640625, -0.2407379150390625, -0.225982666015625, -0.2112274169921875, -0.19647216796875, -0.1817169189453125, -0.166961669921875, -0.1522064208984375, -0.137451171875, -0.1226959228515625, -0.107940673828125, -0.0931854248046875, -0.07843017578125, -0.0636749267578125, -0.048919677734375, -0.0341644287109375, -0.0194091796875, -0.0046539306640625, 0.010101318359375, 0.0248565673828125, 0.03961181640625, 0.0543670654296875, 0.069122314453125, 0.0838775634765625, 0.0986328125, 0.1133880615234375, 0.128143310546875, 0.1428985595703125, 0.15765380859375, 0.1724090576171875, 0.187164306640625, 0.2019195556640625, 0.2166748046875, 0.2314300537109375, 0.246185302734375, 0.2609405517578125, 0.27569580078125, 0.2904510498046875, 0.305206298828125, 0.3199615478515625, 0.334716796875, 0.3494720458984375, 0.364227294921875, 0.3789825439453125, 0.39373779296875, 0.4084930419921875, 0.423248291015625, 0.4380035400390625, 0.4527587890625, 0.4675140380859375, 0.482269287109375, 0.4970245361328125, 0.51177978515625, 0.5265350341796875, 0.541290283203125, 0.5560455322265625, 0.57080078125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 10.0, 9.0, 6.0, 18.0, 10.0, 28.0, 25.0, 48.0, 61.0, 67.0, 97.0, 142.0, 130.0, 90.0, 64.0, 46.0, 41.0, 32.0, 31.0, 12.0, 12.0, 11.0, 4.0, 9.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015664100646972656, -0.00015059113502502441, -0.00014454126358032227, -0.00013849139213562012, -0.00013244152069091797, -0.00012639164924621582, -0.00012034177780151367, -0.00011429190635681152, -0.00010824203491210938, -0.00010219216346740723, -9.614229202270508e-05, -9.009242057800293e-05, -8.404254913330078e-05, -7.799267768859863e-05, -7.194280624389648e-05, -6.589293479919434e-05, -5.984306335449219e-05, -5.379319190979004e-05, -4.774332046508789e-05, -4.169344902038574e-05, -3.5643577575683594e-05, -2.9593706130981445e-05, -2.3543834686279297e-05, -1.749396324157715e-05, -1.1444091796875e-05, -5.3942203521728516e-06, 6.556510925292969e-07, 6.705522537231445e-06, 1.2755393981933594e-05, 1.8805265426635742e-05, 2.485513687133789e-05, 3.090500831604004e-05, 3.695487976074219e-05, 4.3004751205444336e-05, 4.9054622650146484e-05, 5.510449409484863e-05, 6.115436553955078e-05, 6.720423698425293e-05, 7.325410842895508e-05, 7.930397987365723e-05, 8.535385131835938e-05, 9.140372276306152e-05, 9.745359420776367e-05, 0.00010350346565246582, 0.00010955333709716797, 0.00011560320854187012, 0.00012165307998657227, 0.00012770295143127441, 0.00013375282287597656, 0.0001398026943206787, 0.00014585256576538086, 0.000151902437210083, 0.00015795230865478516, 0.0001640021800994873, 0.00017005205154418945, 0.0001761019229888916, 0.00018215179443359375, 0.0001882016658782959, 0.00019425153732299805, 0.0002003014087677002, 0.00020635128021240234, 0.0002124011516571045, 0.00021845102310180664, 0.0002245008945465088, 0.00023055076599121094]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 8.0, 3.0, 7.0, 27.0, 30.0, 55.0, 109.0, 217.0, 493.0, 1225.0, 3978.0, 16274.0, 89280.0, 606463.0, 270414.0, 46605.0, 9223.0, 2588.0, 853.0, 369.0, 140.0, 85.0, 40.0, 24.0, 14.0, 12.0, 2.0, 5.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.634765625, -0.6148147583007812, -0.5948638916015625, -0.5749130249023438, -0.554962158203125, -0.5350112915039062, -0.5150604248046875, -0.49510955810546875, -0.47515869140625, -0.45520782470703125, -0.4352569580078125, -0.41530609130859375, -0.395355224609375, -0.37540435791015625, -0.3554534912109375, -0.33550262451171875, -0.3155517578125, -0.29560089111328125, -0.2756500244140625, -0.25569915771484375, -0.235748291015625, -0.21579742431640625, -0.1958465576171875, -0.17589569091796875, -0.15594482421875, -0.13599395751953125, -0.1160430908203125, -0.09609222412109375, -0.076141357421875, -0.05619049072265625, -0.0362396240234375, -0.01628875732421875, 0.003662109375, 0.02361297607421875, 0.0435638427734375, 0.06351470947265625, 0.083465576171875, 0.10341644287109375, 0.1233673095703125, 0.14331817626953125, 0.16326904296875, 0.18321990966796875, 0.2031707763671875, 0.22312164306640625, 0.243072509765625, 0.26302337646484375, 0.2829742431640625, 0.30292510986328125, 0.3228759765625, 0.34282684326171875, 0.3627777099609375, 0.38272857666015625, 0.402679443359375, 0.42263031005859375, 0.4425811767578125, 0.46253204345703125, 0.48248291015625, 0.5024337768554688, 0.5223846435546875, 0.5423355102539062, 0.562286376953125, 0.5822372436523438, 0.6021881103515625, 0.6221389770507812, 0.64208984375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 0.0, 5.0, 4.0, 9.0, 5.0, 9.0, 14.0, 24.0, 25.0, 42.0, 62.0, 73.0, 92.0, 67.0, 107.0, 96.0, 81.0, 72.0, 58.0, 35.0, 42.0, 25.0, 17.0, 13.0, 11.0, 7.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59326171875, -0.572479248046875, -0.55169677734375, -0.530914306640625, -0.5101318359375, -0.489349365234375, -0.46856689453125, -0.447784423828125, -0.427001953125, -0.406219482421875, -0.38543701171875, -0.364654541015625, -0.3438720703125, -0.323089599609375, -0.30230712890625, -0.281524658203125, -0.2607421875, -0.239959716796875, -0.21917724609375, -0.198394775390625, -0.1776123046875, -0.156829833984375, -0.13604736328125, -0.115264892578125, -0.094482421875, -0.073699951171875, -0.05291748046875, -0.032135009765625, -0.0113525390625, 0.009429931640625, 0.03021240234375, 0.050994873046875, 0.07177734375, 0.092559814453125, 0.11334228515625, 0.134124755859375, 0.1549072265625, 0.175689697265625, 0.19647216796875, 0.217254638671875, 0.238037109375, 0.258819580078125, 0.27960205078125, 0.300384521484375, 0.3211669921875, 0.341949462890625, 0.36273193359375, 0.383514404296875, 0.404296875, 0.425079345703125, 0.44586181640625, 0.466644287109375, 0.4874267578125, 0.508209228515625, 0.52899169921875, 0.549774169921875, 0.570556640625, 0.591339111328125, 0.61212158203125, 0.632904052734375, 0.6536865234375, 0.674468994140625, 0.69525146484375, 0.716033935546875, 0.73681640625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 8.0, 13.0, 18.0, 50.0, 97.0, 147.0, 239.0, 165.0, 106.0, 63.0, 38.0, 20.0, 12.0, 6.0, 1.0, 2.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.703070640563965, -13.25552749633789, -12.8079833984375, -12.360440254211426, -11.912897109985352, -11.465353012084961, -11.017809867858887, -10.570266723632812, -10.122723579406738, -9.675180435180664, -9.227636337280273, -8.7800931930542, -8.332550048828125, -7.885006427764893, -7.43746280670166, -6.989919662475586, -6.5423760414123535, -6.094832420349121, -5.647289276123047, -5.1997456550598145, -4.75220251083374, -4.304658889770508, -3.8571155071258545, -3.409572124481201, -2.962028741836548, -2.5144853591918945, -2.066941976547241, -1.6193984746932983, -1.171855092048645, -0.7243115901947021, -0.27676820755004883, 0.1707751750946045, 0.6183185577392578, 1.0658619403839111, 1.5134053230285645, 1.9609488248825073, 2.408492088317871, 2.8560357093811035, 3.303579092025757, 3.75112247467041, 4.198665618896484, 4.646209239959717, 5.093752384185791, 5.541296005249023, 5.988839149475098, 6.43638277053833, 6.8839263916015625, 7.331469535827637, 7.779013156890869, 8.226556777954102, 8.674099922180176, 9.12164306640625, 9.56918716430664, 10.016730308532715, 10.464273452758789, 10.91181755065918, 11.359360694885254, 11.806903839111328, 12.254447937011719, 12.701991081237793, 13.149534225463867, 13.597078323364258, 14.044621467590332, 14.492164611816406, 14.93970775604248]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 0.0, 4.0, 3.0, 2.0, 5.0, 5.0, 9.0, 8.0, 7.0, 14.0, 13.0, 14.0, 13.0, 19.0, 24.0, 26.0, 36.0, 32.0, 31.0, 55.0, 72.0, 78.0, 78.0, 82.0, 50.0, 48.0, 33.0, 44.0, 21.0, 24.0, 30.0, 20.0, 19.0, 13.0, 10.0, 19.0, 10.0, 11.0, 6.0, 8.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-8.953629493713379, -8.69128704071045, -8.428945541381836, -8.166603088378906, -7.904261112213135, -7.641919136047363, -7.379577159881592, -7.11723518371582, -6.854892730712891, -6.592550754547119, -6.330208778381348, -6.067866325378418, -5.8055243492126465, -5.543182373046875, -5.2808403968811035, -5.018498420715332, -4.7561564445495605, -4.493814468383789, -4.231472492218018, -3.969130277633667, -3.7067880630493164, -3.444446086883545, -3.1821041107177734, -2.919762134552002, -2.6574199199676514, -2.39507794380188, -2.1327357292175293, -1.8703937530517578, -1.6080516576766968, -1.3457095623016357, -1.0833675861358643, -0.8210254907608032, -0.5586833953857422, -0.29634132981300354, -0.03399926424026489, 0.22834277153015137, 0.4906848669052124, 0.7530269622802734, 1.015368938446045, 1.277711033821106, 1.540053129196167, 1.802395224571228, 2.064737319946289, 2.3270792961120605, 2.589421272277832, 2.8517634868621826, 3.114105463027954, 3.3764476776123047, 3.638789653778076, 3.9011316299438477, 4.163473606109619, 4.425815582275391, 4.68815803527832, 4.950500011444092, 5.212841987609863, 5.475183963775635, 5.737525939941406, 5.999867916107178, 6.262209892272949, 6.524552345275879, 6.78689432144165, 7.049236297607422, 7.311578273773193, 7.573920249938965, 7.8362627029418945]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 16.0, 14.0, 35.0, 57.0, 86.0, 181.0, 370.0, 720.0, 1741.0, 4141.0, 13256.0, 59743.0, 595464.0, 2961386.0, 485799.0, 52620.0, 11966.0, 3843.0, 1536.0, 659.0, 298.0, 151.0, 81.0, 52.0, 35.0, 12.0, 7.0, 6.0, 4.0, 1.0, 1.0], "bins": [-1.546875, -1.513580322265625, -1.48028564453125, -1.446990966796875, -1.4136962890625, -1.380401611328125, -1.34710693359375, -1.313812255859375, -1.280517578125, -1.247222900390625, -1.21392822265625, -1.180633544921875, -1.1473388671875, -1.114044189453125, -1.08074951171875, -1.047454833984375, -1.01416015625, -0.980865478515625, -0.94757080078125, -0.914276123046875, -0.8809814453125, -0.847686767578125, -0.81439208984375, -0.781097412109375, -0.747802734375, -0.714508056640625, -0.68121337890625, -0.647918701171875, -0.6146240234375, -0.581329345703125, -0.54803466796875, -0.514739990234375, -0.4814453125, -0.448150634765625, -0.41485595703125, -0.381561279296875, -0.3482666015625, -0.314971923828125, -0.28167724609375, -0.248382568359375, -0.215087890625, -0.181793212890625, -0.14849853515625, -0.115203857421875, -0.0819091796875, -0.048614501953125, -0.01531982421875, 0.017974853515625, 0.05126953125, 0.084564208984375, 0.11785888671875, 0.151153564453125, 0.1844482421875, 0.217742919921875, 0.25103759765625, 0.284332275390625, 0.317626953125, 0.350921630859375, 0.38421630859375, 0.417510986328125, 0.4508056640625, 0.484100341796875, 0.51739501953125, 0.550689697265625, 0.583984375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 7.0, 4.0, 11.0, 3.0, 6.0, 13.0, 8.0, 9.0, 17.0, 20.0, 16.0, 27.0, 36.0, 35.0, 26.0, 34.0, 33.0, 41.0, 40.0, 54.0, 53.0, 54.0, 49.0, 49.0, 44.0, 50.0, 37.0, 26.0, 30.0, 22.0, 28.0, 35.0, 18.0, 14.0, 13.0, 8.0, 6.0, 8.0, 4.0, 7.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.58837890625, -0.5704193115234375, -0.552459716796875, -0.5345001220703125, -0.51654052734375, -0.4985809326171875, -0.480621337890625, -0.4626617431640625, -0.4447021484375, -0.4267425537109375, -0.408782958984375, -0.3908233642578125, -0.37286376953125, -0.3549041748046875, -0.336944580078125, -0.3189849853515625, -0.301025390625, -0.2830657958984375, -0.265106201171875, -0.2471466064453125, -0.22918701171875, -0.2112274169921875, -0.193267822265625, -0.1753082275390625, -0.1573486328125, -0.1393890380859375, -0.121429443359375, -0.1034698486328125, -0.08551025390625, -0.0675506591796875, -0.049591064453125, -0.0316314697265625, -0.013671875, 0.0042877197265625, 0.022247314453125, 0.0402069091796875, 0.05816650390625, 0.0761260986328125, 0.094085693359375, 0.1120452880859375, 0.1300048828125, 0.1479644775390625, 0.165924072265625, 0.1838836669921875, 0.20184326171875, 0.2198028564453125, 0.237762451171875, 0.2557220458984375, 0.273681640625, 0.2916412353515625, 0.309600830078125, 0.3275604248046875, 0.34552001953125, 0.3634796142578125, 0.381439208984375, 0.3993988037109375, 0.4173583984375, 0.4353179931640625, 0.453277587890625, 0.4712371826171875, 0.48919677734375, 0.5071563720703125, 0.525115966796875, 0.5430755615234375, 0.56103515625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 8.0, 6.0, 14.0, 19.0, 31.0, 77.0, 227.0, 685.0, 3127.0, 36685.0, 3689478.0, 450783.0, 10972.0, 1487.0, 408.0, 152.0, 46.0, 37.0, 15.0, 7.0, 9.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.919921875, -2.82806396484375, -2.7362060546875, -2.64434814453125, -2.552490234375, -2.46063232421875, -2.3687744140625, -2.27691650390625, -2.18505859375, -2.09320068359375, -2.0013427734375, -1.90948486328125, -1.817626953125, -1.72576904296875, -1.6339111328125, -1.54205322265625, -1.4501953125, -1.35833740234375, -1.2664794921875, -1.17462158203125, -1.082763671875, -0.99090576171875, -0.8990478515625, -0.80718994140625, -0.71533203125, -0.62347412109375, -0.5316162109375, -0.43975830078125, -0.347900390625, -0.25604248046875, -0.1641845703125, -0.07232666015625, 0.01953125, 0.11138916015625, 0.2032470703125, 0.29510498046875, 0.386962890625, 0.47882080078125, 0.5706787109375, 0.66253662109375, 0.75439453125, 0.84625244140625, 0.9381103515625, 1.02996826171875, 1.121826171875, 1.21368408203125, 1.3055419921875, 1.39739990234375, 1.4892578125, 1.58111572265625, 1.6729736328125, 1.76483154296875, 1.856689453125, 1.94854736328125, 2.0404052734375, 2.13226318359375, 2.22412109375, 2.31597900390625, 2.4078369140625, 2.49969482421875, 2.591552734375, 2.68341064453125, 2.7752685546875, 2.86712646484375, 2.958984375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 9.0, 3.0, 15.0, 15.0, 18.0, 27.0, 63.0, 112.0, 174.0, 316.0, 677.0, 1021.0, 759.0, 386.0, 202.0, 117.0, 59.0, 37.0, 20.0, 13.0, 9.0, 7.0, 5.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7509765625, -1.695556640625, -1.64013671875, -1.584716796875, -1.529296875, -1.473876953125, -1.41845703125, -1.363037109375, -1.3076171875, -1.252197265625, -1.19677734375, -1.141357421875, -1.0859375, -1.030517578125, -0.97509765625, -0.919677734375, -0.8642578125, -0.808837890625, -0.75341796875, -0.697998046875, -0.642578125, -0.587158203125, -0.53173828125, -0.476318359375, -0.4208984375, -0.365478515625, -0.31005859375, -0.254638671875, -0.19921875, -0.143798828125, -0.08837890625, -0.032958984375, 0.0224609375, 0.077880859375, 0.13330078125, 0.188720703125, 0.244140625, 0.299560546875, 0.35498046875, 0.410400390625, 0.4658203125, 0.521240234375, 0.57666015625, 0.632080078125, 0.6875, 0.742919921875, 0.79833984375, 0.853759765625, 0.9091796875, 0.964599609375, 1.02001953125, 1.075439453125, 1.130859375, 1.186279296875, 1.24169921875, 1.297119140625, 1.3525390625, 1.407958984375, 1.46337890625, 1.518798828125, 1.57421875, 1.629638671875, 1.68505859375, 1.740478515625, 1.7958984375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 7.0, 9.0, 18.0, 52.0, 98.0, 219.0, 271.0, 184.0, 82.0, 40.0, 10.0, 9.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.194992065429688, -19.655071258544922, -19.115150451660156, -18.575227737426758, -18.035306930541992, -17.495386123657227, -16.955463409423828, -16.415542602539062, -15.875621795654297, -15.335700988769531, -14.79577922821045, -14.255857467651367, -13.715936660766602, -13.176015853881836, -12.636094093322754, -12.096172332763672, -11.556251525878906, -11.01633071899414, -10.476408958435059, -9.936487197875977, -9.396566390991211, -8.856645584106445, -8.316723823547363, -7.7768025398254395, -7.236881256103516, -6.696959972381592, -6.157038688659668, -5.617117404937744, -5.07719612121582, -4.5372748374938965, -3.9973535537719727, -3.457432270050049, -2.917510986328125, -2.377589702606201, -1.8376684188842773, -1.2977471351623535, -0.7578258514404297, -0.21790456771850586, 0.32201671600341797, 0.8619379997253418, 1.4018592834472656, 1.9417805671691895, 2.4817018508911133, 3.021623134613037, 3.561544418334961, 4.101465702056885, 4.641386985778809, 5.181308269500732, 5.721229553222656, 6.26115083694458, 6.801072120666504, 7.340993404388428, 7.880914688110352, 8.420835494995117, 8.9607572555542, 9.500679016113281, 10.040599822998047, 10.580520629882812, 11.120442390441895, 11.660364151000977, 12.200284957885742, 12.740205764770508, 13.28012752532959, 13.820049285888672, 14.359970092773438]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 8.0, 9.0, 7.0, 9.0, 12.0, 18.0, 18.0, 9.0, 19.0, 24.0, 25.0, 26.0, 37.0, 34.0, 39.0, 37.0, 48.0, 49.0, 48.0, 54.0, 57.0, 59.0, 39.0, 40.0, 35.0, 28.0, 44.0, 23.0, 25.0, 22.0, 18.0, 16.0, 14.0, 17.0, 8.0, 6.0, 4.0, 2.0, 3.0, 1.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.991859436035156, -5.827316761016846, -5.662774085998535, -5.498231887817383, -5.333689212799072, -5.169146537780762, -5.004603862762451, -4.840061187744141, -4.675518989562988, -4.510976314544678, -4.346433639526367, -4.181891441345215, -4.017348766326904, -3.8528060913085938, -3.688263416290283, -3.5237207412719727, -3.359178066253662, -3.1946353912353516, -3.03009295463562, -2.8655502796173096, -2.701007843017578, -2.5364651679992676, -2.371922492980957, -2.2073798179626465, -2.042837381362915, -1.878294825553894, -1.713752269744873, -1.5492095947265625, -1.3846670389175415, -1.2201244831085205, -1.05558180809021, -0.891039252281189, -0.7264962196350098, -0.5619536638259888, -0.397411048412323, -0.23286846280097961, -0.06832587718963623, 0.09621667861938477, 0.26075929403305054, 0.4253019094467163, 0.5898444652557373, 0.7543870210647583, 0.9189296364784241, 1.0834722518920898, 1.2480148077011108, 1.4125573635101318, 1.5771000385284424, 1.7416425943374634, 1.9061851501464844, 2.070727825164795, 2.2352702617645264, 2.399812936782837, 2.5643553733825684, 2.728898048400879, 2.8934407234191895, 3.0579833984375, 3.2225258350372314, 3.387068510055542, 3.5516109466552734, 3.716153621673584, 3.8806962966918945, 4.045238494873047, 4.209781169891357, 4.374323844909668, 4.5388665199279785]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 3.0, 11.0, 7.0, 21.0, 28.0, 22.0, 44.0, 63.0, 104.0, 145.0, 228.0, 396.0, 653.0, 1017.0, 1898.0, 3415.0, 6542.0, 13640.0, 29302.0, 63128.0, 141338.0, 269096.0, 263878.0, 136480.0, 61584.0, 28057.0, 13164.0, 6389.0, 3436.0, 1805.0, 1008.0, 630.0, 352.0, 243.0, 141.0, 91.0, 74.0, 48.0, 29.0, 13.0, 6.0, 11.0, 6.0, 8.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.86767578125, -0.8435592651367188, -0.8194427490234375, -0.7953262329101562, -0.771209716796875, -0.7470932006835938, -0.7229766845703125, -0.6988601684570312, -0.67474365234375, -0.6506271362304688, -0.6265106201171875, -0.6023941040039062, -0.578277587890625, -0.5541610717773438, -0.5300445556640625, -0.5059280395507812, -0.4818115234375, -0.45769500732421875, -0.4335784912109375, -0.40946197509765625, -0.385345458984375, -0.36122894287109375, -0.3371124267578125, -0.31299591064453125, -0.28887939453125, -0.26476287841796875, -0.2406463623046875, -0.21652984619140625, -0.192413330078125, -0.16829681396484375, -0.1441802978515625, -0.12006378173828125, -0.095947265625, -0.07183074951171875, -0.0477142333984375, -0.02359771728515625, 0.000518798828125, 0.02463531494140625, 0.0487518310546875, 0.07286834716796875, 0.09698486328125, 0.12110137939453125, 0.1452178955078125, 0.16933441162109375, 0.193450927734375, 0.21756744384765625, 0.2416839599609375, 0.26580047607421875, 0.2899169921875, 0.31403350830078125, 0.3381500244140625, 0.36226654052734375, 0.386383056640625, 0.41049957275390625, 0.4346160888671875, 0.45873260498046875, 0.48284912109375, 0.5069656372070312, 0.5310821533203125, 0.5551986694335938, 0.579315185546875, 0.6034317016601562, 0.6275482177734375, 0.6516647338867188, 0.67578125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 5.0, 7.0, 9.0, 6.0, 8.0, 13.0, 13.0, 21.0, 20.0, 20.0, 26.0, 33.0, 34.0, 25.0, 32.0, 31.0, 36.0, 35.0, 38.0, 33.0, 44.0, 54.0, 46.0, 48.0, 34.0, 35.0, 29.0, 38.0, 33.0, 31.0, 20.0, 28.0, 17.0, 14.0, 11.0, 15.0, 11.0, 7.0, 5.0, 9.0, 6.0, 7.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.5849609375, -0.5680007934570312, -0.5510406494140625, -0.5340805053710938, -0.517120361328125, -0.5001602172851562, -0.4832000732421875, -0.46623992919921875, -0.44927978515625, -0.43231964111328125, -0.4153594970703125, -0.39839935302734375, -0.381439208984375, -0.36447906494140625, -0.3475189208984375, -0.33055877685546875, -0.3135986328125, -0.29663848876953125, -0.2796783447265625, -0.26271820068359375, -0.245758056640625, -0.22879791259765625, -0.2118377685546875, -0.19487762451171875, -0.17791748046875, -0.16095733642578125, -0.1439971923828125, -0.12703704833984375, -0.110076904296875, -0.09311676025390625, -0.0761566162109375, -0.05919647216796875, -0.042236328125, -0.02527618408203125, -0.0083160400390625, 0.00864410400390625, 0.025604248046875, 0.04256439208984375, 0.0595245361328125, 0.07648468017578125, 0.09344482421875, 0.11040496826171875, 0.1273651123046875, 0.14432525634765625, 0.161285400390625, 0.17824554443359375, 0.1952056884765625, 0.21216583251953125, 0.2291259765625, 0.24608612060546875, 0.2630462646484375, 0.28000640869140625, 0.296966552734375, 0.31392669677734375, 0.3308868408203125, 0.34784698486328125, 0.36480712890625, 0.38176727294921875, 0.3987274169921875, 0.41568756103515625, 0.432647705078125, 0.44960784912109375, 0.4665679931640625, 0.48352813720703125, 0.50048828125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 5.0, 10.0, 9.0, 8.0, 12.0, 26.0, 34.0, 44.0, 65.0, 83.0, 133.0, 180.0, 302.0, 498.0, 985.0, 2467.0, 7771.0, 35268.0, 207488.0, 664104.0, 101764.0, 18863.0, 4787.0, 1703.0, 742.0, 383.0, 257.0, 183.0, 93.0, 104.0, 45.0, 42.0, 17.0, 22.0, 18.0, 8.0, 10.0, 11.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4775390625, -1.4253387451171875, -1.373138427734375, -1.3209381103515625, -1.26873779296875, -1.2165374755859375, -1.164337158203125, -1.1121368408203125, -1.0599365234375, -1.0077362060546875, -0.955535888671875, -0.9033355712890625, -0.85113525390625, -0.7989349365234375, -0.746734619140625, -0.6945343017578125, -0.642333984375, -0.5901336669921875, -0.537933349609375, -0.4857330322265625, -0.43353271484375, -0.3813323974609375, -0.329132080078125, -0.2769317626953125, -0.2247314453125, -0.1725311279296875, -0.120330810546875, -0.0681304931640625, -0.01593017578125, 0.0362701416015625, 0.088470458984375, 0.1406707763671875, 0.19287109375, 0.2450714111328125, 0.297271728515625, 0.3494720458984375, 0.40167236328125, 0.4538726806640625, 0.506072998046875, 0.5582733154296875, 0.6104736328125, 0.6626739501953125, 0.714874267578125, 0.7670745849609375, 0.81927490234375, 0.8714752197265625, 0.923675537109375, 0.9758758544921875, 1.028076171875, 1.0802764892578125, 1.132476806640625, 1.1846771240234375, 1.23687744140625, 1.2890777587890625, 1.341278076171875, 1.3934783935546875, 1.4456787109375, 1.4978790283203125, 1.550079345703125, 1.6022796630859375, 1.65447998046875, 1.7066802978515625, 1.758880615234375, 1.8110809326171875, 1.86328125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 6.0, 5.0, 5.0, 8.0, 9.0, 11.0, 13.0, 19.0, 23.0, 25.0, 34.0, 42.0, 44.0, 39.0, 38.0, 52.0, 42.0, 51.0, 70.0, 63.0, 59.0, 45.0, 45.0, 42.0, 40.0, 30.0, 21.0, 19.0, 14.0, 13.0, 21.0, 12.0, 7.0, 6.0, 10.0, 7.0, 3.0, 6.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.630859375, -2.5587310791015625, -2.486602783203125, -2.4144744873046875, -2.34234619140625, -2.2702178955078125, -2.198089599609375, -2.1259613037109375, -2.0538330078125, -1.9817047119140625, -1.909576416015625, -1.8374481201171875, -1.76531982421875, -1.6931915283203125, -1.621063232421875, -1.5489349365234375, -1.476806640625, -1.4046783447265625, -1.332550048828125, -1.2604217529296875, -1.18829345703125, -1.1161651611328125, -1.044036865234375, -0.9719085693359375, -0.8997802734375, -0.8276519775390625, -0.755523681640625, -0.6833953857421875, -0.61126708984375, -0.5391387939453125, -0.467010498046875, -0.3948822021484375, -0.32275390625, -0.2506256103515625, -0.178497314453125, -0.1063690185546875, -0.03424072265625, 0.0378875732421875, 0.110015869140625, 0.1821441650390625, 0.2542724609375, 0.3264007568359375, 0.398529052734375, 0.4706573486328125, 0.54278564453125, 0.6149139404296875, 0.687042236328125, 0.7591705322265625, 0.831298828125, 0.9034271240234375, 0.975555419921875, 1.0476837158203125, 1.11981201171875, 1.1919403076171875, 1.264068603515625, 1.3361968994140625, 1.4083251953125, 1.4804534912109375, 1.552581787109375, 1.6247100830078125, 1.69683837890625, 1.7689666748046875, 1.841094970703125, 1.9132232666015625, 1.9853515625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 8.0, 6.0, 9.0, 9.0, 14.0, 13.0, 35.0, 42.0, 68.0, 80.0, 149.0, 241.0, 430.0, 875.0, 1965.0, 5243.0, 16186.0, 57625.0, 307185.0, 563682.0, 66498.0, 18060.0, 5878.0, 2128.0, 954.0, 481.0, 265.0, 153.0, 90.0, 53.0, 43.0, 30.0, 13.0, 15.0, 8.0, 7.0, 4.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.472412109375, -0.457672119140625, -0.44293212890625, -0.428192138671875, -0.4134521484375, -0.398712158203125, -0.38397216796875, -0.369232177734375, -0.3544921875, -0.339752197265625, -0.32501220703125, -0.310272216796875, -0.2955322265625, -0.280792236328125, -0.26605224609375, -0.251312255859375, -0.236572265625, -0.221832275390625, -0.20709228515625, -0.192352294921875, -0.1776123046875, -0.162872314453125, -0.14813232421875, -0.133392333984375, -0.11865234375, -0.103912353515625, -0.08917236328125, -0.074432373046875, -0.0596923828125, -0.044952392578125, -0.03021240234375, -0.015472412109375, -0.000732421875, 0.014007568359375, 0.02874755859375, 0.043487548828125, 0.0582275390625, 0.072967529296875, 0.08770751953125, 0.102447509765625, 0.1171875, 0.131927490234375, 0.14666748046875, 0.161407470703125, 0.1761474609375, 0.190887451171875, 0.20562744140625, 0.220367431640625, 0.235107421875, 0.249847412109375, 0.26458740234375, 0.279327392578125, 0.2940673828125, 0.308807373046875, 0.32354736328125, 0.338287353515625, 0.35302734375, 0.367767333984375, 0.38250732421875, 0.397247314453125, 0.4119873046875, 0.426727294921875, 0.44146728515625, 0.456207275390625, 0.470947265625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 1.0, 5.0, 9.0, 7.0, 10.0, 8.0, 20.0, 22.0, 29.0, 25.0, 33.0, 47.0, 67.0, 69.0, 107.0, 107.0, 112.0, 81.0, 57.0, 37.0, 37.0, 21.0, 20.0, 16.0, 7.0, 11.0, 3.0, 4.0, 6.0, 9.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00013256072998046875, -0.00012819841504096985, -0.00012383610010147095, -0.00011947378516197205, -0.00011511147022247314, -0.00011074915528297424, -0.00010638684034347534, -0.00010202452540397644, -9.766221046447754e-05, -9.329989552497864e-05, -8.893758058547974e-05, -8.457526564598083e-05, -8.021295070648193e-05, -7.585063576698303e-05, -7.148832082748413e-05, -6.712600588798523e-05, -6.276369094848633e-05, -5.840137600898743e-05, -5.4039061069488525e-05, -4.9676746129989624e-05, -4.531443119049072e-05, -4.095211625099182e-05, -3.658980131149292e-05, -3.222748637199402e-05, -2.7865171432495117e-05, -2.3502856492996216e-05, -1.9140541553497314e-05, -1.4778226613998413e-05, -1.0415911674499512e-05, -6.05359673500061e-06, -1.691281795501709e-06, 2.6710331439971924e-06, 7.033348083496094e-06, 1.1395663022994995e-05, 1.5757977962493896e-05, 2.0120292901992798e-05, 2.44826078414917e-05, 2.88449227809906e-05, 3.32072377204895e-05, 3.75695526599884e-05, 4.1931867599487305e-05, 4.6294182538986206e-05, 5.065649747848511e-05, 5.501881241798401e-05, 5.938112735748291e-05, 6.374344229698181e-05, 6.810575723648071e-05, 7.246807217597961e-05, 7.683038711547852e-05, 8.119270205497742e-05, 8.555501699447632e-05, 8.991733193397522e-05, 9.427964687347412e-05, 9.864196181297302e-05, 0.00010300427675247192, 0.00010736659169197083, 0.00011172890663146973, 0.00011609122157096863, 0.00012045353651046753, 0.00012481585144996643, 0.00012917816638946533, 0.00013354048132896423, 0.00013790279626846313, 0.00014226511120796204, 0.00014662742614746094]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 14.0, 8.0, 21.0, 25.0, 38.0, 72.0, 142.0, 310.0, 601.0, 1451.0, 3829.0, 13245.0, 61697.0, 647738.0, 265193.0, 40036.0, 9191.0, 2835.0, 1073.0, 529.0, 239.0, 116.0, 47.0, 37.0, 24.0, 13.0, 17.0, 7.0, 4.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.63720703125, -0.6183929443359375, -0.599578857421875, -0.5807647705078125, -0.56195068359375, -0.5431365966796875, -0.524322509765625, -0.5055084228515625, -0.4866943359375, -0.4678802490234375, -0.449066162109375, -0.4302520751953125, -0.41143798828125, -0.3926239013671875, -0.373809814453125, -0.3549957275390625, -0.336181640625, -0.3173675537109375, -0.298553466796875, -0.2797393798828125, -0.26092529296875, -0.2421112060546875, -0.223297119140625, -0.2044830322265625, -0.1856689453125, -0.1668548583984375, -0.148040771484375, -0.1292266845703125, -0.11041259765625, -0.0915985107421875, -0.072784423828125, -0.0539703369140625, -0.03515625, -0.0163421630859375, 0.002471923828125, 0.0212860107421875, 0.04010009765625, 0.0589141845703125, 0.077728271484375, 0.0965423583984375, 0.1153564453125, 0.1341705322265625, 0.152984619140625, 0.1717987060546875, 0.19061279296875, 0.2094268798828125, 0.228240966796875, 0.2470550537109375, 0.265869140625, 0.2846832275390625, 0.303497314453125, 0.3223114013671875, 0.34112548828125, 0.3599395751953125, 0.378753662109375, 0.3975677490234375, 0.4163818359375, 0.4351959228515625, 0.454010009765625, 0.4728240966796875, 0.49163818359375, 0.5104522705078125, 0.529266357421875, 0.5480804443359375, 0.56689453125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 4.0, 6.0, 0.0, 3.0, 9.0, 19.0, 23.0, 21.0, 39.0, 69.0, 68.0, 80.0, 120.0, 103.0, 82.0, 91.0, 57.0, 54.0, 46.0, 27.0, 26.0, 12.0, 10.0, 7.0, 8.0, 2.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56494140625, -0.5475692749023438, -0.5301971435546875, -0.5128250122070312, -0.495452880859375, -0.47808074951171875, -0.4607086181640625, -0.44333648681640625, -0.42596435546875, -0.40859222412109375, -0.3912200927734375, -0.37384796142578125, -0.356475830078125, -0.33910369873046875, -0.3217315673828125, -0.30435943603515625, -0.2869873046875, -0.26961517333984375, -0.2522430419921875, -0.23487091064453125, -0.217498779296875, -0.20012664794921875, -0.1827545166015625, -0.16538238525390625, -0.14801025390625, -0.13063812255859375, -0.1132659912109375, -0.09589385986328125, -0.078521728515625, -0.06114959716796875, -0.0437774658203125, -0.02640533447265625, -0.009033203125, 0.00833892822265625, 0.0257110595703125, 0.04308319091796875, 0.060455322265625, 0.07782745361328125, 0.0951995849609375, 0.11257171630859375, 0.12994384765625, 0.14731597900390625, 0.1646881103515625, 0.18206024169921875, 0.199432373046875, 0.21680450439453125, 0.2341766357421875, 0.25154876708984375, 0.2689208984375, 0.28629302978515625, 0.3036651611328125, 0.32103729248046875, 0.338409423828125, 0.35578155517578125, 0.3731536865234375, 0.39052581787109375, 0.40789794921875, 0.42527008056640625, 0.4426422119140625, 0.46001434326171875, 0.477386474609375, 0.49475860595703125, 0.5121307373046875, 0.5295028686523438, 0.546875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 20.0, 36.0, 60.0, 84.0, 244.0, 245.0, 129.0, 73.0, 40.0, 20.0, 19.0, 9.0, 12.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.146360397338867, -7.738837718963623, -7.331315040588379, -6.923792362213135, -6.516269683837891, -6.108746528625488, -5.701224327087402, -5.293701171875, -4.886178970336914, -4.47865629196167, -4.071133613586426, -3.6636109352111816, -3.2560882568359375, -2.8485653400421143, -2.44104266166687, -2.033519983291626, -1.6259970664978027, -1.2184743881225586, -0.8109516501426697, -0.40342891216278076, 0.004093766212463379, 0.41161656379699707, 0.8191392421722412, 1.2266619205474854, 1.6341845989227295, 2.0417072772979736, 2.4492299556732178, 2.856752872467041, 3.264275550842285, 3.6717982292175293, 4.079320907592773, 4.486843585968018, 4.894366264343262, 5.301888942718506, 5.70941162109375, 6.116934299468994, 6.524456977844238, 6.931980133056641, 7.339502334594727, 7.747025489807129, 8.154547691345215, 8.562070846557617, 8.969593048095703, 9.377116203308105, 9.784638404846191, 10.192161560058594, 10.59968376159668, 11.007206916809082, 11.414730072021484, 11.822253227233887, 12.229775428771973, 12.637298583984375, 13.044820785522461, 13.452343940734863, 13.85986614227295, 14.267389297485352, 14.674911499023438, 15.08243465423584, 15.489956855773926, 15.897480010986328, 16.305002212524414, 16.7125244140625, 17.12004852294922, 17.527570724487305, 17.93509292602539]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 1.0, 7.0, 8.0, 9.0, 17.0, 12.0, 13.0, 9.0, 24.0, 17.0, 27.0, 26.0, 20.0, 32.0, 33.0, 39.0, 56.0, 112.0, 102.0, 75.0, 51.0, 36.0, 38.0, 38.0, 31.0, 24.0, 29.0, 18.0, 19.0, 11.0, 16.0, 12.0, 15.0, 11.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.032028198242188, -8.775113105773926, -8.518198013305664, -8.261282920837402, -8.00436782836914, -7.747452735900879, -7.490537643432617, -7.2336225509643555, -6.976707458496094, -6.719792366027832, -6.46287727355957, -6.205962181091309, -5.949047088623047, -5.692131996154785, -5.435216903686523, -5.178301811218262, -4.921386241912842, -4.66447114944458, -4.407556056976318, -4.150640964508057, -3.893725872039795, -3.636810779571533, -3.3798954486846924, -3.1229803562164307, -2.866065263748169, -2.6091501712799072, -2.3522350788116455, -2.0953197479248047, -1.8384047746658325, -1.5814896821975708, -1.3245744705200195, -1.0676593780517578, -0.8107442855834961, -0.5538291931152344, -0.2969140410423279, -0.03999888896942139, 0.21691620349884033, 0.47383129596710205, 0.7307465076446533, 0.987661600112915, 1.2445766925811768, 1.5014917850494385, 1.7584068775177002, 2.015322208404541, 2.2722373008728027, 2.5291523933410645, 2.786067485809326, 3.042982578277588, 3.2998976707458496, 3.5568127632141113, 3.813727855682373, 4.070642948150635, 4.3275580406188965, 4.584473133087158, 4.841388702392578, 5.09830379486084, 5.355218887329102, 5.612133979797363, 5.869049072265625, 6.125964164733887, 6.382879257202148, 6.63979434967041, 6.896709442138672, 7.153624534606934, 7.410539627075195]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 10.0, 8.0, 29.0, 43.0, 69.0, 112.0, 196.0, 412.0, 765.0, 1795.0, 4235.0, 11848.0, 42340.0, 220783.0, 1457748.0, 2023795.0, 345597.0, 59522.0, 15405.0, 5392.0, 2144.0, 965.0, 484.0, 256.0, 127.0, 86.0, 54.0, 29.0, 12.0, 9.0, 5.0, 2.0, 3.0, 2.0, 0.0, 3.0], "bins": [-1.1240234375, -1.0979537963867188, -1.0718841552734375, -1.0458145141601562, -1.019744873046875, -0.9936752319335938, -0.9676055908203125, -0.9415359497070312, -0.91546630859375, -0.8893966674804688, -0.8633270263671875, -0.8372573852539062, -0.811187744140625, -0.7851181030273438, -0.7590484619140625, -0.7329788208007812, -0.7069091796875, -0.6808395385742188, -0.6547698974609375, -0.6287002563476562, -0.602630615234375, -0.5765609741210938, -0.5504913330078125, -0.5244216918945312, -0.49835205078125, -0.47228240966796875, -0.4462127685546875, -0.42014312744140625, -0.394073486328125, -0.36800384521484375, -0.3419342041015625, -0.31586456298828125, -0.289794921875, -0.26372528076171875, -0.2376556396484375, -0.21158599853515625, -0.185516357421875, -0.15944671630859375, -0.1333770751953125, -0.10730743408203125, -0.08123779296875, -0.05516815185546875, -0.0290985107421875, -0.00302886962890625, 0.023040771484375, 0.04911041259765625, 0.0751800537109375, 0.10124969482421875, 0.1273193359375, 0.15338897705078125, 0.1794586181640625, 0.20552825927734375, 0.231597900390625, 0.25766754150390625, 0.2837371826171875, 0.30980682373046875, 0.33587646484375, 0.36194610595703125, 0.3880157470703125, 0.41408538818359375, 0.440155029296875, 0.46622467041015625, 0.4922943115234375, 0.5183639526367188, 0.54443359375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 5.0, 4.0, 2.0, 5.0, 5.0, 7.0, 16.0, 12.0, 16.0, 23.0, 25.0, 27.0, 20.0, 38.0, 30.0, 30.0, 40.0, 35.0, 35.0, 45.0, 35.0, 44.0, 46.0, 45.0, 48.0, 50.0, 43.0, 32.0, 34.0, 36.0, 29.0, 24.0, 19.0, 20.0, 18.0, 10.0, 10.0, 11.0, 6.0, 8.0, 6.0, 6.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.57373046875, -0.5561599731445312, -0.5385894775390625, -0.5210189819335938, -0.503448486328125, -0.48587799072265625, -0.4683074951171875, -0.45073699951171875, -0.43316650390625, -0.41559600830078125, -0.3980255126953125, -0.38045501708984375, -0.362884521484375, -0.34531402587890625, -0.3277435302734375, -0.31017303466796875, -0.2926025390625, -0.27503204345703125, -0.2574615478515625, -0.23989105224609375, -0.222320556640625, -0.20475006103515625, -0.1871795654296875, -0.16960906982421875, -0.15203857421875, -0.13446807861328125, -0.1168975830078125, -0.09932708740234375, -0.081756591796875, -0.06418609619140625, -0.0466156005859375, -0.02904510498046875, -0.011474609375, 0.00609588623046875, 0.0236663818359375, 0.04123687744140625, 0.058807373046875, 0.07637786865234375, 0.0939483642578125, 0.11151885986328125, 0.12908935546875, 0.14665985107421875, 0.1642303466796875, 0.18180084228515625, 0.199371337890625, 0.21694183349609375, 0.2345123291015625, 0.25208282470703125, 0.2696533203125, 0.28722381591796875, 0.3047943115234375, 0.32236480712890625, 0.339935302734375, 0.35750579833984375, 0.3750762939453125, 0.39264678955078125, 0.41021728515625, 0.42778778076171875, 0.4453582763671875, 0.46292877197265625, 0.480499267578125, 0.49806976318359375, 0.5156402587890625, 0.5332107543945312, 0.55078125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 5.0, 8.0, 4.0, 10.0, 8.0, 19.0, 27.0, 31.0, 38.0, 75.0, 101.0, 185.0, 358.0, 737.0, 1818.0, 6261.0, 31972.0, 340834.0, 3442645.0, 329319.0, 30881.0, 5870.0, 1645.0, 664.0, 293.0, 161.0, 90.0, 67.0, 47.0, 25.0, 23.0, 19.0, 9.0, 11.0, 9.0, 6.0, 2.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.580078125, -1.534271240234375, -1.48846435546875, -1.442657470703125, -1.3968505859375, -1.351043701171875, -1.30523681640625, -1.259429931640625, -1.213623046875, -1.167816162109375, -1.12200927734375, -1.076202392578125, -1.0303955078125, -0.984588623046875, -0.93878173828125, -0.892974853515625, -0.84716796875, -0.801361083984375, -0.75555419921875, -0.709747314453125, -0.6639404296875, -0.618133544921875, -0.57232666015625, -0.526519775390625, -0.480712890625, -0.434906005859375, -0.38909912109375, -0.343292236328125, -0.2974853515625, -0.251678466796875, -0.20587158203125, -0.160064697265625, -0.1142578125, -0.068450927734375, -0.02264404296875, 0.023162841796875, 0.0689697265625, 0.114776611328125, 0.16058349609375, 0.206390380859375, 0.252197265625, 0.298004150390625, 0.34381103515625, 0.389617919921875, 0.4354248046875, 0.481231689453125, 0.52703857421875, 0.572845458984375, 0.61865234375, 0.664459228515625, 0.71026611328125, 0.756072998046875, 0.8018798828125, 0.847686767578125, 0.89349365234375, 0.939300537109375, 0.985107421875, 1.030914306640625, 1.07672119140625, 1.122528076171875, 1.1683349609375, 1.214141845703125, 1.25994873046875, 1.305755615234375, 1.3515625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 3.0, 3.0, 6.0, 10.0, 14.0, 14.0, 18.0, 32.0, 41.0, 45.0, 91.0, 166.0, 242.0, 395.0, 596.0, 763.0, 619.0, 360.0, 248.0, 152.0, 76.0, 63.0, 37.0, 25.0, 10.0, 16.0, 13.0, 9.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.51953125, -1.47412109375, -1.4287109375, -1.38330078125, -1.337890625, -1.29248046875, -1.2470703125, -1.20166015625, -1.15625, -1.11083984375, -1.0654296875, -1.02001953125, -0.974609375, -0.92919921875, -0.8837890625, -0.83837890625, -0.79296875, -0.74755859375, -0.7021484375, -0.65673828125, -0.611328125, -0.56591796875, -0.5205078125, -0.47509765625, -0.4296875, -0.38427734375, -0.3388671875, -0.29345703125, -0.248046875, -0.20263671875, -0.1572265625, -0.11181640625, -0.06640625, -0.02099609375, 0.0244140625, 0.06982421875, 0.115234375, 0.16064453125, 0.2060546875, 0.25146484375, 0.296875, 0.34228515625, 0.3876953125, 0.43310546875, 0.478515625, 0.52392578125, 0.5693359375, 0.61474609375, 0.66015625, 0.70556640625, 0.7509765625, 0.79638671875, 0.841796875, 0.88720703125, 0.9326171875, 0.97802734375, 1.0234375, 1.06884765625, 1.1142578125, 1.15966796875, 1.205078125, 1.25048828125, 1.2958984375, 1.34130859375, 1.38671875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 17.0, 29.0, 58.0, 163.0, 210.0, 218.0, 143.0, 87.0, 29.0, 14.0, 9.0, 8.0, 1.0, 4.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.287250518798828, -14.811155319213867, -14.335061073303223, -13.858966827392578, -13.382871627807617, -12.906776428222656, -12.430682182312012, -11.954587936401367, -11.478492736816406, -11.002397537231445, -10.5263032913208, -10.050209045410156, -9.574113845825195, -9.098018646240234, -8.62192440032959, -8.145830154418945, -7.669734954833984, -7.193640232086182, -6.717545509338379, -6.241450786590576, -5.765356063842773, -5.289261341094971, -4.813166618347168, -4.337071895599365, -3.8609771728515625, -3.3848824501037598, -2.908787727355957, -2.4326930046081543, -1.9565982818603516, -1.4805035591125488, -1.004408836364746, -0.5283141136169434, -0.05221843719482422, 0.4238762855529785, 0.8999710083007812, 1.376065731048584, 1.8521604537963867, 2.3282551765441895, 2.804349899291992, 3.280444622039795, 3.7565393447875977, 4.2326340675354, 4.708728790283203, 5.184823513031006, 5.660918235778809, 6.137012958526611, 6.613107681274414, 7.089202404022217, 7.5652971267700195, 8.041391372680664, 8.517486572265625, 8.993581771850586, 9.46967601776123, 9.945770263671875, 10.421865463256836, 10.897960662841797, 11.374054908752441, 11.850149154663086, 12.326244354248047, 12.802339553833008, 13.278433799743652, 13.754528045654297, 14.230623245239258, 14.706718444824219, 15.182812690734863]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 5.0, 3.0, 10.0, 5.0, 9.0, 8.0, 12.0, 4.0, 12.0, 18.0, 17.0, 21.0, 14.0, 30.0, 35.0, 35.0, 38.0, 40.0, 41.0, 38.0, 32.0, 36.0, 34.0, 42.0, 43.0, 40.0, 34.0, 35.0, 36.0, 41.0, 36.0, 27.0, 26.0, 17.0, 16.0, 19.0, 13.0, 11.0, 12.0, 9.0, 10.0, 7.0, 6.0, 6.0, 5.0, 3.0, 2.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-4.812309741973877, -4.6557722091674805, -4.499234676361084, -4.342697620391846, -4.186160087585449, -4.029622554779053, -3.8730850219726562, -3.7165474891662598, -3.5600101947784424, -3.403472661972046, -3.2469353675842285, -3.090397834777832, -2.9338603019714355, -2.777323007583618, -2.6207854747772217, -2.4642481803894043, -2.307710647583008, -2.1511731147766113, -1.994635820388794, -1.8380982875823975, -1.6815608739852905, -1.5250234603881836, -1.368485927581787, -1.2119485139846802, -1.0554111003875732, -0.8988736867904663, -0.7423362135887146, -0.5857987403869629, -0.42926132678985596, -0.272723913192749, -0.11618643999099731, 0.040351033210754395, 0.19688892364501953, 0.35342636704444885, 0.5099638104438782, 0.6665012836456299, 0.8230386972427368, 0.9795761108398438, 1.1361136436462402, 1.2926510572433472, 1.449188470840454, 1.605725884437561, 1.762263298034668, 1.9188008308410645, 2.075338363647461, 2.2318756580352783, 2.388413190841675, 2.544950485229492, 2.7014880180358887, 2.858025550842285, 3.0145628452301025, 3.171100378036499, 3.3276376724243164, 3.484175205230713, 3.6407127380371094, 3.797250270843506, 3.9537875652313232, 4.110324859619141, 4.266862392425537, 4.423399925231934, 4.57993745803833, 4.736474990844727, 4.893012046813965, 5.049549579620361, 5.206087112426758]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 8.0, 6.0, 10.0, 11.0, 19.0, 22.0, 30.0, 35.0, 57.0, 79.0, 120.0, 207.0, 326.0, 525.0, 844.0, 1446.0, 2432.0, 4237.0, 7397.0, 13395.0, 25705.0, 50767.0, 106179.0, 224537.0, 289985.0, 163552.0, 76136.0, 37023.0, 19400.0, 10117.0, 5731.0, 3317.0, 1934.0, 1073.0, 659.0, 432.0, 258.0, 191.0, 108.0, 80.0, 59.0, 38.0, 25.0, 13.0, 7.0, 10.0, 8.0, 7.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7568359375, -0.730072021484375, -0.70330810546875, -0.676544189453125, -0.6497802734375, -0.623016357421875, -0.59625244140625, -0.569488525390625, -0.542724609375, -0.515960693359375, -0.48919677734375, -0.462432861328125, -0.4356689453125, -0.408905029296875, -0.38214111328125, -0.355377197265625, -0.32861328125, -0.301849365234375, -0.27508544921875, -0.248321533203125, -0.2215576171875, -0.194793701171875, -0.16802978515625, -0.141265869140625, -0.114501953125, -0.087738037109375, -0.06097412109375, -0.034210205078125, -0.0074462890625, 0.019317626953125, 0.04608154296875, 0.072845458984375, 0.099609375, 0.126373291015625, 0.15313720703125, 0.179901123046875, 0.2066650390625, 0.233428955078125, 0.26019287109375, 0.286956787109375, 0.313720703125, 0.340484619140625, 0.36724853515625, 0.394012451171875, 0.4207763671875, 0.447540283203125, 0.47430419921875, 0.501068115234375, 0.52783203125, 0.554595947265625, 0.58135986328125, 0.608123779296875, 0.6348876953125, 0.661651611328125, 0.68841552734375, 0.715179443359375, 0.741943359375, 0.768707275390625, 0.79547119140625, 0.822235107421875, 0.8489990234375, 0.875762939453125, 0.90252685546875, 0.929290771484375, 0.9560546875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 4.0, 2.0, 6.0, 2.0, 7.0, 11.0, 7.0, 13.0, 15.0, 19.0, 16.0, 17.0, 23.0, 28.0, 22.0, 23.0, 36.0, 32.0, 28.0, 33.0, 42.0, 35.0, 56.0, 45.0, 45.0, 42.0, 45.0, 36.0, 38.0, 41.0, 29.0, 34.0, 19.0, 25.0, 14.0, 15.0, 13.0, 21.0, 11.0, 10.0, 6.0, 7.0, 10.0, 4.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.58837890625, -0.5712203979492188, -0.5540618896484375, -0.5369033813476562, -0.519744873046875, -0.5025863647460938, -0.4854278564453125, -0.46826934814453125, -0.45111083984375, -0.43395233154296875, -0.4167938232421875, -0.39963531494140625, -0.382476806640625, -0.36531829833984375, -0.3481597900390625, -0.33100128173828125, -0.3138427734375, -0.29668426513671875, -0.2795257568359375, -0.26236724853515625, -0.245208740234375, -0.22805023193359375, -0.2108917236328125, -0.19373321533203125, -0.17657470703125, -0.15941619873046875, -0.1422576904296875, -0.12509918212890625, -0.107940673828125, -0.09078216552734375, -0.0736236572265625, -0.05646514892578125, -0.039306640625, -0.02214813232421875, -0.0049896240234375, 0.01216888427734375, 0.029327392578125, 0.04648590087890625, 0.0636444091796875, 0.08080291748046875, 0.09796142578125, 0.11511993408203125, 0.1322784423828125, 0.14943695068359375, 0.166595458984375, 0.18375396728515625, 0.2009124755859375, 0.21807098388671875, 0.2352294921875, 0.25238800048828125, 0.2695465087890625, 0.28670501708984375, 0.303863525390625, 0.32102203369140625, 0.3381805419921875, 0.35533905029296875, 0.37249755859375, 0.38965606689453125, 0.4068145751953125, 0.42397308349609375, 0.441131591796875, 0.45829010009765625, 0.4754486083984375, 0.49260711669921875, 0.509765625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 5.0, 9.0, 6.0, 5.0, 10.0, 20.0, 26.0, 22.0, 51.0, 60.0, 73.0, 116.0, 168.0, 255.0, 374.0, 543.0, 1116.0, 2200.0, 5934.0, 22111.0, 128637.0, 746062.0, 110814.0, 19456.0, 5431.0, 2113.0, 1129.0, 597.0, 398.0, 242.0, 178.0, 128.0, 78.0, 49.0, 34.0, 33.0, 29.0, 12.0, 11.0, 8.0, 5.0, 4.0, 6.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.583984375, -1.52630615234375, -1.4686279296875, -1.41094970703125, -1.353271484375, -1.29559326171875, -1.2379150390625, -1.18023681640625, -1.12255859375, -1.06488037109375, -1.0072021484375, -0.94952392578125, -0.891845703125, -0.83416748046875, -0.7764892578125, -0.71881103515625, -0.6611328125, -0.60345458984375, -0.5457763671875, -0.48809814453125, -0.430419921875, -0.37274169921875, -0.3150634765625, -0.25738525390625, -0.19970703125, -0.14202880859375, -0.0843505859375, -0.02667236328125, 0.031005859375, 0.08868408203125, 0.1463623046875, 0.20404052734375, 0.26171875, 0.31939697265625, 0.3770751953125, 0.43475341796875, 0.492431640625, 0.55010986328125, 0.6077880859375, 0.66546630859375, 0.72314453125, 0.78082275390625, 0.8385009765625, 0.89617919921875, 0.953857421875, 1.01153564453125, 1.0692138671875, 1.12689208984375, 1.1845703125, 1.24224853515625, 1.2999267578125, 1.35760498046875, 1.415283203125, 1.47296142578125, 1.5306396484375, 1.58831787109375, 1.64599609375, 1.70367431640625, 1.7613525390625, 1.81903076171875, 1.876708984375, 1.93438720703125, 1.9920654296875, 2.04974365234375, 2.107421875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 6.0, 6.0, 11.0, 5.0, 5.0, 8.0, 15.0, 13.0, 12.0, 20.0, 32.0, 40.0, 27.0, 36.0, 49.0, 44.0, 56.0, 58.0, 61.0, 49.0, 42.0, 56.0, 49.0, 39.0, 41.0, 31.0, 29.0, 30.0, 18.0, 17.0, 14.0, 17.0, 7.0, 18.0, 6.0, 7.0, 8.0, 6.0, 4.0, 2.0, 3.0, 3.0, 4.0, 0.0, 2.0], "bins": [-2.5859375, -2.5176544189453125, -2.449371337890625, -2.3810882568359375, -2.31280517578125, -2.2445220947265625, -2.176239013671875, -2.1079559326171875, -2.0396728515625, -1.9713897705078125, -1.903106689453125, -1.8348236083984375, -1.76654052734375, -1.6982574462890625, -1.629974365234375, -1.5616912841796875, -1.493408203125, -1.4251251220703125, -1.356842041015625, -1.2885589599609375, -1.22027587890625, -1.1519927978515625, -1.083709716796875, -1.0154266357421875, -0.9471435546875, -0.8788604736328125, -0.810577392578125, -0.7422943115234375, -0.67401123046875, -0.6057281494140625, -0.537445068359375, -0.4691619873046875, -0.40087890625, -0.3325958251953125, -0.264312744140625, -0.1960296630859375, -0.12774658203125, -0.0594635009765625, 0.008819580078125, 0.0771026611328125, 0.1453857421875, 0.2136688232421875, 0.281951904296875, 0.3502349853515625, 0.41851806640625, 0.4868011474609375, 0.555084228515625, 0.6233673095703125, 0.691650390625, 0.7599334716796875, 0.828216552734375, 0.8964996337890625, 0.96478271484375, 1.0330657958984375, 1.101348876953125, 1.1696319580078125, 1.2379150390625, 1.3061981201171875, 1.374481201171875, 1.4427642822265625, 1.51104736328125, 1.5793304443359375, 1.647613525390625, 1.7158966064453125, 1.7841796875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 8.0, 11.0, 9.0, 12.0, 19.0, 26.0, 32.0, 54.0, 70.0, 128.0, 187.0, 339.0, 515.0, 1033.0, 2182.0, 5526.0, 18674.0, 91503.0, 772014.0, 121673.0, 22895.0, 6420.0, 2491.0, 1168.0, 566.0, 327.0, 219.0, 149.0, 87.0, 69.0, 39.0, 39.0, 22.0, 19.0, 10.0, 6.0, 6.0, 5.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59619140625, -0.576690673828125, -0.55718994140625, -0.537689208984375, -0.5181884765625, -0.498687744140625, -0.47918701171875, -0.459686279296875, -0.440185546875, -0.420684814453125, -0.40118408203125, -0.381683349609375, -0.3621826171875, -0.342681884765625, -0.32318115234375, -0.303680419921875, -0.2841796875, -0.264678955078125, -0.24517822265625, -0.225677490234375, -0.2061767578125, -0.186676025390625, -0.16717529296875, -0.147674560546875, -0.128173828125, -0.108673095703125, -0.08917236328125, -0.069671630859375, -0.0501708984375, -0.030670166015625, -0.01116943359375, 0.008331298828125, 0.02783203125, 0.047332763671875, 0.06683349609375, 0.086334228515625, 0.1058349609375, 0.125335693359375, 0.14483642578125, 0.164337158203125, 0.183837890625, 0.203338623046875, 0.22283935546875, 0.242340087890625, 0.2618408203125, 0.281341552734375, 0.30084228515625, 0.320343017578125, 0.33984375, 0.359344482421875, 0.37884521484375, 0.398345947265625, 0.4178466796875, 0.437347412109375, 0.45684814453125, 0.476348876953125, 0.495849609375, 0.515350341796875, 0.53485107421875, 0.554351806640625, 0.5738525390625, 0.593353271484375, 0.61285400390625, 0.632354736328125, 0.65185546875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 7.0, 4.0, 9.0, 10.0, 7.0, 11.0, 14.0, 18.0, 26.0, 30.0, 29.0, 60.0, 90.0, 109.0, 113.0, 93.0, 88.0, 77.0, 42.0, 29.0, 28.0, 20.0, 12.0, 15.0, 8.0, 12.0, 6.0, 4.0, 3.0, 7.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014257431030273438, -0.00013723596930503845, -0.00013189762830734253, -0.0001265592873096466, -0.00012122094631195068, -0.00011588260531425476, -0.00011054426431655884, -0.00010520592331886292, -9.986758232116699e-05, -9.452924132347107e-05, -8.919090032577515e-05, -8.385255932807922e-05, -7.85142183303833e-05, -7.317587733268738e-05, -6.783753633499146e-05, -6.249919533729553e-05, -5.716085433959961e-05, -5.1822513341903687e-05, -4.6484172344207764e-05, -4.114583134651184e-05, -3.580749034881592e-05, -3.0469149351119995e-05, -2.5130808353424072e-05, -1.979246735572815e-05, -1.4454126358032227e-05, -9.115785360336304e-06, -3.777444362640381e-06, 1.560896635055542e-06, 6.899237632751465e-06, 1.2237578630447388e-05, 1.757591962814331e-05, 2.2914260625839233e-05, 2.8252601623535156e-05, 3.359094262123108e-05, 3.8929283618927e-05, 4.4267624616622925e-05, 4.960596561431885e-05, 5.494430661201477e-05, 6.028264760971069e-05, 6.562098860740662e-05, 7.095932960510254e-05, 7.629767060279846e-05, 8.163601160049438e-05, 8.697435259819031e-05, 9.231269359588623e-05, 9.765103459358215e-05, 0.00010298937559127808, 0.000108327716588974, 0.00011366605758666992, 0.00011900439858436584, 0.00012434273958206177, 0.0001296810805797577, 0.0001350194215774536, 0.00014035776257514954, 0.00014569610357284546, 0.00015103444457054138, 0.0001563727855682373, 0.00016171112656593323, 0.00016704946756362915, 0.00017238780856132507, 0.000177726149559021, 0.00018306449055671692, 0.00018840283155441284, 0.00019374117255210876, 0.0001990795135498047]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 7.0, 10.0, 13.0, 13.0, 18.0, 12.0, 53.0, 78.0, 124.0, 250.0, 411.0, 858.0, 2253.0, 7268.0, 31518.0, 227059.0, 705129.0, 56793.0, 11078.0, 3169.0, 1217.0, 536.0, 291.0, 158.0, 89.0, 56.0, 27.0, 21.0, 19.0, 10.0, 9.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61767578125, -0.5978546142578125, -0.578033447265625, -0.5582122802734375, -0.53839111328125, -0.5185699462890625, -0.498748779296875, -0.4789276123046875, -0.4591064453125, -0.4392852783203125, -0.419464111328125, -0.3996429443359375, -0.37982177734375, -0.3600006103515625, -0.340179443359375, -0.3203582763671875, -0.300537109375, -0.2807159423828125, -0.260894775390625, -0.2410736083984375, -0.22125244140625, -0.2014312744140625, -0.181610107421875, -0.1617889404296875, -0.1419677734375, -0.1221466064453125, -0.102325439453125, -0.0825042724609375, -0.06268310546875, -0.0428619384765625, -0.023040771484375, -0.0032196044921875, 0.0166015625, 0.0364227294921875, 0.056243896484375, 0.0760650634765625, 0.09588623046875, 0.1157073974609375, 0.135528564453125, 0.1553497314453125, 0.1751708984375, 0.1949920654296875, 0.214813232421875, 0.2346343994140625, 0.25445556640625, 0.2742767333984375, 0.294097900390625, 0.3139190673828125, 0.333740234375, 0.3535614013671875, 0.373382568359375, 0.3932037353515625, 0.41302490234375, 0.4328460693359375, 0.452667236328125, 0.4724884033203125, 0.4923095703125, 0.5121307373046875, 0.531951904296875, 0.5517730712890625, 0.57159423828125, 0.5914154052734375, 0.611236572265625, 0.6310577392578125, 0.65087890625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 8.0, 1.0, 8.0, 12.0, 7.0, 10.0, 16.0, 21.0, 14.0, 17.0, 21.0, 22.0, 21.0, 35.0, 26.0, 39.0, 47.0, 72.0, 58.0, 77.0, 68.0, 58.0, 46.0, 36.0, 31.0, 29.0, 22.0, 18.0, 32.0, 18.0, 19.0, 17.0, 5.0, 10.0, 17.0, 7.0, 8.0, 6.0, 2.0, 3.0, 4.0, 1.0, 7.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26416015625, -0.2541007995605469, -0.24404144287109375, -0.23398208618164062, -0.2239227294921875, -0.21386337280273438, -0.20380401611328125, -0.19374465942382812, -0.183685302734375, -0.17362594604492188, -0.16356658935546875, -0.15350723266601562, -0.1434478759765625, -0.13338851928710938, -0.12332916259765625, -0.11326980590820312, -0.10321044921875, -0.09315109252929688, -0.08309173583984375, -0.07303237915039062, -0.0629730224609375, -0.052913665771484375, -0.04285430908203125, -0.032794952392578125, -0.022735595703125, -0.012676239013671875, -0.00261688232421875, 0.007442474365234375, 0.0175018310546875, 0.027561187744140625, 0.03762054443359375, 0.047679901123046875, 0.0577392578125, 0.06779861450195312, 0.07785797119140625, 0.08791732788085938, 0.0979766845703125, 0.10803604125976562, 0.11809539794921875, 0.12815475463867188, 0.138214111328125, 0.14827346801757812, 0.15833282470703125, 0.16839218139648438, 0.1784515380859375, 0.18851089477539062, 0.19857025146484375, 0.20862960815429688, 0.21868896484375, 0.22874832153320312, 0.23880767822265625, 0.24886703491210938, 0.2589263916015625, 0.2689857482910156, 0.27904510498046875, 0.2891044616699219, 0.299163818359375, 0.3092231750488281, 0.31928253173828125, 0.3293418884277344, 0.3394012451171875, 0.3494606018066406, 0.35951995849609375, 0.3695793151855469, 0.379638671875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 8.0, 25.0, 49.0, 167.0, 456.0, 142.0, 71.0, 39.0, 19.0, 11.0, 6.0, 7.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.847379684448242, -9.04951286315918, -8.2516450881958, -7.453778266906738, -6.655910968780518, -5.858043670654297, -5.060176849365234, -4.262309551239014, -3.464442253112793, -2.6665749549865723, -1.8687078952789307, -1.070840835571289, -0.27297353744506836, 0.5248937606811523, 1.3227605819702148, 2.1206278800964355, 2.9184951782226562, 3.716362476348877, 4.514229774475098, 5.31209659576416, 6.109963893890381, 6.907831192016602, 7.705698013305664, 8.503564834594727, 9.301432609558105, 10.099299430847168, 10.897167205810547, 11.69503402709961, 12.492900848388672, 13.29076862335205, 14.088635444641113, 14.886503219604492, 15.684368133544922, 16.482234954833984, 17.280101776123047, 18.07796859741211, 18.875837326049805, 19.673704147338867, 20.47157096862793, 21.269437789916992, 22.067306518554688, 22.86517333984375, 23.663040161132812, 24.460906982421875, 25.25877571105957, 26.056642532348633, 26.854509353637695, 27.652376174926758, 28.45024299621582, 29.248109817504883, 30.045976638793945, 30.84384536743164, 31.641712188720703, 32.439579010009766, 33.23744583129883, 34.03531265258789, 34.83317947387695, 35.631046295166016, 36.42891311645508, 37.22677993774414, 38.0246467590332, 38.82251739501953, 39.620384216308594, 40.418251037597656, 41.21611785888672]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 10.0, 4.0, 5.0, 9.0, 5.0, 11.0, 9.0, 19.0, 12.0, 15.0, 15.0, 18.0, 11.0, 23.0, 21.0, 16.0, 27.0, 27.0, 45.0, 63.0, 120.0, 132.0, 66.0, 32.0, 26.0, 39.0, 21.0, 23.0, 17.0, 30.0, 16.0, 15.0, 13.0, 12.0, 14.0, 14.0, 5.0, 7.0, 6.0, 4.0, 5.0, 3.0, 5.0, 4.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.11758804321289, -7.879914283752441, -7.64224100112915, -7.404567241668701, -7.16689395904541, -6.929220199584961, -6.691546440124512, -6.453873157501221, -6.2161993980407715, -5.978525638580322, -5.740852355957031, -5.503178596496582, -5.265505313873291, -5.027831554412842, -4.790158271789551, -4.552484512329102, -4.314810752868652, -4.077136993408203, -3.839463710784912, -3.601789951324463, -3.3641164302825928, -3.1264429092407227, -2.8887693881988525, -2.6510958671569824, -2.4134225845336914, -2.1757490634918213, -1.9380754232406616, -1.7004019021987915, -1.4627282619476318, -1.2250547409057617, -0.9873812198638916, -0.7497075796127319, -0.5120339393615723, -0.2743603587150574, -0.03668680787086487, 0.20098674297332764, 0.43866032361984253, 0.6763339042663574, 0.9140074253082275, 1.1516810655593872, 1.3893545866012573, 1.6270281076431274, 1.864701747894287, 2.1023752689361572, 2.3400487899780273, 2.5777225494384766, 2.8153958320617676, 3.053069591522217, 3.290743112564087, 3.528416633605957, 3.766090154647827, 4.003763675689697, 4.2414374351501465, 4.4791107177734375, 4.716784477233887, 4.954458236694336, 5.192131519317627, 5.429805278778076, 5.667478561401367, 5.905152320861816, 6.142825603485107, 6.380499362945557, 6.618172645568848, 6.855846405029297, 7.093520164489746]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 10.0, 4.0, 6.0, 15.0, 19.0, 30.0, 38.0, 68.0, 123.0, 179.0, 311.0, 570.0, 1064.0, 2163.0, 5158.0, 14676.0, 52826.0, 259936.0, 1266269.0, 1936595.0, 516528.0, 98933.0, 24204.0, 8143.0, 3213.0, 1432.0, 744.0, 404.0, 237.0, 156.0, 92.0, 51.0, 41.0, 21.0, 10.0, 7.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1025390625, -1.0703048706054688, -1.0380706787109375, -1.0058364868164062, -0.973602294921875, -0.9413681030273438, -0.9091339111328125, -0.8768997192382812, -0.84466552734375, -0.8124313354492188, -0.7801971435546875, -0.7479629516601562, -0.715728759765625, -0.6834945678710938, -0.6512603759765625, -0.6190261840820312, -0.5867919921875, -0.5545578002929688, -0.5223236083984375, -0.49008941650390625, -0.457855224609375, -0.42562103271484375, -0.3933868408203125, -0.36115264892578125, -0.32891845703125, -0.29668426513671875, -0.2644500732421875, -0.23221588134765625, -0.199981689453125, -0.16774749755859375, -0.1355133056640625, -0.10327911376953125, -0.071044921875, -0.03881072998046875, -0.0065765380859375, 0.02565765380859375, 0.057891845703125, 0.09012603759765625, 0.1223602294921875, 0.15459442138671875, 0.18682861328125, 0.21906280517578125, 0.2512969970703125, 0.28353118896484375, 0.315765380859375, 0.34799957275390625, 0.3802337646484375, 0.41246795654296875, 0.4447021484375, 0.47693634033203125, 0.5091705322265625, 0.5414047241210938, 0.573638916015625, 0.6058731079101562, 0.6381072998046875, 0.6703414916992188, 0.70257568359375, 0.7348098754882812, 0.7670440673828125, 0.7992782592773438, 0.831512451171875, 0.8637466430664062, 0.8959808349609375, 0.9282150268554688, 0.96044921875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 3.0, 0.0, 3.0, 4.0, 3.0, 10.0, 12.0, 11.0, 10.0, 13.0, 20.0, 15.0, 18.0, 30.0, 26.0, 28.0, 30.0, 38.0, 33.0, 32.0, 53.0, 48.0, 44.0, 44.0, 44.0, 44.0, 53.0, 35.0, 41.0, 32.0, 29.0, 31.0, 18.0, 27.0, 23.0, 18.0, 15.0, 16.0, 14.0, 8.0, 9.0, 5.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.548828125, -0.5313034057617188, -0.5137786865234375, -0.49625396728515625, -0.478729248046875, -0.46120452880859375, -0.4436798095703125, -0.42615509033203125, -0.40863037109375, -0.39110565185546875, -0.3735809326171875, -0.35605621337890625, -0.338531494140625, -0.32100677490234375, -0.3034820556640625, -0.28595733642578125, -0.2684326171875, -0.25090789794921875, -0.2333831787109375, -0.21585845947265625, -0.198333740234375, -0.18080902099609375, -0.1632843017578125, -0.14575958251953125, -0.12823486328125, -0.11071014404296875, -0.0931854248046875, -0.07566070556640625, -0.058135986328125, -0.04061126708984375, -0.0230865478515625, -0.00556182861328125, 0.011962890625, 0.02948760986328125, 0.0470123291015625, 0.06453704833984375, 0.082061767578125, 0.09958648681640625, 0.1171112060546875, 0.13463592529296875, 0.15216064453125, 0.16968536376953125, 0.1872100830078125, 0.20473480224609375, 0.222259521484375, 0.23978424072265625, 0.2573089599609375, 0.27483367919921875, 0.2923583984375, 0.30988311767578125, 0.3274078369140625, 0.34493255615234375, 0.362457275390625, 0.37998199462890625, 0.3975067138671875, 0.41503143310546875, 0.43255615234375, 0.45008087158203125, 0.4676055908203125, 0.48513031005859375, 0.502655029296875, 0.5201797485351562, 0.5377044677734375, 0.5552291870117188, 0.57275390625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 4.0, 5.0, 12.0, 11.0, 21.0, 17.0, 46.0, 100.0, 233.0, 441.0, 1193.0, 4743.0, 141935.0, 4020870.0, 20856.0, 2339.0, 782.0, 298.0, 176.0, 81.0, 48.0, 25.0, 19.0, 12.0, 5.0, 4.0, 0.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.55078125, -4.38409423828125, -4.2174072265625, -4.05072021484375, -3.884033203125, -3.71734619140625, -3.5506591796875, -3.38397216796875, -3.21728515625, -3.05059814453125, -2.8839111328125, -2.71722412109375, -2.550537109375, -2.38385009765625, -2.2171630859375, -2.05047607421875, -1.8837890625, -1.71710205078125, -1.5504150390625, -1.38372802734375, -1.217041015625, -1.05035400390625, -0.8836669921875, -0.71697998046875, -0.55029296875, -0.38360595703125, -0.2169189453125, -0.05023193359375, 0.116455078125, 0.28314208984375, 0.4498291015625, 0.61651611328125, 0.783203125, 0.94989013671875, 1.1165771484375, 1.28326416015625, 1.449951171875, 1.61663818359375, 1.7833251953125, 1.95001220703125, 2.11669921875, 2.28338623046875, 2.4500732421875, 2.61676025390625, 2.783447265625, 2.95013427734375, 3.1168212890625, 3.28350830078125, 3.4501953125, 3.61688232421875, 3.7835693359375, 3.95025634765625, 4.116943359375, 4.28363037109375, 4.4503173828125, 4.61700439453125, 4.78369140625, 4.95037841796875, 5.1170654296875, 5.28375244140625, 5.450439453125, 5.61712646484375, 5.7838134765625, 5.95050048828125, 6.1171875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 7.0, 13.0, 23.0, 35.0, 81.0, 145.0, 275.0, 554.0, 1086.0, 922.0, 480.0, 238.0, 113.0, 44.0, 29.0, 13.0, 10.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8671875, -3.74578857421875, -3.6243896484375, -3.50299072265625, -3.381591796875, -3.26019287109375, -3.1387939453125, -3.01739501953125, -2.89599609375, -2.77459716796875, -2.6531982421875, -2.53179931640625, -2.410400390625, -2.28900146484375, -2.1676025390625, -2.04620361328125, -1.9248046875, -1.80340576171875, -1.6820068359375, -1.56060791015625, -1.439208984375, -1.31781005859375, -1.1964111328125, -1.07501220703125, -0.95361328125, -0.83221435546875, -0.7108154296875, -0.58941650390625, -0.468017578125, -0.34661865234375, -0.2252197265625, -0.10382080078125, 0.017578125, 0.13897705078125, 0.2603759765625, 0.38177490234375, 0.503173828125, 0.62457275390625, 0.7459716796875, 0.86737060546875, 0.98876953125, 1.11016845703125, 1.2315673828125, 1.35296630859375, 1.474365234375, 1.59576416015625, 1.7171630859375, 1.83856201171875, 1.9599609375, 2.08135986328125, 2.2027587890625, 2.32415771484375, 2.445556640625, 2.56695556640625, 2.6883544921875, 2.80975341796875, 2.93115234375, 3.05255126953125, 3.1739501953125, 3.29534912109375, 3.416748046875, 3.53814697265625, 3.6595458984375, 3.78094482421875, 3.90234375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 12.0, 21.0, 68.0, 128.0, 238.0, 250.0, 144.0, 57.0, 33.0, 21.0, 11.0, 7.0, 1.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.005016326904297, -23.92644691467285, -22.847877502441406, -21.76930809020996, -20.690738677978516, -19.612171173095703, -18.533601760864258, -17.455032348632812, -16.376462936401367, -15.297893524169922, -14.219324111938477, -13.140755653381348, -12.062186241149902, -10.983616828918457, -9.905048370361328, -8.826478958129883, -7.7479095458984375, -6.669340133666992, -5.590771198272705, -4.512202262878418, -3.4336328506469727, -2.3550634384155273, -1.2764945030212402, -0.19792556762695312, 0.8806438446044922, 1.9592130184173584, 3.0377821922302246, 4.116351127624512, 5.194920539855957, 6.273489952087402, 7.3520588874816895, 8.430627822875977, 9.509193420410156, 10.587762832641602, 11.666332244873047, 12.744900703430176, 13.823470115661621, 14.902039527893066, 15.980607986450195, 17.05917739868164, 18.137746810913086, 19.21631622314453, 20.294885635375977, 21.373455047607422, 22.452022552490234, 23.530593872070312, 24.609161376953125, 25.68773078918457, 26.766300201416016, 27.84486961364746, 28.923439025878906, 30.00200843811035, 31.080577850341797, 32.15914535522461, 33.23771667480469, 34.3162841796875, 35.39485168457031, 36.473419189453125, 37.5519905090332, 38.630558013916016, 39.709129333496094, 40.787696838378906, 41.866268157958984, 42.9448356628418, 44.023406982421875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 4.0, 2.0, 4.0, 1.0, 4.0, 8.0, 6.0, 12.0, 17.0, 17.0, 19.0, 29.0, 28.0, 31.0, 48.0, 57.0, 68.0, 70.0, 91.0, 102.0, 84.0, 48.0, 44.0, 54.0, 28.0, 30.0, 25.0, 18.0, 18.0, 11.0, 10.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.929338455200195, -15.431610107421875, -14.933880805969238, -14.436152458190918, -13.938424110412598, -13.440694808959961, -12.94296646118164, -12.44523811340332, -11.947508811950684, -11.449780464172363, -10.952051162719727, -10.454322814941406, -9.956594467163086, -9.45886516571045, -8.961136817932129, -8.463407516479492, -7.96567964553833, -7.467950820922852, -6.970222473144531, -6.472493648529053, -5.974764823913574, -5.477036476135254, -4.979307651519775, -4.481578826904297, -3.9838502407073975, -3.486121654510498, -2.9883928298950195, -2.49066424369812, -1.9929355382919312, -1.4952068328857422, -0.9974782466888428, -0.49974942207336426, -0.0020208358764648438, 0.49570783972740173, 0.9934365153312683, 1.4911651611328125, 1.9888938665390015, 2.4866225719451904, 2.98435115814209, 3.4820799827575684, 3.9798085689544678, 4.477537155151367, 4.975265979766846, 5.472994804382324, 5.9707231521606445, 6.468451976776123, 6.966180801391602, 7.463909149169922, 7.9616379737854, 8.459366798400879, 8.9570951461792, 9.454824447631836, 9.952552795410156, 10.450281143188477, 10.948009490966797, 11.445738792419434, 11.943467140197754, 12.441195487976074, 12.938924789428711, 13.436653137207031, 13.934381484985352, 14.432110786437988, 14.929839134216309, 15.427568435668945, 15.925296783447266]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 1.0, 3.0, 6.0, 8.0, 14.0, 13.0, 31.0, 52.0, 67.0, 138.0, 239.0, 438.0, 842.0, 1913.0, 4453.0, 11916.0, 39216.0, 167780.0, 618235.0, 148905.0, 35546.0, 10922.0, 4190.0, 1790.0, 845.0, 422.0, 224.0, 121.0, 97.0, 36.0, 25.0, 20.0, 17.0, 9.0, 12.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6240234375, -1.5806732177734375, -1.537322998046875, -1.4939727783203125, -1.45062255859375, -1.4072723388671875, -1.363922119140625, -1.3205718994140625, -1.2772216796875, -1.2338714599609375, -1.190521240234375, -1.1471710205078125, -1.10382080078125, -1.0604705810546875, -1.017120361328125, -0.9737701416015625, -0.930419921875, -0.8870697021484375, -0.843719482421875, -0.8003692626953125, -0.75701904296875, -0.7136688232421875, -0.670318603515625, -0.6269683837890625, -0.5836181640625, -0.5402679443359375, -0.496917724609375, -0.4535675048828125, -0.41021728515625, -0.3668670654296875, -0.323516845703125, -0.2801666259765625, -0.23681640625, -0.1934661865234375, -0.150115966796875, -0.1067657470703125, -0.06341552734375, -0.0200653076171875, 0.023284912109375, 0.0666351318359375, 0.1099853515625, 0.1533355712890625, 0.196685791015625, 0.2400360107421875, 0.28338623046875, 0.3267364501953125, 0.370086669921875, 0.4134368896484375, 0.456787109375, 0.5001373291015625, 0.543487548828125, 0.5868377685546875, 0.63018798828125, 0.6735382080078125, 0.716888427734375, 0.7602386474609375, 0.8035888671875, 0.8469390869140625, 0.890289306640625, 0.9336395263671875, 0.97698974609375, 1.0203399658203125, 1.063690185546875, 1.1070404052734375, 1.150390625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 6.0, 7.0, 9.0, 10.0, 15.0, 7.0, 23.0, 18.0, 25.0, 28.0, 29.0, 55.0, 58.0, 41.0, 58.0, 61.0, 52.0, 62.0, 54.0, 50.0, 56.0, 47.0, 39.0, 34.0, 23.0, 29.0, 23.0, 13.0, 12.0, 11.0, 11.0, 9.0, 6.0, 6.0, 5.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.93310546875, -0.9070281982421875, -0.880950927734375, -0.8548736572265625, -0.82879638671875, -0.8027191162109375, -0.776641845703125, -0.7505645751953125, -0.7244873046875, -0.6984100341796875, -0.672332763671875, -0.6462554931640625, -0.62017822265625, -0.5941009521484375, -0.568023681640625, -0.5419464111328125, -0.515869140625, -0.4897918701171875, -0.463714599609375, -0.4376373291015625, -0.41156005859375, -0.3854827880859375, -0.359405517578125, -0.3333282470703125, -0.3072509765625, -0.2811737060546875, -0.255096435546875, -0.2290191650390625, -0.20294189453125, -0.1768646240234375, -0.150787353515625, -0.1247100830078125, -0.0986328125, -0.0725555419921875, -0.046478271484375, -0.0204010009765625, 0.00567626953125, 0.0317535400390625, 0.057830810546875, 0.0839080810546875, 0.1099853515625, 0.1360626220703125, 0.162139892578125, 0.1882171630859375, 0.21429443359375, 0.2403717041015625, 0.266448974609375, 0.2925262451171875, 0.318603515625, 0.3446807861328125, 0.370758056640625, 0.3968353271484375, 0.42291259765625, 0.4489898681640625, 0.475067138671875, 0.5011444091796875, 0.5272216796875, 0.5532989501953125, 0.579376220703125, 0.6054534912109375, 0.63153076171875, 0.6576080322265625, 0.683685302734375, 0.7097625732421875, 0.73583984375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 9.0, 7.0, 8.0, 18.0, 17.0, 25.0, 35.0, 45.0, 71.0, 114.0, 187.0, 337.0, 631.0, 1538.0, 5789.0, 42898.0, 898877.0, 84894.0, 9184.0, 2057.0, 795.0, 388.0, 219.0, 139.0, 78.0, 59.0, 33.0, 28.0, 18.0, 15.0, 13.0, 7.0, 7.0, 6.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5947265625, -1.5299835205078125, -1.465240478515625, -1.4004974365234375, -1.33575439453125, -1.2710113525390625, -1.206268310546875, -1.1415252685546875, -1.0767822265625, -1.0120391845703125, -0.947296142578125, -0.8825531005859375, -0.81781005859375, -0.7530670166015625, -0.688323974609375, -0.6235809326171875, -0.558837890625, -0.4940948486328125, -0.429351806640625, -0.3646087646484375, -0.29986572265625, -0.2351226806640625, -0.170379638671875, -0.1056365966796875, -0.0408935546875, 0.0238494873046875, 0.088592529296875, 0.1533355712890625, 0.21807861328125, 0.2828216552734375, 0.347564697265625, 0.4123077392578125, 0.47705078125, 0.5417938232421875, 0.606536865234375, 0.6712799072265625, 0.73602294921875, 0.8007659912109375, 0.865509033203125, 0.9302520751953125, 0.9949951171875, 1.0597381591796875, 1.124481201171875, 1.1892242431640625, 1.25396728515625, 1.3187103271484375, 1.383453369140625, 1.4481964111328125, 1.512939453125, 1.5776824951171875, 1.642425537109375, 1.7071685791015625, 1.77191162109375, 1.8366546630859375, 1.901397705078125, 1.9661407470703125, 2.0308837890625, 2.0956268310546875, 2.160369873046875, 2.2251129150390625, 2.28985595703125, 2.3545989990234375, 2.419342041015625, 2.4840850830078125, 2.548828125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 2.0, 7.0, 6.0, 9.0, 10.0, 8.0, 22.0, 21.0, 23.0, 19.0, 39.0, 47.0, 49.0, 66.0, 76.0, 98.0, 96.0, 77.0, 75.0, 55.0, 40.0, 30.0, 21.0, 18.0, 15.0, 18.0, 14.0, 9.0, 11.0, 4.0, 4.0, 3.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.953125, -2.8343505859375, -2.715576171875, -2.5968017578125, -2.47802734375, -2.3592529296875, -2.240478515625, -2.1217041015625, -2.0029296875, -1.8841552734375, -1.765380859375, -1.6466064453125, -1.52783203125, -1.4090576171875, -1.290283203125, -1.1715087890625, -1.052734375, -0.9339599609375, -0.815185546875, -0.6964111328125, -0.57763671875, -0.4588623046875, -0.340087890625, -0.2213134765625, -0.1025390625, 0.0162353515625, 0.135009765625, 0.2537841796875, 0.37255859375, 0.4913330078125, 0.610107421875, 0.7288818359375, 0.84765625, 0.9664306640625, 1.085205078125, 1.2039794921875, 1.32275390625, 1.4415283203125, 1.560302734375, 1.6790771484375, 1.7978515625, 1.9166259765625, 2.035400390625, 2.1541748046875, 2.27294921875, 2.3917236328125, 2.510498046875, 2.6292724609375, 2.748046875, 2.8668212890625, 2.985595703125, 3.1043701171875, 3.22314453125, 3.3419189453125, 3.460693359375, 3.5794677734375, 3.6982421875, 3.8170166015625, 3.935791015625, 4.0545654296875, 4.17333984375, 4.2921142578125, 4.410888671875, 4.5296630859375, 4.6484375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 1.0, 3.0, 5.0, 5.0, 13.0, 13.0, 13.0, 18.0, 35.0, 42.0, 63.0, 112.0, 215.0, 335.0, 810.0, 2301.0, 7831.0, 40920.0, 879908.0, 96580.0, 13659.0, 3448.0, 1137.0, 482.0, 234.0, 135.0, 84.0, 46.0, 27.0, 24.0, 16.0, 14.0, 11.0, 2.0, 4.0, 0.0, 2.0, 5.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.431396484375, -0.4193077087402344, -0.40721893310546875, -0.3951301574707031, -0.3830413818359375, -0.3709526062011719, -0.35886383056640625, -0.3467750549316406, -0.334686279296875, -0.3225975036621094, -0.31050872802734375, -0.2984199523925781, -0.2863311767578125, -0.2742424011230469, -0.26215362548828125, -0.2500648498535156, -0.23797607421875, -0.22588729858398438, -0.21379852294921875, -0.20170974731445312, -0.1896209716796875, -0.17753219604492188, -0.16544342041015625, -0.15335464477539062, -0.141265869140625, -0.12917709350585938, -0.11708831787109375, -0.10499954223632812, -0.0929107666015625, -0.08082199096679688, -0.06873321533203125, -0.056644439697265625, -0.0445556640625, -0.032466888427734375, -0.02037811279296875, -0.008289337158203125, 0.0037994384765625, 0.015888214111328125, 0.02797698974609375, 0.040065765380859375, 0.052154541015625, 0.06424331665039062, 0.07633209228515625, 0.08842086791992188, 0.1005096435546875, 0.11259841918945312, 0.12468719482421875, 0.13677597045898438, 0.14886474609375, 0.16095352172851562, 0.17304229736328125, 0.18513107299804688, 0.1972198486328125, 0.20930862426757812, 0.22139739990234375, 0.23348617553710938, 0.245574951171875, 0.2576637268066406, 0.26975250244140625, 0.2818412780761719, 0.2939300537109375, 0.3060188293457031, 0.31810760498046875, 0.3301963806152344, 0.34228515625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 7.0, 10.0, 2.0, 9.0, 8.0, 12.0, 13.0, 22.0, 17.0, 25.0, 29.0, 38.0, 56.0, 95.0, 103.0, 117.0, 114.0, 79.0, 55.0, 40.0, 27.0, 25.0, 21.0, 10.0, 13.0, 4.0, 5.0, 9.0, 2.0, 6.0, 4.0, 4.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0], "bins": [-0.0001055002212524414, -0.00010260380804538727, -9.970739483833313e-05, -9.681098163127899e-05, -9.391456842422485e-05, -9.101815521717072e-05, -8.812174201011658e-05, -8.522532880306244e-05, -8.23289155960083e-05, -7.943250238895416e-05, -7.653608918190002e-05, -7.363967597484589e-05, -7.074326276779175e-05, -6.784684956073761e-05, -6.495043635368347e-05, -6.205402314662933e-05, -5.9157609939575195e-05, -5.626119673252106e-05, -5.336478352546692e-05, -5.046837031841278e-05, -4.757195711135864e-05, -4.4675543904304504e-05, -4.1779130697250366e-05, -3.888271749019623e-05, -3.598630428314209e-05, -3.308989107608795e-05, -3.0193477869033813e-05, -2.7297064661979675e-05, -2.4400651454925537e-05, -2.15042382478714e-05, -1.860782504081726e-05, -1.5711411833763123e-05, -1.2814998626708984e-05, -9.918585419654846e-06, -7.022172212600708e-06, -4.12575900554657e-06, -1.2293457984924316e-06, 1.6670674085617065e-06, 4.563480615615845e-06, 7.459893822669983e-06, 1.0356307029724121e-05, 1.325272023677826e-05, 1.6149133443832397e-05, 1.9045546650886536e-05, 2.1941959857940674e-05, 2.4838373064994812e-05, 2.773478627204895e-05, 3.063119947910309e-05, 3.3527612686157227e-05, 3.6424025893211365e-05, 3.93204391002655e-05, 4.221685230731964e-05, 4.511326551437378e-05, 4.800967872142792e-05, 5.0906091928482056e-05, 5.3802505135536194e-05, 5.669891834259033e-05, 5.959533154964447e-05, 6.249174475669861e-05, 6.538815796375275e-05, 6.828457117080688e-05, 7.118098437786102e-05, 7.407739758491516e-05, 7.69738107919693e-05, 7.987022399902344e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 12.0, 8.0, 17.0, 17.0, 32.0, 34.0, 72.0, 103.0, 233.0, 429.0, 844.0, 1846.0, 4766.0, 15544.0, 69960.0, 835197.0, 91254.0, 18443.0, 5662.0, 2156.0, 922.0, 446.0, 214.0, 128.0, 70.0, 46.0, 31.0, 23.0, 13.0, 8.0, 5.0, 6.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.330078125, -0.3217353820800781, -0.31339263916015625, -0.3050498962402344, -0.2967071533203125, -0.2883644104003906, -0.28002166748046875, -0.2716789245605469, -0.263336181640625, -0.2549934387207031, -0.24665069580078125, -0.23830795288085938, -0.2299652099609375, -0.22162246704101562, -0.21327972412109375, -0.20493698120117188, -0.19659423828125, -0.18825149536132812, -0.17990875244140625, -0.17156600952148438, -0.1632232666015625, -0.15488052368164062, -0.14653778076171875, -0.13819503784179688, -0.129852294921875, -0.12150955200195312, -0.11316680908203125, -0.10482406616210938, -0.0964813232421875, -0.08813858032226562, -0.07979583740234375, -0.07145309448242188, -0.0631103515625, -0.054767608642578125, -0.04642486572265625, -0.038082122802734375, -0.0297393798828125, -0.021396636962890625, -0.01305389404296875, -0.004711151123046875, 0.003631591796875, 0.011974334716796875, 0.02031707763671875, 0.028659820556640625, 0.0370025634765625, 0.045345306396484375, 0.05368804931640625, 0.062030792236328125, 0.07037353515625, 0.07871627807617188, 0.08705902099609375, 0.09540176391601562, 0.1037445068359375, 0.11208724975585938, 0.12042999267578125, 0.12877273559570312, 0.137115478515625, 0.14545822143554688, 0.15380096435546875, 0.16214370727539062, 0.1704864501953125, 0.17882919311523438, 0.18717193603515625, 0.19551467895507812, 0.203857421875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 3.0, 1.0, 2.0, 4.0, 1.0, 10.0, 4.0, 8.0, 7.0, 9.0, 5.0, 16.0, 13.0, 29.0, 20.0, 29.0, 31.0, 44.0, 62.0, 70.0, 74.0, 76.0, 65.0, 65.0, 62.0, 52.0, 53.0, 38.0, 23.0, 23.0, 22.0, 11.0, 12.0, 7.0, 5.0, 10.0, 7.0, 2.0, 4.0, 4.0, 6.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.232421875, -0.22484970092773438, -0.21727752685546875, -0.20970535278320312, -0.2021331787109375, -0.19456100463867188, -0.18698883056640625, -0.17941665649414062, -0.171844482421875, -0.16427230834960938, -0.15670013427734375, -0.14912796020507812, -0.1415557861328125, -0.13398361206054688, -0.12641143798828125, -0.11883926391601562, -0.11126708984375, -0.10369491577148438, -0.09612274169921875, -0.08855056762695312, -0.0809783935546875, -0.07340621948242188, -0.06583404541015625, -0.058261871337890625, -0.050689697265625, -0.043117523193359375, -0.03554534912109375, -0.027973175048828125, -0.0204010009765625, -0.012828826904296875, -0.00525665283203125, 0.002315521240234375, 0.0098876953125, 0.017459869384765625, 0.02503204345703125, 0.032604217529296875, 0.0401763916015625, 0.047748565673828125, 0.05532073974609375, 0.06289291381835938, 0.070465087890625, 0.07803726196289062, 0.08560943603515625, 0.09318161010742188, 0.1007537841796875, 0.10832595825195312, 0.11589813232421875, 0.12347030639648438, 0.13104248046875, 0.13861465454101562, 0.14618682861328125, 0.15375900268554688, 0.1613311767578125, 0.16890335083007812, 0.17647552490234375, 0.18404769897460938, 0.191619873046875, 0.19919204711914062, 0.20676422119140625, 0.21433639526367188, 0.2219085693359375, 0.22948074340820312, 0.23705291748046875, 0.24462509155273438, 0.252197265625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 7.0, 14.0, 32.0, 76.0, 325.0, 383.0, 87.0, 42.0, 23.0, 9.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.62642478942871, -23.036149978637695, -22.44587516784668, -21.855600357055664, -21.26532745361328, -20.675052642822266, -20.08477783203125, -19.494503021240234, -18.90422821044922, -18.313953399658203, -17.723678588867188, -17.133403778076172, -16.543128967285156, -15.952855110168457, -15.362581253051758, -14.772306442260742, -14.182031631469727, -13.591756820678711, -13.001482009887695, -12.411208152770996, -11.82093334197998, -11.230658531188965, -10.640384674072266, -10.05010986328125, -9.459835052490234, -8.869560241699219, -8.279285430908203, -7.689011573791504, -7.098736763000488, -6.508461952209473, -5.918187618255615, -5.327913284301758, -4.737639427185059, -4.147364616394043, -3.5570902824401855, -2.966815710067749, -2.3765411376953125, -1.786266565322876, -1.1959919929504395, -0.605717658996582, -0.015442848205566406, 0.5748317241668701, 1.1651062965393066, 1.7553808689117432, 2.3456554412841797, 2.935930013656616, 3.5262045860290527, 4.11647891998291, 4.706753730773926, 5.297028541564941, 5.887302875518799, 6.477577209472656, 7.067852020263672, 7.6581268310546875, 8.248401641845703, 8.838675498962402, 9.428950309753418, 10.019225120544434, 10.609498977661133, 11.199773788452148, 11.790048599243164, 12.38032341003418, 12.970598220825195, 13.560872077941895, 14.15114688873291]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 6.0, 4.0, 2.0, 7.0, 7.0, 7.0, 6.0, 9.0, 16.0, 14.0, 16.0, 17.0, 18.0, 16.0, 19.0, 27.0, 29.0, 37.0, 127.0, 213.0, 170.0, 46.0, 25.0, 27.0, 15.0, 22.0, 21.0, 11.0, 12.0, 15.0, 8.0, 9.0, 5.0, 11.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.838184356689453, -8.559163093566895, -8.280141830444336, -8.001120567321777, -7.722099781036377, -7.443078517913818, -7.164057731628418, -6.885036468505859, -6.606015205383301, -6.326993942260742, -6.047972679138184, -5.768951892852783, -5.489930629730225, -5.210909366607666, -4.931888580322266, -4.652867317199707, -4.373846054077148, -4.09482479095459, -3.8158037662506104, -3.536782741546631, -3.2577614784240723, -2.9787402153015137, -2.699719190597534, -2.4206981658935547, -2.141676902770996, -1.862655758857727, -1.583634614944458, -1.304613471031189, -1.02559232711792, -0.7465711832046509, -0.46755003929138184, -0.1885288953781128, 0.09049224853515625, 0.3695133924484253, 0.6485345363616943, 0.9275556802749634, 1.2065768241882324, 1.4855979681015015, 1.7646191120147705, 2.04364013671875, 2.3226613998413086, 2.601682662963867, 2.8807036876678467, 3.159724712371826, 3.4387459754943848, 3.7177672386169434, 3.996788263320923, 4.275809288024902, 4.554830551147461, 4.8338518142700195, 5.112873077392578, 5.3918938636779785, 5.670915126800537, 5.949936389923096, 6.228957176208496, 6.507978439331055, 6.786999702453613, 7.066020965576172, 7.3450422286987305, 7.624063014984131, 7.9030842781066895, 8.18210506439209, 8.461126327514648, 8.740147590637207, 9.019168853759766]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 1.0, 6.0, 4.0, 6.0, 13.0, 7.0, 12.0, 10.0, 17.0, 20.0, 23.0, 19.0, 35.0, 15.0, 41.0, 55.0, 162.0, 222.0, 80.0, 32.0, 25.0, 26.0, 32.0, 19.0, 14.0, 23.0, 16.0, 15.0, 6.0, 11.0, 4.0, 5.0, 6.0, 7.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6826171875, -0.6606674194335938, -0.6387176513671875, -0.6167678833007812, -0.594818115234375, -0.5728683471679688, -0.5509185791015625, -0.5289688110351562, -0.50701904296875, -0.48506927490234375, -0.4631195068359375, -0.44116973876953125, -0.419219970703125, -0.39727020263671875, -0.3753204345703125, -0.35337066650390625, -0.3314208984375, -0.30947113037109375, -0.2875213623046875, -0.26557159423828125, -0.243621826171875, -0.22167205810546875, -0.1997222900390625, -0.17777252197265625, -0.15582275390625, -0.13387298583984375, -0.1119232177734375, -0.08997344970703125, -0.068023681640625, -0.04607391357421875, -0.0241241455078125, -0.00217437744140625, 0.019775390625, 0.04172515869140625, 0.0636749267578125, 0.08562469482421875, 0.107574462890625, 0.12952423095703125, 0.1514739990234375, 0.17342376708984375, 0.19537353515625, 0.21732330322265625, 0.2392730712890625, 0.26122283935546875, 0.283172607421875, 0.30512237548828125, 0.3270721435546875, 0.34902191162109375, 0.3709716796875, 0.39292144775390625, 0.4148712158203125, 0.43682098388671875, 0.458770751953125, 0.48072052001953125, 0.5026702880859375, 0.5246200561523438, 0.54656982421875, 0.5685195922851562, 0.5904693603515625, 0.6124191284179688, 0.634368896484375, 0.6563186645507812, 0.6782684326171875, 0.7002182006835938, 0.72216796875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 8.0, 1.0, 3.0, 1.0, 1.0, 7.0, 8.0, 12.0, 8.0, 12.0, 18.0, 17.0, 18.0, 57.0, 68.0, 103.0, 192.0, 373.0, 799.0, 2397.0, 9712.0, 8288435.0, 77246.0, 6049.0, 1673.0, 612.0, 303.0, 151.0, 97.0, 61.0, 35.0, 33.0, 17.0, 13.0, 8.0, 8.0, 6.0, 5.0, 14.0, 8.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0], "bins": [-6.545567989349365, -6.340040683746338, -6.134513854980469, -5.928986549377441, -5.723459243774414, -5.517932415008545, -5.312405109405518, -5.106878280639648, -4.901350975036621, -4.695823669433594, -4.490296840667725, -4.284769535064697, -4.079242706298828, -3.873715400695801, -3.6681880950927734, -3.462661027908325, -3.257133960723877, -3.0516068935394287, -2.8460798263549805, -2.640552520751953, -2.435025453567505, -2.2294983863830566, -2.0239710807800293, -1.818444013595581, -1.6129169464111328, -1.4073898792266846, -1.2018626928329468, -0.9963355660438538, -0.7908084392547607, -0.5852813720703125, -0.3797541856765747, -0.17422699928283691, 0.03130054473876953, 0.23682767152786255, 0.44235479831695557, 0.6478819251060486, 0.8534090518951416, 1.0589361190795898, 1.2644633054733276, 1.4699904918670654, 1.6755175590515137, 1.881044626235962, 2.08657169342041, 2.2920989990234375, 2.4976260662078857, 2.703153133392334, 2.9086804389953613, 3.1142075061798096, 3.319734573364258, 3.525261640548706, 3.7307887077331543, 3.9363160133361816, 4.141842842102051, 4.347370147705078, 4.5528974533081055, 4.758424758911133, 4.963951587677002, 5.169478893280029, 5.375005722045898, 5.580533027648926, 5.786060333251953, 5.991587162017822, 6.19711446762085, 6.402641296386719, 6.608168601989746]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 2.0, 1.0, 0.0, 4.0, 3.0, 1.0, 4.0, 4.0, 1.0, 7.0, 3.0, 2.0, 5.0, 2.0, 4.0, 7.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 6.0, 3.0, 5.0, 5.0, 3.0, 3.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.11011028289795, -7.809652328491211, -7.509194374084473, -7.208736419677734, -6.908278465270996, -6.607820510864258, -6.307363033294678, -6.0069050788879395, -5.706447124481201, -5.405989170074463, -5.105531215667725, -4.805073261260986, -4.504615783691406, -4.204157829284668, -3.9036998748779297, -3.6032419204711914, -3.302783966064453, -3.002326011657715, -2.7018680572509766, -2.4014103412628174, -2.100952386856079, -1.8004944324493408, -1.500036597251892, -1.1995787620544434, -0.8991208076477051, -0.5986629128456116, -0.29820501804351807, 0.0022528767585754395, 0.30271077156066895, 0.6031687259674072, 0.903626561164856, 1.2040843963623047, 1.5045413970947266, 1.8049993515014648, 2.105457305908203, 2.4059150218963623, 2.7063729763031006, 3.006830930709839, 3.307288646697998, 3.6077466011047363, 3.9082045555114746, 4.208662509918213, 4.509120464324951, 4.8095784187316895, 5.1100358963012695, 5.410493850708008, 5.710951805114746, 6.011409759521484, 6.311867713928223, 6.612325668334961, 6.912783622741699, 7.2132415771484375, 7.513699531555176, 7.814157485961914, 8.114615440368652, 8.41507339477539, 8.715530395507812, 9.01598834991455, 9.316446304321289, 9.616904258728027, 9.917362213134766, 10.217820167541504, 10.518278121948242, 10.818735122680664, 11.119194030761719]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 7.0, 11.0, 15.0, 16.0, 17.0, 26.0, 40.0, 57.0, 61.0, 88.0, 149.0, 226.0, 315.0, 564.0, 1189.0, 2517.0, 5919.0, 14978.0, 38231.0, 100967.0, 183434.0, 107136.0, 40611.0, 15714.0, 6474.0, 2715.0, 1197.0, 609.0, 340.0, 217.0, 132.0, 80.0, 53.0, 51.0, 30.0, 27.0, 13.0, 5.0, 10.0, 7.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.5390625, -5.378662109375, -5.21826171875, -5.057861328125, -4.8974609375, -4.737060546875, -4.57666015625, -4.416259765625, -4.255859375, -4.095458984375, -3.93505859375, -3.774658203125, -3.6142578125, -3.453857421875, -3.29345703125, -3.133056640625, -2.97265625, -2.812255859375, -2.65185546875, -2.491455078125, -2.3310546875, -2.170654296875, -2.01025390625, -1.849853515625, -1.689453125, -1.529052734375, -1.36865234375, -1.208251953125, -1.0478515625, -0.887451171875, -0.72705078125, -0.566650390625, -0.40625, -0.245849609375, -0.08544921875, 0.074951171875, 0.2353515625, 0.395751953125, 0.55615234375, 0.716552734375, 0.876953125, 1.037353515625, 1.19775390625, 1.358154296875, 1.5185546875, 1.678955078125, 1.83935546875, 1.999755859375, 2.16015625, 2.320556640625, 2.48095703125, 2.641357421875, 2.8017578125, 2.962158203125, 3.12255859375, 3.282958984375, 3.443359375, 3.603759765625, 3.76416015625, 3.924560546875, 4.0849609375, 4.245361328125, 4.40576171875, 4.566162109375, 4.7265625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 10.0, 10.0, 5.0, 10.0, 16.0, 17.0, 15.0, 26.0, 30.0, 39.0, 46.0, 41.0, 63.0, 75.0, 66.0, 76.0, 70.0, 77.0, 52.0, 44.0, 41.0, 32.0, 23.0, 23.0, 18.0, 21.0, 17.0, 10.0, 5.0, 9.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.96533203125, -0.9388046264648438, -0.9122772216796875, -0.8857498168945312, -0.859222412109375, -0.8326950073242188, -0.8061676025390625, -0.7796401977539062, -0.75311279296875, -0.7265853881835938, -0.7000579833984375, -0.6735305786132812, -0.647003173828125, -0.6204757690429688, -0.5939483642578125, -0.5674209594726562, -0.5408935546875, -0.5143661499023438, -0.4878387451171875, -0.46131134033203125, -0.434783935546875, -0.40825653076171875, -0.3817291259765625, -0.35520172119140625, -0.32867431640625, -0.30214691162109375, -0.2756195068359375, -0.24909210205078125, -0.222564697265625, -0.19603729248046875, -0.1695098876953125, -0.14298248291015625, -0.116455078125, -0.08992767333984375, -0.0634002685546875, -0.03687286376953125, -0.010345458984375, 0.01618194580078125, 0.0427093505859375, 0.06923675537109375, 0.09576416015625, 0.12229156494140625, 0.1488189697265625, 0.17534637451171875, 0.201873779296875, 0.22840118408203125, 0.2549285888671875, 0.28145599365234375, 0.3079833984375, 0.33451080322265625, 0.3610382080078125, 0.38756561279296875, 0.414093017578125, 0.44062042236328125, 0.4671478271484375, 0.49367523193359375, 0.52020263671875, 0.5467300415039062, 0.5732574462890625, 0.5997848510742188, 0.626312255859375, 0.6528396606445312, 0.6793670654296875, 0.7058944702148438, 0.732421875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 10.0, 5.0, 6.0, 9.0, 9.0, 26.0, 40.0, 65.0, 83.0, 101.0, 66.0, 33.0, 14.0, 11.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2566556930542, -8.99672794342041, -8.736799240112305, -8.476871490478516, -8.216943740844727, -7.957015514373779, -7.697087287902832, -7.437159538269043, -7.177231311798096, -6.917303085327148, -6.657375335693359, -6.397447109222412, -6.137518882751465, -5.877591133117676, -5.6176629066467285, -5.357734680175781, -5.097806930541992, -4.837878704071045, -4.577950954437256, -4.318022727966309, -4.0580949783325195, -3.7981667518615723, -3.538238525390625, -3.278310537338257, -3.0183825492858887, -2.7584545612335205, -2.4985265731811523, -2.238598346710205, -1.978670358657837, -1.7187423706054688, -1.458814263343811, -1.1988861560821533, -0.9389572143554688, -0.6790291666984558, -0.41910111904144287, -0.15917307138442993, 0.10075497627258301, 0.36068296432495117, 0.6206110715866089, 0.8805391788482666, 1.1404671669006348, 1.400395154953003, 1.6603232622146606, 1.9202513694763184, 2.1801793575286865, 2.4401073455810547, 2.700035572052002, 2.95996356010437, 3.2198915481567383, 3.4798195362091064, 3.7397475242614746, 3.999675750732422, 4.259603500366211, 4.519531726837158, 4.7794599533081055, 5.0393877029418945, 5.299315929412842, 5.559244155883789, 5.819171905517578, 6.079100131988525, 6.339028358459473, 6.598956108093262, 6.858884334564209, 7.118812561035156, 7.378740310668945]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 2.0, 6.0, 10.0, 24.0, 34.0, 92.0, 118.0, 85.0, 35.0, 4.0, 9.0, 7.0, 11.0, 5.0, 3.0, 3.0, 4.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.105400562286377, -4.955692768096924, -4.805984973907471, -4.656276702880859, -4.506568908691406, -4.356861114501953, -4.2071533203125, -4.057445526123047, -3.9077374935150146, -3.7580296993255615, -3.6083216667175293, -3.458613872528076, -3.308906078338623, -3.159198045730591, -3.0094902515411377, -2.8597822189331055, -2.7100744247436523, -2.560366630554199, -2.410658597946167, -2.260950803756714, -2.1112427711486816, -1.9615349769592285, -1.8118271827697754, -1.6621192693710327, -1.51241135597229, -1.3627034425735474, -1.2129955291748047, -1.0632877349853516, -0.9135798215866089, -0.7638719081878662, -0.6141640543937683, -0.4644562005996704, -0.31474876403808594, -0.16504088044166565, -0.015332996845245361, 0.13437488675117493, 0.2840827703475952, 0.4337906837463379, 0.5834985375404358, 0.7332063913345337, 0.8829143047332764, 1.032622218132019, 1.1823301315307617, 1.3320379257202148, 1.4817458391189575, 1.6314537525177002, 1.7811615467071533, 1.930869460105896, 2.0805773735046387, 2.230285167694092, 2.379993200302124, 2.529700994491577, 2.6794090270996094, 2.8291168212890625, 2.9788246154785156, 3.1285324096679688, 3.278240442276001, 3.427948236465454, 3.5776562690734863, 3.7273640632629395, 3.8770718574523926, 4.026780128479004, 4.176487922668457, 4.32619571685791, 4.475903511047363]}, "eval/loss": 5.307173728942871, "eval/wer": 0.9908171360571202, "eval/runtime": 583.899, "eval/samples_per_second": 4.525, "eval/steps_per_second": 0.567} \ No newline at end of file