diff --git "a/wandb/run-20220306_154547-4pqitlp3/files/wandb-summary.json" "b/wandb/run-20220306_154547-4pqitlp3/files/wandb-summary.json" --- "a/wandb/run-20220306_154547-4pqitlp3/files/wandb-summary.json" +++ "b/wandb/run-20220306_154547-4pqitlp3/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.0935, "train/learning_rate": 6.142517814726841e-05, "train/epoch": 8.41, "train/global_step": 7500, "_runtime": 46008, "_timestamp": 1646627555, "_step": 7502, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 8.0, 5.0, 9.0, 20.0, 22.0, 31.0, 54.0, 82.0, 110.0, 107.0, 143.0, 103.0, 89.0, 64.0, 42.0, 31.0, 22.0, 27.0, 8.0, 8.0, 5.0, 3.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.982908248901367, -18.49204444885254, -18.001178741455078, -17.51031494140625, -17.019451141357422, -16.528587341308594, -16.037721633911133, -15.546857833862305, -15.05599308013916, -14.565128326416016, -14.074264526367188, -13.583399772644043, -13.092535972595215, -12.60167121887207, -12.110807418823242, -11.619942665100098, -11.129077911376953, -10.638213157653809, -10.14734935760498, -9.656484603881836, -9.165620803833008, -8.674756050109863, -8.183891296386719, -7.693027496337891, -7.2021636962890625, -6.711299419403076, -6.22043514251709, -5.729570388793945, -5.238706111907959, -4.747841835021973, -4.256977558135986, -3.766113042831421, -3.2752485275268555, -2.784384250640869, -2.2935197353363037, -1.8026554584503174, -1.3117910623550415, -0.8209266662597656, -0.3300623893737793, 0.16080212593078613, 0.6516664028167725, 1.1425307989120483, 1.6333951950073242, 2.1242594718933105, 2.615123748779297, 3.1059882640838623, 3.5968525409698486, 4.087717056274414, 4.5785813331604, 5.069445610046387, 5.560309886932373, 6.051174163818359, 6.542038917541504, 7.03290319442749, 7.523767471313477, 8.014632225036621, 8.50549602508545, 8.996360778808594, 9.487224578857422, 9.978089332580566, 10.468953132629395, 10.959817886352539, 11.450681686401367, 11.941546440124512, 12.432411193847656]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 11.0, 7.0, 8.0, 11.0, 14.0, 17.0, 14.0, 22.0, 19.0, 22.0, 38.0, 37.0, 37.0, 34.0, 39.0, 43.0, 51.0, 51.0, 54.0, 50.0, 45.0, 43.0, 41.0, 34.0, 44.0, 23.0, 30.0, 22.0, 18.0, 22.0, 14.0, 17.0, 11.0, 14.0, 9.0, 12.0, 7.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.343513488769531, -10.959884643554688, -10.576254844665527, -10.192625999450684, -9.808996200561523, -9.42536735534668, -9.04173755645752, -8.658108711242676, -8.274478912353516, -7.890849590301514, -7.507220268249512, -7.12359094619751, -6.739961624145508, -6.356332302093506, -5.972702980041504, -5.58907413482666, -5.205444812774658, -4.821815490722656, -4.438186168670654, -4.054556846618652, -3.6709275245666504, -3.2872982025146484, -2.9036691188812256, -2.5200397968292236, -2.1364104747772217, -1.7527811527252197, -1.3691518306732178, -0.9855226278305054, -0.6018933057785034, -0.21826398372650146, 0.16536521911621094, 0.5489945411682129, 0.9326238632202148, 1.3162531852722168, 1.6998825073242188, 2.0835118293762207, 2.4671411514282227, 2.8507704734802246, 3.2343995571136475, 3.6180288791656494, 4.0016584396362305, 4.385287761688232, 4.768917083740234, 5.152546405792236, 5.536175727844238, 5.91980504989624, 6.303434371948242, 6.687063217163086, 7.070692539215088, 7.45432186126709, 7.837951183319092, 8.221580505371094, 8.605209350585938, 8.988839149475098, 9.372467994689941, 9.756097793579102, 10.139726638793945, 10.523355484008789, 10.90698528289795, 11.290614128112793, 11.674243927001953, 12.057872772216797, 12.441502571105957, 12.8251314163208, 13.208761215209961]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 4.0, 6.0, 10.0, 4.0, 9.0, 14.0, 16.0, 21.0, 20.0, 28.0, 35.0, 28.0, 43.0, 41.0, 58.0, 42.0, 49.0, 59.0, 59.0, 54.0, 61.0, 49.0, 44.0, 37.0, 39.0, 30.0, 28.0, 21.0, 20.0, 16.0, 19.0, 9.0, 9.0, 8.0, 7.0, 8.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.85498046875, -0.8306808471679688, -0.8063812255859375, -0.7820816040039062, -0.757781982421875, -0.7334823608398438, -0.7091827392578125, -0.6848831176757812, -0.66058349609375, -0.6362838745117188, -0.6119842529296875, -0.5876846313476562, -0.563385009765625, -0.5390853881835938, -0.5147857666015625, -0.49048614501953125, -0.4661865234375, -0.44188690185546875, -0.4175872802734375, -0.39328765869140625, -0.368988037109375, -0.34468841552734375, -0.3203887939453125, -0.29608917236328125, -0.27178955078125, -0.24748992919921875, -0.2231903076171875, -0.19889068603515625, -0.174591064453125, -0.15029144287109375, -0.1259918212890625, -0.10169219970703125, -0.077392578125, -0.05309295654296875, -0.0287933349609375, -0.00449371337890625, 0.019805908203125, 0.04410552978515625, 0.0684051513671875, 0.09270477294921875, 0.11700439453125, 0.14130401611328125, 0.1656036376953125, 0.18990325927734375, 0.214202880859375, 0.23850250244140625, 0.2628021240234375, 0.28710174560546875, 0.3114013671875, 0.33570098876953125, 0.3600006103515625, 0.38430023193359375, 0.408599853515625, 0.43289947509765625, 0.4571990966796875, 0.48149871826171875, 0.50579833984375, 0.5300979614257812, 0.5543975830078125, 0.5786972045898438, 0.602996826171875, 0.6272964477539062, 0.6515960693359375, 0.6758956909179688, 0.7001953125]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 11.0, 8.0, 17.0, 23.0, 37.0, 38.0, 51.0, 79.0, 92.0, 173.0, 264.0, 419.0, 816.0, 1721.0, 4840.0, 18738.0, 119136.0, 3466130.0, 518835.0, 48401.0, 9221.0, 2680.0, 1123.0, 491.0, 331.0, 183.0, 138.0, 81.0, 55.0, 41.0, 41.0, 25.0, 15.0, 8.0, 7.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.234375, -8.9609375, -8.6875, -8.4140625, -8.140625, -7.8671875, -7.59375, -7.3203125, -7.046875, -6.7734375, -6.5, -6.2265625, -5.953125, -5.6796875, -5.40625, -5.1328125, -4.859375, -4.5859375, -4.3125, -4.0390625, -3.765625, -3.4921875, -3.21875, -2.9453125, -2.671875, -2.3984375, -2.125, -1.8515625, -1.578125, -1.3046875, -1.03125, -0.7578125, -0.484375, -0.2109375, 0.0625, 0.3359375, 0.609375, 0.8828125, 1.15625, 1.4296875, 1.703125, 1.9765625, 2.25, 2.5234375, 2.796875, 3.0703125, 3.34375, 3.6171875, 3.890625, 4.1640625, 4.4375, 4.7109375, 4.984375, 5.2578125, 5.53125, 5.8046875, 6.078125, 6.3515625, 6.625, 6.8984375, 7.171875, 7.4453125, 7.71875, 7.9921875, 8.265625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 15.0, 25.0, 35.0, 78.0, 94.0, 172.0, 282.0, 495.0, 988.0, 859.0, 391.0, 222.0, 151.0, 111.0, 64.0, 26.0, 20.0, 17.0, 17.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.859375, -5.71588134765625, -5.5723876953125, -5.42889404296875, -5.285400390625, -5.14190673828125, -4.9984130859375, -4.85491943359375, -4.71142578125, -4.56793212890625, -4.4244384765625, -4.28094482421875, -4.137451171875, -3.99395751953125, -3.8504638671875, -3.70697021484375, -3.5634765625, -3.41998291015625, -3.2764892578125, -3.13299560546875, -2.989501953125, -2.84600830078125, -2.7025146484375, -2.55902099609375, -2.41552734375, -2.27203369140625, -2.1285400390625, -1.98504638671875, -1.841552734375, -1.69805908203125, -1.5545654296875, -1.41107177734375, -1.267578125, -1.12408447265625, -0.9805908203125, -0.83709716796875, -0.693603515625, -0.55010986328125, -0.4066162109375, -0.26312255859375, -0.11962890625, 0.02386474609375, 0.1673583984375, 0.31085205078125, 0.454345703125, 0.59783935546875, 0.7413330078125, 0.88482666015625, 1.0283203125, 1.17181396484375, 1.3153076171875, 1.45880126953125, 1.602294921875, 1.74578857421875, 1.8892822265625, 2.03277587890625, 2.17626953125, 2.31976318359375, 2.4632568359375, 2.60675048828125, 2.750244140625, 2.89373779296875, 3.0372314453125, 3.18072509765625, 3.32421875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 2.0, 4.0, 3.0, 9.0, 10.0, 18.0, 17.0, 26.0, 27.0, 41.0, 80.0, 102.0, 206.0, 289.0, 562.0, 1416.0, 4947.0, 24561.0, 194983.0, 3271402.0, 624874.0, 57395.0, 9226.0, 2269.0, 808.0, 368.0, 227.0, 138.0, 85.0, 70.0, 35.0, 31.0, 11.0, 9.0, 8.0, 6.0, 6.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-14.109375, -13.72509765625, -13.3408203125, -12.95654296875, -12.572265625, -12.18798828125, -11.8037109375, -11.41943359375, -11.03515625, -10.65087890625, -10.2666015625, -9.88232421875, -9.498046875, -9.11376953125, -8.7294921875, -8.34521484375, -7.9609375, -7.57666015625, -7.1923828125, -6.80810546875, -6.423828125, -6.03955078125, -5.6552734375, -5.27099609375, -4.88671875, -4.50244140625, -4.1181640625, -3.73388671875, -3.349609375, -2.96533203125, -2.5810546875, -2.19677734375, -1.8125, -1.42822265625, -1.0439453125, -0.65966796875, -0.275390625, 0.10888671875, 0.4931640625, 0.87744140625, 1.26171875, 1.64599609375, 2.0302734375, 2.41455078125, 2.798828125, 3.18310546875, 3.5673828125, 3.95166015625, 4.3359375, 4.72021484375, 5.1044921875, 5.48876953125, 5.873046875, 6.25732421875, 6.6416015625, 7.02587890625, 7.41015625, 7.79443359375, 8.1787109375, 8.56298828125, 8.947265625, 9.33154296875, 9.7158203125, 10.10009765625, 10.484375]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 11.0, 22.0, 44.0, 119.0, 154.0, 241.0, 188.0, 124.0, 54.0, 24.0, 14.0, 7.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-53.097686767578125, -52.06794738769531, -51.038204193115234, -50.00846481323242, -48.978721618652344, -47.94898223876953, -46.91924285888672, -45.88949966430664, -44.85976028442383, -43.830020904541016, -42.80027770996094, -41.770538330078125, -40.74079513549805, -39.711055755615234, -38.681312561035156, -37.651573181152344, -36.62183380126953, -35.59209442138672, -34.56235122680664, -33.53261184692383, -32.50286865234375, -31.473129272460938, -30.443387985229492, -29.413646697998047, -28.38390350341797, -27.354162216186523, -26.324420928955078, -25.294681549072266, -24.26494026184082, -23.235198974609375, -22.20545768737793, -21.175716400146484, -20.145978927612305, -19.11623764038086, -18.086496353149414, -17.05675506591797, -16.027015686035156, -14.997274398803711, -13.967533111572266, -12.93779182434082, -11.908051490783691, -10.878310203552246, -9.848569869995117, -8.818828582763672, -7.789087772369385, -6.759346961975098, -5.729605674743652, -4.699864864349365, -3.670124053955078, -2.640383243560791, -1.6106421947479248, -0.5809011459350586, 0.4488396644592285, 1.4785804748535156, 2.508321762084961, 3.538062572479248, 4.567803382873535, 5.597544193267822, 6.627285003662109, 7.657026290893555, 8.686767578125, 9.716507911682129, 10.746249198913574, 11.775989532470703, 12.805730819702148]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 4.0, 5.0, 11.0, 10.0, 11.0, 21.0, 12.0, 16.0, 24.0, 25.0, 20.0, 26.0, 38.0, 46.0, 43.0, 42.0, 48.0, 40.0, 39.0, 39.0, 48.0, 39.0, 45.0, 31.0, 31.0, 35.0, 35.0, 27.0, 33.0, 19.0, 18.0, 26.0, 20.0, 13.0, 17.0, 12.0, 11.0, 3.0, 7.0, 2.0, 3.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.355179786682129, -11.022886276245117, -10.690592765808105, -10.358299255371094, -10.026005744934082, -9.69371223449707, -9.361417770385742, -9.02912425994873, -8.696830749511719, -8.364537239074707, -8.032243728637695, -7.699950218200684, -7.367656230926514, -7.035362720489502, -6.70306921005249, -6.37077522277832, -6.038482189178467, -5.706188678741455, -5.373895168304443, -5.041601181030273, -4.709307670593262, -4.37701416015625, -4.044720649719238, -3.7124269008636475, -3.3801333904266357, -3.047839879989624, -2.715546131134033, -2.3832526206970215, -2.0509591102600098, -1.718665361404419, -1.3863718509674072, -1.0540781021118164, -0.7217845916748047, -0.3894909918308258, -0.057197391986846924, 0.27509617805480957, 0.6073898077011108, 0.9396834373474121, 1.2719769477844238, 1.6042706966400146, 1.9365642070770264, 2.268857717514038, 2.601151466369629, 2.9334449768066406, 3.2657384872436523, 3.598032236099243, 3.930325746536255, 4.262619495391846, 4.594913005828857, 4.927206516265869, 5.259500026702881, 5.591794013977051, 5.9240875244140625, 6.256381034851074, 6.588674545288086, 6.920968055725098, 7.253261566162109, 7.585555076599121, 7.917848587036133, 8.250142097473145, 8.582435607910156, 8.914730072021484, 9.24702262878418, 9.579317092895508, 9.91161060333252]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 6.0, 3.0, 2.0, 5.0, 4.0, 9.0, 9.0, 12.0, 15.0, 10.0, 25.0, 22.0, 19.0, 25.0, 24.0, 28.0, 44.0, 44.0, 46.0, 29.0, 47.0, 43.0, 48.0, 40.0, 61.0, 45.0, 33.0, 27.0, 28.0, 36.0, 33.0, 36.0, 20.0, 22.0, 18.0, 20.0, 15.0, 11.0, 10.0, 7.0, 3.0, 8.0, 5.0, 2.0, 3.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7158203125, -0.6931991577148438, -0.6705780029296875, -0.6479568481445312, -0.625335693359375, -0.6027145385742188, -0.5800933837890625, -0.5574722290039062, -0.53485107421875, -0.5122299194335938, -0.4896087646484375, -0.46698760986328125, -0.444366455078125, -0.42174530029296875, -0.3991241455078125, -0.37650299072265625, -0.3538818359375, -0.33126068115234375, -0.3086395263671875, -0.28601837158203125, -0.263397216796875, -0.24077606201171875, -0.2181549072265625, -0.19553375244140625, -0.17291259765625, -0.15029144287109375, -0.1276702880859375, -0.10504913330078125, -0.082427978515625, -0.05980682373046875, -0.0371856689453125, -0.01456451416015625, 0.008056640625, 0.03067779541015625, 0.0532989501953125, 0.07592010498046875, 0.098541259765625, 0.12116241455078125, 0.1437835693359375, 0.16640472412109375, 0.18902587890625, 0.21164703369140625, 0.2342681884765625, 0.25688934326171875, 0.279510498046875, 0.30213165283203125, 0.3247528076171875, 0.34737396240234375, 0.3699951171875, 0.39261627197265625, 0.4152374267578125, 0.43785858154296875, 0.460479736328125, 0.48310089111328125, 0.5057220458984375, 0.5283432006835938, 0.55096435546875, 0.5735855102539062, 0.5962066650390625, 0.6188278198242188, 0.641448974609375, 0.6640701293945312, 0.6866912841796875, 0.7093124389648438, 0.73193359375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 10.0, 13.0, 16.0, 30.0, 25.0, 64.0, 78.0, 94.0, 145.0, 237.0, 297.0, 404.0, 592.0, 885.0, 1256.0, 1873.0, 2880.0, 4409.0, 6927.0, 10867.0, 18171.0, 31814.0, 60605.0, 134617.0, 342664.0, 230219.0, 90877.0, 44350.0, 24372.0, 14462.0, 8692.0, 5603.0, 3581.0, 2342.0, 1569.0, 1042.0, 769.0, 473.0, 369.0, 234.0, 180.0, 123.0, 85.0, 65.0, 49.0, 41.0, 26.0, 17.0, 17.0, 10.0, 7.0, 5.0, 1.0, 5.0, 0.0, 1.0], "bins": [-1.373046875, -1.331146240234375, -1.28924560546875, -1.247344970703125, -1.2054443359375, -1.163543701171875, -1.12164306640625, -1.079742431640625, -1.037841796875, -0.995941162109375, -0.95404052734375, -0.912139892578125, -0.8702392578125, -0.828338623046875, -0.78643798828125, -0.744537353515625, -0.70263671875, -0.660736083984375, -0.61883544921875, -0.576934814453125, -0.5350341796875, -0.493133544921875, -0.45123291015625, -0.409332275390625, -0.367431640625, -0.325531005859375, -0.28363037109375, -0.241729736328125, -0.1998291015625, -0.157928466796875, -0.11602783203125, -0.074127197265625, -0.0322265625, 0.009674072265625, 0.05157470703125, 0.093475341796875, 0.1353759765625, 0.177276611328125, 0.21917724609375, 0.261077880859375, 0.302978515625, 0.344879150390625, 0.38677978515625, 0.428680419921875, 0.4705810546875, 0.512481689453125, 0.55438232421875, 0.596282958984375, 0.63818359375, 0.680084228515625, 0.72198486328125, 0.763885498046875, 0.8057861328125, 0.847686767578125, 0.88958740234375, 0.931488037109375, 0.973388671875, 1.015289306640625, 1.05718994140625, 1.099090576171875, 1.1409912109375, 1.182891845703125, 1.22479248046875, 1.266693115234375, 1.30859375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 4.0, 6.0, 7.0, 7.0, 8.0, 7.0, 15.0, 26.0, 16.0, 14.0, 27.0, 21.0, 37.0, 40.0, 39.0, 41.0, 32.0, 37.0, 38.0, 42.0, 1074.0, 49.0, 44.0, 41.0, 50.0, 42.0, 39.0, 34.0, 28.0, 34.0, 18.0, 10.0, 30.0, 15.0, 10.0, 7.0, 10.0, 10.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57958984375, -0.5603713989257812, -0.5411529541015625, -0.5219345092773438, -0.502716064453125, -0.48349761962890625, -0.4642791748046875, -0.44506072998046875, -0.42584228515625, -0.40662384033203125, -0.3874053955078125, -0.36818695068359375, -0.348968505859375, -0.32975006103515625, -0.3105316162109375, -0.29131317138671875, -0.2720947265625, -0.25287628173828125, -0.2336578369140625, -0.21443939208984375, -0.195220947265625, -0.17600250244140625, -0.1567840576171875, -0.13756561279296875, -0.11834716796875, -0.09912872314453125, -0.0799102783203125, -0.06069183349609375, -0.041473388671875, -0.02225494384765625, -0.0030364990234375, 0.01618194580078125, 0.035400390625, 0.05461883544921875, 0.0738372802734375, 0.09305572509765625, 0.112274169921875, 0.13149261474609375, 0.1507110595703125, 0.16992950439453125, 0.18914794921875, 0.20836639404296875, 0.2275848388671875, 0.24680328369140625, 0.266021728515625, 0.28524017333984375, 0.3044586181640625, 0.32367706298828125, 0.3428955078125, 0.36211395263671875, 0.3813323974609375, 0.40055084228515625, 0.419769287109375, 0.43898773193359375, 0.4582061767578125, 0.47742462158203125, 0.49664306640625, 0.5158615112304688, 0.5350799560546875, 0.5542984008789062, 0.573516845703125, 0.5927352905273438, 0.6119537353515625, 0.6311721801757812, 0.650390625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 6.0, 14.0, 8.0, 20.0, 16.0, 28.0, 43.0, 61.0, 103.0, 173.0, 260.0, 456.0, 789.0, 1134.0, 2051.0, 3456.0, 6036.0, 11192.0, 22569.0, 54706.0, 199147.0, 1493146.0, 198492.0, 54719.0, 23133.0, 11281.0, 5849.0, 3412.0, 1876.0, 1066.0, 651.0, 419.0, 245.0, 207.0, 116.0, 75.0, 61.0, 28.0, 18.0, 25.0, 28.0, 10.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.177734375, -1.1414947509765625, -1.105255126953125, -1.0690155029296875, -1.03277587890625, -0.9965362548828125, -0.960296630859375, -0.9240570068359375, -0.8878173828125, -0.8515777587890625, -0.815338134765625, -0.7790985107421875, -0.74285888671875, -0.7066192626953125, -0.670379638671875, -0.6341400146484375, -0.597900390625, -0.5616607666015625, -0.525421142578125, -0.4891815185546875, -0.45294189453125, -0.4167022705078125, -0.380462646484375, -0.3442230224609375, -0.3079833984375, -0.2717437744140625, -0.235504150390625, -0.1992645263671875, -0.16302490234375, -0.1267852783203125, -0.090545654296875, -0.0543060302734375, -0.01806640625, 0.0181732177734375, 0.054412841796875, 0.0906524658203125, 0.12689208984375, 0.1631317138671875, 0.199371337890625, 0.2356109619140625, 0.2718505859375, 0.3080902099609375, 0.344329833984375, 0.3805694580078125, 0.41680908203125, 0.4530487060546875, 0.489288330078125, 0.5255279541015625, 0.561767578125, 0.5980072021484375, 0.634246826171875, 0.6704864501953125, 0.70672607421875, 0.7429656982421875, 0.779205322265625, 0.8154449462890625, 0.8516845703125, 0.8879241943359375, 0.924163818359375, 0.9604034423828125, 0.99664306640625, 1.0328826904296875, 1.069122314453125, 1.1053619384765625, 1.1416015625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 5.0, 5.0, 8.0, 12.0, 20.0, 25.0, 48.0, 96.0, 390.0, 186.0, 80.0, 49.0, 23.0, 15.0, 10.0, 3.0, 6.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43017578125, -0.4141693115234375, -0.398162841796875, -0.3821563720703125, -0.36614990234375, -0.3501434326171875, -0.334136962890625, -0.3181304931640625, -0.3021240234375, -0.2861175537109375, -0.270111083984375, -0.2541046142578125, -0.23809814453125, -0.2220916748046875, -0.206085205078125, -0.1900787353515625, -0.174072265625, -0.1580657958984375, -0.142059326171875, -0.1260528564453125, -0.11004638671875, -0.0940399169921875, -0.078033447265625, -0.0620269775390625, -0.0460205078125, -0.0300140380859375, -0.014007568359375, 0.0019989013671875, 0.01800537109375, 0.0340118408203125, 0.050018310546875, 0.0660247802734375, 0.08203125, 0.0980377197265625, 0.114044189453125, 0.1300506591796875, 0.14605712890625, 0.1620635986328125, 0.178070068359375, 0.1940765380859375, 0.2100830078125, 0.2260894775390625, 0.242095947265625, 0.2581024169921875, 0.27410888671875, 0.2901153564453125, 0.306121826171875, 0.3221282958984375, 0.338134765625, 0.3541412353515625, 0.370147705078125, 0.3861541748046875, 0.40216064453125, 0.4181671142578125, 0.434173583984375, 0.4501800537109375, 0.4661865234375, 0.4821929931640625, 0.498199462890625, 0.5142059326171875, 0.53021240234375, 0.5462188720703125, 0.562225341796875, 0.5782318115234375, 0.59423828125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 1.0, 0.0, 5.0, 2.0, 5.0, 7.0, 11.0, 15.0, 29.0, 86.0, 221.0, 2293.0, 1003740.0, 40922.0, 926.0, 163.0, 48.0, 24.0, 20.0, 12.0, 7.0, 4.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-12.125, -11.812744140625, -11.50048828125, -11.188232421875, -10.8759765625, -10.563720703125, -10.25146484375, -9.939208984375, -9.626953125, -9.314697265625, -9.00244140625, -8.690185546875, -8.3779296875, -8.065673828125, -7.75341796875, -7.441162109375, -7.12890625, -6.816650390625, -6.50439453125, -6.192138671875, -5.8798828125, -5.567626953125, -5.25537109375, -4.943115234375, -4.630859375, -4.318603515625, -4.00634765625, -3.694091796875, -3.3818359375, -3.069580078125, -2.75732421875, -2.445068359375, -2.1328125, -1.820556640625, -1.50830078125, -1.196044921875, -0.8837890625, -0.571533203125, -0.25927734375, 0.052978515625, 0.365234375, 0.677490234375, 0.98974609375, 1.302001953125, 1.6142578125, 1.926513671875, 2.23876953125, 2.551025390625, 2.86328125, 3.175537109375, 3.48779296875, 3.800048828125, 4.1123046875, 4.424560546875, 4.73681640625, 5.049072265625, 5.361328125, 5.673583984375, 5.98583984375, 6.298095703125, 6.6103515625, 6.922607421875, 7.23486328125, 7.547119140625, 7.859375]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 15.0, 36.0, 108.0, 314.0, 335.0, 121.0, 52.0, 16.0, 9.0, 1.0, 2.0], "bins": [-2.719010591506958, -2.6713390350341797, -2.6236677169799805, -2.575996160507202, -2.528324604034424, -2.4806530475616455, -2.432981491088867, -2.385310173034668, -2.3376386165618896, -2.2899670600891113, -2.242295742034912, -2.194624185562134, -2.1469526290893555, -2.099281072616577, -2.051609516143799, -2.0039381980895996, -1.9562666416168213, -1.908595085144043, -1.8609236478805542, -1.8132522106170654, -1.765580654144287, -1.7179090976715088, -1.67023766040802, -1.6225662231445312, -1.574894666671753, -1.5272231101989746, -1.4795516729354858, -1.431880235671997, -1.3842086791992188, -1.3365371227264404, -1.2888656854629517, -1.241194248199463, -1.1935226917266846, -1.1458511352539062, -1.0981796979904175, -1.0505082607269287, -1.0028367042541504, -0.9551652073860168, -0.9074937105178833, -0.8598222136497498, -0.812150776386261, -0.7644792795181274, -0.7168077826499939, -0.6691362857818604, -0.6214647889137268, -0.5737932920455933, -0.5261217951774597, -0.47845029830932617, -0.4307788014411926, -0.3831073045730591, -0.33543580770492554, -0.287764310836792, -0.24009281396865845, -0.1924213171005249, -0.14474982023239136, -0.09707832336425781, -0.04940682649612427, -0.0017353296279907227, 0.04593616724014282, 0.09360766410827637, 0.1412791609764099, 0.18895065784454346, 0.236622154712677, 0.28429365158081055, 0.3319651484489441]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 9.0, 3.0, 4.0, 8.0, 5.0, 7.0, 12.0, 6.0, 14.0, 14.0, 18.0, 19.0, 25.0, 19.0, 38.0, 30.0, 34.0, 31.0, 43.0, 48.0, 49.0, 45.0, 37.0, 60.0, 42.0, 55.0, 41.0, 37.0, 31.0, 25.0, 33.0, 13.0, 23.0, 26.0, 23.0, 17.0, 11.0, 11.0, 5.0, 13.0, 5.0, 9.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.4486656188964844, -0.43576836585998535, -0.42287108302116394, -0.4099738299846649, -0.3970765471458435, -0.3841792941093445, -0.37128204107284546, -0.35838478803634644, -0.345487505197525, -0.332590252161026, -0.3196929693222046, -0.30679571628570557, -0.29389846324920654, -0.28100118041038513, -0.2681039273738861, -0.2552066445350647, -0.24230939149856567, -0.22941212356090546, -0.21651485562324524, -0.20361760258674622, -0.190720334649086, -0.17782306671142578, -0.16492581367492676, -0.15202854573726654, -0.13913127779960632, -0.1262340098619461, -0.11333674937486649, -0.10043948888778687, -0.08754222095012665, -0.07464495301246643, -0.06174769252538681, -0.04885043203830719, -0.03595316410064697, -0.023055899888277054, -0.010158635675907135, 0.002738628536462784, 0.015635892748832703, 0.02853316068649292, 0.04143042117357254, 0.05432768166065216, 0.06722494959831238, 0.0801222175359726, 0.09301947802305222, 0.10591673851013184, 0.11881400644779205, 0.13171127438545227, 0.1446085274219513, 0.1575057953596115, 0.17040306329727173, 0.18330033123493195, 0.19619759917259216, 0.2090948522090912, 0.2219921201467514, 0.23488938808441162, 0.24778664112091064, 0.26068389415740967, 0.2735811769962311, 0.2864784300327301, 0.2993757128715515, 0.31227296590805054, 0.32517021894454956, 0.33806750178337097, 0.35096475481987, 0.3638620376586914, 0.37675929069519043]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 7.0, 3.0, 2.0, 3.0, 5.0, 8.0, 11.0, 11.0, 15.0, 8.0, 23.0, 22.0, 20.0, 23.0, 27.0, 24.0, 43.0, 41.0, 43.0, 37.0, 48.0, 34.0, 51.0, 46.0, 54.0, 48.0, 36.0, 28.0, 20.0, 40.0, 30.0, 36.0, 29.0, 19.0, 19.0, 22.0, 15.0, 12.0, 9.0, 10.0, 4.0, 4.0, 6.0, 4.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71875, -0.696197509765625, -0.67364501953125, -0.651092529296875, -0.6285400390625, -0.605987548828125, -0.58343505859375, -0.560882568359375, -0.538330078125, -0.515777587890625, -0.49322509765625, -0.470672607421875, -0.4481201171875, -0.425567626953125, -0.40301513671875, -0.380462646484375, -0.35791015625, -0.335357666015625, -0.31280517578125, -0.290252685546875, -0.2677001953125, -0.245147705078125, -0.22259521484375, -0.200042724609375, -0.177490234375, -0.154937744140625, -0.13238525390625, -0.109832763671875, -0.0872802734375, -0.064727783203125, -0.04217529296875, -0.019622802734375, 0.0029296875, 0.025482177734375, 0.04803466796875, 0.070587158203125, 0.0931396484375, 0.115692138671875, 0.13824462890625, 0.160797119140625, 0.183349609375, 0.205902099609375, 0.22845458984375, 0.251007080078125, 0.2735595703125, 0.296112060546875, 0.31866455078125, 0.341217041015625, 0.36376953125, 0.386322021484375, 0.40887451171875, 0.431427001953125, 0.4539794921875, 0.476531982421875, 0.49908447265625, 0.521636962890625, 0.544189453125, 0.566741943359375, 0.58929443359375, 0.611846923828125, 0.6343994140625, 0.656951904296875, 0.67950439453125, 0.702056884765625, 0.724609375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 6.0, 9.0, 19.0, 21.0, 26.0, 44.0, 42.0, 59.0, 99.0, 153.0, 211.0, 302.0, 481.0, 765.0, 1191.0, 1916.0, 3342.0, 5706.0, 10368.0, 21095.0, 49999.0, 159516.0, 441375.0, 229323.0, 67177.0, 26214.0, 12372.0, 6787.0, 3707.0, 2239.0, 1399.0, 852.0, 555.0, 380.0, 248.0, 168.0, 101.0, 86.0, 56.0, 38.0, 35.0, 11.0, 22.0, 17.0, 6.0, 3.0, 1.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-3.134765625, -3.038726806640625, -2.94268798828125, -2.846649169921875, -2.7506103515625, -2.654571533203125, -2.55853271484375, -2.462493896484375, -2.366455078125, -2.270416259765625, -2.17437744140625, -2.078338623046875, -1.9822998046875, -1.886260986328125, -1.79022216796875, -1.694183349609375, -1.59814453125, -1.502105712890625, -1.40606689453125, -1.310028076171875, -1.2139892578125, -1.117950439453125, -1.02191162109375, -0.925872802734375, -0.829833984375, -0.733795166015625, -0.63775634765625, -0.541717529296875, -0.4456787109375, -0.349639892578125, -0.25360107421875, -0.157562255859375, -0.0615234375, 0.034515380859375, 0.13055419921875, 0.226593017578125, 0.3226318359375, 0.418670654296875, 0.51470947265625, 0.610748291015625, 0.706787109375, 0.802825927734375, 0.89886474609375, 0.994903564453125, 1.0909423828125, 1.186981201171875, 1.28302001953125, 1.379058837890625, 1.47509765625, 1.571136474609375, 1.66717529296875, 1.763214111328125, 1.8592529296875, 1.955291748046875, 2.05133056640625, 2.147369384765625, 2.243408203125, 2.339447021484375, 2.43548583984375, 2.531524658203125, 2.6275634765625, 2.723602294921875, 2.81964111328125, 2.915679931640625, 3.01171875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 6.0, 7.0, 5.0, 5.0, 9.0, 12.0, 10.0, 14.0, 21.0, 13.0, 30.0, 34.0, 52.0, 48.0, 46.0, 59.0, 86.0, 117.0, 240.0, 1457.0, 234.0, 147.0, 75.0, 48.0, 43.0, 36.0, 35.0, 28.0, 17.0, 20.0, 19.0, 13.0, 18.0, 13.0, 4.0, 7.0, 9.0, 2.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 4.0], "bins": [-3.875, -3.7744140625, -3.673828125, -3.5732421875, -3.47265625, -3.3720703125, -3.271484375, -3.1708984375, -3.0703125, -2.9697265625, -2.869140625, -2.7685546875, -2.66796875, -2.5673828125, -2.466796875, -2.3662109375, -2.265625, -2.1650390625, -2.064453125, -1.9638671875, -1.86328125, -1.7626953125, -1.662109375, -1.5615234375, -1.4609375, -1.3603515625, -1.259765625, -1.1591796875, -1.05859375, -0.9580078125, -0.857421875, -0.7568359375, -0.65625, -0.5556640625, -0.455078125, -0.3544921875, -0.25390625, -0.1533203125, -0.052734375, 0.0478515625, 0.1484375, 0.2490234375, 0.349609375, 0.4501953125, 0.55078125, 0.6513671875, 0.751953125, 0.8525390625, 0.953125, 1.0537109375, 1.154296875, 1.2548828125, 1.35546875, 1.4560546875, 1.556640625, 1.6572265625, 1.7578125, 1.8583984375, 1.958984375, 2.0595703125, 2.16015625, 2.2607421875, 2.361328125, 2.4619140625, 2.5625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 5.0, 0.0, 3.0, 2.0, 1.0, 6.0, 5.0, 8.0, 9.0, 11.0, 14.0, 13.0, 12.0, 17.0, 22.0, 15.0, 20.0, 34.0, 41.0, 70.0, 164.0, 507.0, 2448.0, 21318.0, 2020289.0, 1080941.0, 16719.0, 2065.0, 467.0, 149.0, 63.0, 43.0, 39.0, 34.0, 27.0, 33.0, 24.0, 15.0, 8.0, 10.0, 10.0, 8.0, 8.0, 6.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5078125, -10.1319580078125, -9.756103515625, -9.3802490234375, -9.00439453125, -8.6285400390625, -8.252685546875, -7.8768310546875, -7.5009765625, -7.1251220703125, -6.749267578125, -6.3734130859375, -5.99755859375, -5.6217041015625, -5.245849609375, -4.8699951171875, -4.494140625, -4.1182861328125, -3.742431640625, -3.3665771484375, -2.99072265625, -2.6148681640625, -2.239013671875, -1.8631591796875, -1.4873046875, -1.1114501953125, -0.735595703125, -0.3597412109375, 0.01611328125, 0.3919677734375, 0.767822265625, 1.1436767578125, 1.51953125, 1.8953857421875, 2.271240234375, 2.6470947265625, 3.02294921875, 3.3988037109375, 3.774658203125, 4.1505126953125, 4.5263671875, 4.9022216796875, 5.278076171875, 5.6539306640625, 6.02978515625, 6.4056396484375, 6.781494140625, 7.1573486328125, 7.533203125, 7.9090576171875, 8.284912109375, 8.6607666015625, 9.03662109375, 9.4124755859375, 9.788330078125, 10.1641845703125, 10.5400390625, 10.9158935546875, 11.291748046875, 11.6676025390625, 12.04345703125, 12.4193115234375, 12.795166015625, 13.1710205078125, 13.546875]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 874.0, 145.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.30627727508545, -7.840479373931885, -3.3746814727783203, 1.0911169052124023, 5.556914329528809, 10.022711753845215, 14.488511085510254, 18.954307556152344, 23.42010498046875, 27.885902404785156, 32.35169982910156, 36.81749725341797, 41.283294677734375, 45.74909210205078, 50.21489334106445, 54.68069076538086, 59.146488189697266, 63.61228561401367, 68.07808685302734, 72.54388427734375, 77.00968170166016, 81.47547912597656, 85.94127655029297, 90.40707397460938, 94.87287139892578, 99.33866882324219, 103.8044662475586, 108.270263671875, 112.7360610961914, 117.20185852050781, 121.66766357421875, 126.13345336914062, 130.59925842285156, 135.0650634765625, 139.53085327148438, 143.9966583251953, 148.4624481201172, 152.92825317382812, 157.39404296875, 161.85984802246094, 166.3256378173828, 170.79144287109375, 175.25723266601562, 179.72303771972656, 184.18882751464844, 188.65463256835938, 193.12042236328125, 197.5862274169922, 202.05203247070312, 206.51783752441406, 210.98362731933594, 215.44943237304688, 219.91522216796875, 224.3810272216797, 228.84681701660156, 233.3126220703125, 237.77841186523438, 242.2442169189453, 246.7100067138672, 251.17581176757812, 255.6416015625, 260.1073913574219, 264.5732116699219, 269.03900146484375, 273.5047912597656]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 5.0, 4.0, 5.0, 14.0, 15.0, 14.0, 21.0, 13.0, 20.0, 25.0, 26.0, 31.0, 38.0, 32.0, 40.0, 55.0, 40.0, 43.0, 35.0, 45.0, 46.0, 47.0, 34.0, 41.0, 41.0, 37.0, 35.0, 36.0, 28.0, 17.0, 26.0, 14.0, 22.0, 7.0, 13.0, 7.0, 8.0, 6.0, 10.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-9.848706245422363, -9.51983642578125, -9.190966606140137, -8.86209774017334, -8.533227920532227, -8.204358100891113, -7.87548828125, -7.546618461608887, -7.217749118804932, -6.888879299163818, -6.560009956359863, -6.23114013671875, -5.902270317077637, -5.573400974273682, -5.244531154632568, -4.915661811828613, -4.5867919921875, -4.257922172546387, -3.9290528297424316, -3.6001830101013184, -3.271313428878784, -2.94244384765625, -2.6135740280151367, -2.2847044467926025, -1.9558348655700684, -1.6269652843475342, -1.2980955839157104, -0.9692259430885315, -0.6403563022613525, -0.31148672103881836, 0.01738297939300537, 0.3462526798248291, 0.6751222610473633, 1.0039918422698975, 1.3328615427017212, 1.661731243133545, 1.990600824356079, 2.3194704055786133, 2.6483402252197266, 2.9772098064422607, 3.306079387664795, 3.634948968887329, 3.9638185501098633, 4.292688369750977, 4.62155818939209, 4.950427532196045, 5.279297351837158, 5.608166694641113, 5.937036514282227, 6.26590633392334, 6.594775676727295, 6.923645496368408, 7.252514839172363, 7.581384658813477, 7.91025447845459, 8.239124298095703, 8.5679931640625, 8.896862983703613, 9.225732803344727, 9.554601669311523, 9.883471488952637, 10.21234130859375, 10.541211128234863, 10.870080947875977, 11.19895076751709]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 10.0, 7.0, 5.0, 15.0, 9.0, 14.0, 19.0, 23.0, 15.0, 23.0, 24.0, 24.0, 48.0, 29.0, 40.0, 47.0, 31.0, 34.0, 47.0, 46.0, 47.0, 44.0, 41.0, 37.0, 23.0, 36.0, 27.0, 34.0, 38.0, 29.0, 16.0, 17.0, 22.0, 21.0, 16.0, 8.0, 6.0, 4.0, 7.0, 3.0, 4.0, 2.0, 7.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.73681640625, -0.7128982543945312, -0.6889801025390625, -0.6650619506835938, -0.641143798828125, -0.6172256469726562, -0.5933074951171875, -0.5693893432617188, -0.54547119140625, -0.5215530395507812, -0.4976348876953125, -0.47371673583984375, -0.449798583984375, -0.42588043212890625, -0.4019622802734375, -0.37804412841796875, -0.3541259765625, -0.33020782470703125, -0.3062896728515625, -0.28237152099609375, -0.258453369140625, -0.23453521728515625, -0.2106170654296875, -0.18669891357421875, -0.16278076171875, -0.13886260986328125, -0.1149444580078125, -0.09102630615234375, -0.067108154296875, -0.04319000244140625, -0.0192718505859375, 0.00464630126953125, 0.028564453125, 0.05248260498046875, 0.0764007568359375, 0.10031890869140625, 0.124237060546875, 0.14815521240234375, 0.1720733642578125, 0.19599151611328125, 0.21990966796875, 0.24382781982421875, 0.2677459716796875, 0.29166412353515625, 0.315582275390625, 0.33950042724609375, 0.3634185791015625, 0.38733673095703125, 0.4112548828125, 0.43517303466796875, 0.4590911865234375, 0.48300933837890625, 0.506927490234375, 0.5308456420898438, 0.5547637939453125, 0.5786819458007812, 0.60260009765625, 0.6265182495117188, 0.6504364013671875, 0.6743545532226562, 0.698272705078125, 0.7221908569335938, 0.7461090087890625, 0.7700271606445312, 0.7939453125]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 3.0, 4.0, 9.0, 11.0, 14.0, 31.0, 34.0, 36.0, 74.0, 74.0, 141.0, 189.0, 302.0, 457.0, 769.0, 1289.0, 2224.0, 4305.0, 8392.0, 18787.0, 45802.0, 136930.0, 931422.0, 2653965.0, 260574.0, 74897.0, 28478.0, 12326.0, 5743.0, 2975.0, 1612.0, 889.0, 504.0, 348.0, 192.0, 137.0, 98.0, 72.0, 48.0, 37.0, 20.0, 15.0, 12.0, 10.0, 7.0, 8.0, 6.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.095703125, -2.9932861328125, -2.890869140625, -2.7884521484375, -2.68603515625, -2.5836181640625, -2.481201171875, -2.3787841796875, -2.2763671875, -2.1739501953125, -2.071533203125, -1.9691162109375, -1.86669921875, -1.7642822265625, -1.661865234375, -1.5594482421875, -1.45703125, -1.3546142578125, -1.252197265625, -1.1497802734375, -1.04736328125, -0.9449462890625, -0.842529296875, -0.7401123046875, -0.6376953125, -0.5352783203125, -0.432861328125, -0.3304443359375, -0.22802734375, -0.1256103515625, -0.023193359375, 0.0792236328125, 0.181640625, 0.2840576171875, 0.386474609375, 0.4888916015625, 0.59130859375, 0.6937255859375, 0.796142578125, 0.8985595703125, 1.0009765625, 1.1033935546875, 1.205810546875, 1.3082275390625, 1.41064453125, 1.5130615234375, 1.615478515625, 1.7178955078125, 1.8203125, 1.9227294921875, 2.025146484375, 2.1275634765625, 2.22998046875, 2.3323974609375, 2.434814453125, 2.5372314453125, 2.6396484375, 2.7420654296875, 2.844482421875, 2.9468994140625, 3.04931640625, 3.1517333984375, 3.254150390625, 3.3565673828125, 3.458984375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 9.0, 19.0, 21.0, 36.0, 75.0, 103.0, 193.0, 357.0, 823.0, 1040.0, 592.0, 350.0, 196.0, 128.0, 71.0, 27.0, 19.0, 10.0, 4.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.03515625, -3.84600830078125, -3.6568603515625, -3.46771240234375, -3.278564453125, -3.08941650390625, -2.9002685546875, -2.71112060546875, -2.52197265625, -2.33282470703125, -2.1436767578125, -1.95452880859375, -1.765380859375, -1.57623291015625, -1.3870849609375, -1.19793701171875, -1.0087890625, -0.81964111328125, -0.6304931640625, -0.44134521484375, -0.252197265625, -0.06304931640625, 0.1260986328125, 0.31524658203125, 0.50439453125, 0.69354248046875, 0.8826904296875, 1.07183837890625, 1.260986328125, 1.45013427734375, 1.6392822265625, 1.82843017578125, 2.017578125, 2.20672607421875, 2.3958740234375, 2.58502197265625, 2.774169921875, 2.96331787109375, 3.1524658203125, 3.34161376953125, 3.53076171875, 3.71990966796875, 3.9090576171875, 4.09820556640625, 4.287353515625, 4.47650146484375, 4.6656494140625, 4.85479736328125, 5.0439453125, 5.23309326171875, 5.4222412109375, 5.61138916015625, 5.800537109375, 5.98968505859375, 6.1788330078125, 6.36798095703125, 6.55712890625, 6.74627685546875, 6.9354248046875, 7.12457275390625, 7.313720703125, 7.50286865234375, 7.6920166015625, 7.88116455078125, 8.0703125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 5.0, 3.0, 10.0, 21.0, 13.0, 40.0, 35.0, 62.0, 78.0, 112.0, 156.0, 263.0, 429.0, 1071.0, 3789.0, 21198.0, 194031.0, 3622166.0, 314513.0, 29084.0, 4877.0, 1184.0, 426.0, 217.0, 130.0, 97.0, 74.0, 47.0, 39.0, 33.0, 20.0, 18.0, 12.0, 9.0, 7.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5859375, -10.172119140625, -9.75830078125, -9.344482421875, -8.9306640625, -8.516845703125, -8.10302734375, -7.689208984375, -7.275390625, -6.861572265625, -6.44775390625, -6.033935546875, -5.6201171875, -5.206298828125, -4.79248046875, -4.378662109375, -3.96484375, -3.551025390625, -3.13720703125, -2.723388671875, -2.3095703125, -1.895751953125, -1.48193359375, -1.068115234375, -0.654296875, -0.240478515625, 0.17333984375, 0.587158203125, 1.0009765625, 1.414794921875, 1.82861328125, 2.242431640625, 2.65625, 3.070068359375, 3.48388671875, 3.897705078125, 4.3115234375, 4.725341796875, 5.13916015625, 5.552978515625, 5.966796875, 6.380615234375, 6.79443359375, 7.208251953125, 7.6220703125, 8.035888671875, 8.44970703125, 8.863525390625, 9.27734375, 9.691162109375, 10.10498046875, 10.518798828125, 10.9326171875, 11.346435546875, 11.76025390625, 12.174072265625, 12.587890625, 13.001708984375, 13.41552734375, 13.829345703125, 14.2431640625, 14.656982421875, 15.07080078125, 15.484619140625, 15.8984375]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 10.0, 435.0, 564.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.016820907592773, -16.56915283203125, -11.12148666381836, -5.673818588256836, -0.2261524200439453, 5.221513748168945, 10.669183731079102, 16.116849899291992, 21.564516067504883, 27.012184143066406, 32.4598503112793, 37.90751647949219, 43.355186462402344, 48.80284881591797, 54.250518798828125, 59.69818878173828, 65.1458511352539, 70.59352111816406, 76.04118347167969, 81.48885345458984, 86.9365234375, 92.38418579101562, 97.83185577392578, 103.27952575683594, 108.72718811035156, 114.17485809326172, 119.62252044677734, 125.0701904296875, 130.51785278320312, 135.96551513671875, 141.41319274902344, 146.86085510253906, 152.30853271484375, 157.75619506835938, 163.20387268066406, 168.6515350341797, 174.0991973876953, 179.546875, 184.99453735351562, 190.44219970703125, 195.88986206054688, 201.3375244140625, 206.7852020263672, 212.2328643798828, 217.68052673339844, 223.12820434570312, 228.57586669921875, 234.02352905273438, 239.47120666503906, 244.9188690185547, 250.36654663085938, 255.814208984375, 261.2618713378906, 266.70953369140625, 272.1572265625, 277.6048889160156, 283.05255126953125, 288.5002136230469, 293.9478759765625, 299.39556884765625, 304.8432312011719, 310.2908935546875, 315.7385559082031, 321.18621826171875, 326.6338806152344]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 10.0, 15.0, 17.0, 19.0, 23.0, 20.0, 28.0, 43.0, 40.0, 45.0, 47.0, 50.0, 64.0, 41.0, 46.0, 55.0, 38.0, 48.0, 49.0, 41.0, 34.0, 49.0, 30.0, 29.0, 27.0, 18.0, 22.0, 7.0, 13.0, 9.0, 8.0, 5.0, 3.0, 2.0, 0.0, 2.0], "bins": [-20.97309684753418, -20.459436416625977, -19.94577407836914, -19.432113647460938, -18.918453216552734, -18.40479278564453, -17.891132354736328, -17.377470016479492, -16.86380958557129, -16.350149154663086, -15.836487770080566, -15.322826385498047, -14.809165954589844, -14.29550552368164, -13.781844139099121, -13.268182754516602, -12.754522323608398, -12.240861892700195, -11.727200508117676, -11.213539123535156, -10.699878692626953, -10.18621826171875, -9.67255687713623, -9.158895492553711, -8.645235061645508, -8.131574630737305, -7.617913246154785, -7.104252338409424, -6.5905914306640625, -6.076930522918701, -5.56326961517334, -5.0496087074279785, -4.535946846008301, -4.0222859382629395, -3.508625030517578, -2.994964122772217, -2.4813032150268555, -1.9676423072814941, -1.4539813995361328, -0.9403204917907715, -0.42665958404541016, 0.08700132369995117, 0.6006622314453125, 1.1143231391906738, 1.6279840469360352, 2.1416449546813965, 2.655305862426758, 3.168966770172119, 3.6826276779174805, 4.196288585662842, 4.709949493408203, 5.2236104011535645, 5.737271308898926, 6.250932216644287, 6.764593124389648, 7.27825403213501, 7.791914939880371, 8.30557632446289, 8.819236755371094, 9.332897186279297, 9.846558570861816, 10.360219955444336, 10.873880386352539, 11.387540817260742, 11.901202201843262]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 6.0, 8.0, 5.0, 10.0, 9.0, 16.0, 16.0, 21.0, 19.0, 26.0, 22.0, 28.0, 41.0, 28.0, 37.0, 39.0, 34.0, 40.0, 48.0, 43.0, 39.0, 59.0, 33.0, 35.0, 17.0, 36.0, 40.0, 35.0, 35.0, 28.0, 13.0, 22.0, 19.0, 21.0, 10.0, 12.0, 12.0, 4.0, 10.0, 3.0, 7.0, 7.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.74169921875, -0.7179031372070312, -0.6941070556640625, -0.6703109741210938, -0.646514892578125, -0.6227188110351562, -0.5989227294921875, -0.5751266479492188, -0.55133056640625, -0.5275344848632812, -0.5037384033203125, -0.47994232177734375, -0.456146240234375, -0.43235015869140625, -0.4085540771484375, -0.38475799560546875, -0.3609619140625, -0.33716583251953125, -0.3133697509765625, -0.28957366943359375, -0.265777587890625, -0.24198150634765625, -0.2181854248046875, -0.19438934326171875, -0.17059326171875, -0.14679718017578125, -0.1230010986328125, -0.09920501708984375, -0.075408935546875, -0.05161285400390625, -0.0278167724609375, -0.00402069091796875, 0.019775390625, 0.04357147216796875, 0.0673675537109375, 0.09116363525390625, 0.114959716796875, 0.13875579833984375, 0.1625518798828125, 0.18634796142578125, 0.21014404296875, 0.23394012451171875, 0.2577362060546875, 0.28153228759765625, 0.305328369140625, 0.32912445068359375, 0.3529205322265625, 0.37671661376953125, 0.4005126953125, 0.42430877685546875, 0.4481048583984375, 0.47190093994140625, 0.495697021484375, 0.5194931030273438, 0.5432891845703125, 0.5670852661132812, 0.59088134765625, 0.6146774291992188, 0.6384735107421875, 0.6622695922851562, 0.686065673828125, 0.7098617553710938, 0.7336578369140625, 0.7574539184570312, 0.78125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 7.0, 1.0, 16.0, 16.0, 29.0, 26.0, 53.0, 62.0, 79.0, 144.0, 197.0, 289.0, 423.0, 615.0, 1018.0, 1461.0, 2151.0, 3309.0, 5218.0, 8282.0, 13449.0, 22058.0, 37689.0, 66701.0, 128665.0, 270008.0, 231545.0, 110046.0, 58539.0, 33316.0, 19643.0, 11981.0, 7571.0, 4889.0, 3088.0, 1950.0, 1372.0, 865.0, 593.0, 402.0, 229.0, 174.0, 134.0, 74.0, 59.0, 44.0, 25.0, 17.0, 17.0, 8.0, 3.0, 2.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.244140625, -2.17376708984375, -2.1033935546875, -2.03302001953125, -1.962646484375, -1.89227294921875, -1.8218994140625, -1.75152587890625, -1.68115234375, -1.61077880859375, -1.5404052734375, -1.47003173828125, -1.399658203125, -1.32928466796875, -1.2589111328125, -1.18853759765625, -1.1181640625, -1.04779052734375, -0.9774169921875, -0.90704345703125, -0.836669921875, -0.76629638671875, -0.6959228515625, -0.62554931640625, -0.55517578125, -0.48480224609375, -0.4144287109375, -0.34405517578125, -0.273681640625, -0.20330810546875, -0.1329345703125, -0.06256103515625, 0.0078125, 0.07818603515625, 0.1485595703125, 0.21893310546875, 0.289306640625, 0.35968017578125, 0.4300537109375, 0.50042724609375, 0.57080078125, 0.64117431640625, 0.7115478515625, 0.78192138671875, 0.852294921875, 0.92266845703125, 0.9930419921875, 1.06341552734375, 1.1337890625, 1.20416259765625, 1.2745361328125, 1.34490966796875, 1.415283203125, 1.48565673828125, 1.5560302734375, 1.62640380859375, 1.69677734375, 1.76715087890625, 1.8375244140625, 1.90789794921875, 1.978271484375, 2.04864501953125, 2.1190185546875, 2.18939208984375, 2.259765625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 7.0, 5.0, 7.0, 13.0, 14.0, 17.0, 22.0, 18.0, 28.0, 20.0, 30.0, 29.0, 19.0, 31.0, 37.0, 41.0, 44.0, 42.0, 54.0, 1066.0, 50.0, 44.0, 38.0, 42.0, 28.0, 46.0, 32.0, 25.0, 28.0, 30.0, 17.0, 16.0, 19.0, 15.0, 15.0, 10.0, 12.0, 6.0, 2.0, 6.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6630859375, -0.6426467895507812, -0.6222076416015625, -0.6017684936523438, -0.581329345703125, -0.5608901977539062, -0.5404510498046875, -0.5200119018554688, -0.49957275390625, -0.47913360595703125, -0.4586944580078125, -0.43825531005859375, -0.417816162109375, -0.39737701416015625, -0.3769378662109375, -0.35649871826171875, -0.3360595703125, -0.31562042236328125, -0.2951812744140625, -0.27474212646484375, -0.254302978515625, -0.23386383056640625, -0.2134246826171875, -0.19298553466796875, -0.17254638671875, -0.15210723876953125, -0.1316680908203125, -0.11122894287109375, -0.090789794921875, -0.07035064697265625, -0.0499114990234375, -0.02947235107421875, -0.009033203125, 0.01140594482421875, 0.0318450927734375, 0.05228424072265625, 0.072723388671875, 0.09316253662109375, 0.1136016845703125, 0.13404083251953125, 0.15447998046875, 0.17491912841796875, 0.1953582763671875, 0.21579742431640625, 0.236236572265625, 0.25667572021484375, 0.2771148681640625, 0.29755401611328125, 0.3179931640625, 0.33843231201171875, 0.3588714599609375, 0.37931060791015625, 0.399749755859375, 0.42018890380859375, 0.4406280517578125, 0.46106719970703125, 0.48150634765625, 0.5019454956054688, 0.5223846435546875, 0.5428237915039062, 0.563262939453125, 0.5837020874023438, 0.6041412353515625, 0.6245803833007812, 0.64501953125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 8.0, 9.0, 12.0, 18.0, 19.0, 39.0, 52.0, 71.0, 94.0, 155.0, 266.0, 359.0, 554.0, 791.0, 1196.0, 1722.0, 2838.0, 4662.0, 8013.0, 14920.0, 30880.0, 73292.0, 238081.0, 1311831.0, 259837.0, 77818.0, 32447.0, 15700.0, 8335.0, 4817.0, 2868.0, 1890.0, 1200.0, 777.0, 472.0, 320.0, 245.0, 169.0, 134.0, 78.0, 52.0, 38.0, 14.0, 17.0, 11.0, 9.0, 1.0, 5.0, 1.0, 3.0, 1.0, 3.0, 1.0], "bins": [-2.107421875, -2.04638671875, -1.9853515625, -1.92431640625, -1.86328125, -1.80224609375, -1.7412109375, -1.68017578125, -1.619140625, -1.55810546875, -1.4970703125, -1.43603515625, -1.375, -1.31396484375, -1.2529296875, -1.19189453125, -1.130859375, -1.06982421875, -1.0087890625, -0.94775390625, -0.88671875, -0.82568359375, -0.7646484375, -0.70361328125, -0.642578125, -0.58154296875, -0.5205078125, -0.45947265625, -0.3984375, -0.33740234375, -0.2763671875, -0.21533203125, -0.154296875, -0.09326171875, -0.0322265625, 0.02880859375, 0.08984375, 0.15087890625, 0.2119140625, 0.27294921875, 0.333984375, 0.39501953125, 0.4560546875, 0.51708984375, 0.578125, 0.63916015625, 0.7001953125, 0.76123046875, 0.822265625, 0.88330078125, 0.9443359375, 1.00537109375, 1.06640625, 1.12744140625, 1.1884765625, 1.24951171875, 1.310546875, 1.37158203125, 1.4326171875, 1.49365234375, 1.5546875, 1.61572265625, 1.6767578125, 1.73779296875, 1.798828125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 6.0, 3.0, 4.0, 9.0, 14.0, 28.0, 98.0, 489.0, 202.0, 53.0, 22.0, 8.0, 7.0, 3.0, 8.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.228515625, -2.160614013671875, -2.09271240234375, -2.024810791015625, -1.9569091796875, -1.889007568359375, -1.82110595703125, -1.753204345703125, -1.685302734375, -1.617401123046875, -1.54949951171875, -1.481597900390625, -1.4136962890625, -1.345794677734375, -1.27789306640625, -1.209991455078125, -1.14208984375, -1.074188232421875, -1.00628662109375, -0.938385009765625, -0.8704833984375, -0.802581787109375, -0.73468017578125, -0.666778564453125, -0.598876953125, -0.530975341796875, -0.46307373046875, -0.395172119140625, -0.3272705078125, -0.259368896484375, -0.19146728515625, -0.123565673828125, -0.0556640625, 0.012237548828125, 0.08013916015625, 0.148040771484375, 0.2159423828125, 0.283843994140625, 0.35174560546875, 0.419647216796875, 0.487548828125, 0.555450439453125, 0.62335205078125, 0.691253662109375, 0.7591552734375, 0.827056884765625, 0.89495849609375, 0.962860107421875, 1.03076171875, 1.098663330078125, 1.16656494140625, 1.234466552734375, 1.3023681640625, 1.370269775390625, 1.43817138671875, 1.506072998046875, 1.573974609375, 1.641876220703125, 1.70977783203125, 1.777679443359375, 1.8455810546875, 1.913482666015625, 1.98138427734375, 2.049285888671875, 2.1171875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 0.0, 1.0, 6.0, 3.0, 3.0, 5.0, 4.0, 5.0, 10.0, 4.0, 8.0, 7.0, 11.0, 9.0, 6.0, 12.0, 12.0, 21.0, 21.0, 48.0, 99.0, 487.0, 4694.0, 957267.0, 82031.0, 3151.0, 359.0, 84.0, 37.0, 25.0, 17.0, 18.0, 9.0, 10.0, 7.0, 10.0, 9.0, 3.0, 5.0, 5.0, 12.0, 6.0, 1.0, 7.0, 0.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-33.21875, -32.20947265625, -31.2001953125, -30.19091796875, -29.181640625, -28.17236328125, -27.1630859375, -26.15380859375, -25.14453125, -24.13525390625, -23.1259765625, -22.11669921875, -21.107421875, -20.09814453125, -19.0888671875, -18.07958984375, -17.0703125, -16.06103515625, -15.0517578125, -14.04248046875, -13.033203125, -12.02392578125, -11.0146484375, -10.00537109375, -8.99609375, -7.98681640625, -6.9775390625, -5.96826171875, -4.958984375, -3.94970703125, -2.9404296875, -1.93115234375, -0.921875, 0.08740234375, 1.0966796875, 2.10595703125, 3.115234375, 4.12451171875, 5.1337890625, 6.14306640625, 7.15234375, 8.16162109375, 9.1708984375, 10.18017578125, 11.189453125, 12.19873046875, 13.2080078125, 14.21728515625, 15.2265625, 16.23583984375, 17.2451171875, 18.25439453125, 19.263671875, 20.27294921875, 21.2822265625, 22.29150390625, 23.30078125, 24.31005859375, 25.3193359375, 26.32861328125, 27.337890625, 28.34716796875, 29.3564453125, 30.36572265625, 31.375]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 7.0, 3.0, 8.0, 4.0, 18.0, 26.0, 32.0, 57.0, 105.0, 166.0, 190.0, 141.0, 76.0, 48.0, 46.0, 21.0, 12.0, 14.0, 14.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.643264055252075, -3.5646469593048096, -3.486029863357544, -3.4074127674102783, -3.3287956714630127, -3.250178575515747, -3.1715614795684814, -3.092944383621216, -3.01432728767395, -2.9357101917266846, -2.857093095779419, -2.7784759998321533, -2.6998589038848877, -2.621241807937622, -2.5426247119903564, -2.464007616043091, -2.385390520095825, -2.3067734241485596, -2.228156328201294, -2.1495392322540283, -2.0709221363067627, -1.992305040359497, -1.9136879444122314, -1.8350708484649658, -1.7564537525177002, -1.6778366565704346, -1.599219560623169, -1.5206024646759033, -1.4419853687286377, -1.363368272781372, -1.2847511768341064, -1.2061340808868408, -1.1275168657302856, -1.04889976978302, -0.9702826738357544, -0.8916655778884888, -0.8130484819412231, -0.7344313859939575, -0.6558142900466919, -0.5771971940994263, -0.49858009815216064, -0.419963002204895, -0.3413459062576294, -0.26272881031036377, -0.18411171436309814, -0.10549461841583252, -0.026877522468566895, 0.05173957347869873, 0.13035666942596436, 0.20897376537322998, 0.2875908613204956, 0.36620795726776123, 0.44482505321502686, 0.5234421491622925, 0.6020592451095581, 0.6806763410568237, 0.7592934370040894, 0.837910532951355, 0.9165276288986206, 0.9951447248458862, 1.0737618207931519, 1.1523789167404175, 1.230996012687683, 1.3096131086349487, 1.3882302045822144]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 7.0, 2.0, 7.0, 16.0, 17.0, 18.0, 17.0, 17.0, 30.0, 31.0, 39.0, 25.0, 42.0, 52.0, 47.0, 40.0, 53.0, 47.0, 53.0, 43.0, 38.0, 43.0, 36.0, 32.0, 46.0, 37.0, 26.0, 21.0, 22.0, 21.0, 22.0, 15.0, 10.0, 11.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8690627813339233, -1.810356855392456, -1.7516508102416992, -1.692944884300232, -1.6342389583587646, -1.5755329132080078, -1.5168269872665405, -1.4581210613250732, -1.3994150161743164, -1.3407090902328491, -1.2820030450820923, -1.223297119140625, -1.1645910739898682, -1.1058851480484009, -1.0471792221069336, -0.9884732365608215, -0.9297672510147095, -0.8710612654685974, -0.8123552799224854, -0.7536493539810181, -0.694943368434906, -0.636237382888794, -0.5775314569473267, -0.5188254714012146, -0.46011948585510254, -0.4014135003089905, -0.3427075445652008, -0.28400158882141113, -0.22529560327529907, -0.166589617729187, -0.10788366198539734, -0.049177706241607666, 0.009528398513793945, 0.06823436915874481, 0.12694033980369568, 0.18564631044864655, 0.2443522810935974, 0.3030582666397095, 0.36176422238349915, 0.4204701781272888, 0.4791761636734009, 0.5378821492195129, 0.596588134765625, 0.6552940607070923, 0.7140000462532043, 0.7727060317993164, 0.8314119577407837, 0.8901179432868958, 0.9488239288330078, 1.007529854774475, 1.066235899925232, 1.1249418258666992, 1.183647871017456, 1.2423537969589233, 1.3010597229003906, 1.3597657680511475, 1.4184716939926147, 1.477177619934082, 1.5358836650848389, 1.5945895910263062, 1.6532955169677734, 1.7120015621185303, 1.7707074880599976, 1.8294134140014648, 1.8881194591522217]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 8.0, 6.0, 6.0, 2.0, 10.0, 11.0, 20.0, 23.0, 16.0, 9.0, 37.0, 23.0, 33.0, 23.0, 32.0, 38.0, 40.0, 27.0, 36.0, 45.0, 43.0, 50.0, 47.0, 38.0, 24.0, 36.0, 26.0, 36.0, 38.0, 32.0, 29.0, 18.0, 24.0, 19.0, 8.0, 14.0, 19.0, 14.0, 6.0, 8.0, 3.0, 7.0, 5.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.72021484375, -0.6971359252929688, -0.6740570068359375, -0.6509780883789062, -0.627899169921875, -0.6048202514648438, -0.5817413330078125, -0.5586624145507812, -0.53558349609375, -0.5125045776367188, -0.4894256591796875, -0.46634674072265625, -0.443267822265625, -0.42018890380859375, -0.3971099853515625, -0.37403106689453125, -0.3509521484375, -0.32787322998046875, -0.3047943115234375, -0.28171539306640625, -0.258636474609375, -0.23555755615234375, -0.2124786376953125, -0.18939971923828125, -0.16632080078125, -0.14324188232421875, -0.1201629638671875, -0.09708404541015625, -0.074005126953125, -0.05092620849609375, -0.0278472900390625, -0.00476837158203125, 0.018310546875, 0.04138946533203125, 0.0644683837890625, 0.08754730224609375, 0.110626220703125, 0.13370513916015625, 0.1567840576171875, 0.17986297607421875, 0.20294189453125, 0.22602081298828125, 0.2490997314453125, 0.27217864990234375, 0.295257568359375, 0.31833648681640625, 0.3414154052734375, 0.36449432373046875, 0.3875732421875, 0.41065216064453125, 0.4337310791015625, 0.45680999755859375, 0.479888916015625, 0.5029678344726562, 0.5260467529296875, 0.5491256713867188, 0.57220458984375, 0.5952835083007812, 0.6183624267578125, 0.6414413452148438, 0.664520263671875, 0.6875991821289062, 0.7106781005859375, 0.7337570190429688, 0.7568359375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 11.0, 21.0, 19.0, 23.0, 42.0, 52.0, 61.0, 91.0, 130.0, 195.0, 258.0, 380.0, 496.0, 698.0, 1010.0, 1437.0, 2119.0, 3141.0, 4884.0, 8191.0, 13665.0, 25400.0, 55348.0, 138998.0, 324830.0, 266460.0, 104049.0, 43482.0, 21025.0, 11612.0, 6861.0, 4425.0, 2900.0, 1848.0, 1303.0, 842.0, 618.0, 433.0, 320.0, 241.0, 189.0, 112.0, 82.0, 81.0, 51.0, 31.0, 26.0, 18.0, 9.0, 14.0, 5.0, 4.0, 5.0, 3.0, 3.0], "bins": [-1.1962890625, -1.16094970703125, -1.1256103515625, -1.09027099609375, -1.054931640625, -1.01959228515625, -0.9842529296875, -0.94891357421875, -0.91357421875, -0.87823486328125, -0.8428955078125, -0.80755615234375, -0.772216796875, -0.73687744140625, -0.7015380859375, -0.66619873046875, -0.630859375, -0.59552001953125, -0.5601806640625, -0.52484130859375, -0.489501953125, -0.45416259765625, -0.4188232421875, -0.38348388671875, -0.34814453125, -0.31280517578125, -0.2774658203125, -0.24212646484375, -0.206787109375, -0.17144775390625, -0.1361083984375, -0.10076904296875, -0.0654296875, -0.03009033203125, 0.0052490234375, 0.04058837890625, 0.075927734375, 0.11126708984375, 0.1466064453125, 0.18194580078125, 0.21728515625, 0.25262451171875, 0.2879638671875, 0.32330322265625, 0.358642578125, 0.39398193359375, 0.4293212890625, 0.46466064453125, 0.5, 0.53533935546875, 0.5706787109375, 0.60601806640625, 0.641357421875, 0.67669677734375, 0.7120361328125, 0.74737548828125, 0.78271484375, 0.81805419921875, 0.8533935546875, 0.88873291015625, 0.924072265625, 0.95941162109375, 0.9947509765625, 1.03009033203125, 1.0654296875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 2.0, 8.0, 5.0, 5.0, 6.0, 11.0, 6.0, 12.0, 10.0, 20.0, 17.0, 25.0, 20.0, 34.0, 47.0, 45.0, 45.0, 52.0, 67.0, 96.0, 189.0, 283.0, 1319.0, 177.0, 99.0, 70.0, 62.0, 42.0, 51.0, 31.0, 28.0, 32.0, 27.0, 28.0, 13.0, 21.0, 16.0, 13.0, 7.0, 2.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.908203125, -2.804595947265625, -2.70098876953125, -2.597381591796875, -2.4937744140625, -2.390167236328125, -2.28656005859375, -2.182952880859375, -2.079345703125, -1.975738525390625, -1.87213134765625, -1.768524169921875, -1.6649169921875, -1.561309814453125, -1.45770263671875, -1.354095458984375, -1.25048828125, -1.146881103515625, -1.04327392578125, -0.939666748046875, -0.8360595703125, -0.732452392578125, -0.62884521484375, -0.525238037109375, -0.421630859375, -0.318023681640625, -0.21441650390625, -0.110809326171875, -0.0072021484375, 0.096405029296875, 0.20001220703125, 0.303619384765625, 0.4072265625, 0.510833740234375, 0.61444091796875, 0.718048095703125, 0.8216552734375, 0.925262451171875, 1.02886962890625, 1.132476806640625, 1.236083984375, 1.339691162109375, 1.44329833984375, 1.546905517578125, 1.6505126953125, 1.754119873046875, 1.85772705078125, 1.961334228515625, 2.06494140625, 2.168548583984375, 2.27215576171875, 2.375762939453125, 2.4793701171875, 2.582977294921875, 2.68658447265625, 2.790191650390625, 2.893798828125, 2.997406005859375, 3.10101318359375, 3.204620361328125, 3.3082275390625, 3.411834716796875, 3.51544189453125, 3.619049072265625, 3.72265625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 2.0, 7.0, 9.0, 12.0, 14.0, 17.0, 29.0, 15.0, 50.0, 62.0, 77.0, 120.0, 218.0, 381.0, 645.0, 1248.0, 2502.0, 6112.0, 18544.0, 81312.0, 861924.0, 1990369.0, 139898.0, 27294.0, 8158.0, 3158.0, 1542.0, 786.0, 434.0, 285.0, 151.0, 79.0, 61.0, 42.0, 34.0, 24.0, 23.0, 12.0, 8.0, 11.0, 11.0, 5.0, 1.0, 4.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 3.0], "bins": [-5.2265625, -5.073486328125, -4.92041015625, -4.767333984375, -4.6142578125, -4.461181640625, -4.30810546875, -4.155029296875, -4.001953125, -3.848876953125, -3.69580078125, -3.542724609375, -3.3896484375, -3.236572265625, -3.08349609375, -2.930419921875, -2.77734375, -2.624267578125, -2.47119140625, -2.318115234375, -2.1650390625, -2.011962890625, -1.85888671875, -1.705810546875, -1.552734375, -1.399658203125, -1.24658203125, -1.093505859375, -0.9404296875, -0.787353515625, -0.63427734375, -0.481201171875, -0.328125, -0.175048828125, -0.02197265625, 0.131103515625, 0.2841796875, 0.437255859375, 0.59033203125, 0.743408203125, 0.896484375, 1.049560546875, 1.20263671875, 1.355712890625, 1.5087890625, 1.661865234375, 1.81494140625, 1.968017578125, 2.12109375, 2.274169921875, 2.42724609375, 2.580322265625, 2.7333984375, 2.886474609375, 3.03955078125, 3.192626953125, 3.345703125, 3.498779296875, 3.65185546875, 3.804931640625, 3.9580078125, 4.111083984375, 4.26416015625, 4.417236328125, 4.5703125]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 27.0, 243.0, 563.0, 164.0, 15.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.67650032043457, -28.291778564453125, -26.90705680847168, -25.522335052490234, -24.13761329650879, -22.752891540527344, -21.3681697845459, -19.983448028564453, -18.598726272583008, -17.214004516601562, -15.829282760620117, -14.444561004638672, -13.059839248657227, -11.675117492675781, -10.290395736694336, -8.90567398071289, -7.520952224731445, -6.13623046875, -4.751508712768555, -3.3667869567871094, -1.982065200805664, -0.5973434448242188, 0.7873783111572266, 2.172100067138672, 3.556821823120117, 4.9415435791015625, 6.326265335083008, 7.710987091064453, 9.095708847045898, 10.480430603027344, 11.865152359008789, 13.249874114990234, 14.634597778320312, 16.019319534301758, 17.404041290283203, 18.78876304626465, 20.173484802246094, 21.55820655822754, 22.942928314208984, 24.32765007019043, 25.712371826171875, 27.09709358215332, 28.481815338134766, 29.86653709411621, 31.251258850097656, 32.63597869873047, 34.02070236206055, 35.405426025390625, 36.79014587402344, 38.17486572265625, 39.55958938598633, 40.944313049316406, 42.32903289794922, 43.71375274658203, 45.09847640991211, 46.48320007324219, 47.867919921875, 49.25263977050781, 50.63736343383789, 52.02208709716797, 53.40680694580078, 54.791526794433594, 56.17625045776367, 57.56097412109375, 58.94569396972656]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 1.0, 4.0, 7.0, 9.0, 9.0, 8.0, 11.0, 17.0, 10.0, 21.0, 22.0, 25.0, 22.0, 29.0, 31.0, 33.0, 37.0, 30.0, 37.0, 43.0, 39.0, 36.0, 35.0, 48.0, 36.0, 39.0, 35.0, 52.0, 36.0, 26.0, 25.0, 16.0, 25.0, 21.0, 25.0, 21.0, 11.0, 15.0, 16.0, 4.0, 7.0, 8.0, 6.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.70910930633545, -9.40731143951416, -9.105514526367188, -8.803716659545898, -8.501919746398926, -8.200121879577637, -7.898324489593506, -7.596527099609375, -7.294729232788086, -6.992931842803955, -6.691134452819824, -6.389336585998535, -6.087539196014404, -5.785741806030273, -5.483944416046143, -5.182147026062012, -4.880349636077881, -4.57855224609375, -4.276754856109619, -3.974957227706909, -3.673159599304199, -3.3713622093200684, -3.0695648193359375, -2.7677671909332275, -2.4659698009490967, -2.164172410964966, -1.8623747825622559, -1.560577392578125, -1.2587798833847046, -0.9569823741912842, -0.6551849842071533, -0.35338735580444336, -0.0515899658203125, 0.2502075135707855, 0.5520049929618835, 0.8538024425506592, 1.1555999517440796, 1.4573974609375, 1.7591948509216309, 2.060992479324341, 2.3627898693084717, 2.6645872592926025, 2.9663848876953125, 3.2681822776794434, 3.569979667663574, 3.871777296066284, 4.173574447631836, 4.475372314453125, 4.777169704437256, 5.078967094421387, 5.380764484405518, 5.682561874389648, 5.9843597412109375, 6.286157131195068, 6.587954521179199, 6.889752388000488, 7.191549301147461, 7.493346691131592, 7.795144081115723, 8.096941947937012, 8.398738861083984, 8.700536727905273, 9.002334594726562, 9.304131507873535, 9.605929374694824]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 7.0, 6.0, 5.0, 7.0, 15.0, 9.0, 21.0, 15.0, 16.0, 15.0, 32.0, 35.0, 34.0, 33.0, 23.0, 37.0, 34.0, 38.0, 41.0, 41.0, 50.0, 39.0, 42.0, 39.0, 31.0, 34.0, 32.0, 32.0, 29.0, 31.0, 25.0, 27.0, 16.0, 20.0, 15.0, 12.0, 9.0, 7.0, 12.0, 10.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.76806640625, -0.7436981201171875, -0.719329833984375, -0.6949615478515625, -0.67059326171875, -0.6462249755859375, -0.621856689453125, -0.5974884033203125, -0.5731201171875, -0.5487518310546875, -0.524383544921875, -0.5000152587890625, -0.47564697265625, -0.4512786865234375, -0.426910400390625, -0.4025421142578125, -0.378173828125, -0.3538055419921875, -0.329437255859375, -0.3050689697265625, -0.28070068359375, -0.2563323974609375, -0.231964111328125, -0.2075958251953125, -0.1832275390625, -0.1588592529296875, -0.134490966796875, -0.1101226806640625, -0.08575439453125, -0.0613861083984375, -0.037017822265625, -0.0126495361328125, 0.01171875, 0.0360870361328125, 0.060455322265625, 0.0848236083984375, 0.10919189453125, 0.1335601806640625, 0.157928466796875, 0.1822967529296875, 0.2066650390625, 0.2310333251953125, 0.255401611328125, 0.2797698974609375, 0.30413818359375, 0.3285064697265625, 0.352874755859375, 0.3772430419921875, 0.401611328125, 0.4259796142578125, 0.450347900390625, 0.4747161865234375, 0.49908447265625, 0.5234527587890625, 0.547821044921875, 0.5721893310546875, 0.5965576171875, 0.6209259033203125, 0.645294189453125, 0.6696624755859375, 0.69403076171875, 0.7183990478515625, 0.742767333984375, 0.7671356201171875, 0.79150390625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 6.0, 6.0, 15.0, 7.0, 18.0, 23.0, 32.0, 51.0, 60.0, 94.0, 151.0, 230.0, 418.0, 682.0, 1377.0, 2924.0, 5949.0, 14375.0, 38589.0, 141057.0, 2193865.0, 1616222.0, 119837.0, 34569.0, 12832.0, 5597.0, 2473.0, 1222.0, 663.0, 322.0, 194.0, 150.0, 69.0, 54.0, 44.0, 27.0, 11.0, 15.0, 14.0, 8.0, 8.0, 3.0, 5.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.333984375, -3.214691162109375, -3.09539794921875, -2.976104736328125, -2.8568115234375, -2.737518310546875, -2.61822509765625, -2.498931884765625, -2.379638671875, -2.260345458984375, -2.14105224609375, -2.021759033203125, -1.9024658203125, -1.783172607421875, -1.66387939453125, -1.544586181640625, -1.42529296875, -1.305999755859375, -1.18670654296875, -1.067413330078125, -0.9481201171875, -0.828826904296875, -0.70953369140625, -0.590240478515625, -0.470947265625, -0.351654052734375, -0.23236083984375, -0.113067626953125, 0.0062255859375, 0.125518798828125, 0.24481201171875, 0.364105224609375, 0.4833984375, 0.602691650390625, 0.72198486328125, 0.841278076171875, 0.9605712890625, 1.079864501953125, 1.19915771484375, 1.318450927734375, 1.437744140625, 1.557037353515625, 1.67633056640625, 1.795623779296875, 1.9149169921875, 2.034210205078125, 2.15350341796875, 2.272796630859375, 2.39208984375, 2.511383056640625, 2.63067626953125, 2.749969482421875, 2.8692626953125, 2.988555908203125, 3.10784912109375, 3.227142333984375, 3.346435546875, 3.465728759765625, 3.58502197265625, 3.704315185546875, 3.8236083984375, 3.942901611328125, 4.06219482421875, 4.181488037109375, 4.30078125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 9.0, 14.0, 11.0, 31.0, 38.0, 61.0, 94.0, 122.0, 257.0, 324.0, 561.0, 787.0, 667.0, 381.0, 246.0, 151.0, 96.0, 68.0, 50.0, 35.0, 17.0, 16.0, 12.0, 11.0, 3.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0078125, -2.881103515625, -2.75439453125, -2.627685546875, -2.5009765625, -2.374267578125, -2.24755859375, -2.120849609375, -1.994140625, -1.867431640625, -1.74072265625, -1.614013671875, -1.4873046875, -1.360595703125, -1.23388671875, -1.107177734375, -0.98046875, -0.853759765625, -0.72705078125, -0.600341796875, -0.4736328125, -0.346923828125, -0.22021484375, -0.093505859375, 0.033203125, 0.159912109375, 0.28662109375, 0.413330078125, 0.5400390625, 0.666748046875, 0.79345703125, 0.920166015625, 1.046875, 1.173583984375, 1.30029296875, 1.427001953125, 1.5537109375, 1.680419921875, 1.80712890625, 1.933837890625, 2.060546875, 2.187255859375, 2.31396484375, 2.440673828125, 2.5673828125, 2.694091796875, 2.82080078125, 2.947509765625, 3.07421875, 3.200927734375, 3.32763671875, 3.454345703125, 3.5810546875, 3.707763671875, 3.83447265625, 3.961181640625, 4.087890625, 4.214599609375, 4.34130859375, 4.468017578125, 4.5947265625, 4.721435546875, 4.84814453125, 4.974853515625, 5.1015625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 10.0, 8.0, 13.0, 8.0, 19.0, 22.0, 35.0, 52.0, 85.0, 157.0, 266.0, 482.0, 1150.0, 2622.0, 6755.0, 19859.0, 72274.0, 384999.0, 3129320.0, 460608.0, 80633.0, 22228.0, 7368.0, 2809.0, 1243.0, 544.0, 277.0, 155.0, 87.0, 65.0, 29.0, 24.0, 16.0, 20.0, 6.0, 6.0, 7.0, 4.0, 4.0, 7.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.296875, -6.0682373046875, -5.839599609375, -5.6109619140625, -5.38232421875, -5.1536865234375, -4.925048828125, -4.6964111328125, -4.4677734375, -4.2391357421875, -4.010498046875, -3.7818603515625, -3.55322265625, -3.3245849609375, -3.095947265625, -2.8673095703125, -2.638671875, -2.4100341796875, -2.181396484375, -1.9527587890625, -1.72412109375, -1.4954833984375, -1.266845703125, -1.0382080078125, -0.8095703125, -0.5809326171875, -0.352294921875, -0.1236572265625, 0.10498046875, 0.3336181640625, 0.562255859375, 0.7908935546875, 1.01953125, 1.2481689453125, 1.476806640625, 1.7054443359375, 1.93408203125, 2.1627197265625, 2.391357421875, 2.6199951171875, 2.8486328125, 3.0772705078125, 3.305908203125, 3.5345458984375, 3.76318359375, 3.9918212890625, 4.220458984375, 4.4490966796875, 4.677734375, 4.9063720703125, 5.135009765625, 5.3636474609375, 5.59228515625, 5.8209228515625, 6.049560546875, 6.2781982421875, 6.5068359375, 6.7354736328125, 6.964111328125, 7.1927490234375, 7.42138671875, 7.6500244140625, 7.878662109375, 8.1072998046875, 8.3359375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 13.0, 16.0, 37.0, 55.0, 117.0, 153.0, 199.0, 168.0, 113.0, 58.0, 43.0, 20.0, 12.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.814542770385742, -17.848920822143555, -16.883298873901367, -15.917675971984863, -14.95205307006836, -13.986431121826172, -13.020809173583984, -12.055187225341797, -11.089564323425293, -10.123942375183105, -9.158319473266602, -8.192697525024414, -7.227075099945068, -6.261452674865723, -5.295830726623535, -4.3302083015441895, -3.3645858764648438, -2.398963451385498, -1.4333412647247314, -0.46771907806396484, 0.49790334701538086, 1.4635257720947266, 2.429147720336914, 3.3947701454162598, 4.3603925704956055, 5.326014995574951, 6.291637420654297, 7.257259368896484, 8.222881317138672, 9.188504219055176, 10.154126167297363, 11.119749069213867, 12.085372924804688, 13.050994873046875, 14.016617774963379, 14.982239723205566, 15.94786262512207, 16.913484573364258, 17.879106521606445, 18.844728469848633, 19.810352325439453, 20.77597427368164, 21.741596221923828, 22.707218170166016, 23.672842025756836, 24.638463973999023, 25.60408592224121, 26.5697078704834, 27.535329818725586, 28.500951766967773, 29.46657371520996, 30.43219757080078, 31.39781951904297, 32.363441467285156, 33.329063415527344, 34.29468536376953, 35.26030731201172, 36.225929260253906, 37.191551208496094, 38.15717315673828, 39.12279510498047, 40.088417053222656, 41.054039001464844, 42.0196647644043, 42.985286712646484]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 7.0, 2.0, 6.0, 6.0, 7.0, 10.0, 14.0, 16.0, 16.0, 18.0, 16.0, 39.0, 35.0, 30.0, 34.0, 34.0, 39.0, 31.0, 50.0, 42.0, 35.0, 41.0, 40.0, 41.0, 52.0, 31.0, 27.0, 42.0, 34.0, 20.0, 32.0, 21.0, 18.0, 19.0, 17.0, 18.0, 22.0, 9.0, 7.0, 7.0, 8.0, 3.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.781227111816406, -9.474494934082031, -9.167762756347656, -8.861030578613281, -8.554298400878906, -8.247566223144531, -7.9408345222473145, -7.6341023445129395, -7.3273701667785645, -7.0206379890441895, -6.7139058113098145, -6.4071736335754395, -6.100441932678223, -5.793709754943848, -5.486977577209473, -5.180245399475098, -4.873513221740723, -4.566781044006348, -4.260048866271973, -3.9533169269561768, -3.6465847492218018, -3.3398525714874268, -3.033120632171631, -2.726388454437256, -2.419656276702881, -2.112924098968506, -1.8061920404434204, -1.499459981918335, -1.19272780418396, -0.885995626449585, -0.5792635679244995, -0.27253150939941406, 0.034201622009277344, 0.34093374013900757, 0.6476658582687378, 0.954397976398468, 1.2611300945281982, 1.5678622722625732, 1.8745943307876587, 2.181326389312744, 2.488058567047119, 2.794790744781494, 3.101522922515869, 3.408254861831665, 3.71498703956604, 4.021718978881836, 4.328451156616211, 4.635183334350586, 4.941915512084961, 5.248647689819336, 5.555379867553711, 5.862112045288086, 6.168844223022461, 6.475576400756836, 6.782308101654053, 7.089040279388428, 7.395772457122803, 7.702504634857178, 8.009236335754395, 8.31596851348877, 8.622700691223145, 8.92943286895752, 9.236165046691895, 9.54289722442627, 9.849629402160645]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 6.0, 3.0, 6.0, 9.0, 6.0, 12.0, 13.0, 12.0, 15.0, 9.0, 22.0, 28.0, 22.0, 19.0, 19.0, 34.0, 26.0, 34.0, 45.0, 36.0, 37.0, 35.0, 48.0, 36.0, 38.0, 33.0, 38.0, 30.0, 37.0, 27.0, 30.0, 28.0, 40.0, 32.0, 24.0, 17.0, 20.0, 10.0, 10.0, 12.0, 8.0, 10.0, 4.0, 5.0, 3.0, 0.0, 6.0, 1.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.7724609375, -0.7477188110351562, -0.7229766845703125, -0.6982345581054688, -0.673492431640625, -0.6487503051757812, -0.6240081787109375, -0.5992660522460938, -0.57452392578125, -0.5497817993164062, -0.5250396728515625, -0.5002975463867188, -0.475555419921875, -0.45081329345703125, -0.4260711669921875, -0.40132904052734375, -0.3765869140625, -0.35184478759765625, -0.3271026611328125, -0.30236053466796875, -0.277618408203125, -0.25287628173828125, -0.2281341552734375, -0.20339202880859375, -0.17864990234375, -0.15390777587890625, -0.1291656494140625, -0.10442352294921875, -0.079681396484375, -0.05493927001953125, -0.0301971435546875, -0.00545501708984375, 0.019287109375, 0.04402923583984375, 0.0687713623046875, 0.09351348876953125, 0.118255615234375, 0.14299774169921875, 0.1677398681640625, 0.19248199462890625, 0.21722412109375, 0.24196624755859375, 0.2667083740234375, 0.29145050048828125, 0.316192626953125, 0.34093475341796875, 0.3656768798828125, 0.39041900634765625, 0.4151611328125, 0.43990325927734375, 0.4646453857421875, 0.48938751220703125, 0.514129638671875, 0.5388717651367188, 0.5636138916015625, 0.5883560180664062, 0.61309814453125, 0.6378402709960938, 0.6625823974609375, 0.6873245239257812, 0.712066650390625, 0.7368087768554688, 0.7615509033203125, 0.7862930297851562, 0.81103515625]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 10.0, 18.0, 20.0, 34.0, 53.0, 75.0, 117.0, 138.0, 269.0, 430.0, 554.0, 834.0, 1140.0, 1906.0, 2767.0, 4152.0, 6600.0, 9787.0, 14657.0, 22331.0, 34758.0, 55688.0, 91763.0, 156959.0, 228679.0, 160945.0, 94393.0, 56510.0, 35379.0, 23127.0, 15244.0, 9866.0, 6470.0, 4266.0, 2836.0, 1920.0, 1291.0, 852.0, 568.0, 380.0, 245.0, 196.0, 113.0, 74.0, 59.0, 32.0, 18.0, 13.0, 7.0, 3.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0], "bins": [-2.7890625, -2.70330810546875, -2.6175537109375, -2.53179931640625, -2.446044921875, -2.36029052734375, -2.2745361328125, -2.18878173828125, -2.10302734375, -2.01727294921875, -1.9315185546875, -1.84576416015625, -1.760009765625, -1.67425537109375, -1.5885009765625, -1.50274658203125, -1.4169921875, -1.33123779296875, -1.2454833984375, -1.15972900390625, -1.073974609375, -0.98822021484375, -0.9024658203125, -0.81671142578125, -0.73095703125, -0.64520263671875, -0.5594482421875, -0.47369384765625, -0.387939453125, -0.30218505859375, -0.2164306640625, -0.13067626953125, -0.044921875, 0.04083251953125, 0.1265869140625, 0.21234130859375, 0.298095703125, 0.38385009765625, 0.4696044921875, 0.55535888671875, 0.64111328125, 0.72686767578125, 0.8126220703125, 0.89837646484375, 0.984130859375, 1.06988525390625, 1.1556396484375, 1.24139404296875, 1.3271484375, 1.41290283203125, 1.4986572265625, 1.58441162109375, 1.670166015625, 1.75592041015625, 1.8416748046875, 1.92742919921875, 2.01318359375, 2.09893798828125, 2.1846923828125, 2.27044677734375, 2.356201171875, 2.44195556640625, 2.5277099609375, 2.61346435546875, 2.69921875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 2.0, 3.0, 6.0, 5.0, 6.0, 12.0, 4.0, 11.0, 14.0, 18.0, 15.0, 16.0, 19.0, 29.0, 31.0, 26.0, 26.0, 31.0, 31.0, 33.0, 27.0, 39.0, 28.0, 1063.0, 47.0, 51.0, 56.0, 47.0, 38.0, 35.0, 29.0, 19.0, 24.0, 31.0, 17.0, 28.0, 16.0, 14.0, 15.0, 7.0, 10.0, 10.0, 12.0, 5.0, 5.0, 11.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.62060546875, -0.600372314453125, -0.58013916015625, -0.559906005859375, -0.5396728515625, -0.519439697265625, -0.49920654296875, -0.478973388671875, -0.458740234375, -0.438507080078125, -0.41827392578125, -0.398040771484375, -0.3778076171875, -0.357574462890625, -0.33734130859375, -0.317108154296875, -0.296875, -0.276641845703125, -0.25640869140625, -0.236175537109375, -0.2159423828125, -0.195709228515625, -0.17547607421875, -0.155242919921875, -0.135009765625, -0.114776611328125, -0.09454345703125, -0.074310302734375, -0.0540771484375, -0.033843994140625, -0.01361083984375, 0.006622314453125, 0.02685546875, 0.047088623046875, 0.06732177734375, 0.087554931640625, 0.1077880859375, 0.128021240234375, 0.14825439453125, 0.168487548828125, 0.188720703125, 0.208953857421875, 0.22918701171875, 0.249420166015625, 0.2696533203125, 0.289886474609375, 0.31011962890625, 0.330352783203125, 0.3505859375, 0.370819091796875, 0.39105224609375, 0.411285400390625, 0.4315185546875, 0.451751708984375, 0.47198486328125, 0.492218017578125, 0.512451171875, 0.532684326171875, 0.55291748046875, 0.573150634765625, 0.5933837890625, 0.613616943359375, 0.63385009765625, 0.654083251953125, 0.67431640625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 9.0, 4.0, 4.0, 13.0, 19.0, 32.0, 42.0, 59.0, 82.0, 117.0, 161.0, 227.0, 320.0, 491.0, 753.0, 1160.0, 1765.0, 2754.0, 4571.0, 7679.0, 13571.0, 24801.0, 48625.0, 107707.0, 320197.0, 1102061.0, 266242.0, 95312.0, 44309.0, 22593.0, 12629.0, 7031.0, 4220.0, 2602.0, 1594.0, 1116.0, 729.0, 483.0, 279.0, 210.0, 149.0, 113.0, 96.0, 51.0, 49.0, 36.0, 26.0, 24.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-2.2578125, -2.190277099609375, -2.12274169921875, -2.055206298828125, -1.9876708984375, -1.920135498046875, -1.85260009765625, -1.785064697265625, -1.717529296875, -1.649993896484375, -1.58245849609375, -1.514923095703125, -1.4473876953125, -1.379852294921875, -1.31231689453125, -1.244781494140625, -1.17724609375, -1.109710693359375, -1.04217529296875, -0.974639892578125, -0.9071044921875, -0.839569091796875, -0.77203369140625, -0.704498291015625, -0.636962890625, -0.569427490234375, -0.50189208984375, -0.434356689453125, -0.3668212890625, -0.299285888671875, -0.23175048828125, -0.164215087890625, -0.0966796875, -0.029144287109375, 0.03839111328125, 0.105926513671875, 0.1734619140625, 0.240997314453125, 0.30853271484375, 0.376068115234375, 0.443603515625, 0.511138916015625, 0.57867431640625, 0.646209716796875, 0.7137451171875, 0.781280517578125, 0.84881591796875, 0.916351318359375, 0.98388671875, 1.051422119140625, 1.11895751953125, 1.186492919921875, 1.2540283203125, 1.321563720703125, 1.38909912109375, 1.456634521484375, 1.524169921875, 1.591705322265625, 1.65924072265625, 1.726776123046875, 1.7943115234375, 1.861846923828125, 1.92938232421875, 1.996917724609375, 2.064453125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 6.0, 5.0, 10.0, 23.0, 33.0, 107.0, 151.0, 264.0, 155.0, 93.0, 54.0, 29.0, 25.0, 11.0, 9.0, 7.0, 6.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.076171875, -1.02642822265625, -0.9766845703125, -0.92694091796875, -0.877197265625, -0.82745361328125, -0.7777099609375, -0.72796630859375, -0.67822265625, -0.62847900390625, -0.5787353515625, -0.52899169921875, -0.479248046875, -0.42950439453125, -0.3797607421875, -0.33001708984375, -0.2802734375, -0.23052978515625, -0.1807861328125, -0.13104248046875, -0.081298828125, -0.03155517578125, 0.0181884765625, 0.06793212890625, 0.11767578125, 0.16741943359375, 0.2171630859375, 0.26690673828125, 0.316650390625, 0.36639404296875, 0.4161376953125, 0.46588134765625, 0.515625, 0.56536865234375, 0.6151123046875, 0.66485595703125, 0.714599609375, 0.76434326171875, 0.8140869140625, 0.86383056640625, 0.91357421875, 0.96331787109375, 1.0130615234375, 1.06280517578125, 1.112548828125, 1.16229248046875, 1.2120361328125, 1.26177978515625, 1.3115234375, 1.36126708984375, 1.4110107421875, 1.46075439453125, 1.510498046875, 1.56024169921875, 1.6099853515625, 1.65972900390625, 1.70947265625, 1.75921630859375, 1.8089599609375, 1.85870361328125, 1.908447265625, 1.95819091796875, 2.0079345703125, 2.05767822265625, 2.107421875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 5.0, 8.0, 9.0, 10.0, 18.0, 28.0, 65.0, 154.0, 666.0, 4964.0, 875411.0, 163401.0, 3034.0, 493.0, 118.0, 65.0, 34.0, 25.0, 9.0, 11.0, 4.0, 6.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.453125, -22.76123046875, -22.0693359375, -21.37744140625, -20.685546875, -19.99365234375, -19.3017578125, -18.60986328125, -17.91796875, -17.22607421875, -16.5341796875, -15.84228515625, -15.150390625, -14.45849609375, -13.7666015625, -13.07470703125, -12.3828125, -11.69091796875, -10.9990234375, -10.30712890625, -9.615234375, -8.92333984375, -8.2314453125, -7.53955078125, -6.84765625, -6.15576171875, -5.4638671875, -4.77197265625, -4.080078125, -3.38818359375, -2.6962890625, -2.00439453125, -1.3125, -0.62060546875, 0.0712890625, 0.76318359375, 1.455078125, 2.14697265625, 2.8388671875, 3.53076171875, 4.22265625, 4.91455078125, 5.6064453125, 6.29833984375, 6.990234375, 7.68212890625, 8.3740234375, 9.06591796875, 9.7578125, 10.44970703125, 11.1416015625, 11.83349609375, 12.525390625, 13.21728515625, 13.9091796875, 14.60107421875, 15.29296875, 15.98486328125, 16.6767578125, 17.36865234375, 18.060546875, 18.75244140625, 19.4443359375, 20.13623046875, 20.828125]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 14.0, 64.0, 190.0, 377.0, 231.0, 108.0, 17.0, 11.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.457576751708984, -9.274275779724121, -9.090975761413574, -8.907674789428711, -8.724373817443848, -8.5410737991333, -8.357772827148438, -8.174471855163574, -7.991171360015869, -7.807870864868164, -7.624569892883301, -7.441269397735596, -7.257968902587891, -7.074667930603027, -6.891367435455322, -6.708066940307617, -6.524765968322754, -6.341465473175049, -6.1581645011901855, -5.9748640060424805, -5.791563034057617, -5.608262538909912, -5.424962043762207, -5.241661071777344, -5.058360576629639, -4.875060081481934, -4.69175910949707, -4.508458614349365, -4.32515811920166, -4.141857147216797, -3.958556652069092, -3.7752559185028076, -3.5919549465179443, -3.40865421295166, -3.225353717803955, -3.042052984237671, -2.8587522506713867, -2.6754515171051025, -2.4921507835388184, -2.3088502883911133, -2.125549554824829, -1.942248821258545, -1.7589482069015503, -1.5756475925445557, -1.3923468589782715, -1.2090461254119873, -1.0257455110549927, -0.842444896697998, -0.6591441631317139, -0.47584348917007446, -0.29254281520843506, -0.10924214124679565, 0.07405853271484375, 0.25735920667648315, 0.44065988063812256, 0.6239604949951172, 0.8072612285614014, 0.9905619025230408, 1.1738625764846802, 1.3571631908416748, 1.540463924407959, 1.7237646579742432, 1.9070652723312378, 2.0903658866882324, 2.2736666202545166]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 10.0, 8.0, 17.0, 14.0, 17.0, 20.0, 28.0, 18.0, 18.0, 28.0, 33.0, 24.0, 33.0, 30.0, 43.0, 56.0, 35.0, 44.0, 38.0, 35.0, 41.0, 30.0, 30.0, 39.0, 38.0, 41.0, 34.0, 35.0, 35.0, 27.0, 17.0, 19.0, 11.0, 11.0, 6.0, 2.0, 6.0, 8.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-1.038132667541504, -1.0074701309204102, -0.9768075346946716, -0.9461449384689331, -0.9154824018478394, -0.8848198652267456, -0.8541572690010071, -0.8234946727752686, -0.7928321361541748, -0.762169599533081, -0.7315070033073425, -0.700844407081604, -0.6701818704605103, -0.6395193338394165, -0.608856737613678, -0.5781941413879395, -0.5475316047668457, -0.516869068145752, -0.4862064719200134, -0.4555439054965973, -0.42488133907318115, -0.394218772649765, -0.3635562062263489, -0.33289363980293274, -0.3022310733795166, -0.27156850695610046, -0.24090594053268433, -0.2102433741092682, -0.17958080768585205, -0.1489182412624359, -0.11825567483901978, -0.08759310841560364, -0.056930601596832275, -0.026268035173416138, 0.00439453125, 0.03505709767341614, 0.06571966409683228, 0.09638223052024841, 0.12704479694366455, 0.1577073633670807, 0.18836992979049683, 0.21903249621391296, 0.2496950626373291, 0.28035762906074524, 0.3110201954841614, 0.3416827619075775, 0.37234532833099365, 0.4030078947544098, 0.4336704611778259, 0.46433302760124207, 0.4949955940246582, 0.525658130645752, 0.5563207268714905, 0.586983323097229, 0.6176458597183228, 0.6483083963394165, 0.678970992565155, 0.7096335887908936, 0.7402961254119873, 0.770958662033081, 0.8016212582588196, 0.8322838544845581, 0.8629463911056519, 0.8936089277267456, 0.9242715239524841]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 8.0, 4.0, 9.0, 11.0, 15.0, 13.0, 13.0, 12.0, 23.0, 22.0, 26.0, 19.0, 30.0, 30.0, 28.0, 34.0, 49.0, 32.0, 38.0, 31.0, 41.0, 35.0, 41.0, 31.0, 38.0, 31.0, 41.0, 26.0, 31.0, 33.0, 36.0, 26.0, 19.0, 19.0, 20.0, 15.0, 7.0, 11.0, 9.0, 9.0, 3.0, 6.0, 3.0, 0.0, 4.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.76611328125, -0.7414016723632812, -0.7166900634765625, -0.6919784545898438, -0.667266845703125, -0.6425552368164062, -0.6178436279296875, -0.5931320190429688, -0.56842041015625, -0.5437088012695312, -0.5189971923828125, -0.49428558349609375, -0.469573974609375, -0.44486236572265625, -0.4201507568359375, -0.39543914794921875, -0.3707275390625, -0.34601593017578125, -0.3213043212890625, -0.29659271240234375, -0.271881103515625, -0.24716949462890625, -0.2224578857421875, -0.19774627685546875, -0.17303466796875, -0.14832305908203125, -0.1236114501953125, -0.09889984130859375, -0.074188232421875, -0.04947662353515625, -0.0247650146484375, -5.340576171875e-05, 0.024658203125, 0.04936981201171875, 0.0740814208984375, 0.09879302978515625, 0.123504638671875, 0.14821624755859375, 0.1729278564453125, 0.19763946533203125, 0.22235107421875, 0.24706268310546875, 0.2717742919921875, 0.29648590087890625, 0.321197509765625, 0.34590911865234375, 0.3706207275390625, 0.39533233642578125, 0.4200439453125, 0.44475555419921875, 0.4694671630859375, 0.49417877197265625, 0.518890380859375, 0.5436019897460938, 0.5683135986328125, 0.5930252075195312, 0.61773681640625, 0.6424484252929688, 0.6671600341796875, 0.6918716430664062, 0.716583251953125, 0.7412948608398438, 0.7660064697265625, 0.7907180786132812, 0.8154296875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 8.0, 11.0, 16.0, 24.0, 29.0, 41.0, 55.0, 81.0, 83.0, 137.0, 216.0, 282.0, 371.0, 501.0, 728.0, 1039.0, 1498.0, 2260.0, 3628.0, 6185.0, 12063.0, 28260.0, 129242.0, 667712.0, 135480.0, 29222.0, 12123.0, 6245.0, 3603.0, 2247.0, 1545.0, 1001.0, 669.0, 534.0, 393.0, 278.0, 199.0, 179.0, 102.0, 80.0, 53.0, 36.0, 19.0, 30.0, 14.0, 9.0, 13.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0], "bins": [-2.830078125, -2.740264892578125, -2.65045166015625, -2.560638427734375, -2.4708251953125, -2.381011962890625, -2.29119873046875, -2.201385498046875, -2.111572265625, -2.021759033203125, -1.93194580078125, -1.842132568359375, -1.7523193359375, -1.662506103515625, -1.57269287109375, -1.482879638671875, -1.39306640625, -1.303253173828125, -1.21343994140625, -1.123626708984375, -1.0338134765625, -0.944000244140625, -0.85418701171875, -0.764373779296875, -0.674560546875, -0.584747314453125, -0.49493408203125, -0.405120849609375, -0.3153076171875, -0.225494384765625, -0.13568115234375, -0.045867919921875, 0.0439453125, 0.133758544921875, 0.22357177734375, 0.313385009765625, 0.4031982421875, 0.493011474609375, 0.58282470703125, 0.672637939453125, 0.762451171875, 0.852264404296875, 0.94207763671875, 1.031890869140625, 1.1217041015625, 1.211517333984375, 1.30133056640625, 1.391143798828125, 1.48095703125, 1.570770263671875, 1.66058349609375, 1.750396728515625, 1.8402099609375, 1.930023193359375, 2.01983642578125, 2.109649658203125, 2.199462890625, 2.289276123046875, 2.37908935546875, 2.468902587890625, 2.5587158203125, 2.648529052734375, 2.73834228515625, 2.828155517578125, 2.91796875]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 8.0, 8.0, 15.0, 11.0, 13.0, 22.0, 19.0, 23.0, 28.0, 30.0, 30.0, 31.0, 46.0, 58.0, 62.0, 77.0, 127.0, 251.0, 1408.0, 199.0, 114.0, 81.0, 57.0, 54.0, 42.0, 40.0, 27.0, 32.0, 33.0, 21.0, 20.0, 16.0, 10.0, 10.0, 3.0, 9.0, 8.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.69140625, -3.574127197265625, -3.45684814453125, -3.339569091796875, -3.2222900390625, -3.105010986328125, -2.98773193359375, -2.870452880859375, -2.753173828125, -2.635894775390625, -2.51861572265625, -2.401336669921875, -2.2840576171875, -2.166778564453125, -2.04949951171875, -1.932220458984375, -1.81494140625, -1.697662353515625, -1.58038330078125, -1.463104248046875, -1.3458251953125, -1.228546142578125, -1.11126708984375, -0.993988037109375, -0.876708984375, -0.759429931640625, -0.64215087890625, -0.524871826171875, -0.4075927734375, -0.290313720703125, -0.17303466796875, -0.055755615234375, 0.0615234375, 0.178802490234375, 0.29608154296875, 0.413360595703125, 0.5306396484375, 0.647918701171875, 0.76519775390625, 0.882476806640625, 0.999755859375, 1.117034912109375, 1.23431396484375, 1.351593017578125, 1.4688720703125, 1.586151123046875, 1.70343017578125, 1.820709228515625, 1.93798828125, 2.055267333984375, 2.17254638671875, 2.289825439453125, 2.4071044921875, 2.524383544921875, 2.64166259765625, 2.758941650390625, 2.876220703125, 2.993499755859375, 3.11077880859375, 3.228057861328125, 3.3453369140625, 3.462615966796875, 3.57989501953125, 3.697174072265625, 3.814453125]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 9.0, 10.0, 18.0, 19.0, 43.0, 37.0, 73.0, 97.0, 140.0, 218.0, 379.0, 569.0, 1095.0, 1953.0, 4045.0, 9220.0, 24761.0, 88527.0, 1171492.0, 1693709.0, 102491.0, 27370.0, 10276.0, 4261.0, 2211.0, 1054.0, 595.0, 352.0, 216.0, 140.0, 98.0, 60.0, 43.0, 35.0, 20.0, 14.0, 20.0, 7.0, 10.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.21875, -5.0506591796875, -4.882568359375, -4.7144775390625, -4.54638671875, -4.3782958984375, -4.210205078125, -4.0421142578125, -3.8740234375, -3.7059326171875, -3.537841796875, -3.3697509765625, -3.20166015625, -3.0335693359375, -2.865478515625, -2.6973876953125, -2.529296875, -2.3612060546875, -2.193115234375, -2.0250244140625, -1.85693359375, -1.6888427734375, -1.520751953125, -1.3526611328125, -1.1845703125, -1.0164794921875, -0.848388671875, -0.6802978515625, -0.51220703125, -0.3441162109375, -0.176025390625, -0.0079345703125, 0.16015625, 0.3282470703125, 0.496337890625, 0.6644287109375, 0.83251953125, 1.0006103515625, 1.168701171875, 1.3367919921875, 1.5048828125, 1.6729736328125, 1.841064453125, 2.0091552734375, 2.17724609375, 2.3453369140625, 2.513427734375, 2.6815185546875, 2.849609375, 3.0177001953125, 3.185791015625, 3.3538818359375, 3.52197265625, 3.6900634765625, 3.858154296875, 4.0262451171875, 4.1943359375, 4.3624267578125, 4.530517578125, 4.6986083984375, 4.86669921875, 5.0347900390625, 5.202880859375, 5.3709716796875, 5.5390625]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 35.0, 96.0, 262.0, 379.0, 171.0, 46.0, 23.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.553394317626953, -26.373926162719727, -25.1944580078125, -24.014991760253906, -22.83552360534668, -21.656055450439453, -20.47658920288086, -19.297121047973633, -18.117652893066406, -16.93818473815918, -15.75871753692627, -14.57925033569336, -13.399782180786133, -12.220314025878906, -11.040846824645996, -9.861379623413086, -8.68191146850586, -7.502443790435791, -6.322976112365723, -5.143508434295654, -3.964040756225586, -2.7845730781555176, -1.6051054000854492, -0.42563819885253906, 0.7538299560546875, 1.9332976341247559, 3.112765312194824, 4.292232990264893, 5.471700668334961, 6.651168346405029, 7.830636024475098, 9.010103225708008, 10.1895751953125, 11.369043350219727, 12.548510551452637, 13.727977752685547, 14.907445907592773, 16.0869140625, 17.266380310058594, 18.44584846496582, 19.625316619873047, 20.804784774780273, 21.9842529296875, 23.163719177246094, 24.34318733215332, 25.522655487060547, 26.70212173461914, 27.881589889526367, 29.061058044433594, 30.24052619934082, 31.419994354248047, 32.59946060180664, 33.7789306640625, 34.958396911621094, 36.13786315917969, 37.31732940673828, 38.49679946899414, 39.676265716552734, 40.855735778808594, 42.03520202636719, 43.21466827392578, 44.39413833618164, 45.573604583740234, 46.753074645996094, 47.93254089355469]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 11.0, 8.0, 11.0, 10.0, 19.0, 14.0, 22.0, 16.0, 25.0, 34.0, 35.0, 36.0, 36.0, 34.0, 46.0, 46.0, 32.0, 43.0, 33.0, 41.0, 45.0, 36.0, 39.0, 43.0, 33.0, 35.0, 33.0, 31.0, 26.0, 19.0, 25.0, 17.0, 14.0, 3.0, 13.0, 9.0, 13.0, 6.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.737288475036621, -12.349093437194824, -11.960899353027344, -11.572704315185547, -11.18450927734375, -10.796314239501953, -10.408120155334473, -10.019925117492676, -9.631731033325195, -9.243535995483398, -8.855341911315918, -8.467146873474121, -8.078951835632324, -7.6907572746276855, -7.302562713623047, -6.91436767578125, -6.526172637939453, -6.1379780769348145, -5.749783039093018, -5.361588478088379, -4.973393440246582, -4.585198879241943, -4.197004318237305, -3.808809518814087, -3.420614719390869, -3.0324199199676514, -2.6442251205444336, -2.256030559539795, -1.8678357601165771, -1.4796409606933594, -1.0914463996887207, -0.7032516002655029, -0.31505584716796875, 0.07313889265060425, 0.46133363246917725, 0.8495283126831055, 1.2377231121063232, 1.625917911529541, 2.0141124725341797, 2.4023072719573975, 2.7905020713806152, 3.178696870803833, 3.566891670227051, 3.9550862312316895, 4.343280792236328, 4.731475830078125, 5.119670391082764, 5.507864952087402, 5.896059989929199, 6.284254550933838, 6.672449588775635, 7.060644149780273, 7.44883918762207, 7.837033748626709, 8.225228309631348, 8.613423347473145, 9.001617431640625, 9.389812469482422, 9.778006553649902, 10.1662015914917, 10.554396629333496, 10.942590713500977, 11.330785751342773, 11.71898078918457, 12.107175827026367]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 6.0, 2.0, 3.0, 8.0, 11.0, 8.0, 9.0, 9.0, 16.0, 8.0, 12.0, 26.0, 23.0, 25.0, 27.0, 29.0, 30.0, 32.0, 39.0, 36.0, 43.0, 34.0, 41.0, 41.0, 36.0, 32.0, 36.0, 39.0, 33.0, 29.0, 46.0, 33.0, 28.0, 26.0, 28.0, 16.0, 16.0, 16.0, 13.0, 12.0, 8.0, 8.0, 7.0, 9.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.8642578125, -0.8368911743164062, -0.8095245361328125, -0.7821578979492188, -0.754791259765625, -0.7274246215820312, -0.7000579833984375, -0.6726913452148438, -0.64532470703125, -0.6179580688476562, -0.5905914306640625, -0.5632247924804688, -0.535858154296875, -0.5084915161132812, -0.4811248779296875, -0.45375823974609375, -0.4263916015625, -0.39902496337890625, -0.3716583251953125, -0.34429168701171875, -0.316925048828125, -0.28955841064453125, -0.2621917724609375, -0.23482513427734375, -0.20745849609375, -0.18009185791015625, -0.1527252197265625, -0.12535858154296875, -0.097991943359375, -0.07062530517578125, -0.0432586669921875, -0.01589202880859375, 0.011474609375, 0.03884124755859375, 0.0662078857421875, 0.09357452392578125, 0.120941162109375, 0.14830780029296875, 0.1756744384765625, 0.20304107666015625, 0.23040771484375, 0.25777435302734375, 0.2851409912109375, 0.31250762939453125, 0.339874267578125, 0.36724090576171875, 0.3946075439453125, 0.42197418212890625, 0.4493408203125, 0.47670745849609375, 0.5040740966796875, 0.5314407348632812, 0.558807373046875, 0.5861740112304688, 0.6135406494140625, 0.6409072875976562, 0.66827392578125, 0.6956405639648438, 0.7230072021484375, 0.7503738403320312, 0.777740478515625, 0.8051071166992188, 0.8324737548828125, 0.8598403930664062, 0.88720703125]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 9.0, 10.0, 16.0, 22.0, 35.0, 32.0, 40.0, 90.0, 142.0, 217.0, 370.0, 547.0, 918.0, 1552.0, 2798.0, 5545.0, 11840.0, 27093.0, 73640.0, 341739.0, 2848924.0, 713744.0, 102784.0, 34034.0, 14046.0, 6333.0, 3223.0, 1830.0, 1060.0, 573.0, 346.0, 229.0, 159.0, 111.0, 73.0, 50.0, 27.0, 24.0, 15.0, 17.0, 7.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.947265625, -2.85107421875, -2.7548828125, -2.65869140625, -2.5625, -2.46630859375, -2.3701171875, -2.27392578125, -2.177734375, -2.08154296875, -1.9853515625, -1.88916015625, -1.79296875, -1.69677734375, -1.6005859375, -1.50439453125, -1.408203125, -1.31201171875, -1.2158203125, -1.11962890625, -1.0234375, -0.92724609375, -0.8310546875, -0.73486328125, -0.638671875, -0.54248046875, -0.4462890625, -0.35009765625, -0.25390625, -0.15771484375, -0.0615234375, 0.03466796875, 0.130859375, 0.22705078125, 0.3232421875, 0.41943359375, 0.515625, 0.61181640625, 0.7080078125, 0.80419921875, 0.900390625, 0.99658203125, 1.0927734375, 1.18896484375, 1.28515625, 1.38134765625, 1.4775390625, 1.57373046875, 1.669921875, 1.76611328125, 1.8623046875, 1.95849609375, 2.0546875, 2.15087890625, 2.2470703125, 2.34326171875, 2.439453125, 2.53564453125, 2.6318359375, 2.72802734375, 2.82421875, 2.92041015625, 3.0166015625, 3.11279296875, 3.208984375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 13.0, 22.0, 36.0, 55.0, 111.0, 174.0, 312.0, 569.0, 973.0, 780.0, 440.0, 229.0, 120.0, 97.0, 55.0, 35.0, 20.0, 12.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.96484375, -5.8026123046875, -5.640380859375, -5.4781494140625, -5.31591796875, -5.1536865234375, -4.991455078125, -4.8292236328125, -4.6669921875, -4.5047607421875, -4.342529296875, -4.1802978515625, -4.01806640625, -3.8558349609375, -3.693603515625, -3.5313720703125, -3.369140625, -3.2069091796875, -3.044677734375, -2.8824462890625, -2.72021484375, -2.5579833984375, -2.395751953125, -2.2335205078125, -2.0712890625, -1.9090576171875, -1.746826171875, -1.5845947265625, -1.42236328125, -1.2601318359375, -1.097900390625, -0.9356689453125, -0.7734375, -0.6112060546875, -0.448974609375, -0.2867431640625, -0.12451171875, 0.0377197265625, 0.199951171875, 0.3621826171875, 0.5244140625, 0.6866455078125, 0.848876953125, 1.0111083984375, 1.17333984375, 1.3355712890625, 1.497802734375, 1.6600341796875, 1.822265625, 1.9844970703125, 2.146728515625, 2.3089599609375, 2.47119140625, 2.6334228515625, 2.795654296875, 2.9578857421875, 3.1201171875, 3.2823486328125, 3.444580078125, 3.6068115234375, 3.76904296875, 3.9312744140625, 4.093505859375, 4.2557373046875, 4.41796875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 0.0, 4.0, 1.0, 4.0, 7.0, 9.0, 4.0, 23.0, 19.0, 28.0, 39.0, 58.0, 77.0, 90.0, 154.0, 301.0, 544.0, 1256.0, 3162.0, 8739.0, 29905.0, 141362.0, 1785206.0, 2024314.0, 151994.0, 31821.0, 9224.0, 3201.0, 1308.0, 591.0, 292.0, 173.0, 112.0, 79.0, 67.0, 28.0, 25.0, 18.0, 15.0, 15.0, 8.0, 10.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.14453125, -5.90838623046875, -5.6722412109375, -5.43609619140625, -5.199951171875, -4.96380615234375, -4.7276611328125, -4.49151611328125, -4.25537109375, -4.01922607421875, -3.7830810546875, -3.54693603515625, -3.310791015625, -3.07464599609375, -2.8385009765625, -2.60235595703125, -2.3662109375, -2.13006591796875, -1.8939208984375, -1.65777587890625, -1.421630859375, -1.18548583984375, -0.9493408203125, -0.71319580078125, -0.47705078125, -0.24090576171875, -0.0047607421875, 0.23138427734375, 0.467529296875, 0.70367431640625, 0.9398193359375, 1.17596435546875, 1.412109375, 1.64825439453125, 1.8843994140625, 2.12054443359375, 2.356689453125, 2.59283447265625, 2.8289794921875, 3.06512451171875, 3.30126953125, 3.53741455078125, 3.7735595703125, 4.00970458984375, 4.245849609375, 4.48199462890625, 4.7181396484375, 4.95428466796875, 5.1904296875, 5.42657470703125, 5.6627197265625, 5.89886474609375, 6.135009765625, 6.37115478515625, 6.6072998046875, 6.84344482421875, 7.07958984375, 7.31573486328125, 7.5518798828125, 7.78802490234375, 8.024169921875, 8.26031494140625, 8.4964599609375, 8.73260498046875, 8.96875]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 4.0, 6.0, 6.0, 15.0, 21.0, 24.0, 47.0, 67.0, 99.0, 111.0, 145.0, 118.0, 105.0, 77.0, 51.0, 35.0, 35.0, 19.0, 9.0, 9.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.36395263671875, -28.690937042236328, -28.01792335510254, -27.344907760620117, -26.671894073486328, -25.998878479003906, -25.325862884521484, -24.652847290039062, -23.979833602905273, -23.30681800842285, -22.633804321289062, -21.96078872680664, -21.28777313232422, -20.61475944519043, -19.941743850708008, -19.26873016357422, -18.595714569091797, -17.922698974609375, -17.249685287475586, -16.576669692993164, -15.903655052185059, -15.230640411376953, -14.557624816894531, -13.884610176086426, -13.21159553527832, -12.538580894470215, -11.86556625366211, -11.192550659179688, -10.519536018371582, -9.846521377563477, -9.173505783081055, -8.50049114227295, -7.827476501464844, -7.154461860656738, -6.481446743011475, -5.808431625366211, -5.1354169845581055, -4.46240234375, -3.7893872261047363, -3.1163721084594727, -2.443357467651367, -1.7703425884246826, -1.097327709197998, -0.4243128299713135, 0.2487020492553711, 0.9217169284820557, 1.5947318077087402, 2.267746925354004, 2.9407615661621094, 3.613776445388794, 4.2867913246154785, 4.959806442260742, 5.632821083068848, 6.305835723876953, 6.978850841522217, 7.6518659591674805, 8.324880599975586, 8.997895240783691, 9.670909881591797, 10.343925476074219, 11.016940116882324, 11.68995475769043, 12.362970352172852, 13.035984992980957, 13.708999633789062]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 1.0, 6.0, 8.0, 14.0, 9.0, 6.0, 17.0, 19.0, 17.0, 21.0, 26.0, 27.0, 23.0, 29.0, 36.0, 29.0, 40.0, 40.0, 34.0, 50.0, 39.0, 39.0, 32.0, 49.0, 31.0, 31.0, 35.0, 44.0, 23.0, 33.0, 28.0, 21.0, 22.0, 17.0, 16.0, 18.0, 8.0, 13.0, 15.0, 9.0, 7.0, 8.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.047755241394043, -8.756363868713379, -8.464972496032715, -8.17358112335205, -7.882190227508545, -7.590798854827881, -7.299407958984375, -7.008016586303711, -6.716625213623047, -6.425233840942383, -6.133842468261719, -5.842451572418213, -5.551060199737549, -5.259668827056885, -4.968277931213379, -4.676886558532715, -4.385495185852051, -4.094103813171387, -3.8027126789093018, -3.511321544647217, -3.2199301719665527, -2.9285387992858887, -2.6371476650238037, -2.3457565307617188, -2.0543651580810547, -1.7629739046096802, -1.4715826511383057, -1.1801913976669312, -0.8888001441955566, -0.5974088907241821, -0.3060176372528076, -0.014626502990722656, 0.2767648696899414, 0.5681561231613159, 0.8595473766326904, 1.150938630104065, 1.4423298835754395, 1.733721137046814, 2.0251123905181885, 2.3165035247802734, 2.6078948974609375, 2.8992862701416016, 3.1906774044036865, 3.4820685386657715, 3.7734599113464355, 4.0648512840271, 4.3562421798706055, 4.6476335525512695, 4.939024925231934, 5.230416297912598, 5.521807670593262, 5.813198566436768, 6.104589939117432, 6.395981311798096, 6.687372207641602, 6.978763580322266, 7.27015495300293, 7.561546325683594, 7.852937698364258, 8.144329071044922, 8.435720443725586, 8.727110862731934, 9.018502235412598, 9.309893608093262, 9.601284980773926]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 6.0, 7.0, 6.0, 10.0, 11.0, 17.0, 19.0, 18.0, 14.0, 20.0, 27.0, 26.0, 37.0, 29.0, 32.0, 36.0, 36.0, 53.0, 43.0, 30.0, 50.0, 38.0, 51.0, 33.0, 31.0, 42.0, 38.0, 32.0, 35.0, 25.0, 22.0, 20.0, 23.0, 9.0, 13.0, 14.0, 14.0, 4.0, 8.0, 9.0, 1.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87109375, -0.8402252197265625, -0.809356689453125, -0.7784881591796875, -0.74761962890625, -0.7167510986328125, -0.685882568359375, -0.6550140380859375, -0.6241455078125, -0.5932769775390625, -0.562408447265625, -0.5315399169921875, -0.50067138671875, -0.4698028564453125, -0.438934326171875, -0.4080657958984375, -0.377197265625, -0.3463287353515625, -0.315460205078125, -0.2845916748046875, -0.25372314453125, -0.2228546142578125, -0.191986083984375, -0.1611175537109375, -0.1302490234375, -0.0993804931640625, -0.068511962890625, -0.0376434326171875, -0.00677490234375, 0.0240936279296875, 0.054962158203125, 0.0858306884765625, 0.11669921875, 0.1475677490234375, 0.178436279296875, 0.2093048095703125, 0.24017333984375, 0.2710418701171875, 0.301910400390625, 0.3327789306640625, 0.3636474609375, 0.3945159912109375, 0.425384521484375, 0.4562530517578125, 0.48712158203125, 0.5179901123046875, 0.548858642578125, 0.5797271728515625, 0.610595703125, 0.6414642333984375, 0.672332763671875, 0.7032012939453125, 0.73406982421875, 0.7649383544921875, 0.795806884765625, 0.8266754150390625, 0.8575439453125, 0.8884124755859375, 0.919281005859375, 0.9501495361328125, 0.98101806640625, 1.0118865966796875, 1.042755126953125, 1.0736236572265625, 1.1044921875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 5.0, 13.0, 11.0, 19.0, 21.0, 38.0, 69.0, 89.0, 127.0, 183.0, 264.0, 391.0, 644.0, 980.0, 1543.0, 2451.0, 4098.0, 6702.0, 11214.0, 18741.0, 32265.0, 57030.0, 103490.0, 190893.0, 256939.0, 158749.0, 85993.0, 47802.0, 27010.0, 16090.0, 9544.0, 5632.0, 3501.0, 2210.0, 1325.0, 811.0, 570.0, 359.0, 229.0, 147.0, 117.0, 86.0, 56.0, 35.0, 19.0, 12.0, 10.0, 11.0, 5.0, 8.0, 4.0, 3.0, 3.0, 0.0, 1.0], "bins": [-3.75, -3.637542724609375, -3.52508544921875, -3.412628173828125, -3.3001708984375, -3.187713623046875, -3.07525634765625, -2.962799072265625, -2.850341796875, -2.737884521484375, -2.62542724609375, -2.512969970703125, -2.4005126953125, -2.288055419921875, -2.17559814453125, -2.063140869140625, -1.95068359375, -1.838226318359375, -1.72576904296875, -1.613311767578125, -1.5008544921875, -1.388397216796875, -1.27593994140625, -1.163482666015625, -1.051025390625, -0.938568115234375, -0.82611083984375, -0.713653564453125, -0.6011962890625, -0.488739013671875, -0.37628173828125, -0.263824462890625, -0.1513671875, -0.038909912109375, 0.07354736328125, 0.186004638671875, 0.2984619140625, 0.410919189453125, 0.52337646484375, 0.635833740234375, 0.748291015625, 0.860748291015625, 0.97320556640625, 1.085662841796875, 1.1981201171875, 1.310577392578125, 1.42303466796875, 1.535491943359375, 1.64794921875, 1.760406494140625, 1.87286376953125, 1.985321044921875, 2.0977783203125, 2.210235595703125, 2.32269287109375, 2.435150146484375, 2.547607421875, 2.660064697265625, 2.77252197265625, 2.884979248046875, 2.9974365234375, 3.109893798828125, 3.22235107421875, 3.334808349609375, 3.447265625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 4.0, 5.0, 4.0, 10.0, 11.0, 12.0, 21.0, 15.0, 31.0, 25.0, 28.0, 43.0, 29.0, 35.0, 29.0, 48.0, 40.0, 45.0, 54.0, 1057.0, 48.0, 42.0, 46.0, 35.0, 35.0, 36.0, 30.0, 40.0, 23.0, 25.0, 18.0, 21.0, 16.0, 13.0, 13.0, 13.0, 4.0, 7.0, 7.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.82470703125, -0.7993392944335938, -0.7739715576171875, -0.7486038208007812, -0.723236083984375, -0.6978683471679688, -0.6725006103515625, -0.6471328735351562, -0.62176513671875, -0.5963973999023438, -0.5710296630859375, -0.5456619262695312, -0.520294189453125, -0.49492645263671875, -0.4695587158203125, -0.44419097900390625, -0.4188232421875, -0.39345550537109375, -0.3680877685546875, -0.34272003173828125, -0.317352294921875, -0.29198455810546875, -0.2666168212890625, -0.24124908447265625, -0.21588134765625, -0.19051361083984375, -0.1651458740234375, -0.13977813720703125, -0.114410400390625, -0.08904266357421875, -0.0636749267578125, -0.03830718994140625, -0.012939453125, 0.01242828369140625, 0.0377960205078125, 0.06316375732421875, 0.088531494140625, 0.11389923095703125, 0.1392669677734375, 0.16463470458984375, 0.19000244140625, 0.21537017822265625, 0.2407379150390625, 0.26610565185546875, 0.291473388671875, 0.31684112548828125, 0.3422088623046875, 0.36757659912109375, 0.3929443359375, 0.41831207275390625, 0.4436798095703125, 0.46904754638671875, 0.494415283203125, 0.5197830200195312, 0.5451507568359375, 0.5705184936523438, 0.59588623046875, 0.6212539672851562, 0.6466217041015625, 0.6719894409179688, 0.697357177734375, 0.7227249145507812, 0.7480926513671875, 0.7734603881835938, 0.798828125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 5.0, 3.0, 2.0, 5.0, 4.0, 7.0, 16.0, 21.0, 25.0, 50.0, 67.0, 95.0, 121.0, 182.0, 268.0, 415.0, 647.0, 930.0, 1533.0, 2486.0, 4218.0, 7438.0, 13711.0, 28389.0, 64596.0, 183929.0, 1210545.0, 389969.0, 102708.0, 41602.0, 19302.0, 9791.0, 5445.0, 3146.0, 1889.0, 1247.0, 787.0, 502.0, 325.0, 222.0, 156.0, 83.0, 81.0, 56.0, 31.0, 31.0, 16.0, 15.0, 9.0, 4.0, 7.0, 4.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.595703125, -2.5084228515625, -2.421142578125, -2.3338623046875, -2.24658203125, -2.1593017578125, -2.072021484375, -1.9847412109375, -1.8974609375, -1.8101806640625, -1.722900390625, -1.6356201171875, -1.54833984375, -1.4610595703125, -1.373779296875, -1.2864990234375, -1.19921875, -1.1119384765625, -1.024658203125, -0.9373779296875, -0.85009765625, -0.7628173828125, -0.675537109375, -0.5882568359375, -0.5009765625, -0.4136962890625, -0.326416015625, -0.2391357421875, -0.15185546875, -0.0645751953125, 0.022705078125, 0.1099853515625, 0.197265625, 0.2845458984375, 0.371826171875, 0.4591064453125, 0.54638671875, 0.6336669921875, 0.720947265625, 0.8082275390625, 0.8955078125, 0.9827880859375, 1.070068359375, 1.1573486328125, 1.24462890625, 1.3319091796875, 1.419189453125, 1.5064697265625, 1.59375, 1.6810302734375, 1.768310546875, 1.8555908203125, 1.94287109375, 2.0301513671875, 2.117431640625, 2.2047119140625, 2.2919921875, 2.3792724609375, 2.466552734375, 2.5538330078125, 2.64111328125, 2.7283935546875, 2.815673828125, 2.9029541015625, 2.990234375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 3.0, 6.0, 11.0, 12.0, 10.0, 16.0, 28.0, 76.0, 161.0, 281.0, 185.0, 99.0, 34.0, 20.0, 15.0, 12.0, 8.0, 5.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.251953125, -1.208251953125, -1.16455078125, -1.120849609375, -1.0771484375, -1.033447265625, -0.98974609375, -0.946044921875, -0.90234375, -0.858642578125, -0.81494140625, -0.771240234375, -0.7275390625, -0.683837890625, -0.64013671875, -0.596435546875, -0.552734375, -0.509033203125, -0.46533203125, -0.421630859375, -0.3779296875, -0.334228515625, -0.29052734375, -0.246826171875, -0.203125, -0.159423828125, -0.11572265625, -0.072021484375, -0.0283203125, 0.015380859375, 0.05908203125, 0.102783203125, 0.146484375, 0.190185546875, 0.23388671875, 0.277587890625, 0.3212890625, 0.364990234375, 0.40869140625, 0.452392578125, 0.49609375, 0.539794921875, 0.58349609375, 0.627197265625, 0.6708984375, 0.714599609375, 0.75830078125, 0.802001953125, 0.845703125, 0.889404296875, 0.93310546875, 0.976806640625, 1.0205078125, 1.064208984375, 1.10791015625, 1.151611328125, 1.1953125, 1.239013671875, 1.28271484375, 1.326416015625, 1.3701171875, 1.413818359375, 1.45751953125, 1.501220703125, 1.544921875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 1.0, 6.0, 5.0, 4.0, 7.0, 12.0, 11.0, 18.0, 25.0, 32.0, 95.0, 355.0, 1957.0, 20597.0, 1003640.0, 19364.0, 1878.0, 311.0, 104.0, 39.0, 18.0, 13.0, 16.0, 10.0, 6.0, 2.0, 4.0, 6.0, 1.0, 3.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-20.5625, -19.96630859375, -19.3701171875, -18.77392578125, -18.177734375, -17.58154296875, -16.9853515625, -16.38916015625, -15.79296875, -15.19677734375, -14.6005859375, -14.00439453125, -13.408203125, -12.81201171875, -12.2158203125, -11.61962890625, -11.0234375, -10.42724609375, -9.8310546875, -9.23486328125, -8.638671875, -8.04248046875, -7.4462890625, -6.85009765625, -6.25390625, -5.65771484375, -5.0615234375, -4.46533203125, -3.869140625, -3.27294921875, -2.6767578125, -2.08056640625, -1.484375, -0.88818359375, -0.2919921875, 0.30419921875, 0.900390625, 1.49658203125, 2.0927734375, 2.68896484375, 3.28515625, 3.88134765625, 4.4775390625, 5.07373046875, 5.669921875, 6.26611328125, 6.8623046875, 7.45849609375, 8.0546875, 8.65087890625, 9.2470703125, 9.84326171875, 10.439453125, 11.03564453125, 11.6318359375, 12.22802734375, 12.82421875, 13.42041015625, 14.0166015625, 14.61279296875, 15.208984375, 15.80517578125, 16.4013671875, 16.99755859375, 17.59375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 13.0, 23.0, 36.0, 93.0, 154.0, 252.0, 208.0, 111.0, 44.0, 40.0, 12.0, 12.0, 0.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.595698833465576, -4.497329235076904, -4.398959159851074, -4.300589561462402, -4.202219486236572, -4.1038498878479, -4.00547981262207, -3.9071099758148193, -3.8087401390075684, -3.7103703022003174, -3.6120004653930664, -3.5136306285858154, -3.4152607917785645, -3.3168909549713135, -3.2185211181640625, -3.1201512813568115, -3.0217814445495605, -2.9234116077423096, -2.8250417709350586, -2.7266719341278076, -2.6283020973205566, -2.5299322605133057, -2.4315624237060547, -2.3331925868988037, -2.234822988510132, -2.136453151702881, -2.03808331489563, -1.939713478088379, -1.841343641281128, -1.742973804473877, -1.644603967666626, -1.546234130859375, -1.4478644132614136, -1.3494945764541626, -1.2511247396469116, -1.1527549028396606, -1.0543850660324097, -0.9560152292251587, -0.8576454520225525, -0.7592756152153015, -0.6609057784080505, -0.5625359416007996, -0.4641661047935486, -0.36579629778862, -0.267426460981369, -0.16905662417411804, -0.07068681716918945, 0.027683019638061523, 0.1260528564453125, 0.22442269325256348, 0.32279253005981445, 0.42116233706474304, 0.5195322036743164, 0.6179020404815674, 0.7162718176841736, 0.8146416544914246, 0.9130114912986755, 1.0113812685012817, 1.1097511053085327, 1.2081209421157837, 1.3064907789230347, 1.4048606157302856, 1.5032304525375366, 1.6016002893447876, 1.6999701261520386]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 6.0, 10.0, 17.0, 10.0, 16.0, 11.0, 20.0, 10.0, 18.0, 23.0, 13.0, 23.0, 29.0, 28.0, 29.0, 46.0, 31.0, 37.0, 44.0, 43.0, 43.0, 42.0, 42.0, 33.0, 39.0, 32.0, 33.0, 20.0, 41.0, 21.0, 29.0, 22.0, 25.0, 16.0, 15.0, 12.0, 12.0, 10.0, 6.0, 8.0, 8.0, 5.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.6772263646125793, -0.6555843949317932, -0.6339423656463623, -0.6123003959655762, -0.59065842628479, -0.5690164566040039, -0.547374427318573, -0.5257324576377869, -0.504090428352356, -0.48244842886924744, -0.4608064591884613, -0.4391644597053528, -0.41752249002456665, -0.39588049054145813, -0.3742384910583496, -0.3525965213775635, -0.33095455169677734, -0.3093125522136688, -0.2876705825328827, -0.26602858304977417, -0.24438659846782684, -0.22274461388587952, -0.201102614402771, -0.17946062982082367, -0.15781864523887634, -0.13617666065692902, -0.11453466862440109, -0.09289267659187317, -0.07125069200992584, -0.049608707427978516, -0.027966707944869995, -0.0063247233629226685, 0.015317261219024658, 0.03695924952626228, 0.05860123783349991, 0.08024322986602783, 0.10188521444797516, 0.12352719902992249, 0.145169198513031, 0.16681118309497833, 0.18845316767692566, 0.21009515225887299, 0.2317371368408203, 0.25337913632392883, 0.27502113580703735, 0.2966631054878235, 0.318305104970932, 0.3399471044540405, 0.36158907413482666, 0.3832310736179352, 0.4048730432987213, 0.42651504278182983, 0.44815701246261597, 0.4697990119457245, 0.491441011428833, 0.5130829811096191, 0.5347249507904053, 0.5563669204711914, 0.5780089497566223, 0.5996509194374084, 0.6212928891181946, 0.6429349184036255, 0.6645768880844116, 0.6862188577651978, 0.7078608870506287]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 5.0, 4.0, 6.0, 3.0, 9.0, 8.0, 13.0, 20.0, 15.0, 17.0, 21.0, 18.0, 24.0, 25.0, 29.0, 30.0, 34.0, 35.0, 52.0, 42.0, 39.0, 46.0, 35.0, 41.0, 48.0, 29.0, 36.0, 37.0, 42.0, 32.0, 36.0, 26.0, 21.0, 28.0, 17.0, 13.0, 13.0, 11.0, 12.0, 8.0, 7.0, 8.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87109375, -0.8402557373046875, -0.809417724609375, -0.7785797119140625, -0.74774169921875, -0.7169036865234375, -0.686065673828125, -0.6552276611328125, -0.6243896484375, -0.5935516357421875, -0.562713623046875, -0.5318756103515625, -0.50103759765625, -0.4701995849609375, -0.439361572265625, -0.4085235595703125, -0.377685546875, -0.3468475341796875, -0.316009521484375, -0.2851715087890625, -0.25433349609375, -0.2234954833984375, -0.192657470703125, -0.1618194580078125, -0.1309814453125, -0.1001434326171875, -0.069305419921875, -0.0384674072265625, -0.00762939453125, 0.0232086181640625, 0.054046630859375, 0.0848846435546875, 0.11572265625, 0.1465606689453125, 0.177398681640625, 0.2082366943359375, 0.23907470703125, 0.2699127197265625, 0.300750732421875, 0.3315887451171875, 0.3624267578125, 0.3932647705078125, 0.424102783203125, 0.4549407958984375, 0.48577880859375, 0.5166168212890625, 0.547454833984375, 0.5782928466796875, 0.609130859375, 0.6399688720703125, 0.670806884765625, 0.7016448974609375, 0.73248291015625, 0.7633209228515625, 0.794158935546875, 0.8249969482421875, 0.8558349609375, 0.8866729736328125, 0.917510986328125, 0.9483489990234375, 0.97918701171875, 1.0100250244140625, 1.040863037109375, 1.0717010498046875, 1.1025390625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 9.0, 5.0, 12.0, 10.0, 16.0, 27.0, 34.0, 50.0, 60.0, 102.0, 124.0, 164.0, 235.0, 323.0, 459.0, 549.0, 802.0, 1051.0, 1589.0, 2333.0, 3435.0, 5369.0, 8648.0, 15180.0, 28849.0, 61882.0, 154558.0, 334157.0, 241453.0, 94177.0, 40728.0, 20279.0, 11417.0, 6660.0, 4347.0, 2845.0, 1925.0, 1303.0, 969.0, 671.0, 461.0, 354.0, 237.0, 177.0, 149.0, 107.0, 79.0, 52.0, 36.0, 41.0, 19.0, 14.0, 11.0, 10.0, 8.0, 1.0, 3.0, 4.0, 0.0, 1.0], "bins": [-0.865234375, -0.8379745483398438, -0.8107147216796875, -0.7834548950195312, -0.756195068359375, -0.7289352416992188, -0.7016754150390625, -0.6744155883789062, -0.64715576171875, -0.6198959350585938, -0.5926361083984375, -0.5653762817382812, -0.538116455078125, -0.5108566284179688, -0.4835968017578125, -0.45633697509765625, -0.4290771484375, -0.40181732177734375, -0.3745574951171875, -0.34729766845703125, -0.320037841796875, -0.29277801513671875, -0.2655181884765625, -0.23825836181640625, -0.21099853515625, -0.18373870849609375, -0.1564788818359375, -0.12921905517578125, -0.101959228515625, -0.07469940185546875, -0.0474395751953125, -0.02017974853515625, 0.007080078125, 0.03433990478515625, 0.0615997314453125, 0.08885955810546875, 0.116119384765625, 0.14337921142578125, 0.1706390380859375, 0.19789886474609375, 0.22515869140625, 0.25241851806640625, 0.2796783447265625, 0.30693817138671875, 0.334197998046875, 0.36145782470703125, 0.3887176513671875, 0.41597747802734375, 0.4432373046875, 0.47049713134765625, 0.4977569580078125, 0.5250167846679688, 0.552276611328125, 0.5795364379882812, 0.6067962646484375, 0.6340560913085938, 0.66131591796875, 0.6885757446289062, 0.7158355712890625, 0.7430953979492188, 0.770355224609375, 0.7976150512695312, 0.8248748779296875, 0.8521347045898438, 0.87939453125]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 6.0, 3.0, 12.0, 10.0, 10.0, 17.0, 21.0, 24.0, 16.0, 26.0, 40.0, 35.0, 37.0, 67.0, 63.0, 101.0, 213.0, 1501.0, 283.0, 126.0, 76.0, 73.0, 38.0, 46.0, 37.0, 26.0, 33.0, 20.0, 15.0, 15.0, 16.0, 10.0, 11.0, 8.0, 3.0, 4.0, 4.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.984375, -4.8448486328125, -4.705322265625, -4.5657958984375, -4.42626953125, -4.2867431640625, -4.147216796875, -4.0076904296875, -3.8681640625, -3.7286376953125, -3.589111328125, -3.4495849609375, -3.31005859375, -3.1705322265625, -3.031005859375, -2.8914794921875, -2.751953125, -2.6124267578125, -2.472900390625, -2.3333740234375, -2.19384765625, -2.0543212890625, -1.914794921875, -1.7752685546875, -1.6357421875, -1.4962158203125, -1.356689453125, -1.2171630859375, -1.07763671875, -0.9381103515625, -0.798583984375, -0.6590576171875, -0.51953125, -0.3800048828125, -0.240478515625, -0.1009521484375, 0.03857421875, 0.1781005859375, 0.317626953125, 0.4571533203125, 0.5966796875, 0.7362060546875, 0.875732421875, 1.0152587890625, 1.15478515625, 1.2943115234375, 1.433837890625, 1.5733642578125, 1.712890625, 1.8524169921875, 1.991943359375, 2.1314697265625, 2.27099609375, 2.4105224609375, 2.550048828125, 2.6895751953125, 2.8291015625, 2.9686279296875, 3.108154296875, 3.2476806640625, 3.38720703125, 3.5267333984375, 3.666259765625, 3.8057861328125, 3.9453125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 11.0, 17.0, 17.0, 25.0, 25.0, 49.0, 67.0, 132.0, 189.0, 403.0, 934.0, 2409.0, 8421.0, 41428.0, 509847.0, 2442652.0, 114883.0, 17180.0, 4204.0, 1461.0, 613.0, 304.0, 154.0, 78.0, 59.0, 31.0, 26.0, 21.0, 19.0, 14.0, 7.0, 5.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.421875, -4.25958251953125, -4.0972900390625, -3.93499755859375, -3.772705078125, -3.61041259765625, -3.4481201171875, -3.28582763671875, -3.12353515625, -2.96124267578125, -2.7989501953125, -2.63665771484375, -2.474365234375, -2.31207275390625, -2.1497802734375, -1.98748779296875, -1.8251953125, -1.66290283203125, -1.5006103515625, -1.33831787109375, -1.176025390625, -1.01373291015625, -0.8514404296875, -0.68914794921875, -0.52685546875, -0.36456298828125, -0.2022705078125, -0.03997802734375, 0.122314453125, 0.28460693359375, 0.4468994140625, 0.60919189453125, 0.771484375, 0.93377685546875, 1.0960693359375, 1.25836181640625, 1.420654296875, 1.58294677734375, 1.7452392578125, 1.90753173828125, 2.06982421875, 2.23211669921875, 2.3944091796875, 2.55670166015625, 2.718994140625, 2.88128662109375, 3.0435791015625, 3.20587158203125, 3.3681640625, 3.53045654296875, 3.6927490234375, 3.85504150390625, 4.017333984375, 4.17962646484375, 4.3419189453125, 4.50421142578125, 4.66650390625, 4.82879638671875, 4.9910888671875, 5.15338134765625, 5.315673828125, 5.47796630859375, 5.6402587890625, 5.80255126953125, 5.96484375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 4.0, 46.0, 443.0, 463.0, 56.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.737066745758057, -4.308887004852295, -2.8807075023651123, -1.4525279998779297, -0.02434825897216797, 1.4038314819335938, 2.8320107460021973, 4.260190486907959, 5.688370227813721, 7.116549968719482, 8.544729232788086, 9.972908973693848, 11.40108871459961, 12.829268455505371, 14.257448196411133, 15.685626983642578, 17.113807678222656, 18.5419864654541, 19.97016716003418, 21.398345947265625, 22.826526641845703, 24.25470542907715, 25.682884216308594, 27.111064910888672, 28.539243698120117, 29.967422485351562, 31.39560317993164, 32.82378387451172, 34.25196075439453, 35.68014144897461, 37.10832214355469, 38.5364990234375, 39.96467971801758, 41.392860412597656, 42.82103729248047, 44.24921798706055, 45.677398681640625, 47.1055793762207, 48.533756256103516, 49.961936950683594, 51.39011764526367, 52.81829833984375, 54.24647521972656, 55.67465591430664, 57.10283660888672, 58.5310173034668, 59.95919418334961, 61.38737487792969, 62.8155517578125, 64.24372863769531, 65.67191314697266, 67.10009002685547, 68.52826690673828, 69.95645141601562, 71.38462829589844, 72.81280517578125, 74.2409896850586, 75.6691665649414, 77.09735107421875, 78.52552795410156, 79.95370483398438, 81.38188934326172, 82.81006622314453, 84.23825073242188, 85.66642761230469]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 5.0, 5.0, 4.0, 9.0, 5.0, 12.0, 9.0, 18.0, 9.0, 22.0, 21.0, 23.0, 30.0, 33.0, 28.0, 43.0, 43.0, 45.0, 45.0, 37.0, 49.0, 40.0, 41.0, 42.0, 39.0, 37.0, 40.0, 37.0, 21.0, 30.0, 26.0, 22.0, 22.0, 14.0, 20.0, 15.0, 6.0, 6.0, 9.0, 12.0, 7.0, 8.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.056938171386719, -11.679476737976074, -11.30201530456543, -10.924552917480469, -10.547091484069824, -10.16963005065918, -9.792167663574219, -9.414706230163574, -9.03724479675293, -8.659783363342285, -8.28232192993164, -7.90485954284668, -7.527398109436035, -7.149936676025391, -6.772474765777588, -6.395012855529785, -6.017551422119141, -5.640089988708496, -5.262628078460693, -4.885166168212891, -4.507704734802246, -4.130243301391602, -3.752781391143799, -3.375319719314575, -2.9978580474853516, -2.620396375656128, -2.2429347038269043, -1.8654730319976807, -1.488011360168457, -1.1105496883392334, -0.7330880165100098, -0.35562634468078613, 0.0218353271484375, 0.39929699897766113, 0.7767586708068848, 1.1542203426361084, 1.531682014465332, 1.9091436862945557, 2.2866053581237793, 2.664067029953003, 3.0415287017822266, 3.41899037361145, 3.796452045440674, 4.173913955688477, 4.551375389099121, 4.928836822509766, 5.306298732757568, 5.683760643005371, 6.061222076416016, 6.43868350982666, 6.816145420074463, 7.193607330322266, 7.57106876373291, 7.948530197143555, 8.325992584228516, 8.70345401763916, 9.080915451049805, 9.45837688446045, 9.835838317871094, 10.213300704956055, 10.5907621383667, 10.968223571777344, 11.345685958862305, 11.72314739227295, 12.100608825683594]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 9.0, 9.0, 9.0, 8.0, 20.0, 21.0, 17.0, 10.0, 27.0, 20.0, 22.0, 43.0, 20.0, 44.0, 27.0, 48.0, 50.0, 35.0, 45.0, 31.0, 38.0, 42.0, 45.0, 38.0, 31.0, 32.0, 29.0, 30.0, 34.0, 27.0, 27.0, 14.0, 20.0, 13.0, 6.0, 10.0, 13.0, 6.0, 8.0, 6.0, 4.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83837890625, -0.8076248168945312, -0.7768707275390625, -0.7461166381835938, -0.715362548828125, -0.6846084594726562, -0.6538543701171875, -0.6231002807617188, -0.59234619140625, -0.5615921020507812, -0.5308380126953125, -0.5000839233398438, -0.469329833984375, -0.43857574462890625, -0.4078216552734375, -0.37706756591796875, -0.3463134765625, -0.31555938720703125, -0.2848052978515625, -0.25405120849609375, -0.223297119140625, -0.19254302978515625, -0.1617889404296875, -0.13103485107421875, -0.10028076171875, -0.06952667236328125, -0.0387725830078125, -0.00801849365234375, 0.022735595703125, 0.05348968505859375, 0.0842437744140625, 0.11499786376953125, 0.145751953125, 0.17650604248046875, 0.2072601318359375, 0.23801422119140625, 0.268768310546875, 0.29952239990234375, 0.3302764892578125, 0.36103057861328125, 0.39178466796875, 0.42253875732421875, 0.4532928466796875, 0.48404693603515625, 0.514801025390625, 0.5455551147460938, 0.5763092041015625, 0.6070632934570312, 0.6378173828125, 0.6685714721679688, 0.6993255615234375, 0.7300796508789062, 0.760833740234375, 0.7915878295898438, 0.8223419189453125, 0.8530960083007812, 0.88385009765625, 0.9146041870117188, 0.9453582763671875, 0.9761123657226562, 1.006866455078125, 1.0376205444335938, 1.0683746337890625, 1.0991287231445312, 1.1298828125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 9.0, 5.0, 13.0, 4.0, 11.0, 24.0, 36.0, 38.0, 74.0, 77.0, 106.0, 219.0, 303.0, 539.0, 980.0, 1702.0, 3347.0, 7092.0, 15564.0, 37916.0, 115456.0, 910038.0, 2679458.0, 307520.0, 67610.0, 24471.0, 10697.0, 5012.0, 2560.0, 1379.0, 778.0, 445.0, 264.0, 193.0, 95.0, 81.0, 46.0, 36.0, 23.0, 13.0, 10.0, 13.0, 7.0, 6.0, 5.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.111328125, -3.017852783203125, -2.92437744140625, -2.830902099609375, -2.7374267578125, -2.643951416015625, -2.55047607421875, -2.457000732421875, -2.363525390625, -2.270050048828125, -2.17657470703125, -2.083099365234375, -1.9896240234375, -1.896148681640625, -1.80267333984375, -1.709197998046875, -1.61572265625, -1.522247314453125, -1.42877197265625, -1.335296630859375, -1.2418212890625, -1.148345947265625, -1.05487060546875, -0.961395263671875, -0.867919921875, -0.774444580078125, -0.68096923828125, -0.587493896484375, -0.4940185546875, -0.400543212890625, -0.30706787109375, -0.213592529296875, -0.1201171875, -0.026641845703125, 0.06683349609375, 0.160308837890625, 0.2537841796875, 0.347259521484375, 0.44073486328125, 0.534210205078125, 0.627685546875, 0.721160888671875, 0.81463623046875, 0.908111572265625, 1.0015869140625, 1.095062255859375, 1.18853759765625, 1.282012939453125, 1.37548828125, 1.468963623046875, 1.56243896484375, 1.655914306640625, 1.7493896484375, 1.842864990234375, 1.93634033203125, 2.029815673828125, 2.123291015625, 2.216766357421875, 2.31024169921875, 2.403717041015625, 2.4971923828125, 2.590667724609375, 2.68414306640625, 2.777618408203125, 2.87109375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 7.0, 12.0, 6.0, 11.0, 26.0, 29.0, 43.0, 49.0, 79.0, 103.0, 152.0, 221.0, 354.0, 600.0, 621.0, 580.0, 361.0, 242.0, 182.0, 102.0, 93.0, 63.0, 28.0, 42.0, 22.0, 13.0, 16.0, 6.0, 4.0, 6.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.021484375, -2.916107177734375, -2.81072998046875, -2.705352783203125, -2.5999755859375, -2.494598388671875, -2.38922119140625, -2.283843994140625, -2.178466796875, -2.073089599609375, -1.96771240234375, -1.862335205078125, -1.7569580078125, -1.651580810546875, -1.54620361328125, -1.440826416015625, -1.33544921875, -1.230072021484375, -1.12469482421875, -1.019317626953125, -0.9139404296875, -0.808563232421875, -0.70318603515625, -0.597808837890625, -0.492431640625, -0.387054443359375, -0.28167724609375, -0.176300048828125, -0.0709228515625, 0.034454345703125, 0.13983154296875, 0.245208740234375, 0.3505859375, 0.455963134765625, 0.56134033203125, 0.666717529296875, 0.7720947265625, 0.877471923828125, 0.98284912109375, 1.088226318359375, 1.193603515625, 1.298980712890625, 1.40435791015625, 1.509735107421875, 1.6151123046875, 1.720489501953125, 1.82586669921875, 1.931243896484375, 2.03662109375, 2.141998291015625, 2.24737548828125, 2.352752685546875, 2.4581298828125, 2.563507080078125, 2.66888427734375, 2.774261474609375, 2.879638671875, 2.985015869140625, 3.09039306640625, 3.195770263671875, 3.3011474609375, 3.406524658203125, 3.51190185546875, 3.617279052734375, 3.72265625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 5.0, 24.0, 50.0, 99.0, 269.0, 715.0, 2646.0, 12306.0, 86104.0, 2245075.0, 1756423.0, 75574.0, 11360.0, 2477.0, 729.0, 244.0, 98.0, 55.0, 25.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.921875, -13.6123046875, -13.302734375, -12.9931640625, -12.68359375, -12.3740234375, -12.064453125, -11.7548828125, -11.4453125, -11.1357421875, -10.826171875, -10.5166015625, -10.20703125, -9.8974609375, -9.587890625, -9.2783203125, -8.96875, -8.6591796875, -8.349609375, -8.0400390625, -7.73046875, -7.4208984375, -7.111328125, -6.8017578125, -6.4921875, -6.1826171875, -5.873046875, -5.5634765625, -5.25390625, -4.9443359375, -4.634765625, -4.3251953125, -4.015625, -3.7060546875, -3.396484375, -3.0869140625, -2.77734375, -2.4677734375, -2.158203125, -1.8486328125, -1.5390625, -1.2294921875, -0.919921875, -0.6103515625, -0.30078125, 0.0087890625, 0.318359375, 0.6279296875, 0.9375, 1.2470703125, 1.556640625, 1.8662109375, 2.17578125, 2.4853515625, 2.794921875, 3.1044921875, 3.4140625, 3.7236328125, 4.033203125, 4.3427734375, 4.65234375, 4.9619140625, 5.271484375, 5.5810546875, 5.890625]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [5.0, 4.0, 18.0, 25.0, 52.0, 77.0, 135.0, 202.0, 203.0, 146.0, 79.0, 36.0, 19.0, 11.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.895388126373291, -6.902324676513672, -5.909261226654053, -4.916197776794434, -3.9231345653533936, -2.9300713539123535, -1.9370079040527344, -0.9439444541931152, 0.049118995666503906, 1.042182445526123, 2.035245895385742, 3.0283091068267822, 4.0213727951049805, 5.014435768127441, 6.0074992179870605, 7.00056266784668, 7.993626117706299, 8.986689567565918, 9.979752540588379, 10.972816467285156, 11.965879440307617, 12.958942413330078, 13.952006340026855, 14.945070266723633, 15.938133239746094, 16.931196212768555, 17.924259185791016, 18.91732406616211, 19.91038703918457, 20.90345001220703, 21.896512985229492, 22.889575958251953, 23.882638931274414, 24.875701904296875, 25.868764877319336, 26.86182975769043, 27.85489273071289, 28.84795570373535, 29.841018676757812, 30.834083557128906, 31.827146530151367, 32.82020950317383, 33.81327438354492, 34.80633544921875, 35.799400329589844, 36.79246520996094, 37.785526275634766, 38.77859115600586, 39.77165222167969, 40.76471710205078, 41.75777816772461, 42.7508430480957, 43.74390411376953, 44.736968994140625, 45.73003387451172, 46.72309494018555, 47.71615982055664, 48.709224700927734, 49.70228576660156, 50.695350646972656, 51.688411712646484, 52.68147659301758, 53.67454147338867, 54.6676025390625, 55.660667419433594]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 6.0, 9.0, 3.0, 7.0, 20.0, 15.0, 20.0, 19.0, 26.0, 23.0, 32.0, 33.0, 32.0, 44.0, 44.0, 36.0, 47.0, 41.0, 45.0, 51.0, 46.0, 55.0, 37.0, 39.0, 39.0, 32.0, 35.0, 24.0, 23.0, 15.0, 21.0, 13.0, 15.0, 11.0, 8.0, 7.0, 2.0, 6.0, 6.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.95344066619873, -9.648839950561523, -9.34423828125, -9.039637565612793, -8.73503589630127, -8.430435180664062, -8.125833511352539, -7.821232795715332, -7.516631603240967, -7.212030410766602, -6.907429218292236, -6.602828025817871, -6.298227310180664, -5.993625640869141, -5.689024925231934, -5.384423732757568, -5.079822540283203, -4.775221347808838, -4.470620155334473, -4.166018962860107, -3.8614180088043213, -3.556816816329956, -3.25221586227417, -2.9476146697998047, -2.6430134773254395, -2.338412284851074, -2.033811092376709, -1.7292101383209229, -1.4246089458465576, -1.1200077533721924, -0.8154066801071167, -0.510805606842041, -0.20620441436767578, 0.09839671850204468, 0.40299785137176514, 0.7075989842414856, 1.012200117111206, 1.3168013095855713, 1.621402382850647, 1.9260034561157227, 2.230604648590088, 2.535205841064453, 2.8398070335388184, 3.1444079875946045, 3.4490091800689697, 3.753610372543335, 4.058211326599121, 4.362812519073486, 4.667413711547852, 4.972014904022217, 5.276616096496582, 5.581217288970947, 5.8858184814453125, 6.1904191970825195, 6.495020389556885, 6.79962158203125, 7.104222774505615, 7.4088239669799805, 7.713425159454346, 8.018026351928711, 8.322627067565918, 8.627228736877441, 8.931829452514648, 9.236431121826172, 9.541031837463379]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 5.0, 7.0, 9.0, 10.0, 16.0, 9.0, 18.0, 17.0, 32.0, 31.0, 27.0, 29.0, 33.0, 41.0, 46.0, 50.0, 45.0, 40.0, 31.0, 43.0, 43.0, 48.0, 41.0, 38.0, 41.0, 31.0, 35.0, 31.0, 29.0, 20.0, 17.0, 16.0, 11.0, 18.0, 11.0, 8.0, 7.0, 8.0, 6.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9775390625, -0.9438323974609375, -0.910125732421875, -0.8764190673828125, -0.84271240234375, -0.8090057373046875, -0.775299072265625, -0.7415924072265625, -0.7078857421875, -0.6741790771484375, -0.640472412109375, -0.6067657470703125, -0.57305908203125, -0.5393524169921875, -0.505645751953125, -0.4719390869140625, -0.438232421875, -0.4045257568359375, -0.370819091796875, -0.3371124267578125, -0.30340576171875, -0.2696990966796875, -0.235992431640625, -0.2022857666015625, -0.1685791015625, -0.1348724365234375, -0.101165771484375, -0.0674591064453125, -0.03375244140625, -4.57763671875e-05, 0.033660888671875, 0.0673675537109375, 0.10107421875, 0.1347808837890625, 0.168487548828125, 0.2021942138671875, 0.23590087890625, 0.2696075439453125, 0.303314208984375, 0.3370208740234375, 0.3707275390625, 0.4044342041015625, 0.438140869140625, 0.4718475341796875, 0.50555419921875, 0.5392608642578125, 0.572967529296875, 0.6066741943359375, 0.640380859375, 0.6740875244140625, 0.707794189453125, 0.7415008544921875, 0.77520751953125, 0.8089141845703125, 0.842620849609375, 0.8763275146484375, 0.9100341796875, 0.9437408447265625, 0.977447509765625, 1.0111541748046875, 1.04486083984375, 1.0785675048828125, 1.112274169921875, 1.1459808349609375, 1.1796875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 7.0, 4.0, 3.0, 11.0, 21.0, 25.0, 45.0, 71.0, 123.0, 166.0, 214.0, 375.0, 572.0, 842.0, 1301.0, 2027.0, 3173.0, 5164.0, 8275.0, 13794.0, 23253.0, 39616.0, 69716.0, 140090.0, 364449.0, 179005.0, 82529.0, 46035.0, 26361.0, 15904.0, 9433.0, 5781.0, 3688.0, 2295.0, 1448.0, 947.0, 608.0, 415.0, 256.0, 191.0, 109.0, 72.0, 48.0, 32.0, 22.0, 20.0, 8.0, 8.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.818359375, -2.73455810546875, -2.6507568359375, -2.56695556640625, -2.483154296875, -2.39935302734375, -2.3155517578125, -2.23175048828125, -2.14794921875, -2.06414794921875, -1.9803466796875, -1.89654541015625, -1.812744140625, -1.72894287109375, -1.6451416015625, -1.56134033203125, -1.4775390625, -1.39373779296875, -1.3099365234375, -1.22613525390625, -1.142333984375, -1.05853271484375, -0.9747314453125, -0.89093017578125, -0.80712890625, -0.72332763671875, -0.6395263671875, -0.55572509765625, -0.471923828125, -0.38812255859375, -0.3043212890625, -0.22052001953125, -0.13671875, -0.05291748046875, 0.0308837890625, 0.11468505859375, 0.198486328125, 0.28228759765625, 0.3660888671875, 0.44989013671875, 0.53369140625, 0.61749267578125, 0.7012939453125, 0.78509521484375, 0.868896484375, 0.95269775390625, 1.0364990234375, 1.12030029296875, 1.2041015625, 1.28790283203125, 1.3717041015625, 1.45550537109375, 1.539306640625, 1.62310791015625, 1.7069091796875, 1.79071044921875, 1.87451171875, 1.95831298828125, 2.0421142578125, 2.12591552734375, 2.209716796875, 2.29351806640625, 2.3773193359375, 2.46112060546875, 2.544921875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 1.0, 5.0, 4.0, 9.0, 11.0, 10.0, 9.0, 17.0, 13.0, 10.0, 17.0, 19.0, 28.0, 24.0, 30.0, 25.0, 31.0, 37.0, 34.0, 27.0, 33.0, 33.0, 37.0, 1072.0, 44.0, 42.0, 52.0, 38.0, 31.0, 30.0, 36.0, 21.0, 32.0, 24.0, 16.0, 25.0, 19.0, 19.0, 11.0, 8.0, 9.0, 8.0, 5.0, 2.0, 4.0, 2.0, 8.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.68603515625, -0.6640243530273438, -0.6420135498046875, -0.6200027465820312, -0.597991943359375, -0.5759811401367188, -0.5539703369140625, -0.5319595336914062, -0.50994873046875, -0.48793792724609375, -0.4659271240234375, -0.44391632080078125, -0.421905517578125, -0.39989471435546875, -0.3778839111328125, -0.35587310791015625, -0.3338623046875, -0.31185150146484375, -0.2898406982421875, -0.26782989501953125, -0.245819091796875, -0.22380828857421875, -0.2017974853515625, -0.17978668212890625, -0.15777587890625, -0.13576507568359375, -0.1137542724609375, -0.09174346923828125, -0.069732666015625, -0.04772186279296875, -0.0257110595703125, -0.00370025634765625, 0.018310546875, 0.04032135009765625, 0.0623321533203125, 0.08434295654296875, 0.106353759765625, 0.12836456298828125, 0.1503753662109375, 0.17238616943359375, 0.19439697265625, 0.21640777587890625, 0.2384185791015625, 0.26042938232421875, 0.282440185546875, 0.30445098876953125, 0.3264617919921875, 0.34847259521484375, 0.3704833984375, 0.39249420166015625, 0.4145050048828125, 0.43651580810546875, 0.458526611328125, 0.48053741455078125, 0.5025482177734375, 0.5245590209960938, 0.54656982421875, 0.5685806274414062, 0.5905914306640625, 0.6126022338867188, 0.634613037109375, 0.6566238403320312, 0.6786346435546875, 0.7006454467773438, 0.72265625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 9.0, 7.0, 11.0, 14.0, 19.0, 40.0, 52.0, 100.0, 151.0, 258.0, 438.0, 679.0, 1203.0, 2184.0, 3933.0, 7832.0, 16527.0, 39453.0, 115601.0, 1128049.0, 620478.0, 95626.0, 34350.0, 14637.0, 7044.0, 3719.0, 1969.0, 1102.0, 607.0, 389.0, 223.0, 147.0, 85.0, 58.0, 41.0, 27.0, 18.0, 20.0, 8.0, 9.0, 5.0, 3.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.681640625, -2.58892822265625, -2.4962158203125, -2.40350341796875, -2.310791015625, -2.21807861328125, -2.1253662109375, -2.03265380859375, -1.93994140625, -1.84722900390625, -1.7545166015625, -1.66180419921875, -1.569091796875, -1.47637939453125, -1.3836669921875, -1.29095458984375, -1.1982421875, -1.10552978515625, -1.0128173828125, -0.92010498046875, -0.827392578125, -0.73468017578125, -0.6419677734375, -0.54925537109375, -0.45654296875, -0.36383056640625, -0.2711181640625, -0.17840576171875, -0.085693359375, 0.00701904296875, 0.0997314453125, 0.19244384765625, 0.28515625, 0.37786865234375, 0.4705810546875, 0.56329345703125, 0.656005859375, 0.74871826171875, 0.8414306640625, 0.93414306640625, 1.02685546875, 1.11956787109375, 1.2122802734375, 1.30499267578125, 1.397705078125, 1.49041748046875, 1.5831298828125, 1.67584228515625, 1.7685546875, 1.86126708984375, 1.9539794921875, 2.04669189453125, 2.139404296875, 2.23211669921875, 2.3248291015625, 2.41754150390625, 2.51025390625, 2.60296630859375, 2.6956787109375, 2.78839111328125, 2.881103515625, 2.97381591796875, 3.0665283203125, 3.15924072265625, 3.251953125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 5.0, 2.0, 3.0, 0.0, 4.0, 3.0, 2.0, 4.0, 4.0, 6.0, 11.0, 11.0, 13.0, 27.0, 36.0, 36.0, 45.0, 102.0, 139.0, 198.0, 99.0, 60.0, 44.0, 29.0, 19.0, 18.0, 11.0, 10.0, 12.0, 7.0, 8.0, 5.0, 5.0, 6.0, 9.0, 0.0, 1.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-0.95068359375, -0.9220733642578125, -0.893463134765625, -0.8648529052734375, -0.83624267578125, -0.8076324462890625, -0.779022216796875, -0.7504119873046875, -0.7218017578125, -0.6931915283203125, -0.664581298828125, -0.6359710693359375, -0.60736083984375, -0.5787506103515625, -0.550140380859375, -0.5215301513671875, -0.492919921875, -0.4643096923828125, -0.435699462890625, -0.4070892333984375, -0.37847900390625, -0.3498687744140625, -0.321258544921875, -0.2926483154296875, -0.2640380859375, -0.2354278564453125, -0.206817626953125, -0.1782073974609375, -0.14959716796875, -0.1209869384765625, -0.092376708984375, -0.0637664794921875, -0.03515625, -0.0065460205078125, 0.022064208984375, 0.0506744384765625, 0.07928466796875, 0.1078948974609375, 0.136505126953125, 0.1651153564453125, 0.1937255859375, 0.2223358154296875, 0.250946044921875, 0.2795562744140625, 0.30816650390625, 0.3367767333984375, 0.365386962890625, 0.3939971923828125, 0.422607421875, 0.4512176513671875, 0.479827880859375, 0.5084381103515625, 0.53704833984375, 0.5656585693359375, 0.594268798828125, 0.6228790283203125, 0.6514892578125, 0.6800994873046875, 0.708709716796875, 0.7373199462890625, 0.76593017578125, 0.7945404052734375, 0.823150634765625, 0.8517608642578125, 0.88037109375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 7.0, 5.0, 6.0, 9.0, 14.0, 20.0, 18.0, 27.0, 43.0, 49.0, 63.0, 150.0, 267.0, 769.0, 2516.0, 12160.0, 223173.0, 785803.0, 18393.0, 3317.0, 908.0, 327.0, 159.0, 90.0, 57.0, 43.0, 48.0, 39.0, 22.0, 10.0, 10.0, 4.0, 12.0, 6.0, 6.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-12.59375, -12.2349853515625, -11.876220703125, -11.5174560546875, -11.15869140625, -10.7999267578125, -10.441162109375, -10.0823974609375, -9.7236328125, -9.3648681640625, -9.006103515625, -8.6473388671875, -8.28857421875, -7.9298095703125, -7.571044921875, -7.2122802734375, -6.853515625, -6.4947509765625, -6.135986328125, -5.7772216796875, -5.41845703125, -5.0596923828125, -4.700927734375, -4.3421630859375, -3.9833984375, -3.6246337890625, -3.265869140625, -2.9071044921875, -2.54833984375, -2.1895751953125, -1.830810546875, -1.4720458984375, -1.11328125, -0.7545166015625, -0.395751953125, -0.0369873046875, 0.32177734375, 0.6805419921875, 1.039306640625, 1.3980712890625, 1.7568359375, 2.1156005859375, 2.474365234375, 2.8331298828125, 3.19189453125, 3.5506591796875, 3.909423828125, 4.2681884765625, 4.626953125, 4.9857177734375, 5.344482421875, 5.7032470703125, 6.06201171875, 6.4207763671875, 6.779541015625, 7.1383056640625, 7.4970703125, 7.8558349609375, 8.214599609375, 8.5733642578125, 8.93212890625, 9.2908935546875, 9.649658203125, 10.0084228515625, 10.3671875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 4.0, 9.0, 16.0, 17.0, 40.0, 40.0, 59.0, 82.0, 125.0, 142.0, 131.0, 97.0, 70.0, 47.0, 36.0, 25.0, 20.0, 14.0, 7.0, 3.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8947878479957581, -0.8520907759666443, -0.8093937635421753, -0.7666966915130615, -0.7239996194839478, -0.681302547454834, -0.6386054754257202, -0.5959084630012512, -0.5532113909721375, -0.5105143189430237, -0.4678172767162323, -0.4251202344894409, -0.38242316246032715, -0.3397260904312134, -0.297029048204422, -0.2543320059776306, -0.21163493394851685, -0.16893787682056427, -0.1262408196926117, -0.08354376256465912, -0.04084670543670654, 0.0018503516912460327, 0.04454740881919861, 0.08724445104598999, 0.12994152307510376, 0.17263858020305634, 0.2153356373310089, 0.2580326795578003, 0.30072975158691406, 0.34342682361602783, 0.3861238658428192, 0.4288209080696106, 0.4715179204940796, 0.5142149925231934, 0.5569120645523071, 0.5996090769767761, 0.6423061490058899, 0.6850032210350037, 0.7277002334594727, 0.7703973054885864, 0.8130943775177002, 0.855791449546814, 0.8984885215759277, 0.9411855340003967, 0.9838826060295105, 1.0265796184539795, 1.0692766904830933, 1.111973762512207, 1.1546708345413208, 1.1973679065704346, 1.2400649785995483, 1.282762050628662, 1.3254590034484863, 1.3681560754776, 1.4108531475067139, 1.4535502195358276, 1.4962472915649414, 1.5389443635940552, 1.581641435623169, 1.6243385076522827, 1.6670355796813965, 1.7097325325012207, 1.7524296045303345, 1.7951266765594482, 1.837823748588562]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 2.0, 4.0, 2.0, 6.0, 5.0, 6.0, 4.0, 8.0, 10.0, 9.0, 9.0, 16.0, 14.0, 19.0, 11.0, 20.0, 24.0, 23.0, 38.0, 21.0, 37.0, 36.0, 37.0, 50.0, 43.0, 51.0, 35.0, 50.0, 30.0, 37.0, 50.0, 34.0, 27.0, 29.0, 29.0, 23.0, 21.0, 18.0, 18.0, 14.0, 14.0, 11.0, 12.0, 10.0, 13.0, 9.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6925222873687744, -0.6706942915916443, -0.6488662958145142, -0.6270382404327393, -0.6052102446556091, -0.583382248878479, -0.5615542531013489, -0.5397262573242188, -0.5178982019424438, -0.4960702061653137, -0.4742421805858612, -0.4524141848087311, -0.43058615922927856, -0.40875816345214844, -0.3869301676750183, -0.3651021420955658, -0.34327414631843567, -0.32144615054130554, -0.299618124961853, -0.2777901291847229, -0.2559621036052704, -0.23413410782814026, -0.21230609714984894, -0.19047808647155762, -0.1686500757932663, -0.14682206511497498, -0.12499405443668365, -0.10316605120897293, -0.08133804053068161, -0.05951002985239029, -0.037682026624679565, -0.015854015946388245, 0.005973994731903076, 0.027802003547549248, 0.04963001236319542, 0.07145801931619644, 0.09328602999448776, 0.11511404067277908, 0.1369420439004898, 0.15877005457878113, 0.18059806525707245, 0.20242607593536377, 0.2242540866136551, 0.2460820972919464, 0.26791009306907654, 0.28973811864852905, 0.3115661144256592, 0.3333941102027893, 0.3552221357822418, 0.37705013155937195, 0.39887815713882446, 0.4207061529159546, 0.4425341784954071, 0.46436217427253723, 0.48619019985198975, 0.5080181956291199, 0.52984619140625, 0.5516741871833801, 0.5735021829605103, 0.5953302383422852, 0.6171582341194153, 0.6389862298965454, 0.6608142256736755, 0.6826422214508057, 0.7044702768325806]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 4.0, 7.0, 5.0, 7.0, 11.0, 10.0, 14.0, 21.0, 9.0, 33.0, 31.0, 31.0, 27.0, 34.0, 28.0, 61.0, 44.0, 35.0, 55.0, 33.0, 42.0, 39.0, 46.0, 42.0, 45.0, 37.0, 25.0, 42.0, 37.0, 18.0, 30.0, 17.0, 17.0, 10.0, 14.0, 13.0, 4.0, 10.0, 10.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99267578125, -0.9586105346679688, -0.9245452880859375, -0.8904800415039062, -0.856414794921875, -0.8223495483398438, -0.7882843017578125, -0.7542190551757812, -0.72015380859375, -0.6860885620117188, -0.6520233154296875, -0.6179580688476562, -0.583892822265625, -0.5498275756835938, -0.5157623291015625, -0.48169708251953125, -0.4476318359375, -0.41356658935546875, -0.3795013427734375, -0.34543609619140625, -0.311370849609375, -0.27730560302734375, -0.2432403564453125, -0.20917510986328125, -0.17510986328125, -0.14104461669921875, -0.1069793701171875, -0.07291412353515625, -0.038848876953125, -0.00478363037109375, 0.0292816162109375, 0.06334686279296875, 0.097412109375, 0.13147735595703125, 0.1655426025390625, 0.19960784912109375, 0.233673095703125, 0.26773834228515625, 0.3018035888671875, 0.33586883544921875, 0.36993408203125, 0.40399932861328125, 0.4380645751953125, 0.47212982177734375, 0.506195068359375, 0.5402603149414062, 0.5743255615234375, 0.6083908081054688, 0.6424560546875, 0.6765213012695312, 0.7105865478515625, 0.7446517944335938, 0.778717041015625, 0.8127822875976562, 0.8468475341796875, 0.8809127807617188, 0.91497802734375, 0.9490432739257812, 0.9831085205078125, 1.0171737670898438, 1.051239013671875, 1.0853042602539062, 1.1193695068359375, 1.1534347534179688, 1.1875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 4.0, 8.0, 7.0, 12.0, 24.0, 26.0, 31.0, 41.0, 56.0, 84.0, 85.0, 162.0, 218.0, 303.0, 468.0, 738.0, 1095.0, 1741.0, 2922.0, 4912.0, 8835.0, 15827.0, 32265.0, 74845.0, 213557.0, 375299.0, 184704.0, 66382.0, 28918.0, 14543.0, 8081.0, 4717.0, 2819.0, 1651.0, 1054.0, 658.0, 451.0, 298.0, 200.0, 138.0, 100.0, 71.0, 42.0, 57.0, 19.0, 20.0, 17.0, 12.0, 9.0, 9.0, 6.0, 6.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.1904296875, -1.152557373046875, -1.11468505859375, -1.076812744140625, -1.0389404296875, -1.001068115234375, -0.96319580078125, -0.925323486328125, -0.887451171875, -0.849578857421875, -0.81170654296875, -0.773834228515625, -0.7359619140625, -0.698089599609375, -0.66021728515625, -0.622344970703125, -0.58447265625, -0.546600341796875, -0.50872802734375, -0.470855712890625, -0.4329833984375, -0.395111083984375, -0.35723876953125, -0.319366455078125, -0.281494140625, -0.243621826171875, -0.20574951171875, -0.167877197265625, -0.1300048828125, -0.092132568359375, -0.05426025390625, -0.016387939453125, 0.021484375, 0.059356689453125, 0.09722900390625, 0.135101318359375, 0.1729736328125, 0.210845947265625, 0.24871826171875, 0.286590576171875, 0.324462890625, 0.362335205078125, 0.40020751953125, 0.438079833984375, 0.4759521484375, 0.513824462890625, 0.55169677734375, 0.589569091796875, 0.62744140625, 0.665313720703125, 0.70318603515625, 0.741058349609375, 0.7789306640625, 0.816802978515625, 0.85467529296875, 0.892547607421875, 0.930419921875, 0.968292236328125, 1.00616455078125, 1.044036865234375, 1.0819091796875, 1.119781494140625, 1.15765380859375, 1.195526123046875, 1.2333984375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 4.0, 2.0, 4.0, 8.0, 7.0, 11.0, 15.0, 14.0, 16.0, 29.0, 20.0, 43.0, 36.0, 68.0, 61.0, 80.0, 169.0, 312.0, 1441.0, 187.0, 122.0, 93.0, 51.0, 55.0, 54.0, 41.0, 18.0, 22.0, 16.0, 24.0, 9.0, 10.0, 7.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.45703125, -5.28765869140625, -5.1182861328125, -4.94891357421875, -4.779541015625, -4.61016845703125, -4.4407958984375, -4.27142333984375, -4.10205078125, -3.93267822265625, -3.7633056640625, -3.59393310546875, -3.424560546875, -3.25518798828125, -3.0858154296875, -2.91644287109375, -2.7470703125, -2.57769775390625, -2.4083251953125, -2.23895263671875, -2.069580078125, -1.90020751953125, -1.7308349609375, -1.56146240234375, -1.39208984375, -1.22271728515625, -1.0533447265625, -0.88397216796875, -0.714599609375, -0.54522705078125, -0.3758544921875, -0.20648193359375, -0.037109375, 0.13226318359375, 0.3016357421875, 0.47100830078125, 0.640380859375, 0.80975341796875, 0.9791259765625, 1.14849853515625, 1.31787109375, 1.48724365234375, 1.6566162109375, 1.82598876953125, 1.995361328125, 2.16473388671875, 2.3341064453125, 2.50347900390625, 2.6728515625, 2.84222412109375, 3.0115966796875, 3.18096923828125, 3.350341796875, 3.51971435546875, 3.6890869140625, 3.85845947265625, 4.02783203125, 4.19720458984375, 4.3665771484375, 4.53594970703125, 4.705322265625, 4.87469482421875, 5.0440673828125, 5.21343994140625, 5.3828125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 11.0, 10.0, 13.0, 14.0, 21.0, 28.0, 60.0, 94.0, 156.0, 189.0, 283.0, 530.0, 821.0, 1443.0, 2889.0, 5796.0, 14743.0, 87286.0, 2821473.0, 176239.0, 19375.0, 6844.0, 3232.0, 1712.0, 917.0, 553.0, 340.0, 210.0, 127.0, 114.0, 63.0, 45.0, 20.0, 11.0, 15.0, 12.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-10.0703125, -9.761474609375, -9.45263671875, -9.143798828125, -8.8349609375, -8.526123046875, -8.21728515625, -7.908447265625, -7.599609375, -7.290771484375, -6.98193359375, -6.673095703125, -6.3642578125, -6.055419921875, -5.74658203125, -5.437744140625, -5.12890625, -4.820068359375, -4.51123046875, -4.202392578125, -3.8935546875, -3.584716796875, -3.27587890625, -2.967041015625, -2.658203125, -2.349365234375, -2.04052734375, -1.731689453125, -1.4228515625, -1.114013671875, -0.80517578125, -0.496337890625, -0.1875, 0.121337890625, 0.43017578125, 0.739013671875, 1.0478515625, 1.356689453125, 1.66552734375, 1.974365234375, 2.283203125, 2.592041015625, 2.90087890625, 3.209716796875, 3.5185546875, 3.827392578125, 4.13623046875, 4.445068359375, 4.75390625, 5.062744140625, 5.37158203125, 5.680419921875, 5.9892578125, 6.298095703125, 6.60693359375, 6.915771484375, 7.224609375, 7.533447265625, 7.84228515625, 8.151123046875, 8.4599609375, 8.768798828125, 9.07763671875, 9.386474609375, 9.6953125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 21.0, 95.0, 362.0, 351.0, 137.0, 36.0, 9.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.588401794433594, -44.868099212646484, -43.147796630859375, -41.427494049072266, -39.707191467285156, -37.98688888549805, -36.26658630371094, -34.54628372192383, -32.82598114013672, -31.10567855834961, -29.3853759765625, -27.66507339477539, -25.94477081298828, -24.224468231201172, -22.504165649414062, -20.783863067626953, -19.063560485839844, -17.343257904052734, -15.622955322265625, -13.902652740478516, -12.182350158691406, -10.462047576904297, -8.741744995117188, -7.021442413330078, -5.301139831542969, -3.5808372497558594, -1.86053466796875, -0.14023208618164062, 1.5800704956054688, 3.300373077392578, 5.0206756591796875, 6.740978240966797, 8.461284637451172, 10.181587219238281, 11.90188980102539, 13.6221923828125, 15.34249496459961, 17.06279754638672, 18.783100128173828, 20.503402709960938, 22.223705291748047, 23.944007873535156, 25.664310455322266, 27.384613037109375, 29.104915618896484, 30.825218200683594, 32.5455207824707, 34.26582336425781, 35.98612594604492, 37.70642852783203, 39.42673110961914, 41.14703369140625, 42.86733627319336, 44.58763885498047, 46.30794143676758, 48.02824401855469, 49.7485466003418, 51.468849182128906, 53.189151763916016, 54.909454345703125, 56.629756927490234, 58.350059509277344, 60.07036209106445, 61.79066467285156, 63.51096725463867]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 2.0, 0.0, 12.0, 10.0, 15.0, 15.0, 16.0, 15.0, 24.0, 28.0, 24.0, 29.0, 43.0, 43.0, 41.0, 37.0, 57.0, 55.0, 61.0, 50.0, 44.0, 47.0, 48.0, 45.0, 26.0, 41.0, 29.0, 31.0, 25.0, 19.0, 17.0, 15.0, 7.0, 11.0, 2.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.558062553405762, -14.09449291229248, -13.6309232711792, -13.167353630065918, -12.703784942626953, -12.240215301513672, -11.77664566040039, -11.31307601928711, -10.849506378173828, -10.385936737060547, -9.922367095947266, -9.458797454833984, -8.995227813720703, -8.531658172607422, -8.068089485168457, -7.604519844055176, -7.1409502029418945, -6.677380561828613, -6.213810920715332, -5.750241756439209, -5.286672115325928, -4.8231024742126465, -4.359533309936523, -3.895963668823242, -3.432394027709961, -2.9688243865966797, -2.5052549839019775, -2.0416855812072754, -1.5781159400939941, -1.114546298980713, -0.6509768962860107, -0.1874074935913086, 0.27616119384765625, 0.739730715751648, 1.2033002376556396, 1.6668697595596313, 2.130439281463623, 2.5940089225769043, 3.0575783252716064, 3.5211477279663086, 3.98471736907959, 4.448287010192871, 4.911856651306152, 5.375425815582275, 5.838995456695557, 6.302565097808838, 6.766134262084961, 7.229703903198242, 7.693273544311523, 8.156843185424805, 8.620412826538086, 9.083982467651367, 9.547552108764648, 10.01112174987793, 10.474690437316895, 10.938260078430176, 11.401829719543457, 11.865399360656738, 12.32896900177002, 12.7925386428833, 13.256107330322266, 13.719676971435547, 14.183246612548828, 14.64681625366211, 15.11038589477539]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 11.0, 13.0, 20.0, 20.0, 13.0, 15.0, 30.0, 28.0, 30.0, 29.0, 39.0, 42.0, 31.0, 36.0, 51.0, 45.0, 41.0, 59.0, 45.0, 38.0, 44.0, 43.0, 32.0, 38.0, 26.0, 30.0, 21.0, 20.0, 17.0, 19.0, 9.0, 13.0, 12.0, 7.0, 6.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1943359375, -1.158905029296875, -1.12347412109375, -1.088043212890625, -1.0526123046875, -1.017181396484375, -0.98175048828125, -0.946319580078125, -0.910888671875, -0.875457763671875, -0.84002685546875, -0.804595947265625, -0.7691650390625, -0.733734130859375, -0.69830322265625, -0.662872314453125, -0.62744140625, -0.592010498046875, -0.55657958984375, -0.521148681640625, -0.4857177734375, -0.450286865234375, -0.41485595703125, -0.379425048828125, -0.343994140625, -0.308563232421875, -0.27313232421875, -0.237701416015625, -0.2022705078125, -0.166839599609375, -0.13140869140625, -0.095977783203125, -0.060546875, -0.025115966796875, 0.01031494140625, 0.045745849609375, 0.0811767578125, 0.116607666015625, 0.15203857421875, 0.187469482421875, 0.222900390625, 0.258331298828125, 0.29376220703125, 0.329193115234375, 0.3646240234375, 0.400054931640625, 0.43548583984375, 0.470916748046875, 0.50634765625, 0.541778564453125, 0.57720947265625, 0.612640380859375, 0.6480712890625, 0.683502197265625, 0.71893310546875, 0.754364013671875, 0.789794921875, 0.825225830078125, 0.86065673828125, 0.896087646484375, 0.9315185546875, 0.966949462890625, 1.00238037109375, 1.037811279296875, 1.0732421875]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 5.0, 9.0, 11.0, 25.0, 29.0, 45.0, 65.0, 118.0, 168.0, 225.0, 415.0, 617.0, 1054.0, 1671.0, 2894.0, 5118.0, 9253.0, 17609.0, 36029.0, 82946.0, 277788.0, 1654207.0, 1672369.0, 274972.0, 81615.0, 35694.0, 17274.0, 9178.0, 4987.0, 3032.0, 1794.0, 1137.0, 700.0, 419.0, 292.0, 186.0, 126.0, 68.0, 42.0, 24.0, 19.0, 12.0, 8.0, 11.0, 8.0, 6.0, 3.0, 1.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.82421875, -1.751251220703125, -1.67828369140625, -1.605316162109375, -1.5323486328125, -1.459381103515625, -1.38641357421875, -1.313446044921875, -1.240478515625, -1.167510986328125, -1.09454345703125, -1.021575927734375, -0.9486083984375, -0.875640869140625, -0.80267333984375, -0.729705810546875, -0.65673828125, -0.583770751953125, -0.51080322265625, -0.437835693359375, -0.3648681640625, -0.291900634765625, -0.21893310546875, -0.145965576171875, -0.072998046875, -3.0517578125e-05, 0.07293701171875, 0.145904541015625, 0.2188720703125, 0.291839599609375, 0.36480712890625, 0.437774658203125, 0.5107421875, 0.583709716796875, 0.65667724609375, 0.729644775390625, 0.8026123046875, 0.875579833984375, 0.94854736328125, 1.021514892578125, 1.094482421875, 1.167449951171875, 1.24041748046875, 1.313385009765625, 1.3863525390625, 1.459320068359375, 1.53228759765625, 1.605255126953125, 1.67822265625, 1.751190185546875, 1.82415771484375, 1.897125244140625, 1.9700927734375, 2.043060302734375, 2.11602783203125, 2.188995361328125, 2.261962890625, 2.334930419921875, 2.40789794921875, 2.480865478515625, 2.5538330078125, 2.626800537109375, 2.69976806640625, 2.772735595703125, 2.845703125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 2.0, 4.0, 5.0, 5.0, 10.0, 7.0, 11.0, 26.0, 22.0, 23.0, 21.0, 34.0, 52.0, 63.0, 75.0, 98.0, 131.0, 172.0, 200.0, 270.0, 332.0, 429.0, 395.0, 331.0, 312.0, 222.0, 156.0, 119.0, 115.0, 95.0, 81.0, 49.0, 54.0, 34.0, 28.0, 22.0, 13.0, 11.0, 9.0, 8.0, 6.0, 7.0, 5.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-2.0078125, -1.9365234375, -1.865234375, -1.7939453125, -1.72265625, -1.6513671875, -1.580078125, -1.5087890625, -1.4375, -1.3662109375, -1.294921875, -1.2236328125, -1.15234375, -1.0810546875, -1.009765625, -0.9384765625, -0.8671875, -0.7958984375, -0.724609375, -0.6533203125, -0.58203125, -0.5107421875, -0.439453125, -0.3681640625, -0.296875, -0.2255859375, -0.154296875, -0.0830078125, -0.01171875, 0.0595703125, 0.130859375, 0.2021484375, 0.2734375, 0.3447265625, 0.416015625, 0.4873046875, 0.55859375, 0.6298828125, 0.701171875, 0.7724609375, 0.84375, 0.9150390625, 0.986328125, 1.0576171875, 1.12890625, 1.2001953125, 1.271484375, 1.3427734375, 1.4140625, 1.4853515625, 1.556640625, 1.6279296875, 1.69921875, 1.7705078125, 1.841796875, 1.9130859375, 1.984375, 2.0556640625, 2.126953125, 2.1982421875, 2.26953125, 2.3408203125, 2.412109375, 2.4833984375, 2.5546875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 7.0, 8.0, 8.0, 14.0, 20.0, 33.0, 47.0, 59.0, 87.0, 185.0, 274.0, 457.0, 753.0, 1297.0, 2331.0, 4405.0, 8926.0, 19726.0, 46910.0, 127424.0, 450064.0, 2205336.0, 985506.0, 213189.0, 72391.0, 28573.0, 12839.0, 5978.0, 3180.0, 1721.0, 964.0, 545.0, 369.0, 247.0, 147.0, 88.0, 60.0, 47.0, 23.0, 16.0, 12.0, 6.0, 3.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.837890625, -3.7169189453125, -3.595947265625, -3.4749755859375, -3.35400390625, -3.2330322265625, -3.112060546875, -2.9910888671875, -2.8701171875, -2.7491455078125, -2.628173828125, -2.5072021484375, -2.38623046875, -2.2652587890625, -2.144287109375, -2.0233154296875, -1.90234375, -1.7813720703125, -1.660400390625, -1.5394287109375, -1.41845703125, -1.2974853515625, -1.176513671875, -1.0555419921875, -0.9345703125, -0.8135986328125, -0.692626953125, -0.5716552734375, -0.45068359375, -0.3297119140625, -0.208740234375, -0.0877685546875, 0.033203125, 0.1541748046875, 0.275146484375, 0.3961181640625, 0.51708984375, 0.6380615234375, 0.759033203125, 0.8800048828125, 1.0009765625, 1.1219482421875, 1.242919921875, 1.3638916015625, 1.48486328125, 1.6058349609375, 1.726806640625, 1.8477783203125, 1.96875, 2.0897216796875, 2.210693359375, 2.3316650390625, 2.45263671875, 2.5736083984375, 2.694580078125, 2.8155517578125, 2.9365234375, 3.0574951171875, 3.178466796875, 3.2994384765625, 3.42041015625, 3.5413818359375, 3.662353515625, 3.7833251953125, 3.904296875]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 8.0, 5.0, 5.0, 6.0, 13.0, 14.0, 10.0, 19.0, 25.0, 27.0, 34.0, 49.0, 49.0, 62.0, 46.0, 68.0, 53.0, 67.0, 68.0, 62.0, 60.0, 52.0, 46.0, 26.0, 31.0, 24.0, 13.0, 11.0, 9.0, 12.0, 5.0, 5.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.852054595947266, -8.496530532836914, -8.141006469726562, -7.785481929779053, -7.429957389831543, -7.074433326721191, -6.71890926361084, -6.363385200500488, -6.0078606605529785, -5.652336597442627, -5.296812057495117, -4.941287994384766, -4.585763931274414, -4.230239391326904, -3.8747153282165527, -3.519191026687622, -3.1636667251586914, -2.8081424236297607, -2.45261812210083, -2.0970940589904785, -1.7415697574615479, -1.3860454559326172, -1.0305213928222656, -0.674997091293335, -0.3194727897644043, 0.03605145215988159, 0.3915756940841675, 0.7470998764038086, 1.1026241779327393, 1.45814847946167, 1.8136725425720215, 2.169196844100952, 2.524721145629883, 2.8802454471588135, 3.235769748687744, 3.5912938117980957, 3.9468181133270264, 4.302342414855957, 4.657866477966309, 5.01339054107666, 5.36891508102417, 5.7244391441345215, 6.079963684082031, 6.435487747192383, 6.791011810302734, 7.146536350250244, 7.502060413360596, 7.8575849533081055, 8.213109016418457, 8.568633079528809, 8.92415714263916, 9.279682159423828, 9.63520622253418, 9.990730285644531, 10.346254348754883, 10.701778411865234, 11.057302474975586, 11.412826538085938, 11.768350601196289, 12.12387466430664, 12.479399681091309, 12.83492374420166, 13.190447807312012, 13.545971870422363, 13.901496887207031]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 1.0, 1.0, 6.0, 5.0, 7.0, 9.0, 10.0, 23.0, 17.0, 20.0, 18.0, 29.0, 32.0, 33.0, 30.0, 36.0, 40.0, 37.0, 33.0, 42.0, 52.0, 40.0, 48.0, 52.0, 41.0, 43.0, 39.0, 29.0, 32.0, 32.0, 27.0, 27.0, 21.0, 18.0, 9.0, 17.0, 12.0, 11.0, 7.0, 3.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-12.108345985412598, -11.79099178314209, -11.473636627197266, -11.156282424926758, -10.83892822265625, -10.521574020385742, -10.204219818115234, -9.88686466217041, -9.569510459899902, -9.252156257629395, -8.93480110168457, -8.617446899414062, -8.300092697143555, -7.982738494873047, -7.665383815765381, -7.348029136657715, -7.030674934387207, -6.713320732116699, -6.395966053009033, -6.078611373901367, -5.761257171630859, -5.443902969360352, -5.1265482902526855, -4.8091936111450195, -4.491839408874512, -4.174485206604004, -3.857130527496338, -3.539776086807251, -3.222421646118164, -2.905067205429077, -2.5877127647399902, -2.2703583240509033, -1.9530048370361328, -1.635650396347046, -1.318295955657959, -1.000941514968872, -0.6835870742797852, -0.36623263359069824, -0.04887819290161133, 0.2684762477874756, 0.5858306884765625, 0.9031851291656494, 1.2205395698547363, 1.5378940105438232, 1.8552484512329102, 2.172602891921997, 2.489957332611084, 2.807311773300171, 3.124666213989258, 3.4420206546783447, 3.7593750953674316, 4.076729774475098, 4.3940839767456055, 4.711438179016113, 5.028792858123779, 5.346147537231445, 5.663501739501953, 5.980855941772461, 6.298210620880127, 6.615565299987793, 6.932919502258301, 7.250273704528809, 7.567628383636475, 7.884983062744141, 8.202337265014648]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 5.0, 3.0, 7.0, 6.0, 9.0, 19.0, 17.0, 16.0, 21.0, 26.0, 21.0, 31.0, 36.0, 30.0, 37.0, 46.0, 48.0, 48.0, 37.0, 50.0, 49.0, 48.0, 52.0, 42.0, 36.0, 53.0, 33.0, 34.0, 20.0, 17.0, 26.0, 19.0, 20.0, 7.0, 8.0, 7.0, 8.0, 5.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1259765625, -1.087982177734375, -1.04998779296875, -1.011993408203125, -0.9739990234375, -0.936004638671875, -0.89801025390625, -0.860015869140625, -0.822021484375, -0.784027099609375, -0.74603271484375, -0.708038330078125, -0.6700439453125, -0.632049560546875, -0.59405517578125, -0.556060791015625, -0.51806640625, -0.480072021484375, -0.44207763671875, -0.404083251953125, -0.3660888671875, -0.328094482421875, -0.29010009765625, -0.252105712890625, -0.214111328125, -0.176116943359375, -0.13812255859375, -0.100128173828125, -0.0621337890625, -0.024139404296875, 0.01385498046875, 0.051849365234375, 0.08984375, 0.127838134765625, 0.16583251953125, 0.203826904296875, 0.2418212890625, 0.279815673828125, 0.31781005859375, 0.355804443359375, 0.393798828125, 0.431793212890625, 0.46978759765625, 0.507781982421875, 0.5457763671875, 0.583770751953125, 0.62176513671875, 0.659759521484375, 0.69775390625, 0.735748291015625, 0.77374267578125, 0.811737060546875, 0.8497314453125, 0.887725830078125, 0.92572021484375, 0.963714599609375, 1.001708984375, 1.039703369140625, 1.07769775390625, 1.115692138671875, 1.1536865234375, 1.191680908203125, 1.22967529296875, 1.267669677734375, 1.3056640625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 12.0, 9.0, 18.0, 17.0, 36.0, 63.0, 67.0, 137.0, 204.0, 308.0, 487.0, 786.0, 1178.0, 1928.0, 3084.0, 5069.0, 8152.0, 13521.0, 21956.0, 35783.0, 57553.0, 89966.0, 255687.0, 303878.0, 93623.0, 58910.0, 36931.0, 22847.0, 13974.0, 8674.0, 5204.0, 3184.0, 1900.0, 1240.0, 736.0, 505.0, 288.0, 238.0, 151.0, 81.0, 54.0, 41.0, 15.0, 20.0, 11.0, 16.0, 7.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.603515625, -3.49102783203125, -3.3785400390625, -3.26605224609375, -3.153564453125, -3.04107666015625, -2.9285888671875, -2.81610107421875, -2.70361328125, -2.59112548828125, -2.4786376953125, -2.36614990234375, -2.253662109375, -2.14117431640625, -2.0286865234375, -1.91619873046875, -1.8037109375, -1.69122314453125, -1.5787353515625, -1.46624755859375, -1.353759765625, -1.24127197265625, -1.1287841796875, -1.01629638671875, -0.90380859375, -0.79132080078125, -0.6788330078125, -0.56634521484375, -0.453857421875, -0.34136962890625, -0.2288818359375, -0.11639404296875, -0.00390625, 0.10858154296875, 0.2210693359375, 0.33355712890625, 0.446044921875, 0.55853271484375, 0.6710205078125, 0.78350830078125, 0.89599609375, 1.00848388671875, 1.1209716796875, 1.23345947265625, 1.345947265625, 1.45843505859375, 1.5709228515625, 1.68341064453125, 1.7958984375, 1.90838623046875, 2.0208740234375, 2.13336181640625, 2.245849609375, 2.35833740234375, 2.4708251953125, 2.58331298828125, 2.69580078125, 2.80828857421875, 2.9207763671875, 3.03326416015625, 3.145751953125, 3.25823974609375, 3.3707275390625, 3.48321533203125, 3.595703125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 8.0, 9.0, 13.0, 3.0, 11.0, 11.0, 12.0, 15.0, 17.0, 20.0, 31.0, 34.0, 31.0, 24.0, 52.0, 32.0, 35.0, 32.0, 49.0, 40.0, 1070.0, 36.0, 47.0, 41.0, 44.0, 42.0, 33.0, 32.0, 29.0, 25.0, 23.0, 15.0, 20.0, 14.0, 11.0, 14.0, 14.0, 11.0, 4.0, 2.0, 3.0, 3.0, 6.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.79541015625, -0.770477294921875, -0.74554443359375, -0.720611572265625, -0.6956787109375, -0.670745849609375, -0.64581298828125, -0.620880126953125, -0.595947265625, -0.571014404296875, -0.54608154296875, -0.521148681640625, -0.4962158203125, -0.471282958984375, -0.44635009765625, -0.421417236328125, -0.396484375, -0.371551513671875, -0.34661865234375, -0.321685791015625, -0.2967529296875, -0.271820068359375, -0.24688720703125, -0.221954345703125, -0.197021484375, -0.172088623046875, -0.14715576171875, -0.122222900390625, -0.0972900390625, -0.072357177734375, -0.04742431640625, -0.022491455078125, 0.00244140625, 0.027374267578125, 0.05230712890625, 0.077239990234375, 0.1021728515625, 0.127105712890625, 0.15203857421875, 0.176971435546875, 0.201904296875, 0.226837158203125, 0.25177001953125, 0.276702880859375, 0.3016357421875, 0.326568603515625, 0.35150146484375, 0.376434326171875, 0.4013671875, 0.426300048828125, 0.45123291015625, 0.476165771484375, 0.5010986328125, 0.526031494140625, 0.55096435546875, 0.575897216796875, 0.600830078125, 0.625762939453125, 0.65069580078125, 0.675628662109375, 0.7005615234375, 0.725494384765625, 0.75042724609375, 0.775360107421875, 0.80029296875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 11.0, 9.0, 13.0, 33.0, 31.0, 57.0, 85.0, 120.0, 192.0, 302.0, 505.0, 738.0, 1131.0, 1876.0, 2832.0, 4844.0, 8292.0, 15068.0, 27644.0, 56343.0, 141374.0, 1106772.0, 513048.0, 112435.0, 47431.0, 23962.0, 12944.0, 7393.0, 4413.0, 2694.0, 1612.0, 1075.0, 670.0, 422.0, 288.0, 172.0, 118.0, 64.0, 47.0, 27.0, 20.0, 8.0, 10.0, 1.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.482421875, -2.406951904296875, -2.33148193359375, -2.256011962890625, -2.1805419921875, -2.105072021484375, -2.02960205078125, -1.954132080078125, -1.878662109375, -1.803192138671875, -1.72772216796875, -1.652252197265625, -1.5767822265625, -1.501312255859375, -1.42584228515625, -1.350372314453125, -1.27490234375, -1.199432373046875, -1.12396240234375, -1.048492431640625, -0.9730224609375, -0.897552490234375, -0.82208251953125, -0.746612548828125, -0.671142578125, -0.595672607421875, -0.52020263671875, -0.444732666015625, -0.3692626953125, -0.293792724609375, -0.21832275390625, -0.142852783203125, -0.0673828125, 0.008087158203125, 0.08355712890625, 0.159027099609375, 0.2344970703125, 0.309967041015625, 0.38543701171875, 0.460906982421875, 0.536376953125, 0.611846923828125, 0.68731689453125, 0.762786865234375, 0.8382568359375, 0.913726806640625, 0.98919677734375, 1.064666748046875, 1.14013671875, 1.215606689453125, 1.29107666015625, 1.366546630859375, 1.4420166015625, 1.517486572265625, 1.59295654296875, 1.668426513671875, 1.743896484375, 1.819366455078125, 1.89483642578125, 1.970306396484375, 2.0457763671875, 2.121246337890625, 2.19671630859375, 2.272186279296875, 2.34765625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 0.0, 3.0, 1.0, 2.0, 6.0, 7.0, 10.0, 10.0, 10.0, 11.0, 11.0, 24.0, 26.0, 31.0, 61.0, 57.0, 120.0, 212.0, 105.0, 67.0, 46.0, 36.0, 33.0, 23.0, 19.0, 15.0, 12.0, 14.0, 5.0, 6.0, 3.0, 3.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.71142578125, -0.690185546875, -0.6689453125, -0.647705078125, -0.62646484375, -0.605224609375, -0.583984375, -0.562744140625, -0.54150390625, -0.520263671875, -0.4990234375, -0.477783203125, -0.45654296875, -0.435302734375, -0.4140625, -0.392822265625, -0.37158203125, -0.350341796875, -0.3291015625, -0.307861328125, -0.28662109375, -0.265380859375, -0.244140625, -0.222900390625, -0.20166015625, -0.180419921875, -0.1591796875, -0.137939453125, -0.11669921875, -0.095458984375, -0.07421875, -0.052978515625, -0.03173828125, -0.010498046875, 0.0107421875, 0.031982421875, 0.05322265625, 0.074462890625, 0.095703125, 0.116943359375, 0.13818359375, 0.159423828125, 0.1806640625, 0.201904296875, 0.22314453125, 0.244384765625, 0.265625, 0.286865234375, 0.30810546875, 0.329345703125, 0.3505859375, 0.371826171875, 0.39306640625, 0.414306640625, 0.435546875, 0.456787109375, 0.47802734375, 0.499267578125, 0.5205078125, 0.541748046875, 0.56298828125, 0.584228515625, 0.60546875, 0.626708984375, 0.64794921875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 8.0, 12.0, 12.0, 22.0, 47.0, 85.0, 150.0, 407.0, 3705.0, 746111.0, 294428.0, 2844.0, 393.0, 157.0, 79.0, 41.0, 22.0, 11.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.3046875, -12.8748779296875, -12.445068359375, -12.0152587890625, -11.58544921875, -11.1556396484375, -10.725830078125, -10.2960205078125, -9.8662109375, -9.4364013671875, -9.006591796875, -8.5767822265625, -8.14697265625, -7.7171630859375, -7.287353515625, -6.8575439453125, -6.427734375, -5.9979248046875, -5.568115234375, -5.1383056640625, -4.70849609375, -4.2786865234375, -3.848876953125, -3.4190673828125, -2.9892578125, -2.5594482421875, -2.129638671875, -1.6998291015625, -1.27001953125, -0.8402099609375, -0.410400390625, 0.0194091796875, 0.44921875, 0.8790283203125, 1.308837890625, 1.7386474609375, 2.16845703125, 2.5982666015625, 3.028076171875, 3.4578857421875, 3.8876953125, 4.3175048828125, 4.747314453125, 5.1771240234375, 5.60693359375, 6.0367431640625, 6.466552734375, 6.8963623046875, 7.326171875, 7.7559814453125, 8.185791015625, 8.6156005859375, 9.04541015625, 9.4752197265625, 9.905029296875, 10.3348388671875, 10.7646484375, 11.1944580078125, 11.624267578125, 12.0540771484375, 12.48388671875, 12.9136962890625, 13.343505859375, 13.7733154296875, 14.203125]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 34.0, 75.0, 247.0, 324.0, 195.0, 82.0, 29.0, 8.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.350859642028809, -4.252967834472656, -4.155076503753662, -4.05718469619751, -3.9592933654785156, -3.8614017963409424, -3.763510227203369, -3.665618658065796, -3.5677270889282227, -3.4698355197906494, -3.371943950653076, -3.274052381515503, -3.1761608123779297, -3.0782692432403564, -2.980377674102783, -2.88248610496521, -2.7845945358276367, -2.6867029666900635, -2.5888113975524902, -2.490919828414917, -2.3930282592773438, -2.2951366901397705, -2.1972451210021973, -2.099353551864624, -2.0014617443084717, -1.9035701751708984, -1.8056786060333252, -1.707787036895752, -1.6098954677581787, -1.5120038986206055, -1.4141123294830322, -1.316220760345459, -1.2183293104171753, -1.120437741279602, -1.0225461721420288, -0.9246546030044556, -0.8267630338668823, -0.7288714647293091, -0.6309798359870911, -0.5330882668495178, -0.4351966977119446, -0.33730512857437134, -0.2394135445356369, -0.14152196049690247, -0.043630391359329224, 0.05426117777824402, 0.15215277671813965, 0.2500443458557129, 0.34793591499328613, 0.4458274841308594, 0.5437190532684326, 0.6416106224060059, 0.7395021915435791, 0.8373937606811523, 0.9352853894233704, 1.0331768989562988, 1.131068468093872, 1.2289600372314453, 1.3268516063690186, 1.4247431755065918, 1.522634744644165, 1.6205263137817383, 1.7184178829193115, 1.8163094520568848, 1.9142011404037476]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 6.0, 10.0, 10.0, 8.0, 14.0, 11.0, 9.0, 24.0, 13.0, 16.0, 14.0, 21.0, 35.0, 37.0, 30.0, 34.0, 29.0, 33.0, 36.0, 39.0, 34.0, 37.0, 37.0, 36.0, 52.0, 34.0, 42.0, 25.0, 34.0, 37.0, 33.0, 29.0, 26.0, 22.0, 14.0, 9.0, 10.0, 17.0, 14.0, 5.0, 5.0, 6.0, 5.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.6042309403419495, -0.5868264436721802, -0.5694219470024109, -0.5520173907279968, -0.5346128940582275, -0.5172083973884583, -0.49980390071868896, -0.4823994040489197, -0.464994877576828, -0.4475903809070587, -0.43018585443496704, -0.41278135776519775, -0.39537686109542847, -0.3779723346233368, -0.3605678379535675, -0.34316331148147583, -0.32575881481170654, -0.30835431814193726, -0.2909497916698456, -0.2735452950000763, -0.2561407685279846, -0.23873627185821533, -0.22133177518844604, -0.20392726361751556, -0.18652275204658508, -0.1691182404756546, -0.15171372890472412, -0.13430923223495483, -0.11690472066402435, -0.09950020909309387, -0.08209570497274399, -0.0646912008523941, -0.0472867488861084, -0.029882241040468216, -0.012477733194828033, 0.004926774650812149, 0.02233128249645233, 0.03973579406738281, 0.0571402981877327, 0.07454480230808258, 0.09194931387901306, 0.10935382544994354, 0.12675833702087402, 0.1441628336906433, 0.1615673452615738, 0.17897185683250427, 0.19637635350227356, 0.21378086507320404, 0.23118537664413452, 0.248589888215065, 0.2659943997859955, 0.28339889645576477, 0.30080342292785645, 0.31820791959762573, 0.335612416267395, 0.3530169129371643, 0.370421439409256, 0.38782593607902527, 0.40523046255111694, 0.42263495922088623, 0.4400394558906555, 0.4574439823627472, 0.4748484790325165, 0.49225300550460815, 0.5096575021743774]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 8.0, 9.0, 6.0, 23.0, 15.0, 17.0, 20.0, 27.0, 24.0, 36.0, 30.0, 34.0, 40.0, 43.0, 48.0, 40.0, 43.0, 49.0, 49.0, 48.0, 51.0, 35.0, 41.0, 53.0, 26.0, 36.0, 18.0, 22.0, 24.0, 17.0, 18.0, 9.0, 7.0, 9.0, 2.0, 8.0, 7.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.103515625, -1.0660400390625, -1.028564453125, -0.9910888671875, -0.95361328125, -0.9161376953125, -0.878662109375, -0.8411865234375, -0.8037109375, -0.7662353515625, -0.728759765625, -0.6912841796875, -0.65380859375, -0.6163330078125, -0.578857421875, -0.5413818359375, -0.50390625, -0.4664306640625, -0.428955078125, -0.3914794921875, -0.35400390625, -0.3165283203125, -0.279052734375, -0.2415771484375, -0.2041015625, -0.1666259765625, -0.129150390625, -0.0916748046875, -0.05419921875, -0.0167236328125, 0.020751953125, 0.0582275390625, 0.095703125, 0.1331787109375, 0.170654296875, 0.2081298828125, 0.24560546875, 0.2830810546875, 0.320556640625, 0.3580322265625, 0.3955078125, 0.4329833984375, 0.470458984375, 0.5079345703125, 0.54541015625, 0.5828857421875, 0.620361328125, 0.6578369140625, 0.6953125, 0.7327880859375, 0.770263671875, 0.8077392578125, 0.84521484375, 0.8826904296875, 0.920166015625, 0.9576416015625, 0.9951171875, 1.0325927734375, 1.070068359375, 1.1075439453125, 1.14501953125, 1.1824951171875, 1.219970703125, 1.2574462890625, 1.294921875]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 5.0, 10.0, 14.0, 22.0, 28.0, 34.0, 75.0, 105.0, 177.0, 314.0, 521.0, 864.0, 1519.0, 2672.0, 4880.0, 9166.0, 18218.0, 43686.0, 165574.0, 579804.0, 143715.0, 40354.0, 17142.0, 8663.0, 4803.0, 2689.0, 1472.0, 871.0, 473.0, 275.0, 157.0, 94.0, 51.0, 29.0, 25.0, 13.0, 8.0, 4.0, 3.0, 9.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.333984375, -2.259796142578125, -2.18560791015625, -2.111419677734375, -2.0372314453125, -1.963043212890625, -1.88885498046875, -1.814666748046875, -1.740478515625, -1.666290283203125, -1.59210205078125, -1.517913818359375, -1.4437255859375, -1.369537353515625, -1.29534912109375, -1.221160888671875, -1.14697265625, -1.072784423828125, -0.99859619140625, -0.924407958984375, -0.8502197265625, -0.776031494140625, -0.70184326171875, -0.627655029296875, -0.553466796875, -0.479278564453125, -0.40509033203125, -0.330902099609375, -0.2567138671875, -0.182525634765625, -0.10833740234375, -0.034149169921875, 0.0400390625, 0.114227294921875, 0.18841552734375, 0.262603759765625, 0.3367919921875, 0.410980224609375, 0.48516845703125, 0.559356689453125, 0.633544921875, 0.707733154296875, 0.78192138671875, 0.856109619140625, 0.9302978515625, 1.004486083984375, 1.07867431640625, 1.152862548828125, 1.22705078125, 1.301239013671875, 1.37542724609375, 1.449615478515625, 1.5238037109375, 1.597991943359375, 1.67218017578125, 1.746368408203125, 1.820556640625, 1.894744873046875, 1.96893310546875, 2.043121337890625, 2.1173095703125, 2.191497802734375, 2.26568603515625, 2.339874267578125, 2.4140625]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 6.0, 4.0, 6.0, 16.0, 11.0, 14.0, 26.0, 16.0, 20.0, 27.0, 27.0, 34.0, 51.0, 40.0, 45.0, 51.0, 80.0, 107.0, 276.0, 1471.0, 196.0, 112.0, 82.0, 52.0, 43.0, 29.0, 35.0, 36.0, 25.0, 31.0, 25.0, 21.0, 16.0, 7.0, 4.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.89453125, -4.75994873046875, -4.6253662109375, -4.49078369140625, -4.356201171875, -4.22161865234375, -4.0870361328125, -3.95245361328125, -3.81787109375, -3.68328857421875, -3.5487060546875, -3.41412353515625, -3.279541015625, -3.14495849609375, -3.0103759765625, -2.87579345703125, -2.7412109375, -2.60662841796875, -2.4720458984375, -2.33746337890625, -2.202880859375, -2.06829833984375, -1.9337158203125, -1.79913330078125, -1.66455078125, -1.52996826171875, -1.3953857421875, -1.26080322265625, -1.126220703125, -0.99163818359375, -0.8570556640625, -0.72247314453125, -0.587890625, -0.45330810546875, -0.3187255859375, -0.18414306640625, -0.049560546875, 0.08502197265625, 0.2196044921875, 0.35418701171875, 0.48876953125, 0.62335205078125, 0.7579345703125, 0.89251708984375, 1.027099609375, 1.16168212890625, 1.2962646484375, 1.43084716796875, 1.5654296875, 1.70001220703125, 1.8345947265625, 1.96917724609375, 2.103759765625, 2.23834228515625, 2.3729248046875, 2.50750732421875, 2.64208984375, 2.77667236328125, 2.9112548828125, 3.04583740234375, 3.180419921875, 3.31500244140625, 3.4495849609375, 3.58416748046875, 3.71875]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 12.0, 9.0, 9.0, 19.0, 21.0, 30.0, 54.0, 86.0, 141.0, 291.0, 689.0, 1992.0, 7237.0, 45163.0, 1919951.0, 1122378.0, 37636.0, 6694.0, 1931.0, 682.0, 290.0, 147.0, 86.0, 36.0, 35.0, 26.0, 15.0, 12.0, 9.0, 4.0, 5.0, 1.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.375, -8.1129150390625, -7.850830078125, -7.5887451171875, -7.32666015625, -7.0645751953125, -6.802490234375, -6.5404052734375, -6.2783203125, -6.0162353515625, -5.754150390625, -5.4920654296875, -5.22998046875, -4.9678955078125, -4.705810546875, -4.4437255859375, -4.181640625, -3.9195556640625, -3.657470703125, -3.3953857421875, -3.13330078125, -2.8712158203125, -2.609130859375, -2.3470458984375, -2.0849609375, -1.8228759765625, -1.560791015625, -1.2987060546875, -1.03662109375, -0.7745361328125, -0.512451171875, -0.2503662109375, 0.01171875, 0.2738037109375, 0.535888671875, 0.7979736328125, 1.06005859375, 1.3221435546875, 1.584228515625, 1.8463134765625, 2.1083984375, 2.3704833984375, 2.632568359375, 2.8946533203125, 3.15673828125, 3.4188232421875, 3.680908203125, 3.9429931640625, 4.205078125, 4.4671630859375, 4.729248046875, 4.9913330078125, 5.25341796875, 5.5155029296875, 5.777587890625, 6.0396728515625, 6.3017578125, 6.5638427734375, 6.825927734375, 7.0880126953125, 7.35009765625, 7.6121826171875, 7.874267578125, 8.1363525390625, 8.3984375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 13.0, 62.0, 183.0, 354.0, 284.0, 91.0, 21.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.954977035522461, -7.9326066970825195, -6.910236358642578, -5.8878655433654785, -4.865495204925537, -3.8431248664855957, -2.820754051208496, -1.7983837127685547, -0.7760133743286133, 0.24635708332061768, 1.2687275409698486, 2.291098117828369, 3.3134684562683105, 4.335838794708252, 5.358209609985352, 6.380579948425293, 7.402950286865234, 8.425320625305176, 9.447690963745117, 10.470062255859375, 11.492431640625, 12.514802932739258, 13.5371732711792, 14.55954360961914, 15.581913948059082, 16.604284286499023, 17.62665557861328, 18.649024963378906, 19.671396255493164, 20.69376564025879, 21.716136932373047, 22.738506317138672, 23.760875701904297, 24.783246994018555, 25.80561637878418, 26.827987670898438, 27.850357055664062, 28.87272834777832, 29.895099639892578, 30.917469024658203, 31.939838409423828, 32.96220779418945, 33.984580993652344, 35.00695037841797, 36.029319763183594, 37.05168914794922, 38.07406234741211, 39.096431732177734, 40.118804931640625, 41.14117431640625, 42.16354751586914, 43.185916900634766, 44.20828628540039, 45.230655670166016, 46.253028869628906, 47.27539825439453, 48.297767639160156, 49.32013702392578, 50.34251022338867, 51.3648796081543, 52.38724899291992, 53.40961837768555, 54.43199157714844, 55.45436096191406, 56.47673034667969]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 6.0, 1.0, 9.0, 5.0, 9.0, 10.0, 9.0, 11.0, 10.0, 18.0, 25.0, 23.0, 33.0, 19.0, 28.0, 21.0, 28.0, 31.0, 30.0, 31.0, 35.0, 35.0, 33.0, 33.0, 28.0, 31.0, 38.0, 30.0, 36.0, 27.0, 25.0, 30.0, 31.0, 29.0, 25.0, 20.0, 16.0, 18.0, 15.0, 15.0, 17.0, 11.0, 9.0, 5.0, 8.0, 5.0, 10.0, 9.0, 4.0, 2.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 3.0], "bins": [-8.969758987426758, -8.674334526062012, -8.378910064697266, -8.08348560333252, -7.788061141967773, -7.492636680603027, -7.197211742401123, -6.901787281036377, -6.606362819671631, -6.310938358306885, -6.015513896942139, -5.720089435577393, -5.424664497375488, -5.129240036010742, -4.833815574645996, -4.53839111328125, -4.242966651916504, -3.947542190551758, -3.6521177291870117, -3.3566930294036865, -3.0612685680389404, -2.7658441066741943, -2.470419406890869, -2.174994945526123, -1.879570484161377, -1.5841460227966309, -1.2887214422225952, -0.9932969212532043, -0.6978724002838135, -0.4024479389190674, -0.10702335834503174, 0.1884012222290039, 0.4838266372680664, 0.7792511582374573, 1.0746756792068481, 1.3701002597808838, 1.6655247211456299, 1.960949182510376, 2.256373882293701, 2.5517983436584473, 2.8472228050231934, 3.1426472663879395, 3.4380717277526855, 3.7334964275360107, 4.028921127319336, 4.324345588684082, 4.619770050048828, 4.915194511413574, 5.21061897277832, 5.506043434143066, 5.8014678955078125, 6.096892356872559, 6.392316818237305, 6.687741279602051, 6.983166217803955, 7.278590679168701, 7.574015140533447, 7.869439601898193, 8.164864540100098, 8.460289001464844, 8.75571346282959, 9.051137924194336, 9.346562385559082, 9.641986846923828, 9.937411308288574]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 7.0, 10.0, 17.0, 15.0, 24.0, 20.0, 17.0, 22.0, 32.0, 33.0, 35.0, 30.0, 43.0, 46.0, 37.0, 49.0, 48.0, 42.0, 59.0, 49.0, 44.0, 43.0, 43.0, 30.0, 30.0, 22.0, 24.0, 30.0, 18.0, 10.0, 11.0, 8.0, 16.0, 6.0, 4.0, 7.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0615234375, -1.023529052734375, -0.98553466796875, -0.947540283203125, -0.9095458984375, -0.871551513671875, -0.83355712890625, -0.795562744140625, -0.757568359375, -0.719573974609375, -0.68157958984375, -0.643585205078125, -0.6055908203125, -0.567596435546875, -0.52960205078125, -0.491607666015625, -0.45361328125, -0.415618896484375, -0.37762451171875, -0.339630126953125, -0.3016357421875, -0.263641357421875, -0.22564697265625, -0.187652587890625, -0.149658203125, -0.111663818359375, -0.07366943359375, -0.035675048828125, 0.0023193359375, 0.040313720703125, 0.07830810546875, 0.116302490234375, 0.154296875, 0.192291259765625, 0.23028564453125, 0.268280029296875, 0.3062744140625, 0.344268798828125, 0.38226318359375, 0.420257568359375, 0.458251953125, 0.496246337890625, 0.53424072265625, 0.572235107421875, 0.6102294921875, 0.648223876953125, 0.68621826171875, 0.724212646484375, 0.76220703125, 0.800201416015625, 0.83819580078125, 0.876190185546875, 0.9141845703125, 0.952178955078125, 0.99017333984375, 1.028167724609375, 1.066162109375, 1.104156494140625, 1.14215087890625, 1.180145263671875, 1.2181396484375, 1.256134033203125, 1.29412841796875, 1.332122802734375, 1.3701171875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 1.0, 10.0, 17.0, 24.0, 31.0, 58.0, 83.0, 126.0, 184.0, 310.0, 509.0, 871.0, 1520.0, 2570.0, 4615.0, 8455.0, 17400.0, 37902.0, 96986.0, 399881.0, 2069743.0, 1227552.0, 205883.0, 63732.0, 27182.0, 12901.0, 6669.0, 3690.0, 2078.0, 1250.0, 764.0, 476.0, 269.0, 196.0, 109.0, 77.0, 46.0, 37.0, 25.0, 16.0, 15.0, 4.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1796875, -2.10400390625, -2.0283203125, -1.95263671875, -1.876953125, -1.80126953125, -1.7255859375, -1.64990234375, -1.57421875, -1.49853515625, -1.4228515625, -1.34716796875, -1.271484375, -1.19580078125, -1.1201171875, -1.04443359375, -0.96875, -0.89306640625, -0.8173828125, -0.74169921875, -0.666015625, -0.59033203125, -0.5146484375, -0.43896484375, -0.36328125, -0.28759765625, -0.2119140625, -0.13623046875, -0.060546875, 0.01513671875, 0.0908203125, 0.16650390625, 0.2421875, 0.31787109375, 0.3935546875, 0.46923828125, 0.544921875, 0.62060546875, 0.6962890625, 0.77197265625, 0.84765625, 0.92333984375, 0.9990234375, 1.07470703125, 1.150390625, 1.22607421875, 1.3017578125, 1.37744140625, 1.453125, 1.52880859375, 1.6044921875, 1.68017578125, 1.755859375, 1.83154296875, 1.9072265625, 1.98291015625, 2.05859375, 2.13427734375, 2.2099609375, 2.28564453125, 2.361328125, 2.43701171875, 2.5126953125, 2.58837890625, 2.6640625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 13.0, 16.0, 13.0, 29.0, 24.0, 39.0, 43.0, 78.0, 87.0, 109.0, 192.0, 227.0, 390.0, 454.0, 555.0, 482.0, 365.0, 274.0, 178.0, 154.0, 89.0, 77.0, 45.0, 18.0, 29.0, 21.0, 19.0, 12.0, 23.0, 7.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.685546875, -2.594970703125, -2.50439453125, -2.413818359375, -2.3232421875, -2.232666015625, -2.14208984375, -2.051513671875, -1.9609375, -1.870361328125, -1.77978515625, -1.689208984375, -1.5986328125, -1.508056640625, -1.41748046875, -1.326904296875, -1.236328125, -1.145751953125, -1.05517578125, -0.964599609375, -0.8740234375, -0.783447265625, -0.69287109375, -0.602294921875, -0.51171875, -0.421142578125, -0.33056640625, -0.239990234375, -0.1494140625, -0.058837890625, 0.03173828125, 0.122314453125, 0.212890625, 0.303466796875, 0.39404296875, 0.484619140625, 0.5751953125, 0.665771484375, 0.75634765625, 0.846923828125, 0.9375, 1.028076171875, 1.11865234375, 1.209228515625, 1.2998046875, 1.390380859375, 1.48095703125, 1.571533203125, 1.662109375, 1.752685546875, 1.84326171875, 1.933837890625, 2.0244140625, 2.114990234375, 2.20556640625, 2.296142578125, 2.38671875, 2.477294921875, 2.56787109375, 2.658447265625, 2.7490234375, 2.839599609375, 2.93017578125, 3.020751953125, 3.111328125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 10.0, 14.0, 11.0, 30.0, 40.0, 82.0, 103.0, 205.0, 367.0, 687.0, 1501.0, 3742.0, 10025.0, 30366.0, 109213.0, 602412.0, 2766140.0, 525368.0, 99833.0, 28080.0, 9357.0, 3621.0, 1495.0, 703.0, 344.0, 187.0, 127.0, 97.0, 46.0, 27.0, 19.0, 13.0, 9.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.78125, -5.626953125, -5.47265625, -5.318359375, -5.1640625, -5.009765625, -4.85546875, -4.701171875, -4.546875, -4.392578125, -4.23828125, -4.083984375, -3.9296875, -3.775390625, -3.62109375, -3.466796875, -3.3125, -3.158203125, -3.00390625, -2.849609375, -2.6953125, -2.541015625, -2.38671875, -2.232421875, -2.078125, -1.923828125, -1.76953125, -1.615234375, -1.4609375, -1.306640625, -1.15234375, -0.998046875, -0.84375, -0.689453125, -0.53515625, -0.380859375, -0.2265625, -0.072265625, 0.08203125, 0.236328125, 0.390625, 0.544921875, 0.69921875, 0.853515625, 1.0078125, 1.162109375, 1.31640625, 1.470703125, 1.625, 1.779296875, 1.93359375, 2.087890625, 2.2421875, 2.396484375, 2.55078125, 2.705078125, 2.859375, 3.013671875, 3.16796875, 3.322265625, 3.4765625, 3.630859375, 3.78515625, 3.939453125, 4.09375]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 10.0, 6.0, 14.0, 22.0, 44.0, 54.0, 74.0, 85.0, 120.0, 125.0, 99.0, 99.0, 77.0, 60.0, 39.0, 27.0, 18.0, 12.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-17.6402530670166, -17.06482696533203, -16.489398956298828, -15.913972854614258, -15.338546752929688, -14.7631196975708, -14.187692642211914, -13.612266540527344, -13.036840438842773, -12.461413383483887, -11.885987281799316, -11.31056022644043, -10.73513412475586, -10.159707069396973, -9.584280014038086, -9.008853912353516, -8.433426856994629, -7.8580002784729, -7.282573699951172, -6.707146644592285, -6.131720542907715, -5.556293487548828, -4.9808669090271, -4.405440330505371, -3.8300137519836426, -3.254587173461914, -2.6791605949401855, -2.103733777999878, -1.5283071994781494, -0.9528806209564209, -0.3774538040161133, 0.19797277450561523, 0.7733993530273438, 1.3488259315490723, 1.9242526292800903, 2.4996793270111084, 3.075105905532837, 3.6505324840545654, 4.225959300994873, 4.801385879516602, 5.37681245803833, 5.952239036560059, 6.527665615081787, 7.103092193603516, 7.678519248962402, 8.253945350646973, 8.82937240600586, 9.40479850769043, 9.980225563049316, 10.555652618408203, 11.131078720092773, 11.70650577545166, 12.28193187713623, 12.857358932495117, 13.432785034179688, 14.008212089538574, 14.583639144897461, 15.159066200256348, 15.734492301940918, 16.309919357299805, 16.885345458984375, 17.460771560668945, 18.03619956970215, 18.61162567138672, 19.18705177307129]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 5.0, 10.0, 9.0, 5.0, 12.0, 12.0, 12.0, 21.0, 15.0, 20.0, 21.0, 28.0, 25.0, 29.0, 40.0, 41.0, 34.0, 36.0, 45.0, 39.0, 27.0, 39.0, 43.0, 44.0, 32.0, 39.0, 37.0, 37.0, 41.0, 22.0, 19.0, 22.0, 30.0, 19.0, 14.0, 22.0, 12.0, 8.0, 7.0, 8.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-9.64356517791748, -9.366368293762207, -9.089171409606934, -8.811975479125977, -8.534778594970703, -8.25758171081543, -7.980384826660156, -7.703187942504883, -7.425991535186768, -7.148794651031494, -6.871598243713379, -6.5944013595581055, -6.317204475402832, -6.040008068084717, -5.762811183929443, -5.485614776611328, -5.208417892456055, -4.931221008300781, -4.654024600982666, -4.376827716827393, -4.099631309509277, -3.822434425354004, -3.5452375411987305, -3.268040895462036, -2.990844249725342, -2.7136476039886475, -2.436450958251953, -2.1592540740966797, -1.8820574283599854, -1.604860782623291, -1.3276640176773071, -1.0504672527313232, -0.7732715606689453, -0.4960748553276062, -0.2188781499862671, 0.05831855535507202, 0.33551526069641113, 0.6127119064331055, 0.8899086713790894, 1.1671054363250732, 1.4443020820617676, 1.721498727798462, 1.9986954927444458, 2.2758922576904297, 2.553088903427124, 2.8302855491638184, 3.107482433319092, 3.384679079055786, 3.6618757247924805, 3.939072370529175, 4.216269016265869, 4.493465900421143, 4.770662307739258, 5.047859191894531, 5.325056076049805, 5.602252960205078, 5.879449367523193, 6.156646251678467, 6.433842658996582, 6.7110395431518555, 6.988236427307129, 7.265432834625244, 7.542629718780518, 7.819826126098633, 8.097023010253906]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 8.0, 6.0, 15.0, 12.0, 24.0, 19.0, 19.0, 22.0, 19.0, 26.0, 35.0, 37.0, 36.0, 31.0, 47.0, 43.0, 39.0, 33.0, 56.0, 46.0, 35.0, 38.0, 45.0, 38.0, 30.0, 30.0, 27.0, 23.0, 28.0, 16.0, 12.0, 16.0, 14.0, 12.0, 13.0, 5.0, 11.0, 10.0, 8.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1025390625, -1.067138671875, -1.03173828125, -0.996337890625, -0.9609375, -0.925537109375, -0.89013671875, -0.854736328125, -0.8193359375, -0.783935546875, -0.74853515625, -0.713134765625, -0.677734375, -0.642333984375, -0.60693359375, -0.571533203125, -0.5361328125, -0.500732421875, -0.46533203125, -0.429931640625, -0.39453125, -0.359130859375, -0.32373046875, -0.288330078125, -0.2529296875, -0.217529296875, -0.18212890625, -0.146728515625, -0.111328125, -0.075927734375, -0.04052734375, -0.005126953125, 0.0302734375, 0.065673828125, 0.10107421875, 0.136474609375, 0.171875, 0.207275390625, 0.24267578125, 0.278076171875, 0.3134765625, 0.348876953125, 0.38427734375, 0.419677734375, 0.455078125, 0.490478515625, 0.52587890625, 0.561279296875, 0.5966796875, 0.632080078125, 0.66748046875, 0.702880859375, 0.73828125, 0.773681640625, 0.80908203125, 0.844482421875, 0.8798828125, 0.915283203125, 0.95068359375, 0.986083984375, 1.021484375, 1.056884765625, 1.09228515625, 1.127685546875, 1.1630859375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 9.0, 6.0, 4.0, 11.0, 26.0, 30.0, 35.0, 62.0, 88.0, 157.0, 197.0, 297.0, 457.0, 699.0, 1140.0, 1702.0, 2797.0, 4415.0, 7259.0, 12172.0, 21042.0, 36927.0, 67727.0, 124730.0, 243478.0, 241648.0, 124468.0, 67312.0, 37149.0, 21070.0, 12149.0, 7244.0, 4554.0, 2665.0, 1713.0, 1071.0, 718.0, 432.0, 280.0, 188.0, 132.0, 108.0, 69.0, 27.0, 34.0, 14.0, 16.0, 18.0, 6.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-3.876953125, -3.75946044921875, -3.6419677734375, -3.52447509765625, -3.406982421875, -3.28948974609375, -3.1719970703125, -3.05450439453125, -2.93701171875, -2.81951904296875, -2.7020263671875, -2.58453369140625, -2.467041015625, -2.34954833984375, -2.2320556640625, -2.11456298828125, -1.9970703125, -1.87957763671875, -1.7620849609375, -1.64459228515625, -1.527099609375, -1.40960693359375, -1.2921142578125, -1.17462158203125, -1.05712890625, -0.93963623046875, -0.8221435546875, -0.70465087890625, -0.587158203125, -0.46966552734375, -0.3521728515625, -0.23468017578125, -0.1171875, 0.00030517578125, 0.1177978515625, 0.23529052734375, 0.352783203125, 0.47027587890625, 0.5877685546875, 0.70526123046875, 0.82275390625, 0.94024658203125, 1.0577392578125, 1.17523193359375, 1.292724609375, 1.41021728515625, 1.5277099609375, 1.64520263671875, 1.7626953125, 1.88018798828125, 1.9976806640625, 2.11517333984375, 2.232666015625, 2.35015869140625, 2.4676513671875, 2.58514404296875, 2.70263671875, 2.82012939453125, 2.9376220703125, 3.05511474609375, 3.172607421875, 3.29010009765625, 3.4075927734375, 3.52508544921875, 3.642578125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 4.0, 8.0, 9.0, 6.0, 11.0, 10.0, 17.0, 19.0, 19.0, 19.0, 15.0, 31.0, 20.0, 24.0, 27.0, 37.0, 48.0, 32.0, 43.0, 39.0, 43.0, 1065.0, 38.0, 38.0, 30.0, 26.0, 29.0, 29.0, 38.0, 22.0, 32.0, 35.0, 20.0, 27.0, 18.0, 22.0, 17.0, 14.0, 6.0, 4.0, 7.0, 11.0, 2.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.84423828125, -0.8199081420898438, -0.7955780029296875, -0.7712478637695312, -0.746917724609375, -0.7225875854492188, -0.6982574462890625, -0.6739273071289062, -0.64959716796875, -0.6252670288085938, -0.6009368896484375, -0.5766067504882812, -0.552276611328125, -0.5279464721679688, -0.5036163330078125, -0.47928619384765625, -0.4549560546875, -0.43062591552734375, -0.4062957763671875, -0.38196563720703125, -0.357635498046875, -0.33330535888671875, -0.3089752197265625, -0.28464508056640625, -0.26031494140625, -0.23598480224609375, -0.2116546630859375, -0.18732452392578125, -0.162994384765625, -0.13866424560546875, -0.1143341064453125, -0.09000396728515625, -0.065673828125, -0.04134368896484375, -0.0170135498046875, 0.00731658935546875, 0.031646728515625, 0.05597686767578125, 0.0803070068359375, 0.10463714599609375, 0.12896728515625, 0.15329742431640625, 0.1776275634765625, 0.20195770263671875, 0.226287841796875, 0.25061798095703125, 0.2749481201171875, 0.29927825927734375, 0.3236083984375, 0.34793853759765625, 0.3722686767578125, 0.39659881591796875, 0.420928955078125, 0.44525909423828125, 0.4695892333984375, 0.49391937255859375, 0.51824951171875, 0.5425796508789062, 0.5669097900390625, 0.5912399291992188, 0.615570068359375, 0.6399002075195312, 0.6642303466796875, 0.6885604858398438, 0.712890625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 9.0, 8.0, 12.0, 22.0, 34.0, 47.0, 82.0, 135.0, 217.0, 339.0, 536.0, 921.0, 1531.0, 2632.0, 4551.0, 7979.0, 15158.0, 30446.0, 68895.0, 200026.0, 1137368.0, 426594.0, 109137.0, 44196.0, 21022.0, 10810.0, 6084.0, 3419.0, 2021.0, 1133.0, 648.0, 428.0, 248.0, 154.0, 103.0, 75.0, 47.0, 22.0, 23.0, 10.0, 9.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.25390625, -2.16961669921875, -2.0853271484375, -2.00103759765625, -1.916748046875, -1.83245849609375, -1.7481689453125, -1.66387939453125, -1.57958984375, -1.49530029296875, -1.4110107421875, -1.32672119140625, -1.242431640625, -1.15814208984375, -1.0738525390625, -0.98956298828125, -0.9052734375, -0.82098388671875, -0.7366943359375, -0.65240478515625, -0.568115234375, -0.48382568359375, -0.3995361328125, -0.31524658203125, -0.23095703125, -0.14666748046875, -0.0623779296875, 0.02191162109375, 0.106201171875, 0.19049072265625, 0.2747802734375, 0.35906982421875, 0.443359375, 0.52764892578125, 0.6119384765625, 0.69622802734375, 0.780517578125, 0.86480712890625, 0.9490966796875, 1.03338623046875, 1.11767578125, 1.20196533203125, 1.2862548828125, 1.37054443359375, 1.454833984375, 1.53912353515625, 1.6234130859375, 1.70770263671875, 1.7919921875, 1.87628173828125, 1.9605712890625, 2.04486083984375, 2.129150390625, 2.21343994140625, 2.2977294921875, 2.38201904296875, 2.46630859375, 2.55059814453125, 2.6348876953125, 2.71917724609375, 2.803466796875, 2.88775634765625, 2.9720458984375, 3.05633544921875, 3.140625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 5.0, 4.0, 6.0, 7.0, 5.0, 18.0, 8.0, 16.0, 26.0, 31.0, 49.0, 51.0, 71.0, 92.0, 107.0, 111.0, 79.0, 65.0, 49.0, 35.0, 27.0, 29.0, 24.0, 18.0, 15.0, 10.0, 11.0, 3.0, 10.0, 5.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70068359375, -0.67877197265625, -0.6568603515625, -0.63494873046875, -0.613037109375, -0.59112548828125, -0.5692138671875, -0.54730224609375, -0.525390625, -0.50347900390625, -0.4815673828125, -0.45965576171875, -0.437744140625, -0.41583251953125, -0.3939208984375, -0.37200927734375, -0.35009765625, -0.32818603515625, -0.3062744140625, -0.28436279296875, -0.262451171875, -0.24053955078125, -0.2186279296875, -0.19671630859375, -0.1748046875, -0.15289306640625, -0.1309814453125, -0.10906982421875, -0.087158203125, -0.06524658203125, -0.0433349609375, -0.02142333984375, 0.00048828125, 0.02239990234375, 0.0443115234375, 0.06622314453125, 0.088134765625, 0.11004638671875, 0.1319580078125, 0.15386962890625, 0.17578125, 0.19769287109375, 0.2196044921875, 0.24151611328125, 0.263427734375, 0.28533935546875, 0.3072509765625, 0.32916259765625, 0.35107421875, 0.37298583984375, 0.3948974609375, 0.41680908203125, 0.438720703125, 0.46063232421875, 0.4825439453125, 0.50445556640625, 0.5263671875, 0.54827880859375, 0.5701904296875, 0.59210205078125, 0.614013671875, 0.63592529296875, 0.6578369140625, 0.67974853515625, 0.70166015625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 3.0, 4.0, 8.0, 8.0, 10.0, 6.0, 21.0, 16.0, 26.0, 41.0, 58.0, 67.0, 121.0, 215.0, 605.0, 2588.0, 17831.0, 531471.0, 474362.0, 17356.0, 2487.0, 561.0, 226.0, 138.0, 95.0, 54.0, 49.0, 27.0, 21.0, 16.0, 17.0, 10.0, 8.0, 6.0, 6.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.81640625, -7.53717041015625, -7.2579345703125, -6.97869873046875, -6.699462890625, -6.42022705078125, -6.1409912109375, -5.86175537109375, -5.58251953125, -5.30328369140625, -5.0240478515625, -4.74481201171875, -4.465576171875, -4.18634033203125, -3.9071044921875, -3.62786865234375, -3.3486328125, -3.06939697265625, -2.7901611328125, -2.51092529296875, -2.231689453125, -1.95245361328125, -1.6732177734375, -1.39398193359375, -1.11474609375, -0.83551025390625, -0.5562744140625, -0.27703857421875, 0.002197265625, 0.28143310546875, 0.5606689453125, 0.83990478515625, 1.119140625, 1.39837646484375, 1.6776123046875, 1.95684814453125, 2.236083984375, 2.51531982421875, 2.7945556640625, 3.07379150390625, 3.35302734375, 3.63226318359375, 3.9114990234375, 4.19073486328125, 4.469970703125, 4.74920654296875, 5.0284423828125, 5.30767822265625, 5.5869140625, 5.86614990234375, 6.1453857421875, 6.42462158203125, 6.703857421875, 6.98309326171875, 7.2623291015625, 7.54156494140625, 7.82080078125, 8.10003662109375, 8.3792724609375, 8.65850830078125, 8.937744140625, 9.21697998046875, 9.4962158203125, 9.77545166015625, 10.0546875]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 2.0, 13.0, 36.0, 64.0, 132.0, 193.0, 197.0, 155.0, 100.0, 44.0, 32.0, 18.0, 11.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.138214588165283, -4.050920486450195, -3.9636263847351074, -3.8763325214385986, -3.7890384197235107, -3.701744318008423, -3.614450216293335, -3.527156352996826, -3.4398622512817383, -3.3525681495666504, -3.2652740478515625, -3.1779801845550537, -3.090686082839966, -3.003391981124878, -2.91609787940979, -2.8288040161132812, -2.7415099143981934, -2.6542158126831055, -2.5669217109680176, -2.479627847671509, -2.392333745956421, -2.305039644241333, -2.217745542526245, -2.1304516792297363, -2.0431573390960693, -1.9558632373809814, -1.868569254875183, -1.7812751531600952, -1.6939811706542969, -1.606687068939209, -1.519392967224121, -1.4320989847183228, -1.3448050022125244, -1.2575109004974365, -1.1702169179916382, -1.0829228162765503, -0.995628833770752, -0.9083347320556641, -0.821040689945221, -0.7337466478347778, -0.6464526057243347, -0.5591585636138916, -0.4718645215034485, -0.384570449590683, -0.29727640748023987, -0.20998236536979675, -0.12268829345703125, -0.035394251346588135, 0.05189979076385498, 0.1391938328742981, 0.2264878898859024, 0.3137819468975067, 0.40107598900794983, 0.48837003111839294, 0.5756641030311584, 0.6629581451416016, 0.7502521872520447, 0.8375462293624878, 0.9248402714729309, 1.012134313583374, 1.099428415298462, 1.1867223978042603, 1.2740164995193481, 1.3613104820251465, 1.4486045837402344]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 4.0, 1.0, 1.0, 5.0, 4.0, 8.0, 9.0, 15.0, 10.0, 11.0, 15.0, 11.0, 20.0, 28.0, 21.0, 28.0, 25.0, 30.0, 30.0, 28.0, 36.0, 40.0, 45.0, 30.0, 24.0, 37.0, 50.0, 36.0, 32.0, 30.0, 36.0, 32.0, 31.0, 23.0, 30.0, 18.0, 23.0, 19.0, 23.0, 19.0, 15.0, 13.0, 10.0, 15.0, 7.0, 5.0, 4.0, 4.0, 3.0, 1.0, 5.0, 3.0, 0.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.48903578519821167, -0.4725942313671112, -0.45615270733833313, -0.43971115350723267, -0.4232696294784546, -0.4068280756473541, -0.39038652181625366, -0.3739449977874756, -0.3575034737586975, -0.34106191992759705, -0.32462039589881897, -0.3081788420677185, -0.29173731803894043, -0.27529576420783997, -0.2588542103767395, -0.24241268634796143, -0.22597113251686096, -0.2095295935869217, -0.19308805465698242, -0.17664650082588196, -0.16020497679710388, -0.14376342296600342, -0.12732188403606415, -0.11088034510612488, -0.09443880617618561, -0.07799726724624634, -0.06155572459101677, -0.0451141819357872, -0.02867264300584793, -0.012231104075908661, 0.004210442304611206, 0.020651981234550476, 0.037093520164489746, 0.053535059094429016, 0.06997659802436829, 0.08641814440488815, 0.10285968333482742, 0.1193012222647667, 0.13574276864528656, 0.15218430757522583, 0.1686258465051651, 0.18506738543510437, 0.20150892436504364, 0.2179504632949829, 0.23439201712608337, 0.25083354115486145, 0.2672750949859619, 0.28371661901474, 0.30015817284584045, 0.3165997266769409, 0.333041250705719, 0.34948280453681946, 0.36592432856559753, 0.382365882396698, 0.3988074064254761, 0.41524896025657654, 0.431690514087677, 0.44813206791877747, 0.46457359194755554, 0.481015145778656, 0.4974566698074341, 0.5138981938362122, 0.530339777469635, 0.5467813014984131, 0.5632228255271912]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 6.0, 7.0, 5.0, 7.0, 8.0, 16.0, 18.0, 21.0, 21.0, 17.0, 20.0, 26.0, 36.0, 32.0, 35.0, 31.0, 45.0, 43.0, 33.0, 43.0, 50.0, 46.0, 40.0, 39.0, 39.0, 44.0, 33.0, 23.0, 33.0, 26.0, 20.0, 28.0, 12.0, 19.0, 16.0, 9.0, 9.0, 9.0, 7.0, 13.0, 9.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.08203125, -1.0467376708984375, -1.011444091796875, -0.9761505126953125, -0.94085693359375, -0.9055633544921875, -0.870269775390625, -0.8349761962890625, -0.7996826171875, -0.7643890380859375, -0.729095458984375, -0.6938018798828125, -0.65850830078125, -0.6232147216796875, -0.587921142578125, -0.5526275634765625, -0.517333984375, -0.4820404052734375, -0.446746826171875, -0.4114532470703125, -0.37615966796875, -0.3408660888671875, -0.305572509765625, -0.2702789306640625, -0.2349853515625, -0.1996917724609375, -0.164398193359375, -0.1291046142578125, -0.09381103515625, -0.0585174560546875, -0.023223876953125, 0.0120697021484375, 0.04736328125, 0.0826568603515625, 0.117950439453125, 0.1532440185546875, 0.18853759765625, 0.2238311767578125, 0.259124755859375, 0.2944183349609375, 0.3297119140625, 0.3650054931640625, 0.400299072265625, 0.4355926513671875, 0.47088623046875, 0.5061798095703125, 0.541473388671875, 0.5767669677734375, 0.612060546875, 0.6473541259765625, 0.682647705078125, 0.7179412841796875, 0.75323486328125, 0.7885284423828125, 0.823822021484375, 0.8591156005859375, 0.8944091796875, 0.9297027587890625, 0.964996337890625, 1.0002899169921875, 1.03558349609375, 1.0708770751953125, 1.106170654296875, 1.1414642333984375, 1.1767578125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 5.0, 0.0, 3.0, 5.0, 8.0, 7.0, 7.0, 15.0, 31.0, 41.0, 46.0, 90.0, 134.0, 201.0, 304.0, 530.0, 891.0, 1572.0, 2785.0, 5351.0, 10988.0, 23512.0, 55082.0, 146619.0, 378138.0, 260048.0, 91573.0, 37071.0, 16557.0, 7861.0, 3998.0, 2089.0, 1230.0, 711.0, 390.0, 226.0, 159.0, 92.0, 66.0, 44.0, 24.0, 18.0, 14.0, 11.0, 6.0, 2.0, 3.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.5830078125, -1.527984619140625, -1.47296142578125, -1.417938232421875, -1.3629150390625, -1.307891845703125, -1.25286865234375, -1.197845458984375, -1.142822265625, -1.087799072265625, -1.03277587890625, -0.977752685546875, -0.9227294921875, -0.867706298828125, -0.81268310546875, -0.757659912109375, -0.70263671875, -0.647613525390625, -0.59259033203125, -0.537567138671875, -0.4825439453125, -0.427520751953125, -0.37249755859375, -0.317474365234375, -0.262451171875, -0.207427978515625, -0.15240478515625, -0.097381591796875, -0.0423583984375, 0.012664794921875, 0.06768798828125, 0.122711181640625, 0.177734375, 0.232757568359375, 0.28778076171875, 0.342803955078125, 0.3978271484375, 0.452850341796875, 0.50787353515625, 0.562896728515625, 0.617919921875, 0.672943115234375, 0.72796630859375, 0.782989501953125, 0.8380126953125, 0.893035888671875, 0.94805908203125, 1.003082275390625, 1.05810546875, 1.113128662109375, 1.16815185546875, 1.223175048828125, 1.2781982421875, 1.333221435546875, 1.38824462890625, 1.443267822265625, 1.498291015625, 1.553314208984375, 1.60833740234375, 1.663360595703125, 1.7183837890625, 1.773406982421875, 1.82843017578125, 1.883453369140625, 1.9384765625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 3.0, 13.0, 5.0, 9.0, 11.0, 11.0, 17.0, 15.0, 22.0, 24.0, 33.0, 29.0, 35.0, 42.0, 56.0, 98.0, 149.0, 244.0, 1386.0, 255.0, 130.0, 85.0, 64.0, 49.0, 43.0, 38.0, 31.0, 27.0, 22.0, 28.0, 13.0, 12.0, 12.0, 10.0, 11.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.36328125, -4.21990966796875, -4.0765380859375, -3.93316650390625, -3.789794921875, -3.64642333984375, -3.5030517578125, -3.35968017578125, -3.21630859375, -3.07293701171875, -2.9295654296875, -2.78619384765625, -2.642822265625, -2.49945068359375, -2.3560791015625, -2.21270751953125, -2.0693359375, -1.92596435546875, -1.7825927734375, -1.63922119140625, -1.495849609375, -1.35247802734375, -1.2091064453125, -1.06573486328125, -0.92236328125, -0.77899169921875, -0.6356201171875, -0.49224853515625, -0.348876953125, -0.20550537109375, -0.0621337890625, 0.08123779296875, 0.224609375, 0.36798095703125, 0.5113525390625, 0.65472412109375, 0.798095703125, 0.94146728515625, 1.0848388671875, 1.22821044921875, 1.37158203125, 1.51495361328125, 1.6583251953125, 1.80169677734375, 1.945068359375, 2.08843994140625, 2.2318115234375, 2.37518310546875, 2.5185546875, 2.66192626953125, 2.8052978515625, 2.94866943359375, 3.092041015625, 3.23541259765625, 3.3787841796875, 3.52215576171875, 3.66552734375, 3.80889892578125, 3.9522705078125, 4.09564208984375, 4.239013671875, 4.38238525390625, 4.5257568359375, 4.66912841796875, 4.8125]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 3.0, 6.0, 10.0, 9.0, 16.0, 21.0, 15.0, 32.0, 58.0, 59.0, 67.0, 105.0, 133.0, 230.0, 432.0, 1053.0, 4122.0, 36892.0, 1360177.0, 1692430.0, 42990.0, 4475.0, 1124.0, 426.0, 225.0, 165.0, 104.0, 71.0, 57.0, 43.0, 37.0, 23.0, 21.0, 14.0, 9.0, 15.0, 10.0, 4.0, 4.0, 6.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.73046875, -6.5135498046875, -6.296630859375, -6.0797119140625, -5.86279296875, -5.6458740234375, -5.428955078125, -5.2120361328125, -4.9951171875, -4.7781982421875, -4.561279296875, -4.3443603515625, -4.12744140625, -3.9105224609375, -3.693603515625, -3.4766845703125, -3.259765625, -3.0428466796875, -2.825927734375, -2.6090087890625, -2.39208984375, -2.1751708984375, -1.958251953125, -1.7413330078125, -1.5244140625, -1.3074951171875, -1.090576171875, -0.8736572265625, -0.65673828125, -0.4398193359375, -0.222900390625, -0.0059814453125, 0.2109375, 0.4278564453125, 0.644775390625, 0.8616943359375, 1.07861328125, 1.2955322265625, 1.512451171875, 1.7293701171875, 1.9462890625, 2.1632080078125, 2.380126953125, 2.5970458984375, 2.81396484375, 3.0308837890625, 3.247802734375, 3.4647216796875, 3.681640625, 3.8985595703125, 4.115478515625, 4.3323974609375, 4.54931640625, 4.7662353515625, 4.983154296875, 5.2000732421875, 5.4169921875, 5.6339111328125, 5.850830078125, 6.0677490234375, 6.28466796875, 6.5015869140625, 6.718505859375, 6.9354248046875, 7.15234375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 12.0, 53.0, 170.0, 323.0, 276.0, 128.0, 43.0, 5.0, 4.0], "bins": [-47.58444595336914, -46.77586364746094, -45.967281341552734, -45.158695220947266, -44.35011291503906, -43.54153060913086, -42.732948303222656, -41.92436218261719, -41.115779876708984, -40.30719757080078, -39.49861526489258, -38.69002914428711, -37.881446838378906, -37.0728645324707, -36.2642822265625, -35.45569610595703, -34.647117614746094, -33.83853530883789, -33.02995300292969, -32.22136688232422, -31.412784576416016, -30.604202270507812, -29.79561996459961, -28.987035751342773, -28.178451538085938, -27.369869232177734, -26.5612850189209, -25.752702713012695, -24.94411849975586, -24.135536193847656, -23.326953887939453, -22.518369674682617, -21.70978355407715, -20.901201248168945, -20.09261703491211, -19.284034729003906, -18.47545051574707, -17.666868209838867, -16.85828399658203, -16.049701690673828, -15.241118431091309, -14.432535171508789, -13.62395191192627, -12.81536865234375, -12.006786346435547, -11.198202133178711, -10.389619827270508, -9.581036567687988, -8.772453308105469, -7.963870048522949, -7.15528678894043, -6.346704006195068, -5.538120746612549, -4.729537487030029, -3.920954704284668, -3.1123714447021484, -2.303788185119629, -1.495205044746399, -0.686621904373169, 0.12196111679077148, 0.930544376373291, 1.7391276359558105, 2.547710418701172, 3.3562936782836914, 4.164876937866211]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 3.0, 3.0, 6.0, 13.0, 7.0, 11.0, 7.0, 15.0, 26.0, 25.0, 29.0, 21.0, 35.0, 32.0, 48.0, 50.0, 31.0, 50.0, 42.0, 50.0, 42.0, 42.0, 49.0, 53.0, 42.0, 36.0, 29.0, 36.0, 28.0, 25.0, 16.0, 22.0, 25.0, 15.0, 8.0, 9.0, 7.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.081113815307617, -11.702410697937012, -11.323708534240723, -10.945005416870117, -10.566302299499512, -10.187599182128906, -9.808897018432617, -9.430193901062012, -9.051490783691406, -8.6727876663208, -8.294085502624512, -7.915382385253906, -7.536679267883301, -7.1579766273498535, -6.779273986816406, -6.400570869445801, -6.0218682289123535, -5.643165588378906, -5.264462471008301, -4.8857598304748535, -4.507056713104248, -4.128354072570801, -3.7496511936187744, -3.370948314666748, -2.9922454357147217, -2.6135425567626953, -2.234839677810669, -1.8561369180679321, -1.4774340391159058, -1.0987311601638794, -0.7200284004211426, -0.3413255214691162, 0.037377357482910156, 0.41608020663261414, 0.7947830557823181, 1.1734858751296997, 1.552188754081726, 1.9308916330337524, 2.3095943927764893, 2.6882972717285156, 3.067000150680542, 3.4457030296325684, 3.8244059085845947, 4.203108787536621, 4.581811428070068, 4.960514545440674, 5.339217185974121, 5.717920303344727, 6.096622943878174, 6.475325584411621, 6.854028701782227, 7.232731342315674, 7.611434459686279, 7.990137100219727, 8.368840217590332, 8.747543334960938, 9.126245498657227, 9.504948616027832, 9.883650779724121, 10.262353897094727, 10.641057014465332, 11.019760131835938, 11.398462295532227, 11.777165412902832, 12.155868530273438]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 8.0, 7.0, 7.0, 4.0, 20.0, 13.0, 15.0, 21.0, 20.0, 27.0, 20.0, 31.0, 40.0, 37.0, 38.0, 34.0, 41.0, 51.0, 46.0, 41.0, 36.0, 34.0, 54.0, 47.0, 36.0, 39.0, 38.0, 19.0, 24.0, 27.0, 20.0, 26.0, 13.0, 11.0, 8.0, 17.0, 5.0, 13.0, 7.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1513671875, -1.113739013671875, -1.07611083984375, -1.038482666015625, -1.0008544921875, -0.963226318359375, -0.92559814453125, -0.887969970703125, -0.850341796875, -0.812713623046875, -0.77508544921875, -0.737457275390625, -0.6998291015625, -0.662200927734375, -0.62457275390625, -0.586944580078125, -0.54931640625, -0.511688232421875, -0.47406005859375, -0.436431884765625, -0.3988037109375, -0.361175537109375, -0.32354736328125, -0.285919189453125, -0.248291015625, -0.210662841796875, -0.17303466796875, -0.135406494140625, -0.0977783203125, -0.060150146484375, -0.02252197265625, 0.015106201171875, 0.052734375, 0.090362548828125, 0.12799072265625, 0.165618896484375, 0.2032470703125, 0.240875244140625, 0.27850341796875, 0.316131591796875, 0.353759765625, 0.391387939453125, 0.42901611328125, 0.466644287109375, 0.5042724609375, 0.541900634765625, 0.57952880859375, 0.617156982421875, 0.65478515625, 0.692413330078125, 0.73004150390625, 0.767669677734375, 0.8052978515625, 0.842926025390625, 0.88055419921875, 0.918182373046875, 0.955810546875, 0.993438720703125, 1.03106689453125, 1.068695068359375, 1.1063232421875, 1.143951416015625, 1.18157958984375, 1.219207763671875, 1.2568359375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 9.0, 8.0, 17.0, 23.0, 29.0, 35.0, 73.0, 117.0, 177.0, 314.0, 559.0, 972.0, 1836.0, 3336.0, 6450.0, 13109.0, 28661.0, 73183.0, 290636.0, 2073749.0, 1409200.0, 189130.0, 56233.0, 23356.0, 10964.0, 5345.0, 2844.0, 1587.0, 905.0, 530.0, 297.0, 177.0, 142.0, 82.0, 53.0, 31.0, 28.0, 16.0, 18.0, 9.0, 17.0, 2.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.537109375, -2.449249267578125, -2.36138916015625, -2.273529052734375, -2.1856689453125, -2.097808837890625, -2.00994873046875, -1.922088623046875, -1.834228515625, -1.746368408203125, -1.65850830078125, -1.570648193359375, -1.4827880859375, -1.394927978515625, -1.30706787109375, -1.219207763671875, -1.13134765625, -1.043487548828125, -0.95562744140625, -0.867767333984375, -0.7799072265625, -0.692047119140625, -0.60418701171875, -0.516326904296875, -0.428466796875, -0.340606689453125, -0.25274658203125, -0.164886474609375, -0.0770263671875, 0.010833740234375, 0.09869384765625, 0.186553955078125, 0.2744140625, 0.362274169921875, 0.45013427734375, 0.537994384765625, 0.6258544921875, 0.713714599609375, 0.80157470703125, 0.889434814453125, 0.977294921875, 1.065155029296875, 1.15301513671875, 1.240875244140625, 1.3287353515625, 1.416595458984375, 1.50445556640625, 1.592315673828125, 1.68017578125, 1.768035888671875, 1.85589599609375, 1.943756103515625, 2.0316162109375, 2.119476318359375, 2.20733642578125, 2.295196533203125, 2.383056640625, 2.470916748046875, 2.55877685546875, 2.646636962890625, 2.7344970703125, 2.822357177734375, 2.91021728515625, 2.998077392578125, 3.0859375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 4.0, 5.0, 7.0, 8.0, 13.0, 12.0, 16.0, 20.0, 31.0, 32.0, 51.0, 64.0, 84.0, 103.0, 149.0, 215.0, 308.0, 415.0, 533.0, 553.0, 410.0, 301.0, 199.0, 140.0, 93.0, 70.0, 65.0, 35.0, 33.0, 24.0, 30.0, 16.0, 8.0, 7.0, 9.0, 1.0, 7.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.669921875, -2.58642578125, -2.5029296875, -2.41943359375, -2.3359375, -2.25244140625, -2.1689453125, -2.08544921875, -2.001953125, -1.91845703125, -1.8349609375, -1.75146484375, -1.66796875, -1.58447265625, -1.5009765625, -1.41748046875, -1.333984375, -1.25048828125, -1.1669921875, -1.08349609375, -1.0, -0.91650390625, -0.8330078125, -0.74951171875, -0.666015625, -0.58251953125, -0.4990234375, -0.41552734375, -0.33203125, -0.24853515625, -0.1650390625, -0.08154296875, 0.001953125, 0.08544921875, 0.1689453125, 0.25244140625, 0.3359375, 0.41943359375, 0.5029296875, 0.58642578125, 0.669921875, 0.75341796875, 0.8369140625, 0.92041015625, 1.00390625, 1.08740234375, 1.1708984375, 1.25439453125, 1.337890625, 1.42138671875, 1.5048828125, 1.58837890625, 1.671875, 1.75537109375, 1.8388671875, 1.92236328125, 2.005859375, 2.08935546875, 2.1728515625, 2.25634765625, 2.33984375, 2.42333984375, 2.5068359375, 2.59033203125, 2.673828125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 6.0, 3.0, 5.0, 10.0, 10.0, 20.0, 17.0, 31.0, 39.0, 74.0, 114.0, 216.0, 374.0, 784.0, 1682.0, 3881.0, 9747.0, 29242.0, 105675.0, 665374.0, 2822132.0, 436244.0, 81040.0, 23001.0, 8190.0, 3328.0, 1460.0, 678.0, 341.0, 197.0, 122.0, 60.0, 65.0, 33.0, 32.0, 24.0, 15.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.1015625, -4.9488525390625, -4.796142578125, -4.6434326171875, -4.49072265625, -4.3380126953125, -4.185302734375, -4.0325927734375, -3.8798828125, -3.7271728515625, -3.574462890625, -3.4217529296875, -3.26904296875, -3.1163330078125, -2.963623046875, -2.8109130859375, -2.658203125, -2.5054931640625, -2.352783203125, -2.2000732421875, -2.04736328125, -1.8946533203125, -1.741943359375, -1.5892333984375, -1.4365234375, -1.2838134765625, -1.131103515625, -0.9783935546875, -0.82568359375, -0.6729736328125, -0.520263671875, -0.3675537109375, -0.21484375, -0.0621337890625, 0.090576171875, 0.2432861328125, 0.39599609375, 0.5487060546875, 0.701416015625, 0.8541259765625, 1.0068359375, 1.1595458984375, 1.312255859375, 1.4649658203125, 1.61767578125, 1.7703857421875, 1.923095703125, 2.0758056640625, 2.228515625, 2.3812255859375, 2.533935546875, 2.6866455078125, 2.83935546875, 2.9920654296875, 3.144775390625, 3.2974853515625, 3.4501953125, 3.6029052734375, 3.755615234375, 3.9083251953125, 4.06103515625, 4.2137451171875, 4.366455078125, 4.5191650390625, 4.671875]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 6.0, 6.0, 5.0, 7.0, 18.0, 26.0, 22.0, 29.0, 60.0, 55.0, 59.0, 67.0, 71.0, 99.0, 86.0, 96.0, 60.0, 33.0, 48.0, 31.0, 28.0, 21.0, 21.0, 9.0, 15.0, 5.0, 6.0, 2.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.821662902832031, -14.431999206542969, -14.042335510253906, -13.652671813964844, -13.263008117675781, -12.873344421386719, -12.483680725097656, -12.09401798248291, -11.704354286193848, -11.314690589904785, -10.925026893615723, -10.53536319732666, -10.145699501037598, -9.756036758422852, -9.366373062133789, -8.976709365844727, -8.587045669555664, -8.197381973266602, -7.807718276977539, -7.418054580688477, -7.028391361236572, -6.63872766494751, -6.249063968658447, -5.859400749206543, -5.469736099243164, -5.080072402954102, -4.690408706665039, -4.300745010375977, -3.9110817909240723, -3.5214180946350098, -3.1317543983459473, -2.742090940475464, -2.3524274826049805, -1.9627639055252075, -1.5731003284454346, -1.183436632156372, -0.7937730550765991, -0.40410947799682617, -0.014445781707763672, 0.3752176761627197, 0.7648813724517822, 1.1545449495315552, 1.5442085266113281, 1.9338722229003906, 2.323535919189453, 2.7131993770599365, 3.102863073348999, 3.4925265312194824, 3.882190227508545, 4.271853923797607, 4.66151762008667, 5.051180839538574, 5.440844535827637, 5.830508232116699, 6.220171928405762, 6.609835624694824, 6.999499320983887, 7.389163017272949, 7.778826713562012, 8.168490409851074, 8.558154106140137, 8.947816848754883, 9.337480545043945, 9.727144241333008, 10.11680793762207]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 6.0, 5.0, 2.0, 4.0, 3.0, 7.0, 6.0, 7.0, 5.0, 19.0, 10.0, 16.0, 20.0, 10.0, 17.0, 18.0, 27.0, 31.0, 35.0, 29.0, 33.0, 29.0, 35.0, 28.0, 28.0, 40.0, 31.0, 38.0, 38.0, 38.0, 35.0, 38.0, 32.0, 26.0, 25.0, 28.0, 28.0, 37.0, 21.0, 16.0, 17.0, 24.0, 12.0, 13.0, 6.0, 8.0, 7.0, 3.0, 6.0, 2.0, 5.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.9561567306518555, -6.717319488525391, -6.478482246398926, -6.239645481109619, -6.000808238983154, -5.7619709968566895, -5.523134231567383, -5.284296989440918, -5.045459747314453, -4.806622505187988, -4.567785263061523, -4.328948497772217, -4.090111255645752, -3.851274013519287, -3.6124370098114014, -3.3736000061035156, -3.134762763977051, -2.895925521850586, -2.6570885181427, -2.4182515144348145, -2.1794142723083496, -1.9405771493911743, -1.701740026473999, -1.4629029035568237, -1.2240657806396484, -0.9852286577224731, -0.7463915348052979, -0.5075544118881226, -0.26871728897094727, -0.029880166053771973, 0.20895695686340332, 0.4477940797805786, 0.6866312026977539, 0.9254683256149292, 1.1643054485321045, 1.4031425714492798, 1.641979694366455, 1.8808168172836304, 2.1196539402008057, 2.3584909439086914, 2.5973281860351562, 2.836165428161621, 3.075002431869507, 3.3138394355773926, 3.5526766777038574, 3.7915139198303223, 4.030350685119629, 4.269187927246094, 4.508025169372559, 4.746862411499023, 4.985699653625488, 5.224536418914795, 5.46337366104126, 5.702210903167725, 5.941047668457031, 6.179884910583496, 6.418722152709961, 6.657559394836426, 6.896396636962891, 7.135233402252197, 7.374070644378662, 7.612907886505127, 7.851744651794434, 8.090581893920898, 8.329419136047363]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 7.0, 8.0, 9.0, 13.0, 16.0, 15.0, 25.0, 25.0, 22.0, 19.0, 33.0, 30.0, 35.0, 33.0, 36.0, 38.0, 41.0, 44.0, 44.0, 45.0, 49.0, 37.0, 29.0, 47.0, 34.0, 31.0, 28.0, 31.0, 30.0, 24.0, 25.0, 13.0, 18.0, 15.0, 12.0, 7.0, 8.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.11328125, -1.0773162841796875, -1.041351318359375, -1.0053863525390625, -0.96942138671875, -0.9334564208984375, -0.897491455078125, -0.8615264892578125, -0.8255615234375, -0.7895965576171875, -0.753631591796875, -0.7176666259765625, -0.68170166015625, -0.6457366943359375, -0.609771728515625, -0.5738067626953125, -0.537841796875, -0.5018768310546875, -0.465911865234375, -0.4299468994140625, -0.39398193359375, -0.3580169677734375, -0.322052001953125, -0.2860870361328125, -0.2501220703125, -0.2141571044921875, -0.178192138671875, -0.1422271728515625, -0.10626220703125, -0.0702972412109375, -0.034332275390625, 0.0016326904296875, 0.03759765625, 0.0735626220703125, 0.109527587890625, 0.1454925537109375, 0.18145751953125, 0.2174224853515625, 0.253387451171875, 0.2893524169921875, 0.3253173828125, 0.3612823486328125, 0.397247314453125, 0.4332122802734375, 0.46917724609375, 0.5051422119140625, 0.541107177734375, 0.5770721435546875, 0.613037109375, 0.6490020751953125, 0.684967041015625, 0.7209320068359375, 0.75689697265625, 0.7928619384765625, 0.828826904296875, 0.8647918701171875, 0.9007568359375, 0.9367218017578125, 0.972686767578125, 1.0086517333984375, 1.04461669921875, 1.0805816650390625, 1.116546630859375, 1.1525115966796875, 1.1884765625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 7.0, 11.0, 15.0, 13.0, 30.0, 51.0, 75.0, 146.0, 241.0, 341.0, 575.0, 984.0, 1704.0, 2844.0, 4923.0, 8597.0, 14998.0, 25286.0, 43388.0, 74874.0, 132315.0, 405567.0, 142097.0, 79459.0, 45697.0, 26705.0, 15682.0, 9252.0, 5229.0, 3041.0, 1764.0, 1039.0, 643.0, 365.0, 215.0, 154.0, 82.0, 39.0, 36.0, 23.0, 16.0, 15.0, 8.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.125, -3.9942626953125, -3.863525390625, -3.7327880859375, -3.60205078125, -3.4713134765625, -3.340576171875, -3.2098388671875, -3.0791015625, -2.9483642578125, -2.817626953125, -2.6868896484375, -2.55615234375, -2.4254150390625, -2.294677734375, -2.1639404296875, -2.033203125, -1.9024658203125, -1.771728515625, -1.6409912109375, -1.51025390625, -1.3795166015625, -1.248779296875, -1.1180419921875, -0.9873046875, -0.8565673828125, -0.725830078125, -0.5950927734375, -0.46435546875, -0.3336181640625, -0.202880859375, -0.0721435546875, 0.05859375, 0.1893310546875, 0.320068359375, 0.4508056640625, 0.58154296875, 0.7122802734375, 0.843017578125, 0.9737548828125, 1.1044921875, 1.2352294921875, 1.365966796875, 1.4967041015625, 1.62744140625, 1.7581787109375, 1.888916015625, 2.0196533203125, 2.150390625, 2.2811279296875, 2.411865234375, 2.5426025390625, 2.67333984375, 2.8040771484375, 2.934814453125, 3.0655517578125, 3.1962890625, 3.3270263671875, 3.457763671875, 3.5885009765625, 3.71923828125, 3.8499755859375, 3.980712890625, 4.1114501953125, 4.2421875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 4.0, 5.0, 7.0, 9.0, 7.0, 9.0, 15.0, 19.0, 9.0, 15.0, 18.0, 26.0, 24.0, 34.0, 31.0, 43.0, 32.0, 47.0, 40.0, 39.0, 42.0, 40.0, 1062.0, 53.0, 33.0, 27.0, 45.0, 41.0, 27.0, 22.0, 25.0, 32.0, 26.0, 22.0, 12.0, 17.0, 11.0, 10.0, 12.0, 8.0, 6.0, 9.0, 7.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.82470703125, -0.7999038696289062, -0.7751007080078125, -0.7502975463867188, -0.725494384765625, -0.7006912231445312, -0.6758880615234375, -0.6510848999023438, -0.62628173828125, -0.6014785766601562, -0.5766754150390625, -0.5518722534179688, -0.527069091796875, -0.5022659301757812, -0.4774627685546875, -0.45265960693359375, -0.4278564453125, -0.40305328369140625, -0.3782501220703125, -0.35344696044921875, -0.328643798828125, -0.30384063720703125, -0.2790374755859375, -0.25423431396484375, -0.22943115234375, -0.20462799072265625, -0.1798248291015625, -0.15502166748046875, -0.130218505859375, -0.10541534423828125, -0.0806121826171875, -0.05580902099609375, -0.031005859375, -0.00620269775390625, 0.0186004638671875, 0.04340362548828125, 0.068206787109375, 0.09300994873046875, 0.1178131103515625, 0.14261627197265625, 0.16741943359375, 0.19222259521484375, 0.2170257568359375, 0.24182891845703125, 0.266632080078125, 0.29143524169921875, 0.3162384033203125, 0.34104156494140625, 0.3658447265625, 0.39064788818359375, 0.4154510498046875, 0.44025421142578125, 0.465057373046875, 0.48986053466796875, 0.5146636962890625, 0.5394668579101562, 0.56427001953125, 0.5890731811523438, 0.6138763427734375, 0.6386795043945312, 0.663482666015625, 0.6882858276367188, 0.7130889892578125, 0.7378921508789062, 0.7626953125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 4.0, 12.0, 18.0, 22.0, 27.0, 48.0, 57.0, 115.0, 155.0, 210.0, 294.0, 497.0, 762.0, 1165.0, 1765.0, 2751.0, 4409.0, 7095.0, 12087.0, 21497.0, 41027.0, 88048.0, 282236.0, 1278499.0, 199824.0, 72695.0, 34632.0, 18833.0, 10851.0, 6466.0, 3998.0, 2475.0, 1522.0, 1005.0, 701.0, 433.0, 294.0, 206.0, 139.0, 86.0, 48.0, 30.0, 33.0, 16.0, 12.0, 9.0, 12.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.248046875, -2.176422119140625, -2.10479736328125, -2.033172607421875, -1.9615478515625, -1.889923095703125, -1.81829833984375, -1.746673583984375, -1.675048828125, -1.603424072265625, -1.53179931640625, -1.460174560546875, -1.3885498046875, -1.316925048828125, -1.24530029296875, -1.173675537109375, -1.10205078125, -1.030426025390625, -0.95880126953125, -0.887176513671875, -0.8155517578125, -0.743927001953125, -0.67230224609375, -0.600677490234375, -0.529052734375, -0.457427978515625, -0.38580322265625, -0.314178466796875, -0.2425537109375, -0.170928955078125, -0.09930419921875, -0.027679443359375, 0.0439453125, 0.115570068359375, 0.18719482421875, 0.258819580078125, 0.3304443359375, 0.402069091796875, 0.47369384765625, 0.545318603515625, 0.616943359375, 0.688568115234375, 0.76019287109375, 0.831817626953125, 0.9034423828125, 0.975067138671875, 1.04669189453125, 1.118316650390625, 1.18994140625, 1.261566162109375, 1.33319091796875, 1.404815673828125, 1.4764404296875, 1.548065185546875, 1.61968994140625, 1.691314697265625, 1.762939453125, 1.834564208984375, 1.90618896484375, 1.977813720703125, 2.0494384765625, 2.121063232421875, 2.19268798828125, 2.264312744140625, 2.3359375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 5.0, 3.0, 5.0, 8.0, 5.0, 13.0, 15.0, 13.0, 23.0, 39.0, 60.0, 70.0, 178.0, 215.0, 93.0, 67.0, 50.0, 27.0, 22.0, 19.0, 14.0, 14.0, 6.0, 6.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.58056640625, -0.5599441528320312, -0.5393218994140625, -0.5186996459960938, -0.498077392578125, -0.47745513916015625, -0.4568328857421875, -0.43621063232421875, -0.41558837890625, -0.39496612548828125, -0.3743438720703125, -0.35372161865234375, -0.333099365234375, -0.31247711181640625, -0.2918548583984375, -0.27123260498046875, -0.2506103515625, -0.22998809814453125, -0.2093658447265625, -0.18874359130859375, -0.168121337890625, -0.14749908447265625, -0.1268768310546875, -0.10625457763671875, -0.08563232421875, -0.06501007080078125, -0.0443878173828125, -0.02376556396484375, -0.003143310546875, 0.01747894287109375, 0.0381011962890625, 0.05872344970703125, 0.079345703125, 0.09996795654296875, 0.1205902099609375, 0.14121246337890625, 0.161834716796875, 0.18245697021484375, 0.2030792236328125, 0.22370147705078125, 0.24432373046875, 0.26494598388671875, 0.2855682373046875, 0.30619049072265625, 0.326812744140625, 0.34743499755859375, 0.3680572509765625, 0.38867950439453125, 0.4093017578125, 0.42992401123046875, 0.4505462646484375, 0.47116851806640625, 0.491790771484375, 0.5124130249023438, 0.5330352783203125, 0.5536575317382812, 0.57427978515625, 0.5949020385742188, 0.6155242919921875, 0.6361465454101562, 0.656768798828125, 0.6773910522460938, 0.6980133056640625, 0.7186355590820312, 0.7392578125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 7.0, 7.0, 17.0, 8.0, 14.0, 23.0, 41.0, 80.0, 161.0, 358.0, 877.0, 2418.0, 9890.0, 121570.0, 880487.0, 25652.0, 4516.0, 1347.0, 571.0, 216.0, 109.0, 65.0, 24.0, 24.0, 18.0, 13.0, 6.0, 4.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.4765625, -8.2215576171875, -7.966552734375, -7.7115478515625, -7.45654296875, -7.2015380859375, -6.946533203125, -6.6915283203125, -6.4365234375, -6.1815185546875, -5.926513671875, -5.6715087890625, -5.41650390625, -5.1614990234375, -4.906494140625, -4.6514892578125, -4.396484375, -4.1414794921875, -3.886474609375, -3.6314697265625, -3.37646484375, -3.1214599609375, -2.866455078125, -2.6114501953125, -2.3564453125, -2.1014404296875, -1.846435546875, -1.5914306640625, -1.33642578125, -1.0814208984375, -0.826416015625, -0.5714111328125, -0.31640625, -0.0614013671875, 0.193603515625, 0.4486083984375, 0.70361328125, 0.9586181640625, 1.213623046875, 1.4686279296875, 1.7236328125, 1.9786376953125, 2.233642578125, 2.4886474609375, 2.74365234375, 2.9986572265625, 3.253662109375, 3.5086669921875, 3.763671875, 4.0186767578125, 4.273681640625, 4.5286865234375, 4.78369140625, 5.0386962890625, 5.293701171875, 5.5487060546875, 5.8037109375, 6.0587158203125, 6.313720703125, 6.5687255859375, 6.82373046875, 7.0787353515625, 7.333740234375, 7.5887451171875, 7.84375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 18.0, 35.0, 88.0, 199.0, 381.0, 181.0, 61.0, 21.0, 10.0, 5.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.8809003829956055, -7.727471351623535, -7.574042320251465, -7.420613765716553, -7.267184734344482, -7.113755702972412, -6.960326671600342, -6.8068976402282715, -6.653469085693359, -6.500040054321289, -6.346611022949219, -6.193182468414307, -6.039753437042236, -5.886324405670166, -5.732895374298096, -5.579466342926025, -5.426037311553955, -5.272608280181885, -5.1191792488098145, -4.965750694274902, -4.812321662902832, -4.658892631530762, -4.505463600158691, -4.352034568786621, -4.198605537414551, -4.0451765060424805, -3.8917477130889893, -3.738318681716919, -3.5848898887634277, -3.4314608573913574, -3.278031826019287, -3.124602794647217, -2.971174478530884, -2.8177454471588135, -2.6643166542053223, -2.510887622833252, -2.3574585914611816, -2.2040297985076904, -2.05060076713562, -1.8971718549728394, -1.7437429428100586, -1.5903140306472778, -1.436885118484497, -1.2834560871124268, -1.130027174949646, -0.9765982627868652, -0.8231692910194397, -0.6697403192520142, -0.5163114070892334, -0.36288246512413025, -0.2094535231590271, -0.05602458119392395, 0.0974043607711792, 0.25083327293395996, 0.4042622447013855, 0.557691216468811, 0.7111201286315918, 0.8645490407943726, 1.0179779529571533, 1.1714069843292236, 1.3248358964920044, 1.4782648086547852, 1.6316938400268555, 1.7851227521896362, 1.938551664352417]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 6.0, 8.0, 4.0, 9.0, 8.0, 22.0, 25.0, 22.0, 26.0, 31.0, 27.0, 40.0, 36.0, 48.0, 40.0, 59.0, 55.0, 47.0, 41.0, 53.0, 53.0, 46.0, 51.0, 43.0, 42.0, 31.0, 19.0, 17.0, 24.0, 16.0, 15.0, 6.0, 9.0, 8.0, 6.0, 3.0, 6.0, 1.0, 0.0, 4.0, 2.0], "bins": [-1.2720398902893066, -1.2410086393356323, -1.209977388381958, -1.1789461374282837, -1.1479148864746094, -1.1168837547302246, -1.0858525037765503, -1.054821252822876, -1.0237900018692017, -0.9927587509155273, -0.961727499961853, -0.9306963086128235, -0.8996650576591492, -0.8686338067054749, -0.8376026153564453, -0.806571364402771, -0.7755401134490967, -0.7445088624954224, -0.713477611541748, -0.6824464201927185, -0.6514151692390442, -0.6203839182853699, -0.5893527269363403, -0.558321475982666, -0.5272902250289917, -0.4962589740753174, -0.46522775292396545, -0.4341965317726135, -0.4031652808189392, -0.3721340298652649, -0.34110280871391296, -0.31007158756256104, -0.27904027700424194, -0.24800904095172882, -0.2169778048992157, -0.18594656884670258, -0.15491533279418945, -0.12388409674167633, -0.09285286068916321, -0.061821624636650085, -0.030790388584136963, 0.00024084746837615967, 0.03127208352088928, 0.062303319573402405, 0.09333455562591553, 0.12436579167842865, 0.15539702773094177, 0.1864282637834549, 0.21745949983596802, 0.24849073588848114, 0.27952197194099426, 0.3105531930923462, 0.3415844440460205, 0.3726156949996948, 0.40364691615104675, 0.4346781373023987, 0.465709388256073, 0.4967406392097473, 0.5277718305587769, 0.5588030815124512, 0.5898343324661255, 0.6208655834197998, 0.6518968343734741, 0.6829280257225037, 0.713959276676178]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 7.0, 7.0, 9.0, 11.0, 16.0, 13.0, 16.0, 28.0, 21.0, 25.0, 24.0, 29.0, 26.0, 35.0, 32.0, 38.0, 44.0, 47.0, 34.0, 45.0, 43.0, 38.0, 42.0, 31.0, 50.0, 31.0, 32.0, 26.0, 35.0, 25.0, 26.0, 21.0, 23.0, 14.0, 14.0, 7.0, 12.0, 7.0, 5.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.10546875, -1.069549560546875, -1.03363037109375, -0.997711181640625, -0.9617919921875, -0.925872802734375, -0.88995361328125, -0.854034423828125, -0.818115234375, -0.782196044921875, -0.74627685546875, -0.710357666015625, -0.6744384765625, -0.638519287109375, -0.60260009765625, -0.566680908203125, -0.53076171875, -0.494842529296875, -0.45892333984375, -0.423004150390625, -0.3870849609375, -0.351165771484375, -0.31524658203125, -0.279327392578125, -0.243408203125, -0.207489013671875, -0.17156982421875, -0.135650634765625, -0.0997314453125, -0.063812255859375, -0.02789306640625, 0.008026123046875, 0.0439453125, 0.079864501953125, 0.11578369140625, 0.151702880859375, 0.1876220703125, 0.223541259765625, 0.25946044921875, 0.295379638671875, 0.331298828125, 0.367218017578125, 0.40313720703125, 0.439056396484375, 0.4749755859375, 0.510894775390625, 0.54681396484375, 0.582733154296875, 0.61865234375, 0.654571533203125, 0.69049072265625, 0.726409912109375, 0.7623291015625, 0.798248291015625, 0.83416748046875, 0.870086669921875, 0.906005859375, 0.941925048828125, 0.97784423828125, 1.013763427734375, 1.0496826171875, 1.085601806640625, 1.12152099609375, 1.157440185546875, 1.193359375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 7.0, 5.0, 13.0, 26.0, 21.0, 36.0, 36.0, 81.0, 91.0, 129.0, 229.0, 279.0, 448.0, 645.0, 1038.0, 1603.0, 2529.0, 3914.0, 6456.0, 10835.0, 18628.0, 32837.0, 60389.0, 125970.0, 290917.0, 256503.0, 108344.0, 53935.0, 29643.0, 16828.0, 9858.0, 5984.0, 3599.0, 2323.0, 1483.0, 980.0, 596.0, 423.0, 270.0, 198.0, 152.0, 88.0, 45.0, 51.0, 23.0, 22.0, 19.0, 7.0, 2.0, 10.0, 2.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-1.3876953125, -1.344207763671875, -1.30072021484375, -1.257232666015625, -1.2137451171875, -1.170257568359375, -1.12677001953125, -1.083282470703125, -1.039794921875, -0.996307373046875, -0.95281982421875, -0.909332275390625, -0.8658447265625, -0.822357177734375, -0.77886962890625, -0.735382080078125, -0.69189453125, -0.648406982421875, -0.60491943359375, -0.561431884765625, -0.5179443359375, -0.474456787109375, -0.43096923828125, -0.387481689453125, -0.343994140625, -0.300506591796875, -0.25701904296875, -0.213531494140625, -0.1700439453125, -0.126556396484375, -0.08306884765625, -0.039581298828125, 0.00390625, 0.047393798828125, 0.09088134765625, 0.134368896484375, 0.1778564453125, 0.221343994140625, 0.26483154296875, 0.308319091796875, 0.351806640625, 0.395294189453125, 0.43878173828125, 0.482269287109375, 0.5257568359375, 0.569244384765625, 0.61273193359375, 0.656219482421875, 0.69970703125, 0.743194580078125, 0.78668212890625, 0.830169677734375, 0.8736572265625, 0.917144775390625, 0.96063232421875, 1.004119873046875, 1.047607421875, 1.091094970703125, 1.13458251953125, 1.178070068359375, 1.2215576171875, 1.265045166015625, 1.30853271484375, 1.352020263671875, 1.3955078125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 8.0, 4.0, 2.0, 4.0, 4.0, 13.0, 6.0, 11.0, 21.0, 22.0, 23.0, 24.0, 31.0, 41.0, 35.0, 39.0, 42.0, 66.0, 91.0, 141.0, 277.0, 1391.0, 199.0, 115.0, 67.0, 50.0, 58.0, 43.0, 44.0, 32.0, 22.0, 18.0, 21.0, 18.0, 18.0, 8.0, 9.0, 9.0, 4.0, 6.0, 8.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.55859375, -3.43255615234375, -3.3065185546875, -3.18048095703125, -3.054443359375, -2.92840576171875, -2.8023681640625, -2.67633056640625, -2.55029296875, -2.42425537109375, -2.2982177734375, -2.17218017578125, -2.046142578125, -1.92010498046875, -1.7940673828125, -1.66802978515625, -1.5419921875, -1.41595458984375, -1.2899169921875, -1.16387939453125, -1.037841796875, -0.91180419921875, -0.7857666015625, -0.65972900390625, -0.53369140625, -0.40765380859375, -0.2816162109375, -0.15557861328125, -0.029541015625, 0.09649658203125, 0.2225341796875, 0.34857177734375, 0.474609375, 0.60064697265625, 0.7266845703125, 0.85272216796875, 0.978759765625, 1.10479736328125, 1.2308349609375, 1.35687255859375, 1.48291015625, 1.60894775390625, 1.7349853515625, 1.86102294921875, 1.987060546875, 2.11309814453125, 2.2391357421875, 2.36517333984375, 2.4912109375, 2.61724853515625, 2.7432861328125, 2.86932373046875, 2.995361328125, 3.12139892578125, 3.2474365234375, 3.37347412109375, 3.49951171875, 3.62554931640625, 3.7515869140625, 3.87762451171875, 4.003662109375, 4.12969970703125, 4.2557373046875, 4.38177490234375, 4.5078125]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 8.0, 2.0, 7.0, 5.0, 11.0, 5.0, 27.0, 30.0, 55.0, 51.0, 99.0, 157.0, 290.0, 707.0, 2340.0, 46963.0, 2994796.0, 95307.0, 3300.0, 744.0, 336.0, 182.0, 103.0, 70.0, 31.0, 34.0, 17.0, 16.0, 10.0, 5.0, 6.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.015625, -9.6240234375, -9.232421875, -8.8408203125, -8.44921875, -8.0576171875, -7.666015625, -7.2744140625, -6.8828125, -6.4912109375, -6.099609375, -5.7080078125, -5.31640625, -4.9248046875, -4.533203125, -4.1416015625, -3.75, -3.3583984375, -2.966796875, -2.5751953125, -2.18359375, -1.7919921875, -1.400390625, -1.0087890625, -0.6171875, -0.2255859375, 0.166015625, 0.5576171875, 0.94921875, 1.3408203125, 1.732421875, 2.1240234375, 2.515625, 2.9072265625, 3.298828125, 3.6904296875, 4.08203125, 4.4736328125, 4.865234375, 5.2568359375, 5.6484375, 6.0400390625, 6.431640625, 6.8232421875, 7.21484375, 7.6064453125, 7.998046875, 8.3896484375, 8.78125, 9.1728515625, 9.564453125, 9.9560546875, 10.34765625, 10.7392578125, 11.130859375, 11.5224609375, 11.9140625, 12.3056640625, 12.697265625, 13.0888671875, 13.48046875, 13.8720703125, 14.263671875, 14.6552734375, 15.046875]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 9.0, 16.0, 47.0, 65.0, 123.0, 161.0, 161.0, 167.0, 119.0, 69.0, 41.0, 24.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.373991012573242, -21.913969039916992, -21.45394515991211, -20.99392318725586, -20.533899307250977, -20.073877334594727, -19.613853454589844, -19.153831481933594, -18.693809509277344, -18.233787536621094, -17.77376365661621, -17.31374168395996, -16.853717803955078, -16.393695831298828, -15.933672904968262, -15.473649978637695, -15.013627052307129, -14.553604125976562, -14.093581199645996, -13.63355827331543, -13.17353630065918, -12.713513374328613, -12.253490447998047, -11.79346752166748, -11.333444595336914, -10.873421669006348, -10.413398742675781, -9.953376770019531, -9.493353843688965, -9.033330917358398, -8.573307991027832, -8.113285064697266, -7.653263092041016, -7.193240165710449, -6.733217716217041, -6.273194789886475, -5.813172340393066, -5.3531494140625, -4.893126487731934, -4.433103561401367, -3.973081111907959, -3.5130584239959717, -3.0530357360839844, -2.593012809753418, -2.1329901218414307, -1.6729674339294434, -1.212944507598877, -0.7529218196868896, -0.29289913177490234, 0.16712361574172974, 0.6271463632583618, 1.0871691703796387, 1.547191858291626, 2.0072145462036133, 2.4672374725341797, 2.927260160446167, 3.3872828483581543, 3.8473055362701416, 4.307328224182129, 4.767351150512695, 5.227374076843262, 5.68739652633667, 6.147419452667236, 6.6074419021606445, 7.067464828491211]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 5.0, 4.0, 2.0, 3.0, 2.0, 6.0, 5.0, 3.0, 8.0, 10.0, 17.0, 16.0, 11.0, 17.0, 29.0, 23.0, 25.0, 33.0, 30.0, 30.0, 23.0, 36.0, 36.0, 34.0, 40.0, 39.0, 39.0, 38.0, 34.0, 39.0, 34.0, 37.0, 25.0, 43.0, 35.0, 24.0, 17.0, 22.0, 26.0, 18.0, 13.0, 10.0, 9.0, 15.0, 10.0, 7.0, 5.0, 7.0, 4.0, 4.0, 3.0, 7.0, 2.0, 3.0, 1.0], "bins": [-11.981572151184082, -11.64344310760498, -11.305314064025879, -10.967184066772461, -10.62905502319336, -10.290925979614258, -9.952796936035156, -9.614667892456055, -9.276538848876953, -8.938409805297852, -8.60028076171875, -8.262151718139648, -7.9240217208862305, -7.585892677307129, -7.247763633728027, -6.909634590148926, -6.571504592895508, -6.233375549316406, -5.8952460289001465, -5.557116985321045, -5.218987464904785, -4.880858421325684, -4.542729377746582, -4.2046003341674805, -3.8664708137512207, -3.52834153175354, -3.1902122497558594, -2.852083206176758, -2.513953924179077, -2.1758246421813965, -1.837695598602295, -1.4995663166046143, -1.1614360809326172, -0.8233068585395813, -0.4851776361465454, -0.1470484733581543, 0.19108080863952637, 0.529210090637207, 0.8673391342163086, 1.2054684162139893, 1.54359769821167, 1.8817269802093506, 2.2198562622070312, 2.557985305786133, 2.8961145877838135, 3.234243869781494, 3.5723729133605957, 3.9105021953582764, 4.248631477355957, 4.586760520935059, 4.924890041351318, 5.26301908493042, 5.60114860534668, 5.939277648925781, 6.277406692504883, 6.615535736083984, 6.953665256500244, 7.291794300079346, 7.6299238204956055, 7.968052864074707, 8.306181907653809, 8.644311904907227, 8.982440948486328, 9.32056999206543, 9.658699035644531]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 7.0, 7.0, 8.0, 12.0, 11.0, 15.0, 13.0, 21.0, 16.0, 27.0, 24.0, 22.0, 34.0, 31.0, 26.0, 30.0, 38.0, 44.0, 34.0, 44.0, 41.0, 39.0, 44.0, 34.0, 41.0, 35.0, 39.0, 40.0, 27.0, 28.0, 20.0, 24.0, 21.0, 20.0, 18.0, 18.0, 10.0, 10.0, 8.0, 7.0, 3.0, 5.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.1591796875, -1.1226806640625, -1.086181640625, -1.0496826171875, -1.01318359375, -0.9766845703125, -0.940185546875, -0.9036865234375, -0.8671875, -0.8306884765625, -0.794189453125, -0.7576904296875, -0.72119140625, -0.6846923828125, -0.648193359375, -0.6116943359375, -0.5751953125, -0.5386962890625, -0.502197265625, -0.4656982421875, -0.42919921875, -0.3927001953125, -0.356201171875, -0.3197021484375, -0.283203125, -0.2467041015625, -0.210205078125, -0.1737060546875, -0.13720703125, -0.1007080078125, -0.064208984375, -0.0277099609375, 0.0087890625, 0.0452880859375, 0.081787109375, 0.1182861328125, 0.15478515625, 0.1912841796875, 0.227783203125, 0.2642822265625, 0.30078125, 0.3372802734375, 0.373779296875, 0.4102783203125, 0.44677734375, 0.4832763671875, 0.519775390625, 0.5562744140625, 0.5927734375, 0.6292724609375, 0.665771484375, 0.7022705078125, 0.73876953125, 0.7752685546875, 0.811767578125, 0.8482666015625, 0.884765625, 0.9212646484375, 0.957763671875, 0.9942626953125, 1.03076171875, 1.0672607421875, 1.103759765625, 1.1402587890625, 1.1767578125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 11.0, 16.0, 22.0, 29.0, 31.0, 65.0, 74.0, 145.0, 223.0, 396.0, 604.0, 991.0, 1718.0, 3027.0, 5432.0, 10566.0, 21535.0, 49865.0, 143903.0, 711965.0, 2233200.0, 761038.0, 152823.0, 51891.0, 21874.0, 10461.0, 5406.0, 2838.0, 1608.0, 986.0, 600.0, 327.0, 204.0, 135.0, 84.0, 63.0, 43.0, 21.0, 20.0, 12.0, 5.0, 11.0, 6.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.310546875, -2.234832763671875, -2.15911865234375, -2.083404541015625, -2.0076904296875, -1.931976318359375, -1.85626220703125, -1.780548095703125, -1.704833984375, -1.629119873046875, -1.55340576171875, -1.477691650390625, -1.4019775390625, -1.326263427734375, -1.25054931640625, -1.174835205078125, -1.09912109375, -1.023406982421875, -0.94769287109375, -0.871978759765625, -0.7962646484375, -0.720550537109375, -0.64483642578125, -0.569122314453125, -0.493408203125, -0.417694091796875, -0.34197998046875, -0.266265869140625, -0.1905517578125, -0.114837646484375, -0.03912353515625, 0.036590576171875, 0.1123046875, 0.188018798828125, 0.26373291015625, 0.339447021484375, 0.4151611328125, 0.490875244140625, 0.56658935546875, 0.642303466796875, 0.718017578125, 0.793731689453125, 0.86944580078125, 0.945159912109375, 1.0208740234375, 1.096588134765625, 1.17230224609375, 1.248016357421875, 1.32373046875, 1.399444580078125, 1.47515869140625, 1.550872802734375, 1.6265869140625, 1.702301025390625, 1.77801513671875, 1.853729248046875, 1.929443359375, 2.005157470703125, 2.08087158203125, 2.156585693359375, 2.2322998046875, 2.308013916015625, 2.38372802734375, 2.459442138671875, 2.53515625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 8.0, 9.0, 11.0, 9.0, 20.0, 32.0, 53.0, 73.0, 113.0, 144.0, 193.0, 298.0, 502.0, 632.0, 625.0, 436.0, 298.0, 186.0, 134.0, 98.0, 59.0, 49.0, 32.0, 23.0, 16.0, 11.0, 7.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0859375, -2.979461669921875, -2.87298583984375, -2.766510009765625, -2.6600341796875, -2.553558349609375, -2.44708251953125, -2.340606689453125, -2.234130859375, -2.127655029296875, -2.02117919921875, -1.914703369140625, -1.8082275390625, -1.701751708984375, -1.59527587890625, -1.488800048828125, -1.38232421875, -1.275848388671875, -1.16937255859375, -1.062896728515625, -0.9564208984375, -0.849945068359375, -0.74346923828125, -0.636993408203125, -0.530517578125, -0.424041748046875, -0.31756591796875, -0.211090087890625, -0.1046142578125, 0.001861572265625, 0.10833740234375, 0.214813232421875, 0.3212890625, 0.427764892578125, 0.53424072265625, 0.640716552734375, 0.7471923828125, 0.853668212890625, 0.96014404296875, 1.066619873046875, 1.173095703125, 1.279571533203125, 1.38604736328125, 1.492523193359375, 1.5989990234375, 1.705474853515625, 1.81195068359375, 1.918426513671875, 2.02490234375, 2.131378173828125, 2.23785400390625, 2.344329833984375, 2.4508056640625, 2.557281494140625, 2.66375732421875, 2.770233154296875, 2.876708984375, 2.983184814453125, 3.08966064453125, 3.196136474609375, 3.3026123046875, 3.409088134765625, 3.51556396484375, 3.622039794921875, 3.728515625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 5.0, 9.0, 7.0, 18.0, 26.0, 38.0, 41.0, 104.0, 166.0, 380.0, 925.0, 2521.0, 8418.0, 34614.0, 197487.0, 2359969.0, 1424436.0, 129896.0, 25072.0, 6660.0, 1997.0, 754.0, 324.0, 185.0, 86.0, 41.0, 27.0, 19.0, 21.0, 8.0, 7.0, 7.0, 6.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.37890625, -5.198974609375, -5.01904296875, -4.839111328125, -4.6591796875, -4.479248046875, -4.29931640625, -4.119384765625, -3.939453125, -3.759521484375, -3.57958984375, -3.399658203125, -3.2197265625, -3.039794921875, -2.85986328125, -2.679931640625, -2.5, -2.320068359375, -2.14013671875, -1.960205078125, -1.7802734375, -1.600341796875, -1.42041015625, -1.240478515625, -1.060546875, -0.880615234375, -0.70068359375, -0.520751953125, -0.3408203125, -0.160888671875, 0.01904296875, 0.198974609375, 0.37890625, 0.558837890625, 0.73876953125, 0.918701171875, 1.0986328125, 1.278564453125, 1.45849609375, 1.638427734375, 1.818359375, 1.998291015625, 2.17822265625, 2.358154296875, 2.5380859375, 2.718017578125, 2.89794921875, 3.077880859375, 3.2578125, 3.437744140625, 3.61767578125, 3.797607421875, 3.9775390625, 4.157470703125, 4.33740234375, 4.517333984375, 4.697265625, 4.877197265625, 5.05712890625, 5.237060546875, 5.4169921875, 5.596923828125, 5.77685546875, 5.956787109375, 6.13671875]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 10.0, 7.0, 14.0, 27.0, 48.0, 58.0, 72.0, 96.0, 117.0, 98.0, 100.0, 99.0, 81.0, 73.0, 44.0, 20.0, 14.0, 13.0, 3.0, 7.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.06809425354004, -22.51380157470703, -21.959510803222656, -21.40521812438965, -20.850927352905273, -20.296634674072266, -19.74234390258789, -19.188051223754883, -18.633758544921875, -18.079465866088867, -17.525175094604492, -16.970882415771484, -16.41659164428711, -15.862298965454102, -15.30800724029541, -14.753715515136719, -14.199424743652344, -13.645133018493652, -13.090841293334961, -12.53654956817627, -11.982257843017578, -11.42796516418457, -10.873673439025879, -10.319381713867188, -9.765089988708496, -9.210798263549805, -8.656506538391113, -8.102214813232422, -7.547922611236572, -6.993630886077881, -6.439338684082031, -5.88504695892334, -5.330754280090332, -4.776462554931641, -4.222170829772949, -3.6678786277770996, -3.113586902618408, -2.559295177459717, -2.0050032138824463, -1.4507112503051758, -0.8964195251464844, -0.3421276807785034, 0.21216416358947754, 0.7664560079574585, 1.3207478523254395, 1.8750395774841309, 2.4293315410614014, 2.983623504638672, 3.5379152297973633, 4.092206954956055, 4.646498680114746, 5.200790882110596, 5.755082607269287, 6.3093743324279785, 6.863666534423828, 7.4179582595825195, 7.972249984741211, 8.526541709899902, 9.080833435058594, 9.635125160217285, 10.189416885375977, 10.743709564208984, 11.298001289367676, 11.852293014526367, 12.406584739685059]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 3.0, 4.0, 9.0, 11.0, 11.0, 11.0, 12.0, 11.0, 19.0, 26.0, 25.0, 38.0, 29.0, 28.0, 50.0, 28.0, 47.0, 27.0, 43.0, 51.0, 42.0, 49.0, 46.0, 33.0, 29.0, 42.0, 28.0, 30.0, 30.0, 24.0, 20.0, 25.0, 15.0, 18.0, 25.0, 11.0, 8.0, 12.0, 5.0, 6.0, 11.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.608718872070312, -9.325465202331543, -9.042211532592773, -8.758956909179688, -8.475703239440918, -8.192449569702148, -7.909195899963379, -7.625941753387451, -7.342687606811523, -7.059433937072754, -6.776179790496826, -6.492926120758057, -6.209671974182129, -5.926418304443359, -5.64316463470459, -5.359910488128662, -5.076656818389893, -4.793403148651123, -4.510149002075195, -4.226895332336426, -3.943641185760498, -3.6603875160217285, -3.37713360786438, -3.0938796997070312, -2.8106257915496826, -2.527371883392334, -2.2441179752349854, -1.9608641862869263, -1.6776102781295776, -1.394356369972229, -1.11110258102417, -0.8278486728668213, -0.5445947647094727, -0.2613408863544464, 0.021912992000579834, 0.3051668405532837, 0.5884207487106323, 0.871674656867981, 1.15492844581604, 1.4381823539733887, 1.7214362621307373, 2.004690170288086, 2.2879440784454346, 2.571197986602783, 2.8544516563415527, 3.1377058029174805, 3.42095947265625, 3.7042133808135986, 3.9874672889709473, 4.270720958709717, 4.5539751052856445, 4.837228775024414, 5.120482921600342, 5.403736591339111, 5.686990737915039, 5.970244407653809, 6.253498077392578, 6.536751747131348, 6.820005893707275, 7.103259563446045, 7.386513710021973, 7.669767379760742, 7.953021049499512, 8.236274719238281, 8.519529342651367]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 11.0, 9.0, 8.0, 6.0, 12.0, 12.0, 18.0, 20.0, 24.0, 22.0, 26.0, 29.0, 30.0, 37.0, 41.0, 49.0, 40.0, 33.0, 47.0, 51.0, 53.0, 40.0, 41.0, 47.0, 30.0, 31.0, 32.0, 31.0, 29.0, 22.0, 17.0, 17.0, 11.0, 18.0, 10.0, 14.0, 8.0, 13.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.20703125, -1.1685791015625, -1.130126953125, -1.0916748046875, -1.05322265625, -1.0147705078125, -0.976318359375, -0.9378662109375, -0.8994140625, -0.8609619140625, -0.822509765625, -0.7840576171875, -0.74560546875, -0.7071533203125, -0.668701171875, -0.6302490234375, -0.591796875, -0.5533447265625, -0.514892578125, -0.4764404296875, -0.43798828125, -0.3995361328125, -0.361083984375, -0.3226318359375, -0.2841796875, -0.2457275390625, -0.207275390625, -0.1688232421875, -0.13037109375, -0.0919189453125, -0.053466796875, -0.0150146484375, 0.0234375, 0.0618896484375, 0.100341796875, 0.1387939453125, 0.17724609375, 0.2156982421875, 0.254150390625, 0.2926025390625, 0.3310546875, 0.3695068359375, 0.407958984375, 0.4464111328125, 0.48486328125, 0.5233154296875, 0.561767578125, 0.6002197265625, 0.638671875, 0.6771240234375, 0.715576171875, 0.7540283203125, 0.79248046875, 0.8309326171875, 0.869384765625, 0.9078369140625, 0.9462890625, 0.9847412109375, 1.023193359375, 1.0616455078125, 1.10009765625, 1.1385498046875, 1.177001953125, 1.2154541015625, 1.25390625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 9.0, 15.0, 22.0, 29.0, 41.0, 68.0, 81.0, 136.0, 190.0, 259.0, 385.0, 535.0, 757.0, 1189.0, 1696.0, 2479.0, 3845.0, 5924.0, 9532.0, 16079.0, 29199.0, 56559.0, 155560.0, 503469.0, 137573.0, 53334.0, 27949.0, 15470.0, 9137.0, 5739.0, 3668.0, 2389.0, 1666.0, 1133.0, 738.0, 545.0, 384.0, 245.0, 184.0, 109.0, 77.0, 47.0, 46.0, 33.0, 14.0, 9.0, 5.0, 7.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.9619140625, -1.8995513916015625, -1.837188720703125, -1.7748260498046875, -1.71246337890625, -1.6501007080078125, -1.587738037109375, -1.5253753662109375, -1.4630126953125, -1.4006500244140625, -1.338287353515625, -1.2759246826171875, -1.21356201171875, -1.1511993408203125, -1.088836669921875, -1.0264739990234375, -0.964111328125, -0.9017486572265625, -0.839385986328125, -0.7770233154296875, -0.71466064453125, -0.6522979736328125, -0.589935302734375, -0.5275726318359375, -0.4652099609375, -0.4028472900390625, -0.340484619140625, -0.2781219482421875, -0.21575927734375, -0.1533966064453125, -0.091033935546875, -0.0286712646484375, 0.03369140625, 0.0960540771484375, 0.158416748046875, 0.2207794189453125, 0.28314208984375, 0.3455047607421875, 0.407867431640625, 0.4702301025390625, 0.5325927734375, 0.5949554443359375, 0.657318115234375, 0.7196807861328125, 0.78204345703125, 0.8444061279296875, 0.906768798828125, 0.9691314697265625, 1.031494140625, 1.0938568115234375, 1.156219482421875, 1.2185821533203125, 1.28094482421875, 1.3433074951171875, 1.405670166015625, 1.4680328369140625, 1.5303955078125, 1.5927581787109375, 1.655120849609375, 1.7174835205078125, 1.77984619140625, 1.8422088623046875, 1.904571533203125, 1.9669342041015625, 2.029296875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 6.0, 2.0, 7.0, 8.0, 6.0, 3.0, 7.0, 14.0, 13.0, 16.0, 15.0, 16.0, 21.0, 17.0, 24.0, 25.0, 30.0, 37.0, 25.0, 26.0, 39.0, 35.0, 36.0, 41.0, 1064.0, 33.0, 38.0, 37.0, 37.0, 34.0, 27.0, 34.0, 27.0, 29.0, 24.0, 22.0, 27.0, 18.0, 19.0, 15.0, 15.0, 9.0, 12.0, 10.0, 5.0, 3.0, 6.0, 5.0, 1.0, 4.0, 6.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.75, -0.7263259887695312, -0.7026519775390625, -0.6789779663085938, -0.655303955078125, -0.6316299438476562, -0.6079559326171875, -0.5842819213867188, -0.56060791015625, -0.5369338989257812, -0.5132598876953125, -0.48958587646484375, -0.465911865234375, -0.44223785400390625, -0.4185638427734375, -0.39488983154296875, -0.3712158203125, -0.34754180908203125, -0.3238677978515625, -0.30019378662109375, -0.276519775390625, -0.25284576416015625, -0.2291717529296875, -0.20549774169921875, -0.18182373046875, -0.15814971923828125, -0.1344757080078125, -0.11080169677734375, -0.087127685546875, -0.06345367431640625, -0.0397796630859375, -0.01610565185546875, 0.007568359375, 0.03124237060546875, 0.0549163818359375, 0.07859039306640625, 0.102264404296875, 0.12593841552734375, 0.1496124267578125, 0.17328643798828125, 0.19696044921875, 0.22063446044921875, 0.2443084716796875, 0.26798248291015625, 0.291656494140625, 0.31533050537109375, 0.3390045166015625, 0.36267852783203125, 0.3863525390625, 0.41002655029296875, 0.4337005615234375, 0.45737457275390625, 0.481048583984375, 0.5047225952148438, 0.5283966064453125, 0.5520706176757812, 0.57574462890625, 0.5994186401367188, 0.6230926513671875, 0.6467666625976562, 0.670440673828125, 0.6941146850585938, 0.7177886962890625, 0.7414627075195312, 0.76513671875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 4.0, 3.0, 4.0, 11.0, 20.0, 29.0, 50.0, 49.0, 91.0, 112.0, 173.0, 243.0, 318.0, 500.0, 697.0, 1076.0, 1534.0, 2325.0, 3699.0, 6012.0, 10364.0, 19275.0, 40913.0, 127498.0, 1375501.0, 370717.0, 71405.0, 28430.0, 13963.0, 8114.0, 4822.0, 3080.0, 2012.0, 1332.0, 848.0, 597.0, 429.0, 276.0, 175.0, 141.0, 78.0, 79.0, 42.0, 34.0, 20.0, 14.0, 10.0, 8.0, 9.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.580078125, -1.533294677734375, -1.48651123046875, -1.439727783203125, -1.3929443359375, -1.346160888671875, -1.29937744140625, -1.252593994140625, -1.205810546875, -1.159027099609375, -1.11224365234375, -1.065460205078125, -1.0186767578125, -0.971893310546875, -0.92510986328125, -0.878326416015625, -0.83154296875, -0.784759521484375, -0.73797607421875, -0.691192626953125, -0.6444091796875, -0.597625732421875, -0.55084228515625, -0.504058837890625, -0.457275390625, -0.410491943359375, -0.36370849609375, -0.316925048828125, -0.2701416015625, -0.223358154296875, -0.17657470703125, -0.129791259765625, -0.0830078125, -0.036224365234375, 0.01055908203125, 0.057342529296875, 0.1041259765625, 0.150909423828125, 0.19769287109375, 0.244476318359375, 0.291259765625, 0.338043212890625, 0.38482666015625, 0.431610107421875, 0.4783935546875, 0.525177001953125, 0.57196044921875, 0.618743896484375, 0.66552734375, 0.712310791015625, 0.75909423828125, 0.805877685546875, 0.8526611328125, 0.899444580078125, 0.94622802734375, 0.993011474609375, 1.039794921875, 1.086578369140625, 1.13336181640625, 1.180145263671875, 1.2269287109375, 1.273712158203125, 1.32049560546875, 1.367279052734375, 1.4140625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 1.0, 5.0, 4.0, 4.0, 11.0, 7.0, 12.0, 9.0, 21.0, 33.0, 29.0, 43.0, 87.0, 199.0, 183.0, 106.0, 57.0, 36.0, 29.0, 15.0, 16.0, 23.0, 11.0, 11.0, 10.0, 10.0, 4.0, 2.0, 4.0, 6.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3037109375, -0.29477691650390625, -0.2858428955078125, -0.27690887451171875, -0.267974853515625, -0.25904083251953125, -0.2501068115234375, -0.24117279052734375, -0.23223876953125, -0.22330474853515625, -0.2143707275390625, -0.20543670654296875, -0.196502685546875, -0.18756866455078125, -0.1786346435546875, -0.16970062255859375, -0.1607666015625, -0.15183258056640625, -0.1428985595703125, -0.13396453857421875, -0.125030517578125, -0.11609649658203125, -0.1071624755859375, -0.09822845458984375, -0.08929443359375, -0.08036041259765625, -0.0714263916015625, -0.06249237060546875, -0.053558349609375, -0.04462432861328125, -0.0356903076171875, -0.02675628662109375, -0.017822265625, -0.00888824462890625, 4.57763671875e-05, 0.00897979736328125, 0.017913818359375, 0.02684783935546875, 0.0357818603515625, 0.04471588134765625, 0.05364990234375, 0.06258392333984375, 0.0715179443359375, 0.08045196533203125, 0.089385986328125, 0.09832000732421875, 0.1072540283203125, 0.11618804931640625, 0.1251220703125, 0.13405609130859375, 0.1429901123046875, 0.15192413330078125, 0.160858154296875, 0.16979217529296875, 0.1787261962890625, 0.18766021728515625, 0.19659423828125, 0.20552825927734375, 0.2144622802734375, 0.22339630126953125, 0.232330322265625, 0.24126434326171875, 0.2501983642578125, 0.25913238525390625, 0.26806640625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 12.0, 5.0, 10.0, 13.0, 18.0, 22.0, 21.0, 30.0, 36.0, 51.0, 67.0, 132.0, 257.0, 638.0, 1731.0, 5764.0, 25659.0, 723415.0, 263715.0, 19426.0, 4799.0, 1521.0, 556.0, 236.0, 119.0, 84.0, 50.0, 40.0, 27.0, 28.0, 10.0, 15.0, 8.0, 9.0, 7.0, 5.0, 5.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.083984375, -2.993072509765625, -2.90216064453125, -2.811248779296875, -2.7203369140625, -2.629425048828125, -2.53851318359375, -2.447601318359375, -2.356689453125, -2.265777587890625, -2.17486572265625, -2.083953857421875, -1.9930419921875, -1.902130126953125, -1.81121826171875, -1.720306396484375, -1.62939453125, -1.538482666015625, -1.44757080078125, -1.356658935546875, -1.2657470703125, -1.174835205078125, -1.08392333984375, -0.993011474609375, -0.902099609375, -0.811187744140625, -0.72027587890625, -0.629364013671875, -0.5384521484375, -0.447540283203125, -0.35662841796875, -0.265716552734375, -0.1748046875, -0.083892822265625, 0.00701904296875, 0.097930908203125, 0.1888427734375, 0.279754638671875, 0.37066650390625, 0.461578369140625, 0.552490234375, 0.643402099609375, 0.73431396484375, 0.825225830078125, 0.9161376953125, 1.007049560546875, 1.09796142578125, 1.188873291015625, 1.27978515625, 1.370697021484375, 1.46160888671875, 1.552520751953125, 1.6434326171875, 1.734344482421875, 1.82525634765625, 1.916168212890625, 2.007080078125, 2.097991943359375, 2.18890380859375, 2.279815673828125, 2.3707275390625, 2.461639404296875, 2.55255126953125, 2.643463134765625, 2.734375]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 3.0, 2.0, 5.0, 18.0, 40.0, 75.0, 181.0, 290.0, 193.0, 99.0, 46.0, 29.0, 17.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2737181186676025, -2.223802089691162, -2.1738860607147217, -2.123969793319702, -2.0740537643432617, -2.0241377353668213, -1.9742215871810913, -1.9243055582046509, -1.874389410018921, -1.8244733810424805, -1.7745572328567505, -1.72464120388031, -1.67472505569458, -1.6248090267181396, -1.5748928785324097, -1.5249768495559692, -1.4750607013702393, -1.4251446723937988, -1.3752285242080688, -1.3253124952316284, -1.2753963470458984, -1.225480318069458, -1.175564169883728, -1.1256481409072876, -1.0757321119308472, -1.0258160829544067, -0.9758999347686768, -0.9259838461875916, -0.8760677576065063, -0.8261516690254211, -0.7762355804443359, -0.7263195514678955, -0.6764034032821655, -0.6264873147010803, -0.5765712261199951, -0.5266551375389099, -0.4767390489578247, -0.4268229603767395, -0.3769069015979767, -0.3269908130168915, -0.2770747244358063, -0.22715863585472107, -0.17724254727363586, -0.12732647359371185, -0.07741038501262665, -0.027494296431541443, 0.02242177724838257, 0.07233786582946777, 0.12225395441055298, 0.17217004299163818, 0.2220861315727234, 0.2720022201538086, 0.3219183087348938, 0.371834397315979, 0.4217504560947418, 0.471666544675827, 0.5215826034545898, 0.571498692035675, 0.6214147806167603, 0.6713308691978455, 0.7212469577789307, 0.7711630463600159, 0.8210791349411011, 0.8709951639175415, 0.9209113121032715]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 0.0, 2.0, 6.0, 4.0, 11.0, 13.0, 8.0, 25.0, 17.0, 21.0, 27.0, 27.0, 40.0, 44.0, 33.0, 47.0, 53.0, 44.0, 44.0, 38.0, 40.0, 51.0, 45.0, 42.0, 34.0, 39.0, 29.0, 29.0, 34.0, 21.0, 21.0, 20.0, 13.0, 19.0, 11.0, 15.0, 9.0, 9.0, 6.0, 3.0, 3.0, 0.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.44118499755859375, -0.4293108284473419, -0.4174366891384125, -0.40556252002716064, -0.3936883807182312, -0.38181421160697937, -0.3699400722980499, -0.3580659031867981, -0.34619176387786865, -0.3343175947666168, -0.3224434554576874, -0.31056928634643555, -0.2986951470375061, -0.2868209779262543, -0.27494683861732483, -0.263072669506073, -0.25119853019714355, -0.23932437598705292, -0.22745022177696228, -0.21557606756687164, -0.203701913356781, -0.19182775914669037, -0.17995360493659973, -0.1680794358253479, -0.15620526671409607, -0.14433111250400543, -0.1324569582939148, -0.12058280408382416, -0.10870864987373352, -0.09683449566364288, -0.08496033400297165, -0.07308617979288101, -0.06121203303337097, -0.049337878823280334, -0.0374637246131897, -0.02558956667780876, -0.013715412467718124, -0.0018412582576274872, 0.010032899677753448, 0.021907053887844086, 0.03378120809793472, 0.04565536230802536, 0.057529516518116, 0.06940367817878723, 0.08127783238887787, 0.0931519865989685, 0.10502614080905914, 0.11690029501914978, 0.12877444922924042, 0.14064860343933105, 0.1525227576494217, 0.16439691185951233, 0.17627106606960297, 0.1881452202796936, 0.20001938939094543, 0.21189352869987488, 0.2237676978111267, 0.23564185202121735, 0.24751600623130798, 0.2593901753425598, 0.27126431465148926, 0.2831384837627411, 0.29501262307167053, 0.30688679218292236, 0.3187609314918518]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 10.0, 11.0, 7.0, 7.0, 10.0, 18.0, 13.0, 19.0, 25.0, 27.0, 14.0, 31.0, 34.0, 39.0, 46.0, 39.0, 40.0, 33.0, 45.0, 52.0, 52.0, 43.0, 41.0, 47.0, 28.0, 31.0, 31.0, 30.0, 28.0, 28.0, 16.0, 18.0, 9.0, 18.0, 13.0, 11.0, 8.0, 16.0, 4.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2021484375, -1.163970947265625, -1.12579345703125, -1.087615966796875, -1.0494384765625, -1.011260986328125, -0.97308349609375, -0.934906005859375, -0.896728515625, -0.858551025390625, -0.82037353515625, -0.782196044921875, -0.7440185546875, -0.705841064453125, -0.66766357421875, -0.629486083984375, -0.59130859375, -0.553131103515625, -0.51495361328125, -0.476776123046875, -0.4385986328125, -0.400421142578125, -0.36224365234375, -0.324066162109375, -0.285888671875, -0.247711181640625, -0.20953369140625, -0.171356201171875, -0.1331787109375, -0.095001220703125, -0.05682373046875, -0.018646240234375, 0.01953125, 0.057708740234375, 0.09588623046875, 0.134063720703125, 0.1722412109375, 0.210418701171875, 0.24859619140625, 0.286773681640625, 0.324951171875, 0.363128662109375, 0.40130615234375, 0.439483642578125, 0.4776611328125, 0.515838623046875, 0.55401611328125, 0.592193603515625, 0.63037109375, 0.668548583984375, 0.70672607421875, 0.744903564453125, 0.7830810546875, 0.821258544921875, 0.85943603515625, 0.897613525390625, 0.935791015625, 0.973968505859375, 1.01214599609375, 1.050323486328125, 1.0885009765625, 1.126678466796875, 1.16485595703125, 1.203033447265625, 1.2412109375]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 9.0, 15.0, 33.0, 31.0, 59.0, 85.0, 168.0, 209.0, 322.0, 526.0, 859.0, 1437.0, 2658.0, 4720.0, 8787.0, 18382.0, 40432.0, 97210.0, 247763.0, 349021.0, 157931.0, 62981.0, 27086.0, 12774.0, 6590.0, 3526.0, 1922.0, 1160.0, 700.0, 412.0, 258.0, 181.0, 109.0, 73.0, 48.0, 35.0, 16.0, 14.0, 9.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.08203125, -2.0212554931640625, -1.960479736328125, -1.8997039794921875, -1.83892822265625, -1.7781524658203125, -1.717376708984375, -1.6566009521484375, -1.5958251953125, -1.5350494384765625, -1.474273681640625, -1.4134979248046875, -1.35272216796875, -1.2919464111328125, -1.231170654296875, -1.1703948974609375, -1.109619140625, -1.0488433837890625, -0.988067626953125, -0.9272918701171875, -0.86651611328125, -0.8057403564453125, -0.744964599609375, -0.6841888427734375, -0.6234130859375, -0.5626373291015625, -0.501861572265625, -0.4410858154296875, -0.38031005859375, -0.3195343017578125, -0.258758544921875, -0.1979827880859375, -0.13720703125, -0.0764312744140625, -0.015655517578125, 0.0451202392578125, 0.10589599609375, 0.1666717529296875, 0.227447509765625, 0.2882232666015625, 0.3489990234375, 0.4097747802734375, 0.470550537109375, 0.5313262939453125, 0.59210205078125, 0.6528778076171875, 0.713653564453125, 0.7744293212890625, 0.835205078125, 0.8959808349609375, 0.956756591796875, 1.0175323486328125, 1.07830810546875, 1.1390838623046875, 1.199859619140625, 1.2606353759765625, 1.3214111328125, 1.3821868896484375, 1.442962646484375, 1.5037384033203125, 1.56451416015625, 1.6252899169921875, 1.686065673828125, 1.7468414306640625, 1.8076171875]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 8.0, 5.0, 15.0, 11.0, 10.0, 19.0, 20.0, 22.0, 27.0, 51.0, 35.0, 43.0, 67.0, 69.0, 115.0, 161.0, 250.0, 1364.0, 190.0, 128.0, 80.0, 55.0, 63.0, 37.0, 42.0, 28.0, 22.0, 18.0, 24.0, 9.0, 10.0, 6.0, 7.0, 9.0, 2.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.05859375, -3.91448974609375, -3.7703857421875, -3.62628173828125, -3.482177734375, -3.33807373046875, -3.1939697265625, -3.04986572265625, -2.90576171875, -2.76165771484375, -2.6175537109375, -2.47344970703125, -2.329345703125, -2.18524169921875, -2.0411376953125, -1.89703369140625, -1.7529296875, -1.60882568359375, -1.4647216796875, -1.32061767578125, -1.176513671875, -1.03240966796875, -0.8883056640625, -0.74420166015625, -0.60009765625, -0.45599365234375, -0.3118896484375, -0.16778564453125, -0.023681640625, 0.12042236328125, 0.2645263671875, 0.40863037109375, 0.552734375, 0.69683837890625, 0.8409423828125, 0.98504638671875, 1.129150390625, 1.27325439453125, 1.4173583984375, 1.56146240234375, 1.70556640625, 1.84967041015625, 1.9937744140625, 2.13787841796875, 2.281982421875, 2.42608642578125, 2.5701904296875, 2.71429443359375, 2.8583984375, 3.00250244140625, 3.1466064453125, 3.29071044921875, 3.434814453125, 3.57891845703125, 3.7230224609375, 3.86712646484375, 4.01123046875, 4.15533447265625, 4.2994384765625, 4.44354248046875, 4.587646484375, 4.73175048828125, 4.8758544921875, 5.01995849609375, 5.1640625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 5.0, 6.0, 14.0, 8.0, 15.0, 13.0, 17.0, 31.0, 35.0, 38.0, 65.0, 87.0, 113.0, 187.0, 218.0, 474.0, 992.0, 2592.0, 12395.0, 159118.0, 2569760.0, 371667.0, 21617.0, 3489.0, 1189.0, 522.0, 315.0, 187.0, 121.0, 106.0, 74.0, 53.0, 41.0, 32.0, 23.0, 16.0, 12.0, 12.0, 16.0, 6.0, 8.0, 0.0, 5.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-7.75, -7.52618408203125, -7.3023681640625, -7.07855224609375, -6.854736328125, -6.63092041015625, -6.4071044921875, -6.18328857421875, -5.95947265625, -5.73565673828125, -5.5118408203125, -5.28802490234375, -5.064208984375, -4.84039306640625, -4.6165771484375, -4.39276123046875, -4.1689453125, -3.94512939453125, -3.7213134765625, -3.49749755859375, -3.273681640625, -3.04986572265625, -2.8260498046875, -2.60223388671875, -2.37841796875, -2.15460205078125, -1.9307861328125, -1.70697021484375, -1.483154296875, -1.25933837890625, -1.0355224609375, -0.81170654296875, -0.587890625, -0.36407470703125, -0.1402587890625, 0.08355712890625, 0.307373046875, 0.53118896484375, 0.7550048828125, 0.97882080078125, 1.20263671875, 1.42645263671875, 1.6502685546875, 1.87408447265625, 2.097900390625, 2.32171630859375, 2.5455322265625, 2.76934814453125, 2.9931640625, 3.21697998046875, 3.4407958984375, 3.66461181640625, 3.888427734375, 4.11224365234375, 4.3360595703125, 4.55987548828125, 4.78369140625, 5.00750732421875, 5.2313232421875, 5.45513916015625, 5.678955078125, 5.90277099609375, 6.1265869140625, 6.35040283203125, 6.57421875]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 8.0, 12.0, 36.0, 39.0, 73.0, 85.0, 107.0, 129.0, 139.0, 120.0, 101.0, 70.0, 38.0, 24.0, 14.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.294337272644043, -10.860840797424316, -10.42734432220459, -9.993847846984863, -9.560352325439453, -9.126855850219727, -8.693359375, -8.259862899780273, -7.826366424560547, -7.39286994934082, -6.959373474121094, -6.525877475738525, -6.092381000518799, -5.658884525299072, -5.225388526916504, -4.791892051696777, -4.358395576477051, -3.924899101257324, -3.4914028644561768, -3.0579066276550293, -2.6244101524353027, -2.190913677215576, -1.7574174404144287, -1.3239212036132812, -0.8904247283935547, -0.4569283723831177, -0.023432016372680664, 0.41006433963775635, 0.8435606956481934, 1.27705717086792, 1.7105534076690674, 2.144049644470215, 2.577545166015625, 3.0110416412353516, 3.444537878036499, 3.8780341148376465, 4.311530590057373, 4.7450270652771, 5.178523063659668, 5.6120195388793945, 6.045516014099121, 6.479012489318848, 6.912508964538574, 7.346004962921143, 7.779501438140869, 8.212997436523438, 8.646493911743164, 9.07999038696289, 9.513486862182617, 9.946983337402344, 10.38047981262207, 10.813976287841797, 11.247472763061523, 11.68096923828125, 12.11446475982666, 12.547961235046387, 12.981457710266113, 13.41495418548584, 13.848450660705566, 14.281947135925293, 14.715442657470703, 15.14893913269043, 15.582435607910156, 16.015932083129883, 16.44942855834961]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 7.0, 4.0, 7.0, 6.0, 7.0, 10.0, 13.0, 22.0, 19.0, 17.0, 25.0, 21.0, 18.0, 19.0, 33.0, 30.0, 29.0, 26.0, 35.0, 34.0, 34.0, 36.0, 41.0, 42.0, 37.0, 43.0, 34.0, 38.0, 50.0, 33.0, 28.0, 24.0, 23.0, 17.0, 20.0, 18.0, 14.0, 17.0, 8.0, 17.0, 9.0, 5.0, 8.0, 9.0, 3.0, 3.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-10.739813804626465, -10.425835609436035, -10.111857414245605, -9.797879219055176, -9.483901023864746, -9.169922828674316, -8.855944633483887, -8.54196548461914, -8.227987289428711, -7.914009094238281, -7.600030899047852, -7.286052703857422, -6.972074508666992, -6.6580963134765625, -6.344117641448975, -6.030139446258545, -5.716161727905273, -5.402183532714844, -5.088205337524414, -4.774227142333984, -4.460248947143555, -4.146270751953125, -3.832292079925537, -3.5183138847351074, -3.2043356895446777, -2.890357494354248, -2.5763792991638184, -2.2624008655548096, -1.9484226703643799, -1.6344444751739502, -1.320466160774231, -1.0064878463745117, -0.692509651184082, -0.37853139638900757, -0.0645531415939331, 0.24942511320114136, 0.5634033679962158, 0.8773815631866455, 1.1913598775863647, 1.505338191986084, 1.8193163871765137, 2.1332945823669434, 2.447272777557373, 2.761251211166382, 3.0752294063568115, 3.389207601547241, 3.70318603515625, 4.01716423034668, 4.331142425537109, 4.645120620727539, 4.959098815917969, 5.273077011108398, 5.587055206298828, 5.901033401489258, 6.215012073516846, 6.528990268707275, 6.842968463897705, 7.156946659088135, 7.4709248542785645, 7.784903049468994, 8.098881721496582, 8.412859916687012, 8.726838111877441, 9.040816307067871, 9.3547945022583]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 7.0, 6.0, 8.0, 7.0, 7.0, 13.0, 13.0, 15.0, 15.0, 19.0, 15.0, 22.0, 19.0, 30.0, 30.0, 23.0, 46.0, 34.0, 46.0, 41.0, 33.0, 43.0, 42.0, 43.0, 39.0, 42.0, 33.0, 29.0, 35.0, 30.0, 27.0, 32.0, 23.0, 24.0, 16.0, 13.0, 16.0, 13.0, 9.0, 7.0, 10.0, 10.0, 7.0, 8.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.1435546875, -1.105712890625, -1.06787109375, -1.030029296875, -0.9921875, -0.954345703125, -0.91650390625, -0.878662109375, -0.8408203125, -0.802978515625, -0.76513671875, -0.727294921875, -0.689453125, -0.651611328125, -0.61376953125, -0.575927734375, -0.5380859375, -0.500244140625, -0.46240234375, -0.424560546875, -0.38671875, -0.348876953125, -0.31103515625, -0.273193359375, -0.2353515625, -0.197509765625, -0.15966796875, -0.121826171875, -0.083984375, -0.046142578125, -0.00830078125, 0.029541015625, 0.0673828125, 0.105224609375, 0.14306640625, 0.180908203125, 0.21875, 0.256591796875, 0.29443359375, 0.332275390625, 0.3701171875, 0.407958984375, 0.44580078125, 0.483642578125, 0.521484375, 0.559326171875, 0.59716796875, 0.635009765625, 0.6728515625, 0.710693359375, 0.74853515625, 0.786376953125, 0.82421875, 0.862060546875, 0.89990234375, 0.937744140625, 0.9755859375, 1.013427734375, 1.05126953125, 1.089111328125, 1.126953125, 1.164794921875, 1.20263671875, 1.240478515625, 1.2783203125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 6.0, 6.0, 9.0, 10.0, 9.0, 16.0, 18.0, 30.0, 32.0, 34.0, 60.0, 113.0, 154.0, 257.0, 412.0, 661.0, 1267.0, 2383.0, 4615.0, 10117.0, 26823.0, 89048.0, 538864.0, 2621490.0, 738259.0, 108492.0, 30072.0, 10959.0, 4664.0, 2317.0, 1245.0, 703.0, 402.0, 247.0, 167.0, 89.0, 64.0, 52.0, 23.0, 27.0, 17.0, 9.0, 11.0, 11.0, 7.0, 11.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.048828125, -2.945709228515625, -2.84259033203125, -2.739471435546875, -2.6363525390625, -2.533233642578125, -2.43011474609375, -2.326995849609375, -2.223876953125, -2.120758056640625, -2.01763916015625, -1.914520263671875, -1.8114013671875, -1.708282470703125, -1.60516357421875, -1.502044677734375, -1.39892578125, -1.295806884765625, -1.19268798828125, -1.089569091796875, -0.9864501953125, -0.883331298828125, -0.78021240234375, -0.677093505859375, -0.573974609375, -0.470855712890625, -0.36773681640625, -0.264617919921875, -0.1614990234375, -0.058380126953125, 0.04473876953125, 0.147857666015625, 0.2509765625, 0.354095458984375, 0.45721435546875, 0.560333251953125, 0.6634521484375, 0.766571044921875, 0.86968994140625, 0.972808837890625, 1.075927734375, 1.179046630859375, 1.28216552734375, 1.385284423828125, 1.4884033203125, 1.591522216796875, 1.69464111328125, 1.797760009765625, 1.90087890625, 2.003997802734375, 2.10711669921875, 2.210235595703125, 2.3133544921875, 2.416473388671875, 2.51959228515625, 2.622711181640625, 2.725830078125, 2.828948974609375, 2.93206787109375, 3.035186767578125, 3.1383056640625, 3.241424560546875, 3.34454345703125, 3.447662353515625, 3.55078125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 8.0, 3.0, 4.0, 9.0, 18.0, 20.0, 19.0, 26.0, 30.0, 64.0, 67.0, 102.0, 87.0, 154.0, 180.0, 256.0, 292.0, 379.0, 438.0, 403.0, 346.0, 276.0, 206.0, 169.0, 122.0, 77.0, 68.0, 59.0, 51.0, 28.0, 29.0, 13.0, 16.0, 13.0, 12.0, 5.0, 7.0, 4.0, 3.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.380859375, -2.3101806640625, -2.239501953125, -2.1688232421875, -2.09814453125, -2.0274658203125, -1.956787109375, -1.8861083984375, -1.8154296875, -1.7447509765625, -1.674072265625, -1.6033935546875, -1.53271484375, -1.4620361328125, -1.391357421875, -1.3206787109375, -1.25, -1.1793212890625, -1.108642578125, -1.0379638671875, -0.96728515625, -0.8966064453125, -0.825927734375, -0.7552490234375, -0.6845703125, -0.6138916015625, -0.543212890625, -0.4725341796875, -0.40185546875, -0.3311767578125, -0.260498046875, -0.1898193359375, -0.119140625, -0.0484619140625, 0.022216796875, 0.0928955078125, 0.16357421875, 0.2342529296875, 0.304931640625, 0.3756103515625, 0.4462890625, 0.5169677734375, 0.587646484375, 0.6583251953125, 0.72900390625, 0.7996826171875, 0.870361328125, 0.9410400390625, 1.01171875, 1.0823974609375, 1.153076171875, 1.2237548828125, 1.29443359375, 1.3651123046875, 1.435791015625, 1.5064697265625, 1.5771484375, 1.6478271484375, 1.718505859375, 1.7891845703125, 1.85986328125, 1.9305419921875, 2.001220703125, 2.0718994140625, 2.142578125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 5.0, 5.0, 13.0, 9.0, 9.0, 20.0, 28.0, 42.0, 77.0, 102.0, 187.0, 356.0, 854.0, 2304.0, 7202.0, 29456.0, 158036.0, 1655304.0, 2099886.0, 193180.0, 34426.0, 8309.0, 2531.0, 982.0, 423.0, 179.0, 111.0, 58.0, 58.0, 38.0, 20.0, 18.0, 13.0, 10.0, 6.0, 8.0, 5.0, 4.0, 1.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0], "bins": [-6.2734375, -6.1041259765625, -5.934814453125, -5.7655029296875, -5.59619140625, -5.4268798828125, -5.257568359375, -5.0882568359375, -4.9189453125, -4.7496337890625, -4.580322265625, -4.4110107421875, -4.24169921875, -4.0723876953125, -3.903076171875, -3.7337646484375, -3.564453125, -3.3951416015625, -3.225830078125, -3.0565185546875, -2.88720703125, -2.7178955078125, -2.548583984375, -2.3792724609375, -2.2099609375, -2.0406494140625, -1.871337890625, -1.7020263671875, -1.53271484375, -1.3634033203125, -1.194091796875, -1.0247802734375, -0.85546875, -0.6861572265625, -0.516845703125, -0.3475341796875, -0.17822265625, -0.0089111328125, 0.160400390625, 0.3297119140625, 0.4990234375, 0.6683349609375, 0.837646484375, 1.0069580078125, 1.17626953125, 1.3455810546875, 1.514892578125, 1.6842041015625, 1.853515625, 2.0228271484375, 2.192138671875, 2.3614501953125, 2.53076171875, 2.7000732421875, 2.869384765625, 3.0386962890625, 3.2080078125, 3.3773193359375, 3.546630859375, 3.7159423828125, 3.88525390625, 4.0545654296875, 4.223876953125, 4.3931884765625, 4.5625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 9.0, 8.0, 29.0, 36.0, 44.0, 84.0, 112.0, 147.0, 119.0, 112.0, 103.0, 83.0, 48.0, 25.0, 23.0, 15.0, 6.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.906599998474121, -14.295973777770996, -13.685346603393555, -13.07472038269043, -12.464094161987305, -11.85346794128418, -11.242840766906738, -10.632214546203613, -10.021587371826172, -9.410961151123047, -8.800333976745605, -8.18970775604248, -7.5790815353393555, -6.968454837799072, -6.357828140258789, -5.747201919555664, -5.136575698852539, -4.525949001312256, -3.915322780609131, -3.3046960830688477, -2.6940696239471436, -2.0834431648254395, -1.4728164672851562, -0.8621902465820312, -0.25156354904174805, 0.35906296968460083, 0.9696894884109497, 1.5803160667419434, 2.1909425258636475, 2.8015689849853516, 3.4121956825256348, 4.02282190322876, 4.633447647094727, 5.24407434463501, 5.854700565338135, 6.465327262878418, 7.075953483581543, 7.686580181121826, 8.29720687866211, 8.907833099365234, 9.51845932006836, 10.129085540771484, 10.739712715148926, 11.35033893585205, 11.960965156555176, 12.571592330932617, 13.182218551635742, 13.792844772338867, 14.403471946716309, 15.014098167419434, 15.624725341796875, 16.2353515625, 16.845977783203125, 17.45660400390625, 18.067230224609375, 18.6778564453125, 19.288484573364258, 19.899110794067383, 20.509737014770508, 21.120365142822266, 21.73099136352539, 22.341617584228516, 22.95224380493164, 23.562870025634766, 24.17349624633789]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 10.0, 8.0, 6.0, 11.0, 13.0, 7.0, 11.0, 14.0, 17.0, 13.0, 24.0, 20.0, 28.0, 33.0, 27.0, 26.0, 41.0, 44.0, 33.0, 46.0, 35.0, 39.0, 48.0, 33.0, 32.0, 32.0, 25.0, 30.0, 35.0, 28.0, 21.0, 31.0, 25.0, 22.0, 23.0, 16.0, 22.0, 16.0, 13.0, 11.0, 6.0, 12.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.169623851776123, -6.929409980773926, -6.689196586608887, -6.4489827156066895, -6.208768844604492, -5.968555450439453, -5.728341579437256, -5.488127708435059, -5.2479143142700195, -5.007700443267822, -4.767487049102783, -4.527273178100586, -4.287059783935547, -4.04684591293335, -3.8066320419311523, -3.566418409347534, -3.326204776763916, -3.085991144180298, -2.8457775115966797, -2.6055636405944824, -2.3653500080108643, -2.125136375427246, -1.8849226236343384, -1.6447088718414307, -1.4044952392578125, -1.1642816066741943, -0.9240678548812866, -0.6838541626930237, -0.44364047050476074, -0.20342683792114258, 0.03678691387176514, 0.27700066566467285, 0.5172147750854492, 0.7574284672737122, 0.9976421594619751, 1.2378559112548828, 1.478069543838501, 1.7182831764221191, 1.9584969282150269, 2.1987106800079346, 2.4389243125915527, 2.679137945175171, 2.919351577758789, 3.1595654487609863, 3.3997790813446045, 3.6399927139282227, 3.88020658493042, 4.120420455932617, 4.360633850097656, 4.6008477210998535, 4.841061115264893, 5.08127498626709, 5.321488380432129, 5.561702251434326, 5.801916122436523, 6.0421295166015625, 6.28234338760376, 6.522557258605957, 6.762770652770996, 7.002984523773193, 7.243198394775391, 7.48341178894043, 7.723625659942627, 7.963839530944824, 8.204052925109863]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 1.0, 6.0, 8.0, 9.0, 7.0, 7.0, 17.0, 11.0, 22.0, 21.0, 29.0, 27.0, 25.0, 26.0, 40.0, 44.0, 45.0, 38.0, 45.0, 29.0, 48.0, 45.0, 38.0, 51.0, 40.0, 40.0, 33.0, 39.0, 46.0, 23.0, 30.0, 18.0, 25.0, 14.0, 6.0, 11.0, 9.0, 10.0, 12.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.337890625, -1.2957611083984375, -1.253631591796875, -1.2115020751953125, -1.16937255859375, -1.1272430419921875, -1.085113525390625, -1.0429840087890625, -1.0008544921875, -0.9587249755859375, -0.916595458984375, -0.8744659423828125, -0.83233642578125, -0.7902069091796875, -0.748077392578125, -0.7059478759765625, -0.663818359375, -0.6216888427734375, -0.579559326171875, -0.5374298095703125, -0.49530029296875, -0.4531707763671875, -0.411041259765625, -0.3689117431640625, -0.3267822265625, -0.2846527099609375, -0.242523193359375, -0.2003936767578125, -0.15826416015625, -0.1161346435546875, -0.074005126953125, -0.0318756103515625, 0.01025390625, 0.0523834228515625, 0.094512939453125, 0.1366424560546875, 0.17877197265625, 0.2209014892578125, 0.263031005859375, 0.3051605224609375, 0.3472900390625, 0.3894195556640625, 0.431549072265625, 0.4736785888671875, 0.51580810546875, 0.5579376220703125, 0.600067138671875, 0.6421966552734375, 0.684326171875, 0.7264556884765625, 0.768585205078125, 0.8107147216796875, 0.85284423828125, 0.8949737548828125, 0.937103271484375, 0.9792327880859375, 1.0213623046875, 1.0634918212890625, 1.105621337890625, 1.1477508544921875, 1.18988037109375, 1.2320098876953125, 1.274139404296875, 1.3162689208984375, 1.3583984375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 10.0, 16.0, 13.0, 15.0, 31.0, 53.0, 62.0, 71.0, 132.0, 207.0, 287.0, 355.0, 553.0, 868.0, 1179.0, 1769.0, 2676.0, 3823.0, 6116.0, 10031.0, 19096.0, 45304.0, 135211.0, 371650.0, 284708.0, 91988.0, 32768.0, 15205.0, 8465.0, 5195.0, 3476.0, 2277.0, 1494.0, 1081.0, 735.0, 549.0, 342.0, 220.0, 171.0, 101.0, 75.0, 51.0, 41.0, 25.0, 18.0, 12.0, 11.0, 6.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0], "bins": [-0.72265625, -0.7006454467773438, -0.6786346435546875, -0.6566238403320312, -0.634613037109375, -0.6126022338867188, -0.5905914306640625, -0.5685806274414062, -0.54656982421875, -0.5245590209960938, -0.5025482177734375, -0.48053741455078125, -0.458526611328125, -0.43651580810546875, -0.4145050048828125, -0.39249420166015625, -0.3704833984375, -0.34847259521484375, -0.3264617919921875, -0.30445098876953125, -0.282440185546875, -0.26042938232421875, -0.2384185791015625, -0.21640777587890625, -0.19439697265625, -0.17238616943359375, -0.1503753662109375, -0.12836456298828125, -0.106353759765625, -0.08434295654296875, -0.0623321533203125, -0.04032135009765625, -0.018310546875, 0.00370025634765625, 0.0257110595703125, 0.04772186279296875, 0.069732666015625, 0.09174346923828125, 0.1137542724609375, 0.13576507568359375, 0.15777587890625, 0.17978668212890625, 0.2017974853515625, 0.22380828857421875, 0.245819091796875, 0.26782989501953125, 0.2898406982421875, 0.31185150146484375, 0.3338623046875, 0.35587310791015625, 0.3778839111328125, 0.39989471435546875, 0.421905517578125, 0.44391632080078125, 0.4659271240234375, 0.48793792724609375, 0.50994873046875, 0.5319595336914062, 0.5539703369140625, 0.5759811401367188, 0.597991943359375, 0.6200027465820312, 0.6420135498046875, 0.6640243530273438, 0.68603515625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 13.0, 11.0, 6.0, 6.0, 15.0, 8.0, 15.0, 13.0, 11.0, 20.0, 22.0, 34.0, 27.0, 37.0, 36.0, 31.0, 35.0, 35.0, 44.0, 55.0, 1075.0, 51.0, 33.0, 37.0, 39.0, 45.0, 29.0, 42.0, 30.0, 27.0, 30.0, 19.0, 17.0, 15.0, 9.0, 15.0, 9.0, 2.0, 4.0, 6.0, 11.0, 3.0, 5.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.93798828125, -0.90850830078125, -0.8790283203125, -0.84954833984375, -0.820068359375, -0.79058837890625, -0.7611083984375, -0.73162841796875, -0.7021484375, -0.67266845703125, -0.6431884765625, -0.61370849609375, -0.584228515625, -0.55474853515625, -0.5252685546875, -0.49578857421875, -0.46630859375, -0.43682861328125, -0.4073486328125, -0.37786865234375, -0.348388671875, -0.31890869140625, -0.2894287109375, -0.25994873046875, -0.23046875, -0.20098876953125, -0.1715087890625, -0.14202880859375, -0.112548828125, -0.08306884765625, -0.0535888671875, -0.02410888671875, 0.00537109375, 0.03485107421875, 0.0643310546875, 0.09381103515625, 0.123291015625, 0.15277099609375, 0.1822509765625, 0.21173095703125, 0.2412109375, 0.27069091796875, 0.3001708984375, 0.32965087890625, 0.359130859375, 0.38861083984375, 0.4180908203125, 0.44757080078125, 0.47705078125, 0.50653076171875, 0.5360107421875, 0.56549072265625, 0.594970703125, 0.62445068359375, 0.6539306640625, 0.68341064453125, 0.712890625, 0.74237060546875, 0.7718505859375, 0.80133056640625, 0.830810546875, 0.86029052734375, 0.8897705078125, 0.91925048828125, 0.94873046875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 7.0, 12.0, 6.0, 17.0, 10.0, 32.0, 41.0, 57.0, 102.0, 173.0, 258.0, 371.0, 679.0, 1217.0, 2294.0, 4900.0, 11909.0, 38835.0, 270669.0, 1588582.0, 134355.0, 25619.0, 8721.0, 3872.0, 1839.0, 953.0, 603.0, 358.0, 224.0, 127.0, 92.0, 62.0, 44.0, 34.0, 15.0, 12.0, 15.0, 7.0, 2.0, 6.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.90625, -0.8798675537109375, -0.853485107421875, -0.8271026611328125, -0.80072021484375, -0.7743377685546875, -0.747955322265625, -0.7215728759765625, -0.6951904296875, -0.6688079833984375, -0.642425537109375, -0.6160430908203125, -0.58966064453125, -0.5632781982421875, -0.536895751953125, -0.5105133056640625, -0.484130859375, -0.4577484130859375, -0.431365966796875, -0.4049835205078125, -0.37860107421875, -0.3522186279296875, -0.325836181640625, -0.2994537353515625, -0.2730712890625, -0.2466888427734375, -0.220306396484375, -0.1939239501953125, -0.16754150390625, -0.1411590576171875, -0.114776611328125, -0.0883941650390625, -0.06201171875, -0.0356292724609375, -0.009246826171875, 0.0171356201171875, 0.04351806640625, 0.0699005126953125, 0.096282958984375, 0.1226654052734375, 0.1490478515625, 0.1754302978515625, 0.201812744140625, 0.2281951904296875, 0.25457763671875, 0.2809600830078125, 0.307342529296875, 0.3337249755859375, 0.360107421875, 0.3864898681640625, 0.412872314453125, 0.4392547607421875, 0.46563720703125, 0.4920196533203125, 0.518402099609375, 0.5447845458984375, 0.5711669921875, 0.5975494384765625, 0.623931884765625, 0.6503143310546875, 0.67669677734375, 0.7030792236328125, 0.729461669921875, 0.7558441162109375, 0.7822265625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 4.0, 8.0, 4.0, 8.0, 7.0, 4.0, 17.0, 32.0, 52.0, 122.0, 305.0, 226.0, 71.0, 48.0, 26.0, 10.0, 11.0, 9.0, 9.0, 3.0, 5.0, 3.0, 3.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1441650390625, -0.13723182678222656, -0.13029861450195312, -0.12336540222167969, -0.11643218994140625, -0.10949897766113281, -0.10256576538085938, -0.09563255310058594, -0.0886993408203125, -0.08176612854003906, -0.07483291625976562, -0.06789970397949219, -0.06096649169921875, -0.05403327941894531, -0.047100067138671875, -0.04016685485839844, -0.033233642578125, -0.026300430297851562, -0.019367218017578125, -0.012434005737304688, -0.00550079345703125, 0.0014324188232421875, 0.008365631103515625, 0.015298843383789062, 0.0222320556640625, 0.029165267944335938, 0.036098480224609375, 0.04303169250488281, 0.04996490478515625, 0.05689811706542969, 0.06383132934570312, 0.07076454162597656, 0.07769775390625, 0.08463096618652344, 0.09156417846679688, 0.09849739074707031, 0.10543060302734375, 0.11236381530761719, 0.11929702758789062, 0.12623023986816406, 0.1331634521484375, 0.14009666442871094, 0.14702987670898438, 0.1539630889892578, 0.16089630126953125, 0.1678295135498047, 0.17476272583007812, 0.18169593811035156, 0.188629150390625, 0.19556236267089844, 0.20249557495117188, 0.2094287872314453, 0.21636199951171875, 0.2232952117919922, 0.23022842407226562, 0.23716163635253906, 0.2440948486328125, 0.25102806091308594, 0.2579612731933594, 0.2648944854736328, 0.27182769775390625, 0.2787609100341797, 0.2856941223144531, 0.29262733459472656, 0.299560546875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 2.0, 4.0, 12.0, 13.0, 21.0, 51.0, 91.0, 205.0, 972.0, 24551.0, 1014572.0, 7174.0, 576.0, 146.0, 74.0, 29.0, 18.0, 14.0, 11.0, 7.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.37109375, -5.247161865234375, -5.12322998046875, -4.999298095703125, -4.8753662109375, -4.751434326171875, -4.62750244140625, -4.503570556640625, -4.379638671875, -4.255706787109375, -4.13177490234375, -4.007843017578125, -3.8839111328125, -3.759979248046875, -3.63604736328125, -3.512115478515625, -3.38818359375, -3.264251708984375, -3.14031982421875, -3.016387939453125, -2.8924560546875, -2.768524169921875, -2.64459228515625, -2.520660400390625, -2.396728515625, -2.272796630859375, -2.14886474609375, -2.024932861328125, -1.9010009765625, -1.777069091796875, -1.65313720703125, -1.529205322265625, -1.4052734375, -1.281341552734375, -1.15740966796875, -1.033477783203125, -0.9095458984375, -0.785614013671875, -0.66168212890625, -0.537750244140625, -0.413818359375, -0.289886474609375, -0.16595458984375, -0.042022705078125, 0.0819091796875, 0.205841064453125, 0.32977294921875, 0.453704833984375, 0.57763671875, 0.701568603515625, 0.82550048828125, 0.949432373046875, 1.0733642578125, 1.197296142578125, 1.32122802734375, 1.445159912109375, 1.569091796875, 1.693023681640625, 1.81695556640625, 1.940887451171875, 2.0648193359375, 2.188751220703125, 2.31268310546875, 2.436614990234375, 2.560546875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 9.0, 6.0, 12.0, 10.0, 36.0, 44.0, 57.0, 95.0, 89.0, 132.0, 110.0, 117.0, 91.0, 76.0, 42.0, 30.0, 19.0, 9.0, 7.0, 7.0, 5.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12797167897224426, -0.12009560316801071, -0.11221952736377716, -0.1043434590101242, -0.09646737575531006, -0.0885913074016571, -0.08071523159742355, -0.07283915579319, -0.06496307998895645, -0.0570870041847229, -0.04921092838048935, -0.0413348563015461, -0.033458780497312546, -0.025582704693078995, -0.017706632614135742, -0.009830556809902191, -0.00195448100566864, 0.005921593867242336, 0.013797668740153313, 0.021673742681741714, 0.029549818485975266, 0.037425894290208817, 0.04530196636915207, 0.05317804217338562, 0.06105411797761917, 0.06893019378185272, 0.07680626958608627, 0.08468234539031982, 0.09255841374397278, 0.10043449699878693, 0.10831056535243988, 0.11618664115667343, 0.12406271696090698, 0.13193878531455994, 0.13981486856937408, 0.14769093692302704, 0.1555670201778412, 0.16344308853149414, 0.1713191568851471, 0.17919524013996124, 0.1870713233947754, 0.19494739174842834, 0.2028234750032425, 0.21069954335689545, 0.2185756266117096, 0.22645169496536255, 0.2343277633190155, 0.24220384657382965, 0.2500799298286438, 0.25795599818229675, 0.2658320665359497, 0.27370816469192505, 0.281584233045578, 0.28946030139923096, 0.2973363697528839, 0.30521243810653687, 0.3130885064601898, 0.3209645748138428, 0.3288406431674957, 0.33671674132347107, 0.344592809677124, 0.352468878030777, 0.36034494638442993, 0.3682210445404053, 0.3760971128940582]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 6.0, 9.0, 6.0, 10.0, 11.0, 9.0, 9.0, 18.0, 31.0, 22.0, 20.0, 28.0, 35.0, 36.0, 30.0, 37.0, 41.0, 32.0, 39.0, 51.0, 39.0, 46.0, 36.0, 38.0, 36.0, 25.0, 48.0, 29.0, 32.0, 23.0, 20.0, 24.0, 24.0, 15.0, 19.0, 19.0, 12.0, 12.0, 6.0, 10.0, 5.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.14386862516403198, -0.13949425518512726, -0.13511990010738373, -0.130745530128479, -0.12637116014957428, -0.12199679762125015, -0.11762243509292603, -0.1132480651140213, -0.10887370258569717, -0.10449934005737305, -0.10012497007846832, -0.0957506075501442, -0.09137624502182007, -0.08700187504291534, -0.08262751251459122, -0.07825314998626709, -0.07387878000736237, -0.06950441747903824, -0.06513004750013351, -0.06075568497180939, -0.05638131871819496, -0.052006952464580536, -0.04763258993625641, -0.04325822368264198, -0.03888385742902756, -0.03450949117541313, -0.030135126784443855, -0.02576076239347458, -0.021386396139860153, -0.017012029886245728, -0.012637665495276451, -0.008263301104307175, -0.003888934850692749, 0.000485430471599102, 0.004859795793890953, 0.009234161116182804, 0.013608526438474655, 0.01798289269208908, 0.022357257083058357, 0.026731621474027634, 0.03110598772764206, 0.035480353981256485, 0.03985472023487091, 0.04422908276319504, 0.048603449016809464, 0.05297781527042389, 0.057352177798748016, 0.06172654405236244, 0.06610091030597687, 0.070475272834301, 0.07484964281320572, 0.07922400534152985, 0.08359837532043457, 0.0879727378487587, 0.09234710037708282, 0.09672147035598755, 0.10109583288431168, 0.1054701954126358, 0.10984456539154053, 0.11421892791986465, 0.11859329044818878, 0.1229676604270935, 0.12734203040599823, 0.13171638548374176, 0.13609075546264648]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 8.0, 7.0, 9.0, 8.0, 13.0, 11.0, 22.0, 23.0, 32.0, 24.0, 28.0, 23.0, 40.0, 42.0, 46.0, 40.0, 45.0, 30.0, 44.0, 50.0, 38.0, 48.0, 39.0, 41.0, 32.0, 41.0, 43.0, 28.0, 25.0, 20.0, 26.0, 15.0, 5.0, 12.0, 9.0, 10.0, 11.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3408203125, -1.2986297607421875, -1.256439208984375, -1.2142486572265625, -1.17205810546875, -1.1298675537109375, -1.087677001953125, -1.0454864501953125, -1.0032958984375, -0.9611053466796875, -0.918914794921875, -0.8767242431640625, -0.83453369140625, -0.7923431396484375, -0.750152587890625, -0.7079620361328125, -0.665771484375, -0.6235809326171875, -0.581390380859375, -0.5391998291015625, -0.49700927734375, -0.4548187255859375, -0.412628173828125, -0.3704376220703125, -0.3282470703125, -0.2860565185546875, -0.243865966796875, -0.2016754150390625, -0.15948486328125, -0.1172943115234375, -0.075103759765625, -0.0329132080078125, 0.00927734375, 0.0514678955078125, 0.093658447265625, 0.1358489990234375, 0.17803955078125, 0.2202301025390625, 0.262420654296875, 0.3046112060546875, 0.3468017578125, 0.3889923095703125, 0.431182861328125, 0.4733734130859375, 0.51556396484375, 0.5577545166015625, 0.599945068359375, 0.6421356201171875, 0.684326171875, 0.7265167236328125, 0.768707275390625, 0.8108978271484375, 0.85308837890625, 0.8952789306640625, 0.937469482421875, 0.9796600341796875, 1.0218505859375, 1.0640411376953125, 1.106231689453125, 1.1484222412109375, 1.19061279296875, 1.2328033447265625, 1.274993896484375, 1.3171844482421875, 1.359375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 11.0, 5.0, 16.0, 21.0, 29.0, 50.0, 73.0, 130.0, 200.0, 350.0, 626.0, 989.0, 1744.0, 2950.0, 5520.0, 10059.0, 19067.0, 36977.0, 73384.0, 151234.0, 280916.0, 231817.0, 114119.0, 56296.0, 28572.0, 15048.0, 7885.0, 4473.0, 2477.0, 1400.0, 853.0, 489.0, 292.0, 190.0, 112.0, 64.0, 53.0, 36.0, 13.0, 10.0, 6.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.5, -1.4569091796875, -1.413818359375, -1.3707275390625, -1.32763671875, -1.2845458984375, -1.241455078125, -1.1983642578125, -1.1552734375, -1.1121826171875, -1.069091796875, -1.0260009765625, -0.98291015625, -0.9398193359375, -0.896728515625, -0.8536376953125, -0.810546875, -0.7674560546875, -0.724365234375, -0.6812744140625, -0.63818359375, -0.5950927734375, -0.552001953125, -0.5089111328125, -0.4658203125, -0.4227294921875, -0.379638671875, -0.3365478515625, -0.29345703125, -0.2503662109375, -0.207275390625, -0.1641845703125, -0.12109375, -0.0780029296875, -0.034912109375, 0.0081787109375, 0.05126953125, 0.0943603515625, 0.137451171875, 0.1805419921875, 0.2236328125, 0.2667236328125, 0.309814453125, 0.3529052734375, 0.39599609375, 0.4390869140625, 0.482177734375, 0.5252685546875, 0.568359375, 0.6114501953125, 0.654541015625, 0.6976318359375, 0.74072265625, 0.7838134765625, 0.826904296875, 0.8699951171875, 0.9130859375, 0.9561767578125, 0.999267578125, 1.0423583984375, 1.08544921875, 1.1285400390625, 1.171630859375, 1.2147216796875, 1.2578125]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 6.0, 5.0, 6.0, 5.0, 11.0, 20.0, 18.0, 16.0, 28.0, 27.0, 30.0, 30.0, 53.0, 47.0, 66.0, 109.0, 239.0, 1462.0, 299.0, 111.0, 87.0, 68.0, 45.0, 42.0, 36.0, 38.0, 19.0, 26.0, 15.0, 17.0, 15.0, 14.0, 8.0, 9.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.171875, -4.0362548828125, -3.900634765625, -3.7650146484375, -3.62939453125, -3.4937744140625, -3.358154296875, -3.2225341796875, -3.0869140625, -2.9512939453125, -2.815673828125, -2.6800537109375, -2.54443359375, -2.4088134765625, -2.273193359375, -2.1375732421875, -2.001953125, -1.8663330078125, -1.730712890625, -1.5950927734375, -1.45947265625, -1.3238525390625, -1.188232421875, -1.0526123046875, -0.9169921875, -0.7813720703125, -0.645751953125, -0.5101318359375, -0.37451171875, -0.2388916015625, -0.103271484375, 0.0323486328125, 0.16796875, 0.3035888671875, 0.439208984375, 0.5748291015625, 0.71044921875, 0.8460693359375, 0.981689453125, 1.1173095703125, 1.2529296875, 1.3885498046875, 1.524169921875, 1.6597900390625, 1.79541015625, 1.9310302734375, 2.066650390625, 2.2022705078125, 2.337890625, 2.4735107421875, 2.609130859375, 2.7447509765625, 2.88037109375, 3.0159912109375, 3.151611328125, 3.2872314453125, 3.4228515625, 3.5584716796875, 3.694091796875, 3.8297119140625, 3.96533203125, 4.1009521484375, 4.236572265625, 4.3721923828125, 4.5078125]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0, 7.0, 5.0, 9.0, 8.0, 10.0, 20.0, 21.0, 16.0, 31.0, 44.0, 58.0, 88.0, 98.0, 103.0, 173.0, 281.0, 523.0, 1895.0, 15461.0, 360826.0, 2674594.0, 83077.0, 6165.0, 1026.0, 343.0, 190.0, 158.0, 108.0, 80.0, 69.0, 43.0, 42.0, 27.0, 17.0, 20.0, 17.0, 6.0, 12.0, 10.0, 6.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0], "bins": [-7.75, -7.53045654296875, -7.3109130859375, -7.09136962890625, -6.871826171875, -6.65228271484375, -6.4327392578125, -6.21319580078125, -5.99365234375, -5.77410888671875, -5.5545654296875, -5.33502197265625, -5.115478515625, -4.89593505859375, -4.6763916015625, -4.45684814453125, -4.2373046875, -4.01776123046875, -3.7982177734375, -3.57867431640625, -3.359130859375, -3.13958740234375, -2.9200439453125, -2.70050048828125, -2.48095703125, -2.26141357421875, -2.0418701171875, -1.82232666015625, -1.602783203125, -1.38323974609375, -1.1636962890625, -0.94415283203125, -0.724609375, -0.50506591796875, -0.2855224609375, -0.06597900390625, 0.153564453125, 0.37310791015625, 0.5926513671875, 0.81219482421875, 1.03173828125, 1.25128173828125, 1.4708251953125, 1.69036865234375, 1.909912109375, 2.12945556640625, 2.3489990234375, 2.56854248046875, 2.7880859375, 3.00762939453125, 3.2271728515625, 3.44671630859375, 3.666259765625, 3.88580322265625, 4.1053466796875, 4.32489013671875, 4.54443359375, 4.76397705078125, 4.9835205078125, 5.20306396484375, 5.422607421875, 5.64215087890625, 5.8616943359375, 6.08123779296875, 6.30078125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [6.0, 114.0, 558.0, 298.0, 38.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.275930404663086, -2.7624034881591797, -1.2488768100738525, 0.2646498680114746, 1.7781767845153809, 3.291703701019287, 4.805230140686035, 6.318757057189941, 7.832283973693848, 9.345810890197754, 10.85933780670166, 12.37286376953125, 13.886390686035156, 15.399917602539062, 16.91344451904297, 18.426971435546875, 19.94049835205078, 21.454025268554688, 22.967552185058594, 24.4810791015625, 25.994606018066406, 27.508132934570312, 29.02165985107422, 30.535186767578125, 32.04871368408203, 33.56224060058594, 35.075767517089844, 36.58929443359375, 38.102821350097656, 39.61634826660156, 41.12987518310547, 42.643402099609375, 44.156925201416016, 45.67045211791992, 47.18397903442383, 48.697505950927734, 50.21103286743164, 51.72455978393555, 53.23808670043945, 54.75161361694336, 56.265140533447266, 57.77866744995117, 59.29219436645508, 60.805721282958984, 62.31924819946289, 63.8327751159668, 65.34629821777344, 66.85982513427734, 68.37335205078125, 69.88687896728516, 71.40040588378906, 72.91393280029297, 74.42745971679688, 75.94098663330078, 77.45451354980469, 78.9680404663086, 80.4815673828125, 81.9950942993164, 83.50862121582031, 85.02214813232422, 86.53567504882812, 88.04920196533203, 89.56272888183594, 91.07625579833984, 92.58978271484375]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 6.0, 2.0, 6.0, 7.0, 9.0, 14.0, 18.0, 21.0, 20.0, 20.0, 18.0, 37.0, 36.0, 40.0, 32.0, 45.0, 38.0, 34.0, 42.0, 35.0, 50.0, 46.0, 37.0, 39.0, 39.0, 34.0, 43.0, 40.0, 32.0, 20.0, 23.0, 25.0, 17.0, 23.0, 9.0, 11.0, 5.0, 7.0, 6.0, 3.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.125627517700195, -10.779850959777832, -10.434075355529785, -10.088298797607422, -9.742523193359375, -9.396746635437012, -9.050970077514648, -8.705194473266602, -8.359418869018555, -8.013642311096191, -7.6678667068481445, -7.322090148925781, -6.976314544677734, -6.630537986755371, -6.284761905670166, -5.938985824584961, -5.593209266662598, -5.247433185577393, -4.9016571044921875, -4.555880546569824, -4.210104942321777, -3.864328622817993, -3.518552303314209, -3.172776222229004, -2.827000141143799, -2.4812240600585938, -2.1354479789733887, -1.7896716594696045, -1.4438955783843994, -1.0981194972991943, -0.7523431777954102, -0.4065670967102051, -0.060791969299316406, 0.28498417139053345, 0.6307603120803833, 0.9765365123748779, 1.322312593460083, 1.668088674545288, 2.0138649940490723, 2.3596410751342773, 2.7054171562194824, 3.0511932373046875, 3.3969693183898926, 3.7427456378936768, 4.088521957397461, 4.434297561645508, 4.780074119567871, 5.125850200653076, 5.471626281738281, 5.817402362823486, 6.163178443908691, 6.508955001831055, 6.854730606079102, 7.200507164001465, 7.54628324508667, 7.892059326171875, 8.237834930419922, 8.583611488342285, 8.929387092590332, 9.275163650512695, 9.620939254760742, 9.966715812683105, 10.312492370605469, 10.658267974853516, 11.004044532775879]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 1.0, 4.0, 4.0, 8.0, 6.0, 13.0, 15.0, 16.0, 16.0, 18.0, 19.0, 23.0, 24.0, 28.0, 33.0, 29.0, 37.0, 32.0, 43.0, 35.0, 35.0, 43.0, 47.0, 39.0, 50.0, 39.0, 46.0, 32.0, 35.0, 31.0, 26.0, 27.0, 29.0, 21.0, 17.0, 16.0, 11.0, 12.0, 15.0, 6.0, 5.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3154296875, -1.274444580078125, -1.23345947265625, -1.192474365234375, -1.1514892578125, -1.110504150390625, -1.06951904296875, -1.028533935546875, -0.987548828125, -0.946563720703125, -0.90557861328125, -0.864593505859375, -0.8236083984375, -0.782623291015625, -0.74163818359375, -0.700653076171875, -0.65966796875, -0.618682861328125, -0.57769775390625, -0.536712646484375, -0.4957275390625, -0.454742431640625, -0.41375732421875, -0.372772216796875, -0.331787109375, -0.290802001953125, -0.24981689453125, -0.208831787109375, -0.1678466796875, -0.126861572265625, -0.08587646484375, -0.044891357421875, -0.00390625, 0.037078857421875, 0.07806396484375, 0.119049072265625, 0.1600341796875, 0.201019287109375, 0.24200439453125, 0.282989501953125, 0.323974609375, 0.364959716796875, 0.40594482421875, 0.446929931640625, 0.4879150390625, 0.528900146484375, 0.56988525390625, 0.610870361328125, 0.65185546875, 0.692840576171875, 0.73382568359375, 0.774810791015625, 0.8157958984375, 0.856781005859375, 0.89776611328125, 0.938751220703125, 0.979736328125, 1.020721435546875, 1.06170654296875, 1.102691650390625, 1.1436767578125, 1.184661865234375, 1.22564697265625, 1.266632080078125, 1.3076171875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 8.0, 8.0, 8.0, 6.0, 9.0, 27.0, 35.0, 40.0, 55.0, 75.0, 109.0, 163.0, 223.0, 387.0, 609.0, 937.0, 1536.0, 2794.0, 5532.0, 11535.0, 28285.0, 84448.0, 376399.0, 1900984.0, 1422673.0, 253829.0, 62249.0, 22057.0, 9207.0, 4380.0, 2241.0, 1254.0, 720.0, 451.0, 328.0, 205.0, 135.0, 106.0, 67.0, 52.0, 32.0, 23.0, 10.0, 13.0, 11.0, 5.0, 8.0, 3.0, 5.0, 1.0, 5.0, 1.0, 0.0, 1.0, 4.0], "bins": [-2.810546875, -2.725067138671875, -2.63958740234375, -2.554107666015625, -2.4686279296875, -2.383148193359375, -2.29766845703125, -2.212188720703125, -2.126708984375, -2.041229248046875, -1.95574951171875, -1.870269775390625, -1.7847900390625, -1.699310302734375, -1.61383056640625, -1.528350830078125, -1.44287109375, -1.357391357421875, -1.27191162109375, -1.186431884765625, -1.1009521484375, -1.015472412109375, -0.92999267578125, -0.844512939453125, -0.759033203125, -0.673553466796875, -0.58807373046875, -0.502593994140625, -0.4171142578125, -0.331634521484375, -0.24615478515625, -0.160675048828125, -0.0751953125, 0.010284423828125, 0.09576416015625, 0.181243896484375, 0.2667236328125, 0.352203369140625, 0.43768310546875, 0.523162841796875, 0.608642578125, 0.694122314453125, 0.77960205078125, 0.865081787109375, 0.9505615234375, 1.036041259765625, 1.12152099609375, 1.207000732421875, 1.29248046875, 1.377960205078125, 1.46343994140625, 1.548919677734375, 1.6343994140625, 1.719879150390625, 1.80535888671875, 1.890838623046875, 1.976318359375, 2.061798095703125, 2.14727783203125, 2.232757568359375, 2.3182373046875, 2.403717041015625, 2.48919677734375, 2.574676513671875, 2.66015625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 7.0, 5.0, 2.0, 12.0, 8.0, 17.0, 20.0, 18.0, 29.0, 36.0, 41.0, 47.0, 69.0, 64.0, 91.0, 141.0, 164.0, 215.0, 271.0, 316.0, 373.0, 375.0, 355.0, 292.0, 243.0, 161.0, 149.0, 115.0, 97.0, 69.0, 57.0, 41.0, 38.0, 25.0, 28.0, 18.0, 11.0, 15.0, 9.0, 9.0, 6.0, 4.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.107421875, -2.043792724609375, -1.98016357421875, -1.916534423828125, -1.8529052734375, -1.789276123046875, -1.72564697265625, -1.662017822265625, -1.598388671875, -1.534759521484375, -1.47113037109375, -1.407501220703125, -1.3438720703125, -1.280242919921875, -1.21661376953125, -1.152984619140625, -1.08935546875, -1.025726318359375, -0.96209716796875, -0.898468017578125, -0.8348388671875, -0.771209716796875, -0.70758056640625, -0.643951416015625, -0.580322265625, -0.516693115234375, -0.45306396484375, -0.389434814453125, -0.3258056640625, -0.262176513671875, -0.19854736328125, -0.134918212890625, -0.0712890625, -0.007659912109375, 0.05596923828125, 0.119598388671875, 0.1832275390625, 0.246856689453125, 0.31048583984375, 0.374114990234375, 0.437744140625, 0.501373291015625, 0.56500244140625, 0.628631591796875, 0.6922607421875, 0.755889892578125, 0.81951904296875, 0.883148193359375, 0.94677734375, 1.010406494140625, 1.07403564453125, 1.137664794921875, 1.2012939453125, 1.264923095703125, 1.32855224609375, 1.392181396484375, 1.455810546875, 1.519439697265625, 1.58306884765625, 1.646697998046875, 1.7103271484375, 1.773956298828125, 1.83758544921875, 1.901214599609375, 1.96484375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 11.0, 9.0, 16.0, 13.0, 18.0, 18.0, 40.0, 38.0, 49.0, 66.0, 79.0, 126.0, 190.0, 328.0, 579.0, 1366.0, 4275.0, 14554.0, 62363.0, 406619.0, 2861153.0, 719580.0, 93406.0, 20040.0, 5665.0, 1847.0, 715.0, 346.0, 203.0, 141.0, 97.0, 69.0, 57.0, 55.0, 30.0, 23.0, 23.0, 25.0, 12.0, 9.0, 6.0, 8.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-5.34375, -5.179931640625, -5.01611328125, -4.852294921875, -4.6884765625, -4.524658203125, -4.36083984375, -4.197021484375, -4.033203125, -3.869384765625, -3.70556640625, -3.541748046875, -3.3779296875, -3.214111328125, -3.05029296875, -2.886474609375, -2.72265625, -2.558837890625, -2.39501953125, -2.231201171875, -2.0673828125, -1.903564453125, -1.73974609375, -1.575927734375, -1.412109375, -1.248291015625, -1.08447265625, -0.920654296875, -0.7568359375, -0.593017578125, -0.42919921875, -0.265380859375, -0.1015625, 0.062255859375, 0.22607421875, 0.389892578125, 0.5537109375, 0.717529296875, 0.88134765625, 1.045166015625, 1.208984375, 1.372802734375, 1.53662109375, 1.700439453125, 1.8642578125, 2.028076171875, 2.19189453125, 2.355712890625, 2.51953125, 2.683349609375, 2.84716796875, 3.010986328125, 3.1748046875, 3.338623046875, 3.50244140625, 3.666259765625, 3.830078125, 3.993896484375, 4.15771484375, 4.321533203125, 4.4853515625, 4.649169921875, 4.81298828125, 4.976806640625, 5.140625]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 8.0, 12.0, 25.0, 30.0, 44.0, 99.0, 146.0, 154.0, 172.0, 135.0, 92.0, 40.0, 24.0, 14.0, 11.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.03251838684082, -15.300535202026367, -14.568552017211914, -13.836569786071777, -13.104586601257324, -12.372603416442871, -11.640621185302734, -10.908638000488281, -10.176654815673828, -9.444671630859375, -8.712688446044922, -7.980706214904785, -7.248723030090332, -6.516739845275879, -5.784757137298584, -5.052774429321289, -4.320791244506836, -3.588808298110962, -2.856825351715088, -2.124842405319214, -1.3928594589233398, -0.6608765125274658, 0.0711064338684082, 0.8030891418457031, 1.5350723266601562, 2.2670552730560303, 2.9990382194519043, 3.7310211658477783, 4.463004112243652, 5.1949872970581055, 5.9269700050354, 6.658952713012695, 7.390933990478516, 8.122917175292969, 8.854900360107422, 9.586882591247559, 10.318865776062012, 11.050848960876465, 11.782831192016602, 12.514814376831055, 13.246797561645508, 13.978780746459961, 14.710763931274414, 15.44274616241455, 16.174728393554688, 16.90671157836914, 17.638694763183594, 18.370677947998047, 19.1026611328125, 19.834644317626953, 20.566627502441406, 21.29861068725586, 22.030593872070312, 22.762575149536133, 23.494558334350586, 24.22654151916504, 24.958524703979492, 25.690507888793945, 26.4224910736084, 27.15447425842285, 27.886455535888672, 28.618438720703125, 29.350421905517578, 30.08240509033203, 30.814388275146484]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 5.0, 1.0, 4.0, 4.0, 8.0, 6.0, 8.0, 10.0, 12.0, 11.0, 16.0, 25.0, 21.0, 25.0, 19.0, 17.0, 21.0, 26.0, 25.0, 26.0, 33.0, 40.0, 30.0, 41.0, 36.0, 42.0, 38.0, 48.0, 36.0, 45.0, 40.0, 40.0, 25.0, 25.0, 21.0, 19.0, 23.0, 19.0, 20.0, 23.0, 14.0, 16.0, 19.0, 10.0, 4.0, 3.0, 3.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.558496475219727, -8.309937477111816, -8.061378479003906, -7.8128204345703125, -7.564261436462402, -7.315702438354492, -7.06714391708374, -6.818585395812988, -6.570026397705078, -6.321467399597168, -6.072908878326416, -5.824350357055664, -5.575791358947754, -5.327232360839844, -5.078673839569092, -4.83011531829834, -4.58155632019043, -4.3329973220825195, -4.084438800811768, -3.8358800411224365, -3.5873212814331055, -3.3387625217437744, -3.0902037620544434, -2.8416450023651123, -2.5930862426757812, -2.34452748298645, -2.095968723297119, -1.847409963607788, -1.598851203918457, -1.350292444229126, -1.101733684539795, -0.8531749248504639, -0.6046161651611328, -0.35605740547180176, -0.1074986457824707, 0.14106011390686035, 0.3896188735961914, 0.6381776332855225, 0.8867363929748535, 1.1352951526641846, 1.3838539123535156, 1.6324126720428467, 1.8809714317321777, 2.129530191421509, 2.37808895111084, 2.626647710800171, 2.875206470489502, 3.123765230178833, 3.372323989868164, 3.620882749557495, 3.869441509246826, 4.118000030517578, 4.366559028625488, 4.615118026733398, 4.86367654800415, 5.112235069274902, 5.3607940673828125, 5.609353065490723, 5.857911586761475, 6.106470108032227, 6.355029106140137, 6.603588104248047, 6.852146625518799, 7.100705146789551, 7.349264144897461]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 8.0, 9.0, 10.0, 13.0, 12.0, 17.0, 9.0, 16.0, 27.0, 21.0, 13.0, 28.0, 28.0, 29.0, 32.0, 28.0, 26.0, 36.0, 30.0, 29.0, 30.0, 28.0, 38.0, 47.0, 31.0, 37.0, 34.0, 41.0, 26.0, 29.0, 26.0, 29.0, 26.0, 17.0, 20.0, 26.0, 17.0, 17.0, 10.0, 8.0, 2.0, 6.0, 9.0, 6.0, 5.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.115234375, -1.0811614990234375, -1.047088623046875, -1.0130157470703125, -0.97894287109375, -0.9448699951171875, -0.910797119140625, -0.8767242431640625, -0.8426513671875, -0.8085784912109375, -0.774505615234375, -0.7404327392578125, -0.70635986328125, -0.6722869873046875, -0.638214111328125, -0.6041412353515625, -0.570068359375, -0.5359954833984375, -0.501922607421875, -0.4678497314453125, -0.43377685546875, -0.3997039794921875, -0.365631103515625, -0.3315582275390625, -0.2974853515625, -0.2634124755859375, -0.229339599609375, -0.1952667236328125, -0.16119384765625, -0.1271209716796875, -0.093048095703125, -0.0589752197265625, -0.02490234375, 0.0091705322265625, 0.043243408203125, 0.0773162841796875, 0.11138916015625, 0.1454620361328125, 0.179534912109375, 0.2136077880859375, 0.2476806640625, 0.2817535400390625, 0.315826416015625, 0.3498992919921875, 0.38397216796875, 0.4180450439453125, 0.452117919921875, 0.4861907958984375, 0.520263671875, 0.5543365478515625, 0.588409423828125, 0.6224822998046875, 0.65655517578125, 0.6906280517578125, 0.724700927734375, 0.7587738037109375, 0.7928466796875, 0.8269195556640625, 0.860992431640625, 0.8950653076171875, 0.92913818359375, 0.9632110595703125, 0.997283935546875, 1.0313568115234375, 1.0654296875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 1.0, 6.0, 9.0, 4.0, 12.0, 12.0, 18.0, 31.0, 43.0, 61.0, 48.0, 75.0, 95.0, 139.0, 225.0, 301.0, 412.0, 635.0, 880.0, 1545.0, 2847.0, 6339.0, 18100.0, 107078.0, 719478.0, 153373.0, 21733.0, 6952.0, 3127.0, 1696.0, 1031.0, 681.0, 457.0, 287.0, 208.0, 160.0, 116.0, 87.0, 75.0, 38.0, 30.0, 27.0, 24.0, 22.0, 18.0, 9.0, 9.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5615234375, -1.506866455078125, -1.45220947265625, -1.397552490234375, -1.3428955078125, -1.288238525390625, -1.23358154296875, -1.178924560546875, -1.124267578125, -1.069610595703125, -1.01495361328125, -0.960296630859375, -0.9056396484375, -0.850982666015625, -0.79632568359375, -0.741668701171875, -0.68701171875, -0.632354736328125, -0.57769775390625, -0.523040771484375, -0.4683837890625, -0.413726806640625, -0.35906982421875, -0.304412841796875, -0.249755859375, -0.195098876953125, -0.14044189453125, -0.085784912109375, -0.0311279296875, 0.023529052734375, 0.07818603515625, 0.132843017578125, 0.1875, 0.242156982421875, 0.29681396484375, 0.351470947265625, 0.4061279296875, 0.460784912109375, 0.51544189453125, 0.570098876953125, 0.624755859375, 0.679412841796875, 0.73406982421875, 0.788726806640625, 0.8433837890625, 0.898040771484375, 0.95269775390625, 1.007354736328125, 1.06201171875, 1.116668701171875, 1.17132568359375, 1.225982666015625, 1.2806396484375, 1.335296630859375, 1.38995361328125, 1.444610595703125, 1.499267578125, 1.553924560546875, 1.60858154296875, 1.663238525390625, 1.7178955078125, 1.772552490234375, 1.82720947265625, 1.881866455078125, 1.9365234375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 9.0, 8.0, 6.0, 5.0, 8.0, 16.0, 20.0, 25.0, 30.0, 35.0, 28.0, 51.0, 44.0, 41.0, 49.0, 43.0, 49.0, 120.0, 1015.0, 33.0, 59.0, 46.0, 39.0, 35.0, 38.0, 31.0, 32.0, 18.0, 20.0, 10.0, 18.0, 10.0, 10.0, 13.0, 6.0, 6.0, 3.0, 2.0, 1.0, 4.0, 3.0], "bins": [-1.3935546875, -1.3595657348632812, -1.3255767822265625, -1.2915878295898438, -1.257598876953125, -1.2236099243164062, -1.1896209716796875, -1.1556320190429688, -1.12164306640625, -1.0876541137695312, -1.0536651611328125, -1.0196762084960938, -0.985687255859375, -0.9516983032226562, -0.9177093505859375, -0.8837203979492188, -0.8497314453125, -0.8157424926757812, -0.7817535400390625, -0.7477645874023438, -0.713775634765625, -0.6797866821289062, -0.6457977294921875, -0.6118087768554688, -0.57781982421875, -0.5438308715820312, -0.5098419189453125, -0.47585296630859375, -0.441864013671875, -0.40787506103515625, -0.3738861083984375, -0.33989715576171875, -0.305908203125, -0.27191925048828125, -0.2379302978515625, -0.20394134521484375, -0.169952392578125, -0.13596343994140625, -0.1019744873046875, -0.06798553466796875, -0.03399658203125, -7.62939453125e-06, 0.0339813232421875, 0.06797027587890625, 0.101959228515625, 0.13594818115234375, 0.1699371337890625, 0.20392608642578125, 0.2379150390625, 0.27190399169921875, 0.3058929443359375, 0.33988189697265625, 0.373870849609375, 0.40785980224609375, 0.4418487548828125, 0.47583770751953125, 0.50982666015625, 0.5438156127929688, 0.5778045654296875, 0.6117935180664062, 0.645782470703125, 0.6797714233398438, 0.7137603759765625, 0.7477493286132812, 0.78173828125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 6.0, 7.0, 5.0, 13.0, 19.0, 17.0, 23.0, 43.0, 59.0, 69.0, 120.0, 148.0, 160.0, 260.0, 355.0, 504.0, 829.0, 1205.0, 2056.0, 4312.0, 13173.0, 85551.0, 1748156.0, 206713.0, 20818.0, 5636.0, 2517.0, 1376.0, 879.0, 636.0, 418.0, 292.0, 190.0, 144.0, 123.0, 85.0, 61.0, 37.0, 32.0, 25.0, 16.0, 15.0, 9.0, 6.0, 8.0, 5.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.109375, -1.07318115234375, -1.0369873046875, -1.00079345703125, -0.964599609375, -0.92840576171875, -0.8922119140625, -0.85601806640625, -0.81982421875, -0.78363037109375, -0.7474365234375, -0.71124267578125, -0.675048828125, -0.63885498046875, -0.6026611328125, -0.56646728515625, -0.5302734375, -0.49407958984375, -0.4578857421875, -0.42169189453125, -0.385498046875, -0.34930419921875, -0.3131103515625, -0.27691650390625, -0.24072265625, -0.20452880859375, -0.1683349609375, -0.13214111328125, -0.095947265625, -0.05975341796875, -0.0235595703125, 0.01263427734375, 0.048828125, 0.08502197265625, 0.1212158203125, 0.15740966796875, 0.193603515625, 0.22979736328125, 0.2659912109375, 0.30218505859375, 0.33837890625, 0.37457275390625, 0.4107666015625, 0.44696044921875, 0.483154296875, 0.51934814453125, 0.5555419921875, 0.59173583984375, 0.6279296875, 0.66412353515625, 0.7003173828125, 0.73651123046875, 0.772705078125, 0.80889892578125, 0.8450927734375, 0.88128662109375, 0.91748046875, 0.95367431640625, 0.9898681640625, 1.02606201171875, 1.062255859375, 1.09844970703125, 1.1346435546875, 1.17083740234375, 1.20703125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 7.0, 8.0, 7.0, 10.0, 24.0, 30.0, 50.0, 81.0, 130.0, 178.0, 164.0, 85.0, 71.0, 40.0, 26.0, 23.0, 12.0, 15.0, 6.0, 2.0, 5.0, 2.0, 5.0, 2.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11334228515625, -0.10942363739013672, -0.10550498962402344, -0.10158634185791016, -0.09766769409179688, -0.0937490463256836, -0.08983039855957031, -0.08591175079345703, -0.08199310302734375, -0.07807445526123047, -0.07415580749511719, -0.0702371597290039, -0.06631851196289062, -0.062399864196777344, -0.05848121643066406, -0.05456256866455078, -0.0506439208984375, -0.04672527313232422, -0.04280662536621094, -0.038887977600097656, -0.034969329833984375, -0.031050682067871094, -0.027132034301757812, -0.02321338653564453, -0.01929473876953125, -0.015376091003417969, -0.011457443237304688, -0.007538795471191406, -0.003620147705078125, 0.00029850006103515625, 0.0042171478271484375, 0.008135795593261719, 0.012054443359375, 0.01597309112548828, 0.019891738891601562, 0.023810386657714844, 0.027729034423828125, 0.031647682189941406, 0.03556632995605469, 0.03948497772216797, 0.04340362548828125, 0.04732227325439453, 0.05124092102050781, 0.055159568786621094, 0.059078216552734375, 0.06299686431884766, 0.06691551208496094, 0.07083415985107422, 0.0747528076171875, 0.07867145538330078, 0.08259010314941406, 0.08650875091552734, 0.09042739868164062, 0.0943460464477539, 0.09826469421386719, 0.10218334197998047, 0.10610198974609375, 0.11002063751220703, 0.11393928527832031, 0.1178579330444336, 0.12177658081054688, 0.12569522857666016, 0.12961387634277344, 0.13353252410888672, 0.137451171875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 7.0, 5.0, 17.0, 19.0, 29.0, 58.0, 158.0, 579.0, 3085.0, 94387.0, 942488.0, 6324.0, 958.0, 257.0, 76.0, 34.0, 18.0, 6.0, 9.0, 9.0, 2.0, 10.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.27734375, -2.20654296875, -2.1357421875, -2.06494140625, -1.994140625, -1.92333984375, -1.8525390625, -1.78173828125, -1.7109375, -1.64013671875, -1.5693359375, -1.49853515625, -1.427734375, -1.35693359375, -1.2861328125, -1.21533203125, -1.14453125, -1.07373046875, -1.0029296875, -0.93212890625, -0.861328125, -0.79052734375, -0.7197265625, -0.64892578125, -0.578125, -0.50732421875, -0.4365234375, -0.36572265625, -0.294921875, -0.22412109375, -0.1533203125, -0.08251953125, -0.01171875, 0.05908203125, 0.1298828125, 0.20068359375, 0.271484375, 0.34228515625, 0.4130859375, 0.48388671875, 0.5546875, 0.62548828125, 0.6962890625, 0.76708984375, 0.837890625, 0.90869140625, 0.9794921875, 1.05029296875, 1.12109375, 1.19189453125, 1.2626953125, 1.33349609375, 1.404296875, 1.47509765625, 1.5458984375, 1.61669921875, 1.6875, 1.75830078125, 1.8291015625, 1.89990234375, 1.970703125, 2.04150390625, 2.1123046875, 2.18310546875, 2.25390625]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 8.0, 26.0, 130.0, 370.0, 322.0, 107.0, 34.0, 10.0, 9.0], "bins": [-1.187180995941162, -1.167055368423462, -1.1469296216964722, -1.126803994178772, -1.1066782474517822, -1.086552619934082, -1.0664268732070923, -1.046301245689392, -1.0261754989624023, -1.0060498714447021, -0.9859241247177124, -0.9657984375953674, -0.9456727504730225, -0.9255471229553223, -0.9054213762283325, -0.8852957487106323, -0.8651701211929321, -0.8450444340705872, -0.8249187469482422, -0.8047930598258972, -0.7846673727035522, -0.764541745185852, -0.7444159984588623, -0.7242903709411621, -0.7041646242141724, -0.6840389370918274, -0.6639132499694824, -0.6437875628471375, -0.6236618757247925, -0.6035362482070923, -0.5834105014801025, -0.5632848739624023, -0.5431591868400574, -0.5230334997177124, -0.5029078125953674, -0.48278212547302246, -0.4626564681529999, -0.4425307810306549, -0.42240509390830994, -0.40227943658828735, -0.38215371966362, -0.362028032541275, -0.34190234541893005, -0.32177668809890747, -0.3016510009765625, -0.28152531385421753, -0.26139962673187256, -0.24127395451068878, -0.221148282289505, -0.20102259516716003, -0.18089692294597626, -0.1607712358236313, -0.1406455636024475, -0.12051987648010254, -0.10039418935775757, -0.08026851713657379, -0.060142822563648224, -0.04001714289188385, -0.019891459494829178, 0.00023422390222549438, 0.020359903573989868, 0.04048558324575424, 0.06061127036809921, 0.08073694258928299, 0.10086262971162796]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 9.0, 6.0, 8.0, 9.0, 8.0, 8.0, 12.0, 12.0, 12.0, 15.0, 20.0, 23.0, 20.0, 35.0, 29.0, 28.0, 39.0, 27.0, 33.0, 36.0, 36.0, 36.0, 38.0, 28.0, 30.0, 36.0, 43.0, 28.0, 28.0, 36.0, 24.0, 34.0, 26.0, 31.0, 23.0, 22.0, 12.0, 11.0, 18.0, 15.0, 14.0, 8.0, 5.0, 6.0, 7.0, 4.0, 6.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.09237515926361084, -0.08942973613739014, -0.08648431301116943, -0.08353888988494873, -0.08059346675872803, -0.07764804363250732, -0.07470262050628662, -0.07175719738006592, -0.06881177425384521, -0.06586635112762451, -0.06292092800140381, -0.059975504875183105, -0.0570300817489624, -0.0540846586227417, -0.051139235496520996, -0.04819381237030029, -0.04524838924407959, -0.04230296611785889, -0.039357542991638184, -0.03641211986541748, -0.03346669673919678, -0.030521273612976074, -0.02757585048675537, -0.024630427360534668, -0.021685004234313965, -0.01873958110809326, -0.01579415798187256, -0.012848734855651855, -0.009903311729431152, -0.006957888603210449, -0.004012465476989746, -0.001067042350769043, 0.0018783807754516602, 0.004823803901672363, 0.007769227027893066, 0.01071465015411377, 0.013660073280334473, 0.016605496406555176, 0.01955091953277588, 0.022496342658996582, 0.025441765785217285, 0.02838718891143799, 0.03133261203765869, 0.034278035163879395, 0.0372234582901001, 0.0401688814163208, 0.043114304542541504, 0.04605972766876221, 0.04900515079498291, 0.05195057392120361, 0.054895997047424316, 0.05784142017364502, 0.06078684329986572, 0.06373226642608643, 0.06667768955230713, 0.06962311267852783, 0.07256853580474854, 0.07551395893096924, 0.07845938205718994, 0.08140480518341064, 0.08435022830963135, 0.08729565143585205, 0.09024107456207275, 0.09318649768829346, 0.09613192081451416]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 9.0, 9.0, 12.0, 9.0, 13.0, 17.0, 11.0, 17.0, 25.0, 20.0, 15.0, 28.0, 28.0, 30.0, 31.0, 29.0, 29.0, 33.0, 30.0, 29.0, 29.0, 26.0, 45.0, 41.0, 33.0, 36.0, 38.0, 36.0, 30.0, 30.0, 21.0, 27.0, 29.0, 19.0, 19.0, 23.0, 21.0, 13.0, 10.0, 8.0, 3.0, 6.0, 7.0, 7.0, 6.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.11328125, -1.0791778564453125, -1.045074462890625, -1.0109710693359375, -0.97686767578125, -0.9427642822265625, -0.908660888671875, -0.8745574951171875, -0.8404541015625, -0.8063507080078125, -0.772247314453125, -0.7381439208984375, -0.70404052734375, -0.6699371337890625, -0.635833740234375, -0.6017303466796875, -0.567626953125, -0.5335235595703125, -0.499420166015625, -0.4653167724609375, -0.43121337890625, -0.3971099853515625, -0.363006591796875, -0.3289031982421875, -0.2947998046875, -0.2606964111328125, -0.226593017578125, -0.1924896240234375, -0.15838623046875, -0.1242828369140625, -0.090179443359375, -0.0560760498046875, -0.02197265625, 0.0121307373046875, 0.046234130859375, 0.0803375244140625, 0.11444091796875, 0.1485443115234375, 0.182647705078125, 0.2167510986328125, 0.2508544921875, 0.2849578857421875, 0.319061279296875, 0.3531646728515625, 0.38726806640625, 0.4213714599609375, 0.455474853515625, 0.4895782470703125, 0.523681640625, 0.5577850341796875, 0.591888427734375, 0.6259918212890625, 0.66009521484375, 0.6941986083984375, 0.728302001953125, 0.7624053955078125, 0.7965087890625, 0.8306121826171875, 0.864715576171875, 0.8988189697265625, 0.93292236328125, 0.9670257568359375, 1.001129150390625, 1.0352325439453125, 1.0693359375]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 7.0, 14.0, 21.0, 25.0, 65.0, 94.0, 174.0, 234.0, 426.0, 749.0, 1305.0, 2220.0, 3900.0, 7060.0, 13745.0, 28255.0, 66275.0, 177518.0, 401195.0, 204087.0, 76206.0, 31950.0, 15072.0, 7899.0, 4294.0, 2445.0, 1357.0, 815.0, 485.0, 287.0, 167.0, 96.0, 52.0, 28.0, 18.0, 5.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.197265625, -2.135498046875, -2.07373046875, -2.011962890625, -1.9501953125, -1.888427734375, -1.82666015625, -1.764892578125, -1.703125, -1.641357421875, -1.57958984375, -1.517822265625, -1.4560546875, -1.394287109375, -1.33251953125, -1.270751953125, -1.208984375, -1.147216796875, -1.08544921875, -1.023681640625, -0.9619140625, -0.900146484375, -0.83837890625, -0.776611328125, -0.71484375, -0.653076171875, -0.59130859375, -0.529541015625, -0.4677734375, -0.406005859375, -0.34423828125, -0.282470703125, -0.220703125, -0.158935546875, -0.09716796875, -0.035400390625, 0.0263671875, 0.088134765625, 0.14990234375, 0.211669921875, 0.2734375, 0.335205078125, 0.39697265625, 0.458740234375, 0.5205078125, 0.582275390625, 0.64404296875, 0.705810546875, 0.767578125, 0.829345703125, 0.89111328125, 0.952880859375, 1.0146484375, 1.076416015625, 1.13818359375, 1.199951171875, 1.26171875, 1.323486328125, 1.38525390625, 1.447021484375, 1.5087890625, 1.570556640625, 1.63232421875, 1.694091796875, 1.755859375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 2.0, 14.0, 5.0, 19.0, 11.0, 14.0, 25.0, 30.0, 23.0, 33.0, 39.0, 29.0, 50.0, 55.0, 88.0, 147.0, 283.0, 1429.0, 202.0, 131.0, 55.0, 62.0, 59.0, 37.0, 31.0, 33.0, 35.0, 19.0, 20.0, 11.0, 13.0, 12.0, 10.0, 2.0, 3.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-4.62109375, -4.486083984375, -4.35107421875, -4.216064453125, -4.0810546875, -3.946044921875, -3.81103515625, -3.676025390625, -3.541015625, -3.406005859375, -3.27099609375, -3.135986328125, -3.0009765625, -2.865966796875, -2.73095703125, -2.595947265625, -2.4609375, -2.325927734375, -2.19091796875, -2.055908203125, -1.9208984375, -1.785888671875, -1.65087890625, -1.515869140625, -1.380859375, -1.245849609375, -1.11083984375, -0.975830078125, -0.8408203125, -0.705810546875, -0.57080078125, -0.435791015625, -0.30078125, -0.165771484375, -0.03076171875, 0.104248046875, 0.2392578125, 0.374267578125, 0.50927734375, 0.644287109375, 0.779296875, 0.914306640625, 1.04931640625, 1.184326171875, 1.3193359375, 1.454345703125, 1.58935546875, 1.724365234375, 1.859375, 1.994384765625, 2.12939453125, 2.264404296875, 2.3994140625, 2.534423828125, 2.66943359375, 2.804443359375, 2.939453125, 3.074462890625, 3.20947265625, 3.344482421875, 3.4794921875, 3.614501953125, 3.74951171875, 3.884521484375, 4.01953125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 10.0, 8.0, 5.0, 18.0, 17.0, 12.0, 21.0, 31.0, 28.0, 48.0, 72.0, 59.0, 83.0, 139.0, 156.0, 208.0, 290.0, 531.0, 1669.0, 9367.0, 126608.0, 2698484.0, 287866.0, 15790.0, 2223.0, 631.0, 320.0, 237.0, 137.0, 144.0, 110.0, 84.0, 62.0, 52.0, 28.0, 35.0, 28.0, 22.0, 19.0, 13.0, 10.0, 10.0, 5.0, 1.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.75390625, -6.540283203125, -6.32666015625, -6.113037109375, -5.8994140625, -5.685791015625, -5.47216796875, -5.258544921875, -5.044921875, -4.831298828125, -4.61767578125, -4.404052734375, -4.1904296875, -3.976806640625, -3.76318359375, -3.549560546875, -3.3359375, -3.122314453125, -2.90869140625, -2.695068359375, -2.4814453125, -2.267822265625, -2.05419921875, -1.840576171875, -1.626953125, -1.413330078125, -1.19970703125, -0.986083984375, -0.7724609375, -0.558837890625, -0.34521484375, -0.131591796875, 0.08203125, 0.295654296875, 0.50927734375, 0.722900390625, 0.9365234375, 1.150146484375, 1.36376953125, 1.577392578125, 1.791015625, 2.004638671875, 2.21826171875, 2.431884765625, 2.6455078125, 2.859130859375, 3.07275390625, 3.286376953125, 3.5, 3.713623046875, 3.92724609375, 4.140869140625, 4.3544921875, 4.568115234375, 4.78173828125, 4.995361328125, 5.208984375, 5.422607421875, 5.63623046875, 5.849853515625, 6.0634765625, 6.277099609375, 6.49072265625, 6.704345703125, 6.91796875]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 15.0, 47.0, 147.0, 292.0, 254.0, 173.0, 65.0, 22.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.716951847076416, -5.98073673248291, -5.244521617889404, -4.508306503295898, -3.7720913887023926, -3.0358762741088867, -2.299661159515381, -1.563446044921875, -0.8272309303283691, -0.09101581573486328, 0.6451992988586426, 1.3814144134521484, 2.1176295280456543, 2.85384464263916, 3.590059757232666, 4.326274871826172, 5.062489986419678, 5.798705101013184, 6.5349202156066895, 7.271135330200195, 8.00735092163086, 8.743565559387207, 9.479780197143555, 10.215995788574219, 10.952211380004883, 11.688426971435547, 12.424641609191895, 13.160856246948242, 13.897071838378906, 14.63328742980957, 15.369502067565918, 16.105716705322266, 16.841930389404297, 17.57814598083496, 18.314361572265625, 19.050575256347656, 19.78679084777832, 20.523006439208984, 21.259220123291016, 21.99543571472168, 22.731651306152344, 23.467866897583008, 24.204082489013672, 24.940296173095703, 25.676511764526367, 26.41272735595703, 27.148941040039062, 27.885156631469727, 28.62137222290039, 29.357587814331055, 30.09380340576172, 30.83001708984375, 31.566232681274414, 32.30244827270508, 33.03866195678711, 33.774879455566406, 34.51109313964844, 35.24730682373047, 35.983524322509766, 36.7197380065918, 37.455955505371094, 38.192169189453125, 38.928382873535156, 39.66460037231445, 40.400814056396484]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 10.0, 10.0, 11.0, 10.0, 19.0, 13.0, 18.0, 23.0, 27.0, 34.0, 35.0, 29.0, 53.0, 35.0, 33.0, 42.0, 30.0, 41.0, 52.0, 41.0, 42.0, 39.0, 41.0, 30.0, 25.0, 37.0, 26.0, 24.0, 19.0, 28.0, 20.0, 23.0, 15.0, 10.0, 6.0, 4.0, 10.0, 7.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.161998748779297, -10.809913635253906, -10.457829475402832, -10.105744361877441, -9.753660202026367, -9.401575088500977, -9.049489974975586, -8.697405815124512, -8.345321655273438, -7.993237018585205, -7.641152381896973, -7.289067268371582, -6.936983108520508, -6.584897994995117, -6.232813358306885, -5.880728721618652, -5.528643608093262, -5.176558971405029, -4.824474334716797, -4.472389221191406, -4.120305061340332, -3.7682201862335205, -3.416135311126709, -3.0640506744384766, -2.711966037750244, -2.3598814010620117, -2.0077967643737793, -1.6557118892669678, -1.3036272525787354, -0.9515426158905029, -0.5994577407836914, -0.24737310409545898, 0.10471248626708984, 0.45679718255996704, 0.8088818788528442, 1.1609666347503662, 1.5130512714385986, 1.865135908126831, 2.2172207832336426, 2.569305419921875, 2.9213900566101074, 3.27347469329834, 3.6255593299865723, 3.977644205093384, 4.329729080200195, 4.6818132400512695, 5.03389835357666, 5.385982990264893, 5.738067626953125, 6.090152263641357, 6.44223690032959, 6.7943220138549805, 7.146406173706055, 7.498491287231445, 7.850575923919678, 8.20266056060791, 8.554744720458984, 8.906829833984375, 9.25891399383545, 9.61099910736084, 9.963083267211914, 10.315168380737305, 10.667253494262695, 11.01933765411377, 11.37142276763916]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 7.0, 9.0, 8.0, 12.0, 15.0, 21.0, 19.0, 16.0, 18.0, 27.0, 22.0, 25.0, 28.0, 40.0, 37.0, 29.0, 30.0, 35.0, 34.0, 37.0, 50.0, 38.0, 30.0, 50.0, 42.0, 31.0, 32.0, 36.0, 25.0, 28.0, 27.0, 19.0, 23.0, 13.0, 14.0, 22.0, 12.0, 10.0, 6.0, 2.0, 9.0, 4.0, 0.0, 7.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.294921875, -1.2559356689453125, -1.216949462890625, -1.1779632568359375, -1.13897705078125, -1.0999908447265625, -1.061004638671875, -1.0220184326171875, -0.9830322265625, -0.9440460205078125, -0.905059814453125, -0.8660736083984375, -0.82708740234375, -0.7881011962890625, -0.749114990234375, -0.7101287841796875, -0.671142578125, -0.6321563720703125, -0.593170166015625, -0.5541839599609375, -0.51519775390625, -0.4762115478515625, -0.437225341796875, -0.3982391357421875, -0.3592529296875, -0.3202667236328125, -0.281280517578125, -0.2422943115234375, -0.20330810546875, -0.1643218994140625, -0.125335693359375, -0.0863494873046875, -0.04736328125, -0.0083770751953125, 0.030609130859375, 0.0695953369140625, 0.10858154296875, 0.1475677490234375, 0.186553955078125, 0.2255401611328125, 0.2645263671875, 0.3035125732421875, 0.342498779296875, 0.3814849853515625, 0.42047119140625, 0.4594573974609375, 0.498443603515625, 0.5374298095703125, 0.576416015625, 0.6154022216796875, 0.654388427734375, 0.6933746337890625, 0.73236083984375, 0.7713470458984375, 0.810333251953125, 0.8493194580078125, 0.8883056640625, 0.9272918701171875, 0.966278076171875, 1.0052642822265625, 1.04425048828125, 1.0832366943359375, 1.122222900390625, 1.1612091064453125, 1.2001953125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 5.0, 8.0, 11.0, 14.0, 17.0, 38.0, 47.0, 46.0, 77.0, 92.0, 109.0, 196.0, 330.0, 454.0, 696.0, 1165.0, 1907.0, 3365.0, 6504.0, 13287.0, 30558.0, 83611.0, 322388.0, 1574726.0, 1655611.0, 350451.0, 88244.0, 31229.0, 13813.0, 6691.0, 3537.0, 1921.0, 1180.0, 677.0, 420.0, 266.0, 189.0, 119.0, 84.0, 43.0, 60.0, 32.0, 20.0, 17.0, 13.0, 5.0, 7.0, 4.0, 5.0, 2.0, 0.0, 1.0], "bins": [-2.859375, -2.779998779296875, -2.70062255859375, -2.621246337890625, -2.5418701171875, -2.462493896484375, -2.38311767578125, -2.303741455078125, -2.224365234375, -2.144989013671875, -2.06561279296875, -1.986236572265625, -1.9068603515625, -1.827484130859375, -1.74810791015625, -1.668731689453125, -1.58935546875, -1.509979248046875, -1.43060302734375, -1.351226806640625, -1.2718505859375, -1.192474365234375, -1.11309814453125, -1.033721923828125, -0.954345703125, -0.874969482421875, -0.79559326171875, -0.716217041015625, -0.6368408203125, -0.557464599609375, -0.47808837890625, -0.398712158203125, -0.3193359375, -0.239959716796875, -0.16058349609375, -0.081207275390625, -0.0018310546875, 0.077545166015625, 0.15692138671875, 0.236297607421875, 0.315673828125, 0.395050048828125, 0.47442626953125, 0.553802490234375, 0.6331787109375, 0.712554931640625, 0.79193115234375, 0.871307373046875, 0.95068359375, 1.030059814453125, 1.10943603515625, 1.188812255859375, 1.2681884765625, 1.347564697265625, 1.42694091796875, 1.506317138671875, 1.585693359375, 1.665069580078125, 1.74444580078125, 1.823822021484375, 1.9031982421875, 1.982574462890625, 2.06195068359375, 2.141326904296875, 2.220703125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 6.0, 17.0, 17.0, 28.0, 33.0, 59.0, 62.0, 84.0, 118.0, 120.0, 170.0, 245.0, 268.0, 368.0, 448.0, 456.0, 382.0, 295.0, 190.0, 162.0, 137.0, 99.0, 75.0, 49.0, 33.0, 26.0, 39.0, 17.0, 14.0, 13.0, 8.0, 4.0, 4.0, 2.0, 6.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4921875, -2.420989990234375, -2.34979248046875, -2.278594970703125, -2.2073974609375, -2.136199951171875, -2.06500244140625, -1.993804931640625, -1.922607421875, -1.851409912109375, -1.78021240234375, -1.709014892578125, -1.6378173828125, -1.566619873046875, -1.49542236328125, -1.424224853515625, -1.35302734375, -1.281829833984375, -1.21063232421875, -1.139434814453125, -1.0682373046875, -0.997039794921875, -0.92584228515625, -0.854644775390625, -0.783447265625, -0.712249755859375, -0.64105224609375, -0.569854736328125, -0.4986572265625, -0.427459716796875, -0.35626220703125, -0.285064697265625, -0.2138671875, -0.142669677734375, -0.07147216796875, -0.000274658203125, 0.0709228515625, 0.142120361328125, 0.21331787109375, 0.284515380859375, 0.355712890625, 0.426910400390625, 0.49810791015625, 0.569305419921875, 0.6405029296875, 0.711700439453125, 0.78289794921875, 0.854095458984375, 0.92529296875, 0.996490478515625, 1.06768798828125, 1.138885498046875, 1.2100830078125, 1.281280517578125, 1.35247802734375, 1.423675537109375, 1.494873046875, 1.566070556640625, 1.63726806640625, 1.708465576171875, 1.7796630859375, 1.850860595703125, 1.92205810546875, 1.993255615234375, 2.064453125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 5.0, 6.0, 8.0, 9.0, 14.0, 14.0, 31.0, 31.0, 46.0, 53.0, 69.0, 95.0, 127.0, 177.0, 335.0, 695.0, 1908.0, 6751.0, 31714.0, 199017.0, 2249705.0, 1531481.0, 139723.0, 23560.0, 5386.0, 1685.0, 602.0, 325.0, 200.0, 131.0, 84.0, 85.0, 49.0, 43.0, 31.0, 22.0, 24.0, 14.0, 14.0, 10.0, 5.0, 1.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7890625, -4.61749267578125, -4.4459228515625, -4.27435302734375, -4.102783203125, -3.93121337890625, -3.7596435546875, -3.58807373046875, -3.41650390625, -3.24493408203125, -3.0733642578125, -2.90179443359375, -2.730224609375, -2.55865478515625, -2.3870849609375, -2.21551513671875, -2.0439453125, -1.87237548828125, -1.7008056640625, -1.52923583984375, -1.357666015625, -1.18609619140625, -1.0145263671875, -0.84295654296875, -0.67138671875, -0.49981689453125, -0.3282470703125, -0.15667724609375, 0.014892578125, 0.18646240234375, 0.3580322265625, 0.52960205078125, 0.701171875, 0.87274169921875, 1.0443115234375, 1.21588134765625, 1.387451171875, 1.55902099609375, 1.7305908203125, 1.90216064453125, 2.07373046875, 2.24530029296875, 2.4168701171875, 2.58843994140625, 2.760009765625, 2.93157958984375, 3.1031494140625, 3.27471923828125, 3.4462890625, 3.61785888671875, 3.7894287109375, 3.96099853515625, 4.132568359375, 4.30413818359375, 4.4757080078125, 4.64727783203125, 4.81884765625, 4.99041748046875, 5.1619873046875, 5.33355712890625, 5.505126953125, 5.67669677734375, 5.8482666015625, 6.01983642578125, 6.19140625]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 10.0, 8.0, 14.0, 34.0, 33.0, 48.0, 42.0, 71.0, 77.0, 87.0, 93.0, 103.0, 95.0, 83.0, 58.0, 43.0, 45.0, 22.0, 16.0, 7.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.091376304626465, -12.691540718078613, -12.291706085205078, -11.891870498657227, -11.492034912109375, -11.092199325561523, -10.692363739013672, -10.292529106140137, -9.892693519592285, -9.492857933044434, -9.093023300170898, -8.693187713623047, -8.293352127075195, -7.893516540527344, -7.49368143081665, -7.093846321105957, -6.6940107345581055, -6.294175148010254, -5.8943400382995605, -5.494504928588867, -5.094669342041016, -4.694833755493164, -4.294998645782471, -3.8951632976531982, -3.495327949523926, -3.0954926013946533, -2.695657253265381, -2.2958219051361084, -1.895986557006836, -1.4961512088775635, -1.096315860748291, -0.6964805126190186, -0.2966461181640625, 0.10318922996520996, 0.5030245780944824, 0.9028599262237549, 1.3026952743530273, 1.7025306224822998, 2.1023659706115723, 2.5022013187408447, 2.902036666870117, 3.3018720149993896, 3.701707363128662, 4.1015424728393555, 4.501378059387207, 4.901213645935059, 5.301048755645752, 5.700883865356445, 6.100719451904297, 6.500555038452148, 6.900390148162842, 7.300225257873535, 7.700060844421387, 8.099896430969238, 8.499731063842773, 8.899566650390625, 9.299402236938477, 9.699237823486328, 10.09907341003418, 10.498908042907715, 10.898743629455566, 11.298579216003418, 11.698413848876953, 12.098249435424805, 12.498085021972656]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 6.0, 10.0, 11.0, 5.0, 16.0, 8.0, 13.0, 13.0, 17.0, 34.0, 25.0, 27.0, 33.0, 30.0, 37.0, 28.0, 34.0, 36.0, 33.0, 44.0, 44.0, 41.0, 48.0, 43.0, 41.0, 38.0, 32.0, 22.0, 35.0, 23.0, 18.0, 25.0, 21.0, 13.0, 17.0, 23.0, 11.0, 14.0, 5.0, 3.0, 6.0, 4.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-7.456425666809082, -7.211144924163818, -6.965864181518555, -6.720583438873291, -6.475302696228027, -6.230021953582764, -5.9847412109375, -5.739459991455078, -5.494179725646973, -5.248898983001709, -5.003618240356445, -4.758337497711182, -4.513056755065918, -4.267776012420654, -4.022495269775391, -3.777214288711548, -3.531933307647705, -3.2866525650024414, -3.0413718223571777, -2.796091079711914, -2.5508103370666504, -2.3055295944213867, -2.060248613357544, -1.8149678707122803, -1.5696871280670166, -1.324406385421753, -1.0791256427764893, -0.833844780921936, -0.5885640382766724, -0.3432832956314087, -0.09800243377685547, 0.1472783088684082, 0.3925590515136719, 0.6378397941589355, 0.883120596408844, 1.1284013986587524, 1.3736821413040161, 1.6189628839492798, 1.864243745803833, 2.1095244884490967, 2.3548052310943604, 2.600085973739624, 2.8453667163848877, 3.0906476974487305, 3.335928440093994, 3.581209182739258, 3.8264899253845215, 4.071770668029785, 4.317051410675049, 4.5623321533203125, 4.807612895965576, 5.05289363861084, 5.2981743812561035, 5.543455123901367, 5.788736343383789, 6.0340166091918945, 6.279297828674316, 6.52457857131958, 6.769859313964844, 7.015140056610107, 7.260420799255371, 7.505701541900635, 7.750982284545898, 7.99626350402832, 8.241543769836426]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 9.0, 6.0, 14.0, 20.0, 14.0, 17.0, 14.0, 17.0, 23.0, 28.0, 26.0, 25.0, 28.0, 33.0, 31.0, 35.0, 31.0, 36.0, 49.0, 33.0, 49.0, 48.0, 36.0, 42.0, 33.0, 35.0, 32.0, 33.0, 28.0, 24.0, 18.0, 21.0, 18.0, 20.0, 22.0, 10.0, 4.0, 4.0, 10.0, 7.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.3681640625, -1.3296356201171875, -1.291107177734375, -1.2525787353515625, -1.21405029296875, -1.1755218505859375, -1.136993408203125, -1.0984649658203125, -1.0599365234375, -1.0214080810546875, -0.982879638671875, -0.9443511962890625, -0.90582275390625, -0.8672943115234375, -0.828765869140625, -0.7902374267578125, -0.751708984375, -0.7131805419921875, -0.674652099609375, -0.6361236572265625, -0.59759521484375, -0.5590667724609375, -0.520538330078125, -0.4820098876953125, -0.4434814453125, -0.4049530029296875, -0.366424560546875, -0.3278961181640625, -0.28936767578125, -0.2508392333984375, -0.212310791015625, -0.1737823486328125, -0.13525390625, -0.0967254638671875, -0.058197021484375, -0.0196685791015625, 0.01885986328125, 0.0573883056640625, 0.095916748046875, 0.1344451904296875, 0.1729736328125, 0.2115020751953125, 0.250030517578125, 0.2885589599609375, 0.32708740234375, 0.3656158447265625, 0.404144287109375, 0.4426727294921875, 0.481201171875, 0.5197296142578125, 0.558258056640625, 0.5967864990234375, 0.63531494140625, 0.6738433837890625, 0.712371826171875, 0.7509002685546875, 0.7894287109375, 0.8279571533203125, 0.866485595703125, 0.9050140380859375, 0.94354248046875, 0.9820709228515625, 1.020599365234375, 1.0591278076171875, 1.09765625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 12.0, 21.0, 17.0, 34.0, 47.0, 60.0, 83.0, 126.0, 174.0, 266.0, 392.0, 554.0, 766.0, 1151.0, 1703.0, 3077.0, 6930.0, 20996.0, 81131.0, 344220.0, 428524.0, 112448.0, 27737.0, 8685.0, 3498.0, 1937.0, 1225.0, 796.0, 581.0, 418.0, 291.0, 195.0, 148.0, 101.0, 69.0, 46.0, 26.0, 20.0, 22.0, 8.0, 7.0, 8.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7119140625, -0.6856536865234375, -0.659393310546875, -0.6331329345703125, -0.60687255859375, -0.5806121826171875, -0.554351806640625, -0.5280914306640625, -0.5018310546875, -0.4755706787109375, -0.449310302734375, -0.4230499267578125, -0.39678955078125, -0.3705291748046875, -0.344268798828125, -0.3180084228515625, -0.291748046875, -0.2654876708984375, -0.239227294921875, -0.2129669189453125, -0.18670654296875, -0.1604461669921875, -0.134185791015625, -0.1079254150390625, -0.0816650390625, -0.0554046630859375, -0.029144287109375, -0.0028839111328125, 0.02337646484375, 0.0496368408203125, 0.075897216796875, 0.1021575927734375, 0.12841796875, 0.1546783447265625, 0.180938720703125, 0.2071990966796875, 0.23345947265625, 0.2597198486328125, 0.285980224609375, 0.3122406005859375, 0.3385009765625, 0.3647613525390625, 0.391021728515625, 0.4172821044921875, 0.44354248046875, 0.4698028564453125, 0.496063232421875, 0.5223236083984375, 0.548583984375, 0.5748443603515625, 0.601104736328125, 0.6273651123046875, 0.65362548828125, 0.6798858642578125, 0.706146240234375, 0.7324066162109375, 0.7586669921875, 0.7849273681640625, 0.811187744140625, 0.8374481201171875, 0.86370849609375, 0.8899688720703125, 0.916229248046875, 0.9424896240234375, 0.96875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 11.0, 10.0, 12.0, 14.0, 13.0, 28.0, 22.0, 30.0, 23.0, 21.0, 39.0, 28.0, 38.0, 40.0, 44.0, 48.0, 38.0, 1071.0, 51.0, 33.0, 49.0, 36.0, 32.0, 21.0, 45.0, 35.0, 27.0, 27.0, 18.0, 19.0, 13.0, 17.0, 7.0, 11.0, 8.0, 5.0, 7.0, 5.0, 6.0, 6.0, 5.0, 4.0, 1.0, 3.0], "bins": [-1.0068359375, -0.98016357421875, -0.9534912109375, -0.92681884765625, -0.900146484375, -0.87347412109375, -0.8468017578125, -0.82012939453125, -0.79345703125, -0.76678466796875, -0.7401123046875, -0.71343994140625, -0.686767578125, -0.66009521484375, -0.6334228515625, -0.60675048828125, -0.580078125, -0.55340576171875, -0.5267333984375, -0.50006103515625, -0.473388671875, -0.44671630859375, -0.4200439453125, -0.39337158203125, -0.36669921875, -0.34002685546875, -0.3133544921875, -0.28668212890625, -0.260009765625, -0.23333740234375, -0.2066650390625, -0.17999267578125, -0.1533203125, -0.12664794921875, -0.0999755859375, -0.07330322265625, -0.046630859375, -0.01995849609375, 0.0067138671875, 0.03338623046875, 0.06005859375, 0.08673095703125, 0.1134033203125, 0.14007568359375, 0.166748046875, 0.19342041015625, 0.2200927734375, 0.24676513671875, 0.2734375, 0.30010986328125, 0.3267822265625, 0.35345458984375, 0.380126953125, 0.40679931640625, 0.4334716796875, 0.46014404296875, 0.48681640625, 0.51348876953125, 0.5401611328125, 0.56683349609375, 0.593505859375, 0.62017822265625, 0.6468505859375, 0.67352294921875, 0.7001953125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 5.0, 4.0, 3.0, 8.0, 11.0, 8.0, 17.0, 27.0, 19.0, 39.0, 56.0, 72.0, 117.0, 151.0, 236.0, 385.0, 696.0, 1658.0, 5314.0, 35254.0, 1082986.0, 928109.0, 33370.0, 5209.0, 1559.0, 661.0, 369.0, 231.0, 174.0, 121.0, 68.0, 58.0, 36.0, 41.0, 15.0, 13.0, 8.0, 6.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83203125, -0.8033294677734375, -0.774627685546875, -0.7459259033203125, -0.71722412109375, -0.6885223388671875, -0.659820556640625, -0.6311187744140625, -0.6024169921875, -0.5737152099609375, -0.545013427734375, -0.5163116455078125, -0.48760986328125, -0.4589080810546875, -0.430206298828125, -0.4015045166015625, -0.372802734375, -0.3441009521484375, -0.315399169921875, -0.2866973876953125, -0.25799560546875, -0.2292938232421875, -0.200592041015625, -0.1718902587890625, -0.1431884765625, -0.1144866943359375, -0.085784912109375, -0.0570831298828125, -0.02838134765625, 0.0003204345703125, 0.029022216796875, 0.0577239990234375, 0.08642578125, 0.1151275634765625, 0.143829345703125, 0.1725311279296875, 0.20123291015625, 0.2299346923828125, 0.258636474609375, 0.2873382568359375, 0.3160400390625, 0.3447418212890625, 0.373443603515625, 0.4021453857421875, 0.43084716796875, 0.4595489501953125, 0.488250732421875, 0.5169525146484375, 0.545654296875, 0.5743560791015625, 0.603057861328125, 0.6317596435546875, 0.66046142578125, 0.6891632080078125, 0.717864990234375, 0.7465667724609375, 0.7752685546875, 0.8039703369140625, 0.832672119140625, 0.8613739013671875, 0.89007568359375, 0.9187774658203125, 0.947479248046875, 0.9761810302734375, 1.0048828125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 6.0, 5.0, 10.0, 13.0, 18.0, 27.0, 36.0, 78.0, 108.0, 163.0, 147.0, 124.0, 93.0, 52.0, 27.0, 23.0, 10.0, 10.0, 3.0, 9.0, 10.0, 7.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08514404296875, -0.08214187622070312, -0.07913970947265625, -0.07613754272460938, -0.0731353759765625, -0.07013320922851562, -0.06713104248046875, -0.06412887573242188, -0.061126708984375, -0.058124542236328125, -0.05512237548828125, -0.052120208740234375, -0.0491180419921875, -0.046115875244140625, -0.04311370849609375, -0.040111541748046875, -0.037109375, -0.034107208251953125, -0.03110504150390625, -0.028102874755859375, -0.0251007080078125, -0.022098541259765625, -0.01909637451171875, -0.016094207763671875, -0.013092041015625, -0.010089874267578125, -0.00708770751953125, -0.004085540771484375, -0.0010833740234375, 0.001918792724609375, 0.00492095947265625, 0.007923126220703125, 0.01092529296875, 0.013927459716796875, 0.01692962646484375, 0.019931793212890625, 0.0229339599609375, 0.025936126708984375, 0.02893829345703125, 0.031940460205078125, 0.034942626953125, 0.037944793701171875, 0.04094696044921875, 0.043949127197265625, 0.0469512939453125, 0.049953460693359375, 0.05295562744140625, 0.055957794189453125, 0.0589599609375, 0.061962127685546875, 0.06496429443359375, 0.06796646118164062, 0.0709686279296875, 0.07397079467773438, 0.07697296142578125, 0.07997512817382812, 0.082977294921875, 0.08597946166992188, 0.08898162841796875, 0.09198379516601562, 0.0949859619140625, 0.09798812866210938, 0.10099029541015625, 0.10399246215820312, 0.10699462890625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 11.0, 9.0, 14.0, 13.0, 36.0, 50.0, 78.0, 207.0, 800.0, 8802.0, 1003111.0, 33180.0, 1634.0, 295.0, 128.0, 59.0, 45.0, 18.0, 12.0, 14.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.005859375, -1.949615478515625, -1.89337158203125, -1.837127685546875, -1.7808837890625, -1.724639892578125, -1.66839599609375, -1.612152099609375, -1.555908203125, -1.499664306640625, -1.44342041015625, -1.387176513671875, -1.3309326171875, -1.274688720703125, -1.21844482421875, -1.162200927734375, -1.10595703125, -1.049713134765625, -0.99346923828125, -0.937225341796875, -0.8809814453125, -0.824737548828125, -0.76849365234375, -0.712249755859375, -0.656005859375, -0.599761962890625, -0.54351806640625, -0.487274169921875, -0.4310302734375, -0.374786376953125, -0.31854248046875, -0.262298583984375, -0.2060546875, -0.149810791015625, -0.09356689453125, -0.037322998046875, 0.0189208984375, 0.075164794921875, 0.13140869140625, 0.187652587890625, 0.243896484375, 0.300140380859375, 0.35638427734375, 0.412628173828125, 0.4688720703125, 0.525115966796875, 0.58135986328125, 0.637603759765625, 0.69384765625, 0.750091552734375, 0.80633544921875, 0.862579345703125, 0.9188232421875, 0.975067138671875, 1.03131103515625, 1.087554931640625, 1.143798828125, 1.200042724609375, 1.25628662109375, 1.312530517578125, 1.3687744140625, 1.425018310546875, 1.48126220703125, 1.537506103515625, 1.59375]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 10.0, 11.0, 14.0, 25.0, 10.0, 28.0, 38.0, 44.0, 68.0, 71.0, 79.0, 93.0, 88.0, 87.0, 65.0, 64.0, 40.0, 48.0, 18.0, 20.0, 14.0, 13.0, 19.0, 7.0, 5.0, 0.0, 0.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08038259297609329, -0.07748378813266754, -0.07458499073982239, -0.07168618589639664, -0.06878738105297089, -0.06588858366012573, -0.06298977881669998, -0.06009097397327423, -0.05719217285513878, -0.054293371737003326, -0.051394566893577576, -0.04849576577544212, -0.04559696465730667, -0.04269815981388092, -0.03979935869574547, -0.036900557577610016, -0.034001752734184265, -0.031102949753403664, -0.028204146772623062, -0.02530534565448761, -0.02240654267370701, -0.019507739692926407, -0.016608938574790955, -0.013710135594010353, -0.010811332613229752, -0.00791252963244915, -0.005013727582991123, -0.0021149255335330963, 0.0007838774472475052, 0.0036826804280281067, 0.006581481546163559, 0.00948028452694416, 0.012379094958305359, 0.01527789793908596, 0.018176700919866562, 0.021075502038002014, 0.023974305018782616, 0.026873107999563217, 0.02977190911769867, 0.03267071396112442, 0.03556951507925987, 0.038468316197395325, 0.041367121040821075, 0.04426592215895653, 0.04716472327709198, 0.05006352812051773, 0.05296232923865318, 0.055861130356788635, 0.058759935200214386, 0.06165873631834984, 0.06455753743648529, 0.06745634227991104, 0.07035514712333679, 0.07325394451618195, 0.0761527493596077, 0.07905155420303345, 0.0819503515958786, 0.08484915643930435, 0.0877479538321495, 0.09064675867557526, 0.09354556351900101, 0.09644436836242676, 0.09934316575527191, 0.10224197059869766, 0.10514077544212341]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 1.0, 7.0, 4.0, 10.0, 12.0, 19.0, 8.0, 17.0, 18.0, 16.0, 17.0, 23.0, 25.0, 22.0, 37.0, 35.0, 29.0, 32.0, 32.0, 49.0, 48.0, 55.0, 44.0, 43.0, 42.0, 32.0, 41.0, 35.0, 39.0, 27.0, 27.0, 16.0, 24.0, 17.0, 17.0, 15.0, 14.0, 9.0, 9.0, 7.0, 8.0, 9.0, 4.0, 3.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06886523962020874, -0.06667792797088623, -0.06449062377214432, -0.06230331212282181, -0.0601160041987896, -0.057928696274757385, -0.055741384625434875, -0.053554076701402664, -0.05136676877737045, -0.04917946085333824, -0.04699215292930603, -0.04480484127998352, -0.04261753335595131, -0.0404302254319191, -0.03824291378259659, -0.03605560585856438, -0.033868297934532166, -0.031680990010499954, -0.029493680223822594, -0.027306370437145233, -0.025119062513113022, -0.02293175458908081, -0.02074444480240345, -0.01855713501572609, -0.016369827091693878, -0.014182518236339092, -0.011995209380984306, -0.00980790052562952, -0.0076205916702747345, -0.005433282814919949, -0.0032459739595651627, -0.0010586651042103767, 0.0011286437511444092, 0.003315952606499195, 0.005503261461853981, 0.007690570317208767, 0.009877879172563553, 0.012065188027918339, 0.014252496883273125, 0.016439806669950485, 0.018627114593982697, 0.020814422518014908, 0.02300173230469227, 0.02518904209136963, 0.02737635001540184, 0.02956365793943405, 0.03175096958875656, 0.03393827751278877, 0.036125585436820984, 0.038312893360853195, 0.040500201284885406, 0.042687512934207916, 0.04487482085824013, 0.04706212878227234, 0.04924944043159485, 0.05143674835562706, 0.05362405627965927, 0.05581136420369148, 0.057998672127723694, 0.060185983777046204, 0.062373291701078415, 0.06456059962511063, 0.06674791127443314, 0.06893521547317505, 0.07112252712249756]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 2.0, 9.0, 6.0, 14.0, 21.0, 14.0, 16.0, 15.0, 16.0, 24.0, 27.0, 25.0, 24.0, 28.0, 34.0, 32.0, 34.0, 32.0, 35.0, 47.0, 32.0, 50.0, 53.0, 35.0, 42.0, 34.0, 32.0, 31.0, 35.0, 28.0, 24.0, 17.0, 22.0, 18.0, 20.0, 23.0, 10.0, 4.0, 3.0, 11.0, 7.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.369140625, -1.3306427001953125, -1.292144775390625, -1.2536468505859375, -1.21514892578125, -1.1766510009765625, -1.138153076171875, -1.0996551513671875, -1.0611572265625, -1.0226593017578125, -0.984161376953125, -0.9456634521484375, -0.90716552734375, -0.8686676025390625, -0.830169677734375, -0.7916717529296875, -0.753173828125, -0.7146759033203125, -0.676177978515625, -0.6376800537109375, -0.59918212890625, -0.5606842041015625, -0.522186279296875, -0.4836883544921875, -0.4451904296875, -0.4066925048828125, -0.368194580078125, -0.3296966552734375, -0.29119873046875, -0.2527008056640625, -0.214202880859375, -0.1757049560546875, -0.13720703125, -0.0987091064453125, -0.060211181640625, -0.0217132568359375, 0.01678466796875, 0.0552825927734375, 0.093780517578125, 0.1322784423828125, 0.1707763671875, 0.2092742919921875, 0.247772216796875, 0.2862701416015625, 0.32476806640625, 0.3632659912109375, 0.401763916015625, 0.4402618408203125, 0.478759765625, 0.5172576904296875, 0.555755615234375, 0.5942535400390625, 0.63275146484375, 0.6712493896484375, 0.709747314453125, 0.7482452392578125, 0.7867431640625, 0.8252410888671875, 0.863739013671875, 0.9022369384765625, 0.94073486328125, 0.9792327880859375, 1.017730712890625, 1.0562286376953125, 1.0947265625]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 6.0, 14.0, 7.0, 11.0, 12.0, 30.0, 22.0, 48.0, 53.0, 84.0, 137.0, 182.0, 261.0, 427.0, 609.0, 948.0, 1658.0, 2759.0, 4524.0, 7803.0, 13352.0, 24570.0, 47119.0, 97717.0, 204443.0, 287854.0, 177400.0, 84478.0, 40924.0, 21635.0, 12012.0, 6795.0, 4048.0, 2433.0, 1457.0, 957.0, 610.0, 381.0, 241.0, 164.0, 98.0, 72.0, 58.0, 33.0, 27.0, 19.0, 17.0, 16.0, 9.0, 7.0, 5.0, 6.0, 3.0, 4.0, 2.0, 0.0, 3.0], "bins": [-1.908203125, -1.84930419921875, -1.7904052734375, -1.73150634765625, -1.672607421875, -1.61370849609375, -1.5548095703125, -1.49591064453125, -1.43701171875, -1.37811279296875, -1.3192138671875, -1.26031494140625, -1.201416015625, -1.14251708984375, -1.0836181640625, -1.02471923828125, -0.9658203125, -0.90692138671875, -0.8480224609375, -0.78912353515625, -0.730224609375, -0.67132568359375, -0.6124267578125, -0.55352783203125, -0.49462890625, -0.43572998046875, -0.3768310546875, -0.31793212890625, -0.259033203125, -0.20013427734375, -0.1412353515625, -0.08233642578125, -0.0234375, 0.03546142578125, 0.0943603515625, 0.15325927734375, 0.212158203125, 0.27105712890625, 0.3299560546875, 0.38885498046875, 0.44775390625, 0.50665283203125, 0.5655517578125, 0.62445068359375, 0.683349609375, 0.74224853515625, 0.8011474609375, 0.86004638671875, 0.9189453125, 0.97784423828125, 1.0367431640625, 1.09564208984375, 1.154541015625, 1.21343994140625, 1.2723388671875, 1.33123779296875, 1.39013671875, 1.44903564453125, 1.5079345703125, 1.56683349609375, 1.625732421875, 1.68463134765625, 1.7435302734375, 1.80242919921875, 1.861328125]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 3.0, 7.0, 6.0, 11.0, 8.0, 12.0, 16.0, 11.0, 19.0, 16.0, 24.0, 27.0, 30.0, 24.0, 34.0, 34.0, 47.0, 52.0, 83.0, 85.0, 149.0, 237.0, 1311.0, 188.0, 134.0, 88.0, 62.0, 60.0, 37.0, 37.0, 26.0, 26.0, 22.0, 21.0, 25.0, 12.0, 9.0, 8.0, 10.0, 12.0, 6.0, 3.0, 4.0, 2.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.681640625, -3.567596435546875, -3.45355224609375, -3.339508056640625, -3.2254638671875, -3.111419677734375, -2.99737548828125, -2.883331298828125, -2.769287109375, -2.655242919921875, -2.54119873046875, -2.427154541015625, -2.3131103515625, -2.199066162109375, -2.08502197265625, -1.970977783203125, -1.85693359375, -1.742889404296875, -1.62884521484375, -1.514801025390625, -1.4007568359375, -1.286712646484375, -1.17266845703125, -1.058624267578125, -0.944580078125, -0.830535888671875, -0.71649169921875, -0.602447509765625, -0.4884033203125, -0.374359130859375, -0.26031494140625, -0.146270751953125, -0.0322265625, 0.081817626953125, 0.19586181640625, 0.309906005859375, 0.4239501953125, 0.537994384765625, 0.65203857421875, 0.766082763671875, 0.880126953125, 0.994171142578125, 1.10821533203125, 1.222259521484375, 1.3363037109375, 1.450347900390625, 1.56439208984375, 1.678436279296875, 1.79248046875, 1.906524658203125, 2.02056884765625, 2.134613037109375, 2.2486572265625, 2.362701416015625, 2.47674560546875, 2.590789794921875, 2.704833984375, 2.818878173828125, 2.93292236328125, 3.046966552734375, 3.1610107421875, 3.275054931640625, 3.38909912109375, 3.503143310546875, 3.6171875]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 8.0, 0.0, 5.0, 11.0, 16.0, 17.0, 28.0, 34.0, 31.0, 43.0, 64.0, 110.0, 140.0, 245.0, 336.0, 516.0, 1193.0, 5631.0, 103549.0, 2798205.0, 223505.0, 8754.0, 1443.0, 601.0, 382.0, 250.0, 169.0, 113.0, 76.0, 58.0, 45.0, 37.0, 29.0, 20.0, 9.0, 12.0, 9.0, 8.0, 5.0, 1.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.078125, -9.7689208984375, -9.459716796875, -9.1505126953125, -8.84130859375, -8.5321044921875, -8.222900390625, -7.9136962890625, -7.6044921875, -7.2952880859375, -6.986083984375, -6.6768798828125, -6.36767578125, -6.0584716796875, -5.749267578125, -5.4400634765625, -5.130859375, -4.8216552734375, -4.512451171875, -4.2032470703125, -3.89404296875, -3.5848388671875, -3.275634765625, -2.9664306640625, -2.6572265625, -2.3480224609375, -2.038818359375, -1.7296142578125, -1.42041015625, -1.1112060546875, -0.802001953125, -0.4927978515625, -0.18359375, 0.1256103515625, 0.434814453125, 0.7440185546875, 1.05322265625, 1.3624267578125, 1.671630859375, 1.9808349609375, 2.2900390625, 2.5992431640625, 2.908447265625, 3.2176513671875, 3.52685546875, 3.8360595703125, 4.145263671875, 4.4544677734375, 4.763671875, 5.0728759765625, 5.382080078125, 5.6912841796875, 6.00048828125, 6.3096923828125, 6.618896484375, 6.9281005859375, 7.2373046875, 7.5465087890625, 7.855712890625, 8.1649169921875, 8.47412109375, 8.7833251953125, 9.092529296875, 9.4017333984375, 9.7109375]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 11.0, 11.0, 24.0, 50.0, 97.0, 175.0, 192.0, 168.0, 131.0, 90.0, 30.0, 25.0, 10.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.726999282836914, -8.23893928527832, -7.750879287719727, -7.262819290161133, -6.774759292602539, -6.286699295043945, -5.79863977432251, -5.310579776763916, -4.822519779205322, -4.3344597816467285, -3.8463997840881348, -3.35834002494812, -2.8702800273895264, -2.3822200298309326, -1.894160270690918, -1.4061002731323242, -0.9180402755737305, -0.4299803376197815, 0.05807960033416748, 0.5461394786834717, 1.0341994762420654, 1.5222594738006592, 2.010319232940674, 2.4983792304992676, 2.9864392280578613, 3.474499225616455, 3.962559223175049, 4.450618743896484, 4.938678741455078, 5.426738739013672, 5.914798736572266, 6.402858734130859, 6.890918731689453, 7.378978729248047, 7.867038726806641, 8.355098724365234, 8.843158721923828, 9.331218719482422, 9.819278717041016, 10.30733871459961, 10.795398712158203, 11.283458709716797, 11.77151870727539, 12.259578704833984, 12.747638702392578, 13.235698699951172, 13.723758697509766, 14.21181869506836, 14.699877738952637, 15.18793773651123, 15.675997734069824, 16.1640567779541, 16.652116775512695, 17.14017677307129, 17.628236770629883, 18.116296768188477, 18.60435676574707, 19.092416763305664, 19.580476760864258, 20.06853675842285, 20.556596755981445, 21.04465675354004, 21.532716751098633, 22.020776748657227, 22.50883674621582]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 3.0, 4.0, 1.0, 4.0, 9.0, 14.0, 15.0, 16.0, 6.0, 25.0, 16.0, 31.0, 20.0, 30.0, 30.0, 33.0, 39.0, 41.0, 46.0, 41.0, 35.0, 52.0, 40.0, 49.0, 50.0, 35.0, 35.0, 37.0, 29.0, 34.0, 27.0, 23.0, 28.0, 19.0, 18.0, 16.0, 13.0, 12.0, 8.0, 4.0, 3.0, 4.0, 5.0, 2.0, 5.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.53671646118164, -10.225370407104492, -9.91402530670166, -9.602679252624512, -9.291333198547363, -8.979988098144531, -8.668642044067383, -8.357295989990234, -8.045949935913086, -7.734604358673096, -7.423258304595947, -7.111912727355957, -6.800566673278809, -6.489221096038818, -6.177875518798828, -5.86652946472168, -5.555184364318848, -5.243838787078857, -4.932492733001709, -4.621147155761719, -4.30980110168457, -3.99845552444458, -3.68710994720459, -3.3757641315460205, -3.064418315887451, -2.753072500228882, -2.4417266845703125, -2.1303811073303223, -1.819035291671753, -1.5076894760131836, -1.1963437795639038, -0.884998083114624, -0.5736532211303711, -0.26230746507644653, 0.04903829097747803, 0.3603840470314026, 0.6717298030853271, 0.9830756187438965, 1.2944213151931763, 1.605767011642456, 1.9171128273010254, 2.2284586429595947, 2.539804458618164, 2.8511500358581543, 3.1624958515167236, 3.473841667175293, 3.785187244415283, 4.096532821655273, 4.407878875732422, 4.719224452972412, 5.0305705070495605, 5.341916084289551, 5.653262138366699, 5.9646077156066895, 6.27595329284668, 6.587299346923828, 6.898644924163818, 7.209990501403809, 7.521336555480957, 7.832682132720947, 8.144027709960938, 8.455373764038086, 8.766719818115234, 9.078064918518066, 9.389410972595215]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 8.0, 6.0, 6.0, 7.0, 11.0, 21.0, 18.0, 14.0, 30.0, 20.0, 9.0, 25.0, 24.0, 32.0, 27.0, 40.0, 24.0, 30.0, 40.0, 37.0, 36.0, 44.0, 38.0, 41.0, 43.0, 26.0, 42.0, 34.0, 31.0, 34.0, 31.0, 25.0, 23.0, 23.0, 17.0, 15.0, 18.0, 11.0, 7.0, 5.0, 9.0, 5.0, 1.0, 7.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-1.4345703125, -1.39483642578125, -1.3551025390625, -1.31536865234375, -1.275634765625, -1.23590087890625, -1.1961669921875, -1.15643310546875, -1.11669921875, -1.07696533203125, -1.0372314453125, -0.99749755859375, -0.957763671875, -0.91802978515625, -0.8782958984375, -0.83856201171875, -0.798828125, -0.75909423828125, -0.7193603515625, -0.67962646484375, -0.639892578125, -0.60015869140625, -0.5604248046875, -0.52069091796875, -0.48095703125, -0.44122314453125, -0.4014892578125, -0.36175537109375, -0.322021484375, -0.28228759765625, -0.2425537109375, -0.20281982421875, -0.1630859375, -0.12335205078125, -0.0836181640625, -0.04388427734375, -0.004150390625, 0.03558349609375, 0.0753173828125, 0.11505126953125, 0.15478515625, 0.19451904296875, 0.2342529296875, 0.27398681640625, 0.313720703125, 0.35345458984375, 0.3931884765625, 0.43292236328125, 0.47265625, 0.51239013671875, 0.5521240234375, 0.59185791015625, 0.631591796875, 0.67132568359375, 0.7110595703125, 0.75079345703125, 0.79052734375, 0.83026123046875, 0.8699951171875, 0.90972900390625, 0.949462890625, 0.98919677734375, 1.0289306640625, 1.06866455078125, 1.1083984375]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 9.0, 5.0, 8.0, 13.0, 15.0, 31.0, 50.0, 68.0, 77.0, 105.0, 179.0, 263.0, 368.0, 560.0, 926.0, 1520.0, 2452.0, 4709.0, 9217.0, 20768.0, 54775.0, 179067.0, 730709.0, 1900862.0, 941479.0, 232653.0, 67023.0, 24225.0, 10299.0, 4939.0, 2678.0, 1599.0, 933.0, 586.0, 378.0, 267.0, 152.0, 114.0, 73.0, 45.0, 38.0, 25.0, 8.0, 6.0, 9.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.572265625, -2.5019683837890625, -2.431671142578125, -2.3613739013671875, -2.29107666015625, -2.2207794189453125, -2.150482177734375, -2.0801849365234375, -2.0098876953125, -1.9395904541015625, -1.869293212890625, -1.7989959716796875, -1.72869873046875, -1.6584014892578125, -1.588104248046875, -1.5178070068359375, -1.447509765625, -1.3772125244140625, -1.306915283203125, -1.2366180419921875, -1.16632080078125, -1.0960235595703125, -1.025726318359375, -0.9554290771484375, -0.8851318359375, -0.8148345947265625, -0.744537353515625, -0.6742401123046875, -0.60394287109375, -0.5336456298828125, -0.463348388671875, -0.3930511474609375, -0.32275390625, -0.2524566650390625, -0.182159423828125, -0.1118621826171875, -0.04156494140625, 0.0287322998046875, 0.099029541015625, 0.1693267822265625, 0.2396240234375, 0.3099212646484375, 0.380218505859375, 0.4505157470703125, 0.52081298828125, 0.5911102294921875, 0.661407470703125, 0.7317047119140625, 0.802001953125, 0.8722991943359375, 0.942596435546875, 1.0128936767578125, 1.08319091796875, 1.1534881591796875, 1.223785400390625, 1.2940826416015625, 1.3643798828125, 1.4346771240234375, 1.504974365234375, 1.5752716064453125, 1.64556884765625, 1.7158660888671875, 1.786163330078125, 1.8564605712890625, 1.9267578125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 8.0, 6.0, 7.0, 13.0, 8.0, 11.0, 12.0, 33.0, 37.0, 47.0, 57.0, 70.0, 100.0, 117.0, 140.0, 220.0, 260.0, 358.0, 382.0, 438.0, 369.0, 320.0, 259.0, 183.0, 136.0, 112.0, 81.0, 55.0, 51.0, 39.0, 43.0, 22.0, 18.0, 20.0, 9.0, 12.0, 4.0, 3.0, 9.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.259765625, -2.189666748046875, -2.11956787109375, -2.049468994140625, -1.9793701171875, -1.909271240234375, -1.83917236328125, -1.769073486328125, -1.698974609375, -1.628875732421875, -1.55877685546875, -1.488677978515625, -1.4185791015625, -1.348480224609375, -1.27838134765625, -1.208282470703125, -1.13818359375, -1.068084716796875, -0.99798583984375, -0.927886962890625, -0.8577880859375, -0.787689208984375, -0.71759033203125, -0.647491455078125, -0.577392578125, -0.507293701171875, -0.43719482421875, -0.367095947265625, -0.2969970703125, -0.226898193359375, -0.15679931640625, -0.086700439453125, -0.0166015625, 0.053497314453125, 0.12359619140625, 0.193695068359375, 0.2637939453125, 0.333892822265625, 0.40399169921875, 0.474090576171875, 0.544189453125, 0.614288330078125, 0.68438720703125, 0.754486083984375, 0.8245849609375, 0.894683837890625, 0.96478271484375, 1.034881591796875, 1.10498046875, 1.175079345703125, 1.24517822265625, 1.315277099609375, 1.3853759765625, 1.455474853515625, 1.52557373046875, 1.595672607421875, 1.665771484375, 1.735870361328125, 1.80596923828125, 1.876068115234375, 1.9461669921875, 2.016265869140625, 2.08636474609375, 2.156463623046875, 2.2265625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 8.0, 7.0, 16.0, 12.0, 22.0, 19.0, 39.0, 43.0, 68.0, 55.0, 91.0, 126.0, 185.0, 315.0, 693.0, 2569.0, 19295.0, 302266.0, 3512994.0, 330330.0, 20655.0, 2717.0, 704.0, 289.0, 220.0, 128.0, 106.0, 72.0, 76.0, 49.0, 28.0, 18.0, 20.0, 10.0, 10.0, 6.0, 5.0, 4.0, 5.0, 1.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-8.90625, -8.648193359375, -8.39013671875, -8.132080078125, -7.8740234375, -7.615966796875, -7.35791015625, -7.099853515625, -6.841796875, -6.583740234375, -6.32568359375, -6.067626953125, -5.8095703125, -5.551513671875, -5.29345703125, -5.035400390625, -4.77734375, -4.519287109375, -4.26123046875, -4.003173828125, -3.7451171875, -3.487060546875, -3.22900390625, -2.970947265625, -2.712890625, -2.454833984375, -2.19677734375, -1.938720703125, -1.6806640625, -1.422607421875, -1.16455078125, -0.906494140625, -0.6484375, -0.390380859375, -0.13232421875, 0.125732421875, 0.3837890625, 0.641845703125, 0.89990234375, 1.157958984375, 1.416015625, 1.674072265625, 1.93212890625, 2.190185546875, 2.4482421875, 2.706298828125, 2.96435546875, 3.222412109375, 3.48046875, 3.738525390625, 3.99658203125, 4.254638671875, 4.5126953125, 4.770751953125, 5.02880859375, 5.286865234375, 5.544921875, 5.802978515625, 6.06103515625, 6.319091796875, 6.5771484375, 6.835205078125, 7.09326171875, 7.351318359375, 7.609375]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 9.0, 18.0, 42.0, 78.0, 126.0, 184.0, 190.0, 143.0, 109.0, 54.0, 31.0, 16.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.8051118850708, -13.044912338256836, -12.284713745117188, -11.524514198303223, -10.764315605163574, -10.00411605834961, -9.243917465209961, -8.483717918395996, -7.7235188484191895, -6.963319778442383, -6.203120708465576, -5.4429216384887695, -4.682722091674805, -3.922523260116577, -3.1623239517211914, -2.4021248817443848, -1.6419258117675781, -0.8817266821861267, -0.12152755260467529, 0.6386716365814209, 1.3988707065582275, 2.159069776535034, 2.91926908493042, 3.6794681549072266, 4.439667224884033, 5.19986629486084, 5.9600653648376465, 6.720264434814453, 7.480463981628418, 8.240662574768066, 9.000862121582031, 9.76106071472168, 10.521261215209961, 11.281460762023926, 12.041659355163574, 12.801858901977539, 13.562057495117188, 14.322257041931152, 15.082456588745117, 15.842655181884766, 16.602853775024414, 17.363052368164062, 18.123252868652344, 18.883451461791992, 19.64365005493164, 20.40384864807129, 21.16404914855957, 21.92424774169922, 22.6844482421875, 23.44464683532715, 24.20484733581543, 24.965045928955078, 25.725244522094727, 26.485443115234375, 27.245643615722656, 28.005842208862305, 28.766040802001953, 29.5262393951416, 30.286439895629883, 31.04663848876953, 31.80683708190918, 32.56703567504883, 33.32723617553711, 34.087432861328125, 34.847633361816406]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 0.0, 4.0, 5.0, 6.0, 9.0, 13.0, 11.0, 10.0, 11.0, 21.0, 17.0, 23.0, 23.0, 29.0, 27.0, 31.0, 45.0, 26.0, 35.0, 29.0, 44.0, 39.0, 47.0, 35.0, 41.0, 41.0, 24.0, 39.0, 39.0, 28.0, 24.0, 37.0, 20.0, 17.0, 26.0, 24.0, 17.0, 18.0, 11.0, 13.0, 8.0, 9.0, 2.0, 4.0, 6.0, 5.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.213454246520996, -6.97361946105957, -6.733785152435303, -6.493950366973877, -6.254115581512451, -6.014281272888184, -5.774446487426758, -5.534611701965332, -5.294776916503906, -5.0549421310424805, -4.815107822418213, -4.575273036956787, -4.335438251495361, -4.095603942871094, -3.855769157409668, -3.615934371948242, -3.3760998249053955, -3.136265277862549, -2.896430492401123, -2.6565959453582764, -2.4167611598968506, -2.176926612854004, -1.9370919466018677, -1.6972572803497314, -1.4574226140975952, -1.217587947845459, -0.9777532815933228, -0.7379186749458313, -0.49808400869369507, -0.2582494020462036, -0.018414735794067383, 0.22141993045806885, 0.4612545967102051, 0.7010892629623413, 0.9409239292144775, 1.1807584762573242, 1.42059326171875, 1.6604278087615967, 1.900262475013733, 2.140097141265869, 2.379931926727295, 2.6197664737701416, 2.8596012592315674, 3.099435806274414, 3.33927059173584, 3.5791051387786865, 3.818939685821533, 4.058774471282959, 4.298608779907227, 4.538443565368652, 4.77827787399292, 5.018112659454346, 5.2579474449157715, 5.497781753540039, 5.737616539001465, 5.977451324462891, 6.217286109924316, 6.457120895385742, 6.69695520401001, 6.9367899894714355, 7.176624774932861, 7.416459083557129, 7.656293869018555, 7.8961286544799805, 8.135963439941406]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 4.0, 14.0, 6.0, 7.0, 8.0, 13.0, 20.0, 16.0, 17.0, 15.0, 18.0, 23.0, 24.0, 22.0, 33.0, 31.0, 33.0, 33.0, 30.0, 41.0, 35.0, 43.0, 41.0, 40.0, 28.0, 25.0, 38.0, 37.0, 36.0, 32.0, 33.0, 34.0, 24.0, 23.0, 21.0, 15.0, 20.0, 13.0, 8.0, 13.0, 8.0, 4.0, 5.0, 2.0, 5.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.2734375, -1.235992431640625, -1.19854736328125, -1.161102294921875, -1.1236572265625, -1.086212158203125, -1.04876708984375, -1.011322021484375, -0.973876953125, -0.936431884765625, -0.89898681640625, -0.861541748046875, -0.8240966796875, -0.786651611328125, -0.74920654296875, -0.711761474609375, -0.67431640625, -0.636871337890625, -0.59942626953125, -0.561981201171875, -0.5245361328125, -0.487091064453125, -0.44964599609375, -0.412200927734375, -0.374755859375, -0.337310791015625, -0.29986572265625, -0.262420654296875, -0.2249755859375, -0.187530517578125, -0.15008544921875, -0.112640380859375, -0.0751953125, -0.037750244140625, -0.00030517578125, 0.037139892578125, 0.0745849609375, 0.112030029296875, 0.14947509765625, 0.186920166015625, 0.224365234375, 0.261810302734375, 0.29925537109375, 0.336700439453125, 0.3741455078125, 0.411590576171875, 0.44903564453125, 0.486480712890625, 0.52392578125, 0.561370849609375, 0.59881591796875, 0.636260986328125, 0.6737060546875, 0.711151123046875, 0.74859619140625, 0.786041259765625, 0.823486328125, 0.860931396484375, 0.89837646484375, 0.935821533203125, 0.9732666015625, 1.010711669921875, 1.04815673828125, 1.085601806640625, 1.123046875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 6.0, 11.0, 14.0, 28.0, 30.0, 51.0, 58.0, 87.0, 125.0, 178.0, 332.0, 575.0, 1007.0, 1896.0, 3641.0, 6957.0, 14167.0, 30153.0, 70361.0, 168643.0, 306942.0, 244997.0, 110792.0, 46121.0, 20512.0, 9823.0, 5031.0, 2670.0, 1460.0, 736.0, 441.0, 218.0, 159.0, 107.0, 71.0, 44.0, 29.0, 21.0, 14.0, 12.0, 13.0, 2.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.416015625, -0.40404510498046875, -0.3920745849609375, -0.38010406494140625, -0.368133544921875, -0.35616302490234375, -0.3441925048828125, -0.33222198486328125, -0.32025146484375, -0.30828094482421875, -0.2963104248046875, -0.28433990478515625, -0.272369384765625, -0.26039886474609375, -0.2484283447265625, -0.23645782470703125, -0.2244873046875, -0.21251678466796875, -0.2005462646484375, -0.18857574462890625, -0.176605224609375, -0.16463470458984375, -0.1526641845703125, -0.14069366455078125, -0.12872314453125, -0.11675262451171875, -0.1047821044921875, -0.09281158447265625, -0.080841064453125, -0.06887054443359375, -0.0569000244140625, -0.04492950439453125, -0.032958984375, -0.02098846435546875, -0.0090179443359375, 0.00295257568359375, 0.014923095703125, 0.02689361572265625, 0.0388641357421875, 0.05083465576171875, 0.06280517578125, 0.07477569580078125, 0.0867462158203125, 0.09871673583984375, 0.110687255859375, 0.12265777587890625, 0.1346282958984375, 0.14659881591796875, 0.1585693359375, 0.17053985595703125, 0.1825103759765625, 0.19448089599609375, 0.206451416015625, 0.21842193603515625, 0.2303924560546875, 0.24236297607421875, 0.25433349609375, 0.26630401611328125, 0.2782745361328125, 0.29024505615234375, 0.302215576171875, 0.31418609619140625, 0.3261566162109375, 0.33812713623046875, 0.35009765625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 9.0, 1.0, 9.0, 5.0, 16.0, 22.0, 15.0, 13.0, 15.0, 15.0, 25.0, 22.0, 34.0, 32.0, 19.0, 26.0, 25.0, 24.0, 26.0, 43.0, 36.0, 45.0, 1066.0, 42.0, 31.0, 34.0, 34.0, 38.0, 31.0, 39.0, 25.0, 23.0, 20.0, 18.0, 23.0, 17.0, 10.0, 16.0, 15.0, 12.0, 12.0, 9.0, 9.0, 9.0, 2.0, 3.0, 4.0, 2.0, 0.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7763671875, -0.7516937255859375, -0.727020263671875, -0.7023468017578125, -0.67767333984375, -0.6529998779296875, -0.628326416015625, -0.6036529541015625, -0.5789794921875, -0.5543060302734375, -0.529632568359375, -0.5049591064453125, -0.48028564453125, -0.4556121826171875, -0.430938720703125, -0.4062652587890625, -0.381591796875, -0.3569183349609375, -0.332244873046875, -0.3075714111328125, -0.28289794921875, -0.2582244873046875, -0.233551025390625, -0.2088775634765625, -0.1842041015625, -0.1595306396484375, -0.134857177734375, -0.1101837158203125, -0.08551025390625, -0.0608367919921875, -0.036163330078125, -0.0114898681640625, 0.01318359375, 0.0378570556640625, 0.062530517578125, 0.0872039794921875, 0.11187744140625, 0.1365509033203125, 0.161224365234375, 0.1858978271484375, 0.2105712890625, 0.2352447509765625, 0.259918212890625, 0.2845916748046875, 0.30926513671875, 0.3339385986328125, 0.358612060546875, 0.3832855224609375, 0.407958984375, 0.4326324462890625, 0.457305908203125, 0.4819793701171875, 0.50665283203125, 0.5313262939453125, 0.555999755859375, 0.5806732177734375, 0.6053466796875, 0.6300201416015625, 0.654693603515625, 0.6793670654296875, 0.70404052734375, 0.7287139892578125, 0.753387451171875, 0.7780609130859375, 0.802734375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 8.0, 8.0, 14.0, 20.0, 16.0, 26.0, 57.0, 60.0, 93.0, 127.0, 177.0, 324.0, 475.0, 828.0, 1353.0, 2450.0, 5056.0, 11692.0, 31100.0, 95022.0, 347009.0, 1267426.0, 225441.0, 66767.0, 23206.0, 9224.0, 4051.0, 2109.0, 1143.0, 689.0, 372.0, 254.0, 165.0, 104.0, 80.0, 58.0, 28.0, 28.0, 17.0, 19.0, 11.0, 7.0, 3.0, 7.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.295166015625, -0.28631591796875, -0.2774658203125, -0.26861572265625, -0.259765625, -0.25091552734375, -0.2420654296875, -0.23321533203125, -0.224365234375, -0.21551513671875, -0.2066650390625, -0.19781494140625, -0.18896484375, -0.18011474609375, -0.1712646484375, -0.16241455078125, -0.153564453125, -0.14471435546875, -0.1358642578125, -0.12701416015625, -0.1181640625, -0.10931396484375, -0.1004638671875, -0.09161376953125, -0.082763671875, -0.07391357421875, -0.0650634765625, -0.05621337890625, -0.04736328125, -0.03851318359375, -0.0296630859375, -0.02081298828125, -0.011962890625, -0.00311279296875, 0.0057373046875, 0.01458740234375, 0.0234375, 0.03228759765625, 0.0411376953125, 0.04998779296875, 0.058837890625, 0.06768798828125, 0.0765380859375, 0.08538818359375, 0.09423828125, 0.10308837890625, 0.1119384765625, 0.12078857421875, 0.129638671875, 0.13848876953125, 0.1473388671875, 0.15618896484375, 0.1650390625, 0.17388916015625, 0.1827392578125, 0.19158935546875, 0.200439453125, 0.20928955078125, 0.2181396484375, 0.22698974609375, 0.23583984375, 0.24468994140625, 0.2535400390625, 0.26239013671875, 0.271240234375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 6.0, 10.0, 14.0, 22.0, 35.0, 39.0, 57.0, 70.0, 88.0, 109.0, 125.0, 95.0, 86.0, 59.0, 49.0, 26.0, 30.0, 19.0, 11.0, 14.0, 7.0, 4.0, 2.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.054901123046875, -0.05345773696899414, -0.05201435089111328, -0.05057096481323242, -0.04912757873535156, -0.0476841926574707, -0.046240806579589844, -0.044797420501708984, -0.043354034423828125, -0.041910648345947266, -0.040467262268066406, -0.03902387619018555, -0.03758049011230469, -0.03613710403442383, -0.03469371795654297, -0.03325033187866211, -0.03180694580078125, -0.03036355972290039, -0.02892017364501953, -0.027476787567138672, -0.026033401489257812, -0.024590015411376953, -0.023146629333496094, -0.021703243255615234, -0.020259857177734375, -0.018816471099853516, -0.017373085021972656, -0.015929698944091797, -0.014486312866210938, -0.013042926788330078, -0.011599540710449219, -0.01015615463256836, -0.0087127685546875, -0.007269382476806641, -0.005825996398925781, -0.004382610321044922, -0.0029392242431640625, -0.0014958381652832031, -5.245208740234375e-05, 0.0013909339904785156, 0.002834320068359375, 0.004277706146240234, 0.005721092224121094, 0.007164478302001953, 0.008607864379882812, 0.010051250457763672, 0.011494636535644531, 0.01293802261352539, 0.01438140869140625, 0.01582479476928711, 0.01726818084716797, 0.018711566925048828, 0.020154953002929688, 0.021598339080810547, 0.023041725158691406, 0.024485111236572266, 0.025928497314453125, 0.027371883392333984, 0.028815269470214844, 0.030258655548095703, 0.03170204162597656, 0.03314542770385742, 0.03458881378173828, 0.03603219985961914, 0.0374755859375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 14.0, 19.0, 31.0, 58.0, 102.0, 315.0, 3480.0, 1031884.0, 11876.0, 494.0, 127.0, 60.0, 38.0, 22.0, 10.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3291015625, -1.2810211181640625, -1.232940673828125, -1.1848602294921875, -1.13677978515625, -1.0886993408203125, -1.040618896484375, -0.9925384521484375, -0.9444580078125, -0.8963775634765625, -0.848297119140625, -0.8002166748046875, -0.75213623046875, -0.7040557861328125, -0.655975341796875, -0.6078948974609375, -0.559814453125, -0.5117340087890625, -0.463653564453125, -0.4155731201171875, -0.36749267578125, -0.3194122314453125, -0.271331787109375, -0.2232513427734375, -0.1751708984375, -0.1270904541015625, -0.079010009765625, -0.0309295654296875, 0.01715087890625, 0.0652313232421875, 0.113311767578125, 0.1613922119140625, 0.20947265625, 0.2575531005859375, 0.305633544921875, 0.3537139892578125, 0.40179443359375, 0.4498748779296875, 0.497955322265625, 0.5460357666015625, 0.5941162109375, 0.6421966552734375, 0.690277099609375, 0.7383575439453125, 0.78643798828125, 0.8345184326171875, 0.882598876953125, 0.9306793212890625, 0.978759765625, 1.0268402099609375, 1.074920654296875, 1.1230010986328125, 1.17108154296875, 1.2191619873046875, 1.267242431640625, 1.3153228759765625, 1.3634033203125, 1.4114837646484375, 1.459564208984375, 1.5076446533203125, 1.55572509765625, 1.6038055419921875, 1.651885986328125, 1.6999664306640625, 1.748046875]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 14.0, 36.0, 41.0, 93.0, 174.0, 222.0, 175.0, 104.0, 76.0, 34.0, 25.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1687709540128708, -0.16461357474327087, -0.16045618057250977, -0.15629880130290985, -0.15214142203330994, -0.14798404276371002, -0.1438266634941101, -0.139669269323349, -0.13551189005374908, -0.13135451078414917, -0.12719711661338806, -0.12303973734378815, -0.11888235807418823, -0.11472497880458832, -0.1105675920844078, -0.1064102053642273, -0.10225282609462738, -0.09809544682502747, -0.09393806010484695, -0.08978067338466644, -0.08562329411506653, -0.08146591484546661, -0.0773085281252861, -0.07315114140510559, -0.06899376213550568, -0.06483638286590576, -0.06067899614572525, -0.05652161315083504, -0.052364230155944824, -0.04820684716105461, -0.0440494641661644, -0.039892081171274185, -0.035734690725803375, -0.03157730773091316, -0.02741992473602295, -0.023262541741132736, -0.019105158746242523, -0.01494777575135231, -0.010790392756462097, -0.006633009761571884, -0.002475626766681671, 0.0016817562282085419, 0.005839139223098755, 0.009996522217988968, 0.014153905212879181, 0.018311288207769394, 0.022468671202659607, 0.02662605419754982, 0.030783437192440033, 0.034940820187330246, 0.03909820318222046, 0.04325558617711067, 0.047412969172000885, 0.0515703521668911, 0.05572773516178131, 0.059885118156671524, 0.06404250115156174, 0.06819988787174225, 0.07235726714134216, 0.07651464641094208, 0.08067203313112259, 0.0848294198513031, 0.08898679912090302, 0.09314417839050293, 0.09730156511068344]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 2.0, 5.0, 6.0, 6.0, 6.0, 12.0, 10.0, 6.0, 20.0, 19.0, 26.0, 29.0, 31.0, 21.0, 31.0, 29.0, 41.0, 39.0, 37.0, 47.0, 42.0, 47.0, 36.0, 46.0, 45.0, 49.0, 47.0, 44.0, 22.0, 35.0, 26.0, 17.0, 19.0, 17.0, 18.0, 12.0, 16.0, 6.0, 6.0, 6.0, 11.0, 7.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0368427038192749, -0.035757970064878464, -0.034673236310482025, -0.03358850255608559, -0.03250376880168915, -0.03141903504729271, -0.03033430129289627, -0.029249567538499832, -0.028164833784103394, -0.027080100029706955, -0.025995366275310516, -0.024910632520914078, -0.02382589876651764, -0.0227411650121212, -0.021656431257724762, -0.020571697503328323, -0.019486963748931885, -0.018402229994535446, -0.017317496240139008, -0.01623276248574257, -0.01514802873134613, -0.014063294976949692, -0.012978561222553253, -0.011893827468156815, -0.010809093713760376, -0.009724359959363937, -0.008639626204967499, -0.00755489245057106, -0.006470158696174622, -0.005385424941778183, -0.004300691187381744, -0.003215957432985306, -0.002131223678588867, -0.0010464899241924286, 3.824383020401001e-05, 0.0011229775846004486, 0.002207711338996887, 0.003292445093393326, 0.004377178847789764, 0.005461912602186203, 0.006546646356582642, 0.00763138011097908, 0.008716113865375519, 0.009800847619771957, 0.010885581374168396, 0.011970315128564835, 0.013055048882961273, 0.014139782637357712, 0.01522451639175415, 0.01630925014615059, 0.017393983900547028, 0.018478717654943466, 0.019563451409339905, 0.020648185163736343, 0.021732918918132782, 0.02281765267252922, 0.02390238642692566, 0.024987120181322098, 0.026071853935718536, 0.027156587690114975, 0.028241321444511414, 0.029326055198907852, 0.03041078895330429, 0.03149552270770073, 0.03258025646209717]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 4.0, 14.0, 6.0, 8.0, 9.0, 13.0, 17.0, 17.0, 17.0, 14.0, 19.0, 24.0, 22.0, 24.0, 31.0, 33.0, 32.0, 33.0, 29.0, 42.0, 36.0, 40.0, 42.0, 40.0, 30.0, 26.0, 36.0, 39.0, 36.0, 31.0, 31.0, 35.0, 23.0, 25.0, 21.0, 14.0, 21.0, 12.0, 8.0, 13.0, 8.0, 4.0, 5.0, 2.0, 7.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.2724609375, -1.2350311279296875, -1.197601318359375, -1.1601715087890625, -1.12274169921875, -1.0853118896484375, -1.047882080078125, -1.0104522705078125, -0.9730224609375, -0.9355926513671875, -0.898162841796875, -0.8607330322265625, -0.82330322265625, -0.7858734130859375, -0.748443603515625, -0.7110137939453125, -0.673583984375, -0.6361541748046875, -0.598724365234375, -0.5612945556640625, -0.52386474609375, -0.4864349365234375, -0.449005126953125, -0.4115753173828125, -0.3741455078125, -0.3367156982421875, -0.299285888671875, -0.2618560791015625, -0.22442626953125, -0.1869964599609375, -0.149566650390625, -0.1121368408203125, -0.07470703125, -0.0372772216796875, 0.000152587890625, 0.0375823974609375, 0.07501220703125, 0.1124420166015625, 0.149871826171875, 0.1873016357421875, 0.2247314453125, 0.2621612548828125, 0.299591064453125, 0.3370208740234375, 0.37445068359375, 0.4118804931640625, 0.449310302734375, 0.4867401123046875, 0.524169921875, 0.5615997314453125, 0.599029541015625, 0.6364593505859375, 0.67388916015625, 0.7113189697265625, 0.748748779296875, 0.7861785888671875, 0.8236083984375, 0.8610382080078125, 0.898468017578125, 0.9358978271484375, 0.97332763671875, 1.0107574462890625, 1.048187255859375, 1.0856170654296875, 1.123046875]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 11.0, 12.0, 7.0, 13.0, 20.0, 32.0, 65.0, 64.0, 131.0, 199.0, 363.0, 534.0, 889.0, 1569.0, 2748.0, 4964.0, 8840.0, 15606.0, 29596.0, 56622.0, 108904.0, 205529.0, 262868.0, 165226.0, 86282.0, 44673.0, 23520.0, 12764.0, 7105.0, 3895.0, 2247.0, 1334.0, 736.0, 465.0, 278.0, 179.0, 97.0, 74.0, 34.0, 23.0, 17.0, 7.0, 9.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5322265625, -1.481689453125, -1.43115234375, -1.380615234375, -1.330078125, -1.279541015625, -1.22900390625, -1.178466796875, -1.1279296875, -1.077392578125, -1.02685546875, -0.976318359375, -0.92578125, -0.875244140625, -0.82470703125, -0.774169921875, -0.7236328125, -0.673095703125, -0.62255859375, -0.572021484375, -0.521484375, -0.470947265625, -0.42041015625, -0.369873046875, -0.3193359375, -0.268798828125, -0.21826171875, -0.167724609375, -0.1171875, -0.066650390625, -0.01611328125, 0.034423828125, 0.0849609375, 0.135498046875, 0.18603515625, 0.236572265625, 0.287109375, 0.337646484375, 0.38818359375, 0.438720703125, 0.4892578125, 0.539794921875, 0.59033203125, 0.640869140625, 0.69140625, 0.741943359375, 0.79248046875, 0.843017578125, 0.8935546875, 0.944091796875, 0.99462890625, 1.045166015625, 1.095703125, 1.146240234375, 1.19677734375, 1.247314453125, 1.2978515625, 1.348388671875, 1.39892578125, 1.449462890625, 1.5, 1.550537109375, 1.60107421875, 1.651611328125, 1.7021484375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 3.0, 6.0, 9.0, 6.0, 7.0, 11.0, 11.0, 19.0, 17.0, 16.0, 12.0, 14.0, 22.0, 28.0, 39.0, 48.0, 42.0, 50.0, 56.0, 72.0, 141.0, 217.0, 1301.0, 243.0, 155.0, 99.0, 76.0, 50.0, 48.0, 29.0, 32.0, 28.0, 24.0, 22.0, 15.0, 11.0, 10.0, 16.0, 10.0, 10.0, 8.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0546875, -3.930267333984375, -3.80584716796875, -3.681427001953125, -3.5570068359375, -3.432586669921875, -3.30816650390625, -3.183746337890625, -3.059326171875, -2.934906005859375, -2.81048583984375, -2.686065673828125, -2.5616455078125, -2.437225341796875, -2.31280517578125, -2.188385009765625, -2.06396484375, -1.939544677734375, -1.81512451171875, -1.690704345703125, -1.5662841796875, -1.441864013671875, -1.31744384765625, -1.193023681640625, -1.068603515625, -0.944183349609375, -0.81976318359375, -0.695343017578125, -0.5709228515625, -0.446502685546875, -0.32208251953125, -0.197662353515625, -0.0732421875, 0.051177978515625, 0.17559814453125, 0.300018310546875, 0.4244384765625, 0.548858642578125, 0.67327880859375, 0.797698974609375, 0.922119140625, 1.046539306640625, 1.17095947265625, 1.295379638671875, 1.4197998046875, 1.544219970703125, 1.66864013671875, 1.793060302734375, 1.91748046875, 2.041900634765625, 2.16632080078125, 2.290740966796875, 2.4151611328125, 2.539581298828125, 2.66400146484375, 2.788421630859375, 2.912841796875, 3.037261962890625, 3.16168212890625, 3.286102294921875, 3.4105224609375, 3.534942626953125, 3.65936279296875, 3.783782958984375, 3.908203125]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 5.0, 1.0, 2.0, 6.0, 5.0, 10.0, 13.0, 18.0, 20.0, 16.0, 29.0, 45.0, 47.0, 68.0, 87.0, 110.0, 130.0, 259.0, 380.0, 768.0, 2734.0, 25077.0, 815562.0, 2228927.0, 63854.0, 5159.0, 966.0, 395.0, 237.0, 203.0, 127.0, 88.0, 92.0, 49.0, 47.0, 30.0, 32.0, 25.0, 20.0, 11.0, 13.0, 7.0, 12.0, 9.0, 6.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.58203125, -7.33062744140625, -7.0792236328125, -6.82781982421875, -6.576416015625, -6.32501220703125, -6.0736083984375, -5.82220458984375, -5.57080078125, -5.31939697265625, -5.0679931640625, -4.81658935546875, -4.565185546875, -4.31378173828125, -4.0623779296875, -3.81097412109375, -3.5595703125, -3.30816650390625, -3.0567626953125, -2.80535888671875, -2.553955078125, -2.30255126953125, -2.0511474609375, -1.79974365234375, -1.54833984375, -1.29693603515625, -1.0455322265625, -0.79412841796875, -0.542724609375, -0.29132080078125, -0.0399169921875, 0.21148681640625, 0.462890625, 0.71429443359375, 0.9656982421875, 1.21710205078125, 1.468505859375, 1.71990966796875, 1.9713134765625, 2.22271728515625, 2.47412109375, 2.72552490234375, 2.9769287109375, 3.22833251953125, 3.479736328125, 3.73114013671875, 3.9825439453125, 4.23394775390625, 4.4853515625, 4.73675537109375, 4.9881591796875, 5.23956298828125, 5.490966796875, 5.74237060546875, 5.9937744140625, 6.24517822265625, 6.49658203125, 6.74798583984375, 6.9993896484375, 7.25079345703125, 7.502197265625, 7.75360107421875, 8.0050048828125, 8.25640869140625, 8.5078125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 51.0, 584.0, 367.0, 15.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.94912719726562, -108.9262924194336, -106.90345764160156, -104.88062286376953, -102.8577880859375, -100.83494567871094, -98.8121109008789, -96.78927612304688, -94.76644134521484, -92.74360656738281, -90.72077178955078, -88.69793701171875, -86.67509460449219, -84.65225982666016, -82.62942504882812, -80.6065902709961, -78.58375549316406, -76.56092071533203, -74.5380859375, -72.51525115966797, -70.49241638183594, -68.46957397460938, -66.44673919677734, -64.42390441894531, -62.40106964111328, -60.37823486328125, -58.35540008544922, -56.33256149291992, -54.30972671508789, -52.28689193725586, -50.26405334472656, -48.24121856689453, -46.2183837890625, -44.19554901123047, -42.17271423339844, -40.14987564086914, -38.12704086303711, -36.10420608520508, -34.08136749267578, -32.05853271484375, -30.03569793701172, -28.012863159179688, -25.990026473999023, -23.96718978881836, -21.944355010986328, -19.921520233154297, -17.898683547973633, -15.875847816467285, -13.853012084960938, -11.83017635345459, -9.807340621948242, -7.7845048904418945, -5.761669158935547, -3.738833427429199, -1.7159976959228516, 0.3068380355834961, 2.3296737670898438, 4.352509498596191, 6.375345230102539, 8.398180961608887, 10.421016693115234, 12.443852424621582, 14.46668815612793, 16.489524841308594, 18.512359619140625]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 7.0, 0.0, 11.0, 9.0, 8.0, 12.0, 12.0, 12.0, 19.0, 9.0, 22.0, 16.0, 30.0, 20.0, 25.0, 26.0, 33.0, 34.0, 30.0, 35.0, 28.0, 38.0, 32.0, 26.0, 42.0, 37.0, 40.0, 35.0, 31.0, 34.0, 28.0, 22.0, 22.0, 29.0, 26.0, 17.0, 15.0, 17.0, 9.0, 18.0, 17.0, 12.0, 14.0, 9.0, 12.0, 3.0, 4.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-9.198797225952148, -8.908488273620605, -8.618179321289062, -8.32787036895752, -8.037561416625977, -7.747252941131592, -7.456944465637207, -7.166635513305664, -6.876326560974121, -6.586017608642578, -6.295708656311035, -6.00540018081665, -5.715091228485107, -5.4247822761535645, -5.13447380065918, -4.844164848327637, -4.553855895996094, -4.263546943664551, -3.973238229751587, -3.682929515838623, -3.39262056350708, -3.102311611175537, -2.8120028972625732, -2.5216941833496094, -2.2313852310180664, -1.941076397895813, -1.6507675647735596, -1.3604587316513062, -1.0701498985290527, -0.7798410654067993, -0.4895322322845459, -0.19922351837158203, 0.09108543395996094, 0.38139426708221436, 0.6717031002044678, 0.9620119333267212, 1.2523207664489746, 1.542629599571228, 1.8329384326934814, 2.1232471466064453, 2.4135560989379883, 2.7038650512695312, 2.994173765182495, 3.284482479095459, 3.574791431427002, 3.865100383758545, 4.15540885925293, 4.445717811584473, 4.736026763916016, 5.026335716247559, 5.316644668579102, 5.606953144073486, 5.897262096405029, 6.187571048736572, 6.477879524230957, 6.7681884765625, 7.058497428894043, 7.348806381225586, 7.639115333557129, 7.929423809051514, 8.219732284545898, 8.510041236877441, 8.800350189208984, 9.090659141540527, 9.38096809387207]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 5.0, 7.0, 8.0, 11.0, 10.0, 15.0, 12.0, 18.0, 20.0, 21.0, 21.0, 18.0, 25.0, 26.0, 33.0, 29.0, 44.0, 36.0, 34.0, 38.0, 33.0, 34.0, 44.0, 54.0, 30.0, 26.0, 37.0, 24.0, 26.0, 36.0, 37.0, 28.0, 17.0, 17.0, 26.0, 21.0, 21.0, 9.0, 11.0, 4.0, 5.0, 7.0, 4.0, 6.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-1.3505859375, -1.3102569580078125, -1.269927978515625, -1.2295989990234375, -1.18927001953125, -1.1489410400390625, -1.108612060546875, -1.0682830810546875, -1.0279541015625, -0.9876251220703125, -0.947296142578125, -0.9069671630859375, -0.86663818359375, -0.8263092041015625, -0.785980224609375, -0.7456512451171875, -0.705322265625, -0.6649932861328125, -0.624664306640625, -0.5843353271484375, -0.54400634765625, -0.5036773681640625, -0.463348388671875, -0.4230194091796875, -0.3826904296875, -0.3423614501953125, -0.302032470703125, -0.2617034912109375, -0.22137451171875, -0.1810455322265625, -0.140716552734375, -0.1003875732421875, -0.06005859375, -0.0197296142578125, 0.020599365234375, 0.0609283447265625, 0.10125732421875, 0.1415863037109375, 0.181915283203125, 0.2222442626953125, 0.2625732421875, 0.3029022216796875, 0.343231201171875, 0.3835601806640625, 0.42388916015625, 0.4642181396484375, 0.504547119140625, 0.5448760986328125, 0.585205078125, 0.6255340576171875, 0.665863037109375, 0.7061920166015625, 0.74652099609375, 0.7868499755859375, 0.827178955078125, 0.8675079345703125, 0.9078369140625, 0.9481658935546875, 0.988494873046875, 1.0288238525390625, 1.06915283203125, 1.1094818115234375, 1.149810791015625, 1.1901397705078125, 1.23046875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 1.0, 5.0, 6.0, 8.0, 17.0, 17.0, 22.0, 17.0, 34.0, 46.0, 65.0, 69.0, 113.0, 179.0, 261.0, 359.0, 571.0, 944.0, 1482.0, 2509.0, 4346.0, 8508.0, 17327.0, 41345.0, 114503.0, 396076.0, 1372483.0, 1538710.0, 476231.0, 132952.0, 45767.0, 19175.0, 8881.0, 4557.0, 2526.0, 1491.0, 942.0, 538.0, 374.0, 264.0, 161.0, 109.0, 92.0, 43.0, 41.0, 32.0, 24.0, 18.0, 13.0, 5.0, 8.0, 7.0, 6.0, 4.0, 3.0, 1.0], "bins": [-2.330078125, -2.2636260986328125, -2.197174072265625, -2.1307220458984375, -2.06427001953125, -1.9978179931640625, -1.931365966796875, -1.8649139404296875, -1.7984619140625, -1.7320098876953125, -1.665557861328125, -1.5991058349609375, -1.53265380859375, -1.4662017822265625, -1.399749755859375, -1.3332977294921875, -1.266845703125, -1.2003936767578125, -1.133941650390625, -1.0674896240234375, -1.00103759765625, -0.9345855712890625, -0.868133544921875, -0.8016815185546875, -0.7352294921875, -0.6687774658203125, -0.602325439453125, -0.5358734130859375, -0.46942138671875, -0.4029693603515625, -0.336517333984375, -0.2700653076171875, -0.20361328125, -0.1371612548828125, -0.070709228515625, -0.0042572021484375, 0.06219482421875, 0.1286468505859375, 0.195098876953125, 0.2615509033203125, 0.3280029296875, 0.3944549560546875, 0.460906982421875, 0.5273590087890625, 0.59381103515625, 0.6602630615234375, 0.726715087890625, 0.7931671142578125, 0.859619140625, 0.9260711669921875, 0.992523193359375, 1.0589752197265625, 1.12542724609375, 1.1918792724609375, 1.258331298828125, 1.3247833251953125, 1.3912353515625, 1.4576873779296875, 1.524139404296875, 1.5905914306640625, 1.65704345703125, 1.7234954833984375, 1.789947509765625, 1.8563995361328125, 1.9228515625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 6.0, 7.0, 14.0, 12.0, 15.0, 16.0, 14.0, 42.0, 36.0, 64.0, 88.0, 96.0, 132.0, 195.0, 271.0, 363.0, 425.0, 476.0, 440.0, 349.0, 260.0, 185.0, 132.0, 106.0, 76.0, 55.0, 50.0, 33.0, 25.0, 17.0, 16.0, 11.0, 12.0, 6.0, 10.0, 2.0, 3.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.306640625, -2.22857666015625, -2.1505126953125, -2.07244873046875, -1.994384765625, -1.91632080078125, -1.8382568359375, -1.76019287109375, -1.68212890625, -1.60406494140625, -1.5260009765625, -1.44793701171875, -1.369873046875, -1.29180908203125, -1.2137451171875, -1.13568115234375, -1.0576171875, -0.97955322265625, -0.9014892578125, -0.82342529296875, -0.745361328125, -0.66729736328125, -0.5892333984375, -0.51116943359375, -0.43310546875, -0.35504150390625, -0.2769775390625, -0.19891357421875, -0.120849609375, -0.04278564453125, 0.0352783203125, 0.11334228515625, 0.19140625, 0.26947021484375, 0.3475341796875, 0.42559814453125, 0.503662109375, 0.58172607421875, 0.6597900390625, 0.73785400390625, 0.81591796875, 0.89398193359375, 0.9720458984375, 1.05010986328125, 1.128173828125, 1.20623779296875, 1.2843017578125, 1.36236572265625, 1.4404296875, 1.51849365234375, 1.5965576171875, 1.67462158203125, 1.752685546875, 1.83074951171875, 1.9088134765625, 1.98687744140625, 2.06494140625, 2.14300537109375, 2.2210693359375, 2.29913330078125, 2.377197265625, 2.45526123046875, 2.5333251953125, 2.61138916015625, 2.689453125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 6.0, 7.0, 14.0, 12.0, 16.0, 19.0, 32.0, 39.0, 60.0, 88.0, 111.0, 128.0, 228.0, 419.0, 1273.0, 8830.0, 161317.0, 3635703.0, 367550.0, 15062.0, 1939.0, 518.0, 279.0, 157.0, 138.0, 79.0, 74.0, 42.0, 35.0, 28.0, 14.0, 18.0, 15.0, 6.0, 6.0, 3.0, 3.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.8671875, -10.56201171875, -10.2568359375, -9.95166015625, -9.646484375, -9.34130859375, -9.0361328125, -8.73095703125, -8.42578125, -8.12060546875, -7.8154296875, -7.51025390625, -7.205078125, -6.89990234375, -6.5947265625, -6.28955078125, -5.984375, -5.67919921875, -5.3740234375, -5.06884765625, -4.763671875, -4.45849609375, -4.1533203125, -3.84814453125, -3.54296875, -3.23779296875, -2.9326171875, -2.62744140625, -2.322265625, -2.01708984375, -1.7119140625, -1.40673828125, -1.1015625, -0.79638671875, -0.4912109375, -0.18603515625, 0.119140625, 0.42431640625, 0.7294921875, 1.03466796875, 1.33984375, 1.64501953125, 1.9501953125, 2.25537109375, 2.560546875, 2.86572265625, 3.1708984375, 3.47607421875, 3.78125, 4.08642578125, 4.3916015625, 4.69677734375, 5.001953125, 5.30712890625, 5.6123046875, 5.91748046875, 6.22265625, 6.52783203125, 6.8330078125, 7.13818359375, 7.443359375, 7.74853515625, 8.0537109375, 8.35888671875, 8.6640625]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 8.0, 4.0, 6.0, 9.0, 11.0, 16.0, 28.0, 28.0, 42.0, 34.0, 46.0, 62.0, 63.0, 80.0, 66.0, 72.0, 56.0, 69.0, 59.0, 54.0, 40.0, 40.0, 30.0, 22.0, 12.0, 13.0, 17.0, 5.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.605474472045898, -10.317895889282227, -10.030316352844238, -9.742737770080566, -9.455159187316895, -9.167579650878906, -8.880001068115234, -8.592422485351562, -8.30484390258789, -8.017265319824219, -7.729686260223389, -7.442107200622559, -7.154528617858887, -6.866949558258057, -6.579370498657227, -6.291791915893555, -6.004212379455566, -5.716633319854736, -5.4290547370910645, -5.141475677490234, -4.8538970947265625, -4.566318035125732, -4.278738975524902, -3.9911601543426514, -3.7035813331604004, -3.4160025119781494, -3.1284236907958984, -2.8408446311950684, -2.5532658100128174, -2.2656869888305664, -1.9781080484390259, -1.6905291080474854, -1.4029498100280762, -1.1153709888458252, -0.8277920484542847, -0.5402131676673889, -0.25263428688049316, 0.03494453430175781, 0.32252347469329834, 0.6101024150848389, 0.8976812362670898, 1.1852600574493408, 1.4728389978408813, 1.7604179382324219, 2.047996759414673, 2.335575580596924, 2.623154640197754, 2.910733461380005, 3.198312282562256, 3.485891103744507, 3.773469924926758, 4.061048984527588, 4.348628044128418, 4.63620662689209, 4.92378568649292, 5.21136474609375, 5.498943328857422, 5.786522388458252, 6.074100971221924, 6.361680030822754, 6.649258613586426, 6.936837673187256, 7.224416732788086, 7.511995315551758, 7.799574375152588]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 7.0, 5.0, 7.0, 4.0, 14.0, 11.0, 17.0, 13.0, 15.0, 25.0, 26.0, 25.0, 29.0, 23.0, 35.0, 36.0, 52.0, 27.0, 47.0, 34.0, 29.0, 36.0, 35.0, 48.0, 22.0, 33.0, 38.0, 26.0, 33.0, 26.0, 35.0, 24.0, 32.0, 23.0, 21.0, 14.0, 10.0, 10.0, 10.0, 9.0, 4.0, 6.0, 5.0, 2.0, 3.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.866444110870361, -7.615448474884033, -7.364452362060547, -7.113456726074219, -6.862461090087891, -6.6114654541015625, -6.360469818115234, -6.109473705291748, -5.85847806930542, -5.607482433319092, -5.3564863204956055, -5.105490684509277, -4.854495048522949, -4.603499412536621, -4.352503776550293, -4.101507663726807, -3.8505120277404785, -3.5995163917541504, -3.348520517349243, -3.097524642944336, -2.846529006958008, -2.5955333709716797, -2.3445374965667725, -2.0935416221618652, -1.842545986175537, -1.5915502309799194, -1.3405544757843018, -1.089558720588684, -0.8385629653930664, -0.5875672101974487, -0.33657145500183105, -0.08557569980621338, 0.1654195785522461, 0.41641533374786377, 0.6674110889434814, 0.9184068441390991, 1.1694025993347168, 1.4203983545303345, 1.6713941097259521, 1.9223898649215698, 2.1733856201171875, 2.4243812561035156, 2.675377130508423, 2.92637300491333, 3.177368640899658, 3.4283642768859863, 3.6793601512908936, 3.930356025695801, 4.181351661682129, 4.432347297668457, 4.683342933654785, 4.9343390464782715, 5.1853346824646, 5.436330318450928, 5.687326431274414, 5.938322067260742, 6.18931770324707, 6.440313339233398, 6.691308975219727, 6.942305088043213, 7.193300724029541, 7.444296360015869, 7.6952924728393555, 7.946288108825684, 8.197283744812012]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 9.0, 6.0, 8.0, 6.0, 18.0, 13.0, 13.0, 11.0, 14.0, 8.0, 19.0, 15.0, 25.0, 24.0, 26.0, 31.0, 24.0, 38.0, 35.0, 53.0, 33.0, 39.0, 35.0, 41.0, 47.0, 44.0, 33.0, 35.0, 34.0, 31.0, 22.0, 24.0, 29.0, 18.0, 25.0, 18.0, 17.0, 17.0, 22.0, 12.0, 6.0, 12.0, 6.0, 7.0, 4.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.2353515625, -1.1966400146484375, -1.157928466796875, -1.1192169189453125, -1.08050537109375, -1.0417938232421875, -1.003082275390625, -0.9643707275390625, -0.9256591796875, -0.8869476318359375, -0.848236083984375, -0.8095245361328125, -0.77081298828125, -0.7321014404296875, -0.693389892578125, -0.6546783447265625, -0.615966796875, -0.5772552490234375, -0.538543701171875, -0.4998321533203125, -0.46112060546875, -0.4224090576171875, -0.383697509765625, -0.3449859619140625, -0.3062744140625, -0.2675628662109375, -0.228851318359375, -0.1901397705078125, -0.15142822265625, -0.1127166748046875, -0.074005126953125, -0.0352935791015625, 0.00341796875, 0.0421295166015625, 0.080841064453125, 0.1195526123046875, 0.15826416015625, 0.1969757080078125, 0.235687255859375, 0.2743988037109375, 0.3131103515625, 0.3518218994140625, 0.390533447265625, 0.4292449951171875, 0.46795654296875, 0.5066680908203125, 0.545379638671875, 0.5840911865234375, 0.622802734375, 0.6615142822265625, 0.700225830078125, 0.7389373779296875, 0.77764892578125, 0.8163604736328125, 0.855072021484375, 0.8937835693359375, 0.9324951171875, 0.9712066650390625, 1.009918212890625, 1.0486297607421875, 1.08734130859375, 1.1260528564453125, 1.164764404296875, 1.2034759521484375, 1.2421875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 1.0, 11.0, 12.0, 38.0, 61.0, 93.0, 190.0, 341.0, 712.0, 1354.0, 2935.0, 6973.0, 38696.0, 774898.0, 201829.0, 12117.0, 4280.0, 2018.0, 912.0, 511.0, 263.0, 136.0, 84.0, 34.0, 22.0, 13.0, 6.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.33984375, -1.3001251220703125, -1.260406494140625, -1.2206878662109375, -1.18096923828125, -1.1412506103515625, -1.101531982421875, -1.0618133544921875, -1.0220947265625, -0.9823760986328125, -0.942657470703125, -0.9029388427734375, -0.86322021484375, -0.8235015869140625, -0.783782958984375, -0.7440643310546875, -0.704345703125, -0.6646270751953125, -0.624908447265625, -0.5851898193359375, -0.54547119140625, -0.5057525634765625, -0.466033935546875, -0.4263153076171875, -0.3865966796875, -0.3468780517578125, -0.307159423828125, -0.2674407958984375, -0.22772216796875, -0.1880035400390625, -0.148284912109375, -0.1085662841796875, -0.06884765625, -0.0291290283203125, 0.010589599609375, 0.0503082275390625, 0.09002685546875, 0.1297454833984375, 0.169464111328125, 0.2091827392578125, 0.2489013671875, 0.2886199951171875, 0.328338623046875, 0.3680572509765625, 0.40777587890625, 0.4474945068359375, 0.487213134765625, 0.5269317626953125, 0.566650390625, 0.6063690185546875, 0.646087646484375, 0.6858062744140625, 0.72552490234375, 0.7652435302734375, 0.804962158203125, 0.8446807861328125, 0.8843994140625, 0.9241180419921875, 0.963836669921875, 1.0035552978515625, 1.04327392578125, 1.0829925537109375, 1.122711181640625, 1.1624298095703125, 1.2021484375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 3.0, 7.0, 7.0, 5.0, 3.0, 16.0, 17.0, 11.0, 16.0, 10.0, 25.0, 22.0, 26.0, 27.0, 27.0, 40.0, 23.0, 49.0, 37.0, 41.0, 40.0, 1057.0, 53.0, 39.0, 47.0, 47.0, 23.0, 46.0, 37.0, 34.0, 26.0, 23.0, 28.0, 23.0, 22.0, 14.0, 14.0, 7.0, 11.0, 3.0, 5.0, 2.0, 5.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.833984375, -0.80487060546875, -0.7757568359375, -0.74664306640625, -0.717529296875, -0.68841552734375, -0.6593017578125, -0.63018798828125, -0.60107421875, -0.57196044921875, -0.5428466796875, -0.51373291015625, -0.484619140625, -0.45550537109375, -0.4263916015625, -0.39727783203125, -0.3681640625, -0.33905029296875, -0.3099365234375, -0.28082275390625, -0.251708984375, -0.22259521484375, -0.1934814453125, -0.16436767578125, -0.13525390625, -0.10614013671875, -0.0770263671875, -0.04791259765625, -0.018798828125, 0.01031494140625, 0.0394287109375, 0.06854248046875, 0.09765625, 0.12677001953125, 0.1558837890625, 0.18499755859375, 0.214111328125, 0.24322509765625, 0.2723388671875, 0.30145263671875, 0.33056640625, 0.35968017578125, 0.3887939453125, 0.41790771484375, 0.447021484375, 0.47613525390625, 0.5052490234375, 0.53436279296875, 0.5634765625, 0.59259033203125, 0.6217041015625, 0.65081787109375, 0.679931640625, 0.70904541015625, 0.7381591796875, 0.76727294921875, 0.79638671875, 0.82550048828125, 0.8546142578125, 0.88372802734375, 0.912841796875, 0.94195556640625, 0.9710693359375, 1.00018310546875, 1.029296875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 11.0, 14.0, 28.0, 26.0, 28.0, 58.0, 62.0, 69.0, 89.0, 144.0, 158.0, 184.0, 275.0, 415.0, 541.0, 804.0, 1215.0, 2048.0, 4286.0, 12086.0, 61545.0, 542489.0, 1350658.0, 91962.0, 15989.0, 5011.0, 2360.0, 1383.0, 851.0, 606.0, 434.0, 301.0, 227.0, 184.0, 127.0, 101.0, 86.0, 71.0, 58.0, 34.0, 19.0, 26.0, 25.0, 8.0, 6.0, 8.0, 5.0, 0.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.393310546875, -0.3806648254394531, -0.36801910400390625, -0.3553733825683594, -0.3427276611328125, -0.3300819396972656, -0.31743621826171875, -0.3047904968261719, -0.292144775390625, -0.2794990539550781, -0.26685333251953125, -0.2542076110839844, -0.2415618896484375, -0.22891616821289062, -0.21627044677734375, -0.20362472534179688, -0.19097900390625, -0.17833328247070312, -0.16568756103515625, -0.15304183959960938, -0.1403961181640625, -0.12775039672851562, -0.11510467529296875, -0.10245895385742188, -0.089813232421875, -0.07716751098632812, -0.06452178955078125, -0.051876068115234375, -0.0392303466796875, -0.026584625244140625, -0.01393890380859375, -0.001293182373046875, 0.0113525390625, 0.023998260498046875, 0.03664398193359375, 0.049289703369140625, 0.0619354248046875, 0.07458114624023438, 0.08722686767578125, 0.09987258911132812, 0.112518310546875, 0.12516403198242188, 0.13780975341796875, 0.15045547485351562, 0.1631011962890625, 0.17574691772460938, 0.18839263916015625, 0.20103836059570312, 0.21368408203125, 0.22632980346679688, 0.23897552490234375, 0.2516212463378906, 0.2642669677734375, 0.2769126892089844, 0.28955841064453125, 0.3022041320800781, 0.314849853515625, 0.3274955749511719, 0.34014129638671875, 0.3527870178222656, 0.3654327392578125, 0.3780784606933594, 0.39072418212890625, 0.4033699035644531, 0.416015625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 1.0, 5.0, 8.0, 8.0, 16.0, 27.0, 54.0, 63.0, 106.0, 166.0, 169.0, 134.0, 76.0, 55.0, 36.0, 22.0, 22.0, 11.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052642822265625, -0.05122661590576172, -0.04981040954589844, -0.048394203186035156, -0.046977996826171875, -0.045561790466308594, -0.04414558410644531, -0.04272937774658203, -0.04131317138671875, -0.03989696502685547, -0.03848075866699219, -0.037064552307128906, -0.035648345947265625, -0.034232139587402344, -0.03281593322753906, -0.03139972686767578, -0.0299835205078125, -0.02856731414794922, -0.027151107788085938, -0.025734901428222656, -0.024318695068359375, -0.022902488708496094, -0.021486282348632812, -0.02007007598876953, -0.01865386962890625, -0.01723766326904297, -0.015821456909179688, -0.014405250549316406, -0.012989044189453125, -0.011572837829589844, -0.010156631469726562, -0.008740425109863281, -0.00732421875, -0.005908012390136719, -0.0044918060302734375, -0.0030755996704101562, -0.001659393310546875, -0.00024318695068359375, 0.0011730194091796875, 0.0025892257690429688, 0.00400543212890625, 0.005421638488769531, 0.0068378448486328125, 0.008254051208496094, 0.009670257568359375, 0.011086463928222656, 0.012502670288085938, 0.013918876647949219, 0.0153350830078125, 0.01675128936767578, 0.018167495727539062, 0.019583702087402344, 0.020999908447265625, 0.022416114807128906, 0.023832321166992188, 0.02524852752685547, 0.02666473388671875, 0.02808094024658203, 0.029497146606445312, 0.030913352966308594, 0.032329559326171875, 0.033745765686035156, 0.03516197204589844, 0.03657817840576172, 0.037994384765625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 9.0, 14.0, 20.0, 24.0, 37.0, 56.0, 94.0, 298.0, 3700.0, 1010187.0, 32770.0, 980.0, 144.0, 70.0, 45.0, 30.0, 17.0, 12.0, 9.0, 12.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8544921875, -0.82373046875, -0.79296875, -0.76220703125, -0.7314453125, -0.70068359375, -0.669921875, -0.63916015625, -0.6083984375, -0.57763671875, -0.546875, -0.51611328125, -0.4853515625, -0.45458984375, -0.423828125, -0.39306640625, -0.3623046875, -0.33154296875, -0.30078125, -0.27001953125, -0.2392578125, -0.20849609375, -0.177734375, -0.14697265625, -0.1162109375, -0.08544921875, -0.0546875, -0.02392578125, 0.0068359375, 0.03759765625, 0.068359375, 0.09912109375, 0.1298828125, 0.16064453125, 0.19140625, 0.22216796875, 0.2529296875, 0.28369140625, 0.314453125, 0.34521484375, 0.3759765625, 0.40673828125, 0.4375, 0.46826171875, 0.4990234375, 0.52978515625, 0.560546875, 0.59130859375, 0.6220703125, 0.65283203125, 0.68359375, 0.71435546875, 0.7451171875, 0.77587890625, 0.806640625, 0.83740234375, 0.8681640625, 0.89892578125, 0.9296875, 0.96044921875, 0.9912109375, 1.02197265625, 1.052734375, 1.08349609375, 1.1142578125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 24.0, 117.0, 428.0, 357.0, 76.0, 9.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042202409356832504, -0.03498657047748566, -0.02777072787284851, -0.020554888993501663, -0.013339048251509666, -0.00612320750951767, 0.0010926313698291779, 0.008308473974466324, 0.015524312853813171, 0.022740153595805168, 0.029955994337797165, 0.03717183321714401, 0.04438767582178116, 0.051603514701128006, 0.058819353580474854, 0.066035196185112, 0.07325103878974915, 0.08046688139438629, 0.08768271654844284, 0.09489855915307999, 0.10211440175771713, 0.10933023691177368, 0.11654607951641083, 0.12376192212104797, 0.13097774982452393, 0.13819359242916107, 0.14540943503379822, 0.15262526273727417, 0.15984110534191132, 0.16705694794654846, 0.1742727905511856, 0.18148863315582275, 0.1887044757604599, 0.19592031836509705, 0.2031361609697342, 0.21035200357437134, 0.2175678312778473, 0.22478367388248444, 0.23199951648712158, 0.23921535909175873, 0.24643120169639587, 0.2536470293998718, 0.26086288690567017, 0.2680787146091461, 0.27529457211494446, 0.2825103998184204, 0.28972625732421875, 0.2969420850276947, 0.30415791273117065, 0.3113737404346466, 0.31858959794044495, 0.3258054256439209, 0.33302128314971924, 0.3402371108531952, 0.34745293855667114, 0.3546687960624695, 0.3618846535682678, 0.3691004812717438, 0.3763163387775421, 0.38353216648101807, 0.3907480239868164, 0.39796385169029236, 0.4051796793937683, 0.41239553689956665, 0.4196113646030426]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 7.0, 5.0, 13.0, 7.0, 13.0, 23.0, 11.0, 22.0, 20.0, 28.0, 28.0, 34.0, 29.0, 37.0, 32.0, 36.0, 39.0, 37.0, 46.0, 35.0, 25.0, 41.0, 50.0, 34.0, 43.0, 28.0, 31.0, 31.0, 35.0, 25.0, 28.0, 24.0, 13.0, 12.0, 15.0, 12.0, 14.0, 9.0, 4.0, 2.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.03391587734222412, -0.03291811794042587, -0.031920358538627625, -0.030922595411539078, -0.02992483600974083, -0.02892707660794258, -0.027929315343499184, -0.026931554079055786, -0.025933794677257538, -0.02493603527545929, -0.023938274011015892, -0.022940512746572495, -0.021942753344774246, -0.020944993942975998, -0.0199472326785326, -0.018949471414089203, -0.017951712012290955, -0.016953952610492706, -0.01595619134604931, -0.014958431012928486, -0.013960670679807663, -0.01296291034668684, -0.011965150013566017, -0.010967389680445194, -0.009969629347324371, -0.008971869014203548, -0.007974108681082726, -0.006976348347961903, -0.00597858801484108, -0.004980827681720257, -0.003983067348599434, -0.002985307015478611, -0.001987546682357788, -0.0009897863492369652, 7.973983883857727e-06, 0.0010057343170046806, 0.0020034946501255035, 0.0030012549832463264, 0.003999015316367149, 0.004996775649487972, 0.005994535982608795, 0.006992296315729618, 0.007990056648850441, 0.008987816981971264, 0.009985577315092087, 0.01098333764821291, 0.011981097981333733, 0.012978858314454556, 0.013976618647575378, 0.014974378980696201, 0.015972139313817024, 0.016969900578260422, 0.01796765998005867, 0.01896541938185692, 0.019963180646300316, 0.020960941910743713, 0.02195870131254196, 0.02295646071434021, 0.023954221978783607, 0.024951983243227005, 0.025949742645025253, 0.0269475020468235, 0.0279452633112669, 0.028943024575710297, 0.029940783977508545]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 8.0, 7.0, 8.0, 6.0, 18.0, 13.0, 13.0, 11.0, 14.0, 8.0, 19.0, 15.0, 25.0, 24.0, 27.0, 30.0, 25.0, 38.0, 32.0, 55.0, 31.0, 40.0, 36.0, 41.0, 46.0, 45.0, 31.0, 37.0, 34.0, 30.0, 23.0, 24.0, 29.0, 18.0, 25.0, 16.0, 19.0, 17.0, 22.0, 11.0, 7.0, 11.0, 6.0, 7.0, 5.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.234375, -1.195709228515625, -1.15704345703125, -1.118377685546875, -1.0797119140625, -1.041046142578125, -1.00238037109375, -0.963714599609375, -0.925048828125, -0.886383056640625, -0.84771728515625, -0.809051513671875, -0.7703857421875, -0.731719970703125, -0.69305419921875, -0.654388427734375, -0.61572265625, -0.577056884765625, -0.53839111328125, -0.499725341796875, -0.4610595703125, -0.422393798828125, -0.38372802734375, -0.345062255859375, -0.306396484375, -0.267730712890625, -0.22906494140625, -0.190399169921875, -0.1517333984375, -0.113067626953125, -0.07440185546875, -0.035736083984375, 0.0029296875, 0.041595458984375, 0.08026123046875, 0.118927001953125, 0.1575927734375, 0.196258544921875, 0.23492431640625, 0.273590087890625, 0.312255859375, 0.350921630859375, 0.38958740234375, 0.428253173828125, 0.4669189453125, 0.505584716796875, 0.54425048828125, 0.582916259765625, 0.62158203125, 0.660247802734375, 0.69891357421875, 0.737579345703125, 0.7762451171875, 0.814910888671875, 0.85357666015625, 0.892242431640625, 0.930908203125, 0.969573974609375, 1.00823974609375, 1.046905517578125, 1.0855712890625, 1.124237060546875, 1.16290283203125, 1.201568603515625, 1.240234375]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 6.0, 4.0, 8.0, 10.0, 18.0, 25.0, 33.0, 40.0, 63.0, 116.0, 180.0, 285.0, 441.0, 741.0, 1279.0, 2224.0, 3900.0, 6760.0, 11820.0, 20599.0, 35604.0, 60255.0, 97867.0, 160083.0, 252722.0, 156050.0, 96521.0, 58869.0, 34762.0, 20148.0, 11434.0, 6473.0, 3702.0, 2158.0, 1314.0, 799.0, 440.0, 292.0, 186.0, 115.0, 70.0, 46.0, 37.0, 22.0, 13.0, 4.0, 6.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.4453125, -1.3993988037109375, -1.353485107421875, -1.3075714111328125, -1.26165771484375, -1.2157440185546875, -1.169830322265625, -1.1239166259765625, -1.0780029296875, -1.0320892333984375, -0.986175537109375, -0.9402618408203125, -0.89434814453125, -0.8484344482421875, -0.802520751953125, -0.7566070556640625, -0.710693359375, -0.6647796630859375, -0.618865966796875, -0.5729522705078125, -0.52703857421875, -0.4811248779296875, -0.435211181640625, -0.3892974853515625, -0.3433837890625, -0.2974700927734375, -0.251556396484375, -0.2056427001953125, -0.15972900390625, -0.1138153076171875, -0.067901611328125, -0.0219879150390625, 0.02392578125, 0.0698394775390625, 0.115753173828125, 0.1616668701171875, 0.20758056640625, 0.2534942626953125, 0.299407958984375, 0.3453216552734375, 0.3912353515625, 0.4371490478515625, 0.483062744140625, 0.5289764404296875, 0.57489013671875, 0.6208038330078125, 0.666717529296875, 0.7126312255859375, 0.758544921875, 0.8044586181640625, 0.850372314453125, 0.8962860107421875, 0.94219970703125, 0.9881134033203125, 1.034027099609375, 1.0799407958984375, 1.1258544921875, 1.1717681884765625, 1.217681884765625, 1.2635955810546875, 1.30950927734375, 1.3554229736328125, 1.401336669921875, 1.4472503662109375, 1.4931640625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 5.0, 6.0, 3.0, 10.0, 6.0, 8.0, 13.0, 15.0, 15.0, 14.0, 17.0, 23.0, 37.0, 35.0, 25.0, 32.0, 52.0, 62.0, 77.0, 137.0, 175.0, 1335.0, 252.0, 152.0, 121.0, 77.0, 57.0, 45.0, 40.0, 31.0, 29.0, 21.0, 22.0, 10.0, 22.0, 14.0, 7.0, 15.0, 8.0, 2.0, 9.0, 5.0, 3.0, 3.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.740234375, -3.626678466796875, -3.51312255859375, -3.399566650390625, -3.2860107421875, -3.172454833984375, -3.05889892578125, -2.945343017578125, -2.831787109375, -2.718231201171875, -2.60467529296875, -2.491119384765625, -2.3775634765625, -2.264007568359375, -2.15045166015625, -2.036895751953125, -1.92333984375, -1.809783935546875, -1.69622802734375, -1.582672119140625, -1.4691162109375, -1.355560302734375, -1.24200439453125, -1.128448486328125, -1.014892578125, -0.901336669921875, -0.78778076171875, -0.674224853515625, -0.5606689453125, -0.447113037109375, -0.33355712890625, -0.220001220703125, -0.1064453125, 0.007110595703125, 0.12066650390625, 0.234222412109375, 0.3477783203125, 0.461334228515625, 0.57489013671875, 0.688446044921875, 0.802001953125, 0.915557861328125, 1.02911376953125, 1.142669677734375, 1.2562255859375, 1.369781494140625, 1.48333740234375, 1.596893310546875, 1.71044921875, 1.824005126953125, 1.93756103515625, 2.051116943359375, 2.1646728515625, 2.278228759765625, 2.39178466796875, 2.505340576171875, 2.618896484375, 2.732452392578125, 2.84600830078125, 2.959564208984375, 3.0731201171875, 3.186676025390625, 3.30023193359375, 3.413787841796875, 3.52734375]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 5.0, 10.0, 16.0, 18.0, 17.0, 25.0, 44.0, 59.0, 72.0, 98.0, 123.0, 164.0, 260.0, 509.0, 1040.0, 5018.0, 122165.0, 2835936.0, 171335.0, 6130.0, 1143.0, 517.0, 308.0, 173.0, 140.0, 89.0, 77.0, 53.0, 38.0, 35.0, 22.0, 9.0, 11.0, 8.0, 11.0, 11.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.359375, -10.0594482421875, -9.759521484375, -9.4595947265625, -9.15966796875, -8.8597412109375, -8.559814453125, -8.2598876953125, -7.9599609375, -7.6600341796875, -7.360107421875, -7.0601806640625, -6.76025390625, -6.4603271484375, -6.160400390625, -5.8604736328125, -5.560546875, -5.2606201171875, -4.960693359375, -4.6607666015625, -4.36083984375, -4.0609130859375, -3.760986328125, -3.4610595703125, -3.1611328125, -2.8612060546875, -2.561279296875, -2.2613525390625, -1.96142578125, -1.6614990234375, -1.361572265625, -1.0616455078125, -0.76171875, -0.4617919921875, -0.161865234375, 0.1380615234375, 0.43798828125, 0.7379150390625, 1.037841796875, 1.3377685546875, 1.6376953125, 1.9376220703125, 2.237548828125, 2.5374755859375, 2.83740234375, 3.1373291015625, 3.437255859375, 3.7371826171875, 4.037109375, 4.3370361328125, 4.636962890625, 4.9368896484375, 5.23681640625, 5.5367431640625, 5.836669921875, 6.1365966796875, 6.4365234375, 6.7364501953125, 7.036376953125, 7.3363037109375, 7.63623046875, 7.9361572265625, 8.236083984375, 8.5360107421875, 8.8359375]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 47.0, 172.0, 343.0, 275.0, 140.0, 23.0, 10.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.34880447387695, -50.42807388305664, -49.50733947753906, -48.58660888671875, -47.66587829589844, -46.745147705078125, -45.82441711425781, -44.903682708740234, -43.98295211791992, -43.06222152709961, -42.14148712158203, -41.22075653076172, -40.300025939941406, -39.379295349121094, -38.45856475830078, -37.5378303527832, -36.61709976196289, -35.69636917114258, -34.775634765625, -33.85490417480469, -32.934173583984375, -32.01344299316406, -31.092710494995117, -30.171977996826172, -29.25124740600586, -28.330516815185547, -27.4097843170166, -26.489051818847656, -25.568321228027344, -24.64759063720703, -23.726858139038086, -22.80612564086914, -21.885393142700195, -20.96466064453125, -20.043930053710938, -19.123199462890625, -18.20246696472168, -17.281734466552734, -16.361003875732422, -15.440272331237793, -14.519540786743164, -13.598809242248535, -12.678077697753906, -11.757346153259277, -10.836614608764648, -9.91588306427002, -8.99515151977539, -8.074419975280762, -7.153688430786133, -6.232956886291504, -5.312225341796875, -4.391493797302246, -3.470762252807617, -2.5500307083129883, -1.6292991638183594, -0.7085676193237305, 0.21216392517089844, 1.1328954696655273, 2.0536270141601562, 2.974358558654785, 3.895090103149414, 4.815821647644043, 5.736553192138672, 6.657284736633301, 7.57801628112793]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 5.0, 8.0, 5.0, 9.0, 14.0, 12.0, 12.0, 11.0, 20.0, 28.0, 34.0, 22.0, 31.0, 40.0, 39.0, 43.0, 41.0, 44.0, 54.0, 36.0, 54.0, 39.0, 42.0, 36.0, 38.0, 40.0, 24.0, 34.0, 28.0, 27.0, 20.0, 20.0, 28.0, 17.0, 11.0, 11.0, 11.0, 6.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.273069381713867, -11.90623664855957, -11.539403915405273, -11.172571182250977, -10.805737495422363, -10.438904762268066, -10.07207202911377, -9.705239295959473, -9.33840560913086, -8.971572875976562, -8.604740142822266, -8.237907409667969, -7.8710737228393555, -7.504240989685059, -7.137408256530762, -6.770575523376465, -6.403742790222168, -6.036910057067871, -5.670076847076416, -5.303244113922119, -4.936410903930664, -4.569578170776367, -4.20274543762207, -3.8359124660491943, -3.4690794944763184, -3.1022465229034424, -2.7354135513305664, -2.3685808181762695, -2.0017478466033936, -1.6349148750305176, -1.2680821418762207, -0.9012491703033447, -0.5344152450561523, -0.16758233308792114, 0.19925057888031006, 0.5660834312438965, 0.9329164028167725, 1.2997493743896484, 1.6665821075439453, 2.0334150791168213, 2.4002480506896973, 2.7670810222625732, 3.133913993835449, 3.500746726989746, 3.867579698562622, 4.234412670135498, 4.601245403289795, 4.96807861328125, 5.334911346435547, 5.701744079589844, 6.068577289581299, 6.435410022735596, 6.802243232727051, 7.169075965881348, 7.5359086990356445, 7.902741432189941, 8.269575119018555, 8.636407852172852, 9.003240585327148, 9.370073318481445, 9.736907005310059, 10.103739738464355, 10.470572471618652, 10.83740520477295, 11.204237937927246]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 9.0, 7.0, 8.0, 11.0, 11.0, 15.0, 19.0, 12.0, 16.0, 26.0, 17.0, 28.0, 35.0, 27.0, 32.0, 38.0, 37.0, 28.0, 42.0, 52.0, 41.0, 44.0, 38.0, 36.0, 42.0, 37.0, 31.0, 23.0, 32.0, 22.0, 39.0, 23.0, 15.0, 13.0, 29.0, 10.0, 18.0, 12.0, 8.0, 6.0, 1.0, 1.0, 3.0, 0.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.390625, -1.3467254638671875, -1.302825927734375, -1.2589263916015625, -1.21502685546875, -1.1711273193359375, -1.127227783203125, -1.0833282470703125, -1.0394287109375, -0.9955291748046875, -0.951629638671875, -0.9077301025390625, -0.86383056640625, -0.8199310302734375, -0.776031494140625, -0.7321319580078125, -0.688232421875, -0.6443328857421875, -0.600433349609375, -0.5565338134765625, -0.51263427734375, -0.4687347412109375, -0.424835205078125, -0.3809356689453125, -0.3370361328125, -0.2931365966796875, -0.249237060546875, -0.2053375244140625, -0.16143798828125, -0.1175384521484375, -0.073638916015625, -0.0297393798828125, 0.01416015625, 0.0580596923828125, 0.101959228515625, 0.1458587646484375, 0.18975830078125, 0.2336578369140625, 0.277557373046875, 0.3214569091796875, 0.3653564453125, 0.4092559814453125, 0.453155517578125, 0.4970550537109375, 0.54095458984375, 0.5848541259765625, 0.628753662109375, 0.6726531982421875, 0.716552734375, 0.7604522705078125, 0.804351806640625, 0.8482513427734375, 0.89215087890625, 0.9360504150390625, 0.979949951171875, 1.0238494873046875, 1.0677490234375, 1.1116485595703125, 1.155548095703125, 1.1994476318359375, 1.24334716796875, 1.2872467041015625, 1.331146240234375, 1.3750457763671875, 1.4189453125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 13.0, 11.0, 8.0, 16.0, 22.0, 28.0, 36.0, 61.0, 76.0, 113.0, 169.0, 218.0, 371.0, 653.0, 1205.0, 2432.0, 5175.0, 11728.0, 30867.0, 96968.0, 398566.0, 1676125.0, 1494912.0, 342220.0, 85202.0, 27298.0, 10389.0, 4456.0, 2168.0, 1146.0, 579.0, 324.0, 214.0, 138.0, 88.0, 79.0, 53.0, 41.0, 31.0, 22.0, 20.0, 8.0, 10.0, 8.0, 6.0, 4.0, 5.0, 2.0, 0.0, 2.0], "bins": [-2.66796875, -2.59375, -2.51953125, -2.4453125, -2.37109375, -2.296875, -2.22265625, -2.1484375, -2.07421875, -2.0, -1.92578125, -1.8515625, -1.77734375, -1.703125, -1.62890625, -1.5546875, -1.48046875, -1.40625, -1.33203125, -1.2578125, -1.18359375, -1.109375, -1.03515625, -0.9609375, -0.88671875, -0.8125, -0.73828125, -0.6640625, -0.58984375, -0.515625, -0.44140625, -0.3671875, -0.29296875, -0.21875, -0.14453125, -0.0703125, 0.00390625, 0.078125, 0.15234375, 0.2265625, 0.30078125, 0.375, 0.44921875, 0.5234375, 0.59765625, 0.671875, 0.74609375, 0.8203125, 0.89453125, 0.96875, 1.04296875, 1.1171875, 1.19140625, 1.265625, 1.33984375, 1.4140625, 1.48828125, 1.5625, 1.63671875, 1.7109375, 1.78515625, 1.859375, 1.93359375, 2.0078125, 2.08203125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 3.0, 4.0, 4.0, 7.0, 9.0, 3.0, 15.0, 19.0, 24.0, 13.0, 28.0, 26.0, 48.0, 54.0, 81.0, 106.0, 151.0, 180.0, 242.0, 334.0, 487.0, 508.0, 449.0, 341.0, 261.0, 164.0, 132.0, 99.0, 79.0, 61.0, 42.0, 31.0, 19.0, 17.0, 4.0, 10.0, 6.0, 6.0, 2.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.484375, -2.412109375, -2.33984375, -2.267578125, -2.1953125, -2.123046875, -2.05078125, -1.978515625, -1.90625, -1.833984375, -1.76171875, -1.689453125, -1.6171875, -1.544921875, -1.47265625, -1.400390625, -1.328125, -1.255859375, -1.18359375, -1.111328125, -1.0390625, -0.966796875, -0.89453125, -0.822265625, -0.75, -0.677734375, -0.60546875, -0.533203125, -0.4609375, -0.388671875, -0.31640625, -0.244140625, -0.171875, -0.099609375, -0.02734375, 0.044921875, 0.1171875, 0.189453125, 0.26171875, 0.333984375, 0.40625, 0.478515625, 0.55078125, 0.623046875, 0.6953125, 0.767578125, 0.83984375, 0.912109375, 0.984375, 1.056640625, 1.12890625, 1.201171875, 1.2734375, 1.345703125, 1.41796875, 1.490234375, 1.5625, 1.634765625, 1.70703125, 1.779296875, 1.8515625, 1.923828125, 1.99609375, 2.068359375, 2.140625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 9.0, 11.0, 10.0, 21.0, 27.0, 49.0, 54.0, 71.0, 120.0, 176.0, 194.0, 371.0, 1125.0, 13752.0, 816759.0, 3314229.0, 43737.0, 2070.0, 483.0, 287.0, 189.0, 129.0, 89.0, 82.0, 45.0, 30.0, 43.0, 24.0, 23.0, 12.0, 10.0, 9.0, 10.0, 7.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8203125, -9.4716796875, -9.123046875, -8.7744140625, -8.42578125, -8.0771484375, -7.728515625, -7.3798828125, -7.03125, -6.6826171875, -6.333984375, -5.9853515625, -5.63671875, -5.2880859375, -4.939453125, -4.5908203125, -4.2421875, -3.8935546875, -3.544921875, -3.1962890625, -2.84765625, -2.4990234375, -2.150390625, -1.8017578125, -1.453125, -1.1044921875, -0.755859375, -0.4072265625, -0.05859375, 0.2900390625, 0.638671875, 0.9873046875, 1.3359375, 1.6845703125, 2.033203125, 2.3818359375, 2.73046875, 3.0791015625, 3.427734375, 3.7763671875, 4.125, 4.4736328125, 4.822265625, 5.1708984375, 5.51953125, 5.8681640625, 6.216796875, 6.5654296875, 6.9140625, 7.2626953125, 7.611328125, 7.9599609375, 8.30859375, 8.6572265625, 9.005859375, 9.3544921875, 9.703125, 10.0517578125, 10.400390625, 10.7490234375, 11.09765625, 11.4462890625, 11.794921875, 12.1435546875, 12.4921875]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 15.0, 47.0, 123.0, 195.0, 254.0, 206.0, 103.0, 52.0, 14.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.896546363830566, -12.011033058166504, -11.125520706176758, -10.240007400512695, -9.354494094848633, -8.46898078918457, -7.583467960357666, -6.697955131530762, -5.812441825866699, -4.926928520202637, -4.041415691375732, -3.155902624130249, -2.2703895568847656, -1.3848762512207031, -0.49936342239379883, 0.38614940643310547, 1.271662712097168, 2.1571757793426514, 3.0426888465881348, 3.928201913833618, 4.813714981079102, 5.699228286743164, 6.584741115570068, 7.470253944396973, 8.355767250061035, 9.241280555725098, 10.126792907714844, 11.012306213378906, 11.897819519042969, 12.783332824707031, 13.668846130371094, 14.55435848236084, 15.439872741699219, 16.32538604736328, 17.210899353027344, 18.096412658691406, 18.98192596435547, 19.86743927001953, 20.75295066833496, 21.638463973999023, 22.523977279663086, 23.40949058532715, 24.29500389099121, 25.180517196655273, 26.066028594970703, 26.951541900634766, 27.837055206298828, 28.72256851196289, 29.608081817626953, 30.493595123291016, 31.379108428955078, 32.26462173461914, 33.1501350402832, 34.035648345947266, 34.92116165161133, 35.806671142578125, 36.69218444824219, 37.57769775390625, 38.46321105957031, 39.348724365234375, 40.23423767089844, 41.1197509765625, 42.00526428222656, 42.890777587890625, 43.77629089355469]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 2.0, 8.0, 2.0, 7.0, 10.0, 9.0, 7.0, 9.0, 12.0, 16.0, 13.0, 13.0, 17.0, 19.0, 24.0, 21.0, 23.0, 22.0, 28.0, 26.0, 36.0, 46.0, 33.0, 36.0, 39.0, 30.0, 55.0, 41.0, 40.0, 38.0, 30.0, 26.0, 32.0, 31.0, 34.0, 18.0, 22.0, 22.0, 12.0, 19.0, 14.0, 14.0, 9.0, 7.0, 5.0, 9.0, 4.0, 5.0, 4.0, 1.0, 1.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0], "bins": [-7.102952480316162, -6.883153438568115, -6.66335391998291, -6.443554878234863, -6.223755836486816, -6.003956317901611, -5.7841572761535645, -5.564357757568359, -5.3445587158203125, -5.124759674072266, -4.9049601554870605, -4.685161113739014, -4.465362071990967, -4.245562553405762, -4.025763511657715, -3.805964231491089, -3.586165189743042, -3.366365909576416, -3.146566867828369, -2.926767587661743, -2.706968307495117, -2.4871692657470703, -2.2673699855804443, -2.0475707054138184, -1.827771544456482, -1.6079723834991455, -1.3881731033325195, -1.168373942375183, -0.9485747218132019, -0.7287755012512207, -0.5089763402938843, -0.2891770601272583, -0.06937789916992188, 0.15042130649089813, 0.37022051215171814, 0.590019702911377, 0.8098189234733582, 1.0296181440353394, 1.2494173049926758, 1.4692165851593018, 1.6890157461166382, 1.9088149070739746, 2.1286141872406006, 2.3484134674072266, 2.5682125091552734, 2.7880117893218994, 3.0078110694885254, 3.2276101112365723, 3.4474093914031982, 3.667208671569824, 3.887007713317871, 4.106806755065918, 4.326606273651123, 4.54640531539917, 4.766204833984375, 4.986003875732422, 5.205802917480469, 5.425601959228516, 5.645401477813721, 5.865200519561768, 6.0849995613098145, 6.3047990798950195, 6.524598121643066, 6.744397163391113, 6.964196681976318]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 8.0, 10.0, 9.0, 12.0, 16.0, 9.0, 20.0, 15.0, 25.0, 23.0, 32.0, 30.0, 35.0, 38.0, 28.0, 33.0, 52.0, 41.0, 45.0, 41.0, 40.0, 45.0, 36.0, 37.0, 28.0, 41.0, 28.0, 34.0, 26.0, 34.0, 22.0, 18.0, 24.0, 11.0, 12.0, 10.0, 10.0, 6.0, 4.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2412109375, -1.1973114013671875, -1.153411865234375, -1.1095123291015625, -1.06561279296875, -1.0217132568359375, -0.977813720703125, -0.9339141845703125, -0.8900146484375, -0.8461151123046875, -0.802215576171875, -0.7583160400390625, -0.71441650390625, -0.6705169677734375, -0.626617431640625, -0.5827178955078125, -0.538818359375, -0.4949188232421875, -0.451019287109375, -0.4071197509765625, -0.36322021484375, -0.3193206787109375, -0.275421142578125, -0.2315216064453125, -0.1876220703125, -0.1437225341796875, -0.099822998046875, -0.0559234619140625, -0.01202392578125, 0.0318756103515625, 0.075775146484375, 0.1196746826171875, 0.16357421875, 0.2074737548828125, 0.251373291015625, 0.2952728271484375, 0.33917236328125, 0.3830718994140625, 0.426971435546875, 0.4708709716796875, 0.5147705078125, 0.5586700439453125, 0.602569580078125, 0.6464691162109375, 0.69036865234375, 0.7342681884765625, 0.778167724609375, 0.8220672607421875, 0.865966796875, 0.9098663330078125, 0.953765869140625, 0.9976654052734375, 1.04156494140625, 1.0854644775390625, 1.129364013671875, 1.1732635498046875, 1.2171630859375, 1.2610626220703125, 1.304962158203125, 1.3488616943359375, 1.39276123046875, 1.4366607666015625, 1.480560302734375, 1.5244598388671875, 1.568359375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 3.0, 3.0, 1.0, 13.0, 10.0, 17.0, 29.0, 36.0, 36.0, 72.0, 77.0, 107.0, 142.0, 183.0, 284.0, 368.0, 550.0, 724.0, 1143.0, 1835.0, 2992.0, 5520.0, 13713.0, 46557.0, 187294.0, 442114.0, 247032.0, 63729.0, 17600.0, 6727.0, 3453.0, 1982.0, 1209.0, 868.0, 630.0, 416.0, 282.0, 200.0, 181.0, 121.0, 67.0, 72.0, 69.0, 31.0, 25.0, 10.0, 10.0, 5.0, 11.0, 2.0, 3.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.489501953125, -0.4740180969238281, -0.45853424072265625, -0.4430503845214844, -0.4275665283203125, -0.4120826721191406, -0.39659881591796875, -0.3811149597167969, -0.365631103515625, -0.3501472473144531, -0.33466339111328125, -0.3191795349121094, -0.3036956787109375, -0.2882118225097656, -0.27272796630859375, -0.2572441101074219, -0.24176025390625, -0.22627639770507812, -0.21079254150390625, -0.19530868530273438, -0.1798248291015625, -0.16434097290039062, -0.14885711669921875, -0.13337326049804688, -0.117889404296875, -0.10240554809570312, -0.08692169189453125, -0.07143783569335938, -0.0559539794921875, -0.040470123291015625, -0.02498626708984375, -0.009502410888671875, 0.0059814453125, 0.021465301513671875, 0.03694915771484375, 0.052433013916015625, 0.0679168701171875, 0.08340072631835938, 0.09888458251953125, 0.11436843872070312, 0.129852294921875, 0.14533615112304688, 0.16082000732421875, 0.17630386352539062, 0.1917877197265625, 0.20727157592773438, 0.22275543212890625, 0.23823928833007812, 0.25372314453125, 0.2692070007324219, 0.28469085693359375, 0.3001747131347656, 0.3156585693359375, 0.3311424255371094, 0.34662628173828125, 0.3621101379394531, 0.377593994140625, 0.3930778503417969, 0.40856170654296875, 0.4240455627441406, 0.4395294189453125, 0.4550132751464844, 0.47049713134765625, 0.4859809875488281, 0.50146484375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 7.0, 2.0, 7.0, 8.0, 7.0, 11.0, 11.0, 9.0, 14.0, 12.0, 3.0, 16.0, 23.0, 19.0, 17.0, 24.0, 26.0, 34.0, 37.0, 41.0, 34.0, 34.0, 39.0, 24.0, 45.0, 1059.0, 27.0, 33.0, 27.0, 39.0, 33.0, 39.0, 25.0, 22.0, 28.0, 32.0, 24.0, 14.0, 13.0, 16.0, 14.0, 16.0, 13.0, 12.0, 13.0, 4.0, 6.0, 5.0, 7.0, 8.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.7470703125, -0.7225112915039062, -0.6979522705078125, -0.6733932495117188, -0.648834228515625, -0.6242752075195312, -0.5997161865234375, -0.5751571655273438, -0.55059814453125, -0.5260391235351562, -0.5014801025390625, -0.47692108154296875, -0.452362060546875, -0.42780303955078125, -0.4032440185546875, -0.37868499755859375, -0.3541259765625, -0.32956695556640625, -0.3050079345703125, -0.28044891357421875, -0.255889892578125, -0.23133087158203125, -0.2067718505859375, -0.18221282958984375, -0.15765380859375, -0.13309478759765625, -0.1085357666015625, -0.08397674560546875, -0.059417724609375, -0.03485870361328125, -0.0102996826171875, 0.01425933837890625, 0.038818359375, 0.06337738037109375, 0.0879364013671875, 0.11249542236328125, 0.137054443359375, 0.16161346435546875, 0.1861724853515625, 0.21073150634765625, 0.23529052734375, 0.25984954833984375, 0.2844085693359375, 0.30896759033203125, 0.333526611328125, 0.35808563232421875, 0.3826446533203125, 0.40720367431640625, 0.4317626953125, 0.45632171630859375, 0.4808807373046875, 0.5054397583007812, 0.529998779296875, 0.5545578002929688, 0.5791168212890625, 0.6036758422851562, 0.62823486328125, 0.6527938842773438, 0.6773529052734375, 0.7019119262695312, 0.726470947265625, 0.7510299682617188, 0.7755889892578125, 0.8001480102539062, 0.82470703125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 3.0, 7.0, 6.0, 12.0, 15.0, 30.0, 22.0, 24.0, 34.0, 57.0, 92.0, 92.0, 156.0, 201.0, 249.0, 377.0, 604.0, 796.0, 1165.0, 1976.0, 3600.0, 8596.0, 28891.0, 136860.0, 1379349.0, 427710.0, 74638.0, 17640.0, 6093.0, 2883.0, 1636.0, 944.0, 682.0, 418.0, 352.0, 210.0, 169.0, 139.0, 111.0, 72.0, 72.0, 35.0, 30.0, 22.0, 19.0, 14.0, 14.0, 6.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.383544921875, -0.371856689453125, -0.36016845703125, -0.348480224609375, -0.3367919921875, -0.325103759765625, -0.31341552734375, -0.301727294921875, -0.2900390625, -0.278350830078125, -0.26666259765625, -0.254974365234375, -0.2432861328125, -0.231597900390625, -0.21990966796875, -0.208221435546875, -0.196533203125, -0.184844970703125, -0.17315673828125, -0.161468505859375, -0.1497802734375, -0.138092041015625, -0.12640380859375, -0.114715576171875, -0.10302734375, -0.091339111328125, -0.07965087890625, -0.067962646484375, -0.0562744140625, -0.044586181640625, -0.03289794921875, -0.021209716796875, -0.009521484375, 0.002166748046875, 0.01385498046875, 0.025543212890625, 0.0372314453125, 0.048919677734375, 0.06060791015625, 0.072296142578125, 0.083984375, 0.095672607421875, 0.10736083984375, 0.119049072265625, 0.1307373046875, 0.142425537109375, 0.15411376953125, 0.165802001953125, 0.177490234375, 0.189178466796875, 0.20086669921875, 0.212554931640625, 0.2242431640625, 0.235931396484375, 0.24761962890625, 0.259307861328125, 0.27099609375, 0.282684326171875, 0.29437255859375, 0.306060791015625, 0.3177490234375, 0.329437255859375, 0.34112548828125, 0.352813720703125, 0.364501953125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 7.0, 10.0, 12.0, 19.0, 33.0, 51.0, 71.0, 122.0, 200.0, 161.0, 105.0, 55.0, 38.0, 26.0, 17.0, 15.0, 13.0, 7.0, 4.0, 8.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06927490234375, -0.06710052490234375, -0.0649261474609375, -0.06275177001953125, -0.060577392578125, -0.05840301513671875, -0.0562286376953125, -0.05405426025390625, -0.0518798828125, -0.04970550537109375, -0.0475311279296875, -0.04535675048828125, -0.043182373046875, -0.04100799560546875, -0.0388336181640625, -0.03665924072265625, -0.03448486328125, -0.03231048583984375, -0.0301361083984375, -0.02796173095703125, -0.025787353515625, -0.02361297607421875, -0.0214385986328125, -0.01926422119140625, -0.01708984375, -0.01491546630859375, -0.0127410888671875, -0.01056671142578125, -0.008392333984375, -0.00621795654296875, -0.0040435791015625, -0.00186920166015625, 0.00030517578125, 0.00247955322265625, 0.0046539306640625, 0.00682830810546875, 0.009002685546875, 0.01117706298828125, 0.0133514404296875, 0.01552581787109375, 0.0177001953125, 0.01987457275390625, 0.0220489501953125, 0.02422332763671875, 0.026397705078125, 0.02857208251953125, 0.0307464599609375, 0.03292083740234375, 0.03509521484375, 0.03726959228515625, 0.0394439697265625, 0.04161834716796875, 0.043792724609375, 0.04596710205078125, 0.0481414794921875, 0.05031585693359375, 0.052490234375, 0.05466461181640625, 0.0568389892578125, 0.05901336669921875, 0.061187744140625, 0.06336212158203125, 0.0655364990234375, 0.06771087646484375, 0.06988525390625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 5.0, 7.0, 7.0, 17.0, 13.0, 18.0, 26.0, 32.0, 47.0, 67.0, 219.0, 1565.0, 106777.0, 936933.0, 2253.0, 275.0, 101.0, 43.0, 41.0, 33.0, 13.0, 10.0, 12.0, 7.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.435546875, -1.3907928466796875, -1.346038818359375, -1.3012847900390625, -1.25653076171875, -1.2117767333984375, -1.167022705078125, -1.1222686767578125, -1.0775146484375, -1.0327606201171875, -0.988006591796875, -0.9432525634765625, -0.89849853515625, -0.8537445068359375, -0.808990478515625, -0.7642364501953125, -0.719482421875, -0.6747283935546875, -0.629974365234375, -0.5852203369140625, -0.54046630859375, -0.4957122802734375, -0.450958251953125, -0.4062042236328125, -0.3614501953125, -0.3166961669921875, -0.271942138671875, -0.2271881103515625, -0.18243408203125, -0.1376800537109375, -0.092926025390625, -0.0481719970703125, -0.00341796875, 0.0413360595703125, 0.086090087890625, 0.1308441162109375, 0.17559814453125, 0.2203521728515625, 0.265106201171875, 0.3098602294921875, 0.3546142578125, 0.3993682861328125, 0.444122314453125, 0.4888763427734375, 0.53363037109375, 0.5783843994140625, 0.623138427734375, 0.6678924560546875, 0.712646484375, 0.7574005126953125, 0.802154541015625, 0.8469085693359375, 0.89166259765625, 0.9364166259765625, 0.981170654296875, 1.0259246826171875, 1.0706787109375, 1.1154327392578125, 1.160186767578125, 1.2049407958984375, 1.24969482421875, 1.2944488525390625, 1.339202880859375, 1.3839569091796875, 1.4287109375]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 10.0, 18.0, 76.0, 491.0, 362.0, 46.0, 8.0, 7.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11667288094758987, -0.09980170428752899, -0.08293052017688751, -0.06605933606624603, -0.04918815940618515, -0.03231697529554367, -0.015445798635482788, 0.0014253780245780945, 0.018296562135219574, 0.035167742520570755, 0.052038922905921936, 0.06891010701656342, 0.0857812836766243, 0.10265246778726578, 0.11952364444732666, 0.13639482855796814, 0.15326601266860962, 0.1701371967792511, 0.18700838088989258, 0.20387955009937286, 0.22075073421001434, 0.23762191832065582, 0.2544930875301361, 0.2713642716407776, 0.28823545575141907, 0.30510663986206055, 0.321977823972702, 0.3388490080833435, 0.3557201623916626, 0.37259137630462646, 0.38946253061294556, 0.40633371472358704, 0.4232048988342285, 0.44007608294487, 0.4569472670555115, 0.47381845116615295, 0.49068963527679443, 0.5075607895851135, 0.5244320034980774, 0.5413031578063965, 0.5581743717193604, 0.5750455260276794, 0.5919167399406433, 0.6087878942489624, 0.6256591081619263, 0.6425302624702454, 0.6594014763832092, 0.6762726306915283, 0.6931437849998474, 0.7100149393081665, 0.7268861532211304, 0.7437573075294495, 0.7606285214424133, 0.7774996757507324, 0.7943708896636963, 0.8112420439720154, 0.8281131982803345, 0.8449843525886536, 0.8618555665016174, 0.8787267208099365, 0.8955979347229004, 0.9124690890312195, 0.9293403029441833, 0.9462114572525024, 0.9630826711654663]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 7.0, 6.0, 8.0, 3.0, 10.0, 13.0, 21.0, 12.0, 18.0, 19.0, 21.0, 22.0, 29.0, 23.0, 40.0, 48.0, 32.0, 45.0, 37.0, 43.0, 34.0, 48.0, 45.0, 34.0, 34.0, 26.0, 27.0, 29.0, 40.0, 28.0, 29.0, 19.0, 33.0, 15.0, 11.0, 17.0, 18.0, 9.0, 12.0, 10.0, 3.0, 7.0, 5.0, 7.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.08404541015625, -0.08136726170778275, -0.0786891058087349, -0.07601095736026764, -0.07333280146121979, -0.07065465301275253, -0.06797650456428528, -0.06529834866523743, -0.06262020021677017, -0.05994204804301262, -0.057263895869255066, -0.05458574742078781, -0.05190759524703026, -0.049229443073272705, -0.04655129462480545, -0.0438731424510479, -0.041194990277290344, -0.03851683810353279, -0.03583868592977524, -0.03316053748130798, -0.03048238530755043, -0.027804233133792877, -0.025126082822680473, -0.02244793251156807, -0.019769780337810516, -0.017091628164052963, -0.01441347785294056, -0.011735326610505581, -0.009057175368070602, -0.006379024125635624, -0.0037008728832006454, -0.0010227225720882416, 0.0016554296016693115, 0.00433358084410429, 0.0070117320865392685, 0.009689883328974247, 0.012368034571409225, 0.015046185813844204, 0.017724337056279182, 0.020402487367391586, 0.02308063954114914, 0.025758791714906693, 0.028436942026019096, 0.0311150923371315, 0.03379324451088905, 0.036471396684646606, 0.03914954513311386, 0.041827697306871414, 0.04450584948062897, 0.04718400165438652, 0.049862153828144073, 0.05254030227661133, 0.05521845445036888, 0.057896606624126434, 0.06057475507259369, 0.06325291097164154, 0.0659310594201088, 0.06860920786857605, 0.0712873637676239, 0.07396551221609116, 0.07664366066455841, 0.07932181656360626, 0.08199996501207352, 0.08467811346054077, 0.08735626935958862]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 8.0, 8.0, 9.0, 12.0, 15.0, 11.0, 15.0, 17.0, 26.0, 26.0, 27.0, 30.0, 35.0, 41.0, 26.0, 33.0, 49.0, 42.0, 43.0, 45.0, 36.0, 49.0, 37.0, 36.0, 29.0, 41.0, 31.0, 31.0, 28.0, 32.0, 22.0, 16.0, 28.0, 11.0, 11.0, 10.0, 11.0, 7.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2470703125, -1.203125, -1.1591796875, -1.115234375, -1.0712890625, -1.02734375, -0.9833984375, -0.939453125, -0.8955078125, -0.8515625, -0.8076171875, -0.763671875, -0.7197265625, -0.67578125, -0.6318359375, -0.587890625, -0.5439453125, -0.5, -0.4560546875, -0.412109375, -0.3681640625, -0.32421875, -0.2802734375, -0.236328125, -0.1923828125, -0.1484375, -0.1044921875, -0.060546875, -0.0166015625, 0.02734375, 0.0712890625, 0.115234375, 0.1591796875, 0.203125, 0.2470703125, 0.291015625, 0.3349609375, 0.37890625, 0.4228515625, 0.466796875, 0.5107421875, 0.5546875, 0.5986328125, 0.642578125, 0.6865234375, 0.73046875, 0.7744140625, 0.818359375, 0.8623046875, 0.90625, 0.9501953125, 0.994140625, 1.0380859375, 1.08203125, 1.1259765625, 1.169921875, 1.2138671875, 1.2578125, 1.3017578125, 1.345703125, 1.3896484375, 1.43359375, 1.4775390625, 1.521484375, 1.5654296875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 8.0, 8.0, 12.0, 9.0, 18.0, 18.0, 21.0, 36.0, 47.0, 81.0, 126.0, 277.0, 552.0, 1244.0, 2904.0, 7543.0, 20358.0, 55101.0, 164337.0, 478322.0, 208790.0, 68565.0, 24769.0, 9009.0, 3513.0, 1466.0, 667.0, 299.0, 169.0, 75.0, 46.0, 41.0, 31.0, 20.0, 19.0, 12.0, 10.0, 5.0, 7.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1875, -2.108245849609375, -2.02899169921875, -1.949737548828125, -1.8704833984375, -1.791229248046875, -1.71197509765625, -1.632720947265625, -1.553466796875, -1.474212646484375, -1.39495849609375, -1.315704345703125, -1.2364501953125, -1.157196044921875, -1.07794189453125, -0.998687744140625, -0.91943359375, -0.840179443359375, -0.76092529296875, -0.681671142578125, -0.6024169921875, -0.523162841796875, -0.44390869140625, -0.364654541015625, -0.285400390625, -0.206146240234375, -0.12689208984375, -0.047637939453125, 0.0316162109375, 0.110870361328125, 0.19012451171875, 0.269378662109375, 0.3486328125, 0.427886962890625, 0.50714111328125, 0.586395263671875, 0.6656494140625, 0.744903564453125, 0.82415771484375, 0.903411865234375, 0.982666015625, 1.061920166015625, 1.14117431640625, 1.220428466796875, 1.2996826171875, 1.378936767578125, 1.45819091796875, 1.537445068359375, 1.61669921875, 1.695953369140625, 1.77520751953125, 1.854461669921875, 1.9337158203125, 2.012969970703125, 2.09222412109375, 2.171478271484375, 2.250732421875, 2.329986572265625, 2.40924072265625, 2.488494873046875, 2.5677490234375, 2.647003173828125, 2.72625732421875, 2.805511474609375, 2.884765625]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 3.0, 9.0, 13.0, 11.0, 17.0, 18.0, 30.0, 27.0, 28.0, 42.0, 56.0, 49.0, 70.0, 86.0, 177.0, 328.0, 1415.0, 168.0, 113.0, 71.0, 44.0, 41.0, 48.0, 32.0, 31.0, 30.0, 13.0, 25.0, 13.0, 13.0, 9.0, 3.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9375, -4.7879638671875, -4.638427734375, -4.4888916015625, -4.33935546875, -4.1898193359375, -4.040283203125, -3.8907470703125, -3.7412109375, -3.5916748046875, -3.442138671875, -3.2926025390625, -3.14306640625, -2.9935302734375, -2.843994140625, -2.6944580078125, -2.544921875, -2.3953857421875, -2.245849609375, -2.0963134765625, -1.94677734375, -1.7972412109375, -1.647705078125, -1.4981689453125, -1.3486328125, -1.1990966796875, -1.049560546875, -0.9000244140625, -0.75048828125, -0.6009521484375, -0.451416015625, -0.3018798828125, -0.15234375, -0.0028076171875, 0.146728515625, 0.2962646484375, 0.44580078125, 0.5953369140625, 0.744873046875, 0.8944091796875, 1.0439453125, 1.1934814453125, 1.343017578125, 1.4925537109375, 1.64208984375, 1.7916259765625, 1.941162109375, 2.0906982421875, 2.240234375, 2.3897705078125, 2.539306640625, 2.6888427734375, 2.83837890625, 2.9879150390625, 3.137451171875, 3.2869873046875, 3.4365234375, 3.5860595703125, 3.735595703125, 3.8851318359375, 4.03466796875, 4.1842041015625, 4.333740234375, 4.4832763671875, 4.6328125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 7.0, 2.0, 5.0, 9.0, 10.0, 16.0, 30.0, 23.0, 43.0, 56.0, 82.0, 107.0, 167.0, 242.0, 488.0, 1384.0, 15146.0, 1999096.0, 1115507.0, 10865.0, 1231.0, 414.0, 238.0, 167.0, 110.0, 73.0, 60.0, 40.0, 23.0, 15.0, 17.0, 11.0, 7.0, 8.0, 7.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4765625, -10.1380615234375, -9.799560546875, -9.4610595703125, -9.12255859375, -8.7840576171875, -8.445556640625, -8.1070556640625, -7.7685546875, -7.4300537109375, -7.091552734375, -6.7530517578125, -6.41455078125, -6.0760498046875, -5.737548828125, -5.3990478515625, -5.060546875, -4.7220458984375, -4.383544921875, -4.0450439453125, -3.70654296875, -3.3680419921875, -3.029541015625, -2.6910400390625, -2.3525390625, -2.0140380859375, -1.675537109375, -1.3370361328125, -0.99853515625, -0.6600341796875, -0.321533203125, 0.0169677734375, 0.35546875, 0.6939697265625, 1.032470703125, 1.3709716796875, 1.70947265625, 2.0479736328125, 2.386474609375, 2.7249755859375, 3.0634765625, 3.4019775390625, 3.740478515625, 4.0789794921875, 4.41748046875, 4.7559814453125, 5.094482421875, 5.4329833984375, 5.771484375, 6.1099853515625, 6.448486328125, 6.7869873046875, 7.12548828125, 7.4639892578125, 7.802490234375, 8.1409912109375, 8.4794921875, 8.8179931640625, 9.156494140625, 9.4949951171875, 9.83349609375, 10.1719970703125, 10.510498046875, 10.8489990234375, 11.1875]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 36.0, 309.0, 481.0, 176.0, 12.0, 1.0, 0.0, 0.0, 1.0], "bins": [-67.914794921875, -66.73052215576172, -65.54624938964844, -64.36198425292969, -63.17770767211914, -61.993438720703125, -60.809165954589844, -59.62489318847656, -58.44062423706055, -57.256351470947266, -56.07208251953125, -54.88780975341797, -53.70353698730469, -52.51926803588867, -51.33499526977539, -50.150726318359375, -48.966453552246094, -47.78218078613281, -46.5979118347168, -45.413639068603516, -44.229366302490234, -43.04509735107422, -41.86082458496094, -40.676551818847656, -39.492279052734375, -38.308006286621094, -37.12373733520508, -35.9394645690918, -34.755191802978516, -33.5709228515625, -32.38665008544922, -31.20237922668457, -30.018112182617188, -28.83384132385254, -27.649568557739258, -26.46529769897461, -25.28102684020996, -24.096755981445312, -22.91248321533203, -21.728212356567383, -20.5439395904541, -19.359668731689453, -18.175395965576172, -16.991125106811523, -15.806854248046875, -14.62258243560791, -13.438310623168945, -12.254039764404297, -11.069768905639648, -9.885497093200684, -8.701226234436035, -7.51695442199707, -6.332683086395264, -5.148411750793457, -3.964139938354492, -2.7798690795898438, -1.5955967903137207, -0.4113253355026245, 0.7729461193084717, 1.9572176933288574, 3.141489028930664, 4.325760364532471, 5.5100321769714355, 6.694303035736084, 7.878574848175049]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 3.0, 8.0, 7.0, 13.0, 14.0, 12.0, 22.0, 8.0, 14.0, 16.0, 33.0, 19.0, 39.0, 31.0, 41.0, 33.0, 42.0, 44.0, 39.0, 47.0, 42.0, 41.0, 42.0, 36.0, 43.0, 31.0, 29.0, 26.0, 41.0, 29.0, 23.0, 19.0, 15.0, 24.0, 15.0, 14.0, 11.0, 6.0, 5.0, 9.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-11.2998046875, -10.942829132080078, -10.585854530334473, -10.22887897491455, -9.871904373168945, -9.514928817749023, -9.157953262329102, -8.800978660583496, -8.444003105163574, -8.087027549743652, -7.730052947998047, -7.373077392578125, -7.016102313995361, -6.659127235412598, -6.302152156829834, -5.94517707824707, -5.588201999664307, -5.231226921081543, -4.874251842498779, -4.517276763916016, -4.160301208496094, -3.80332612991333, -3.4463510513305664, -3.0893757343292236, -2.73240065574646, -2.3754255771636963, -2.0184502601623535, -1.6614751815795898, -1.3044999837875366, -0.9475247859954834, -0.5905497074127197, -0.23357439041137695, 0.12340068817138672, 0.48037585616111755, 0.8373510241508484, 1.1943261623382568, 1.55130136013031, 1.9082765579223633, 2.265251636505127, 2.6222269535064697, 2.9792020320892334, 3.336177110671997, 3.69315242767334, 4.0501275062561035, 4.407102584838867, 4.764078140258789, 5.1210527420043945, 5.478028297424316, 5.83500337600708, 6.191978454589844, 6.548953533172607, 6.905928611755371, 7.262904167175293, 7.619879245758057, 7.97685432434082, 8.333829879760742, 8.690804481506348, 9.04778003692627, 9.404754638671875, 9.761730194091797, 10.118704795837402, 10.475680351257324, 10.83265495300293, 11.189630508422852, 11.546606063842773]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 5.0, 4.0, 8.0, 11.0, 15.0, 12.0, 14.0, 17.0, 14.0, 19.0, 20.0, 20.0, 22.0, 38.0, 26.0, 27.0, 32.0, 32.0, 37.0, 44.0, 40.0, 36.0, 36.0, 41.0, 34.0, 34.0, 30.0, 31.0, 29.0, 32.0, 35.0, 35.0, 23.0, 23.0, 21.0, 16.0, 18.0, 16.0, 9.0, 13.0, 3.0, 9.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.2734375, -1.23101806640625, -1.1885986328125, -1.14617919921875, -1.103759765625, -1.06134033203125, -1.0189208984375, -0.97650146484375, -0.93408203125, -0.89166259765625, -0.8492431640625, -0.80682373046875, -0.764404296875, -0.72198486328125, -0.6795654296875, -0.63714599609375, -0.5947265625, -0.55230712890625, -0.5098876953125, -0.46746826171875, -0.425048828125, -0.38262939453125, -0.3402099609375, -0.29779052734375, -0.25537109375, -0.21295166015625, -0.1705322265625, -0.12811279296875, -0.085693359375, -0.04327392578125, -0.0008544921875, 0.04156494140625, 0.083984375, 0.12640380859375, 0.1688232421875, 0.21124267578125, 0.253662109375, 0.29608154296875, 0.3385009765625, 0.38092041015625, 0.42333984375, 0.46575927734375, 0.5081787109375, 0.55059814453125, 0.593017578125, 0.63543701171875, 0.6778564453125, 0.72027587890625, 0.7626953125, 0.80511474609375, 0.8475341796875, 0.88995361328125, 0.932373046875, 0.97479248046875, 1.0172119140625, 1.05963134765625, 1.10205078125, 1.14447021484375, 1.1868896484375, 1.22930908203125, 1.271728515625, 1.31414794921875, 1.3565673828125, 1.39898681640625, 1.44140625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 6.0, 5.0, 8.0, 6.0, 13.0, 13.0, 14.0, 24.0, 24.0, 40.0, 47.0, 90.0, 117.0, 180.0, 277.0, 440.0, 676.0, 1276.0, 2444.0, 4897.0, 10753.0, 25685.0, 66839.0, 197201.0, 634505.0, 1557829.0, 1126169.0, 373447.0, 118546.0, 41874.0, 16229.0, 7115.0, 3355.0, 1709.0, 890.0, 541.0, 348.0, 228.0, 137.0, 97.0, 58.0, 40.0, 28.0, 13.0, 16.0, 13.0, 10.0, 8.0, 5.0, 5.0, 5.0, 0.0, 2.0, 2.0, 1.0], "bins": [-2.287109375, -2.2213287353515625, -2.155548095703125, -2.0897674560546875, -2.02398681640625, -1.9582061767578125, -1.892425537109375, -1.8266448974609375, -1.7608642578125, -1.6950836181640625, -1.629302978515625, -1.5635223388671875, -1.49774169921875, -1.4319610595703125, -1.366180419921875, -1.3003997802734375, -1.234619140625, -1.1688385009765625, -1.103057861328125, -1.0372772216796875, -0.97149658203125, -0.9057159423828125, -0.839935302734375, -0.7741546630859375, -0.7083740234375, -0.6425933837890625, -0.576812744140625, -0.5110321044921875, -0.44525146484375, -0.3794708251953125, -0.313690185546875, -0.2479095458984375, -0.18212890625, -0.1163482666015625, -0.050567626953125, 0.0152130126953125, 0.08099365234375, 0.1467742919921875, 0.212554931640625, 0.2783355712890625, 0.3441162109375, 0.4098968505859375, 0.475677490234375, 0.5414581298828125, 0.60723876953125, 0.6730194091796875, 0.738800048828125, 0.8045806884765625, 0.870361328125, 0.9361419677734375, 1.001922607421875, 1.0677032470703125, 1.13348388671875, 1.1992645263671875, 1.265045166015625, 1.3308258056640625, 1.3966064453125, 1.4623870849609375, 1.528167724609375, 1.5939483642578125, 1.65972900390625, 1.7255096435546875, 1.791290283203125, 1.8570709228515625, 1.9228515625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 9.0, 11.0, 6.0, 4.0, 11.0, 19.0, 22.0, 22.0, 31.0, 39.0, 53.0, 73.0, 91.0, 88.0, 146.0, 169.0, 202.0, 285.0, 341.0, 379.0, 375.0, 346.0, 293.0, 229.0, 188.0, 139.0, 108.0, 93.0, 55.0, 56.0, 36.0, 40.0, 26.0, 20.0, 18.0, 15.0, 8.0, 6.0, 5.0, 6.0, 2.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-2.119140625, -2.051177978515625, -1.98321533203125, -1.915252685546875, -1.8472900390625, -1.779327392578125, -1.71136474609375, -1.643402099609375, -1.575439453125, -1.507476806640625, -1.43951416015625, -1.371551513671875, -1.3035888671875, -1.235626220703125, -1.16766357421875, -1.099700927734375, -1.03173828125, -0.963775634765625, -0.89581298828125, -0.827850341796875, -0.7598876953125, -0.691925048828125, -0.62396240234375, -0.555999755859375, -0.488037109375, -0.420074462890625, -0.35211181640625, -0.284149169921875, -0.2161865234375, -0.148223876953125, -0.08026123046875, -0.012298583984375, 0.0556640625, 0.123626708984375, 0.19158935546875, 0.259552001953125, 0.3275146484375, 0.395477294921875, 0.46343994140625, 0.531402587890625, 0.599365234375, 0.667327880859375, 0.73529052734375, 0.803253173828125, 0.8712158203125, 0.939178466796875, 1.00714111328125, 1.075103759765625, 1.14306640625, 1.211029052734375, 1.27899169921875, 1.346954345703125, 1.4149169921875, 1.482879638671875, 1.55084228515625, 1.618804931640625, 1.686767578125, 1.754730224609375, 1.82269287109375, 1.890655517578125, 1.9586181640625, 2.026580810546875, 2.09454345703125, 2.162506103515625, 2.23046875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 4.0, 5.0, 7.0, 17.0, 19.0, 17.0, 24.0, 37.0, 40.0, 70.0, 102.0, 109.0, 157.0, 214.0, 350.0, 572.0, 1132.0, 4574.0, 37786.0, 700252.0, 3223757.0, 204959.0, 15197.0, 2463.0, 815.0, 442.0, 283.0, 228.0, 165.0, 113.0, 100.0, 57.0, 47.0, 37.0, 36.0, 28.0, 12.0, 11.0, 6.0, 10.0, 9.0, 7.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.765625, -7.532470703125, -7.29931640625, -7.066162109375, -6.8330078125, -6.599853515625, -6.36669921875, -6.133544921875, -5.900390625, -5.667236328125, -5.43408203125, -5.200927734375, -4.9677734375, -4.734619140625, -4.50146484375, -4.268310546875, -4.03515625, -3.802001953125, -3.56884765625, -3.335693359375, -3.1025390625, -2.869384765625, -2.63623046875, -2.403076171875, -2.169921875, -1.936767578125, -1.70361328125, -1.470458984375, -1.2373046875, -1.004150390625, -0.77099609375, -0.537841796875, -0.3046875, -0.071533203125, 0.16162109375, 0.394775390625, 0.6279296875, 0.861083984375, 1.09423828125, 1.327392578125, 1.560546875, 1.793701171875, 2.02685546875, 2.260009765625, 2.4931640625, 2.726318359375, 2.95947265625, 3.192626953125, 3.42578125, 3.658935546875, 3.89208984375, 4.125244140625, 4.3583984375, 4.591552734375, 4.82470703125, 5.057861328125, 5.291015625, 5.524169921875, 5.75732421875, 5.990478515625, 6.2236328125, 6.456787109375, 6.68994140625, 6.923095703125, 7.15625]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 19.0, 35.0, 83.0, 129.0, 198.0, 166.0, 155.0, 119.0, 51.0, 26.0, 18.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.426438331604004, -13.716657638549805, -13.006875991821289, -12.29709529876709, -11.58731460571289, -10.877532958984375, -10.167752265930176, -9.457971572875977, -8.748189926147461, -8.038409233093262, -7.328628063201904, -6.618846893310547, -5.909066200256348, -5.19928503036499, -4.489503860473633, -3.7797231674194336, -3.0699424743652344, -2.360161542892456, -1.6503804922103882, -0.9405994415283203, -0.230818510055542, 0.47896242141723633, 1.1887435913085938, 1.898524284362793, 2.6083054542541504, 3.3180863857269287, 4.027867317199707, 4.7376484870910645, 5.447429656982422, 6.157210350036621, 6.8669915199279785, 7.576772212982178, 8.286554336547852, 8.99633502960205, 9.706116676330566, 10.415897369384766, 11.125678062438965, 11.835458755493164, 12.54524040222168, 13.255021095275879, 13.964801788330078, 14.674582481384277, 15.384364128112793, 16.094144821166992, 16.803926467895508, 17.51370620727539, 18.223487854003906, 18.933269500732422, 19.643051147460938, 20.352832794189453, 21.062612533569336, 21.77239418029785, 22.482175827026367, 23.19195556640625, 23.901737213134766, 24.61151885986328, 25.321298599243164, 26.03108024597168, 26.740859985351562, 27.450641632080078, 28.160423278808594, 28.870203018188477, 29.579984664916992, 30.289764404296875, 30.99954605102539]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 7.0, 6.0, 5.0, 3.0, 14.0, 10.0, 10.0, 13.0, 16.0, 15.0, 21.0, 25.0, 23.0, 24.0, 27.0, 43.0, 37.0, 36.0, 40.0, 40.0, 38.0, 41.0, 41.0, 29.0, 28.0, 33.0, 42.0, 43.0, 32.0, 36.0, 30.0, 24.0, 28.0, 20.0, 13.0, 20.0, 15.0, 9.0, 12.0, 15.0, 6.0, 4.0, 4.0, 5.0, 8.0, 2.0, 3.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.796864032745361, -7.5414628982543945, -7.286061763763428, -7.030660629272461, -6.775259971618652, -6.519858360290527, -6.264457702636719, -6.009056568145752, -5.753655433654785, -5.498254299163818, -5.242853164672852, -4.987452030181885, -4.732050895690918, -4.476650238037109, -4.221249103546143, -3.965847969055176, -3.710446834564209, -3.455045700073242, -3.1996445655822754, -2.9442436695098877, -2.688842535018921, -2.433441400527954, -2.1780405044555664, -1.9226393699645996, -1.6672382354736328, -1.411837100982666, -1.1564360857009888, -0.9010350108146667, -0.6456339359283447, -0.39023280143737793, -0.13483178615570068, 0.12056922912597656, 0.37596988677978516, 0.6313709616661072, 0.8867720365524292, 1.1421730518341064, 1.3975741863250732, 1.65297532081604, 1.9083763360977173, 2.1637773513793945, 2.4191784858703613, 2.674579620361328, 2.929980754852295, 3.1853816509246826, 3.4407827854156494, 3.696183919906616, 3.951584815979004, 4.206985950469971, 4.4623870849609375, 4.717788219451904, 4.973189353942871, 5.228590488433838, 5.483991622924805, 5.739392280578613, 5.99479341506958, 6.250194549560547, 6.505595684051514, 6.7609968185424805, 7.016397953033447, 7.271799087524414, 7.527199745178223, 7.782601356506348, 8.038002014160156, 8.293403625488281, 8.54880428314209]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 6.0, 6.0, 10.0, 18.0, 5.0, 16.0, 15.0, 16.0, 16.0, 18.0, 30.0, 23.0, 23.0, 25.0, 31.0, 32.0, 33.0, 47.0, 44.0, 36.0, 44.0, 43.0, 47.0, 41.0, 29.0, 33.0, 40.0, 38.0, 37.0, 31.0, 34.0, 24.0, 19.0, 16.0, 16.0, 10.0, 11.0, 8.0, 6.0, 3.0, 8.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.28125, -1.2381744384765625, -1.195098876953125, -1.1520233154296875, -1.10894775390625, -1.0658721923828125, -1.022796630859375, -0.9797210693359375, -0.9366455078125, -0.8935699462890625, -0.850494384765625, -0.8074188232421875, -0.76434326171875, -0.7212677001953125, -0.678192138671875, -0.6351165771484375, -0.592041015625, -0.5489654541015625, -0.505889892578125, -0.4628143310546875, -0.41973876953125, -0.3766632080078125, -0.333587646484375, -0.2905120849609375, -0.2474365234375, -0.2043609619140625, -0.161285400390625, -0.1182098388671875, -0.07513427734375, -0.0320587158203125, 0.011016845703125, 0.0540924072265625, 0.09716796875, 0.1402435302734375, 0.183319091796875, 0.2263946533203125, 0.26947021484375, 0.3125457763671875, 0.355621337890625, 0.3986968994140625, 0.4417724609375, 0.4848480224609375, 0.527923583984375, 0.5709991455078125, 0.61407470703125, 0.6571502685546875, 0.700225830078125, 0.7433013916015625, 0.786376953125, 0.8294525146484375, 0.872528076171875, 0.9156036376953125, 0.95867919921875, 1.0017547607421875, 1.044830322265625, 1.0879058837890625, 1.1309814453125, 1.1740570068359375, 1.217132568359375, 1.2602081298828125, 1.30328369140625, 1.3463592529296875, 1.389434814453125, 1.4325103759765625, 1.4755859375]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 12.0, 11.0, 15.0, 15.0, 30.0, 44.0, 67.0, 121.0, 153.0, 269.0, 387.0, 524.0, 828.0, 1302.0, 1981.0, 3100.0, 4961.0, 7955.0, 12791.0, 20860.0, 33288.0, 53581.0, 82426.0, 120710.0, 156011.0, 161886.0, 131004.0, 92260.0, 60682.0, 38034.0, 23668.0, 14666.0, 9055.0, 5771.0, 3513.0, 2329.0, 1476.0, 912.0, 625.0, 396.0, 306.0, 187.0, 110.0, 81.0, 31.0, 32.0, 31.0, 23.0, 6.0, 13.0, 4.0, 4.0, 7.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.141357421875, -0.13695907592773438, -0.13256072998046875, -0.12816238403320312, -0.1237640380859375, -0.11936569213867188, -0.11496734619140625, -0.11056900024414062, -0.106170654296875, -0.10177230834960938, -0.09737396240234375, -0.09297561645507812, -0.0885772705078125, -0.08417892456054688, -0.07978057861328125, -0.07538223266601562, -0.07098388671875, -0.06658554077148438, -0.06218719482421875, -0.057788848876953125, -0.0533905029296875, -0.048992156982421875, -0.04459381103515625, -0.040195465087890625, -0.035797119140625, -0.031398773193359375, -0.02700042724609375, -0.022602081298828125, -0.0182037353515625, -0.013805389404296875, -0.00940704345703125, -0.005008697509765625, -0.0006103515625, 0.003787994384765625, 0.00818634033203125, 0.012584686279296875, 0.0169830322265625, 0.021381378173828125, 0.02577972412109375, 0.030178070068359375, 0.034576416015625, 0.038974761962890625, 0.04337310791015625, 0.047771453857421875, 0.0521697998046875, 0.056568145751953125, 0.06096649169921875, 0.06536483764648438, 0.06976318359375, 0.07416152954101562, 0.07855987548828125, 0.08295822143554688, 0.0873565673828125, 0.09175491333007812, 0.09615325927734375, 0.10055160522460938, 0.104949951171875, 0.10934829711914062, 0.11374664306640625, 0.11814498901367188, 0.1225433349609375, 0.12694168090820312, 0.13134002685546875, 0.13573837280273438, 0.14013671875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 5.0, 11.0, 2.0, 12.0, 10.0, 10.0, 20.0, 18.0, 13.0, 18.0, 24.0, 27.0, 24.0, 37.0, 23.0, 37.0, 31.0, 48.0, 34.0, 35.0, 33.0, 41.0, 1056.0, 34.0, 46.0, 42.0, 34.0, 22.0, 30.0, 24.0, 42.0, 26.0, 26.0, 17.0, 11.0, 15.0, 18.0, 13.0, 14.0, 8.0, 15.0, 8.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.8642578125, -0.8373794555664062, -0.8105010986328125, -0.7836227416992188, -0.756744384765625, -0.7298660278320312, -0.7029876708984375, -0.6761093139648438, -0.64923095703125, -0.6223526000976562, -0.5954742431640625, -0.5685958862304688, -0.541717529296875, -0.5148391723632812, -0.4879608154296875, -0.46108245849609375, -0.4342041015625, -0.40732574462890625, -0.3804473876953125, -0.35356903076171875, -0.326690673828125, -0.29981231689453125, -0.2729339599609375, -0.24605560302734375, -0.21917724609375, -0.19229888916015625, -0.1654205322265625, -0.13854217529296875, -0.111663818359375, -0.08478546142578125, -0.0579071044921875, -0.03102874755859375, -0.004150390625, 0.02272796630859375, 0.0496063232421875, 0.07648468017578125, 0.103363037109375, 0.13024139404296875, 0.1571197509765625, 0.18399810791015625, 0.21087646484375, 0.23775482177734375, 0.2646331787109375, 0.29151153564453125, 0.318389892578125, 0.34526824951171875, 0.3721466064453125, 0.39902496337890625, 0.4259033203125, 0.45278167724609375, 0.4796600341796875, 0.5065383911132812, 0.533416748046875, 0.5602951049804688, 0.5871734619140625, 0.6140518188476562, 0.64093017578125, 0.6678085327148438, 0.6946868896484375, 0.7215652465820312, 0.748443603515625, 0.7753219604492188, 0.8022003173828125, 0.8290786743164062, 0.85595703125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 6.0, 11.0, 6.0, 19.0, 22.0, 28.0, 44.0, 56.0, 80.0, 120.0, 180.0, 291.0, 486.0, 751.0, 1262.0, 2146.0, 4075.0, 7509.0, 14369.0, 27750.0, 54458.0, 102474.0, 194393.0, 1085215.0, 320621.0, 132002.0, 71150.0, 36802.0, 18830.0, 9774.0, 5225.0, 2870.0, 1605.0, 907.0, 564.0, 326.0, 231.0, 135.0, 118.0, 59.0, 54.0, 36.0, 21.0, 27.0, 7.0, 1.0, 9.0, 0.0, 6.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1195068359375, -0.1157379150390625, -0.111968994140625, -0.1082000732421875, -0.10443115234375, -0.1006622314453125, -0.096893310546875, -0.0931243896484375, -0.08935546875, -0.0855865478515625, -0.081817626953125, -0.0780487060546875, -0.07427978515625, -0.0705108642578125, -0.066741943359375, -0.0629730224609375, -0.0592041015625, -0.0554351806640625, -0.051666259765625, -0.0478973388671875, -0.04412841796875, -0.0403594970703125, -0.036590576171875, -0.0328216552734375, -0.029052734375, -0.0252838134765625, -0.021514892578125, -0.0177459716796875, -0.01397705078125, -0.0102081298828125, -0.006439208984375, -0.0026702880859375, 0.0010986328125, 0.0048675537109375, 0.008636474609375, 0.0124053955078125, 0.01617431640625, 0.0199432373046875, 0.023712158203125, 0.0274810791015625, 0.03125, 0.0350189208984375, 0.038787841796875, 0.0425567626953125, 0.04632568359375, 0.0500946044921875, 0.053863525390625, 0.0576324462890625, 0.0614013671875, 0.0651702880859375, 0.068939208984375, 0.0727081298828125, 0.07647705078125, 0.0802459716796875, 0.084014892578125, 0.0877838134765625, 0.091552734375, 0.0953216552734375, 0.099090576171875, 0.1028594970703125, 0.10662841796875, 0.1103973388671875, 0.114166259765625, 0.1179351806640625, 0.1217041015625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 4.0, 8.0, 6.0, 9.0, 17.0, 14.0, 30.0, 41.0, 57.0, 55.0, 89.0, 94.0, 108.0, 93.0, 102.0, 76.0, 50.0, 41.0, 33.0, 20.0, 12.0, 10.0, 7.0, 8.0, 3.0, 3.0, 2.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0287628173828125, -0.02801990509033203, -0.027276992797851562, -0.026534080505371094, -0.025791168212890625, -0.025048255920410156, -0.024305343627929688, -0.02356243133544922, -0.02281951904296875, -0.02207660675048828, -0.021333694458007812, -0.020590782165527344, -0.019847869873046875, -0.019104957580566406, -0.018362045288085938, -0.01761913299560547, -0.016876220703125, -0.01613330841064453, -0.015390396118164062, -0.014647483825683594, -0.013904571533203125, -0.013161659240722656, -0.012418746948242188, -0.011675834655761719, -0.01093292236328125, -0.010190010070800781, -0.009447097778320312, -0.008704185485839844, -0.007961273193359375, -0.007218360900878906, -0.0064754486083984375, -0.005732536315917969, -0.0049896240234375, -0.004246711730957031, -0.0035037994384765625, -0.0027608871459960938, -0.002017974853515625, -0.0012750625610351562, -0.0005321502685546875, 0.00021076202392578125, 0.00095367431640625, 0.0016965866088867188, 0.0024394989013671875, 0.0031824111938476562, 0.003925323486328125, 0.004668235778808594, 0.0054111480712890625, 0.006154060363769531, 0.00689697265625, 0.007639884948730469, 0.008382797241210938, 0.009125709533691406, 0.009868621826171875, 0.010611534118652344, 0.011354446411132812, 0.012097358703613281, 0.01284027099609375, 0.013583183288574219, 0.014326095581054688, 0.015069007873535156, 0.015811920166015625, 0.016554832458496094, 0.017297744750976562, 0.01804065704345703, 0.0187835693359375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 5.0, 7.0, 8.0, 6.0, 10.0, 20.0, 30.0, 40.0, 69.0, 120.0, 246.0, 4083.0, 1041995.0, 1383.0, 225.0, 91.0, 61.0, 42.0, 40.0, 16.0, 13.0, 15.0, 9.0, 5.0, 6.0, 6.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5302734375, -0.5093917846679688, -0.4885101318359375, -0.46762847900390625, -0.446746826171875, -0.42586517333984375, -0.4049835205078125, -0.38410186767578125, -0.36322021484375, -0.34233856201171875, -0.3214569091796875, -0.30057525634765625, -0.279693603515625, -0.25881195068359375, -0.2379302978515625, -0.21704864501953125, -0.1961669921875, -0.17528533935546875, -0.1544036865234375, -0.13352203369140625, -0.112640380859375, -0.09175872802734375, -0.0708770751953125, -0.04999542236328125, -0.02911376953125, -0.00823211669921875, 0.0126495361328125, 0.03353118896484375, 0.054412841796875, 0.07529449462890625, 0.0961761474609375, 0.11705780029296875, 0.137939453125, 0.15882110595703125, 0.1797027587890625, 0.20058441162109375, 0.221466064453125, 0.24234771728515625, 0.2632293701171875, 0.28411102294921875, 0.30499267578125, 0.32587432861328125, 0.3467559814453125, 0.36763763427734375, 0.388519287109375, 0.40940093994140625, 0.4302825927734375, 0.45116424560546875, 0.4720458984375, 0.49292755126953125, 0.5138092041015625, 0.5346908569335938, 0.555572509765625, 0.5764541625976562, 0.5973358154296875, 0.6182174682617188, 0.63909912109375, 0.6599807739257812, 0.6808624267578125, 0.7017440795898438, 0.722625732421875, 0.7435073852539062, 0.7643890380859375, 0.7852706909179688, 0.80615234375]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 14.0, 69.0, 300.0, 444.0, 150.0, 23.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033446598798036575, -0.029853014275431633, -0.02625942975282669, -0.02266584523022175, -0.019072260707616806, -0.015478676185011864, -0.011885091662406921, -0.008291507139801979, -0.004697922617197037, -0.0011043380945920944, 0.002489246428012848, 0.00608283095061779, 0.009676415473222733, 0.013269999995827675, 0.016863584518432617, 0.02045716904103756, 0.024050753563642502, 0.027644338086247444, 0.031237922608852386, 0.03483150899410248, 0.03842509165406227, 0.042018674314022064, 0.045612260699272156, 0.04920584708452225, 0.05279942974448204, 0.056393012404441833, 0.059986598789691925, 0.06358018517494202, 0.06717376410961151, 0.0707673504948616, 0.0743609368801117, 0.07795452326536179, 0.08154810965061188, 0.08514169603586197, 0.08873528242111206, 0.09232886135578156, 0.09592244774103165, 0.09951603412628174, 0.10310961306095123, 0.10670319944620132, 0.11029678583145142, 0.11389037221670151, 0.1174839586019516, 0.1210775375366211, 0.12467112392187119, 0.12826471030712128, 0.13185828924179077, 0.13545188307762146, 0.13904546201229095, 0.14263904094696045, 0.14623263478279114, 0.14982621371746063, 0.15341979265213013, 0.15701338648796082, 0.1606069654226303, 0.164200559258461, 0.1677941381931305, 0.1713877171278, 0.17498131096363068, 0.17857488989830017, 0.18216848373413086, 0.18576206266880035, 0.18935564160346985, 0.19294923543930054, 0.19654281437397003]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 6.0, 8.0, 12.0, 14.0, 13.0, 15.0, 18.0, 19.0, 15.0, 30.0, 23.0, 16.0, 30.0, 34.0, 31.0, 34.0, 34.0, 42.0, 37.0, 46.0, 48.0, 26.0, 30.0, 29.0, 35.0, 50.0, 26.0, 26.0, 34.0, 30.0, 22.0, 21.0, 25.0, 20.0, 10.0, 11.0, 12.0, 13.0, 9.0, 5.0, 4.0, 4.0, 9.0, 8.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.01769733428955078, -0.01712176576256752, -0.016546199098229408, -0.015970632433891296, -0.015395063906908035, -0.014819496311247349, -0.014243928715586662, -0.013668361119925976, -0.01309279352426529, -0.012517225928604603, -0.011941658332943916, -0.01136609073728323, -0.010790523141622543, -0.010214955545961857, -0.00963938795030117, -0.009063820354640484, -0.008488252758979797, -0.007912685163319111, -0.007337117567658424, -0.006761549971997738, -0.006185982376337051, -0.005610414780676365, -0.005034847185015678, -0.004459279589354992, -0.0038837119936943054, -0.003308144398033619, -0.0027325768023729324, -0.002157009206712246, -0.0015814416110515594, -0.001005874015390873, -0.00043030641973018646, 0.00014526117593050003, 0.0007208287715911865, 0.001296396367251873, 0.0018719639629125595, 0.002447531558573246, 0.0030230991542339325, 0.003598666749894619, 0.0041742343455553055, 0.004749801941215992, 0.0053253695368766785, 0.005900937132537365, 0.0064765047281980515, 0.007052072323858738, 0.0076276399195194244, 0.008203207515180111, 0.008778775110840797, 0.009354342706501484, 0.00992991030216217, 0.010505477897822857, 0.011081045493483543, 0.01165661308914423, 0.012232180684804916, 0.012807748280465603, 0.01338331587612629, 0.013958883471786976, 0.014534451067447662, 0.015110018663108349, 0.015685586258769035, 0.016261152923107147, 0.01683672145009041, 0.01741228997707367, 0.01798785664141178, 0.018563423305749893, 0.019138991832733154]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 6.0, 6.0, 11.0, 18.0, 4.0, 16.0, 15.0, 17.0, 15.0, 21.0, 27.0, 23.0, 24.0, 23.0, 32.0, 32.0, 34.0, 48.0, 41.0, 37.0, 45.0, 42.0, 49.0, 40.0, 28.0, 34.0, 38.0, 39.0, 37.0, 32.0, 32.0, 25.0, 19.0, 16.0, 16.0, 10.0, 11.0, 8.0, 6.0, 3.0, 8.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2802734375, -1.237213134765625, -1.19415283203125, -1.151092529296875, -1.1080322265625, -1.064971923828125, -1.02191162109375, -0.978851318359375, -0.935791015625, -0.892730712890625, -0.84967041015625, -0.806610107421875, -0.7635498046875, -0.720489501953125, -0.67742919921875, -0.634368896484375, -0.59130859375, -0.548248291015625, -0.50518798828125, -0.462127685546875, -0.4190673828125, -0.376007080078125, -0.33294677734375, -0.289886474609375, -0.246826171875, -0.203765869140625, -0.16070556640625, -0.117645263671875, -0.0745849609375, -0.031524658203125, 0.01153564453125, 0.054595947265625, 0.09765625, 0.140716552734375, 0.18377685546875, 0.226837158203125, 0.2698974609375, 0.312957763671875, 0.35601806640625, 0.399078369140625, 0.442138671875, 0.485198974609375, 0.52825927734375, 0.571319580078125, 0.6143798828125, 0.657440185546875, 0.70050048828125, 0.743560791015625, 0.78662109375, 0.829681396484375, 0.87274169921875, 0.915802001953125, 0.9588623046875, 1.001922607421875, 1.04498291015625, 1.088043212890625, 1.131103515625, 1.174163818359375, 1.21722412109375, 1.260284423828125, 1.3033447265625, 1.346405029296875, 1.38946533203125, 1.432525634765625, 1.4755859375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 4.0, 6.0, 2.0, 12.0, 20.0, 11.0, 19.0, 29.0, 45.0, 79.0, 102.0, 138.0, 262.0, 390.0, 609.0, 1039.0, 1717.0, 2806.0, 4704.0, 7914.0, 13511.0, 22826.0, 38711.0, 66196.0, 113789.0, 178450.0, 206601.0, 157431.0, 95780.0, 55548.0, 32459.0, 19050.0, 11205.0, 6716.0, 4127.0, 2396.0, 1509.0, 879.0, 519.0, 322.0, 220.0, 149.0, 77.0, 64.0, 46.0, 16.0, 12.0, 16.0, 11.0, 7.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.3623046875, -1.3173980712890625, -1.272491455078125, -1.2275848388671875, -1.18267822265625, -1.1377716064453125, -1.092864990234375, -1.0479583740234375, -1.0030517578125, -0.9581451416015625, -0.913238525390625, -0.8683319091796875, -0.82342529296875, -0.7785186767578125, -0.733612060546875, -0.6887054443359375, -0.643798828125, -0.5988922119140625, -0.553985595703125, -0.5090789794921875, -0.46417236328125, -0.4192657470703125, -0.374359130859375, -0.3294525146484375, -0.2845458984375, -0.2396392822265625, -0.194732666015625, -0.1498260498046875, -0.10491943359375, -0.0600128173828125, -0.015106201171875, 0.0298004150390625, 0.07470703125, 0.1196136474609375, 0.164520263671875, 0.2094268798828125, 0.25433349609375, 0.2992401123046875, 0.344146728515625, 0.3890533447265625, 0.4339599609375, 0.4788665771484375, 0.523773193359375, 0.5686798095703125, 0.61358642578125, 0.6584930419921875, 0.703399658203125, 0.7483062744140625, 0.793212890625, 0.8381195068359375, 0.883026123046875, 0.9279327392578125, 0.97283935546875, 1.0177459716796875, 1.062652587890625, 1.1075592041015625, 1.1524658203125, 1.1973724365234375, 1.242279052734375, 1.2871856689453125, 1.33209228515625, 1.3769989013671875, 1.421905517578125, 1.4668121337890625, 1.51171875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 6.0, 4.0, 8.0, 8.0, 9.0, 9.0, 9.0, 18.0, 16.0, 24.0, 11.0, 32.0, 40.0, 26.0, 37.0, 43.0, 61.0, 64.0, 108.0, 204.0, 1309.0, 283.0, 189.0, 115.0, 70.0, 58.0, 49.0, 26.0, 27.0, 28.0, 26.0, 31.0, 27.0, 17.0, 12.0, 14.0, 5.0, 9.0, 2.0, 3.0, 5.0, 4.0, 4.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.65234375, -3.521484375, -3.390625, -3.259765625, -3.12890625, -2.998046875, -2.8671875, -2.736328125, -2.60546875, -2.474609375, -2.34375, -2.212890625, -2.08203125, -1.951171875, -1.8203125, -1.689453125, -1.55859375, -1.427734375, -1.296875, -1.166015625, -1.03515625, -0.904296875, -0.7734375, -0.642578125, -0.51171875, -0.380859375, -0.25, -0.119140625, 0.01171875, 0.142578125, 0.2734375, 0.404296875, 0.53515625, 0.666015625, 0.796875, 0.927734375, 1.05859375, 1.189453125, 1.3203125, 1.451171875, 1.58203125, 1.712890625, 1.84375, 1.974609375, 2.10546875, 2.236328125, 2.3671875, 2.498046875, 2.62890625, 2.759765625, 2.890625, 3.021484375, 3.15234375, 3.283203125, 3.4140625, 3.544921875, 3.67578125, 3.806640625, 3.9375, 4.068359375, 4.19921875, 4.330078125, 4.4609375, 4.591796875, 4.72265625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 5.0, 6.0, 10.0, 14.0, 21.0, 26.0, 23.0, 31.0, 52.0, 75.0, 117.0, 131.0, 156.0, 283.0, 457.0, 1105.0, 4266.0, 36734.0, 659858.0, 2284723.0, 141544.0, 12102.0, 2004.0, 744.0, 378.0, 246.0, 144.0, 103.0, 95.0, 41.0, 44.0, 35.0, 31.0, 21.0, 17.0, 10.0, 9.0, 10.0, 10.0, 6.0, 7.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.28515625, -6.09619140625, -5.9072265625, -5.71826171875, -5.529296875, -5.34033203125, -5.1513671875, -4.96240234375, -4.7734375, -4.58447265625, -4.3955078125, -4.20654296875, -4.017578125, -3.82861328125, -3.6396484375, -3.45068359375, -3.26171875, -3.07275390625, -2.8837890625, -2.69482421875, -2.505859375, -2.31689453125, -2.1279296875, -1.93896484375, -1.75, -1.56103515625, -1.3720703125, -1.18310546875, -0.994140625, -0.80517578125, -0.6162109375, -0.42724609375, -0.23828125, -0.04931640625, 0.1396484375, 0.32861328125, 0.517578125, 0.70654296875, 0.8955078125, 1.08447265625, 1.2734375, 1.46240234375, 1.6513671875, 1.84033203125, 2.029296875, 2.21826171875, 2.4072265625, 2.59619140625, 2.78515625, 2.97412109375, 3.1630859375, 3.35205078125, 3.541015625, 3.72998046875, 3.9189453125, 4.10791015625, 4.296875, 4.48583984375, 4.6748046875, 4.86376953125, 5.052734375, 5.24169921875, 5.4306640625, 5.61962890625, 5.80859375]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 42.0, 226.0, 420.0, 273.0, 51.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-60.96591567993164, -59.87018585205078, -58.77445983886719, -57.67873001098633, -56.583003997802734, -55.487274169921875, -54.39154815673828, -53.29581832885742, -52.20008850097656, -51.1043586730957, -50.00863265991211, -48.91290283203125, -47.817176818847656, -46.7214469909668, -45.62571716308594, -44.529991149902344, -43.43426513671875, -42.33853530883789, -41.2428092956543, -40.14707946777344, -39.051353454589844, -37.955623626708984, -36.859893798828125, -35.76416778564453, -34.66843795776367, -33.57270812988281, -32.47698211669922, -31.38125228881836, -30.285524368286133, -29.189796447753906, -28.09406852722168, -26.998340606689453, -25.902610778808594, -24.806882858276367, -23.71115493774414, -22.61542510986328, -21.519697189331055, -20.423969268798828, -19.3282413482666, -18.232513427734375, -17.136783599853516, -16.04105567932129, -14.945326805114746, -13.84959888458252, -12.753870010375977, -11.65814208984375, -10.562414169311523, -9.466686248779297, -8.370957374572754, -7.275228977203369, -6.179500579833984, -5.083772659301758, -3.988044261932373, -2.8923158645629883, -1.7965879440307617, -0.700859546661377, 0.3948688507080078, 1.490597128868103, 2.5863254070281982, 3.682053565979004, 4.777781963348389, 5.873510360717773, 6.96923828125, 8.064966201782227, 9.16069507598877]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 7.0, 4.0, 3.0, 8.0, 11.0, 10.0, 9.0, 9.0, 9.0, 18.0, 11.0, 16.0, 18.0, 23.0, 26.0, 29.0, 26.0, 26.0, 42.0, 38.0, 34.0, 42.0, 37.0, 44.0, 36.0, 33.0, 38.0, 46.0, 35.0, 46.0, 37.0, 33.0, 26.0, 24.0, 17.0, 16.0, 20.0, 22.0, 11.0, 13.0, 6.0, 15.0, 7.0, 7.0, 5.0, 3.0, 5.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-9.5885648727417, -9.282317161560059, -8.976070404052734, -8.669822692871094, -8.363574981689453, -8.057328224182129, -7.751080513000488, -7.444833278656006, -7.138586044311523, -6.832338809967041, -6.526091575622559, -6.219843864440918, -5.9135966300964355, -5.607349395751953, -5.3011016845703125, -4.99485445022583, -4.688607215881348, -4.382359981536865, -4.076112747192383, -3.769865036010742, -3.4636178016662598, -3.1573705673217773, -2.851123094558716, -2.5448756217956543, -2.238628387451172, -1.9323810338974, -1.626133680343628, -1.319886326789856, -1.013638973236084, -0.707391619682312, -0.40114426612854004, -0.09489679336547852, 0.2113513946533203, 0.5175987482070923, 0.8238461017608643, 1.1300934553146362, 1.4363408088684082, 1.7425881624221802, 2.048835515975952, 2.3550829887390137, 2.661330223083496, 2.9675774574279785, 3.27382493019104, 3.5800724029541016, 3.886319637298584, 4.192566871643066, 4.498814582824707, 4.8050618171691895, 5.111309051513672, 5.417556285858154, 5.723803520202637, 6.030051231384277, 6.33629846572876, 6.642545700073242, 6.948793411254883, 7.255040645599365, 7.561287879943848, 7.86753511428833, 8.173782348632812, 8.480030059814453, 8.786277770996094, 9.092524528503418, 9.398772239685059, 9.705018997192383, 10.011266708374023]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 5.0, 7.0, 3.0, 8.0, 10.0, 11.0, 10.0, 18.0, 17.0, 14.0, 30.0, 16.0, 36.0, 24.0, 22.0, 24.0, 37.0, 30.0, 33.0, 23.0, 30.0, 39.0, 49.0, 42.0, 36.0, 37.0, 37.0, 40.0, 47.0, 35.0, 32.0, 23.0, 26.0, 27.0, 26.0, 13.0, 23.0, 16.0, 4.0, 4.0, 7.0, 4.0, 7.0, 2.0, 5.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2919921875, -1.2508697509765625, -1.209747314453125, -1.1686248779296875, -1.12750244140625, -1.0863800048828125, -1.045257568359375, -1.0041351318359375, -0.9630126953125, -0.9218902587890625, -0.880767822265625, -0.8396453857421875, -0.79852294921875, -0.7574005126953125, -0.716278076171875, -0.6751556396484375, -0.634033203125, -0.5929107666015625, -0.551788330078125, -0.5106658935546875, -0.46954345703125, -0.4284210205078125, -0.387298583984375, -0.3461761474609375, -0.3050537109375, -0.2639312744140625, -0.222808837890625, -0.1816864013671875, -0.14056396484375, -0.0994415283203125, -0.058319091796875, -0.0171966552734375, 0.02392578125, 0.0650482177734375, 0.106170654296875, 0.1472930908203125, 0.18841552734375, 0.2295379638671875, 0.270660400390625, 0.3117828369140625, 0.3529052734375, 0.3940277099609375, 0.435150146484375, 0.4762725830078125, 0.51739501953125, 0.5585174560546875, 0.599639892578125, 0.6407623291015625, 0.681884765625, 0.7230072021484375, 0.764129638671875, 0.8052520751953125, 0.84637451171875, 0.8874969482421875, 0.928619384765625, 0.9697418212890625, 1.0108642578125, 1.0519866943359375, 1.093109130859375, 1.1342315673828125, 1.17535400390625, 1.2164764404296875, 1.257598876953125, 1.2987213134765625, 1.33984375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 8.0, 8.0, 7.0, 5.0, 6.0, 21.0, 12.0, 29.0, 26.0, 42.0, 55.0, 80.0, 98.0, 138.0, 211.0, 272.0, 448.0, 717.0, 1290.0, 2325.0, 4701.0, 10660.0, 26661.0, 79221.0, 284016.0, 1189612.0, 1852150.0, 533338.0, 136904.0, 42446.0, 15389.0, 6387.0, 2980.0, 1556.0, 901.0, 489.0, 293.0, 207.0, 170.0, 98.0, 95.0, 52.0, 42.0, 27.0, 20.0, 18.0, 14.0, 9.0, 5.0, 8.0, 4.0, 5.0, 3.0, 3.0, 6.0], "bins": [-2.54296875, -2.47076416015625, -2.3985595703125, -2.32635498046875, -2.254150390625, -2.18194580078125, -2.1097412109375, -2.03753662109375, -1.96533203125, -1.89312744140625, -1.8209228515625, -1.74871826171875, -1.676513671875, -1.60430908203125, -1.5321044921875, -1.45989990234375, -1.3876953125, -1.31549072265625, -1.2432861328125, -1.17108154296875, -1.098876953125, -1.02667236328125, -0.9544677734375, -0.88226318359375, -0.81005859375, -0.73785400390625, -0.6656494140625, -0.59344482421875, -0.521240234375, -0.44903564453125, -0.3768310546875, -0.30462646484375, -0.232421875, -0.16021728515625, -0.0880126953125, -0.01580810546875, 0.056396484375, 0.12860107421875, 0.2008056640625, 0.27301025390625, 0.34521484375, 0.41741943359375, 0.4896240234375, 0.56182861328125, 0.634033203125, 0.70623779296875, 0.7784423828125, 0.85064697265625, 0.9228515625, 0.99505615234375, 1.0672607421875, 1.13946533203125, 1.211669921875, 1.28387451171875, 1.3560791015625, 1.42828369140625, 1.50048828125, 1.57269287109375, 1.6448974609375, 1.71710205078125, 1.789306640625, 1.86151123046875, 1.9337158203125, 2.00592041015625, 2.078125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 6.0, 8.0, 6.0, 10.0, 17.0, 13.0, 27.0, 32.0, 56.0, 71.0, 93.0, 92.0, 146.0, 162.0, 214.0, 275.0, 366.0, 415.0, 417.0, 386.0, 301.0, 224.0, 175.0, 113.0, 95.0, 99.0, 63.0, 44.0, 31.0, 24.0, 23.0, 16.0, 11.0, 8.0, 5.0, 5.0, 9.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-2.2734375, -2.210296630859375, -2.14715576171875, -2.084014892578125, -2.0208740234375, -1.957733154296875, -1.89459228515625, -1.831451416015625, -1.768310546875, -1.705169677734375, -1.64202880859375, -1.578887939453125, -1.5157470703125, -1.452606201171875, -1.38946533203125, -1.326324462890625, -1.26318359375, -1.200042724609375, -1.13690185546875, -1.073760986328125, -1.0106201171875, -0.947479248046875, -0.88433837890625, -0.821197509765625, -0.758056640625, -0.694915771484375, -0.63177490234375, -0.568634033203125, -0.5054931640625, -0.442352294921875, -0.37921142578125, -0.316070556640625, -0.2529296875, -0.189788818359375, -0.12664794921875, -0.063507080078125, -0.0003662109375, 0.062774658203125, 0.12591552734375, 0.189056396484375, 0.252197265625, 0.315338134765625, 0.37847900390625, 0.441619873046875, 0.5047607421875, 0.567901611328125, 0.63104248046875, 0.694183349609375, 0.75732421875, 0.820465087890625, 0.88360595703125, 0.946746826171875, 1.0098876953125, 1.073028564453125, 1.13616943359375, 1.199310302734375, 1.262451171875, 1.325592041015625, 1.38873291015625, 1.451873779296875, 1.5150146484375, 1.578155517578125, 1.64129638671875, 1.704437255859375, 1.767578125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 7.0, 13.0, 18.0, 22.0, 43.0, 63.0, 124.0, 183.0, 302.0, 592.0, 2919.0, 114141.0, 3885618.0, 184874.0, 3773.0, 667.0, 329.0, 230.0, 138.0, 82.0, 57.0, 24.0, 24.0, 13.0, 16.0, 11.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-15.0546875, -14.6923828125, -14.330078125, -13.9677734375, -13.60546875, -13.2431640625, -12.880859375, -12.5185546875, -12.15625, -11.7939453125, -11.431640625, -11.0693359375, -10.70703125, -10.3447265625, -9.982421875, -9.6201171875, -9.2578125, -8.8955078125, -8.533203125, -8.1708984375, -7.80859375, -7.4462890625, -7.083984375, -6.7216796875, -6.359375, -5.9970703125, -5.634765625, -5.2724609375, -4.91015625, -4.5478515625, -4.185546875, -3.8232421875, -3.4609375, -3.0986328125, -2.736328125, -2.3740234375, -2.01171875, -1.6494140625, -1.287109375, -0.9248046875, -0.5625, -0.2001953125, 0.162109375, 0.5244140625, 0.88671875, 1.2490234375, 1.611328125, 1.9736328125, 2.3359375, 2.6982421875, 3.060546875, 3.4228515625, 3.78515625, 4.1474609375, 4.509765625, 4.8720703125, 5.234375, 5.5966796875, 5.958984375, 6.3212890625, 6.68359375, 7.0458984375, 7.408203125, 7.7705078125, 8.1328125]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 19.0, 74.0, 251.0, 351.0, 239.0, 70.0, 8.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.990705490112305, -25.88751220703125, -24.784317016601562, -23.681123733520508, -22.57792854309082, -21.474735260009766, -20.371540069580078, -19.268346786499023, -18.16515350341797, -17.061960220336914, -15.958765029907227, -14.855571746826172, -13.752376556396484, -12.64918327331543, -11.545989036560059, -10.442794799804688, -9.339599609375, -8.236405372619629, -7.133211135864258, -6.030017375946045, -4.926823139190674, -3.8236289024353027, -2.72043514251709, -1.6172409057617188, -0.5140466690063477, 0.5891474485397339, 1.6923415660858154, 2.7955355644226074, 3.8987298011779785, 5.00192403793335, 6.1051177978515625, 7.208312034606934, 8.311508178710938, 9.414702415466309, 10.51789665222168, 11.621089935302734, 12.724285125732422, 13.827478408813477, 14.930672645568848, 16.03386688232422, 17.137062072753906, 18.24025535583496, 19.34345054626465, 20.446643829345703, 21.54983901977539, 22.653032302856445, 23.7562255859375, 24.859420776367188, 25.962614059448242, 27.065807342529297, 28.169002532958984, 29.27219581604004, 30.375391006469727, 31.47858428955078, 32.58177947998047, 33.684974670410156, 34.78816604614258, 35.891361236572266, 36.99455261230469, 38.097747802734375, 39.20094299316406, 40.30413818359375, 41.40732955932617, 42.51052474975586, 43.61371994018555]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 8.0, 4.0, 5.0, 11.0, 10.0, 12.0, 18.0, 21.0, 18.0, 24.0, 21.0, 22.0, 26.0, 32.0, 19.0, 26.0, 36.0, 40.0, 36.0, 28.0, 45.0, 34.0, 37.0, 34.0, 29.0, 39.0, 37.0, 48.0, 27.0, 40.0, 27.0, 20.0, 31.0, 12.0, 18.0, 15.0, 21.0, 5.0, 16.0, 13.0, 7.0, 8.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.453943729400635, -6.237559795379639, -6.021176338195801, -5.804792404174805, -5.588408946990967, -5.372025012969971, -5.155641555786133, -4.939257621765137, -4.722873687744141, -4.5064897537231445, -4.290106296539307, -4.0737223625183105, -3.8573389053344727, -3.6409549713134766, -3.4245712757110596, -3.2081875801086426, -2.9918041229248047, -2.7754204273223877, -2.5590367317199707, -2.3426527976989746, -2.1262693405151367, -1.9098855257034302, -1.6935017108917236, -1.4771180152893066, -1.2607343196868896, -1.0443506240844727, -0.8279668688774109, -0.6115831136703491, -0.39519941806793213, -0.17881572246551514, 0.037568092346191406, 0.2539517879486084, 0.4703354835510254, 0.6867191791534424, 0.9031029343605042, 1.119486689567566, 1.335870385169983, 1.5522540807724, 1.7686378955841064, 1.9850215911865234, 2.2014052867889404, 2.4177889823913574, 2.6341726779937744, 2.8505563735961914, 3.0669403076171875, 3.2833237648010254, 3.4997076988220215, 3.7160913944244385, 3.9324750900268555, 4.148859024047852, 4.3652424812316895, 4.5816264152526855, 4.798009872436523, 5.0143938064575195, 5.230777740478516, 5.4471611976623535, 5.663544654846191, 5.8799285888671875, 6.096312046051025, 6.3126959800720215, 6.529079437255859, 6.7454633712768555, 6.961847305297852, 7.1782307624816895, 7.3946146965026855]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 2.0, 5.0, 13.0, 11.0, 15.0, 11.0, 21.0, 17.0, 21.0, 22.0, 26.0, 29.0, 28.0, 34.0, 28.0, 44.0, 34.0, 41.0, 29.0, 39.0, 48.0, 51.0, 46.0, 51.0, 30.0, 40.0, 27.0, 33.0, 35.0, 39.0, 17.0, 22.0, 19.0, 18.0, 13.0, 11.0, 10.0, 1.0, 3.0, 6.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.140625, -1.0969390869140625, -1.053253173828125, -1.0095672607421875, -0.96588134765625, -0.9221954345703125, -0.878509521484375, -0.8348236083984375, -0.7911376953125, -0.7474517822265625, -0.703765869140625, -0.6600799560546875, -0.61639404296875, -0.5727081298828125, -0.529022216796875, -0.4853363037109375, -0.441650390625, -0.3979644775390625, -0.354278564453125, -0.3105926513671875, -0.26690673828125, -0.2232208251953125, -0.179534912109375, -0.1358489990234375, -0.0921630859375, -0.0484771728515625, -0.004791259765625, 0.0388946533203125, 0.08258056640625, 0.1262664794921875, 0.169952392578125, 0.2136383056640625, 0.25732421875, 0.3010101318359375, 0.344696044921875, 0.3883819580078125, 0.43206787109375, 0.4757537841796875, 0.519439697265625, 0.5631256103515625, 0.6068115234375, 0.6504974365234375, 0.694183349609375, 0.7378692626953125, 0.78155517578125, 0.8252410888671875, 0.868927001953125, 0.9126129150390625, 0.956298828125, 0.9999847412109375, 1.043670654296875, 1.0873565673828125, 1.13104248046875, 1.1747283935546875, 1.218414306640625, 1.2621002197265625, 1.3057861328125, 1.3494720458984375, 1.393157958984375, 1.4368438720703125, 1.48052978515625, 1.5242156982421875, 1.567901611328125, 1.6115875244140625, 1.6552734375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 6.0, 3.0, 3.0, 7.0, 6.0, 11.0, 14.0, 27.0, 47.0, 70.0, 85.0, 138.0, 218.0, 360.0, 567.0, 910.0, 1585.0, 2837.0, 5279.0, 10121.0, 20746.0, 46037.0, 109786.0, 242000.0, 305738.0, 168773.0, 71391.0, 30677.0, 14608.0, 7265.0, 3943.0, 2124.0, 1197.0, 749.0, 444.0, 274.0, 169.0, 110.0, 91.0, 50.0, 24.0, 26.0, 13.0, 8.0, 11.0, 5.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2239990234375, -0.2154674530029297, -0.20693588256835938, -0.19840431213378906, -0.18987274169921875, -0.18134117126464844, -0.17280960083007812, -0.1642780303955078, -0.1557464599609375, -0.1472148895263672, -0.13868331909179688, -0.13015174865722656, -0.12162017822265625, -0.11308860778808594, -0.10455703735351562, -0.09602546691894531, -0.087493896484375, -0.07896232604980469, -0.07043075561523438, -0.06189918518066406, -0.05336761474609375, -0.04483604431152344, -0.036304473876953125, -0.027772903442382812, -0.0192413330078125, -0.010709762573242188, -0.002178192138671875, 0.0063533782958984375, 0.01488494873046875, 0.023416519165039062, 0.031948089599609375, 0.04047966003417969, 0.04901123046875, 0.05754280090332031, 0.06607437133789062, 0.07460594177246094, 0.08313751220703125, 0.09166908264160156, 0.10020065307617188, 0.10873222351074219, 0.1172637939453125, 0.1257953643798828, 0.13432693481445312, 0.14285850524902344, 0.15139007568359375, 0.15992164611816406, 0.16845321655273438, 0.1769847869873047, 0.185516357421875, 0.1940479278564453, 0.20257949829101562, 0.21111106872558594, 0.21964263916015625, 0.22817420959472656, 0.23670578002929688, 0.2452373504638672, 0.2537689208984375, 0.2623004913330078, 0.2708320617675781, 0.27936363220214844, 0.28789520263671875, 0.29642677307128906, 0.3049583435058594, 0.3134899139404297, 0.322021484375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 2.0, 8.0, 9.0, 11.0, 11.0, 16.0, 9.0, 15.0, 16.0, 15.0, 23.0, 19.0, 20.0, 29.0, 31.0, 42.0, 48.0, 39.0, 34.0, 31.0, 48.0, 1065.0, 39.0, 46.0, 39.0, 40.0, 53.0, 25.0, 34.0, 25.0, 21.0, 20.0, 22.0, 13.0, 12.0, 19.0, 13.0, 14.0, 11.0, 6.0, 5.0, 10.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0], "bins": [-0.9130859375, -0.8860015869140625, -0.858917236328125, -0.8318328857421875, -0.80474853515625, -0.7776641845703125, -0.750579833984375, -0.7234954833984375, -0.6964111328125, -0.6693267822265625, -0.642242431640625, -0.6151580810546875, -0.58807373046875, -0.5609893798828125, -0.533905029296875, -0.5068206787109375, -0.479736328125, -0.4526519775390625, -0.425567626953125, -0.3984832763671875, -0.37139892578125, -0.3443145751953125, -0.317230224609375, -0.2901458740234375, -0.2630615234375, -0.2359771728515625, -0.208892822265625, -0.1818084716796875, -0.15472412109375, -0.1276397705078125, -0.100555419921875, -0.0734710693359375, -0.04638671875, -0.0193023681640625, 0.007781982421875, 0.0348663330078125, 0.06195068359375, 0.0890350341796875, 0.116119384765625, 0.1432037353515625, 0.1702880859375, 0.1973724365234375, 0.224456787109375, 0.2515411376953125, 0.27862548828125, 0.3057098388671875, 0.332794189453125, 0.3598785400390625, 0.386962890625, 0.4140472412109375, 0.441131591796875, 0.4682159423828125, 0.49530029296875, 0.5223846435546875, 0.549468994140625, 0.5765533447265625, 0.6036376953125, 0.6307220458984375, 0.657806396484375, 0.6848907470703125, 0.71197509765625, 0.7390594482421875, 0.766143798828125, 0.7932281494140625, 0.8203125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 6.0, 5.0, 9.0, 3.0, 19.0, 22.0, 28.0, 45.0, 59.0, 94.0, 111.0, 184.0, 248.0, 387.0, 599.0, 937.0, 1497.0, 2500.0, 4487.0, 8809.0, 18107.0, 41755.0, 100426.0, 249389.0, 1211612.0, 267111.0, 104790.0, 43812.0, 19243.0, 8995.0, 4805.0, 2591.0, 1550.0, 956.0, 661.0, 407.0, 257.0, 190.0, 139.0, 96.0, 58.0, 32.0, 33.0, 24.0, 16.0, 15.0, 10.0, 5.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1634521484375, -0.15826797485351562, -0.15308380126953125, -0.14789962768554688, -0.1427154541015625, -0.13753128051757812, -0.13234710693359375, -0.12716293334960938, -0.121978759765625, -0.11679458618164062, -0.11161041259765625, -0.10642623901367188, -0.1012420654296875, -0.09605789184570312, -0.09087371826171875, -0.08568954467773438, -0.08050537109375, -0.07532119750976562, -0.07013702392578125, -0.06495285034179688, -0.0597686767578125, -0.054584503173828125, -0.04940032958984375, -0.044216156005859375, -0.039031982421875, -0.033847808837890625, -0.02866363525390625, -0.023479461669921875, -0.0182952880859375, -0.013111114501953125, -0.00792694091796875, -0.002742767333984375, 0.00244140625, 0.007625579833984375, 0.01280975341796875, 0.017993927001953125, 0.0231781005859375, 0.028362274169921875, 0.03354644775390625, 0.038730621337890625, 0.043914794921875, 0.049098968505859375, 0.05428314208984375, 0.059467315673828125, 0.0646514892578125, 0.06983566284179688, 0.07501983642578125, 0.08020401000976562, 0.08538818359375, 0.09057235717773438, 0.09575653076171875, 0.10094070434570312, 0.1061248779296875, 0.11130905151367188, 0.11649322509765625, 0.12167739868164062, 0.126861572265625, 0.13204574584960938, 0.13722991943359375, 0.14241409301757812, 0.1475982666015625, 0.15278244018554688, 0.15796661376953125, 0.16315078735351562, 0.1683349609375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 9.0, 9.0, 6.0, 2.0, 3.0, 5.0, 11.0, 11.0, 17.0, 19.0, 30.0, 35.0, 43.0, 68.0, 95.0, 112.0, 120.0, 109.0, 70.0, 55.0, 38.0, 26.0, 22.0, 16.0, 11.0, 7.0, 14.0, 8.0, 3.0, 2.0, 5.0, 6.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.03399658203125, -0.03316640853881836, -0.03233623504638672, -0.03150606155395508, -0.030675888061523438, -0.029845714569091797, -0.029015541076660156, -0.028185367584228516, -0.027355194091796875, -0.026525020599365234, -0.025694847106933594, -0.024864673614501953, -0.024034500122070312, -0.023204326629638672, -0.02237415313720703, -0.02154397964477539, -0.02071380615234375, -0.01988363265991211, -0.01905345916748047, -0.018223285675048828, -0.017393112182617188, -0.016562938690185547, -0.015732765197753906, -0.014902591705322266, -0.014072418212890625, -0.013242244720458984, -0.012412071228027344, -0.011581897735595703, -0.010751724243164062, -0.009921550750732422, -0.009091377258300781, -0.00826120376586914, -0.0074310302734375, -0.006600856781005859, -0.005770683288574219, -0.004940509796142578, -0.0041103363037109375, -0.003280162811279297, -0.0024499893188476562, -0.0016198158264160156, -0.000789642333984375, 4.0531158447265625e-05, 0.0008707046508789062, 0.0017008781433105469, 0.0025310516357421875, 0.003361225128173828, 0.004191398620605469, 0.005021572113037109, 0.00585174560546875, 0.006681919097900391, 0.007512092590332031, 0.008342266082763672, 0.009172439575195312, 0.010002613067626953, 0.010832786560058594, 0.011662960052490234, 0.012493133544921875, 0.013323307037353516, 0.014153480529785156, 0.014983654022216797, 0.015813827514648438, 0.016644001007080078, 0.01747417449951172, 0.01830434799194336, 0.019134521484375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 3.0, 3.0, 6.0, 1.0, 12.0, 13.0, 13.0, 20.0, 21.0, 41.0, 76.0, 108.0, 258.0, 3128.0, 1032152.0, 11884.0, 426.0, 126.0, 87.0, 51.0, 37.0, 18.0, 14.0, 5.0, 12.0, 11.0, 10.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5478515625, -0.523651123046875, -0.49945068359375, -0.475250244140625, -0.4510498046875, -0.426849365234375, -0.40264892578125, -0.378448486328125, -0.354248046875, -0.330047607421875, -0.30584716796875, -0.281646728515625, -0.2574462890625, -0.233245849609375, -0.20904541015625, -0.184844970703125, -0.16064453125, -0.136444091796875, -0.11224365234375, -0.088043212890625, -0.0638427734375, -0.039642333984375, -0.01544189453125, 0.008758544921875, 0.032958984375, 0.057159423828125, 0.08135986328125, 0.105560302734375, 0.1297607421875, 0.153961181640625, 0.17816162109375, 0.202362060546875, 0.2265625, 0.250762939453125, 0.27496337890625, 0.299163818359375, 0.3233642578125, 0.347564697265625, 0.37176513671875, 0.395965576171875, 0.420166015625, 0.444366455078125, 0.46856689453125, 0.492767333984375, 0.5169677734375, 0.541168212890625, 0.56536865234375, 0.589569091796875, 0.61376953125, 0.637969970703125, 0.66217041015625, 0.686370849609375, 0.7105712890625, 0.734771728515625, 0.75897216796875, 0.783172607421875, 0.807373046875, 0.831573486328125, 0.85577392578125, 0.879974365234375, 0.9041748046875, 0.928375244140625, 0.95257568359375, 0.976776123046875, 1.0009765625]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 14.0, 30.0, 90.0, 226.0, 289.0, 222.0, 93.0, 34.0, 12.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01707017980515957, -0.014475026167929173, -0.011879872530698776, -0.009284719824790955, -0.006689566187560558, -0.004094412550330162, -0.0014992598444223404, 0.0010958947241306305, 0.003691047430038452, 0.006286201067268848, 0.008881354704499245, 0.011476507410407066, 0.014071661047637463, 0.01666681468486786, 0.01926196739077568, 0.02185712195932865, 0.024452274665236473, 0.027047427371144295, 0.029642581939697266, 0.03223773464560509, 0.03483288735151291, 0.03742804378271103, 0.04002319276332855, 0.04261834919452667, 0.045213501900434494, 0.047808654606342316, 0.05040380731225014, 0.05299896001815796, 0.05559411644935608, 0.0581892691552639, 0.06078442186117172, 0.06337957829236984, 0.06597473472356796, 0.06856989115476608, 0.0711650401353836, 0.07376019656658173, 0.07635534554719925, 0.07895050197839737, 0.08154565095901489, 0.08414080739021301, 0.08673596382141113, 0.08933112025260925, 0.09192626923322678, 0.0945214256644249, 0.09711657464504242, 0.09971173107624054, 0.10230688750743866, 0.10490203648805618, 0.1074971854686737, 0.11009234189987183, 0.11268749088048935, 0.11528264731168747, 0.11787779629230499, 0.12047295272350311, 0.12306810915470123, 0.12566326558589935, 0.12825842201709747, 0.1308535784482956, 0.1334487348794937, 0.13604387640953064, 0.13863903284072876, 0.14123418927192688, 0.143829345703125, 0.14642450213432312, 0.14901964366436005]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 7.0, 4.0, 12.0, 9.0, 15.0, 20.0, 26.0, 26.0, 28.0, 33.0, 44.0, 46.0, 47.0, 57.0, 62.0, 48.0, 43.0, 49.0, 40.0, 45.0, 37.0, 52.0, 44.0, 41.0, 29.0, 27.0, 23.0, 28.0, 10.0, 10.0, 16.0, 9.0, 7.0, 3.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03702390193939209, -0.03600029647350311, -0.034976691007614136, -0.03395308926701546, -0.03292948380112648, -0.0319058783352375, -0.030882274731993675, -0.029858671128749847, -0.02883506566286087, -0.027811460196971893, -0.026787856593728065, -0.025764252990484238, -0.02474064752459526, -0.023717042058706284, -0.022693438455462456, -0.021669834852218628, -0.02064622938632965, -0.019622623920440674, -0.018599020317196846, -0.017575416713953018, -0.01655181124806404, -0.015528206713497639, -0.014504602178931236, -0.013480997644364834, -0.012457393109798431, -0.011433788575232029, -0.010410184040665627, -0.009386579506099224, -0.008362974971532822, -0.007339370436966419, -0.006315765902400017, -0.005292161367833614, -0.004268556833267212, -0.0032449522987008095, -0.002221347764134407, -0.0011977432295680046, -0.00017413869500160217, 0.0008494658395648003, 0.0018730703741312027, 0.002896674908697605, 0.003920279443264008, 0.00494388397783041, 0.0059674885123968124, 0.006991093046963215, 0.008014697581529617, 0.00903830211609602, 0.010061906650662422, 0.011085511185228825, 0.012109115719795227, 0.01313272025436163, 0.014156324788928032, 0.015179929323494434, 0.016203533858060837, 0.017227139323949814, 0.01825074292719364, 0.01927434653043747, 0.020297951996326447, 0.021321557462215424, 0.02234516106545925, 0.02336876466870308, 0.024392370134592056, 0.025415975600481033, 0.02643957920372486, 0.02746318280696869, 0.028486788272857666]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 2.0, 5.0, 13.0, 11.0, 15.0, 11.0, 21.0, 17.0, 21.0, 22.0, 25.0, 31.0, 27.0, 35.0, 26.0, 44.0, 35.0, 39.0, 30.0, 38.0, 50.0, 50.0, 46.0, 51.0, 32.0, 37.0, 29.0, 33.0, 35.0, 38.0, 18.0, 21.0, 18.0, 20.0, 13.0, 11.0, 10.0, 1.0, 3.0, 6.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.140625, -1.096954345703125, -1.05328369140625, -1.009613037109375, -0.9659423828125, -0.922271728515625, -0.87860107421875, -0.834930419921875, -0.791259765625, -0.747589111328125, -0.70391845703125, -0.660247802734375, -0.6165771484375, -0.572906494140625, -0.52923583984375, -0.485565185546875, -0.44189453125, -0.398223876953125, -0.35455322265625, -0.310882568359375, -0.2672119140625, -0.223541259765625, -0.17987060546875, -0.136199951171875, -0.092529296875, -0.048858642578125, -0.00518798828125, 0.038482666015625, 0.0821533203125, 0.125823974609375, 0.16949462890625, 0.213165283203125, 0.2568359375, 0.300506591796875, 0.34417724609375, 0.387847900390625, 0.4315185546875, 0.475189208984375, 0.51885986328125, 0.562530517578125, 0.606201171875, 0.649871826171875, 0.69354248046875, 0.737213134765625, 0.7808837890625, 0.824554443359375, 0.86822509765625, 0.911895751953125, 0.95556640625, 0.999237060546875, 1.04290771484375, 1.086578369140625, 1.1302490234375, 1.173919677734375, 1.21759033203125, 1.261260986328125, 1.304931640625, 1.348602294921875, 1.39227294921875, 1.435943603515625, 1.4796142578125, 1.523284912109375, 1.56695556640625, 1.610626220703125, 1.654296875]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 8.0, 7.0, 6.0, 7.0, 14.0, 21.0, 27.0, 30.0, 56.0, 79.0, 127.0, 213.0, 398.0, 777.0, 1487.0, 3008.0, 6655.0, 15754.0, 40167.0, 115016.0, 315271.0, 343234.0, 129180.0, 45431.0, 17403.0, 7448.0, 3301.0, 1562.0, 823.0, 424.0, 223.0, 152.0, 85.0, 52.0, 36.0, 26.0, 16.0, 9.0, 13.0, 7.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.16015625, -2.088287353515625, -2.01641845703125, -1.944549560546875, -1.8726806640625, -1.800811767578125, -1.72894287109375, -1.657073974609375, -1.585205078125, -1.513336181640625, -1.44146728515625, -1.369598388671875, -1.2977294921875, -1.225860595703125, -1.15399169921875, -1.082122802734375, -1.01025390625, -0.938385009765625, -0.86651611328125, -0.794647216796875, -0.7227783203125, -0.650909423828125, -0.57904052734375, -0.507171630859375, -0.435302734375, -0.363433837890625, -0.29156494140625, -0.219696044921875, -0.1478271484375, -0.075958251953125, -0.00408935546875, 0.067779541015625, 0.1396484375, 0.211517333984375, 0.28338623046875, 0.355255126953125, 0.4271240234375, 0.498992919921875, 0.57086181640625, 0.642730712890625, 0.714599609375, 0.786468505859375, 0.85833740234375, 0.930206298828125, 1.0020751953125, 1.073944091796875, 1.14581298828125, 1.217681884765625, 1.28955078125, 1.361419677734375, 1.43328857421875, 1.505157470703125, 1.5770263671875, 1.648895263671875, 1.72076416015625, 1.792633056640625, 1.864501953125, 1.936370849609375, 2.00823974609375, 2.080108642578125, 2.1519775390625, 2.223846435546875, 2.29571533203125, 2.367584228515625, 2.439453125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 5.0, 5.0, 6.0, 9.0, 14.0, 19.0, 13.0, 13.0, 23.0, 32.0, 22.0, 22.0, 29.0, 35.0, 61.0, 54.0, 60.0, 111.0, 178.0, 1374.0, 302.0, 159.0, 83.0, 49.0, 53.0, 50.0, 46.0, 37.0, 27.0, 34.0, 23.0, 18.0, 18.0, 14.0, 14.0, 7.0, 6.0, 10.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.623046875, -3.506072998046875, -3.38909912109375, -3.272125244140625, -3.1551513671875, -3.038177490234375, -2.92120361328125, -2.804229736328125, -2.687255859375, -2.570281982421875, -2.45330810546875, -2.336334228515625, -2.2193603515625, -2.102386474609375, -1.98541259765625, -1.868438720703125, -1.75146484375, -1.634490966796875, -1.51751708984375, -1.400543212890625, -1.2835693359375, -1.166595458984375, -1.04962158203125, -0.932647705078125, -0.815673828125, -0.698699951171875, -0.58172607421875, -0.464752197265625, -0.3477783203125, -0.230804443359375, -0.11383056640625, 0.003143310546875, 0.1201171875, 0.237091064453125, 0.35406494140625, 0.471038818359375, 0.5880126953125, 0.704986572265625, 0.82196044921875, 0.938934326171875, 1.055908203125, 1.172882080078125, 1.28985595703125, 1.406829833984375, 1.5238037109375, 1.640777587890625, 1.75775146484375, 1.874725341796875, 1.99169921875, 2.108673095703125, 2.22564697265625, 2.342620849609375, 2.4595947265625, 2.576568603515625, 2.69354248046875, 2.810516357421875, 2.927490234375, 3.044464111328125, 3.16143798828125, 3.278411865234375, 3.3953857421875, 3.512359619140625, 3.62933349609375, 3.746307373046875, 3.86328125]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 9.0, 8.0, 12.0, 17.0, 13.0, 19.0, 30.0, 38.0, 49.0, 57.0, 85.0, 121.0, 157.0, 196.0, 396.0, 880.0, 4284.0, 57802.0, 2455742.0, 604125.0, 18018.0, 1972.0, 603.0, 315.0, 212.0, 117.0, 88.0, 74.0, 66.0, 46.0, 33.0, 29.0, 28.0, 14.0, 16.0, 8.0, 4.0, 11.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.42578125, -6.2171630859375, -6.008544921875, -5.7999267578125, -5.59130859375, -5.3826904296875, -5.174072265625, -4.9654541015625, -4.7568359375, -4.5482177734375, -4.339599609375, -4.1309814453125, -3.92236328125, -3.7137451171875, -3.505126953125, -3.2965087890625, -3.087890625, -2.8792724609375, -2.670654296875, -2.4620361328125, -2.25341796875, -2.0447998046875, -1.836181640625, -1.6275634765625, -1.4189453125, -1.2103271484375, -1.001708984375, -0.7930908203125, -0.58447265625, -0.3758544921875, -0.167236328125, 0.0413818359375, 0.25, 0.4586181640625, 0.667236328125, 0.8758544921875, 1.08447265625, 1.2930908203125, 1.501708984375, 1.7103271484375, 1.9189453125, 2.1275634765625, 2.336181640625, 2.5447998046875, 2.75341796875, 2.9620361328125, 3.170654296875, 3.3792724609375, 3.587890625, 3.7965087890625, 4.005126953125, 4.2137451171875, 4.42236328125, 4.6309814453125, 4.839599609375, 5.0482177734375, 5.2568359375, 5.4654541015625, 5.674072265625, 5.8826904296875, 6.09130859375, 6.2999267578125, 6.508544921875, 6.7171630859375, 6.92578125]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 41.0, 720.0, 250.0, 7.0], "bins": [-106.87787628173828, -105.1459732055664, -103.4140625, -101.68215942382812, -99.95025634765625, -98.21834564208984, -96.48644256591797, -94.75453186035156, -93.02262878417969, -91.29072570800781, -89.5588150024414, -87.82691192626953, -86.09500122070312, -84.36309814453125, -82.63119506835938, -80.89928436279297, -79.1673812866211, -77.43547821044922, -75.70356750488281, -73.97166442871094, -72.23976135253906, -70.50785064697266, -68.77594757080078, -67.04403686523438, -65.3121337890625, -63.58022689819336, -61.84832000732422, -60.116416931152344, -58.3845100402832, -56.65260314941406, -54.92070007324219, -53.18879318237305, -51.456886291503906, -49.724979400634766, -47.993072509765625, -46.26116943359375, -44.52926254272461, -42.79735565185547, -41.065452575683594, -39.33354568481445, -37.60163879394531, -35.86973190307617, -34.13782501220703, -32.405921936035156, -30.674015045166016, -28.942108154296875, -27.210203170776367, -25.47829818725586, -23.74639129638672, -22.014484405517578, -20.28257942199707, -18.550674438476562, -16.818767547607422, -15.086861610412598, -13.354955673217773, -11.62304973602295, -9.891143798828125, -8.1592378616333, -6.427331924438477, -4.695425987243652, -2.963520050048828, -1.231614112854004, 0.5002918243408203, 2.2321977615356445, 3.9641032218933105]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0, 8.0, 5.0, 5.0, 2.0, 9.0, 8.0, 14.0, 14.0, 21.0, 21.0, 25.0, 22.0, 23.0, 22.0, 31.0, 20.0, 32.0, 31.0, 37.0, 32.0, 40.0, 37.0, 44.0, 52.0, 41.0, 35.0, 40.0, 40.0, 41.0, 36.0, 33.0, 27.0, 22.0, 19.0, 27.0, 16.0, 17.0, 12.0, 12.0, 0.0, 7.0, 5.0, 6.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.667598724365234, -8.377462387084961, -8.087326049804688, -7.797189712524414, -7.507053852081299, -7.216917514801025, -6.926781177520752, -6.636645317077637, -6.346508979797363, -6.05637264251709, -5.766236305236816, -5.476099967956543, -5.185964107513428, -4.895827770233154, -4.605691432952881, -4.315555572509766, -4.025418758392334, -3.7352824211120605, -3.445146322250366, -3.1550099849700928, -2.8648738861083984, -2.574737548828125, -2.2846012115478516, -1.9944651126861572, -1.7043287754058838, -1.4141925573349, -1.124056339263916, -0.8339200019836426, -0.5437837839126587, -0.2536475658416748, 0.03648877143859863, 0.32662487030029297, 0.6167612075805664, 0.9068974256515503, 1.1970336437225342, 1.4871699810028076, 1.7773061990737915, 2.0674424171447754, 2.357578754425049, 2.647714853286743, 2.9378511905670166, 3.22798752784729, 3.5181236267089844, 3.808259963989258, 4.098396301269531, 4.388532638549805, 4.678668975830078, 4.968804836273193, 5.258941173553467, 5.54907751083374, 5.839213848114014, 6.129349708557129, 6.419486045837402, 6.709622383117676, 6.999758720397949, 7.289895057678223, 7.580031394958496, 7.8701677322387695, 8.160304069519043, 8.450440406799316, 8.74057674407959, 9.030712127685547, 9.32084846496582, 9.610984802246094, 9.901121139526367]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 6.0, 6.0, 5.0, 8.0, 8.0, 6.0, 13.0, 12.0, 10.0, 16.0, 24.0, 22.0, 25.0, 24.0, 22.0, 27.0, 26.0, 37.0, 33.0, 40.0, 33.0, 31.0, 31.0, 50.0, 34.0, 46.0, 38.0, 34.0, 29.0, 34.0, 30.0, 22.0, 30.0, 31.0, 19.0, 28.0, 29.0, 18.0, 17.0, 10.0, 9.0, 3.0, 7.0, 8.0, 4.0, 5.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0576171875, -1.0165863037109375, -0.975555419921875, -0.9345245361328125, -0.89349365234375, -0.8524627685546875, -0.811431884765625, -0.7704010009765625, -0.7293701171875, -0.6883392333984375, -0.647308349609375, -0.6062774658203125, -0.56524658203125, -0.5242156982421875, -0.483184814453125, -0.4421539306640625, -0.401123046875, -0.3600921630859375, -0.319061279296875, -0.2780303955078125, -0.23699951171875, -0.1959686279296875, -0.154937744140625, -0.1139068603515625, -0.0728759765625, -0.0318450927734375, 0.009185791015625, 0.0502166748046875, 0.09124755859375, 0.1322784423828125, 0.173309326171875, 0.2143402099609375, 0.25537109375, 0.2964019775390625, 0.337432861328125, 0.3784637451171875, 0.41949462890625, 0.4605255126953125, 0.501556396484375, 0.5425872802734375, 0.5836181640625, 0.6246490478515625, 0.665679931640625, 0.7067108154296875, 0.74774169921875, 0.7887725830078125, 0.829803466796875, 0.8708343505859375, 0.911865234375, 0.9528961181640625, 0.993927001953125, 1.0349578857421875, 1.07598876953125, 1.1170196533203125, 1.158050537109375, 1.1990814208984375, 1.2401123046875, 1.2811431884765625, 1.322174072265625, 1.3632049560546875, 1.40423583984375, 1.4452667236328125, 1.486297607421875, 1.5273284912109375, 1.568359375]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 3.0, 12.0, 8.0, 22.0, 26.0, 50.0, 54.0, 93.0, 150.0, 189.0, 309.0, 430.0, 618.0, 1071.0, 1684.0, 2647.0, 4746.0, 8780.0, 17811.0, 41008.0, 108865.0, 327604.0, 1032877.0, 1618558.0, 679651.0, 212702.0, 74154.0, 29834.0, 13643.0, 6832.0, 3738.0, 2286.0, 1301.0, 859.0, 556.0, 373.0, 248.0, 163.0, 102.0, 86.0, 42.0, 29.0, 25.0, 12.0, 11.0, 9.0, 4.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.935546875, -1.87744140625, -1.8193359375, -1.76123046875, -1.703125, -1.64501953125, -1.5869140625, -1.52880859375, -1.470703125, -1.41259765625, -1.3544921875, -1.29638671875, -1.23828125, -1.18017578125, -1.1220703125, -1.06396484375, -1.005859375, -0.94775390625, -0.8896484375, -0.83154296875, -0.7734375, -0.71533203125, -0.6572265625, -0.59912109375, -0.541015625, -0.48291015625, -0.4248046875, -0.36669921875, -0.30859375, -0.25048828125, -0.1923828125, -0.13427734375, -0.076171875, -0.01806640625, 0.0400390625, 0.09814453125, 0.15625, 0.21435546875, 0.2724609375, 0.33056640625, 0.388671875, 0.44677734375, 0.5048828125, 0.56298828125, 0.62109375, 0.67919921875, 0.7373046875, 0.79541015625, 0.853515625, 0.91162109375, 0.9697265625, 1.02783203125, 1.0859375, 1.14404296875, 1.2021484375, 1.26025390625, 1.318359375, 1.37646484375, 1.4345703125, 1.49267578125, 1.55078125, 1.60888671875, 1.6669921875, 1.72509765625, 1.783203125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 7.0, 2.0, 6.0, 8.0, 8.0, 16.0, 13.0, 32.0, 27.0, 44.0, 60.0, 99.0, 146.0, 209.0, 305.0, 364.0, 508.0, 510.0, 464.0, 361.0, 266.0, 161.0, 122.0, 94.0, 72.0, 59.0, 32.0, 31.0, 19.0, 15.0, 10.0, 3.0, 5.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8359375, -2.75811767578125, -2.6802978515625, -2.60247802734375, -2.524658203125, -2.44683837890625, -2.3690185546875, -2.29119873046875, -2.21337890625, -2.13555908203125, -2.0577392578125, -1.97991943359375, -1.902099609375, -1.82427978515625, -1.7464599609375, -1.66864013671875, -1.5908203125, -1.51300048828125, -1.4351806640625, -1.35736083984375, -1.279541015625, -1.20172119140625, -1.1239013671875, -1.04608154296875, -0.96826171875, -0.89044189453125, -0.8126220703125, -0.73480224609375, -0.656982421875, -0.57916259765625, -0.5013427734375, -0.42352294921875, -0.345703125, -0.26788330078125, -0.1900634765625, -0.11224365234375, -0.034423828125, 0.04339599609375, 0.1212158203125, 0.19903564453125, 0.27685546875, 0.35467529296875, 0.4324951171875, 0.51031494140625, 0.588134765625, 0.66595458984375, 0.7437744140625, 0.82159423828125, 0.8994140625, 0.97723388671875, 1.0550537109375, 1.13287353515625, 1.210693359375, 1.28851318359375, 1.3663330078125, 1.44415283203125, 1.52197265625, 1.59979248046875, 1.6776123046875, 1.75543212890625, 1.833251953125, 1.91107177734375, 1.9888916015625, 2.06671142578125, 2.14453125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 3.0, 4.0, 8.0, 13.0, 20.0, 24.0, 37.0, 38.0, 69.0, 108.0, 126.0, 192.0, 346.0, 548.0, 1570.0, 7582.0, 63716.0, 1154502.0, 2795571.0, 150891.0, 14327.0, 2554.0, 779.0, 394.0, 244.0, 164.0, 109.0, 88.0, 61.0, 54.0, 40.0, 23.0, 25.0, 21.0, 8.0, 10.0, 5.0, 7.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.34765625, -5.15081787109375, -4.9539794921875, -4.75714111328125, -4.560302734375, -4.36346435546875, -4.1666259765625, -3.96978759765625, -3.77294921875, -3.57611083984375, -3.3792724609375, -3.18243408203125, -2.985595703125, -2.78875732421875, -2.5919189453125, -2.39508056640625, -2.1982421875, -2.00140380859375, -1.8045654296875, -1.60772705078125, -1.410888671875, -1.21405029296875, -1.0172119140625, -0.82037353515625, -0.62353515625, -0.42669677734375, -0.2298583984375, -0.03302001953125, 0.163818359375, 0.36065673828125, 0.5574951171875, 0.75433349609375, 0.951171875, 1.14801025390625, 1.3448486328125, 1.54168701171875, 1.738525390625, 1.93536376953125, 2.1322021484375, 2.32904052734375, 2.52587890625, 2.72271728515625, 2.9195556640625, 3.11639404296875, 3.313232421875, 3.51007080078125, 3.7069091796875, 3.90374755859375, 4.1005859375, 4.29742431640625, 4.4942626953125, 4.69110107421875, 4.887939453125, 5.08477783203125, 5.2816162109375, 5.47845458984375, 5.67529296875, 5.87213134765625, 6.0689697265625, 6.26580810546875, 6.462646484375, 6.65948486328125, 6.8563232421875, 7.05316162109375, 7.25]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 64.0, 335.0, 432.0, 153.0, 24.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.16972541809082, -23.70330047607422, -22.236873626708984, -20.770448684692383, -19.30402374267578, -17.83759880065918, -16.371173858642578, -14.904747009277344, -13.438322067260742, -11.97189712524414, -10.505471229553223, -9.039045333862305, -7.572620391845703, -6.106194972991943, -4.639769554138184, -3.1733436584472656, -1.706918716430664, -0.2404932975769043, 1.2259321212768555, 2.6923575401306152, 4.158782958984375, 5.625208377838135, 7.0916337966918945, 8.558059692382812, 10.024484634399414, 11.490909576416016, 12.957335472106934, 14.423761367797852, 15.890186309814453, 17.356611251831055, 18.823036193847656, 20.28946304321289, 21.755889892578125, 23.222314834594727, 24.688739776611328, 26.155166625976562, 27.621591567993164, 29.088016510009766, 30.554443359375, 32.02086639404297, 33.4872932434082, 34.95372009277344, 36.420143127441406, 37.88656997680664, 39.352996826171875, 40.819419860839844, 42.28584671020508, 43.75227355957031, 45.21869659423828, 46.685123443603516, 48.151546478271484, 49.61797332763672, 51.08439636230469, 52.55082321166992, 54.017250061035156, 55.483673095703125, 56.95009994506836, 58.416526794433594, 59.88294982910156, 61.3493766784668, 62.81580352783203, 64.2822265625, 65.74864959716797, 67.21508026123047, 68.68150329589844]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 7.0, 17.0, 13.0, 13.0, 10.0, 19.0, 13.0, 19.0, 20.0, 21.0, 34.0, 29.0, 37.0, 29.0, 31.0, 32.0, 37.0, 32.0, 38.0, 44.0, 37.0, 35.0, 42.0, 25.0, 35.0, 28.0, 31.0, 37.0, 27.0, 30.0, 24.0, 25.0, 14.0, 17.0, 16.0, 16.0, 10.0, 9.0, 11.0, 8.0, 2.0, 5.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.68221378326416, -6.460510730743408, -6.238807678222656, -6.017104625701904, -5.795401573181152, -5.573698043823242, -5.351995468139648, -5.130291938781738, -4.908588886260986, -4.686885833740234, -4.465182781219482, -4.2434797286987305, -4.0217766761779785, -3.8000733852386475, -3.5783703327178955, -3.3566670417785645, -3.1349642276763916, -2.9132611751556396, -2.6915581226348877, -2.4698548316955566, -2.2481517791748047, -2.0264487266540527, -1.8047456741333008, -1.5830425024032593, -1.3613394498825073, -1.1396363973617554, -0.9179332256317139, -0.6962301731109619, -0.4745270609855652, -0.25282394886016846, -0.031120896339416504, 0.190582275390625, 0.41228532791137695, 0.6339884400367737, 0.8556915521621704, 1.0773946046829224, 1.2990977764129639, 1.5208008289337158, 1.7425038814544678, 1.9642070531845093, 2.185910224914551, 2.4076132774353027, 2.6293163299560547, 2.8510193824768066, 3.0727226734161377, 3.2944257259368896, 3.5161287784576416, 3.7378320693969727, 3.9595348834991455, 4.181238174438477, 4.4029412269592285, 4.6246442794799805, 4.846347332000732, 5.068050384521484, 5.289753437042236, 5.511456489562988, 5.73315954208374, 5.954862594604492, 6.176565647125244, 6.398268699645996, 6.619971752166748, 6.8416748046875, 7.06337833404541, 7.285081386566162, 7.506784439086914]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 5.0, 9.0, 4.0, 11.0, 9.0, 18.0, 10.0, 14.0, 17.0, 27.0, 33.0, 32.0, 22.0, 25.0, 25.0, 28.0, 40.0, 40.0, 40.0, 38.0, 45.0, 55.0, 31.0, 46.0, 45.0, 37.0, 34.0, 35.0, 31.0, 32.0, 26.0, 21.0, 12.0, 19.0, 22.0, 15.0, 10.0, 10.0, 9.0, 5.0, 6.0, 5.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.109375, -1.0669403076171875, -1.024505615234375, -0.9820709228515625, -0.93963623046875, -0.8972015380859375, -0.854766845703125, -0.8123321533203125, -0.7698974609375, -0.7274627685546875, -0.685028076171875, -0.6425933837890625, -0.60015869140625, -0.5577239990234375, -0.515289306640625, -0.4728546142578125, -0.430419921875, -0.3879852294921875, -0.345550537109375, -0.3031158447265625, -0.26068115234375, -0.2182464599609375, -0.175811767578125, -0.1333770751953125, -0.0909423828125, -0.0485076904296875, -0.006072998046875, 0.0363616943359375, 0.07879638671875, 0.1212310791015625, 0.163665771484375, 0.2061004638671875, 0.24853515625, 0.2909698486328125, 0.333404541015625, 0.3758392333984375, 0.41827392578125, 0.4607086181640625, 0.503143310546875, 0.5455780029296875, 0.5880126953125, 0.6304473876953125, 0.672882080078125, 0.7153167724609375, 0.75775146484375, 0.8001861572265625, 0.842620849609375, 0.8850555419921875, 0.927490234375, 0.9699249267578125, 1.012359619140625, 1.0547943115234375, 1.09722900390625, 1.1396636962890625, 1.182098388671875, 1.2245330810546875, 1.2669677734375, 1.3094024658203125, 1.351837158203125, 1.3942718505859375, 1.43670654296875, 1.4791412353515625, 1.521575927734375, 1.5640106201171875, 1.6064453125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 10.0, 10.0, 6.0, 13.0, 13.0, 32.0, 33.0, 26.0, 61.0, 82.0, 114.0, 168.0, 220.0, 296.0, 467.0, 564.0, 761.0, 1096.0, 1520.0, 2314.0, 3942.0, 8787.0, 25476.0, 79024.0, 222186.0, 360557.0, 218455.0, 77185.0, 24643.0, 8764.0, 4050.0, 2315.0, 1466.0, 1070.0, 756.0, 540.0, 433.0, 310.0, 219.0, 176.0, 107.0, 71.0, 68.0, 46.0, 37.0, 23.0, 13.0, 15.0, 5.0, 5.0, 6.0, 7.0, 1.0, 0.0, 2.0], "bins": [-0.279052734375, -0.2709617614746094, -0.26287078857421875, -0.2547798156738281, -0.2466888427734375, -0.23859786987304688, -0.23050689697265625, -0.22241592407226562, -0.214324951171875, -0.20623397827148438, -0.19814300537109375, -0.19005203247070312, -0.1819610595703125, -0.17387008666992188, -0.16577911376953125, -0.15768814086914062, -0.14959716796875, -0.14150619506835938, -0.13341522216796875, -0.12532424926757812, -0.1172332763671875, -0.10914230346679688, -0.10105133056640625, -0.09296035766601562, -0.084869384765625, -0.07677841186523438, -0.06868743896484375, -0.060596466064453125, -0.0525054931640625, -0.044414520263671875, -0.03632354736328125, -0.028232574462890625, -0.0201416015625, -0.012050628662109375, -0.00395965576171875, 0.004131317138671875, 0.0122222900390625, 0.020313262939453125, 0.02840423583984375, 0.036495208740234375, 0.044586181640625, 0.052677154541015625, 0.06076812744140625, 0.06885910034179688, 0.0769500732421875, 0.08504104614257812, 0.09313201904296875, 0.10122299194335938, 0.10931396484375, 0.11740493774414062, 0.12549591064453125, 0.13358688354492188, 0.1416778564453125, 0.14976882934570312, 0.15785980224609375, 0.16595077514648438, 0.174041748046875, 0.18213272094726562, 0.19022369384765625, 0.19831466674804688, 0.2064056396484375, 0.21449661254882812, 0.22258758544921875, 0.23067855834960938, 0.23876953125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 5.0, 0.0, 4.0, 1.0, 5.0, 9.0, 9.0, 12.0, 15.0, 17.0, 21.0, 21.0, 16.0, 24.0, 23.0, 39.0, 41.0, 37.0, 39.0, 46.0, 33.0, 35.0, 35.0, 1079.0, 44.0, 46.0, 38.0, 37.0, 27.0, 31.0, 17.0, 21.0, 30.0, 18.0, 22.0, 22.0, 21.0, 16.0, 12.0, 18.0, 10.0, 12.0, 6.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0], "bins": [-1.0087890625, -0.98095703125, -0.953125, -0.92529296875, -0.8974609375, -0.86962890625, -0.841796875, -0.81396484375, -0.7861328125, -0.75830078125, -0.73046875, -0.70263671875, -0.6748046875, -0.64697265625, -0.619140625, -0.59130859375, -0.5634765625, -0.53564453125, -0.5078125, -0.47998046875, -0.4521484375, -0.42431640625, -0.396484375, -0.36865234375, -0.3408203125, -0.31298828125, -0.28515625, -0.25732421875, -0.2294921875, -0.20166015625, -0.173828125, -0.14599609375, -0.1181640625, -0.09033203125, -0.0625, -0.03466796875, -0.0068359375, 0.02099609375, 0.048828125, 0.07666015625, 0.1044921875, 0.13232421875, 0.16015625, 0.18798828125, 0.2158203125, 0.24365234375, 0.271484375, 0.29931640625, 0.3271484375, 0.35498046875, 0.3828125, 0.41064453125, 0.4384765625, 0.46630859375, 0.494140625, 0.52197265625, 0.5498046875, 0.57763671875, 0.60546875, 0.63330078125, 0.6611328125, 0.68896484375, 0.716796875, 0.74462890625, 0.7724609375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 8.0, 15.0, 14.0, 12.0, 24.0, 24.0, 33.0, 40.0, 63.0, 100.0, 115.0, 178.0, 272.0, 512.0, 836.0, 1556.0, 3509.0, 11926.0, 56589.0, 271844.0, 1504126.0, 192136.0, 38478.0, 8638.0, 2835.0, 1254.0, 702.0, 459.0, 243.0, 175.0, 105.0, 92.0, 44.0, 61.0, 34.0, 17.0, 14.0, 6.0, 7.0, 10.0, 7.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.276611328125, -0.2685661315917969, -0.26052093505859375, -0.2524757385253906, -0.2444305419921875, -0.23638534545898438, -0.22834014892578125, -0.22029495239257812, -0.212249755859375, -0.20420455932617188, -0.19615936279296875, -0.18811416625976562, -0.1800689697265625, -0.17202377319335938, -0.16397857666015625, -0.15593338012695312, -0.14788818359375, -0.13984298706054688, -0.13179779052734375, -0.12375259399414062, -0.1157073974609375, -0.10766220092773438, -0.09961700439453125, -0.09157180786132812, -0.083526611328125, -0.07548141479492188, -0.06743621826171875, -0.059391021728515625, -0.0513458251953125, -0.043300628662109375, -0.03525543212890625, -0.027210235595703125, -0.0191650390625, -0.011119842529296875, -0.00307464599609375, 0.004970550537109375, 0.0130157470703125, 0.021060943603515625, 0.02910614013671875, 0.037151336669921875, 0.045196533203125, 0.053241729736328125, 0.06128692626953125, 0.06933212280273438, 0.0773773193359375, 0.08542251586914062, 0.09346771240234375, 0.10151290893554688, 0.10955810546875, 0.11760330200195312, 0.12564849853515625, 0.13369369506835938, 0.1417388916015625, 0.14978408813476562, 0.15782928466796875, 0.16587448120117188, 0.173919677734375, 0.18196487426757812, 0.19001007080078125, 0.19805526733398438, 0.2061004638671875, 0.21414566040039062, 0.22219085693359375, 0.23023605346679688, 0.23828125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 5.0, 11.0, 16.0, 38.0, 93.0, 355.0, 300.0, 98.0, 36.0, 18.0, 6.0, 3.0, 0.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051055908203125, -0.04935264587402344, -0.047649383544921875, -0.04594612121582031, -0.04424285888671875, -0.04253959655761719, -0.040836334228515625, -0.03913307189941406, -0.0374298095703125, -0.03572654724121094, -0.034023284912109375, -0.03232002258300781, -0.03061676025390625, -0.028913497924804688, -0.027210235595703125, -0.025506973266601562, -0.0238037109375, -0.022100448608398438, -0.020397186279296875, -0.018693923950195312, -0.01699066162109375, -0.015287399291992188, -0.013584136962890625, -0.011880874633789062, -0.0101776123046875, -0.008474349975585938, -0.006771087646484375, -0.0050678253173828125, -0.00336456298828125, -0.0016613006591796875, 4.1961669921875e-05, 0.0017452239990234375, 0.003448486328125, 0.0051517486572265625, 0.006855010986328125, 0.008558273315429688, 0.01026153564453125, 0.011964797973632812, 0.013668060302734375, 0.015371322631835938, 0.0170745849609375, 0.018777847290039062, 0.020481109619140625, 0.022184371948242188, 0.02388763427734375, 0.025590896606445312, 0.027294158935546875, 0.028997421264648438, 0.03070068359375, 0.03240394592285156, 0.034107208251953125, 0.03581047058105469, 0.03751373291015625, 0.03921699523925781, 0.040920257568359375, 0.04262351989746094, 0.0443267822265625, 0.04603004455566406, 0.047733306884765625, 0.04943656921386719, 0.05113983154296875, 0.05284309387207031, 0.054546356201171875, 0.05624961853027344, 0.057952880859375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 4.0, 3.0, 3.0, 16.0, 18.0, 44.0, 123.0, 77459.0, 970668.0, 105.0, 49.0, 21.0, 16.0, 4.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.609375, -1.56207275390625, -1.5147705078125, -1.46746826171875, -1.420166015625, -1.37286376953125, -1.3255615234375, -1.27825927734375, -1.23095703125, -1.18365478515625, -1.1363525390625, -1.08905029296875, -1.041748046875, -0.99444580078125, -0.9471435546875, -0.89984130859375, -0.8525390625, -0.80523681640625, -0.7579345703125, -0.71063232421875, -0.663330078125, -0.61602783203125, -0.5687255859375, -0.52142333984375, -0.47412109375, -0.42681884765625, -0.3795166015625, -0.33221435546875, -0.284912109375, -0.23760986328125, -0.1903076171875, -0.14300537109375, -0.095703125, -0.04840087890625, -0.0010986328125, 0.04620361328125, 0.093505859375, 0.14080810546875, 0.1881103515625, 0.23541259765625, 0.28271484375, 0.33001708984375, 0.3773193359375, 0.42462158203125, 0.471923828125, 0.51922607421875, 0.5665283203125, 0.61383056640625, 0.6611328125, 0.70843505859375, 0.7557373046875, 0.80303955078125, 0.850341796875, 0.89764404296875, 0.9449462890625, 0.99224853515625, 1.03955078125, 1.08685302734375, 1.1341552734375, 1.18145751953125, 1.228759765625, 1.27606201171875, 1.3233642578125, 1.37066650390625, 1.41796875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 77.0, 786.0, 143.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19209235906600952, -0.18857504427433014, -0.18505771458148956, -0.18154039978981018, -0.1780230700969696, -0.17450575530529022, -0.17098842561244965, -0.16747111082077026, -0.1639537811279297, -0.1604364663362503, -0.15691913664340973, -0.15340182185173035, -0.14988449215888977, -0.1463671773672104, -0.1428498476743698, -0.13933253288269043, -0.13581520318984985, -0.13229788839817047, -0.1287805587053299, -0.1252632439136505, -0.12174591422080994, -0.11822859197854996, -0.11471126973628998, -0.1111939549446106, -0.10767664015293121, -0.10415931791067123, -0.10064199566841125, -0.09712467342615128, -0.0936073511838913, -0.09009002894163132, -0.08657270669937134, -0.08305539190769196, -0.07953806966543198, -0.076020747423172, -0.07250342518091202, -0.06898610293865204, -0.06546878069639206, -0.06195145845413208, -0.0584341399371624, -0.05491681769490242, -0.05139949545264244, -0.04788217321038246, -0.04436485096812248, -0.0408475324511528, -0.03733021020889282, -0.03381288796663284, -0.030295565724372864, -0.026778243482112885, -0.023260921239852905, -0.019743598997592926, -0.016226276755332947, -0.012708956375718117, -0.009191634133458138, -0.005674311891198158, -0.0021569915115833282, 0.001360330730676651, 0.00487765297293663, 0.00839497521519661, 0.011912296526134014, 0.015429617837071419, 0.018946940079331398, 0.022464262321591377, 0.025981582701206207, 0.029498904943466187, 0.033016227185726166]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 2.0, 3.0, 1.0, 9.0, 8.0, 2.0, 9.0, 14.0, 21.0, 17.0, 20.0, 22.0, 20.0, 32.0, 32.0, 29.0, 22.0, 40.0, 31.0, 37.0, 40.0, 36.0, 34.0, 35.0, 38.0, 51.0, 37.0, 40.0, 31.0, 36.0, 30.0, 29.0, 31.0, 28.0, 19.0, 19.0, 15.0, 19.0, 15.0, 7.0, 7.0, 5.0, 10.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.02780771255493164, -0.026981748640537262, -0.026155782863497734, -0.025329817086458206, -0.024503853172063828, -0.02367788925766945, -0.02285192348062992, -0.022025957703590393, -0.021199993789196014, -0.020374029874801636, -0.019548064097762108, -0.01872209832072258, -0.0178961344063282, -0.017070170491933823, -0.016244204714894295, -0.015418239869177341, -0.014592275023460388, -0.013766310177743435, -0.012940345332026482, -0.012114380486309528, -0.011288415640592575, -0.010462450794875622, -0.009636485949158669, -0.008810521103441715, -0.007984556257724762, -0.007158591412007809, -0.006332626566290855, -0.005506661720573902, -0.004680696874856949, -0.0038547320291399956, -0.0030287671834230423, -0.002202802337706089, -0.0013768374919891357, -0.0005508726462721825, 0.0002750921994447708, 0.001101057045161724, 0.0019270218908786774, 0.0027529867365956306, 0.003578951582312584, 0.004404916428029537, 0.0052308812737464905, 0.006056846119463444, 0.006882810965180397, 0.00770877581089735, 0.008534740656614304, 0.009360705502331257, 0.01018667034804821, 0.011012635193765163, 0.011838600039482117, 0.01266456488519907, 0.013490529730916023, 0.014316494576632977, 0.01514245942234993, 0.01596842333674431, 0.016794389113783836, 0.017620354890823364, 0.018446318805217743, 0.01927228271961212, 0.02009824849665165, 0.020924214273691177, 0.021750178188085556, 0.022576142102479935, 0.023402107879519463, 0.02422807365655899, 0.02505403757095337]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 6.0, 8.0, 4.0, 11.0, 10.0, 17.0, 11.0, 14.0, 16.0, 29.0, 31.0, 32.0, 22.0, 25.0, 25.0, 28.0, 41.0, 39.0, 41.0, 40.0, 43.0, 54.0, 32.0, 46.0, 47.0, 37.0, 31.0, 35.0, 32.0, 31.0, 26.0, 21.0, 13.0, 19.0, 21.0, 15.0, 10.0, 10.0, 9.0, 6.0, 5.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1083984375, -1.0659637451171875, -1.023529052734375, -0.9810943603515625, -0.93865966796875, -0.8962249755859375, -0.853790283203125, -0.8113555908203125, -0.7689208984375, -0.7264862060546875, -0.684051513671875, -0.6416168212890625, -0.59918212890625, -0.5567474365234375, -0.514312744140625, -0.4718780517578125, -0.429443359375, -0.3870086669921875, -0.344573974609375, -0.3021392822265625, -0.25970458984375, -0.2172698974609375, -0.174835205078125, -0.1324005126953125, -0.0899658203125, -0.0475311279296875, -0.005096435546875, 0.0373382568359375, 0.07977294921875, 0.1222076416015625, 0.164642333984375, 0.2070770263671875, 0.24951171875, 0.2919464111328125, 0.334381103515625, 0.3768157958984375, 0.41925048828125, 0.4616851806640625, 0.504119873046875, 0.5465545654296875, 0.5889892578125, 0.6314239501953125, 0.673858642578125, 0.7162933349609375, 0.75872802734375, 0.8011627197265625, 0.843597412109375, 0.8860321044921875, 0.928466796875, 0.9709014892578125, 1.013336181640625, 1.0557708740234375, 1.09820556640625, 1.1406402587890625, 1.183074951171875, 1.2255096435546875, 1.2679443359375, 1.3103790283203125, 1.352813720703125, 1.3952484130859375, 1.43768310546875, 1.4801177978515625, 1.522552490234375, 1.5649871826171875, 1.607421875]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 8.0, 6.0, 7.0, 12.0, 22.0, 29.0, 27.0, 48.0, 73.0, 87.0, 109.0, 158.0, 239.0, 431.0, 673.0, 1268.0, 2386.0, 5036.0, 11527.0, 27770.0, 73193.0, 245429.0, 457338.0, 139616.0, 47936.0, 18936.0, 8247.0, 3631.0, 1831.0, 955.0, 539.0, 321.0, 169.0, 132.0, 98.0, 76.0, 42.0, 35.0, 30.0, 30.0, 15.0, 16.0, 8.0, 9.0, 8.0, 2.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.576171875, -2.491119384765625, -2.40606689453125, -2.321014404296875, -2.2359619140625, -2.150909423828125, -2.06585693359375, -1.980804443359375, -1.895751953125, -1.810699462890625, -1.72564697265625, -1.640594482421875, -1.5555419921875, -1.470489501953125, -1.38543701171875, -1.300384521484375, -1.21533203125, -1.130279541015625, -1.04522705078125, -0.960174560546875, -0.8751220703125, -0.790069580078125, -0.70501708984375, -0.619964599609375, -0.534912109375, -0.449859619140625, -0.36480712890625, -0.279754638671875, -0.1947021484375, -0.109649658203125, -0.02459716796875, 0.060455322265625, 0.1455078125, 0.230560302734375, 0.31561279296875, 0.400665283203125, 0.4857177734375, 0.570770263671875, 0.65582275390625, 0.740875244140625, 0.825927734375, 0.910980224609375, 0.99603271484375, 1.081085205078125, 1.1661376953125, 1.251190185546875, 1.33624267578125, 1.421295166015625, 1.50634765625, 1.591400146484375, 1.67645263671875, 1.761505126953125, 1.8465576171875, 1.931610107421875, 2.01666259765625, 2.101715087890625, 2.186767578125, 2.271820068359375, 2.35687255859375, 2.441925048828125, 2.5269775390625, 2.612030029296875, 2.69708251953125, 2.782135009765625, 2.8671875]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 7.0, 7.0, 12.0, 12.0, 12.0, 23.0, 12.0, 15.0, 37.0, 31.0, 25.0, 27.0, 37.0, 29.0, 46.0, 69.0, 86.0, 146.0, 232.0, 1314.0, 234.0, 124.0, 71.0, 59.0, 49.0, 35.0, 26.0, 38.0, 34.0, 28.0, 20.0, 23.0, 22.0, 13.0, 10.0, 7.0, 14.0, 11.0, 14.0, 4.0, 3.0, 8.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.90234375, -2.80377197265625, -2.7052001953125, -2.60662841796875, -2.508056640625, -2.40948486328125, -2.3109130859375, -2.21234130859375, -2.11376953125, -2.01519775390625, -1.9166259765625, -1.81805419921875, -1.719482421875, -1.62091064453125, -1.5223388671875, -1.42376708984375, -1.3251953125, -1.22662353515625, -1.1280517578125, -1.02947998046875, -0.930908203125, -0.83233642578125, -0.7337646484375, -0.63519287109375, -0.53662109375, -0.43804931640625, -0.3394775390625, -0.24090576171875, -0.142333984375, -0.04376220703125, 0.0548095703125, 0.15338134765625, 0.251953125, 0.35052490234375, 0.4490966796875, 0.54766845703125, 0.646240234375, 0.74481201171875, 0.8433837890625, 0.94195556640625, 1.04052734375, 1.13909912109375, 1.2376708984375, 1.33624267578125, 1.434814453125, 1.53338623046875, 1.6319580078125, 1.73052978515625, 1.8291015625, 1.92767333984375, 2.0262451171875, 2.12481689453125, 2.223388671875, 2.32196044921875, 2.4205322265625, 2.51910400390625, 2.61767578125, 2.71624755859375, 2.8148193359375, 2.91339111328125, 3.011962890625, 3.11053466796875, 3.2091064453125, 3.30767822265625, 3.40625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 13.0, 10.0, 19.0, 13.0, 26.0, 23.0, 41.0, 41.0, 65.0, 52.0, 97.0, 112.0, 157.0, 207.0, 337.0, 722.0, 2335.0, 13923.0, 154696.0, 2642867.0, 303080.0, 21301.0, 3311.0, 938.0, 385.0, 228.0, 154.0, 109.0, 83.0, 72.0, 61.0, 36.0, 42.0, 22.0, 24.0, 20.0, 18.0, 12.0, 9.0, 6.0, 8.0, 2.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.51953125, -6.33111572265625, -6.1427001953125, -5.95428466796875, -5.765869140625, -5.57745361328125, -5.3890380859375, -5.20062255859375, -5.01220703125, -4.82379150390625, -4.6353759765625, -4.44696044921875, -4.258544921875, -4.07012939453125, -3.8817138671875, -3.69329833984375, -3.5048828125, -3.31646728515625, -3.1280517578125, -2.93963623046875, -2.751220703125, -2.56280517578125, -2.3743896484375, -2.18597412109375, -1.99755859375, -1.80914306640625, -1.6207275390625, -1.43231201171875, -1.243896484375, -1.05548095703125, -0.8670654296875, -0.67864990234375, -0.490234375, -0.30181884765625, -0.1134033203125, 0.07501220703125, 0.263427734375, 0.45184326171875, 0.6402587890625, 0.82867431640625, 1.01708984375, 1.20550537109375, 1.3939208984375, 1.58233642578125, 1.770751953125, 1.95916748046875, 2.1475830078125, 2.33599853515625, 2.5244140625, 2.71282958984375, 2.9012451171875, 3.08966064453125, 3.278076171875, 3.46649169921875, 3.6549072265625, 3.84332275390625, 4.03173828125, 4.22015380859375, 4.4085693359375, 4.59698486328125, 4.785400390625, 4.97381591796875, 5.1622314453125, 5.35064697265625, 5.5390625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 3.0, 16.0, 49.0, 74.0, 109.0, 162.0, 186.0, 132.0, 119.0, 69.0, 49.0, 26.0, 5.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.740852355957031, -9.410861015319824, -9.080869674682617, -8.750879287719727, -8.42088794708252, -8.090896606445312, -7.760905742645264, -7.430914878845215, -7.100923538208008, -6.770932197570801, -6.440941333770752, -6.110950469970703, -5.780959129333496, -5.450967788696289, -5.12097692489624, -4.790986061096191, -4.460994720458984, -4.131003379821777, -3.8010125160217285, -3.4710214138031006, -3.1410303115844727, -2.8110392093658447, -2.481048107147217, -2.151057004928589, -1.821065902709961, -1.491074800491333, -1.161083698272705, -0.8310925960540771, -0.5011014938354492, -0.1711103916168213, 0.15888071060180664, 0.48887181282043457, 0.8188638687133789, 1.1488549709320068, 1.4788460731506348, 1.8088371753692627, 2.1388282775878906, 2.4688193798065186, 2.7988104820251465, 3.1288015842437744, 3.4587926864624023, 3.7887837886810303, 4.118774890899658, 4.448765754699707, 4.778757095336914, 5.108748435974121, 5.43873929977417, 5.768730163574219, 6.098721504211426, 6.428712844848633, 6.758703708648682, 7.0886945724487305, 7.4186859130859375, 7.7486772537231445, 8.078668594360352, 8.408658981323242, 8.73865032196045, 9.068641662597656, 9.398632049560547, 9.728623390197754, 10.058614730834961, 10.388606071472168, 10.718597412109375, 11.048587799072266, 11.378579139709473]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 6.0, 5.0, 4.0, 2.0, 5.0, 10.0, 6.0, 14.0, 10.0, 20.0, 20.0, 32.0, 35.0, 26.0, 26.0, 27.0, 38.0, 38.0, 31.0, 37.0, 36.0, 49.0, 46.0, 49.0, 51.0, 38.0, 43.0, 30.0, 36.0, 38.0, 30.0, 29.0, 21.0, 22.0, 10.0, 21.0, 18.0, 11.0, 10.0, 3.0, 5.0, 6.0, 4.0, 2.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.777368545532227, -9.483824729919434, -9.19028091430664, -8.896737098693848, -8.603193283081055, -8.309650421142578, -8.016106605529785, -7.722562789916992, -7.429018974304199, -7.135475158691406, -6.841931343078613, -6.5483880043029785, -6.2548441886901855, -5.961300373077393, -5.667757034301758, -5.374213218688965, -5.080669403076172, -4.787125587463379, -4.493581771850586, -4.200038433074951, -3.906494617462158, -3.6129508018493652, -3.3194072246551514, -3.0258636474609375, -2.7323198318481445, -2.4387760162353516, -2.1452324390411377, -1.8516887426376343, -1.5581450462341309, -1.2646013498306274, -0.971057653427124, -0.6775140762329102, -0.3839702606201172, -0.09042656421661377, 0.20311713218688965, 0.49666082859039307, 0.7902045249938965, 1.0837482213974, 1.3772919178009033, 1.6708354949951172, 1.9643793106079102, 2.257923126220703, 2.551466703414917, 2.845010280609131, 3.138554096221924, 3.432097911834717, 3.7256414890289307, 4.0191850662231445, 4.3127288818359375, 4.6062726974487305, 4.899816513061523, 5.193359851837158, 5.486903667449951, 5.780447483062744, 6.073990821838379, 6.367534637451172, 6.661078453063965, 6.954622268676758, 7.248166084289551, 7.5417094230651855, 7.8352532386779785, 8.128796577453613, 8.422340393066406, 8.7158842086792, 9.009428024291992]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 5.0, 1.0, 6.0, 6.0, 6.0, 5.0, 12.0, 14.0, 13.0, 25.0, 17.0, 25.0, 25.0, 25.0, 36.0, 28.0, 34.0, 29.0, 36.0, 39.0, 45.0, 38.0, 34.0, 37.0, 54.0, 40.0, 42.0, 46.0, 31.0, 38.0, 15.0, 31.0, 30.0, 19.0, 23.0, 25.0, 11.0, 12.0, 12.0, 9.0, 8.0, 5.0, 5.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2568359375, -1.2133026123046875, -1.169769287109375, -1.1262359619140625, -1.08270263671875, -1.0391693115234375, -0.995635986328125, -0.9521026611328125, -0.9085693359375, -0.8650360107421875, -0.821502685546875, -0.7779693603515625, -0.73443603515625, -0.6909027099609375, -0.647369384765625, -0.6038360595703125, -0.560302734375, -0.5167694091796875, -0.473236083984375, -0.4297027587890625, -0.38616943359375, -0.3426361083984375, -0.299102783203125, -0.2555694580078125, -0.2120361328125, -0.1685028076171875, -0.124969482421875, -0.0814361572265625, -0.03790283203125, 0.0056304931640625, 0.049163818359375, 0.0926971435546875, 0.13623046875, 0.1797637939453125, 0.223297119140625, 0.2668304443359375, 0.31036376953125, 0.3538970947265625, 0.397430419921875, 0.4409637451171875, 0.4844970703125, 0.5280303955078125, 0.571563720703125, 0.6150970458984375, 0.65863037109375, 0.7021636962890625, 0.745697021484375, 0.7892303466796875, 0.832763671875, 0.8762969970703125, 0.919830322265625, 0.9633636474609375, 1.00689697265625, 1.0504302978515625, 1.093963623046875, 1.1374969482421875, 1.1810302734375, 1.2245635986328125, 1.268096923828125, 1.3116302490234375, 1.35516357421875, 1.3986968994140625, 1.442230224609375, 1.4857635498046875, 1.529296875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 5.0, 7.0, 16.0, 23.0, 25.0, 40.0, 62.0, 75.0, 117.0, 128.0, 240.0, 364.0, 519.0, 776.0, 1265.0, 2092.0, 3721.0, 7119.0, 14450.0, 32589.0, 80139.0, 216790.0, 627846.0, 1483150.0, 1096031.0, 390281.0, 137526.0, 53086.0, 22513.0, 10615.0, 5298.0, 2921.0, 1642.0, 964.0, 622.0, 380.0, 235.0, 185.0, 113.0, 94.0, 69.0, 47.0, 30.0, 21.0, 19.0, 13.0, 4.0, 11.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5634765625, -1.5109710693359375, -1.458465576171875, -1.4059600830078125, -1.35345458984375, -1.3009490966796875, -1.248443603515625, -1.1959381103515625, -1.1434326171875, -1.0909271240234375, -1.038421630859375, -0.9859161376953125, -0.93341064453125, -0.8809051513671875, -0.828399658203125, -0.7758941650390625, -0.723388671875, -0.6708831787109375, -0.618377685546875, -0.5658721923828125, -0.51336669921875, -0.4608612060546875, -0.408355712890625, -0.3558502197265625, -0.3033447265625, -0.2508392333984375, -0.198333740234375, -0.1458282470703125, -0.09332275390625, -0.0408172607421875, 0.011688232421875, 0.0641937255859375, 0.11669921875, 0.1692047119140625, 0.221710205078125, 0.2742156982421875, 0.32672119140625, 0.3792266845703125, 0.431732177734375, 0.4842376708984375, 0.5367431640625, 0.5892486572265625, 0.641754150390625, 0.6942596435546875, 0.74676513671875, 0.7992706298828125, 0.851776123046875, 0.9042816162109375, 0.956787109375, 1.0092926025390625, 1.061798095703125, 1.1143035888671875, 1.16680908203125, 1.2193145751953125, 1.271820068359375, 1.3243255615234375, 1.3768310546875, 1.4293365478515625, 1.481842041015625, 1.5343475341796875, 1.58685302734375, 1.6393585205078125, 1.691864013671875, 1.7443695068359375, 1.796875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 2.0, 6.0, 12.0, 8.0, 9.0, 11.0, 19.0, 18.0, 29.0, 40.0, 64.0, 72.0, 105.0, 135.0, 167.0, 288.0, 348.0, 441.0, 493.0, 480.0, 390.0, 273.0, 185.0, 145.0, 86.0, 73.0, 55.0, 48.0, 19.0, 15.0, 11.0, 5.0, 6.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.59375, -2.5247344970703125, -2.455718994140625, -2.3867034912109375, -2.31768798828125, -2.2486724853515625, -2.179656982421875, -2.1106414794921875, -2.0416259765625, -1.9726104736328125, -1.903594970703125, -1.8345794677734375, -1.76556396484375, -1.6965484619140625, -1.627532958984375, -1.5585174560546875, -1.489501953125, -1.4204864501953125, -1.351470947265625, -1.2824554443359375, -1.21343994140625, -1.1444244384765625, -1.075408935546875, -1.0063934326171875, -0.9373779296875, -0.8683624267578125, -0.799346923828125, -0.7303314208984375, -0.66131591796875, -0.5923004150390625, -0.523284912109375, -0.4542694091796875, -0.38525390625, -0.3162384033203125, -0.247222900390625, -0.1782073974609375, -0.10919189453125, -0.0401763916015625, 0.028839111328125, 0.0978546142578125, 0.1668701171875, 0.2358856201171875, 0.304901123046875, 0.3739166259765625, 0.44293212890625, 0.5119476318359375, 0.580963134765625, 0.6499786376953125, 0.718994140625, 0.7880096435546875, 0.857025146484375, 0.9260406494140625, 0.99505615234375, 1.0640716552734375, 1.133087158203125, 1.2021026611328125, 1.2711181640625, 1.3401336669921875, 1.409149169921875, 1.4781646728515625, 1.54718017578125, 1.6161956787109375, 1.685211181640625, 1.7542266845703125, 1.8232421875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 5.0, 3.0, 4.0, 8.0, 10.0, 10.0, 29.0, 19.0, 33.0, 47.0, 77.0, 125.0, 181.0, 283.0, 550.0, 1242.0, 4749.0, 29208.0, 350838.0, 3318263.0, 445838.0, 34303.0, 5328.0, 1475.0, 577.0, 293.0, 225.0, 135.0, 99.0, 69.0, 61.0, 41.0, 30.0, 25.0, 22.0, 20.0, 14.0, 11.0, 9.0, 5.0, 4.0, 5.0, 2.0, 5.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.91796875, -4.732666015625, -4.54736328125, -4.362060546875, -4.1767578125, -3.991455078125, -3.80615234375, -3.620849609375, -3.435546875, -3.250244140625, -3.06494140625, -2.879638671875, -2.6943359375, -2.509033203125, -2.32373046875, -2.138427734375, -1.953125, -1.767822265625, -1.58251953125, -1.397216796875, -1.2119140625, -1.026611328125, -0.84130859375, -0.656005859375, -0.470703125, -0.285400390625, -0.10009765625, 0.085205078125, 0.2705078125, 0.455810546875, 0.64111328125, 0.826416015625, 1.01171875, 1.197021484375, 1.38232421875, 1.567626953125, 1.7529296875, 1.938232421875, 2.12353515625, 2.308837890625, 2.494140625, 2.679443359375, 2.86474609375, 3.050048828125, 3.2353515625, 3.420654296875, 3.60595703125, 3.791259765625, 3.9765625, 4.161865234375, 4.34716796875, 4.532470703125, 4.7177734375, 4.903076171875, 5.08837890625, 5.273681640625, 5.458984375, 5.644287109375, 5.82958984375, 6.014892578125, 6.2001953125, 6.385498046875, 6.57080078125, 6.756103515625, 6.94140625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 39.0, 957.0, 21.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.48561096191406, -88.68201446533203, -83.87841796875, -79.07481384277344, -74.2712173461914, -69.46762084960938, -64.66402435302734, -59.86042404174805, -55.056827545166016, -50.253231048583984, -45.44963073730469, -40.646034240722656, -35.842437744140625, -31.038837432861328, -26.235240936279297, -21.431640625, -16.62804412841797, -11.824445724487305, -7.020848274230957, -2.2172508239746094, 2.5863475799560547, 7.389945983886719, 12.19354248046875, 16.997142791748047, 21.800739288330078, 26.604337692260742, 31.407936096191406, 36.21153259277344, 41.01512908935547, 45.818729400634766, 50.6223258972168, 55.425926208496094, 60.229522705078125, 65.03311920166016, 69.83671569824219, 74.64031982421875, 79.44391632080078, 84.24751281738281, 89.05110931396484, 93.85470581054688, 98.65830993652344, 103.46190643310547, 108.2655029296875, 113.06910705566406, 117.8727035522461, 122.67630004882812, 127.47989654541016, 132.2834930419922, 137.08709716796875, 141.8907012939453, 146.6942901611328, 151.49789428710938, 156.30148315429688, 161.10508728027344, 165.90869140625, 170.7122802734375, 175.515869140625, 180.31947326660156, 185.12306213378906, 189.92666625976562, 194.73025512695312, 199.5338592529297, 204.33746337890625, 209.14105224609375, 213.9446563720703]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 0.0, 1.0, 4.0, 0.0, 1.0, 5.0, 6.0, 11.0, 12.0, 7.0, 14.0, 18.0, 12.0, 17.0, 22.0, 36.0, 24.0, 39.0, 33.0, 38.0, 43.0, 47.0, 42.0, 46.0, 37.0, 60.0, 41.0, 39.0, 45.0, 46.0, 35.0, 30.0, 26.0, 28.0, 31.0, 24.0, 20.0, 7.0, 19.0, 8.0, 10.0, 3.0, 6.0, 4.0, 3.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.847167015075684, -7.567250728607178, -7.28733491897583, -7.007418632507324, -6.727502822875977, -6.447586536407471, -6.167670249938965, -5.887754440307617, -5.6078386306762695, -5.327922344207764, -5.048006534576416, -4.76809024810791, -4.4881744384765625, -4.208258152008057, -3.92834210395813, -3.648426055908203, -3.3685097694396973, -3.0885937213897705, -2.8086776733398438, -2.528761386871338, -2.2488455772399902, -1.968929409980774, -1.6890132427215576, -1.4090971946716309, -1.129181146621704, -0.8492650985717773, -0.5693489909172058, -0.2894328832626343, -0.00951683521270752, 0.27039921283721924, 0.5503153800964355, 0.8302314281463623, 1.110147476196289, 1.3900635242462158, 1.6699795722961426, 1.9498957395553589, 2.229811668395996, 2.509727954864502, 2.7896440029144287, 3.0695600509643555, 3.3494760990142822, 3.629392147064209, 3.9093081951141357, 4.1892242431640625, 4.469140529632568, 4.749056339263916, 5.028972625732422, 5.3088884353637695, 5.588804721832275, 5.868721008300781, 6.148636817932129, 6.428553104400635, 6.708468914031982, 6.988385200500488, 7.268301010131836, 7.548217296600342, 7.828133583068848, 8.108049392700195, 8.38796615600586, 8.667881965637207, 8.947797775268555, 9.227713584899902, 9.507630348205566, 9.787546157836914, 10.067461967468262]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 0.0, 9.0, 6.0, 11.0, 9.0, 15.0, 9.0, 8.0, 9.0, 22.0, 14.0, 23.0, 23.0, 25.0, 30.0, 31.0, 25.0, 33.0, 33.0, 49.0, 38.0, 41.0, 39.0, 40.0, 40.0, 39.0, 39.0, 30.0, 43.0, 30.0, 34.0, 20.0, 25.0, 27.0, 25.0, 27.0, 16.0, 10.0, 14.0, 7.0, 8.0, 10.0, 4.0, 4.0, 7.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.232421875, -1.1912384033203125, -1.150054931640625, -1.1088714599609375, -1.06768798828125, -1.0265045166015625, -0.985321044921875, -0.9441375732421875, -0.9029541015625, -0.8617706298828125, -0.820587158203125, -0.7794036865234375, -0.73822021484375, -0.6970367431640625, -0.655853271484375, -0.6146697998046875, -0.573486328125, -0.5323028564453125, -0.491119384765625, -0.4499359130859375, -0.40875244140625, -0.3675689697265625, -0.326385498046875, -0.2852020263671875, -0.2440185546875, -0.2028350830078125, -0.161651611328125, -0.1204681396484375, -0.07928466796875, -0.0381011962890625, 0.003082275390625, 0.0442657470703125, 0.08544921875, 0.1266326904296875, 0.167816162109375, 0.2089996337890625, 0.25018310546875, 0.2913665771484375, 0.332550048828125, 0.3737335205078125, 0.4149169921875, 0.4561004638671875, 0.497283935546875, 0.5384674072265625, 0.57965087890625, 0.6208343505859375, 0.662017822265625, 0.7032012939453125, 0.744384765625, 0.7855682373046875, 0.826751708984375, 0.8679351806640625, 0.90911865234375, 0.9503021240234375, 0.991485595703125, 1.0326690673828125, 1.0738525390625, 1.1150360107421875, 1.156219482421875, 1.1974029541015625, 1.23858642578125, 1.2797698974609375, 1.320953369140625, 1.3621368408203125, 1.4033203125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 5.0, 5.0, 7.0, 9.0, 9.0, 19.0, 30.0, 18.0, 33.0, 53.0, 80.0, 117.0, 180.0, 258.0, 407.0, 556.0, 898.0, 1412.0, 2144.0, 3620.0, 5888.0, 10036.0, 17537.0, 30324.0, 53869.0, 92425.0, 143756.0, 188805.0, 178947.0, 128694.0, 79182.0, 45981.0, 26180.0, 14650.0, 8665.0, 5090.0, 3055.0, 1873.0, 1317.0, 766.0, 531.0, 382.0, 238.0, 159.0, 106.0, 80.0, 55.0, 36.0, 18.0, 16.0, 16.0, 16.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1368408203125, -0.13240623474121094, -0.12797164916992188, -0.12353706359863281, -0.11910247802734375, -0.11466789245605469, -0.11023330688476562, -0.10579872131347656, -0.1013641357421875, -0.09692955017089844, -0.09249496459960938, -0.08806037902832031, -0.08362579345703125, -0.07919120788574219, -0.07475662231445312, -0.07032203674316406, -0.065887451171875, -0.06145286560058594, -0.057018280029296875, -0.05258369445800781, -0.04814910888671875, -0.04371452331542969, -0.039279937744140625, -0.03484535217285156, -0.0304107666015625, -0.025976181030273438, -0.021541595458984375, -0.017107009887695312, -0.01267242431640625, -0.008237838745117188, -0.003803253173828125, 0.0006313323974609375, 0.00506591796875, 0.009500503540039062, 0.013935089111328125, 0.018369674682617188, 0.02280426025390625, 0.027238845825195312, 0.031673431396484375, 0.03610801696777344, 0.0405426025390625, 0.04497718811035156, 0.049411773681640625, 0.05384635925292969, 0.05828094482421875, 0.06271553039550781, 0.06715011596679688, 0.07158470153808594, 0.076019287109375, 0.08045387268066406, 0.08488845825195312, 0.08932304382324219, 0.09375762939453125, 0.09819221496582031, 0.10262680053710938, 0.10706138610839844, 0.1114959716796875, 0.11593055725097656, 0.12036514282226562, 0.12479972839355469, 0.12923431396484375, 0.1336688995361328, 0.13810348510742188, 0.14253807067871094, 0.14697265625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 8.0, 5.0, 5.0, 12.0, 10.0, 9.0, 15.0, 18.0, 23.0, 24.0, 27.0, 25.0, 31.0, 41.0, 38.0, 29.0, 44.0, 58.0, 54.0, 1071.0, 51.0, 41.0, 37.0, 45.0, 52.0, 42.0, 39.0, 22.0, 19.0, 22.0, 21.0, 22.0, 9.0, 17.0, 9.0, 10.0, 5.0, 5.0, 5.0, 5.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.025390625, -0.994110107421875, -0.96282958984375, -0.931549072265625, -0.9002685546875, -0.868988037109375, -0.83770751953125, -0.806427001953125, -0.775146484375, -0.743865966796875, -0.71258544921875, -0.681304931640625, -0.6500244140625, -0.618743896484375, -0.58746337890625, -0.556182861328125, -0.52490234375, -0.493621826171875, -0.46234130859375, -0.431060791015625, -0.3997802734375, -0.368499755859375, -0.33721923828125, -0.305938720703125, -0.274658203125, -0.243377685546875, -0.21209716796875, -0.180816650390625, -0.1495361328125, -0.118255615234375, -0.08697509765625, -0.055694580078125, -0.0244140625, 0.006866455078125, 0.03814697265625, 0.069427490234375, 0.1007080078125, 0.131988525390625, 0.16326904296875, 0.194549560546875, 0.225830078125, 0.257110595703125, 0.28839111328125, 0.319671630859375, 0.3509521484375, 0.382232666015625, 0.41351318359375, 0.444793701171875, 0.47607421875, 0.507354736328125, 0.53863525390625, 0.569915771484375, 0.6011962890625, 0.632476806640625, 0.66375732421875, 0.695037841796875, 0.726318359375, 0.757598876953125, 0.78887939453125, 0.820159912109375, 0.8514404296875, 0.882720947265625, 0.91400146484375, 0.945281982421875, 0.9765625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 7.0, 11.0, 7.0, 13.0, 19.0, 18.0, 35.0, 31.0, 45.0, 72.0, 84.0, 158.0, 243.0, 383.0, 585.0, 893.0, 1628.0, 2698.0, 5243.0, 9932.0, 19213.0, 38901.0, 76458.0, 145586.0, 454997.0, 982132.0, 171930.0, 90272.0, 46258.0, 23122.0, 11837.0, 6169.0, 3398.0, 1831.0, 1046.0, 630.0, 428.0, 270.0, 175.0, 111.0, 84.0, 60.0, 36.0, 29.0, 23.0, 14.0, 10.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1015625, -0.09807586669921875, -0.0945892333984375, -0.09110260009765625, -0.087615966796875, -0.08412933349609375, -0.0806427001953125, -0.07715606689453125, -0.07366943359375, -0.07018280029296875, -0.0666961669921875, -0.06320953369140625, -0.059722900390625, -0.05623626708984375, -0.0527496337890625, -0.04926300048828125, -0.0457763671875, -0.04228973388671875, -0.0388031005859375, -0.03531646728515625, -0.031829833984375, -0.02834320068359375, -0.0248565673828125, -0.02136993408203125, -0.01788330078125, -0.01439666748046875, -0.0109100341796875, -0.00742340087890625, -0.003936767578125, -0.00045013427734375, 0.0030364990234375, 0.00652313232421875, 0.010009765625, 0.01349639892578125, 0.0169830322265625, 0.02046966552734375, 0.023956298828125, 0.02744293212890625, 0.0309295654296875, 0.03441619873046875, 0.03790283203125, 0.04138946533203125, 0.0448760986328125, 0.04836273193359375, 0.051849365234375, 0.05533599853515625, 0.0588226318359375, 0.06230926513671875, 0.0657958984375, 0.06928253173828125, 0.0727691650390625, 0.07625579833984375, 0.079742431640625, 0.08322906494140625, 0.0867156982421875, 0.09020233154296875, 0.09368896484375, 0.09717559814453125, 0.1006622314453125, 0.10414886474609375, 0.107635498046875, 0.11112213134765625, 0.1146087646484375, 0.11809539794921875, 0.12158203125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 0.0, 1.0, 5.0, 13.0, 8.0, 15.0, 20.0, 30.0, 58.0, 71.0, 151.0, 170.0, 155.0, 99.0, 60.0, 43.0, 29.0, 14.0, 19.0, 12.0, 5.0, 10.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.027618408203125, -0.026822805404663086, -0.026027202606201172, -0.025231599807739258, -0.024435997009277344, -0.02364039421081543, -0.022844791412353516, -0.0220491886138916, -0.021253585815429688, -0.020457983016967773, -0.01966238021850586, -0.018866777420043945, -0.01807117462158203, -0.017275571823120117, -0.016479969024658203, -0.01568436622619629, -0.014888763427734375, -0.014093160629272461, -0.013297557830810547, -0.012501955032348633, -0.011706352233886719, -0.010910749435424805, -0.01011514663696289, -0.009319543838500977, -0.008523941040039062, -0.0077283382415771484, -0.006932735443115234, -0.00613713264465332, -0.005341529846191406, -0.004545927047729492, -0.003750324249267578, -0.002954721450805664, -0.00215911865234375, -0.001363515853881836, -0.0005679130554199219, 0.0002276897430419922, 0.0010232925415039062, 0.0018188953399658203, 0.0026144981384277344, 0.0034101009368896484, 0.0042057037353515625, 0.0050013065338134766, 0.005796909332275391, 0.006592512130737305, 0.007388114929199219, 0.008183717727661133, 0.008979320526123047, 0.009774923324584961, 0.010570526123046875, 0.011366128921508789, 0.012161731719970703, 0.012957334518432617, 0.013752937316894531, 0.014548540115356445, 0.01534414291381836, 0.016139745712280273, 0.016935348510742188, 0.0177309513092041, 0.018526554107666016, 0.01932215690612793, 0.020117759704589844, 0.020913362503051758, 0.021708965301513672, 0.022504568099975586, 0.0233001708984375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 4.0, 12.0, 12.0, 19.0, 28.0, 54.0, 89.0, 216.0, 4752.0, 1042545.0, 529.0, 136.0, 69.0, 34.0, 11.0, 8.0, 9.0, 8.0, 3.0, 5.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.634765625, -0.6123123168945312, -0.5898590087890625, -0.5674057006835938, -0.544952392578125, -0.5224990844726562, -0.5000457763671875, -0.47759246826171875, -0.45513916015625, -0.43268585205078125, -0.4102325439453125, -0.38777923583984375, -0.365325927734375, -0.34287261962890625, -0.3204193115234375, -0.29796600341796875, -0.2755126953125, -0.25305938720703125, -0.2306060791015625, -0.20815277099609375, -0.185699462890625, -0.16324615478515625, -0.1407928466796875, -0.11833953857421875, -0.09588623046875, -0.07343292236328125, -0.0509796142578125, -0.02852630615234375, -0.006072998046875, 0.01638031005859375, 0.0388336181640625, 0.06128692626953125, 0.083740234375, 0.10619354248046875, 0.1286468505859375, 0.15110015869140625, 0.173553466796875, 0.19600677490234375, 0.2184600830078125, 0.24091339111328125, 0.26336669921875, 0.28582000732421875, 0.3082733154296875, 0.33072662353515625, 0.353179931640625, 0.37563323974609375, 0.3980865478515625, 0.42053985595703125, 0.4429931640625, 0.46544647216796875, 0.4878997802734375, 0.5103530883789062, 0.532806396484375, 0.5552597045898438, 0.5777130126953125, 0.6001663208007812, 0.62261962890625, 0.6450729370117188, 0.6675262451171875, 0.6899795532226562, 0.712432861328125, 0.7348861694335938, 0.7573394775390625, 0.7797927856445312, 0.80224609375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 632.0, 382.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08831531554460526, -0.08150383830070496, -0.07469236105680466, -0.06788088381290436, -0.06106940656900406, -0.05425792559981346, -0.04744644835591316, -0.04063497111201286, -0.033823493868112564, -0.027012016624212265, -0.020200539380311966, -0.013389060273766518, -0.006577583029866219, 0.00023389607667922974, 0.007045373320579529, 0.013856850564479828, 0.020668327808380127, 0.027479805052280426, 0.034291282296180725, 0.041102759540081024, 0.04791423678398132, 0.05472571775317192, 0.06153719499707222, 0.06834867596626282, 0.07516014575958252, 0.08197162300348282, 0.08878310024738312, 0.09559457749128342, 0.10240605473518372, 0.10921753942966461, 0.11602900922298431, 0.12284049391746521, 0.1296519786119461, 0.136463463306427, 0.1432749330997467, 0.1500864177942276, 0.1568978875875473, 0.1637093722820282, 0.1705208420753479, 0.1773323267698288, 0.1841437965631485, 0.1909552812576294, 0.1977667510509491, 0.20457823574543, 0.2113897055387497, 0.2182011902332306, 0.2250126600265503, 0.2318241447210312, 0.23863562941551208, 0.24544711410999298, 0.2522585988044739, 0.2590700685977936, 0.2658815383911133, 0.272693008184433, 0.2795045077800751, 0.2863159775733948, 0.2931274473667145, 0.2999389171600342, 0.30675041675567627, 0.31356188654899597, 0.3203733563423157, 0.3271848261356354, 0.33399632573127747, 0.34080779552459717, 0.34761926531791687]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 6.0, 12.0, 11.0, 8.0, 13.0, 21.0, 19.0, 23.0, 20.0, 20.0, 45.0, 34.0, 39.0, 40.0, 66.0, 54.0, 48.0, 38.0, 56.0, 46.0, 41.0, 39.0, 41.0, 26.0, 36.0, 30.0, 36.0, 29.0, 21.0, 15.0, 15.0, 15.0, 7.0, 1.0, 7.0, 1.0, 3.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.01996392011642456, -0.019432932138442993, -0.018901944160461426, -0.01837095618247986, -0.01783996820449829, -0.017308980226516724, -0.016777992248535156, -0.01624700427055359, -0.01571601629257202, -0.015185028314590454, -0.014654040336608887, -0.01412305235862732, -0.013592064380645752, -0.013061076402664185, -0.012530088424682617, -0.01199910044670105, -0.011468112468719482, -0.010937124490737915, -0.010406136512756348, -0.00987514853477478, -0.009344160556793213, -0.008813172578811646, -0.008282184600830078, -0.007751196622848511, -0.007220208644866943, -0.006689220666885376, -0.006158232688903809, -0.005627244710922241, -0.005096256732940674, -0.0045652687549591064, -0.004034280776977539, -0.0035032927989959717, -0.0029723048210144043, -0.002441316843032837, -0.0019103288650512695, -0.0013793408870697021, -0.0008483529090881348, -0.0003173649311065674, 0.000213623046875, 0.0007446110248565674, 0.0012755990028381348, 0.0018065869808197021, 0.0023375749588012695, 0.002868562936782837, 0.0033995509147644043, 0.003930538892745972, 0.004461526870727539, 0.0049925148487091064, 0.005523502826690674, 0.006054490804672241, 0.006585478782653809, 0.007116466760635376, 0.007647454738616943, 0.00817844271659851, 0.008709430694580078, 0.009240418672561646, 0.009771406650543213, 0.01030239462852478, 0.010833382606506348, 0.011364370584487915, 0.011895358562469482, 0.01242634654045105, 0.012957334518432617, 0.013488322496414185, 0.014019310474395752]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 0.0, 9.0, 6.0, 11.0, 9.0, 15.0, 9.0, 8.0, 8.0, 23.0, 14.0, 23.0, 23.0, 25.0, 30.0, 30.0, 26.0, 33.0, 33.0, 49.0, 38.0, 40.0, 41.0, 39.0, 40.0, 39.0, 39.0, 29.0, 43.0, 31.0, 34.0, 20.0, 25.0, 27.0, 25.0, 26.0, 16.0, 11.0, 14.0, 7.0, 8.0, 9.0, 5.0, 4.0, 7.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.232421875, -1.1912384033203125, -1.150054931640625, -1.1088714599609375, -1.06768798828125, -1.0265045166015625, -0.985321044921875, -0.9441375732421875, -0.9029541015625, -0.8617706298828125, -0.820587158203125, -0.7794036865234375, -0.73822021484375, -0.6970367431640625, -0.655853271484375, -0.6146697998046875, -0.573486328125, -0.5323028564453125, -0.491119384765625, -0.4499359130859375, -0.40875244140625, -0.3675689697265625, -0.326385498046875, -0.2852020263671875, -0.2440185546875, -0.2028350830078125, -0.161651611328125, -0.1204681396484375, -0.07928466796875, -0.0381011962890625, 0.003082275390625, 0.0442657470703125, 0.08544921875, 0.1266326904296875, 0.167816162109375, 0.2089996337890625, 0.25018310546875, 0.2913665771484375, 0.332550048828125, 0.3737335205078125, 0.4149169921875, 0.4561004638671875, 0.497283935546875, 0.5384674072265625, 0.57965087890625, 0.6208343505859375, 0.662017822265625, 0.7032012939453125, 0.744384765625, 0.7855682373046875, 0.826751708984375, 0.8679351806640625, 0.90911865234375, 0.9503021240234375, 0.991485595703125, 1.0326690673828125, 1.0738525390625, 1.1150360107421875, 1.156219482421875, 1.1974029541015625, 1.23858642578125, 1.2797698974609375, 1.320953369140625, 1.3621368408203125, 1.4033203125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 18.0, 20.0, 21.0, 42.0, 50.0, 74.0, 119.0, 187.0, 295.0, 486.0, 818.0, 1356.0, 2195.0, 3623.0, 6452.0, 11703.0, 21809.0, 41224.0, 80510.0, 154594.0, 240287.0, 218090.0, 126495.0, 64203.0, 33225.0, 17650.0, 9690.0, 5447.0, 3137.0, 1830.0, 1106.0, 654.0, 427.0, 264.0, 137.0, 105.0, 68.0, 49.0, 37.0, 17.0, 12.0, 10.0, 7.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6298828125, -1.5770263671875, -1.524169921875, -1.4713134765625, -1.41845703125, -1.3656005859375, -1.312744140625, -1.2598876953125, -1.20703125, -1.1541748046875, -1.101318359375, -1.0484619140625, -0.99560546875, -0.9427490234375, -0.889892578125, -0.8370361328125, -0.7841796875, -0.7313232421875, -0.678466796875, -0.6256103515625, -0.57275390625, -0.5198974609375, -0.467041015625, -0.4141845703125, -0.361328125, -0.3084716796875, -0.255615234375, -0.2027587890625, -0.14990234375, -0.0970458984375, -0.044189453125, 0.0086669921875, 0.0615234375, 0.1143798828125, 0.167236328125, 0.2200927734375, 0.27294921875, 0.3258056640625, 0.378662109375, 0.4315185546875, 0.484375, 0.5372314453125, 0.590087890625, 0.6429443359375, 0.69580078125, 0.7486572265625, 0.801513671875, 0.8543701171875, 0.9072265625, 0.9600830078125, 1.012939453125, 1.0657958984375, 1.11865234375, 1.1715087890625, 1.224365234375, 1.2772216796875, 1.330078125, 1.3829345703125, 1.435791015625, 1.4886474609375, 1.54150390625, 1.5943603515625, 1.647216796875, 1.7000732421875, 1.7529296875]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 4.0, 2.0, 2.0, 7.0, 5.0, 8.0, 10.0, 8.0, 9.0, 11.0, 17.0, 18.0, 21.0, 22.0, 29.0, 35.0, 45.0, 52.0, 48.0, 64.0, 100.0, 149.0, 228.0, 1328.0, 190.0, 146.0, 77.0, 70.0, 52.0, 40.0, 39.0, 24.0, 28.0, 20.0, 29.0, 18.0, 22.0, 13.0, 14.0, 12.0, 7.0, 8.0, 3.0, 9.0, 8.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.685546875, -2.5843505859375, -2.483154296875, -2.3819580078125, -2.28076171875, -2.1795654296875, -2.078369140625, -1.9771728515625, -1.8759765625, -1.7747802734375, -1.673583984375, -1.5723876953125, -1.47119140625, -1.3699951171875, -1.268798828125, -1.1676025390625, -1.06640625, -0.9652099609375, -0.864013671875, -0.7628173828125, -0.66162109375, -0.5604248046875, -0.459228515625, -0.3580322265625, -0.2568359375, -0.1556396484375, -0.054443359375, 0.0467529296875, 0.14794921875, 0.2491455078125, 0.350341796875, 0.4515380859375, 0.552734375, 0.6539306640625, 0.755126953125, 0.8563232421875, 0.95751953125, 1.0587158203125, 1.159912109375, 1.2611083984375, 1.3623046875, 1.4635009765625, 1.564697265625, 1.6658935546875, 1.76708984375, 1.8682861328125, 1.969482421875, 2.0706787109375, 2.171875, 2.2730712890625, 2.374267578125, 2.4754638671875, 2.57666015625, 2.6778564453125, 2.779052734375, 2.8802490234375, 2.9814453125, 3.0826416015625, 3.183837890625, 3.2850341796875, 3.38623046875, 3.4874267578125, 3.588623046875, 3.6898193359375, 3.791015625]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 5.0, 6.0, 4.0, 6.0, 7.0, 11.0, 17.0, 18.0, 31.0, 38.0, 43.0, 67.0, 83.0, 136.0, 180.0, 235.0, 428.0, 831.0, 2793.0, 13175.0, 87537.0, 1083729.0, 1793976.0, 137289.0, 18874.0, 3701.0, 1071.0, 478.0, 258.0, 190.0, 121.0, 95.0, 62.0, 59.0, 37.0, 39.0, 28.0, 7.0, 16.0, 5.0, 6.0, 8.0, 1.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.12890625, -3.99615478515625, -3.8634033203125, -3.73065185546875, -3.597900390625, -3.46514892578125, -3.3323974609375, -3.19964599609375, -3.06689453125, -2.93414306640625, -2.8013916015625, -2.66864013671875, -2.535888671875, -2.40313720703125, -2.2703857421875, -2.13763427734375, -2.0048828125, -1.87213134765625, -1.7393798828125, -1.60662841796875, -1.473876953125, -1.34112548828125, -1.2083740234375, -1.07562255859375, -0.94287109375, -0.81011962890625, -0.6773681640625, -0.54461669921875, -0.411865234375, -0.27911376953125, -0.1463623046875, -0.01361083984375, 0.119140625, 0.25189208984375, 0.3846435546875, 0.51739501953125, 0.650146484375, 0.78289794921875, 0.9156494140625, 1.04840087890625, 1.18115234375, 1.31390380859375, 1.4466552734375, 1.57940673828125, 1.712158203125, 1.84490966796875, 1.9776611328125, 2.11041259765625, 2.2431640625, 2.37591552734375, 2.5086669921875, 2.64141845703125, 2.774169921875, 2.90692138671875, 3.0396728515625, 3.17242431640625, 3.30517578125, 3.43792724609375, 3.5706787109375, 3.70343017578125, 3.836181640625, 3.96893310546875, 4.1016845703125, 4.23443603515625, 4.3671875]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 2.0, 11.0, 169.0, 429.0, 320.0, 80.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8735671043396, -3.858931541442871, -2.8442962169647217, -1.8296608924865723, -0.8150253295898438, 0.19961023330688477, 1.214245319366455, 2.2288808822631836, 3.243516445159912, 4.258152008056641, 5.272787094116211, 6.2874226570129395, 7.302058219909668, 8.316694259643555, 9.331329345703125, 10.345964431762695, 11.360599517822266, 12.375234603881836, 13.389870643615723, 14.404505729675293, 15.41914176940918, 16.43377685546875, 17.44841194152832, 18.46304702758789, 19.477684020996094, 20.492319107055664, 21.506954193115234, 22.521591186523438, 23.536226272583008, 24.550861358642578, 25.56549644470215, 26.58013153076172, 27.594764709472656, 28.609399795532227, 29.624034881591797, 30.638671875, 31.65330696105957, 32.66794204711914, 33.682579040527344, 34.69721221923828, 35.711849212646484, 36.72648620605469, 37.741119384765625, 38.75575637817383, 39.770389556884766, 40.78502655029297, 41.799659729003906, 42.81429672241211, 43.82893371582031, 44.843570709228516, 45.85820388793945, 46.872840881347656, 47.887474060058594, 48.9021110534668, 49.916748046875, 50.93138122558594, 51.946014404296875, 52.96065139770508, 53.975284576416016, 54.98992156982422, 56.004554748535156, 57.01919174194336, 58.03382873535156, 59.0484619140625, 60.0630989074707]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 5.0, 2.0, 6.0, 2.0, 9.0, 2.0, 8.0, 14.0, 14.0, 23.0, 19.0, 17.0, 22.0, 29.0, 39.0, 36.0, 35.0, 37.0, 46.0, 43.0, 37.0, 44.0, 45.0, 47.0, 29.0, 43.0, 43.0, 51.0, 41.0, 26.0, 31.0, 30.0, 24.0, 22.0, 6.0, 24.0, 13.0, 8.0, 11.0, 9.0, 3.0, 6.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.088802337646484, -7.836400985717773, -7.583999156951904, -7.331597805023193, -7.079195976257324, -6.826794624328613, -6.574393272399902, -6.321991920471191, -6.069590091705322, -5.817188739776611, -5.564786911010742, -5.312385559082031, -5.05998420715332, -4.807582378387451, -4.55518102645874, -4.302779197692871, -4.05037784576416, -3.79797625541687, -3.54557466506958, -3.293173313140869, -3.040771722793579, -2.788370132446289, -2.535968780517578, -2.283567190170288, -2.031165599822998, -1.778764009475708, -1.5263625383377075, -1.273961067199707, -1.021559476852417, -0.769157886505127, -0.5167564153671265, -0.264354944229126, -0.011953353881835938, 0.24044817686080933, 0.4928497076034546, 0.7452512383460999, 0.9976527690887451, 1.2500543594360352, 1.5024558305740356, 1.7548573017120361, 2.007258892059326, 2.259660482406616, 2.5120620727539062, 2.764463424682617, 3.0168650150299072, 3.2692666053771973, 3.521667957305908, 3.7740695476531982, 4.026471138000488, 4.278872489929199, 4.531274318695068, 4.783675670623779, 5.036077499389648, 5.288478851318359, 5.54088020324707, 5.793281555175781, 6.04568338394165, 6.298084735870361, 6.5504865646362305, 6.802887916564941, 7.055289268493652, 7.3076910972595215, 7.560092449188232, 7.812494277954102, 8.064895629882812]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 4.0, 4.0, 7.0, 2.0, 3.0, 14.0, 15.0, 14.0, 21.0, 14.0, 20.0, 22.0, 23.0, 26.0, 29.0, 32.0, 31.0, 29.0, 45.0, 44.0, 39.0, 38.0, 45.0, 44.0, 42.0, 46.0, 43.0, 33.0, 37.0, 26.0, 28.0, 31.0, 33.0, 21.0, 19.0, 15.0, 9.0, 14.0, 11.0, 9.0, 6.0, 3.0, 5.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.396484375, -1.353240966796875, -1.30999755859375, -1.266754150390625, -1.2235107421875, -1.180267333984375, -1.13702392578125, -1.093780517578125, -1.050537109375, -1.007293701171875, -0.96405029296875, -0.920806884765625, -0.8775634765625, -0.834320068359375, -0.79107666015625, -0.747833251953125, -0.70458984375, -0.661346435546875, -0.61810302734375, -0.574859619140625, -0.5316162109375, -0.488372802734375, -0.44512939453125, -0.401885986328125, -0.358642578125, -0.315399169921875, -0.27215576171875, -0.228912353515625, -0.1856689453125, -0.142425537109375, -0.09918212890625, -0.055938720703125, -0.0126953125, 0.030548095703125, 0.07379150390625, 0.117034912109375, 0.1602783203125, 0.203521728515625, 0.24676513671875, 0.290008544921875, 0.333251953125, 0.376495361328125, 0.41973876953125, 0.462982177734375, 0.5062255859375, 0.549468994140625, 0.59271240234375, 0.635955810546875, 0.67919921875, 0.722442626953125, 0.76568603515625, 0.808929443359375, 0.8521728515625, 0.895416259765625, 0.93865966796875, 0.981903076171875, 1.025146484375, 1.068389892578125, 1.11163330078125, 1.154876708984375, 1.1981201171875, 1.241363525390625, 1.28460693359375, 1.327850341796875, 1.37109375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 6.0, 6.0, 9.0, 11.0, 16.0, 12.0, 29.0, 36.0, 42.0, 86.0, 99.0, 200.0, 283.0, 547.0, 998.0, 2039.0, 4564.0, 11511.0, 34614.0, 136467.0, 756055.0, 2385035.0, 685010.0, 125646.0, 32121.0, 10581.0, 4186.0, 1852.0, 941.0, 498.0, 280.0, 148.0, 109.0, 60.0, 38.0, 30.0, 31.0, 29.0, 19.0, 7.0, 6.0, 5.0, 6.0, 4.0, 3.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.16015625, -3.0684814453125, -2.976806640625, -2.8851318359375, -2.79345703125, -2.7017822265625, -2.610107421875, -2.5184326171875, -2.4267578125, -2.3350830078125, -2.243408203125, -2.1517333984375, -2.06005859375, -1.9683837890625, -1.876708984375, -1.7850341796875, -1.693359375, -1.6016845703125, -1.510009765625, -1.4183349609375, -1.32666015625, -1.2349853515625, -1.143310546875, -1.0516357421875, -0.9599609375, -0.8682861328125, -0.776611328125, -0.6849365234375, -0.59326171875, -0.5015869140625, -0.409912109375, -0.3182373046875, -0.2265625, -0.1348876953125, -0.043212890625, 0.0484619140625, 0.14013671875, 0.2318115234375, 0.323486328125, 0.4151611328125, 0.5068359375, 0.5985107421875, 0.690185546875, 0.7818603515625, 0.87353515625, 0.9652099609375, 1.056884765625, 1.1485595703125, 1.240234375, 1.3319091796875, 1.423583984375, 1.5152587890625, 1.60693359375, 1.6986083984375, 1.790283203125, 1.8819580078125, 1.9736328125, 2.0653076171875, 2.156982421875, 2.2486572265625, 2.34033203125, 2.4320068359375, 2.523681640625, 2.6153564453125, 2.70703125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 9.0, 7.0, 8.0, 9.0, 15.0, 24.0, 26.0, 25.0, 37.0, 52.0, 53.0, 81.0, 104.0, 123.0, 168.0, 208.0, 313.0, 355.0, 463.0, 445.0, 343.0, 287.0, 220.0, 176.0, 122.0, 108.0, 68.0, 46.0, 36.0, 37.0, 20.0, 19.0, 11.0, 13.0, 6.0, 4.0, 5.0, 3.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.890625, -1.835113525390625, -1.77960205078125, -1.724090576171875, -1.6685791015625, -1.613067626953125, -1.55755615234375, -1.502044677734375, -1.446533203125, -1.391021728515625, -1.33551025390625, -1.279998779296875, -1.2244873046875, -1.168975830078125, -1.11346435546875, -1.057952880859375, -1.00244140625, -0.946929931640625, -0.89141845703125, -0.835906982421875, -0.7803955078125, -0.724884033203125, -0.66937255859375, -0.613861083984375, -0.558349609375, -0.502838134765625, -0.44732666015625, -0.391815185546875, -0.3363037109375, -0.280792236328125, -0.22528076171875, -0.169769287109375, -0.1142578125, -0.058746337890625, -0.00323486328125, 0.052276611328125, 0.1077880859375, 0.163299560546875, 0.21881103515625, 0.274322509765625, 0.329833984375, 0.385345458984375, 0.44085693359375, 0.496368408203125, 0.5518798828125, 0.607391357421875, 0.66290283203125, 0.718414306640625, 0.77392578125, 0.829437255859375, 0.88494873046875, 0.940460205078125, 0.9959716796875, 1.051483154296875, 1.10699462890625, 1.162506103515625, 1.218017578125, 1.273529052734375, 1.32904052734375, 1.384552001953125, 1.4400634765625, 1.495574951171875, 1.55108642578125, 1.606597900390625, 1.662109375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 12.0, 13.0, 50.0, 90.0, 207.0, 882.0, 6629.0, 130413.0, 3661679.0, 378614.0, 13679.0, 1452.0, 356.0, 112.0, 41.0, 19.0, 20.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.55859375, -4.28460693359375, -4.0106201171875, -3.73663330078125, -3.462646484375, -3.18865966796875, -2.9146728515625, -2.64068603515625, -2.36669921875, -2.09271240234375, -1.8187255859375, -1.54473876953125, -1.270751953125, -0.99676513671875, -0.7227783203125, -0.44879150390625, -0.1748046875, 0.09918212890625, 0.3731689453125, 0.64715576171875, 0.921142578125, 1.19512939453125, 1.4691162109375, 1.74310302734375, 2.01708984375, 2.29107666015625, 2.5650634765625, 2.83905029296875, 3.113037109375, 3.38702392578125, 3.6610107421875, 3.93499755859375, 4.208984375, 4.48297119140625, 4.7569580078125, 5.03094482421875, 5.304931640625, 5.57891845703125, 5.8529052734375, 6.12689208984375, 6.40087890625, 6.67486572265625, 6.9488525390625, 7.22283935546875, 7.496826171875, 7.77081298828125, 8.0447998046875, 8.31878662109375, 8.5927734375, 8.86676025390625, 9.1407470703125, 9.41473388671875, 9.688720703125, 9.96270751953125, 10.2366943359375, 10.51068115234375, 10.78466796875, 11.05865478515625, 11.3326416015625, 11.60662841796875, 11.880615234375, 12.15460205078125, 12.4285888671875, 12.70257568359375, 12.9765625]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 15.0, 995.0, 10.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.98579788208008, -27.009933471679688, -21.03407096862793, -15.058208465576172, -9.082344055175781, -3.1064796447753906, 2.8693809509277344, 8.845245361328125, 14.821109771728516, 20.796974182128906, 26.772836685180664, 32.74869918823242, 38.72456359863281, 44.7004280090332, 50.67628860473633, 56.65215301513672, 62.62801742553711, 68.6038818359375, 74.57974243164062, 80.55560302734375, 86.5314712524414, 92.50733947753906, 98.48320007324219, 104.45906066894531, 110.43492126464844, 116.41078186035156, 122.38665008544922, 128.36251831054688, 134.33837890625, 140.31423950195312, 146.29010009765625, 152.26596069335938, 158.2418212890625, 164.21768188476562, 170.19354248046875, 176.16940307617188, 182.14527893066406, 188.1211395263672, 194.0970001220703, 200.07286071777344, 206.04873657226562, 212.02459716796875, 218.00045776367188, 223.976318359375, 229.9521942138672, 235.9280548095703, 241.90391540527344, 247.87977600097656, 253.8556365966797, 259.8315124511719, 265.807373046875, 271.7832336425781, 277.75909423828125, 283.7349548339844, 289.7108154296875, 295.6866760253906, 301.66253662109375, 307.6383972167969, 313.6142578125, 319.5901184082031, 325.56597900390625, 331.5418701171875, 337.5177001953125, 343.49359130859375, 349.4694519042969]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 9.0, 6.0, 4.0, 11.0, 4.0, 16.0, 13.0, 17.0, 21.0, 28.0, 37.0, 39.0, 55.0, 35.0, 40.0, 61.0, 45.0, 56.0, 52.0, 56.0, 59.0, 31.0, 39.0, 37.0, 38.0, 33.0, 32.0, 25.0, 21.0, 14.0, 21.0, 9.0, 8.0, 12.0, 7.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.368560791015625, -14.911890029907227, -14.455219268798828, -13.99854850769043, -13.541876792907715, -13.085206031799316, -12.628535270690918, -12.17186450958252, -11.715193748474121, -11.258522987365723, -10.801852226257324, -10.34518051147461, -9.888509750366211, -9.431838989257812, -8.975168228149414, -8.518497467041016, -8.061826705932617, -7.605155944824219, -7.148484706878662, -6.691813945770264, -6.235143184661865, -5.778471946716309, -5.32180118560791, -4.865130424499512, -4.408458709716797, -3.9517877101898193, -3.495116949081421, -3.0384459495544434, -2.581775188446045, -2.1251041889190674, -1.6684331893920898, -1.2117624282836914, -0.755091667175293, -0.2984207570552826, 0.15825015306472778, 0.6149210929870605, 1.0715919733047485, 1.5282628536224365, 1.984933853149414, 2.4416046142578125, 2.89827561378479, 3.3549466133117676, 3.811617374420166, 4.268288612365723, 4.724959373474121, 5.1816301345825195, 5.638300895690918, 6.094971656799316, 6.551642894744873, 7.0083136558532715, 7.464984893798828, 7.921655654907227, 8.378326416015625, 8.834997177124023, 9.291667938232422, 9.74833869934082, 10.205010414123535, 10.661681175231934, 11.118351936340332, 11.575023651123047, 12.031694412231445, 12.488365173339844, 12.945035934448242, 13.40170669555664, 13.858377456665039]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 1.0, 0.0, 3.0, 6.0, 9.0, 6.0, 6.0, 5.0, 6.0, 12.0, 8.0, 10.0, 26.0, 19.0, 37.0, 20.0, 26.0, 30.0, 32.0, 24.0, 38.0, 37.0, 30.0, 44.0, 47.0, 38.0, 44.0, 37.0, 38.0, 31.0, 37.0, 40.0, 23.0, 24.0, 28.0, 29.0, 24.0, 20.0, 15.0, 12.0, 14.0, 14.0, 11.0, 14.0, 8.0, 4.0, 4.0, 3.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.28515625, -1.2442169189453125, -1.203277587890625, -1.1623382568359375, -1.12139892578125, -1.0804595947265625, -1.039520263671875, -0.9985809326171875, -0.9576416015625, -0.9167022705078125, -0.875762939453125, -0.8348236083984375, -0.79388427734375, -0.7529449462890625, -0.712005615234375, -0.6710662841796875, -0.630126953125, -0.5891876220703125, -0.548248291015625, -0.5073089599609375, -0.46636962890625, -0.4254302978515625, -0.384490966796875, -0.3435516357421875, -0.3026123046875, -0.2616729736328125, -0.220733642578125, -0.1797943115234375, -0.13885498046875, -0.0979156494140625, -0.056976318359375, -0.0160369873046875, 0.02490234375, 0.0658416748046875, 0.106781005859375, 0.1477203369140625, 0.18865966796875, 0.2295989990234375, 0.270538330078125, 0.3114776611328125, 0.3524169921875, 0.3933563232421875, 0.434295654296875, 0.4752349853515625, 0.51617431640625, 0.5571136474609375, 0.598052978515625, 0.6389923095703125, 0.679931640625, 0.7208709716796875, 0.761810302734375, 0.8027496337890625, 0.84368896484375, 0.8846282958984375, 0.925567626953125, 0.9665069580078125, 1.0074462890625, 1.0483856201171875, 1.089324951171875, 1.1302642822265625, 1.17120361328125, 1.2121429443359375, 1.253082275390625, 1.2940216064453125, 1.3349609375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 8.0, 15.0, 16.0, 22.0, 35.0, 59.0, 82.0, 139.0, 186.0, 293.0, 439.0, 784.0, 1250.0, 1947.0, 3125.0, 4849.0, 8006.0, 13023.0, 21182.0, 33185.0, 50876.0, 74874.0, 103276.0, 129535.0, 141587.0, 131393.0, 106372.0, 76895.0, 52880.0, 34240.0, 21906.0, 13787.0, 8491.0, 5146.0, 3288.0, 1936.0, 1238.0, 779.0, 504.0, 321.0, 218.0, 128.0, 85.0, 55.0, 38.0, 15.0, 18.0, 14.0, 10.0, 4.0, 6.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.09735107421875, -0.09416389465332031, -0.09097671508789062, -0.08778953552246094, -0.08460235595703125, -0.08141517639160156, -0.07822799682617188, -0.07504081726074219, -0.0718536376953125, -0.06866645812988281, -0.06547927856445312, -0.06229209899902344, -0.05910491943359375, -0.05591773986816406, -0.052730560302734375, -0.04954338073730469, -0.046356201171875, -0.04316902160644531, -0.039981842041015625, -0.03679466247558594, -0.03360748291015625, -0.030420303344726562, -0.027233123779296875, -0.024045944213867188, -0.0208587646484375, -0.017671585083007812, -0.014484405517578125, -0.011297225952148438, -0.00811004638671875, -0.0049228668212890625, -0.001735687255859375, 0.0014514923095703125, 0.004638671875, 0.007825851440429688, 0.011013031005859375, 0.014200210571289062, 0.01738739013671875, 0.020574569702148438, 0.023761749267578125, 0.026948928833007812, 0.0301361083984375, 0.03332328796386719, 0.036510467529296875, 0.03969764709472656, 0.04288482666015625, 0.04607200622558594, 0.049259185791015625, 0.05244636535644531, 0.055633544921875, 0.05882072448730469, 0.062007904052734375, 0.06519508361816406, 0.06838226318359375, 0.07156944274902344, 0.07475662231445312, 0.07794380187988281, 0.0811309814453125, 0.08431816101074219, 0.08750534057617188, 0.09069252014160156, 0.09387969970703125, 0.09706687927246094, 0.10025405883789062, 0.10344123840332031, 0.10662841796875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 7.0, 10.0, 5.0, 13.0, 11.0, 14.0, 18.0, 17.0, 22.0, 25.0, 24.0, 25.0, 28.0, 27.0, 29.0, 30.0, 27.0, 42.0, 39.0, 43.0, 39.0, 1062.0, 42.0, 42.0, 40.0, 33.0, 26.0, 29.0, 28.0, 31.0, 35.0, 27.0, 18.0, 17.0, 14.0, 17.0, 18.0, 9.0, 10.0, 10.0, 3.0, 4.0, 6.0, 5.0, 1.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.92578125, -0.8986663818359375, -0.871551513671875, -0.8444366455078125, -0.81732177734375, -0.7902069091796875, -0.763092041015625, -0.7359771728515625, -0.7088623046875, -0.6817474365234375, -0.654632568359375, -0.6275177001953125, -0.60040283203125, -0.5732879638671875, -0.546173095703125, -0.5190582275390625, -0.491943359375, -0.4648284912109375, -0.437713623046875, -0.4105987548828125, -0.38348388671875, -0.3563690185546875, -0.329254150390625, -0.3021392822265625, -0.2750244140625, -0.2479095458984375, -0.220794677734375, -0.1936798095703125, -0.16656494140625, -0.1394500732421875, -0.112335205078125, -0.0852203369140625, -0.05810546875, -0.0309906005859375, -0.003875732421875, 0.0232391357421875, 0.05035400390625, 0.0774688720703125, 0.104583740234375, 0.1316986083984375, 0.1588134765625, 0.1859283447265625, 0.213043212890625, 0.2401580810546875, 0.26727294921875, 0.2943878173828125, 0.321502685546875, 0.3486175537109375, 0.375732421875, 0.4028472900390625, 0.429962158203125, 0.4570770263671875, 0.48419189453125, 0.5113067626953125, 0.538421630859375, 0.5655364990234375, 0.5926513671875, 0.6197662353515625, 0.646881103515625, 0.6739959716796875, 0.70111083984375, 0.7282257080078125, 0.755340576171875, 0.7824554443359375, 0.8095703125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 4.0, 7.0, 6.0, 12.0, 14.0, 23.0, 25.0, 56.0, 85.0, 124.0, 209.0, 361.0, 562.0, 997.0, 1643.0, 2726.0, 4523.0, 7966.0, 13041.0, 22449.0, 37534.0, 60233.0, 94887.0, 151978.0, 803255.0, 525999.0, 138772.0, 88174.0, 56202.0, 34418.0, 20634.0, 12331.0, 7297.0, 4311.0, 2527.0, 1505.0, 877.0, 522.0, 311.0, 200.0, 117.0, 80.0, 54.0, 26.0, 16.0, 14.0, 13.0, 4.0, 4.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08050537109375, -0.07806015014648438, -0.07561492919921875, -0.07316970825195312, -0.0707244873046875, -0.06827926635742188, -0.06583404541015625, -0.06338882446289062, -0.060943603515625, -0.058498382568359375, -0.05605316162109375, -0.053607940673828125, -0.0511627197265625, -0.048717498779296875, -0.04627227783203125, -0.043827056884765625, -0.0413818359375, -0.038936614990234375, -0.03649139404296875, -0.034046173095703125, -0.0316009521484375, -0.029155731201171875, -0.02671051025390625, -0.024265289306640625, -0.021820068359375, -0.019374847412109375, -0.01692962646484375, -0.014484405517578125, -0.0120391845703125, -0.009593963623046875, -0.00714874267578125, -0.004703521728515625, -0.00225830078125, 0.000186920166015625, 0.00263214111328125, 0.005077362060546875, 0.0075225830078125, 0.009967803955078125, 0.01241302490234375, 0.014858245849609375, 0.017303466796875, 0.019748687744140625, 0.02219390869140625, 0.024639129638671875, 0.0270843505859375, 0.029529571533203125, 0.03197479248046875, 0.034420013427734375, 0.036865234375, 0.039310455322265625, 0.04175567626953125, 0.044200897216796875, 0.0466461181640625, 0.049091339111328125, 0.05153656005859375, 0.053981781005859375, 0.056427001953125, 0.058872222900390625, 0.06131744384765625, 0.06376266479492188, 0.0662078857421875, 0.06865310668945312, 0.07109832763671875, 0.07354354858398438, 0.07598876953125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 3.0, 3.0, 8.0, 14.0, 18.0, 10.0, 14.0, 25.0, 21.0, 34.0, 29.0, 60.0, 42.0, 53.0, 67.0, 79.0, 83.0, 74.0, 58.0, 49.0, 47.0, 45.0, 31.0, 25.0, 18.0, 14.0, 14.0, 10.0, 8.0, 3.0, 4.0, 5.0, 6.0, 2.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0124664306640625, -0.012063980102539062, -0.011661529541015625, -0.011259078979492188, -0.01085662841796875, -0.010454177856445312, -0.010051727294921875, -0.009649276733398438, -0.009246826171875, -0.008844375610351562, -0.008441925048828125, -0.008039474487304688, -0.00763702392578125, -0.0072345733642578125, -0.006832122802734375, -0.0064296722412109375, -0.0060272216796875, -0.0056247711181640625, -0.005222320556640625, -0.0048198699951171875, -0.00441741943359375, -0.0040149688720703125, -0.003612518310546875, -0.0032100677490234375, -0.0028076171875, -0.0024051666259765625, -0.002002716064453125, -0.0016002655029296875, -0.00119781494140625, -0.0007953643798828125, -0.000392913818359375, 9.5367431640625e-06, 0.0004119873046875, 0.0008144378662109375, 0.001216888427734375, 0.0016193389892578125, 0.00202178955078125, 0.0024242401123046875, 0.002826690673828125, 0.0032291412353515625, 0.003631591796875, 0.0040340423583984375, 0.004436492919921875, 0.0048389434814453125, 0.00524139404296875, 0.0056438446044921875, 0.006046295166015625, 0.0064487457275390625, 0.0068511962890625, 0.0072536468505859375, 0.007656097412109375, 0.008058547973632812, 0.00846099853515625, 0.008863449096679688, 0.009265899658203125, 0.009668350219726562, 0.01007080078125, 0.010473251342773438, 0.010875701904296875, 0.011278152465820312, 0.01168060302734375, 0.012083053588867188, 0.012485504150390625, 0.012887954711914062, 0.0132904052734375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 8.0, 7.0, 13.0, 15.0, 19.0, 19.0, 19.0, 34.0, 43.0, 54.0, 72.0, 104.0, 174.0, 782.0, 15062.0, 1026210.0, 4941.0, 441.0, 133.0, 80.0, 66.0, 53.0, 42.0, 31.0, 22.0, 20.0, 15.0, 18.0, 7.0, 15.0, 5.0, 6.0, 1.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.267822265625, -0.258026123046875, -0.24822998046875, -0.238433837890625, -0.2286376953125, -0.218841552734375, -0.20904541015625, -0.199249267578125, -0.189453125, -0.179656982421875, -0.16986083984375, -0.160064697265625, -0.1502685546875, -0.140472412109375, -0.13067626953125, -0.120880126953125, -0.111083984375, -0.101287841796875, -0.09149169921875, -0.081695556640625, -0.0718994140625, -0.062103271484375, -0.05230712890625, -0.042510986328125, -0.03271484375, -0.022918701171875, -0.01312255859375, -0.003326416015625, 0.0064697265625, 0.016265869140625, 0.02606201171875, 0.035858154296875, 0.045654296875, 0.055450439453125, 0.06524658203125, 0.075042724609375, 0.0848388671875, 0.094635009765625, 0.10443115234375, 0.114227294921875, 0.1240234375, 0.133819580078125, 0.14361572265625, 0.153411865234375, 0.1632080078125, 0.173004150390625, 0.18280029296875, 0.192596435546875, 0.202392578125, 0.212188720703125, 0.22198486328125, 0.231781005859375, 0.2415771484375, 0.251373291015625, 0.26116943359375, 0.270965576171875, 0.28076171875, 0.290557861328125, 0.30035400390625, 0.310150146484375, 0.3199462890625, 0.329742431640625, 0.33953857421875, 0.349334716796875, 0.359130859375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 53.0, 521.0, 386.0, 39.0, 8.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14927704632282257, -0.14640367031097412, -0.14353029429912567, -0.14065691828727722, -0.13778354227542877, -0.13491016626358032, -0.13203679025173187, -0.12916341423988342, -0.12629005312919617, -0.12341667711734772, -0.12054330110549927, -0.11766992509365082, -0.11479654908180237, -0.11192318052053452, -0.10904980450868607, -0.10617642849683762, -0.10330304503440857, -0.10042966902256012, -0.09755629301071167, -0.09468291699886322, -0.09180954098701477, -0.08893617242574692, -0.08606279641389847, -0.08318942040205002, -0.08031604439020157, -0.07744266837835312, -0.07456929236650467, -0.07169591635465622, -0.06882254779338837, -0.06594917178153992, -0.06307579576969147, -0.06020241975784302, -0.05732904374599457, -0.05445566773414612, -0.05158229172229767, -0.04870891943573952, -0.04583554342389107, -0.04296216741204262, -0.04008879512548447, -0.03721541911363602, -0.03434204310178757, -0.03146866708993912, -0.028595292940735817, -0.025721918791532516, -0.022848542779684067, -0.019975166767835617, -0.017101792618632317, -0.014228418469429016, -0.011355042457580566, -0.008481667377054691, -0.005608292296528816, -0.002734917216002941, 0.00013845786452293396, 0.003011832945048809, 0.005885208025574684, 0.008758582174777985, 0.011631958186626434, 0.01450533326715231, 0.017378708347678185, 0.020252082496881485, 0.023125458508729935, 0.025998834520578384, 0.028872208669781685, 0.031745582818984985, 0.034618958830833435]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 6.0, 5.0, 8.0, 10.0, 11.0, 10.0, 13.0, 11.0, 8.0, 25.0, 22.0, 21.0, 29.0, 14.0, 27.0, 27.0, 34.0, 33.0, 29.0, 34.0, 38.0, 42.0, 40.0, 40.0, 24.0, 48.0, 49.0, 33.0, 31.0, 34.0, 33.0, 26.0, 20.0, 20.0, 28.0, 12.0, 8.0, 16.0, 7.0, 15.0, 14.0, 9.0, 11.0, 5.0, 6.0, 4.0, 6.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.010895252227783203, -0.010523577220737934, -0.010151902213692665, -0.009780227206647396, -0.009408552199602127, -0.009036877192556858, -0.008665202185511589, -0.00829352717846632, -0.007921852171421051, -0.007550177164375782, -0.007178502157330513, -0.006806827150285244, -0.006435152143239975, -0.006063477136194706, -0.005691802129149437, -0.005320127122104168, -0.004948452115058899, -0.00457677710801363, -0.004205102100968361, -0.003833427093923092, -0.003461752086877823, -0.003090077079832554, -0.002718402072787285, -0.002346727065742016, -0.001975052058696747, -0.0016033770516514778, -0.0012317020446062088, -0.0008600270375609398, -0.0004883520305156708, -0.00011667702347040176, 0.00025499798357486725, 0.0006266729906201363, 0.0009983479976654053, 0.0013700230047106743, 0.0017416980117559433, 0.0021133730188012123, 0.0024850480258464813, 0.0028567230328917503, 0.0032283980399370193, 0.0036000730469822884, 0.003971748054027557, 0.004343423061072826, 0.004715098068118095, 0.005086773075163364, 0.005458448082208633, 0.0058301230892539024, 0.0062017980962991714, 0.0065734731033444405, 0.0069451481103897095, 0.0073168231174349785, 0.0076884981244802475, 0.008060173131525517, 0.008431848138570786, 0.008803523145616055, 0.009175198152661324, 0.009546873159706593, 0.009918548166751862, 0.01029022317379713, 0.0106618981808424, 0.011033573187887669, 0.011405248194932938, 0.011776923201978207, 0.012148598209023476, 0.012520273216068745, 0.012891948223114014]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 1.0, 0.0, 3.0, 6.0, 9.0, 6.0, 6.0, 5.0, 6.0, 12.0, 8.0, 10.0, 26.0, 19.0, 37.0, 20.0, 26.0, 30.0, 32.0, 23.0, 39.0, 37.0, 30.0, 44.0, 48.0, 37.0, 44.0, 37.0, 38.0, 30.0, 38.0, 40.0, 23.0, 24.0, 28.0, 29.0, 25.0, 19.0, 15.0, 13.0, 13.0, 14.0, 11.0, 14.0, 8.0, 4.0, 4.0, 3.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2861328125, -1.2451629638671875, -1.204193115234375, -1.1632232666015625, -1.12225341796875, -1.0812835693359375, -1.040313720703125, -0.9993438720703125, -0.9583740234375, -0.9174041748046875, -0.876434326171875, -0.8354644775390625, -0.79449462890625, -0.7535247802734375, -0.712554931640625, -0.6715850830078125, -0.630615234375, -0.5896453857421875, -0.548675537109375, -0.5077056884765625, -0.46673583984375, -0.4257659912109375, -0.384796142578125, -0.3438262939453125, -0.3028564453125, -0.2618865966796875, -0.220916748046875, -0.1799468994140625, -0.13897705078125, -0.0980072021484375, -0.057037353515625, -0.0160675048828125, 0.02490234375, 0.0658721923828125, 0.106842041015625, 0.1478118896484375, 0.18878173828125, 0.2297515869140625, 0.270721435546875, 0.3116912841796875, 0.3526611328125, 0.3936309814453125, 0.434600830078125, 0.4755706787109375, 0.51654052734375, 0.5575103759765625, 0.598480224609375, 0.6394500732421875, 0.680419921875, 0.7213897705078125, 0.762359619140625, 0.8033294677734375, 0.84429931640625, 0.8852691650390625, 0.926239013671875, 0.9672088623046875, 1.0081787109375, 1.0491485595703125, 1.090118408203125, 1.1310882568359375, 1.17205810546875, 1.2130279541015625, 1.253997802734375, 1.2949676513671875, 1.3359375]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 8.0, 8.0, 6.0, 10.0, 14.0, 20.0, 30.0, 36.0, 45.0, 71.0, 112.0, 153.0, 270.0, 383.0, 686.0, 1105.0, 1980.0, 3397.0, 6163.0, 11204.0, 21155.0, 40152.0, 76810.0, 152136.0, 265649.0, 223831.0, 115814.0, 59049.0, 30908.0, 16625.0, 9030.0, 4846.0, 2753.0, 1602.0, 929.0, 581.0, 356.0, 189.0, 137.0, 92.0, 67.0, 44.0, 27.0, 26.0, 11.0, 15.0, 6.0, 4.0, 7.0, 1.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.732421875, -1.677947998046875, -1.62347412109375, -1.569000244140625, -1.5145263671875, -1.460052490234375, -1.40557861328125, -1.351104736328125, -1.296630859375, -1.242156982421875, -1.18768310546875, -1.133209228515625, -1.0787353515625, -1.024261474609375, -0.96978759765625, -0.915313720703125, -0.86083984375, -0.806365966796875, -0.75189208984375, -0.697418212890625, -0.6429443359375, -0.588470458984375, -0.53399658203125, -0.479522705078125, -0.425048828125, -0.370574951171875, -0.31610107421875, -0.261627197265625, -0.2071533203125, -0.152679443359375, -0.09820556640625, -0.043731689453125, 0.0107421875, 0.065216064453125, 0.11968994140625, 0.174163818359375, 0.2286376953125, 0.283111572265625, 0.33758544921875, 0.392059326171875, 0.446533203125, 0.501007080078125, 0.55548095703125, 0.609954833984375, 0.6644287109375, 0.718902587890625, 0.77337646484375, 0.827850341796875, 0.88232421875, 0.936798095703125, 0.99127197265625, 1.045745849609375, 1.1002197265625, 1.154693603515625, 1.20916748046875, 1.263641357421875, 1.318115234375, 1.372589111328125, 1.42706298828125, 1.481536865234375, 1.5360107421875, 1.590484619140625, 1.64495849609375, 1.699432373046875, 1.75390625]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 7.0, 11.0, 7.0, 12.0, 8.0, 8.0, 15.0, 23.0, 20.0, 26.0, 25.0, 29.0, 33.0, 36.0, 56.0, 69.0, 110.0, 149.0, 285.0, 1318.0, 201.0, 120.0, 86.0, 66.0, 37.0, 44.0, 37.0, 29.0, 25.0, 34.0, 25.0, 17.0, 14.0, 11.0, 12.0, 8.0, 6.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.251953125, -3.147705078125, -3.04345703125, -2.939208984375, -2.8349609375, -2.730712890625, -2.62646484375, -2.522216796875, -2.41796875, -2.313720703125, -2.20947265625, -2.105224609375, -2.0009765625, -1.896728515625, -1.79248046875, -1.688232421875, -1.583984375, -1.479736328125, -1.37548828125, -1.271240234375, -1.1669921875, -1.062744140625, -0.95849609375, -0.854248046875, -0.75, -0.645751953125, -0.54150390625, -0.437255859375, -0.3330078125, -0.228759765625, -0.12451171875, -0.020263671875, 0.083984375, 0.188232421875, 0.29248046875, 0.396728515625, 0.5009765625, 0.605224609375, 0.70947265625, 0.813720703125, 0.91796875, 1.022216796875, 1.12646484375, 1.230712890625, 1.3349609375, 1.439208984375, 1.54345703125, 1.647705078125, 1.751953125, 1.856201171875, 1.96044921875, 2.064697265625, 2.1689453125, 2.273193359375, 2.37744140625, 2.481689453125, 2.5859375, 2.690185546875, 2.79443359375, 2.898681640625, 3.0029296875, 3.107177734375, 3.21142578125, 3.315673828125, 3.419921875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 5.0, 8.0, 8.0, 8.0, 21.0, 32.0, 28.0, 43.0, 53.0, 72.0, 105.0, 145.0, 193.0, 279.0, 409.0, 801.0, 2896.0, 30113.0, 939653.0, 2106004.0, 57802.0, 4469.0, 973.0, 507.0, 317.0, 178.0, 157.0, 111.0, 72.0, 72.0, 45.0, 27.0, 30.0, 17.0, 18.0, 8.0, 5.0, 2.0, 6.0, 3.0, 1.0, 3.0, 0.0, 5.0, 4.0], "bins": [-7.0625, -6.877197265625, -6.69189453125, -6.506591796875, -6.3212890625, -6.135986328125, -5.95068359375, -5.765380859375, -5.580078125, -5.394775390625, -5.20947265625, -5.024169921875, -4.8388671875, -4.653564453125, -4.46826171875, -4.282958984375, -4.09765625, -3.912353515625, -3.72705078125, -3.541748046875, -3.3564453125, -3.171142578125, -2.98583984375, -2.800537109375, -2.615234375, -2.429931640625, -2.24462890625, -2.059326171875, -1.8740234375, -1.688720703125, -1.50341796875, -1.318115234375, -1.1328125, -0.947509765625, -0.76220703125, -0.576904296875, -0.3916015625, -0.206298828125, -0.02099609375, 0.164306640625, 0.349609375, 0.534912109375, 0.72021484375, 0.905517578125, 1.0908203125, 1.276123046875, 1.46142578125, 1.646728515625, 1.83203125, 2.017333984375, 2.20263671875, 2.387939453125, 2.5732421875, 2.758544921875, 2.94384765625, 3.129150390625, 3.314453125, 3.499755859375, 3.68505859375, 3.870361328125, 4.0556640625, 4.240966796875, 4.42626953125, 4.611572265625, 4.796875]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 24.0, 620.0, 367.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.82633209228516, -70.67564392089844, -68.52495574951172, -66.37425994873047, -64.22357177734375, -62.07288360595703, -59.92219543457031, -57.77150344848633, -55.620811462402344, -53.470123291015625, -51.31943130493164, -49.16874313354492, -47.01805114746094, -44.86736297607422, -42.7166748046875, -40.565982818603516, -38.4152946472168, -36.26460647583008, -34.113914489746094, -31.963226318359375, -29.81253433227539, -27.661846160888672, -25.51115608215332, -23.36046600341797, -21.209775924682617, -19.059085845947266, -16.908395767211914, -14.757706642150879, -12.607016563415527, -10.456326484680176, -8.30563735961914, -6.154947280883789, -4.0042572021484375, -1.853567361831665, 0.2971224784851074, 2.447812080383301, 4.598502159118652, 6.749192237854004, 8.899881362915039, 11.05057144165039, 13.201261520385742, 15.351951599121094, 17.502641677856445, 19.653331756591797, 21.804019927978516, 23.9547119140625, 26.10540008544922, 28.25609016418457, 30.406780242919922, 32.55746841430664, 34.708160400390625, 36.858848571777344, 39.00954055786133, 41.16022872924805, 43.31092071533203, 45.46160888671875, 47.61229705810547, 49.76298522949219, 51.91367721557617, 54.06436538696289, 56.215057373046875, 58.365745544433594, 60.51643371582031, 62.6671257019043, 64.81781768798828]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 7.0, 6.0, 5.0, 11.0, 10.0, 13.0, 11.0, 7.0, 7.0, 22.0, 23.0, 22.0, 29.0, 33.0, 29.0, 28.0, 29.0, 26.0, 30.0, 31.0, 33.0, 39.0, 41.0, 38.0, 39.0, 37.0, 45.0, 39.0, 30.0, 38.0, 36.0, 22.0, 22.0, 18.0, 19.0, 13.0, 19.0, 17.0, 16.0, 6.0, 15.0, 11.0, 7.0, 3.0, 3.0, 4.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.894298553466797, -6.662705898284912, -6.431113243103027, -6.199520587921143, -5.967927932739258, -5.736335754394531, -5.504742622375488, -5.273150444030762, -5.041557788848877, -4.809965133666992, -4.578372478485107, -4.346779823303223, -4.115187168121338, -3.8835947513580322, -3.6520020961761475, -3.420409679412842, -3.188816785812378, -2.957224130630493, -2.7256314754486084, -2.4940390586853027, -2.262446403503418, -2.030853748321533, -1.7992610931396484, -1.5676685571670532, -1.3360759019851685, -1.1044832468032837, -0.8728907108306885, -0.6412980556488037, -0.4097054600715637, -0.17811286449432373, 0.053479790687561035, 0.28507232666015625, 0.516664981842041, 0.748257577419281, 0.979850172996521, 1.2114428281784058, 1.443035364151001, 1.6746280193328857, 1.9062206745147705, 2.137813091278076, 2.369405746459961, 2.6009984016418457, 2.8325910568237305, 3.0641837120056152, 3.295776128768921, 3.5273687839508057, 3.7589614391326904, 3.990553855895996, 4.222146987915039, 4.453739643096924, 4.685332298278809, 4.916924953460693, 5.148517608642578, 5.380109786987305, 5.611702919006348, 5.843295097351074, 6.074887752532959, 6.306480407714844, 6.5380730628967285, 6.769665718078613, 7.001258373260498, 7.232851028442383, 7.464443206787109, 7.696035861968994, 7.927628517150879]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 1.0, 4.0, 2.0, 4.0, 4.0, 8.0, 2.0, 6.0, 8.0, 16.0, 17.0, 14.0, 13.0, 20.0, 23.0, 28.0, 29.0, 26.0, 25.0, 37.0, 34.0, 44.0, 41.0, 42.0, 37.0, 34.0, 45.0, 41.0, 53.0, 26.0, 35.0, 36.0, 24.0, 28.0, 25.0, 31.0, 23.0, 17.0, 15.0, 14.0, 16.0, 13.0, 12.0, 10.0, 2.0, 6.0, 5.0, 3.0, 2.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4248046875, -1.382110595703125, -1.33941650390625, -1.296722412109375, -1.2540283203125, -1.211334228515625, -1.16864013671875, -1.125946044921875, -1.083251953125, -1.040557861328125, -0.99786376953125, -0.955169677734375, -0.9124755859375, -0.869781494140625, -0.82708740234375, -0.784393310546875, -0.74169921875, -0.699005126953125, -0.65631103515625, -0.613616943359375, -0.5709228515625, -0.528228759765625, -0.48553466796875, -0.442840576171875, -0.400146484375, -0.357452392578125, -0.31475830078125, -0.272064208984375, -0.2293701171875, -0.186676025390625, -0.14398193359375, -0.101287841796875, -0.05859375, -0.015899658203125, 0.02679443359375, 0.069488525390625, 0.1121826171875, 0.154876708984375, 0.19757080078125, 0.240264892578125, 0.282958984375, 0.325653076171875, 0.36834716796875, 0.411041259765625, 0.4537353515625, 0.496429443359375, 0.53912353515625, 0.581817626953125, 0.62451171875, 0.667205810546875, 0.70989990234375, 0.752593994140625, 0.7952880859375, 0.837982177734375, 0.88067626953125, 0.923370361328125, 0.966064453125, 1.008758544921875, 1.05145263671875, 1.094146728515625, 1.1368408203125, 1.179534912109375, 1.22222900390625, 1.264923095703125, 1.3076171875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 6.0, 14.0, 12.0, 12.0, 11.0, 20.0, 22.0, 22.0, 30.0, 49.0, 51.0, 67.0, 71.0, 121.0, 190.0, 218.0, 282.0, 454.0, 2124.0, 3807447.0, 380357.0, 1122.0, 389.0, 290.0, 235.0, 142.0, 99.0, 87.0, 69.0, 55.0, 35.0, 28.0, 25.0, 24.0, 21.0, 20.0, 17.0, 9.0, 3.0, 5.0, 7.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0], "bins": [-26.890625, -26.119873046875, -25.34912109375, -24.578369140625, -23.8076171875, -23.036865234375, -22.26611328125, -21.495361328125, -20.724609375, -19.953857421875, -19.18310546875, -18.412353515625, -17.6416015625, -16.870849609375, -16.10009765625, -15.329345703125, -14.55859375, -13.787841796875, -13.01708984375, -12.246337890625, -11.4755859375, -10.704833984375, -9.93408203125, -9.163330078125, -8.392578125, -7.621826171875, -6.85107421875, -6.080322265625, -5.3095703125, -4.538818359375, -3.76806640625, -2.997314453125, -2.2265625, -1.455810546875, -0.68505859375, 0.085693359375, 0.8564453125, 1.627197265625, 2.39794921875, 3.168701171875, 3.939453125, 4.710205078125, 5.48095703125, 6.251708984375, 7.0224609375, 7.793212890625, 8.56396484375, 9.334716796875, 10.10546875, 10.876220703125, 11.64697265625, 12.417724609375, 13.1884765625, 13.959228515625, 14.72998046875, 15.500732421875, 16.271484375, 17.042236328125, 17.81298828125, 18.583740234375, 19.3544921875, 20.125244140625, 20.89599609375, 21.666748046875, 22.4375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 5.0, 4.0, 11.0, 8.0, 5.0, 11.0, 13.0, 18.0, 24.0, 36.0, 56.0, 82.0, 85.0, 128.0, 167.0, 229.0, 348.0, 487.0, 592.0, 512.0, 313.0, 253.0, 182.0, 134.0, 90.0, 67.0, 61.0, 37.0, 42.0, 20.0, 17.0, 11.0, 6.0, 2.0, 2.0, 8.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.548828125, -2.4808349609375, -2.412841796875, -2.3448486328125, -2.27685546875, -2.2088623046875, -2.140869140625, -2.0728759765625, -2.0048828125, -1.9368896484375, -1.868896484375, -1.8009033203125, -1.73291015625, -1.6649169921875, -1.596923828125, -1.5289306640625, -1.4609375, -1.3929443359375, -1.324951171875, -1.2569580078125, -1.18896484375, -1.1209716796875, -1.052978515625, -0.9849853515625, -0.9169921875, -0.8489990234375, -0.781005859375, -0.7130126953125, -0.64501953125, -0.5770263671875, -0.509033203125, -0.4410400390625, -0.373046875, -0.3050537109375, -0.237060546875, -0.1690673828125, -0.10107421875, -0.0330810546875, 0.034912109375, 0.1029052734375, 0.1708984375, 0.2388916015625, 0.306884765625, 0.3748779296875, 0.44287109375, 0.5108642578125, 0.578857421875, 0.6468505859375, 0.71484375, 0.7828369140625, 0.850830078125, 0.9188232421875, 0.98681640625, 1.0548095703125, 1.122802734375, 1.1907958984375, 1.2587890625, 1.3267822265625, 1.394775390625, 1.4627685546875, 1.53076171875, 1.5987548828125, 1.666748046875, 1.7347412109375, 1.802734375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 7.0, 10.0, 15.0, 20.0, 27.0, 31.0, 47.0, 89.0, 206.0, 1133.0, 119021.0, 4062376.0, 10468.0, 449.0, 154.0, 82.0, 50.0, 33.0, 20.0, 19.0, 8.0, 9.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.0, -9.422119140625, -8.84423828125, -8.266357421875, -7.6884765625, -7.110595703125, -6.53271484375, -5.954833984375, -5.376953125, -4.799072265625, -4.22119140625, -3.643310546875, -3.0654296875, -2.487548828125, -1.90966796875, -1.331787109375, -0.75390625, -0.176025390625, 0.40185546875, 0.979736328125, 1.5576171875, 2.135498046875, 2.71337890625, 3.291259765625, 3.869140625, 4.447021484375, 5.02490234375, 5.602783203125, 6.1806640625, 6.758544921875, 7.33642578125, 7.914306640625, 8.4921875, 9.070068359375, 9.64794921875, 10.225830078125, 10.8037109375, 11.381591796875, 11.95947265625, 12.537353515625, 13.115234375, 13.693115234375, 14.27099609375, 14.848876953125, 15.4267578125, 16.004638671875, 16.58251953125, 17.160400390625, 17.73828125, 18.316162109375, 18.89404296875, 19.471923828125, 20.0498046875, 20.627685546875, 21.20556640625, 21.783447265625, 22.361328125, 22.939208984375, 23.51708984375, 24.094970703125, 24.6728515625, 25.250732421875, 25.82861328125, 26.406494140625, 26.984375]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 350.0, 651.0, 11.0, 1.0, 1.0], "bins": [-202.1901397705078, -198.8300323486328, -195.46990966796875, -192.10980224609375, -188.7496795654297, -185.3895721435547, -182.02944946289062, -178.66934204101562, -175.30921936035156, -171.94911193847656, -168.5889892578125, -165.2288818359375, -161.86875915527344, -158.50865173339844, -155.14852905273438, -151.78842163085938, -148.42831420898438, -145.06820678710938, -141.7080841064453, -138.3479766845703, -134.98785400390625, -131.62774658203125, -128.2676239013672, -124.90751647949219, -121.54739379882812, -118.1872787475586, -114.82716369628906, -111.46704864501953, -108.10693359375, -104.74681854248047, -101.38670349121094, -98.02659606933594, -94.66647338867188, -91.30635833740234, -87.94624328613281, -84.58612823486328, -81.22601318359375, -77.86589813232422, -74.50578308105469, -71.14567565917969, -67.78555297851562, -64.4254379272461, -61.06532287597656, -57.70520782470703, -54.3450927734375, -50.98497772216797, -47.6248664855957, -44.26475143432617, -40.90463638305664, -37.54452133178711, -34.18440628051758, -30.82429313659668, -27.46417808532715, -24.104063034057617, -20.74394989013672, -17.383834838867188, -14.023719787597656, -10.663604736328125, -7.30349063873291, -3.9433765411376953, -0.5832614898681641, 2.776853561401367, 6.136966705322266, 9.497081756591797, 12.857196807861328]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 17.0, 9.0, 13.0, 11.0, 27.0, 25.0, 27.0, 39.0, 40.0, 36.0, 39.0, 50.0, 44.0, 68.0, 45.0, 53.0, 50.0, 56.0, 38.0, 32.0, 29.0, 56.0, 30.0, 25.0, 23.0, 26.0, 20.0, 15.0, 8.0, 8.0, 7.0, 5.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.604053497314453, -13.173945426940918, -12.743837356567383, -12.313729286193848, -11.883621215820312, -11.453513145446777, -11.023405075073242, -10.593297004699707, -10.163188934326172, -9.733080863952637, -9.302972793579102, -8.872864723205566, -8.442756652832031, -8.012648582458496, -7.582540512084961, -7.152432441711426, -6.722324848175049, -6.292216777801514, -5.8621087074279785, -5.432000637054443, -5.001892566680908, -4.571784973144531, -4.141676902770996, -3.711568593978882, -3.2814605236053467, -2.8513524532318115, -2.4212443828582764, -1.9911364316940308, -1.5610283613204956, -1.13092041015625, -0.7008123397827148, -0.2707042694091797, 0.15940380096435547, 0.5895118713378906, 1.0196199417114258, 1.4497278928756714, 1.8798359632492065, 2.309943914413452, 2.7400519847869873, 3.1701600551605225, 3.6002681255340576, 4.030375957489014, 4.460484027862549, 4.890592098236084, 5.320700168609619, 5.750808238983154, 6.1809163093566895, 6.611024379730225, 7.04113245010376, 7.471240520477295, 7.90134859085083, 8.331456184387207, 8.761564254760742, 9.191672325134277, 9.621780395507812, 10.051888465881348, 10.481996536254883, 10.912104606628418, 11.342212677001953, 11.772320747375488, 12.202428817749023, 12.632536888122559, 13.062644958496094, 13.492753028869629, 13.922861099243164]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 0.0, 1.0, 5.0, 2.0, 3.0, 8.0, 8.0, 5.0, 7.0, 9.0, 16.0, 15.0, 13.0, 21.0, 15.0, 19.0, 24.0, 22.0, 35.0, 26.0, 28.0, 43.0, 23.0, 35.0, 51.0, 35.0, 35.0, 27.0, 37.0, 45.0, 38.0, 36.0, 38.0, 26.0, 30.0, 24.0, 26.0, 25.0, 14.0, 15.0, 24.0, 13.0, 14.0, 11.0, 10.0, 15.0, 5.0, 5.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 4.0], "bins": [-1.4365234375, -1.3961029052734375, -1.355682373046875, -1.3152618408203125, -1.27484130859375, -1.2344207763671875, -1.194000244140625, -1.1535797119140625, -1.1131591796875, -1.0727386474609375, -1.032318115234375, -0.9918975830078125, -0.95147705078125, -0.9110565185546875, -0.870635986328125, -0.8302154541015625, -0.789794921875, -0.7493743896484375, -0.708953857421875, -0.6685333251953125, -0.62811279296875, -0.5876922607421875, -0.547271728515625, -0.5068511962890625, -0.4664306640625, -0.4260101318359375, -0.385589599609375, -0.3451690673828125, -0.30474853515625, -0.2643280029296875, -0.223907470703125, -0.1834869384765625, -0.14306640625, -0.1026458740234375, -0.062225341796875, -0.0218048095703125, 0.01861572265625, 0.0590362548828125, 0.099456787109375, 0.1398773193359375, 0.1802978515625, 0.2207183837890625, 0.261138916015625, 0.3015594482421875, 0.34197998046875, 0.3824005126953125, 0.422821044921875, 0.4632415771484375, 0.503662109375, 0.5440826416015625, 0.584503173828125, 0.6249237060546875, 0.66534423828125, 0.7057647705078125, 0.746185302734375, 0.7866058349609375, 0.8270263671875, 0.8674468994140625, 0.907867431640625, 0.9482879638671875, 0.98870849609375, 1.0291290283203125, 1.069549560546875, 1.1099700927734375, 1.150390625]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 0.0, 7.0, 8.0, 9.0, 14.0, 12.0, 19.0, 32.0, 50.0, 58.0, 94.0, 118.0, 158.0, 236.0, 335.0, 459.0, 684.0, 1098.0, 1813.0, 3598.0, 9468.0, 34481.0, 155961.0, 467910.0, 281740.0, 63368.0, 15206.0, 5170.0, 2444.0, 1265.0, 829.0, 514.0, 388.0, 275.0, 215.0, 140.0, 107.0, 90.0, 52.0, 39.0, 30.0, 17.0, 17.0, 10.0, 8.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.59765625, -0.579925537109375, -0.56219482421875, -0.544464111328125, -0.5267333984375, -0.509002685546875, -0.49127197265625, -0.473541259765625, -0.455810546875, -0.438079833984375, -0.42034912109375, -0.402618408203125, -0.3848876953125, -0.367156982421875, -0.34942626953125, -0.331695556640625, -0.31396484375, -0.296234130859375, -0.27850341796875, -0.260772705078125, -0.2430419921875, -0.225311279296875, -0.20758056640625, -0.189849853515625, -0.172119140625, -0.154388427734375, -0.13665771484375, -0.118927001953125, -0.1011962890625, -0.083465576171875, -0.06573486328125, -0.048004150390625, -0.0302734375, -0.012542724609375, 0.00518798828125, 0.022918701171875, 0.0406494140625, 0.058380126953125, 0.07611083984375, 0.093841552734375, 0.111572265625, 0.129302978515625, 0.14703369140625, 0.164764404296875, 0.1824951171875, 0.200225830078125, 0.21795654296875, 0.235687255859375, 0.25341796875, 0.271148681640625, 0.28887939453125, 0.306610107421875, 0.3243408203125, 0.342071533203125, 0.35980224609375, 0.377532958984375, 0.395263671875, 0.412994384765625, 0.43072509765625, 0.448455810546875, 0.4661865234375, 0.483917236328125, 0.50164794921875, 0.519378662109375, 0.537109375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 4.0, 9.0, 8.0, 6.0, 6.0, 8.0, 13.0, 10.0, 14.0, 19.0, 28.0, 25.0, 34.0, 26.0, 29.0, 39.0, 45.0, 48.0, 47.0, 45.0, 39.0, 1070.0, 32.0, 40.0, 37.0, 33.0, 29.0, 42.0, 27.0, 31.0, 28.0, 29.0, 15.0, 21.0, 14.0, 13.0, 15.0, 9.0, 12.0, 8.0, 5.0, 4.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.00390625, -0.97076416015625, -0.9376220703125, -0.90447998046875, -0.871337890625, -0.83819580078125, -0.8050537109375, -0.77191162109375, -0.73876953125, -0.70562744140625, -0.6724853515625, -0.63934326171875, -0.606201171875, -0.57305908203125, -0.5399169921875, -0.50677490234375, -0.4736328125, -0.44049072265625, -0.4073486328125, -0.37420654296875, -0.341064453125, -0.30792236328125, -0.2747802734375, -0.24163818359375, -0.20849609375, -0.17535400390625, -0.1422119140625, -0.10906982421875, -0.075927734375, -0.04278564453125, -0.0096435546875, 0.02349853515625, 0.056640625, 0.08978271484375, 0.1229248046875, 0.15606689453125, 0.189208984375, 0.22235107421875, 0.2554931640625, 0.28863525390625, 0.32177734375, 0.35491943359375, 0.3880615234375, 0.42120361328125, 0.454345703125, 0.48748779296875, 0.5206298828125, 0.55377197265625, 0.5869140625, 0.62005615234375, 0.6531982421875, 0.68634033203125, 0.719482421875, 0.75262451171875, 0.7857666015625, 0.81890869140625, 0.85205078125, 0.88519287109375, 0.9183349609375, 0.95147705078125, 0.984619140625, 1.01776123046875, 1.0509033203125, 1.08404541015625, 1.1171875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 12.0, 9.0, 8.0, 10.0, 16.0, 29.0, 38.0, 38.0, 64.0, 81.0, 117.0, 150.0, 196.0, 291.0, 444.0, 643.0, 898.0, 1468.0, 2322.0, 4286.0, 9274.0, 31126.0, 229542.0, 1628016.0, 146640.0, 23304.0, 7888.0, 3756.0, 2251.0, 1349.0, 919.0, 593.0, 401.0, 288.0, 193.0, 120.0, 91.0, 75.0, 45.0, 40.0, 26.0, 26.0, 8.0, 10.0, 12.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.5703125, -0.5527114868164062, -0.5351104736328125, -0.5175094604492188, -0.499908447265625, -0.48230743408203125, -0.4647064208984375, -0.44710540771484375, -0.42950439453125, -0.41190338134765625, -0.3943023681640625, -0.37670135498046875, -0.359100341796875, -0.34149932861328125, -0.3238983154296875, -0.30629730224609375, -0.2886962890625, -0.27109527587890625, -0.2534942626953125, -0.23589324951171875, -0.218292236328125, -0.20069122314453125, -0.1830902099609375, -0.16548919677734375, -0.14788818359375, -0.13028717041015625, -0.1126861572265625, -0.09508514404296875, -0.077484130859375, -0.05988311767578125, -0.0422821044921875, -0.02468109130859375, -0.007080078125, 0.01052093505859375, 0.0281219482421875, 0.04572296142578125, 0.063323974609375, 0.08092498779296875, 0.0985260009765625, 0.11612701416015625, 0.13372802734375, 0.15132904052734375, 0.1689300537109375, 0.18653106689453125, 0.204132080078125, 0.22173309326171875, 0.2393341064453125, 0.25693511962890625, 0.2745361328125, 0.29213714599609375, 0.3097381591796875, 0.32733917236328125, 0.344940185546875, 0.36254119873046875, 0.3801422119140625, 0.39774322509765625, 0.41534423828125, 0.43294525146484375, 0.4505462646484375, 0.46814727783203125, 0.485748291015625, 0.5033493041992188, 0.5209503173828125, 0.5385513305664062, 0.55615234375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 3.0, 0.0, 6.0, 8.0, 13.0, 15.0, 29.0, 57.0, 140.0, 240.0, 216.0, 140.0, 56.0, 21.0, 12.0, 11.0, 5.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1961669921875, -0.18961334228515625, -0.1830596923828125, -0.17650604248046875, -0.169952392578125, -0.16339874267578125, -0.1568450927734375, -0.15029144287109375, -0.14373779296875, -0.13718414306640625, -0.1306304931640625, -0.12407684326171875, -0.117523193359375, -0.11096954345703125, -0.1044158935546875, -0.09786224365234375, -0.09130859375, -0.08475494384765625, -0.0782012939453125, -0.07164764404296875, -0.065093994140625, -0.05854034423828125, -0.0519866943359375, -0.04543304443359375, -0.03887939453125, -0.03232574462890625, -0.0257720947265625, -0.01921844482421875, -0.012664794921875, -0.00611114501953125, 0.0004425048828125, 0.00699615478515625, 0.0135498046875, 0.02010345458984375, 0.0266571044921875, 0.03321075439453125, 0.039764404296875, 0.04631805419921875, 0.0528717041015625, 0.05942535400390625, 0.06597900390625, 0.07253265380859375, 0.0790863037109375, 0.08563995361328125, 0.092193603515625, 0.09874725341796875, 0.1053009033203125, 0.11185455322265625, 0.118408203125, 0.12496185302734375, 0.1315155029296875, 0.13806915283203125, 0.144622802734375, 0.15117645263671875, 0.1577301025390625, 0.16428375244140625, 0.17083740234375, 0.17739105224609375, 0.1839447021484375, 0.19049835205078125, 0.197052001953125, 0.20360565185546875, 0.2101593017578125, 0.21671295166015625, 0.2232666015625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 8.0, 4.0, 6.0, 6.0, 5.0, 12.0, 16.0, 27.0, 69.0, 186.0, 728.0, 1046802.0, 393.0, 139.0, 61.0, 22.0, 20.0, 14.0, 6.0, 4.0, 2.0, 9.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.31640625, -6.13250732421875, -5.9486083984375, -5.76470947265625, -5.580810546875, -5.39691162109375, -5.2130126953125, -5.02911376953125, -4.84521484375, -4.66131591796875, -4.4774169921875, -4.29351806640625, -4.109619140625, -3.92572021484375, -3.7418212890625, -3.55792236328125, -3.3740234375, -3.19012451171875, -3.0062255859375, -2.82232666015625, -2.638427734375, -2.45452880859375, -2.2706298828125, -2.08673095703125, -1.90283203125, -1.71893310546875, -1.5350341796875, -1.35113525390625, -1.167236328125, -0.98333740234375, -0.7994384765625, -0.61553955078125, -0.431640625, -0.24774169921875, -0.0638427734375, 0.12005615234375, 0.303955078125, 0.48785400390625, 0.6717529296875, 0.85565185546875, 1.03955078125, 1.22344970703125, 1.4073486328125, 1.59124755859375, 1.775146484375, 1.95904541015625, 2.1429443359375, 2.32684326171875, 2.5107421875, 2.69464111328125, 2.8785400390625, 3.06243896484375, 3.246337890625, 3.43023681640625, 3.6141357421875, 3.79803466796875, 3.98193359375, 4.16583251953125, 4.3497314453125, 4.53363037109375, 4.717529296875, 4.90142822265625, 5.0853271484375, 5.26922607421875, 5.453125]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 341.0, 672.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5939745903015137, -0.5590887665748596, -0.5242029428482056, -0.4893171489238739, -0.45443132519721985, -0.4195455014705658, -0.38465970754623413, -0.3497738838195801, -0.314888060092926, -0.280002236366272, -0.2451164275407791, -0.21023061871528625, -0.1753447949886322, -0.14045897126197815, -0.10557316243648529, -0.07068735361099243, -0.03580152988433838, -0.0009157136082649231, 0.03397010266780853, 0.06885591894388199, 0.10374173521995544, 0.1386275589466095, 0.17351336777210236, 0.20839917659759521, 0.24328500032424927, 0.2781708240509033, 0.3130566477775574, 0.34794244170188904, 0.3828282654285431, 0.41771408915519714, 0.4525998830795288, 0.48748570680618286, 0.5223716497421265, 0.5572574734687805, 0.5921432971954346, 0.6270291209220886, 0.6619149446487427, 0.696800708770752, 0.731686532497406, 0.7665723562240601, 0.8014581799507141, 0.8363440036773682, 0.8712298274040222, 0.9061156511306763, 0.9410014152526855, 0.9758872985839844, 1.0107730627059937, 1.045658826828003, 1.0805447101593018, 1.115430474281311, 1.1503163576126099, 1.1852021217346191, 1.220088005065918, 1.2549737691879272, 1.289859652519226, 1.3247454166412354, 1.3596312999725342, 1.3945170640945435, 1.4294029474258423, 1.4642887115478516, 1.4991745948791504, 1.5340603590011597, 1.5689462423324585, 1.6038320064544678, 1.638717770576477]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 5.0, 0.0, 7.0, 5.0, 5.0, 7.0, 8.0, 9.0, 3.0, 10.0, 10.0, 15.0, 18.0, 20.0, 14.0, 20.0, 28.0, 14.0, 14.0, 34.0, 31.0, 36.0, 35.0, 35.0, 32.0, 35.0, 39.0, 32.0, 40.0, 30.0, 33.0, 38.0, 48.0, 37.0, 43.0, 33.0, 20.0, 22.0, 19.0, 17.0, 20.0, 7.0, 14.0, 15.0, 12.0, 6.0, 12.0, 4.0, 4.0, 3.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.15505623817443848, -0.14976215362548828, -0.1444680541753769, -0.1391739696264267, -0.1338798850774765, -0.1285857856273651, -0.12329170107841492, -0.11799761652946472, -0.11270352452993393, -0.10740943253040314, -0.10211534798145294, -0.09682125598192215, -0.09152716398239136, -0.08623307943344116, -0.08093898743391037, -0.07564489543437958, -0.07035081088542938, -0.06505671888589859, -0.059762634336948395, -0.0544685423374176, -0.04917445406317711, -0.043880365788936615, -0.03858627378940582, -0.03329218551516533, -0.027998097240924835, -0.02270400896668434, -0.0174099188297987, -0.012115828692913055, -0.006821740418672562, -0.0015276521444320679, 0.0037664398550987244, 0.009060528129339218, 0.014354616403579712, 0.019648704677820206, 0.02494279481470585, 0.03023688495159149, 0.035530973225831985, 0.04082506150007248, 0.04611915349960327, 0.051413241773843765, 0.05670733004808426, 0.06200141832232475, 0.06729550659656525, 0.07258959859609604, 0.07788369059562683, 0.08317777514457703, 0.08847186714410782, 0.09376595914363861, 0.0990600436925888, 0.1043541356921196, 0.1096482202410698, 0.11494231224060059, 0.12023639678955078, 0.12553048133850098, 0.13082458078861237, 0.13611866533756256, 0.14141276478767395, 0.14670684933662415, 0.15200094878673553, 0.15729503333568573, 0.16258911788463593, 0.16788321733474731, 0.1731773018836975, 0.1784713864326477, 0.1837654709815979]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 0.0, 1.0, 3.0, 4.0, 1.0, 8.0, 10.0, 4.0, 8.0, 5.0, 19.0, 16.0, 12.0, 20.0, 16.0, 20.0, 22.0, 22.0, 33.0, 27.0, 30.0, 39.0, 29.0, 29.0, 56.0, 30.0, 38.0, 29.0, 34.0, 46.0, 38.0, 36.0, 40.0, 23.0, 31.0, 24.0, 27.0, 25.0, 15.0, 20.0, 18.0, 14.0, 12.0, 13.0, 10.0, 16.0, 4.0, 5.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 4.0], "bins": [-1.4423828125, -1.40185546875, -1.361328125, -1.32080078125, -1.2802734375, -1.23974609375, -1.19921875, -1.15869140625, -1.1181640625, -1.07763671875, -1.037109375, -0.99658203125, -0.9560546875, -0.91552734375, -0.875, -0.83447265625, -0.7939453125, -0.75341796875, -0.712890625, -0.67236328125, -0.6318359375, -0.59130859375, -0.55078125, -0.51025390625, -0.4697265625, -0.42919921875, -0.388671875, -0.34814453125, -0.3076171875, -0.26708984375, -0.2265625, -0.18603515625, -0.1455078125, -0.10498046875, -0.064453125, -0.02392578125, 0.0166015625, 0.05712890625, 0.09765625, 0.13818359375, 0.1787109375, 0.21923828125, 0.259765625, 0.30029296875, 0.3408203125, 0.38134765625, 0.421875, 0.46240234375, 0.5029296875, 0.54345703125, 0.583984375, 0.62451171875, 0.6650390625, 0.70556640625, 0.74609375, 0.78662109375, 0.8271484375, 0.86767578125, 0.908203125, 0.94873046875, 0.9892578125, 1.02978515625, 1.0703125, 1.11083984375, 1.1513671875]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 3.0, 9.0, 8.0, 10.0, 13.0, 23.0, 22.0, 33.0, 48.0, 84.0, 82.0, 120.0, 133.0, 201.0, 273.0, 424.0, 583.0, 930.0, 1692.0, 3383.0, 7127.0, 15585.0, 35570.0, 80449.0, 174757.0, 307548.0, 225520.0, 105765.0, 47954.0, 20954.0, 9358.0, 4315.0, 2095.0, 1137.0, 673.0, 427.0, 325.0, 247.0, 166.0, 132.0, 104.0, 70.0, 54.0, 47.0, 33.0, 13.0, 24.0, 12.0, 11.0, 4.0, 4.0, 2.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7822265625, -1.7200775146484375, -1.657928466796875, -1.5957794189453125, -1.53363037109375, -1.4714813232421875, -1.409332275390625, -1.3471832275390625, -1.2850341796875, -1.2228851318359375, -1.160736083984375, -1.0985870361328125, -1.03643798828125, -0.9742889404296875, -0.912139892578125, -0.8499908447265625, -0.787841796875, -0.7256927490234375, -0.663543701171875, -0.6013946533203125, -0.53924560546875, -0.4770965576171875, -0.414947509765625, -0.3527984619140625, -0.2906494140625, -0.2285003662109375, -0.166351318359375, -0.1042022705078125, -0.04205322265625, 0.0200958251953125, 0.082244873046875, 0.1443939208984375, 0.20654296875, 0.2686920166015625, 0.330841064453125, 0.3929901123046875, 0.45513916015625, 0.5172882080078125, 0.579437255859375, 0.6415863037109375, 0.7037353515625, 0.7658843994140625, 0.828033447265625, 0.8901824951171875, 0.95233154296875, 1.0144805908203125, 1.076629638671875, 1.1387786865234375, 1.200927734375, 1.2630767822265625, 1.325225830078125, 1.3873748779296875, 1.44952392578125, 1.5116729736328125, 1.573822021484375, 1.6359710693359375, 1.6981201171875, 1.7602691650390625, 1.822418212890625, 1.8845672607421875, 1.94671630859375, 2.0088653564453125, 2.071014404296875, 2.1331634521484375, 2.1953125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 5.0, 8.0, 13.0, 11.0, 18.0, 18.0, 26.0, 29.0, 21.0, 31.0, 33.0, 44.0, 52.0, 55.0, 99.0, 169.0, 368.0, 1363.0, 169.0, 120.0, 63.0, 48.0, 38.0, 41.0, 40.0, 30.0, 20.0, 15.0, 18.0, 17.0, 13.0, 10.0, 8.0, 5.0, 7.0, 5.0, 2.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.78515625, -3.6630859375, -3.541015625, -3.4189453125, -3.296875, -3.1748046875, -3.052734375, -2.9306640625, -2.80859375, -2.6865234375, -2.564453125, -2.4423828125, -2.3203125, -2.1982421875, -2.076171875, -1.9541015625, -1.83203125, -1.7099609375, -1.587890625, -1.4658203125, -1.34375, -1.2216796875, -1.099609375, -0.9775390625, -0.85546875, -0.7333984375, -0.611328125, -0.4892578125, -0.3671875, -0.2451171875, -0.123046875, -0.0009765625, 0.12109375, 0.2431640625, 0.365234375, 0.4873046875, 0.609375, 0.7314453125, 0.853515625, 0.9755859375, 1.09765625, 1.2197265625, 1.341796875, 1.4638671875, 1.5859375, 1.7080078125, 1.830078125, 1.9521484375, 2.07421875, 2.1962890625, 2.318359375, 2.4404296875, 2.5625, 2.6845703125, 2.806640625, 2.9287109375, 3.05078125, 3.1728515625, 3.294921875, 3.4169921875, 3.5390625, 3.6611328125, 3.783203125, 3.9052734375, 4.02734375]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 8.0, 5.0, 6.0, 13.0, 11.0, 6.0, 17.0, 20.0, 37.0, 34.0, 48.0, 64.0, 77.0, 87.0, 97.0, 167.0, 211.0, 302.0, 400.0, 680.0, 1231.0, 5581.0, 2617989.0, 512628.0, 2810.0, 1015.0, 639.0, 363.0, 286.0, 193.0, 145.0, 124.0, 91.0, 71.0, 55.0, 45.0, 36.0, 23.0, 22.0, 16.0, 12.0, 11.0, 9.0, 5.0, 4.0, 3.0, 1.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.4765625, -9.169677734375, -8.86279296875, -8.555908203125, -8.2490234375, -7.942138671875, -7.63525390625, -7.328369140625, -7.021484375, -6.714599609375, -6.40771484375, -6.100830078125, -5.7939453125, -5.487060546875, -5.18017578125, -4.873291015625, -4.56640625, -4.259521484375, -3.95263671875, -3.645751953125, -3.3388671875, -3.031982421875, -2.72509765625, -2.418212890625, -2.111328125, -1.804443359375, -1.49755859375, -1.190673828125, -0.8837890625, -0.576904296875, -0.27001953125, 0.036865234375, 0.34375, 0.650634765625, 0.95751953125, 1.264404296875, 1.5712890625, 1.878173828125, 2.18505859375, 2.491943359375, 2.798828125, 3.105712890625, 3.41259765625, 3.719482421875, 4.0263671875, 4.333251953125, 4.64013671875, 4.947021484375, 5.25390625, 5.560791015625, 5.86767578125, 6.174560546875, 6.4814453125, 6.788330078125, 7.09521484375, 7.402099609375, 7.708984375, 8.015869140625, 8.32275390625, 8.629638671875, 8.9365234375, 9.243408203125, 9.55029296875, 9.857177734375, 10.1640625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 93.0, 920.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.67279052734375, -118.6240234375, -114.57525634765625, -110.5264892578125, -106.47772216796875, -102.428955078125, -98.38019561767578, -94.33142852783203, -90.28266143798828, -86.23389434814453, -82.18512725830078, -78.13636016845703, -74.08760070800781, -70.03883361816406, -65.99006652832031, -61.94129943847656, -57.89253234863281, -53.84376525878906, -49.79499816894531, -45.74623489379883, -41.69746780395508, -37.64870071411133, -33.599937438964844, -29.551170349121094, -25.502403259277344, -21.453636169433594, -17.404870986938477, -13.356104850769043, -9.30733871459961, -5.258571624755859, -1.2098064422607422, 2.838958740234375, 6.887725830078125, 10.936491966247559, 14.985258102416992, 19.03402328491211, 23.08279037475586, 27.13155746459961, 31.180322647094727, 35.229087829589844, 39.277854919433594, 43.326622009277344, 47.375389099121094, 51.42415237426758, 55.47291946411133, 59.52168655395508, 63.57044982910156, 67.61921691894531, 71.66798400878906, 75.71675109863281, 79.76551818847656, 83.81428527832031, 87.86305236816406, 91.91181945800781, 95.96057891845703, 100.00934600830078, 104.05811309814453, 108.10688018798828, 112.15564727783203, 116.20441436767578, 120.253173828125, 124.30194091796875, 128.3507080078125, 132.39947509765625, 136.4482421875]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 9.0, 7.0, 5.0, 6.0, 5.0, 8.0, 13.0, 17.0, 28.0, 21.0, 22.0, 19.0, 27.0, 29.0, 36.0, 31.0, 32.0, 42.0, 35.0, 35.0, 30.0, 43.0, 43.0, 36.0, 34.0, 28.0, 38.0, 36.0, 32.0, 30.0, 27.0, 23.0, 32.0, 21.0, 18.0, 19.0, 15.0, 12.0, 17.0, 8.0, 7.0, 6.0, 4.0, 0.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-10.070791244506836, -9.769468307495117, -9.468145370483398, -9.16682243347168, -8.865499496459961, -8.564176559448242, -8.262853622436523, -7.961531162261963, -7.660208225250244, -7.358885288238525, -7.057562351226807, -6.756239414215088, -6.454916954040527, -6.153594017028809, -5.85227108001709, -5.550948143005371, -5.249625205993652, -4.948302268981934, -4.646979331970215, -4.345656394958496, -4.044333457946777, -3.7430107593536377, -3.441688060760498, -3.1403651237487793, -2.8390421867370605, -2.537719249725342, -2.236396312713623, -1.9350736141204834, -1.6337506771087646, -1.332427740097046, -1.0311049222946167, -0.7297821044921875, -0.42845916748046875, -0.12713629007339478, 0.1741865873336792, 0.4755094647407532, 0.7768323421478271, 1.078155279159546, 1.379478096961975, 1.6808009147644043, 1.982123851776123, 2.283446788787842, 2.5847697257995605, 2.8860924243927, 3.187415361404419, 3.4887382984161377, 3.7900609970092773, 4.091383934020996, 4.392706871032715, 4.694029808044434, 4.995352745056152, 5.296675682067871, 5.59799861907959, 5.899321556091309, 6.200644016265869, 6.501966953277588, 6.803289890289307, 7.104612827301025, 7.405935764312744, 7.707258701324463, 8.008581161499023, 8.309904098510742, 8.611227035522461, 8.91254997253418, 9.213872909545898]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 4.0, 1.0, 4.0, 1.0, 3.0, 3.0, 4.0, 6.0, 9.0, 15.0, 7.0, 16.0, 13.0, 13.0, 28.0, 19.0, 31.0, 33.0, 33.0, 36.0, 32.0, 43.0, 34.0, 35.0, 47.0, 49.0, 47.0, 38.0, 40.0, 42.0, 35.0, 39.0, 39.0, 27.0, 32.0, 25.0, 19.0, 15.0, 18.0, 11.0, 10.0, 15.0, 14.0, 7.0, 6.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.65234375, -1.60577392578125, -1.5592041015625, -1.51263427734375, -1.466064453125, -1.41949462890625, -1.3729248046875, -1.32635498046875, -1.27978515625, -1.23321533203125, -1.1866455078125, -1.14007568359375, -1.093505859375, -1.04693603515625, -1.0003662109375, -0.95379638671875, -0.9072265625, -0.86065673828125, -0.8140869140625, -0.76751708984375, -0.720947265625, -0.67437744140625, -0.6278076171875, -0.58123779296875, -0.53466796875, -0.48809814453125, -0.4415283203125, -0.39495849609375, -0.348388671875, -0.30181884765625, -0.2552490234375, -0.20867919921875, -0.162109375, -0.11553955078125, -0.0689697265625, -0.02239990234375, 0.024169921875, 0.07073974609375, 0.1173095703125, 0.16387939453125, 0.21044921875, 0.25701904296875, 0.3035888671875, 0.35015869140625, 0.396728515625, 0.44329833984375, 0.4898681640625, 0.53643798828125, 0.5830078125, 0.62957763671875, 0.6761474609375, 0.72271728515625, 0.769287109375, 0.81585693359375, 0.8624267578125, 0.90899658203125, 0.95556640625, 1.00213623046875, 1.0487060546875, 1.09527587890625, 1.141845703125, 1.18841552734375, 1.2349853515625, 1.28155517578125, 1.328125]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 6.0, 7.0, 12.0, 11.0, 31.0, 25.0, 28.0, 40.0, 74.0, 84.0, 97.0, 144.0, 181.0, 316.0, 512.0, 951.0, 1974.0, 4325.0, 11729.0, 45848.0, 406649.0, 2588967.0, 1004016.0, 98024.0, 18571.0, 6148.0, 2538.0, 1126.0, 629.0, 369.0, 229.0, 160.0, 110.0, 95.0, 67.0, 44.0, 39.0, 29.0, 15.0, 19.0, 8.0, 10.0, 4.0, 4.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.4609375, -3.348175048828125, -3.23541259765625, -3.122650146484375, -3.0098876953125, -2.897125244140625, -2.78436279296875, -2.671600341796875, -2.558837890625, -2.446075439453125, -2.33331298828125, -2.220550537109375, -2.1077880859375, -1.995025634765625, -1.88226318359375, -1.769500732421875, -1.65673828125, -1.543975830078125, -1.43121337890625, -1.318450927734375, -1.2056884765625, -1.092926025390625, -0.98016357421875, -0.867401123046875, -0.754638671875, -0.641876220703125, -0.52911376953125, -0.416351318359375, -0.3035888671875, -0.190826416015625, -0.07806396484375, 0.034698486328125, 0.1474609375, 0.260223388671875, 0.37298583984375, 0.485748291015625, 0.5985107421875, 0.711273193359375, 0.82403564453125, 0.936798095703125, 1.049560546875, 1.162322998046875, 1.27508544921875, 1.387847900390625, 1.5006103515625, 1.613372802734375, 1.72613525390625, 1.838897705078125, 1.95166015625, 2.064422607421875, 2.17718505859375, 2.289947509765625, 2.4027099609375, 2.515472412109375, 2.62823486328125, 2.740997314453125, 2.853759765625, 2.966522216796875, 3.07928466796875, 3.192047119140625, 3.3048095703125, 3.417572021484375, 3.53033447265625, 3.643096923828125, 3.755859375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 8.0, 8.0, 16.0, 21.0, 46.0, 68.0, 121.0, 197.0, 295.0, 558.0, 782.0, 722.0, 449.0, 274.0, 186.0, 130.0, 56.0, 57.0, 35.0, 12.0, 9.0, 5.0, 8.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.85546875, -2.73016357421875, -2.6048583984375, -2.47955322265625, -2.354248046875, -2.22894287109375, -2.1036376953125, -1.97833251953125, -1.85302734375, -1.72772216796875, -1.6024169921875, -1.47711181640625, -1.351806640625, -1.22650146484375, -1.1011962890625, -0.97589111328125, -0.8505859375, -0.72528076171875, -0.5999755859375, -0.47467041015625, -0.349365234375, -0.22406005859375, -0.0987548828125, 0.02655029296875, 0.15185546875, 0.27716064453125, 0.4024658203125, 0.52777099609375, 0.653076171875, 0.77838134765625, 0.9036865234375, 1.02899169921875, 1.154296875, 1.27960205078125, 1.4049072265625, 1.53021240234375, 1.655517578125, 1.78082275390625, 1.9061279296875, 2.03143310546875, 2.15673828125, 2.28204345703125, 2.4073486328125, 2.53265380859375, 2.657958984375, 2.78326416015625, 2.9085693359375, 3.03387451171875, 3.1591796875, 3.28448486328125, 3.4097900390625, 3.53509521484375, 3.660400390625, 3.78570556640625, 3.9110107421875, 4.03631591796875, 4.16162109375, 4.28692626953125, 4.4122314453125, 4.53753662109375, 4.662841796875, 4.78814697265625, 4.9134521484375, 5.03875732421875, 5.1640625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 9.0, 12.0, 18.0, 46.0, 167.0, 743.0, 32605.0, 4144838.0, 15077.0, 574.0, 134.0, 36.0, 16.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.59375, -24.000244140625, -23.40673828125, -22.813232421875, -22.2197265625, -21.626220703125, -21.03271484375, -20.439208984375, -19.845703125, -19.252197265625, -18.65869140625, -18.065185546875, -17.4716796875, -16.878173828125, -16.28466796875, -15.691162109375, -15.09765625, -14.504150390625, -13.91064453125, -13.317138671875, -12.7236328125, -12.130126953125, -11.53662109375, -10.943115234375, -10.349609375, -9.756103515625, -9.16259765625, -8.569091796875, -7.9755859375, -7.382080078125, -6.78857421875, -6.195068359375, -5.6015625, -5.008056640625, -4.41455078125, -3.821044921875, -3.2275390625, -2.634033203125, -2.04052734375, -1.447021484375, -0.853515625, -0.260009765625, 0.33349609375, 0.927001953125, 1.5205078125, 2.114013671875, 2.70751953125, 3.301025390625, 3.89453125, 4.488037109375, 5.08154296875, 5.675048828125, 6.2685546875, 6.862060546875, 7.45556640625, 8.049072265625, 8.642578125, 9.236083984375, 9.82958984375, 10.423095703125, 11.0166015625, 11.610107421875, 12.20361328125, 12.797119140625, 13.390625]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 11.0, 269.0, 648.0, 84.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.05596160888672, -121.72831726074219, -119.40068054199219, -117.07303619384766, -114.74539947509766, -112.41775512695312, -110.09011840820312, -107.7624740600586, -105.43482971191406, -103.10718536376953, -100.77954864501953, -98.451904296875, -96.124267578125, -93.79662322998047, -91.46897888183594, -89.14134216308594, -86.81370544433594, -84.4860610961914, -82.1584243774414, -79.83078002929688, -77.50314331054688, -75.17549896240234, -72.84785461425781, -70.52021789550781, -68.19257354736328, -65.86492919921875, -63.53729248046875, -61.20964813232422, -58.88200759887695, -56.55436706542969, -54.22672653198242, -51.899085998535156, -49.571441650390625, -47.24380111694336, -44.916160583496094, -42.58851623535156, -40.2608757019043, -37.93323516845703, -35.605594635009766, -33.2779541015625, -30.9503116607666, -28.622671127319336, -26.295028686523438, -23.967388153076172, -21.639747619628906, -19.312105178833008, -16.984464645385742, -14.656822204589844, -12.329181671142578, -10.001540184020996, -7.673899173736572, -5.346258163452148, -3.0186166763305664, -0.6909751892089844, 1.6366653442382812, 3.9643077850341797, 6.291948318481445, 8.619589805603027, 10.94723129272461, 13.274871826171875, 15.602513313293457, 17.93015480041504, 20.257795333862305, 22.585437774658203, 24.91307830810547]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 6.0, 3.0, 7.0, 10.0, 10.0, 12.0, 28.0, 13.0, 30.0, 33.0, 43.0, 42.0, 47.0, 47.0, 55.0, 55.0, 53.0, 62.0, 48.0, 55.0, 59.0, 38.0, 28.0, 41.0, 41.0, 39.0, 20.0, 16.0, 11.0, 12.0, 16.0, 12.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.12341022491455, -8.730704307556152, -8.337998390197754, -7.945292949676514, -7.552587509155273, -7.159881591796875, -6.767175674438477, -6.374469757080078, -5.981764316558838, -5.5890583992004395, -5.196352958679199, -4.803647041320801, -4.410941123962402, -4.018235683441162, -3.6255297660827637, -3.2328240871429443, -2.840118408203125, -2.4474127292633057, -2.0547070503234863, -1.662001132965088, -1.2692954540252686, -0.8765897750854492, -0.4838838577270508, -0.09117817878723145, 0.3015275001525879, 0.694233238697052, 1.0869389772415161, 1.479644775390625, 1.8723504543304443, 2.2650561332702637, 2.657762050628662, 3.0504677295684814, 3.443174362182617, 3.8358800411224365, 4.228585720062256, 4.621291637420654, 5.0139970779418945, 5.406702995300293, 5.799408912658691, 6.19211483001709, 6.58482027053833, 6.9775261878967285, 7.370231628417969, 7.762937545776367, 8.155643463134766, 8.548349380493164, 8.941055297851562, 9.333760261535645, 9.726466178894043, 10.119172096252441, 10.51187801361084, 10.904582977294922, 11.29728889465332, 11.689994812011719, 12.082700729370117, 12.475406646728516, 12.868112564086914, 13.260818481445312, 13.653524398803711, 14.04623031616211, 14.438935279846191, 14.83164119720459, 15.224347114562988, 15.617053031921387, 16.00975799560547]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0, 6.0, 4.0, 3.0, 10.0, 8.0, 16.0, 6.0, 6.0, 13.0, 26.0, 17.0, 27.0, 19.0, 28.0, 30.0, 36.0, 35.0, 34.0, 30.0, 41.0, 40.0, 43.0, 45.0, 33.0, 40.0, 47.0, 41.0, 36.0, 38.0, 25.0, 27.0, 25.0, 28.0, 17.0, 19.0, 16.0, 13.0, 14.0, 10.0, 10.0, 8.0, 8.0, 12.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.271484375, -1.230499267578125, -1.18951416015625, -1.148529052734375, -1.1075439453125, -1.066558837890625, -1.02557373046875, -0.984588623046875, -0.943603515625, -0.902618408203125, -0.86163330078125, -0.820648193359375, -0.7796630859375, -0.738677978515625, -0.69769287109375, -0.656707763671875, -0.61572265625, -0.574737548828125, -0.53375244140625, -0.492767333984375, -0.4517822265625, -0.410797119140625, -0.36981201171875, -0.328826904296875, -0.287841796875, -0.246856689453125, -0.20587158203125, -0.164886474609375, -0.1239013671875, -0.082916259765625, -0.04193115234375, -0.000946044921875, 0.0400390625, 0.081024169921875, 0.12200927734375, 0.162994384765625, 0.2039794921875, 0.244964599609375, 0.28594970703125, 0.326934814453125, 0.367919921875, 0.408905029296875, 0.44989013671875, 0.490875244140625, 0.5318603515625, 0.572845458984375, 0.61383056640625, 0.654815673828125, 0.69580078125, 0.736785888671875, 0.77777099609375, 0.818756103515625, 0.8597412109375, 0.900726318359375, 0.94171142578125, 0.982696533203125, 1.023681640625, 1.064666748046875, 1.10565185546875, 1.146636962890625, 1.1876220703125, 1.228607177734375, 1.26959228515625, 1.310577392578125, 1.3515625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 3.0, 7.0, 13.0, 26.0, 14.0, 36.0, 41.0, 68.0, 80.0, 107.0, 170.0, 213.0, 304.0, 475.0, 646.0, 918.0, 1261.0, 1809.0, 2427.0, 3720.0, 5878.0, 47929.0, 873644.0, 88949.0, 6744.0, 3961.0, 2589.0, 1899.0, 1266.0, 1011.0, 687.0, 492.0, 337.0, 227.0, 157.0, 132.0, 94.0, 51.0, 49.0, 35.0, 23.0, 15.0, 13.0, 13.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.3525390625, -1.3110198974609375, -1.269500732421875, -1.2279815673828125, -1.18646240234375, -1.1449432373046875, -1.103424072265625, -1.0619049072265625, -1.0203857421875, -0.9788665771484375, -0.937347412109375, -0.8958282470703125, -0.85430908203125, -0.8127899169921875, -0.771270751953125, -0.7297515869140625, -0.688232421875, -0.6467132568359375, -0.605194091796875, -0.5636749267578125, -0.52215576171875, -0.4806365966796875, -0.439117431640625, -0.3975982666015625, -0.3560791015625, -0.3145599365234375, -0.273040771484375, -0.2315216064453125, -0.19000244140625, -0.1484832763671875, -0.106964111328125, -0.0654449462890625, -0.02392578125, 0.0175933837890625, 0.059112548828125, 0.1006317138671875, 0.14215087890625, 0.1836700439453125, 0.225189208984375, 0.2667083740234375, 0.3082275390625, 0.3497467041015625, 0.391265869140625, 0.4327850341796875, 0.47430419921875, 0.5158233642578125, 0.557342529296875, 0.5988616943359375, 0.640380859375, 0.6819000244140625, 0.723419189453125, 0.7649383544921875, 0.80645751953125, 0.8479766845703125, 0.889495849609375, 0.9310150146484375, 0.9725341796875, 1.0140533447265625, 1.055572509765625, 1.0970916748046875, 1.13861083984375, 1.1801300048828125, 1.221649169921875, 1.2631683349609375, 1.3046875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 4.0, 13.0, 10.0, 22.0, 14.0, 19.0, 21.0, 26.0, 20.0, 26.0, 41.0, 43.0, 36.0, 37.0, 44.0, 46.0, 49.0, 1072.0, 52.0, 38.0, 40.0, 41.0, 26.0, 44.0, 40.0, 34.0, 29.0, 19.0, 25.0, 16.0, 15.0, 6.0, 12.0, 7.0, 8.0, 8.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.099609375, -1.0654144287109375, -1.031219482421875, -0.9970245361328125, -0.96282958984375, -0.9286346435546875, -0.894439697265625, -0.8602447509765625, -0.8260498046875, -0.7918548583984375, -0.757659912109375, -0.7234649658203125, -0.68927001953125, -0.6550750732421875, -0.620880126953125, -0.5866851806640625, -0.552490234375, -0.5182952880859375, -0.484100341796875, -0.4499053955078125, -0.41571044921875, -0.3815155029296875, -0.347320556640625, -0.3131256103515625, -0.2789306640625, -0.2447357177734375, -0.210540771484375, -0.1763458251953125, -0.14215087890625, -0.1079559326171875, -0.073760986328125, -0.0395660400390625, -0.00537109375, 0.0288238525390625, 0.063018798828125, 0.0972137451171875, 0.13140869140625, 0.1656036376953125, 0.199798583984375, 0.2339935302734375, 0.2681884765625, 0.3023834228515625, 0.336578369140625, 0.3707733154296875, 0.40496826171875, 0.4391632080078125, 0.473358154296875, 0.5075531005859375, 0.541748046875, 0.5759429931640625, 0.610137939453125, 0.6443328857421875, 0.67852783203125, 0.7127227783203125, 0.746917724609375, 0.7811126708984375, 0.8153076171875, 0.8495025634765625, 0.883697509765625, 0.9178924560546875, 0.95208740234375, 0.9862823486328125, 1.020477294921875, 1.0546722412109375, 1.0888671875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 5.0, 4.0, 3.0, 12.0, 8.0, 13.0, 15.0, 28.0, 34.0, 52.0, 44.0, 75.0, 96.0, 117.0, 187.0, 248.0, 375.0, 526.0, 854.0, 1381.0, 2367.0, 4700.0, 14953.0, 2040549.0, 18202.0, 5449.0, 2514.0, 1369.0, 874.0, 609.0, 402.0, 276.0, 225.0, 177.0, 119.0, 78.0, 48.0, 42.0, 21.0, 26.0, 9.0, 18.0, 11.0, 8.0, 5.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-3.615234375, -3.50067138671875, -3.3861083984375, -3.27154541015625, -3.156982421875, -3.04241943359375, -2.9278564453125, -2.81329345703125, -2.69873046875, -2.58416748046875, -2.4696044921875, -2.35504150390625, -2.240478515625, -2.12591552734375, -2.0113525390625, -1.89678955078125, -1.7822265625, -1.66766357421875, -1.5531005859375, -1.43853759765625, -1.323974609375, -1.20941162109375, -1.0948486328125, -0.98028564453125, -0.86572265625, -0.75115966796875, -0.6365966796875, -0.52203369140625, -0.407470703125, -0.29290771484375, -0.1783447265625, -0.06378173828125, 0.05078125, 0.16534423828125, 0.2799072265625, 0.39447021484375, 0.509033203125, 0.62359619140625, 0.7381591796875, 0.85272216796875, 0.96728515625, 1.08184814453125, 1.1964111328125, 1.31097412109375, 1.425537109375, 1.54010009765625, 1.6546630859375, 1.76922607421875, 1.8837890625, 1.99835205078125, 2.1129150390625, 2.22747802734375, 2.342041015625, 2.45660400390625, 2.5711669921875, 2.68572998046875, 2.80029296875, 2.91485595703125, 3.0294189453125, 3.14398193359375, 3.258544921875, 3.37310791015625, 3.4876708984375, 3.60223388671875, 3.716796875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 4.0, 3.0, 4.0, 0.0, 1.0, 6.0, 5.0, 24.0, 289.0, 604.0, 41.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.413818359375, -0.4013175964355469, -0.38881683349609375, -0.3763160705566406, -0.3638153076171875, -0.3513145446777344, -0.33881378173828125, -0.3263130187988281, -0.313812255859375, -0.3013114929199219, -0.28881072998046875, -0.2763099670410156, -0.2638092041015625, -0.2513084411621094, -0.23880767822265625, -0.22630691528320312, -0.21380615234375, -0.20130538940429688, -0.18880462646484375, -0.17630386352539062, -0.1638031005859375, -0.15130233764648438, -0.13880157470703125, -0.12630081176757812, -0.113800048828125, -0.10129928588867188, -0.08879852294921875, -0.07629776000976562, -0.0637969970703125, -0.051296234130859375, -0.03879547119140625, -0.026294708251953125, -0.0137939453125, -0.001293182373046875, 0.01120758056640625, 0.023708343505859375, 0.0362091064453125, 0.048709869384765625, 0.06121063232421875, 0.07371139526367188, 0.086212158203125, 0.09871292114257812, 0.11121368408203125, 0.12371444702148438, 0.1362152099609375, 0.14871597290039062, 0.16121673583984375, 0.17371749877929688, 0.18621826171875, 0.19871902465820312, 0.21121978759765625, 0.22372055053710938, 0.2362213134765625, 0.24872207641601562, 0.26122283935546875, 0.2737236022949219, 0.286224365234375, 0.2987251281738281, 0.31122589111328125, 0.3237266540527344, 0.3362274169921875, 0.3487281799316406, 0.36122894287109375, 0.3737297058105469, 0.38623046875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 5.0, 10.0, 9.0, 15.0, 30.0, 121.0, 306758.0, 741361.0, 95.0, 40.0, 24.0, 6.0, 7.0, 10.0, 10.0, 4.0, 6.0, 4.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.8515625, -8.5660400390625, -8.280517578125, -7.9949951171875, -7.70947265625, -7.4239501953125, -7.138427734375, -6.8529052734375, -6.5673828125, -6.2818603515625, -5.996337890625, -5.7108154296875, -5.42529296875, -5.1397705078125, -4.854248046875, -4.5687255859375, -4.283203125, -3.9976806640625, -3.712158203125, -3.4266357421875, -3.14111328125, -2.8555908203125, -2.570068359375, -2.2845458984375, -1.9990234375, -1.7135009765625, -1.427978515625, -1.1424560546875, -0.85693359375, -0.5714111328125, -0.285888671875, -0.0003662109375, 0.28515625, 0.5706787109375, 0.856201171875, 1.1417236328125, 1.42724609375, 1.7127685546875, 1.998291015625, 2.2838134765625, 2.5693359375, 2.8548583984375, 3.140380859375, 3.4259033203125, 3.71142578125, 3.9969482421875, 4.282470703125, 4.5679931640625, 4.853515625, 5.1390380859375, 5.424560546875, 5.7100830078125, 5.99560546875, 6.2811279296875, 6.566650390625, 6.8521728515625, 7.1376953125, 7.4232177734375, 7.708740234375, 7.9942626953125, 8.27978515625, 8.5653076171875, 8.850830078125, 9.1363525390625, 9.421875]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 185.0, 830.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7565092444419861, -0.672991156578064, -0.5894731283187866, -0.5059551000595093, -0.42243701219558716, -0.3389189541339874, -0.2554008960723877, -0.17188280820846558, -0.08836477994918823, -0.004846721887588501, 0.07867133617401123, 0.16218939423561096, 0.2457074522972107, 0.3292255103588104, 0.41274356842041016, 0.4962616562843323, 0.5797796845436096, 0.6632977724075317, 0.7468158006668091, 0.8303338289260864, 0.9138519167900085, 0.9973700046539307, 1.080888032913208, 1.1644060611724854, 1.2479240894317627, 1.33144211769104, 1.4149601459503174, 1.4984782934188843, 1.5819963216781616, 1.665514349937439, 1.7490324974060059, 1.8325505256652832, 1.9160685539245605, 1.999586582183838, 2.0831046104431152, 2.1666226387023926, 2.25014066696167, 2.3336589336395264, 2.4171769618988037, 2.500694990158081, 2.5842130184173584, 2.6677310466766357, 2.751249074935913, 2.8347671031951904, 2.918285369873047, 3.001803398132324, 3.0853214263916016, 3.168839454650879, 3.2523574829101562, 3.3358755111694336, 3.419393539428711, 3.5029115676879883, 3.5864295959472656, 3.669947862625122, 3.7534658908843994, 3.8369839191436768, 3.920501947402954, 4.0040202140808105, 4.087538242340088, 4.171056270599365, 4.254574298858643, 4.33809232711792, 4.421610355377197, 4.505128383636475, 4.588646411895752]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 9.0, 7.0, 10.0, 7.0, 8.0, 20.0, 16.0, 17.0, 30.0, 29.0, 46.0, 39.0, 24.0, 42.0, 40.0, 44.0, 41.0, 46.0, 51.0, 34.0, 47.0, 45.0, 43.0, 53.0, 31.0, 30.0, 24.0, 25.0, 21.0, 22.0, 19.0, 21.0, 9.0, 6.0, 11.0, 7.0, 4.0, 5.0, 6.0, 7.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20082080364227295, -0.19466346502304077, -0.1885061264038086, -0.18234878778457642, -0.17619144916534424, -0.17003411054611206, -0.16387677192687988, -0.1577194333076477, -0.15156209468841553, -0.14540475606918335, -0.13924741744995117, -0.133090078830719, -0.12693274021148682, -0.12077540159225464, -0.11461806297302246, -0.10846072435379028, -0.1023033857345581, -0.09614604711532593, -0.08998870849609375, -0.08383136987686157, -0.0776740312576294, -0.07151669263839722, -0.06535935401916504, -0.05920201539993286, -0.053044676780700684, -0.046887338161468506, -0.04072999954223633, -0.03457266092300415, -0.028415322303771973, -0.022257983684539795, -0.016100645065307617, -0.00994330644607544, -0.0037859678268432617, 0.002371370792388916, 0.008528709411621094, 0.014686048030853271, 0.02084338665008545, 0.027000725269317627, 0.033158063888549805, 0.03931540250778198, 0.04547274112701416, 0.05163007974624634, 0.057787418365478516, 0.0639447569847107, 0.07010209560394287, 0.07625943422317505, 0.08241677284240723, 0.0885741114616394, 0.09473145008087158, 0.10088878870010376, 0.10704612731933594, 0.11320346593856812, 0.11936080455780029, 0.12551814317703247, 0.13167548179626465, 0.13783282041549683, 0.143990159034729, 0.15014749765396118, 0.15630483627319336, 0.16246217489242554, 0.16861951351165771, 0.1747768521308899, 0.18093419075012207, 0.18709152936935425, 0.19324886798858643]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 4.0, 3.0, 1.0, 6.0, 3.0, 3.0, 10.0, 8.0, 16.0, 7.0, 7.0, 11.0, 28.0, 16.0, 26.0, 19.0, 25.0, 35.0, 35.0, 37.0, 27.0, 39.0, 34.0, 43.0, 44.0, 43.0, 36.0, 39.0, 51.0, 39.0, 32.0, 41.0, 26.0, 24.0, 26.0, 27.0, 20.0, 16.0, 17.0, 13.0, 14.0, 8.0, 12.0, 7.0, 10.0, 11.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2763671875, -1.2352142333984375, -1.194061279296875, -1.1529083251953125, -1.11175537109375, -1.0706024169921875, -1.029449462890625, -0.9882965087890625, -0.9471435546875, -0.9059906005859375, -0.864837646484375, -0.8236846923828125, -0.78253173828125, -0.7413787841796875, -0.700225830078125, -0.6590728759765625, -0.617919921875, -0.5767669677734375, -0.535614013671875, -0.4944610595703125, -0.45330810546875, -0.4121551513671875, -0.371002197265625, -0.3298492431640625, -0.2886962890625, -0.2475433349609375, -0.206390380859375, -0.1652374267578125, -0.12408447265625, -0.0829315185546875, -0.041778564453125, -0.0006256103515625, 0.04052734375, 0.0816802978515625, 0.122833251953125, 0.1639862060546875, 0.20513916015625, 0.2462921142578125, 0.287445068359375, 0.3285980224609375, 0.3697509765625, 0.4109039306640625, 0.452056884765625, 0.4932098388671875, 0.53436279296875, 0.5755157470703125, 0.616668701171875, 0.6578216552734375, 0.698974609375, 0.7401275634765625, 0.781280517578125, 0.8224334716796875, 0.86358642578125, 0.9047393798828125, 0.945892333984375, 0.9870452880859375, 1.0281982421875, 1.0693511962890625, 1.110504150390625, 1.1516571044921875, 1.19281005859375, 1.2339630126953125, 1.275115966796875, 1.3162689208984375, 1.357421875]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 7.0, 11.0, 5.0, 16.0, 15.0, 20.0, 40.0, 43.0, 68.0, 85.0, 111.0, 155.0, 227.0, 286.0, 363.0, 518.0, 682.0, 1071.0, 1674.0, 2819.0, 5947.0, 14024.0, 38111.0, 115221.0, 398912.0, 319508.0, 93216.0, 31083.0, 11644.0, 5101.0, 2610.0, 1529.0, 964.0, 683.0, 472.0, 352.0, 222.0, 190.0, 120.0, 103.0, 79.0, 64.0, 40.0, 55.0, 20.0, 20.0, 16.0, 12.0, 10.0, 7.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0], "bins": [-2.283203125, -2.211639404296875, -2.14007568359375, -2.068511962890625, -1.9969482421875, -1.925384521484375, -1.85382080078125, -1.782257080078125, -1.710693359375, -1.639129638671875, -1.56756591796875, -1.496002197265625, -1.4244384765625, -1.352874755859375, -1.28131103515625, -1.209747314453125, -1.13818359375, -1.066619873046875, -0.99505615234375, -0.923492431640625, -0.8519287109375, -0.780364990234375, -0.70880126953125, -0.637237548828125, -0.565673828125, -0.494110107421875, -0.42254638671875, -0.350982666015625, -0.2794189453125, -0.207855224609375, -0.13629150390625, -0.064727783203125, 0.0068359375, 0.078399658203125, 0.14996337890625, 0.221527099609375, 0.2930908203125, 0.364654541015625, 0.43621826171875, 0.507781982421875, 0.579345703125, 0.650909423828125, 0.72247314453125, 0.794036865234375, 0.8656005859375, 0.937164306640625, 1.00872802734375, 1.080291748046875, 1.15185546875, 1.223419189453125, 1.29498291015625, 1.366546630859375, 1.4381103515625, 1.509674072265625, 1.58123779296875, 1.652801513671875, 1.724365234375, 1.795928955078125, 1.86749267578125, 1.939056396484375, 2.0106201171875, 2.082183837890625, 2.15374755859375, 2.225311279296875, 2.296875]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 12.0, 14.0, 10.0, 13.0, 10.0, 16.0, 18.0, 21.0, 26.0, 24.0, 36.0, 26.0, 39.0, 45.0, 49.0, 50.0, 120.0, 227.0, 1420.0, 275.0, 124.0, 88.0, 46.0, 44.0, 56.0, 29.0, 21.0, 33.0, 17.0, 24.0, 14.0, 19.0, 14.0, 12.0, 10.0, 7.0, 8.0, 8.0, 7.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.958984375, -2.868560791015625, -2.77813720703125, -2.687713623046875, -2.5972900390625, -2.506866455078125, -2.41644287109375, -2.326019287109375, -2.235595703125, -2.145172119140625, -2.05474853515625, -1.964324951171875, -1.8739013671875, -1.783477783203125, -1.69305419921875, -1.602630615234375, -1.51220703125, -1.421783447265625, -1.33135986328125, -1.240936279296875, -1.1505126953125, -1.060089111328125, -0.96966552734375, -0.879241943359375, -0.788818359375, -0.698394775390625, -0.60797119140625, -0.517547607421875, -0.4271240234375, -0.336700439453125, -0.24627685546875, -0.155853271484375, -0.0654296875, 0.024993896484375, 0.11541748046875, 0.205841064453125, 0.2962646484375, 0.386688232421875, 0.47711181640625, 0.567535400390625, 0.657958984375, 0.748382568359375, 0.83880615234375, 0.929229736328125, 1.0196533203125, 1.110076904296875, 1.20050048828125, 1.290924072265625, 1.38134765625, 1.471771240234375, 1.56219482421875, 1.652618408203125, 1.7430419921875, 1.833465576171875, 1.92388916015625, 2.014312744140625, 2.104736328125, 2.195159912109375, 2.28558349609375, 2.376007080078125, 2.4664306640625, 2.556854248046875, 2.64727783203125, 2.737701416015625, 2.828125]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 7.0, 8.0, 10.0, 9.0, 14.0, 16.0, 18.0, 24.0, 37.0, 32.0, 51.0, 96.0, 114.0, 169.0, 203.0, 277.0, 426.0, 650.0, 1303.0, 3172.0, 75369.0, 3044927.0, 13664.0, 2117.0, 1039.0, 588.0, 374.0, 262.0, 191.0, 122.0, 95.0, 81.0, 64.0, 47.0, 31.0, 26.0, 19.0, 19.0, 6.0, 10.0, 3.0, 12.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.03125, -7.7664794921875, -7.501708984375, -7.2369384765625, -6.97216796875, -6.7073974609375, -6.442626953125, -6.1778564453125, -5.9130859375, -5.6483154296875, -5.383544921875, -5.1187744140625, -4.85400390625, -4.5892333984375, -4.324462890625, -4.0596923828125, -3.794921875, -3.5301513671875, -3.265380859375, -3.0006103515625, -2.73583984375, -2.4710693359375, -2.206298828125, -1.9415283203125, -1.6767578125, -1.4119873046875, -1.147216796875, -0.8824462890625, -0.61767578125, -0.3529052734375, -0.088134765625, 0.1766357421875, 0.44140625, 0.7061767578125, 0.970947265625, 1.2357177734375, 1.50048828125, 1.7652587890625, 2.030029296875, 2.2947998046875, 2.5595703125, 2.8243408203125, 3.089111328125, 3.3538818359375, 3.61865234375, 3.8834228515625, 4.148193359375, 4.4129638671875, 4.677734375, 4.9425048828125, 5.207275390625, 5.4720458984375, 5.73681640625, 6.0015869140625, 6.266357421875, 6.5311279296875, 6.7958984375, 7.0606689453125, 7.325439453125, 7.5902099609375, 7.85498046875, 8.1197509765625, 8.384521484375, 8.6492919921875, 8.9140625]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 12.0, 37.0, 104.0, 237.0, 288.0, 201.0, 88.0, 33.0, 8.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.86227798461914, -30.184303283691406, -29.506328582763672, -28.828353881835938, -28.150379180908203, -27.47240447998047, -26.794429779052734, -26.116453170776367, -25.438478469848633, -24.7605037689209, -24.082529067993164, -23.40455436706543, -22.726579666137695, -22.048603057861328, -21.370628356933594, -20.69265365600586, -20.014678955078125, -19.33670425415039, -18.658729553222656, -17.980754852294922, -17.302780151367188, -16.624805450439453, -15.946829795837402, -15.268854141235352, -14.59088134765625, -13.912906646728516, -13.234931945800781, -12.556957244873047, -11.878981590270996, -11.201006889343262, -10.523032188415527, -9.845056533813477, -9.167082786560059, -8.489108085632324, -7.811132907867432, -7.133158206939697, -6.455183029174805, -5.77720832824707, -5.099233627319336, -4.421258449554443, -3.743283748626709, -3.0653088092803955, -2.387333869934082, -1.7093591690063477, -1.0313842296600342, -0.3534092903137207, 0.32456541061401367, 1.0025405883789062, 1.6805152893066406, 2.358490228652954, 3.0364651679992676, 3.714439868927002, 4.3924150466918945, 5.070389747619629, 5.748364448547363, 6.426339626312256, 7.10431432723999, 7.782289028167725, 8.460264205932617, 9.138238906860352, 9.816213607788086, 10.49418830871582, 11.172163009643555, 11.850138664245605, 12.52811336517334]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 5.0, 16.0, 5.0, 18.0, 15.0, 14.0, 20.0, 22.0, 29.0, 23.0, 27.0, 24.0, 24.0, 42.0, 37.0, 33.0, 36.0, 45.0, 46.0, 36.0, 32.0, 41.0, 43.0, 30.0, 34.0, 41.0, 24.0, 18.0, 34.0, 26.0, 23.0, 25.0, 20.0, 21.0, 21.0, 13.0, 8.0, 5.0, 5.0, 3.0, 6.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.582674026489258, -8.318626403808594, -8.05457878112793, -7.790531158447266, -7.526483535766602, -7.2624359130859375, -6.998387813568115, -6.734340190887451, -6.470292568206787, -6.206244945526123, -5.942197322845459, -5.678149700164795, -5.414101600646973, -5.150053977966309, -4.8860063552856445, -4.6219587326049805, -4.357911109924316, -4.093863487243652, -3.8298158645629883, -3.565768003463745, -3.301720380783081, -3.037672758102417, -2.773624897003174, -2.5095772743225098, -2.2455296516418457, -1.9814820289611816, -1.717434287071228, -1.4533865451812744, -1.1893389225006104, -0.9252912998199463, -0.6612435579299927, -0.39719581604003906, -0.1331491470336914, 0.13089853525161743, 0.39494621753692627, 0.6589938998222351, 0.923041582107544, 1.187089204788208, 1.4511369466781616, 1.7151846885681152, 1.9792323112487793, 2.2432799339294434, 2.5073275566101074, 2.7713754177093506, 3.0354230403900146, 3.2994706630706787, 3.563518524169922, 3.827566146850586, 4.09161376953125, 4.355661392211914, 4.619709014892578, 4.883756637573242, 5.147804260253906, 5.41185188293457, 5.675899982452393, 5.939947605133057, 6.203995227813721, 6.468042850494385, 6.732090473175049, 6.996138095855713, 7.260186195373535, 7.524233818054199, 7.788281440734863, 8.052329063415527, 8.316376686096191]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [5.0, 0.0, 2.0, 1.0, 4.0, 0.0, 4.0, 3.0, 6.0, 3.0, 1.0, 6.0, 4.0, 4.0, 8.0, 14.0, 10.0, 13.0, 17.0, 18.0, 25.0, 19.0, 31.0, 35.0, 36.0, 28.0, 26.0, 33.0, 32.0, 47.0, 37.0, 33.0, 42.0, 47.0, 45.0, 46.0, 29.0, 34.0, 28.0, 29.0, 29.0, 30.0, 17.0, 18.0, 18.0, 21.0, 13.0, 14.0, 11.0, 8.0, 8.0, 8.0, 3.0, 2.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3349609375, -1.2929840087890625, -1.251007080078125, -1.2090301513671875, -1.16705322265625, -1.1250762939453125, -1.083099365234375, -1.0411224365234375, -0.9991455078125, -0.9571685791015625, -0.915191650390625, -0.8732147216796875, -0.83123779296875, -0.7892608642578125, -0.747283935546875, -0.7053070068359375, -0.663330078125, -0.6213531494140625, -0.579376220703125, -0.5373992919921875, -0.49542236328125, -0.4534454345703125, -0.411468505859375, -0.3694915771484375, -0.3275146484375, -0.2855377197265625, -0.243560791015625, -0.2015838623046875, -0.15960693359375, -0.1176300048828125, -0.075653076171875, -0.0336761474609375, 0.00830078125, 0.0502777099609375, 0.092254638671875, 0.1342315673828125, 0.17620849609375, 0.2181854248046875, 0.260162353515625, 0.3021392822265625, 0.3441162109375, 0.3860931396484375, 0.428070068359375, 0.4700469970703125, 0.51202392578125, 0.5540008544921875, 0.595977783203125, 0.6379547119140625, 0.679931640625, 0.7219085693359375, 0.763885498046875, 0.8058624267578125, 0.84783935546875, 0.8898162841796875, 0.931793212890625, 0.9737701416015625, 1.0157470703125, 1.0577239990234375, 1.099700927734375, 1.1416778564453125, 1.18365478515625, 1.2256317138671875, 1.267608642578125, 1.3095855712890625, 1.3515625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 6.0, 11.0, 13.0, 14.0, 24.0, 33.0, 50.0, 62.0, 71.0, 91.0, 147.0, 194.0, 307.0, 405.0, 569.0, 815.0, 1185.0, 1912.0, 3003.0, 5589.0, 11324.0, 28518.0, 116196.0, 719188.0, 2129917.0, 947575.0, 163770.0, 34909.0, 12820.0, 6130.0, 3423.0, 1992.0, 1309.0, 826.0, 557.0, 384.0, 272.0, 211.0, 129.0, 87.0, 70.0, 52.0, 29.0, 26.0, 22.0, 15.0, 11.0, 9.0, 1.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-2.3046875, -2.229339599609375, -2.15399169921875, -2.078643798828125, -2.0032958984375, -1.927947998046875, -1.85260009765625, -1.777252197265625, -1.701904296875, -1.626556396484375, -1.55120849609375, -1.475860595703125, -1.4005126953125, -1.325164794921875, -1.24981689453125, -1.174468994140625, -1.09912109375, -1.023773193359375, -0.94842529296875, -0.873077392578125, -0.7977294921875, -0.722381591796875, -0.64703369140625, -0.571685791015625, -0.496337890625, -0.420989990234375, -0.34564208984375, -0.270294189453125, -0.1949462890625, -0.119598388671875, -0.04425048828125, 0.031097412109375, 0.1064453125, 0.181793212890625, 0.25714111328125, 0.332489013671875, 0.4078369140625, 0.483184814453125, 0.55853271484375, 0.633880615234375, 0.709228515625, 0.784576416015625, 0.85992431640625, 0.935272216796875, 1.0106201171875, 1.085968017578125, 1.16131591796875, 1.236663818359375, 1.31201171875, 1.387359619140625, 1.46270751953125, 1.538055419921875, 1.6134033203125, 1.688751220703125, 1.76409912109375, 1.839447021484375, 1.914794921875, 1.990142822265625, 2.06549072265625, 2.140838623046875, 2.2161865234375, 2.291534423828125, 2.36688232421875, 2.442230224609375, 2.517578125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 11.0, 14.0, 33.0, 38.0, 62.0, 122.0, 200.0, 287.0, 480.0, 710.0, 714.0, 500.0, 327.0, 183.0, 134.0, 83.0, 62.0, 41.0, 26.0, 14.0, 10.0, 9.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.916015625, -3.804656982421875, -3.69329833984375, -3.581939697265625, -3.4705810546875, -3.359222412109375, -3.24786376953125, -3.136505126953125, -3.025146484375, -2.913787841796875, -2.80242919921875, -2.691070556640625, -2.5797119140625, -2.468353271484375, -2.35699462890625, -2.245635986328125, -2.13427734375, -2.022918701171875, -1.91156005859375, -1.800201416015625, -1.6888427734375, -1.577484130859375, -1.46612548828125, -1.354766845703125, -1.243408203125, -1.132049560546875, -1.02069091796875, -0.909332275390625, -0.7979736328125, -0.686614990234375, -0.57525634765625, -0.463897705078125, -0.3525390625, -0.241180419921875, -0.12982177734375, -0.018463134765625, 0.0928955078125, 0.204254150390625, 0.31561279296875, 0.426971435546875, 0.538330078125, 0.649688720703125, 0.76104736328125, 0.872406005859375, 0.9837646484375, 1.095123291015625, 1.20648193359375, 1.317840576171875, 1.42919921875, 1.540557861328125, 1.65191650390625, 1.763275146484375, 1.8746337890625, 1.985992431640625, 2.09735107421875, 2.208709716796875, 2.320068359375, 2.431427001953125, 2.54278564453125, 2.654144287109375, 2.7655029296875, 2.876861572265625, 2.98822021484375, 3.099578857421875, 3.2109375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 7.0, 3.0, 5.0, 13.0, 20.0, 41.0, 101.0, 350.0, 1934.0, 71170.0, 4101873.0, 17181.0, 1171.0, 257.0, 95.0, 37.0, 16.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0625, -11.6373291015625, -11.212158203125, -10.7869873046875, -10.36181640625, -9.9366455078125, -9.511474609375, -9.0863037109375, -8.6611328125, -8.2359619140625, -7.810791015625, -7.3856201171875, -6.96044921875, -6.5352783203125, -6.110107421875, -5.6849365234375, -5.259765625, -4.8345947265625, -4.409423828125, -3.9842529296875, -3.55908203125, -3.1339111328125, -2.708740234375, -2.2835693359375, -1.8583984375, -1.4332275390625, -1.008056640625, -0.5828857421875, -0.15771484375, 0.2674560546875, 0.692626953125, 1.1177978515625, 1.54296875, 1.9681396484375, 2.393310546875, 2.8184814453125, 3.24365234375, 3.6688232421875, 4.093994140625, 4.5191650390625, 4.9443359375, 5.3695068359375, 5.794677734375, 6.2198486328125, 6.64501953125, 7.0701904296875, 7.495361328125, 7.9205322265625, 8.345703125, 8.7708740234375, 9.196044921875, 9.6212158203125, 10.04638671875, 10.4715576171875, 10.896728515625, 11.3218994140625, 11.7470703125, 12.1722412109375, 12.597412109375, 13.0225830078125, 13.44775390625, 13.8729248046875, 14.298095703125, 14.7232666015625, 15.1484375]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 26.0, 894.0, 94.0, 1.0, 2.0], "bins": [-236.2930145263672, -232.3925323486328, -228.49203491210938, -224.591552734375, -220.69105529785156, -216.7905731201172, -212.89007568359375, -208.98959350585938, -205.08909606933594, -201.18861389160156, -197.28811645507812, -193.38763427734375, -189.4871368408203, -185.58665466308594, -181.6861572265625, -177.78567504882812, -173.8851776123047, -169.9846954345703, -166.08419799804688, -162.1837158203125, -158.28321838378906, -154.3827362060547, -150.48223876953125, -146.58175659179688, -142.68125915527344, -138.78077697753906, -134.88027954101562, -130.97979736328125, -127.07929992675781, -123.1788101196289, -119.2783203125, -115.3778305053711, -111.47734832763672, -107.57685852050781, -103.6763687133789, -99.77587890625, -95.8753890991211, -91.97489929199219, -88.07440948486328, -84.17391967773438, -80.27342987060547, -76.37294006347656, -72.47245025634766, -68.57196044921875, -64.67147064208984, -60.77098083496094, -56.87049102783203, -52.970001220703125, -49.06951141357422, -45.16902160644531, -41.268531799316406, -37.3680419921875, -33.467552185058594, -29.56706428527832, -25.666574478149414, -21.766084671020508, -17.865596771240234, -13.965106964111328, -10.064617156982422, -6.164128303527832, -2.263638496398926, 1.636850357055664, 5.53734016418457, 9.437829971313477, 13.3383207321167]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 7.0, 14.0, 9.0, 24.0, 25.0, 20.0, 26.0, 39.0, 32.0, 48.0, 44.0, 44.0, 47.0, 58.0, 65.0, 59.0, 53.0, 68.0, 52.0, 51.0, 31.0, 46.0, 24.0, 30.0, 25.0, 18.0, 13.0, 5.0, 7.0, 3.0, 4.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.324511528015137, -9.94625473022461, -9.567997932434082, -9.189741134643555, -8.811484336853027, -8.4332275390625, -8.054969787597656, -7.676713466644287, -7.29845666885376, -6.920199871063232, -6.541943073272705, -6.1636857986450195, -5.785429000854492, -5.407172203063965, -5.0289154052734375, -4.65065860748291, -4.272401809692383, -3.8941450119018555, -3.515888214111328, -3.1376311779022217, -2.7593743801116943, -2.381117582321167, -2.0028605461120605, -1.6246037483215332, -1.2463469505310059, -0.8680900931358337, -0.4898332357406616, -0.11157631874084473, 0.2666804790496826, 0.64493727684021, 1.0231943130493164, 1.4014511108398438, 1.779707908630371, 2.1579647064208984, 2.536221504211426, 2.9144785404205322, 3.2927353382110596, 3.670992136001587, 4.049249172210693, 4.427505970001221, 4.805762767791748, 5.184019565582275, 5.562276363372803, 5.940533638000488, 6.318790435791016, 6.697047233581543, 7.07530403137207, 7.453560829162598, 7.831817626953125, 8.210074424743652, 8.58833122253418, 8.966588020324707, 9.344844818115234, 9.723101615905762, 10.101358413696289, 10.479616165161133, 10.857872009277344, 11.236128807067871, 11.614385604858398, 11.992642402648926, 12.370899200439453, 12.74915599822998, 13.127412796020508, 13.505670547485352, 13.883927345275879]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 4.0, 7.0, 9.0, 12.0, 11.0, 13.0, 8.0, 21.0, 29.0, 30.0, 35.0, 23.0, 43.0, 22.0, 35.0, 37.0, 39.0, 51.0, 42.0, 39.0, 48.0, 41.0, 40.0, 35.0, 46.0, 36.0, 36.0, 24.0, 26.0, 23.0, 22.0, 17.0, 14.0, 8.0, 13.0, 8.0, 8.0, 11.0, 8.0, 5.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.3232421875, -1.285736083984375, -1.24822998046875, -1.210723876953125, -1.1732177734375, -1.135711669921875, -1.09820556640625, -1.060699462890625, -1.023193359375, -0.985687255859375, -0.94818115234375, -0.910675048828125, -0.8731689453125, -0.835662841796875, -0.79815673828125, -0.760650634765625, -0.72314453125, -0.685638427734375, -0.64813232421875, -0.610626220703125, -0.5731201171875, -0.535614013671875, -0.49810791015625, -0.460601806640625, -0.423095703125, -0.385589599609375, -0.34808349609375, -0.310577392578125, -0.2730712890625, -0.235565185546875, -0.19805908203125, -0.160552978515625, -0.123046875, -0.085540771484375, -0.04803466796875, -0.010528564453125, 0.0269775390625, 0.064483642578125, 0.10198974609375, 0.139495849609375, 0.177001953125, 0.214508056640625, 0.25201416015625, 0.289520263671875, 0.3270263671875, 0.364532470703125, 0.40203857421875, 0.439544677734375, 0.47705078125, 0.514556884765625, 0.55206298828125, 0.589569091796875, 0.6270751953125, 0.664581298828125, 0.70208740234375, 0.739593505859375, 0.777099609375, 0.814605712890625, 0.85211181640625, 0.889617919921875, 0.9271240234375, 0.964630126953125, 1.00213623046875, 1.039642333984375, 1.0771484375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 5.0, 4.0, 6.0, 16.0, 18.0, 17.0, 27.0, 39.0, 66.0, 84.0, 104.0, 148.0, 214.0, 248.0, 379.0, 480.0, 685.0, 955.0, 1245.0, 1791.0, 2394.0, 3490.0, 5095.0, 8095.0, 13192.0, 25907.0, 140037.0, 734136.0, 56032.0, 20317.0, 11004.0, 6834.0, 4412.0, 3104.0, 2132.0, 1563.0, 1142.0, 802.0, 640.0, 465.0, 350.0, 245.0, 169.0, 130.0, 95.0, 88.0, 36.0, 40.0, 20.0, 20.0, 21.0, 14.0, 1.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0546875, -1.0199127197265625, -0.985137939453125, -0.9503631591796875, -0.91558837890625, -0.8808135986328125, -0.846038818359375, -0.8112640380859375, -0.7764892578125, -0.7417144775390625, -0.706939697265625, -0.6721649169921875, -0.63739013671875, -0.6026153564453125, -0.567840576171875, -0.5330657958984375, -0.498291015625, -0.4635162353515625, -0.428741455078125, -0.3939666748046875, -0.35919189453125, -0.3244171142578125, -0.289642333984375, -0.2548675537109375, -0.2200927734375, -0.1853179931640625, -0.150543212890625, -0.1157684326171875, -0.08099365234375, -0.0462188720703125, -0.011444091796875, 0.0233306884765625, 0.05810546875, 0.0928802490234375, 0.127655029296875, 0.1624298095703125, 0.19720458984375, 0.2319793701171875, 0.266754150390625, 0.3015289306640625, 0.3363037109375, 0.3710784912109375, 0.405853271484375, 0.4406280517578125, 0.47540283203125, 0.5101776123046875, 0.544952392578125, 0.5797271728515625, 0.614501953125, 0.6492767333984375, 0.684051513671875, 0.7188262939453125, 0.75360107421875, 0.7883758544921875, 0.823150634765625, 0.8579254150390625, 0.8927001953125, 0.9274749755859375, 0.962249755859375, 0.9970245361328125, 1.03179931640625, 1.0665740966796875, 1.101348876953125, 1.1361236572265625, 1.1708984375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 8.0, 5.0, 13.0, 8.0, 16.0, 14.0, 12.0, 17.0, 21.0, 21.0, 25.0, 27.0, 31.0, 25.0, 27.0, 39.0, 31.0, 31.0, 46.0, 33.0, 1057.0, 42.0, 34.0, 39.0, 41.0, 40.0, 37.0, 26.0, 36.0, 32.0, 23.0, 25.0, 28.0, 16.0, 14.0, 14.0, 8.0, 7.0, 8.0, 8.0, 7.0, 7.0, 4.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.908203125, -0.8805465698242188, -0.8528900146484375, -0.8252334594726562, -0.797576904296875, -0.7699203491210938, -0.7422637939453125, -0.7146072387695312, -0.68695068359375, -0.6592941284179688, -0.6316375732421875, -0.6039810180664062, -0.576324462890625, -0.5486679077148438, -0.5210113525390625, -0.49335479736328125, -0.4656982421875, -0.43804168701171875, -0.4103851318359375, -0.38272857666015625, -0.355072021484375, -0.32741546630859375, -0.2997589111328125, -0.27210235595703125, -0.24444580078125, -0.21678924560546875, -0.1891326904296875, -0.16147613525390625, -0.133819580078125, -0.10616302490234375, -0.0785064697265625, -0.05084991455078125, -0.023193359375, 0.00446319580078125, 0.0321197509765625, 0.05977630615234375, 0.087432861328125, 0.11508941650390625, 0.1427459716796875, 0.17040252685546875, 0.19805908203125, 0.22571563720703125, 0.2533721923828125, 0.28102874755859375, 0.308685302734375, 0.33634185791015625, 0.3639984130859375, 0.39165496826171875, 0.4193115234375, 0.44696807861328125, 0.4746246337890625, 0.5022811889648438, 0.529937744140625, 0.5575942993164062, 0.5852508544921875, 0.6129074096679688, 0.64056396484375, 0.6682205200195312, 0.6958770751953125, 0.7235336303710938, 0.751190185546875, 0.7788467407226562, 0.8065032958984375, 0.8341598510742188, 0.86181640625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 4.0, 12.0, 9.0, 13.0, 13.0, 27.0, 21.0, 42.0, 47.0, 73.0, 94.0, 132.0, 179.0, 263.0, 331.0, 440.0, 618.0, 855.0, 1186.0, 1785.0, 2758.0, 4509.0, 8206.0, 19521.0, 211399.0, 1795063.0, 25408.0, 9422.0, 4968.0, 3043.0, 2033.0, 1303.0, 925.0, 651.0, 455.0, 356.0, 262.0, 182.0, 127.0, 100.0, 102.0, 45.0, 41.0, 21.0, 23.0, 28.0, 9.0, 15.0, 6.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.615234375, -2.533782958984375, -2.45233154296875, -2.370880126953125, -2.2894287109375, -2.207977294921875, -2.12652587890625, -2.045074462890625, -1.963623046875, -1.882171630859375, -1.80072021484375, -1.719268798828125, -1.6378173828125, -1.556365966796875, -1.47491455078125, -1.393463134765625, -1.31201171875, -1.230560302734375, -1.14910888671875, -1.067657470703125, -0.9862060546875, -0.904754638671875, -0.82330322265625, -0.741851806640625, -0.660400390625, -0.578948974609375, -0.49749755859375, -0.416046142578125, -0.3345947265625, -0.253143310546875, -0.17169189453125, -0.090240478515625, -0.0087890625, 0.072662353515625, 0.15411376953125, 0.235565185546875, 0.3170166015625, 0.398468017578125, 0.47991943359375, 0.561370849609375, 0.642822265625, 0.724273681640625, 0.80572509765625, 0.887176513671875, 0.9686279296875, 1.050079345703125, 1.13153076171875, 1.212982177734375, 1.29443359375, 1.375885009765625, 1.45733642578125, 1.538787841796875, 1.6202392578125, 1.701690673828125, 1.78314208984375, 1.864593505859375, 1.946044921875, 2.027496337890625, 2.10894775390625, 2.190399169921875, 2.2718505859375, 2.353302001953125, 2.43475341796875, 2.516204833984375, 2.59765625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 5.0, 3.0, 1.0, 4.0, 5.0, 5.0, 5.0, 21.0, 37.0, 73.0, 221.0, 412.0, 94.0, 49.0, 17.0, 10.0, 9.0, 4.0, 4.0, 1.0, 3.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1484375, -0.143829345703125, -0.13922119140625, -0.134613037109375, -0.1300048828125, -0.125396728515625, -0.12078857421875, -0.116180419921875, -0.111572265625, -0.106964111328125, -0.10235595703125, -0.097747802734375, -0.0931396484375, -0.088531494140625, -0.08392333984375, -0.079315185546875, -0.07470703125, -0.070098876953125, -0.06549072265625, -0.060882568359375, -0.0562744140625, -0.051666259765625, -0.04705810546875, -0.042449951171875, -0.037841796875, -0.033233642578125, -0.02862548828125, -0.024017333984375, -0.0194091796875, -0.014801025390625, -0.01019287109375, -0.005584716796875, -0.0009765625, 0.003631591796875, 0.00823974609375, 0.012847900390625, 0.0174560546875, 0.022064208984375, 0.02667236328125, 0.031280517578125, 0.035888671875, 0.040496826171875, 0.04510498046875, 0.049713134765625, 0.0543212890625, 0.058929443359375, 0.06353759765625, 0.068145751953125, 0.07275390625, 0.077362060546875, 0.08197021484375, 0.086578369140625, 0.0911865234375, 0.095794677734375, 0.10040283203125, 0.105010986328125, 0.109619140625, 0.114227294921875, 0.11883544921875, 0.123443603515625, 0.1280517578125, 0.132659912109375, 0.13726806640625, 0.141876220703125, 0.146484375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 6.0, 5.0, 3.0, 6.0, 16.0, 10.0, 18.0, 28.0, 45.0, 116.0, 262.0, 30184.0, 1017201.0, 325.0, 135.0, 68.0, 35.0, 13.0, 9.0, 17.0, 8.0, 7.0, 8.0, 6.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.4609375, -3.349456787109375, -3.23797607421875, -3.126495361328125, -3.0150146484375, -2.903533935546875, -2.79205322265625, -2.680572509765625, -2.569091796875, -2.457611083984375, -2.34613037109375, -2.234649658203125, -2.1231689453125, -2.011688232421875, -1.90020751953125, -1.788726806640625, -1.67724609375, -1.565765380859375, -1.45428466796875, -1.342803955078125, -1.2313232421875, -1.119842529296875, -1.00836181640625, -0.896881103515625, -0.785400390625, -0.673919677734375, -0.56243896484375, -0.450958251953125, -0.3394775390625, -0.227996826171875, -0.11651611328125, -0.005035400390625, 0.1064453125, 0.217926025390625, 0.32940673828125, 0.440887451171875, 0.5523681640625, 0.663848876953125, 0.77532958984375, 0.886810302734375, 0.998291015625, 1.109771728515625, 1.22125244140625, 1.332733154296875, 1.4442138671875, 1.555694580078125, 1.66717529296875, 1.778656005859375, 1.89013671875, 2.001617431640625, 2.11309814453125, 2.224578857421875, 2.3360595703125, 2.447540283203125, 2.55902099609375, 2.670501708984375, 2.781982421875, 2.893463134765625, 3.00494384765625, 3.116424560546875, 3.2279052734375, 3.339385986328125, 3.45086669921875, 3.562347412109375, 3.673828125]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 8.0, 1008.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.829523503780365, -0.7842382788658142, -0.7389530539512634, -0.6936678290367126, -0.6483826041221619, -0.6030973792076111, -0.5578120946884155, -0.5125268697738647, -0.46724167466163635, -0.42195644974708557, -0.3766712248325348, -0.3313859701156616, -0.28610074520111084, -0.24081553518772125, -0.19553029537200928, -0.1502450704574585, -0.10495984554290771, -0.059674616903066635, -0.014389388263225555, 0.030895844101905823, 0.0761810690164566, 0.12146629393100739, 0.16675153374671936, 0.21203675866127014, 0.2573219835758209, 0.3026072084903717, 0.3478924334049225, 0.39317768812179565, 0.43846291303634644, 0.4837481379508972, 0.529033362865448, 0.5743185877799988, 0.6196037530899048, 0.6648889780044556, 0.7101742029190063, 0.7554594278335571, 0.8007446527481079, 0.8460298776626587, 0.8913151025772095, 0.9366003274917603, 0.981885552406311, 1.0271707773208618, 1.0724560022354126, 1.1177412271499634, 1.1630264520645142, 1.208311676979065, 1.2535969018936157, 1.2988821268081665, 1.3441674709320068, 1.3894526958465576, 1.4347379207611084, 1.4800231456756592, 1.52530837059021, 1.5705935955047607, 1.6158788204193115, 1.6611640453338623, 1.706449270248413, 1.7517344951629639, 1.7970197200775146, 1.8423049449920654, 1.8875901699066162, 1.932875394821167, 1.9781606197357178, 2.0234458446502686, 2.0687310695648193]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 3.0, 2.0, 5.0, 9.0, 7.0, 5.0, 17.0, 12.0, 11.0, 17.0, 18.0, 23.0, 26.0, 32.0, 34.0, 40.0, 38.0, 31.0, 42.0, 43.0, 40.0, 34.0, 50.0, 27.0, 38.0, 35.0, 40.0, 41.0, 35.0, 20.0, 33.0, 27.0, 21.0, 24.0, 22.0, 18.0, 19.0, 7.0, 15.0, 12.0, 5.0, 2.0, 5.0, 2.0, 4.0, 1.0, 0.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08797043561935425, -0.08514339476823807, -0.08231634646654129, -0.07948930561542511, -0.07666225731372833, -0.07383521646261215, -0.07100817561149597, -0.0681811273097992, -0.06535408645868301, -0.06252704560756683, -0.059699997305870056, -0.056872956454753876, -0.0540459118783474, -0.05121886730194092, -0.04839182645082474, -0.04556478187441826, -0.04273773729801178, -0.0399106927216053, -0.03708364814519882, -0.03425660729408264, -0.03142956271767616, -0.028602518141269684, -0.025775475427508354, -0.022948432713747025, -0.020121388137340546, -0.017294343560934067, -0.014467300847172737, -0.011640257202088833, -0.008813213557004929, -0.005986169911921024, -0.00315912626683712, -0.0003320835530757904, 0.0024949610233306885, 0.005322004668414593, 0.008149048313498497, 0.010976091958582401, 0.013803135603666306, 0.016630180180072784, 0.019457222893834114, 0.022284265607595444, 0.025111310184001923, 0.0279383547604084, 0.03076539747416973, 0.03359244018793106, 0.03641948476433754, 0.03924652934074402, 0.0420735701918602, 0.04490061476826668, 0.04772765934467316, 0.050554703921079636, 0.053381748497486115, 0.056208789348602295, 0.059035833925008774, 0.06186287850141525, 0.06468991935253143, 0.06751696765422821, 0.07034400850534439, 0.07317104935646057, 0.07599809765815735, 0.07882513850927353, 0.08165217936038971, 0.08447922766208649, 0.08730626851320267, 0.09013330936431885, 0.09296035766601562]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 5.0, 4.0, 8.0, 7.0, 12.0, 11.0, 13.0, 10.0, 24.0, 25.0, 31.0, 39.0, 21.0, 39.0, 22.0, 41.0, 35.0, 47.0, 43.0, 41.0, 40.0, 47.0, 42.0, 38.0, 37.0, 43.0, 39.0, 33.0, 28.0, 25.0, 21.0, 21.0, 17.0, 15.0, 7.0, 13.0, 8.0, 6.0, 13.0, 8.0, 4.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.3193359375, -1.281829833984375, -1.24432373046875, -1.206817626953125, -1.1693115234375, -1.131805419921875, -1.09429931640625, -1.056793212890625, -1.019287109375, -0.981781005859375, -0.94427490234375, -0.906768798828125, -0.8692626953125, -0.831756591796875, -0.79425048828125, -0.756744384765625, -0.71923828125, -0.681732177734375, -0.64422607421875, -0.606719970703125, -0.5692138671875, -0.531707763671875, -0.49420166015625, -0.456695556640625, -0.419189453125, -0.381683349609375, -0.34417724609375, -0.306671142578125, -0.2691650390625, -0.231658935546875, -0.19415283203125, -0.156646728515625, -0.119140625, -0.081634521484375, -0.04412841796875, -0.006622314453125, 0.0308837890625, 0.068389892578125, 0.10589599609375, 0.143402099609375, 0.180908203125, 0.218414306640625, 0.25592041015625, 0.293426513671875, 0.3309326171875, 0.368438720703125, 0.40594482421875, 0.443450927734375, 0.48095703125, 0.518463134765625, 0.55596923828125, 0.593475341796875, 0.6309814453125, 0.668487548828125, 0.70599365234375, 0.743499755859375, 0.781005859375, 0.818511962890625, 0.85601806640625, 0.893524169921875, 0.9310302734375, 0.968536376953125, 1.00604248046875, 1.043548583984375, 1.0810546875]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 10.0, 9.0, 15.0, 12.0, 29.0, 35.0, 30.0, 52.0, 54.0, 90.0, 128.0, 135.0, 194.0, 264.0, 408.0, 543.0, 697.0, 1107.0, 1710.0, 2926.0, 6070.0, 14555.0, 46792.0, 198920.0, 508072.0, 192244.0, 44832.0, 14247.0, 5925.0, 3015.0, 1626.0, 1083.0, 703.0, 537.0, 398.0, 261.0, 217.0, 136.0, 103.0, 91.0, 69.0, 57.0, 36.0, 36.0, 25.0, 16.0, 11.0, 10.0, 6.0, 5.0, 4.0, 4.0, 0.0, 2.0], "bins": [-1.7060546875, -1.656585693359375, -1.60711669921875, -1.557647705078125, -1.5081787109375, -1.458709716796875, -1.40924072265625, -1.359771728515625, -1.310302734375, -1.260833740234375, -1.21136474609375, -1.161895751953125, -1.1124267578125, -1.062957763671875, -1.01348876953125, -0.964019775390625, -0.91455078125, -0.865081787109375, -0.81561279296875, -0.766143798828125, -0.7166748046875, -0.667205810546875, -0.61773681640625, -0.568267822265625, -0.518798828125, -0.469329833984375, -0.41986083984375, -0.370391845703125, -0.3209228515625, -0.271453857421875, -0.22198486328125, -0.172515869140625, -0.123046875, -0.073577880859375, -0.02410888671875, 0.025360107421875, 0.0748291015625, 0.124298095703125, 0.17376708984375, 0.223236083984375, 0.272705078125, 0.322174072265625, 0.37164306640625, 0.421112060546875, 0.4705810546875, 0.520050048828125, 0.56951904296875, 0.618988037109375, 0.66845703125, 0.717926025390625, 0.76739501953125, 0.816864013671875, 0.8663330078125, 0.915802001953125, 0.96527099609375, 1.014739990234375, 1.064208984375, 1.113677978515625, 1.16314697265625, 1.212615966796875, 1.2620849609375, 1.311553955078125, 1.36102294921875, 1.410491943359375, 1.4599609375]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 8.0, 2.0, 1.0, 7.0, 7.0, 8.0, 14.0, 10.0, 15.0, 21.0, 19.0, 30.0, 28.0, 25.0, 52.0, 37.0, 74.0, 102.0, 139.0, 359.0, 1406.0, 195.0, 107.0, 71.0, 53.0, 43.0, 41.0, 41.0, 27.0, 26.0, 15.0, 20.0, 12.0, 5.0, 8.0, 7.0, 9.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.4765625, -3.37164306640625, -3.2667236328125, -3.16180419921875, -3.056884765625, -2.95196533203125, -2.8470458984375, -2.74212646484375, -2.63720703125, -2.53228759765625, -2.4273681640625, -2.32244873046875, -2.217529296875, -2.11260986328125, -2.0076904296875, -1.90277099609375, -1.7978515625, -1.69293212890625, -1.5880126953125, -1.48309326171875, -1.378173828125, -1.27325439453125, -1.1683349609375, -1.06341552734375, -0.95849609375, -0.85357666015625, -0.7486572265625, -0.64373779296875, -0.538818359375, -0.43389892578125, -0.3289794921875, -0.22406005859375, -0.119140625, -0.01422119140625, 0.0906982421875, 0.19561767578125, 0.300537109375, 0.40545654296875, 0.5103759765625, 0.61529541015625, 0.72021484375, 0.82513427734375, 0.9300537109375, 1.03497314453125, 1.139892578125, 1.24481201171875, 1.3497314453125, 1.45465087890625, 1.5595703125, 1.66448974609375, 1.7694091796875, 1.87432861328125, 1.979248046875, 2.08416748046875, 2.1890869140625, 2.29400634765625, 2.39892578125, 2.50384521484375, 2.6087646484375, 2.71368408203125, 2.818603515625, 2.92352294921875, 3.0284423828125, 3.13336181640625, 3.23828125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 11.0, 10.0, 16.0, 17.0, 14.0, 27.0, 26.0, 45.0, 73.0, 84.0, 109.0, 171.0, 288.0, 504.0, 1298.0, 7951.0, 3065006.0, 66384.0, 1977.0, 637.0, 334.0, 206.0, 130.0, 94.0, 62.0, 59.0, 38.0, 32.0, 22.0, 16.0, 13.0, 10.0, 12.0, 8.0, 7.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.76171875, -5.56085205078125, -5.3599853515625, -5.15911865234375, -4.958251953125, -4.75738525390625, -4.5565185546875, -4.35565185546875, -4.15478515625, -3.95391845703125, -3.7530517578125, -3.55218505859375, -3.351318359375, -3.15045166015625, -2.9495849609375, -2.74871826171875, -2.5478515625, -2.34698486328125, -2.1461181640625, -1.94525146484375, -1.744384765625, -1.54351806640625, -1.3426513671875, -1.14178466796875, -0.94091796875, -0.74005126953125, -0.5391845703125, -0.33831787109375, -0.137451171875, 0.06341552734375, 0.2642822265625, 0.46514892578125, 0.666015625, 0.86688232421875, 1.0677490234375, 1.26861572265625, 1.469482421875, 1.67034912109375, 1.8712158203125, 2.07208251953125, 2.27294921875, 2.47381591796875, 2.6746826171875, 2.87554931640625, 3.076416015625, 3.27728271484375, 3.4781494140625, 3.67901611328125, 3.8798828125, 4.08074951171875, 4.2816162109375, 4.48248291015625, 4.683349609375, 4.88421630859375, 5.0850830078125, 5.28594970703125, 5.48681640625, 5.68768310546875, 5.8885498046875, 6.08941650390625, 6.290283203125, 6.49114990234375, 6.6920166015625, 6.89288330078125, 7.09375]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 14.0, 676.0, 318.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.85894012451172, -86.09623718261719, -84.33354187011719, -82.57083892822266, -80.80814361572266, -79.04544067382812, -77.28274536132812, -75.5200424194336, -73.75733947753906, -71.99463653564453, -70.23194122314453, -68.46923828125, -66.70654296875, -64.94384002685547, -63.1811408996582, -61.41844177246094, -59.65574645996094, -57.89304733276367, -56.130348205566406, -54.36764907836914, -52.604949951171875, -50.842247009277344, -49.07954788208008, -47.31684875488281, -45.55414962768555, -43.79145050048828, -42.028751373291016, -40.26605224609375, -38.50334930419922, -36.74065399169922, -34.97795104980469, -33.21525192260742, -31.452552795410156, -29.68985366821289, -27.927154541015625, -26.164453506469727, -24.40175437927246, -22.639055252075195, -20.876354217529297, -19.11365509033203, -17.350955963134766, -15.5882568359375, -13.825556755065918, -12.062856674194336, -10.30015754699707, -8.537458419799805, -6.774758338928223, -5.012058258056641, -3.249359130859375, -1.4866595268249512, 0.27604007720947266, 2.0387396812438965, 3.8014392852783203, 5.564138412475586, 7.326838493347168, 9.08953857421875, 10.852237701416016, 12.614936828613281, 14.377636909484863, 16.140336990356445, 17.90303611755371, 19.665735244750977, 21.428436279296875, 23.19113540649414, 24.953834533691406]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 7.0, 6.0, 12.0, 10.0, 13.0, 9.0, 18.0, 25.0, 17.0, 12.0, 29.0, 29.0, 35.0, 26.0, 30.0, 36.0, 47.0, 38.0, 52.0, 48.0, 48.0, 41.0, 49.0, 46.0, 54.0, 31.0, 35.0, 34.0, 25.0, 26.0, 21.0, 19.0, 15.0, 20.0, 6.0, 8.0, 9.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.661385536193848, -8.432267189025879, -8.20314884185791, -7.9740309715271, -7.744913101196289, -7.51579475402832, -7.286676406860352, -7.057558536529541, -6.8284406661987305, -6.599322319030762, -6.370204448699951, -6.141086101531982, -5.911968231201172, -5.682849884033203, -5.453731536865234, -5.224613666534424, -4.995495319366455, -4.766376972198486, -4.537259101867676, -4.308140754699707, -4.0790228843688965, -3.8499045372009277, -3.620786428451538, -3.3916683197021484, -3.162550210952759, -2.933432102203369, -2.7043139934539795, -2.47519588470459, -2.246077537536621, -2.0169596672058105, -1.7878413200378418, -1.5587232112884521, -1.3296046257019043, -1.1004865169525146, -0.8713683485984802, -0.6422501802444458, -0.41313207149505615, -0.1840139627456665, 0.045104265213012695, 0.27422237396240234, 0.503340482711792, 0.7324585914611816, 0.9615767598152161, 1.1906949281692505, 1.4198130369186401, 1.6489311456680298, 1.878049373626709, 2.1071674823760986, 2.3362855911254883, 2.565403699874878, 2.7945218086242676, 3.0236401557922363, 3.252758026123047, 3.4818763732910156, 3.7109944820404053, 3.940112590789795, 4.1692304611206055, 4.398348808288574, 4.627466678619385, 4.8565850257873535, 5.085702896118164, 5.314821243286133, 5.543939590454102, 5.773057460784912, 6.002175807952881]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 8.0, 10.0, 12.0, 17.0, 19.0, 14.0, 31.0, 20.0, 28.0, 28.0, 38.0, 38.0, 36.0, 44.0, 40.0, 46.0, 38.0, 42.0, 39.0, 49.0, 35.0, 41.0, 32.0, 23.0, 38.0, 31.0, 30.0, 26.0, 14.0, 23.0, 17.0, 12.0, 17.0, 7.0, 12.0, 11.0, 7.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.30078125, -1.2582244873046875, -1.215667724609375, -1.1731109619140625, -1.13055419921875, -1.0879974365234375, -1.045440673828125, -1.0028839111328125, -0.9603271484375, -0.9177703857421875, -0.875213623046875, -0.8326568603515625, -0.79010009765625, -0.7475433349609375, -0.704986572265625, -0.6624298095703125, -0.619873046875, -0.5773162841796875, -0.534759521484375, -0.4922027587890625, -0.44964599609375, -0.4070892333984375, -0.364532470703125, -0.3219757080078125, -0.2794189453125, -0.2368621826171875, -0.194305419921875, -0.1517486572265625, -0.10919189453125, -0.0666351318359375, -0.024078369140625, 0.0184783935546875, 0.06103515625, 0.1035919189453125, 0.146148681640625, 0.1887054443359375, 0.23126220703125, 0.2738189697265625, 0.316375732421875, 0.3589324951171875, 0.4014892578125, 0.4440460205078125, 0.486602783203125, 0.5291595458984375, 0.57171630859375, 0.6142730712890625, 0.656829833984375, 0.6993865966796875, 0.741943359375, 0.7845001220703125, 0.827056884765625, 0.8696136474609375, 0.91217041015625, 0.9547271728515625, 0.997283935546875, 1.0398406982421875, 1.0823974609375, 1.1249542236328125, 1.167510986328125, 1.2100677490234375, 1.25262451171875, 1.2951812744140625, 1.337738037109375, 1.3802947998046875, 1.4228515625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 9.0, 5.0, 7.0, 8.0, 8.0, 10.0, 18.0, 19.0, 24.0, 36.0, 40.0, 53.0, 58.0, 77.0, 79.0, 113.0, 172.0, 295.0, 509.0, 902.0, 1942.0, 5441.0, 23834.0, 214749.0, 3102050.0, 780792.0, 49111.0, 8399.0, 2562.0, 1071.0, 621.0, 364.0, 211.0, 150.0, 112.0, 91.0, 69.0, 60.0, 46.0, 33.0, 24.0, 22.0, 17.0, 16.0, 16.0, 10.0, 9.0, 9.0, 3.0, 6.0, 1.0, 1.0], "bins": [-7.93359375, -7.7174072265625, -7.501220703125, -7.2850341796875, -7.06884765625, -6.8526611328125, -6.636474609375, -6.4202880859375, -6.2041015625, -5.9879150390625, -5.771728515625, -5.5555419921875, -5.33935546875, -5.1231689453125, -4.906982421875, -4.6907958984375, -4.474609375, -4.2584228515625, -4.042236328125, -3.8260498046875, -3.60986328125, -3.3936767578125, -3.177490234375, -2.9613037109375, -2.7451171875, -2.5289306640625, -2.312744140625, -2.0965576171875, -1.88037109375, -1.6641845703125, -1.447998046875, -1.2318115234375, -1.015625, -0.7994384765625, -0.583251953125, -0.3670654296875, -0.15087890625, 0.0653076171875, 0.281494140625, 0.4976806640625, 0.7138671875, 0.9300537109375, 1.146240234375, 1.3624267578125, 1.57861328125, 1.7947998046875, 2.010986328125, 2.2271728515625, 2.443359375, 2.6595458984375, 2.875732421875, 3.0919189453125, 3.30810546875, 3.5242919921875, 3.740478515625, 3.9566650390625, 4.1728515625, 4.3890380859375, 4.605224609375, 4.8214111328125, 5.03759765625, 5.2537841796875, 5.469970703125, 5.6861572265625, 5.90234375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 6.0, 6.0, 10.0, 6.0, 9.0, 14.0, 23.0, 29.0, 46.0, 43.0, 63.0, 70.0, 87.0, 116.0, 161.0, 203.0, 250.0, 337.0, 402.0, 390.0, 373.0, 310.0, 242.0, 168.0, 147.0, 146.0, 88.0, 61.0, 63.0, 45.0, 37.0, 27.0, 22.0, 17.0, 9.0, 10.0, 12.0, 12.0, 7.0, 8.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2109375, -2.127410888671875, -2.04388427734375, -1.960357666015625, -1.8768310546875, -1.793304443359375, -1.70977783203125, -1.626251220703125, -1.542724609375, -1.459197998046875, -1.37567138671875, -1.292144775390625, -1.2086181640625, -1.125091552734375, -1.04156494140625, -0.958038330078125, -0.87451171875, -0.790985107421875, -0.70745849609375, -0.623931884765625, -0.5404052734375, -0.456878662109375, -0.37335205078125, -0.289825439453125, -0.206298828125, -0.122772216796875, -0.03924560546875, 0.044281005859375, 0.1278076171875, 0.211334228515625, 0.29486083984375, 0.378387451171875, 0.4619140625, 0.545440673828125, 0.62896728515625, 0.712493896484375, 0.7960205078125, 0.879547119140625, 0.96307373046875, 1.046600341796875, 1.130126953125, 1.213653564453125, 1.29718017578125, 1.380706787109375, 1.4642333984375, 1.547760009765625, 1.63128662109375, 1.714813232421875, 1.79833984375, 1.881866455078125, 1.96539306640625, 2.048919677734375, 2.1324462890625, 2.215972900390625, 2.29949951171875, 2.383026123046875, 2.466552734375, 2.550079345703125, 2.63360595703125, 2.717132568359375, 2.8006591796875, 2.884185791015625, 2.96771240234375, 3.051239013671875, 3.134765625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 11.0, 13.0, 25.0, 67.0, 119.0, 308.0, 693.0, 1612.0, 4077.0, 11210.0, 33958.0, 126096.0, 613435.0, 2305275.0, 863482.0, 168672.0, 43177.0, 13622.0, 4952.0, 1956.0, 854.0, 348.0, 149.0, 75.0, 40.0, 23.0, 10.0, 4.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.828125, -2.732574462890625, -2.63702392578125, -2.541473388671875, -2.4459228515625, -2.350372314453125, -2.25482177734375, -2.159271240234375, -2.063720703125, -1.968170166015625, -1.87261962890625, -1.777069091796875, -1.6815185546875, -1.585968017578125, -1.49041748046875, -1.394866943359375, -1.29931640625, -1.203765869140625, -1.10821533203125, -1.012664794921875, -0.9171142578125, -0.821563720703125, -0.72601318359375, -0.630462646484375, -0.534912109375, -0.439361572265625, -0.34381103515625, -0.248260498046875, -0.1527099609375, -0.057159423828125, 0.03839111328125, 0.133941650390625, 0.2294921875, 0.325042724609375, 0.42059326171875, 0.516143798828125, 0.6116943359375, 0.707244873046875, 0.80279541015625, 0.898345947265625, 0.993896484375, 1.089447021484375, 1.18499755859375, 1.280548095703125, 1.3760986328125, 1.471649169921875, 1.56719970703125, 1.662750244140625, 1.75830078125, 1.853851318359375, 1.94940185546875, 2.044952392578125, 2.1405029296875, 2.236053466796875, 2.33160400390625, 2.427154541015625, 2.522705078125, 2.618255615234375, 2.71380615234375, 2.809356689453125, 2.9049072265625, 3.000457763671875, 3.09600830078125, 3.191558837890625, 3.287109375]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 10.0, 4.0, 12.0, 8.0, 16.0, 18.0, 15.0, 30.0, 36.0, 40.0, 55.0, 81.0, 57.0, 72.0, 79.0, 88.0, 76.0, 68.0, 47.0, 48.0, 34.0, 27.0, 15.0, 15.0, 12.0, 8.0, 7.0, 5.0, 4.0, 4.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-24.566234588623047, -23.92478370666504, -23.28333282470703, -22.641881942749023, -22.000431060791016, -21.358980178833008, -20.717529296875, -20.076078414916992, -19.434627532958984, -18.793176651000977, -18.15172576904297, -17.51027488708496, -16.868824005126953, -16.227373123168945, -15.585922241210938, -14.94447135925293, -14.303021430969238, -13.66157054901123, -13.020119667053223, -12.378668785095215, -11.737217903137207, -11.0957670211792, -10.454317092895508, -9.8128662109375, -9.171415328979492, -8.529964447021484, -7.888513565063477, -7.247062683105469, -6.605611801147461, -5.964160919189453, -5.3227105140686035, -4.681259632110596, -4.03980827331543, -3.398357391357422, -2.756906509399414, -2.1154558658599854, -1.4740049839019775, -0.8325541019439697, -0.19110345840454102, 0.4503474235534668, 1.0917983055114746, 1.7332491874694824, 2.3747000694274902, 3.016150712966919, 3.6576015949249268, 4.2990522384643555, 4.940503120422363, 5.581954002380371, 6.223404884338379, 6.864855766296387, 7.5063066482543945, 8.147757530212402, 8.78920841217041, 9.430659294128418, 10.07210922241211, 10.713560104370117, 11.355010986328125, 11.996461868286133, 12.63791275024414, 13.279363632202148, 13.920814514160156, 14.562265396118164, 15.203716278076172, 15.84516716003418, 16.486618041992188]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 5.0, 3.0, 3.0, 0.0, 3.0, 3.0, 7.0, 6.0, 10.0, 13.0, 15.0, 20.0, 21.0, 21.0, 22.0, 17.0, 33.0, 25.0, 35.0, 25.0, 31.0, 44.0, 35.0, 42.0, 31.0, 44.0, 32.0, 40.0, 47.0, 30.0, 36.0, 38.0, 29.0, 24.0, 27.0, 31.0, 29.0, 14.0, 19.0, 10.0, 14.0, 13.0, 10.0, 9.0, 13.0, 8.0, 9.0, 6.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.437736511230469, -12.008167266845703, -11.578598022460938, -11.149028778076172, -10.719459533691406, -10.28989028930664, -9.860321998596191, -9.430752754211426, -9.00118350982666, -8.571614265441895, -8.142045021057129, -7.7124762535095215, -7.282907009124756, -6.85333776473999, -6.423768997192383, -5.994199752807617, -5.564630508422852, -5.135061264038086, -4.70549201965332, -4.275923252105713, -3.8463540077209473, -3.4167847633361816, -2.987215757369995, -2.5576467514038086, -2.128077507019043, -1.698508381843567, -1.2689392566680908, -0.8393701314926147, -0.40980100631713867, 0.019768238067626953, 0.4493372440338135, 0.87890625, 1.3084745407104492, 1.7380436658859253, 2.1676127910614014, 2.597181797027588, 3.0267510414123535, 3.456320285797119, 3.8858892917633057, 4.315458297729492, 4.745027542114258, 5.174596786499023, 5.604166030883789, 6.0337347984313965, 6.463304042816162, 6.892873287200928, 7.322442054748535, 7.752011299133301, 8.181580543518066, 8.611149787902832, 9.040719032287598, 9.470288276672363, 9.899856567382812, 10.329425811767578, 10.758995056152344, 11.18856430053711, 11.618133544921875, 12.04770278930664, 12.477272033691406, 12.906841278076172, 13.336410522460938, 13.765979766845703, 14.195548057556152, 14.625117301940918, 15.054686546325684]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 0.0, 4.0, 1.0, 2.0, 4.0, 5.0, 3.0, 8.0, 11.0, 13.0, 14.0, 18.0, 15.0, 16.0, 20.0, 21.0, 21.0, 31.0, 25.0, 42.0, 36.0, 33.0, 35.0, 37.0, 40.0, 48.0, 46.0, 47.0, 37.0, 36.0, 31.0, 29.0, 30.0, 29.0, 28.0, 27.0, 25.0, 15.0, 16.0, 14.0, 13.0, 16.0, 11.0, 6.0, 10.0, 15.0, 5.0, 6.0, 5.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.421875, -23.614013671875, -22.80615234375, -21.998291015625, -21.1904296875, -20.382568359375, -19.57470703125, -18.766845703125, -17.958984375, -17.151123046875, -16.34326171875, -15.535400390625, -14.7275390625, -13.919677734375, -13.11181640625, -12.303955078125, -11.49609375, -10.688232421875, -9.88037109375, -9.072509765625, -8.2646484375, -7.456787109375, -6.64892578125, -5.841064453125, -5.033203125, -4.225341796875, -3.41748046875, -2.609619140625, -1.8017578125, -0.993896484375, -0.18603515625, 0.621826171875, 1.4296875, 2.237548828125, 3.04541015625, 3.853271484375, 4.6611328125, 5.468994140625, 6.27685546875, 7.084716796875, 7.892578125, 8.700439453125, 9.50830078125, 10.316162109375, 11.1240234375, 11.931884765625, 12.73974609375, 13.547607421875, 14.35546875, 15.163330078125, 15.97119140625, 16.779052734375, 17.5869140625, 18.394775390625, 19.20263671875, 20.010498046875, 20.818359375, 21.626220703125, 22.43408203125, 23.241943359375, 24.0498046875, 24.857666015625, 25.66552734375, 26.473388671875, 27.28125]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 6.0, 16.0, 15.0, 15.0, 25.0, 41.0, 60.0, 70.0, 89.0, 155.0, 242.0, 295.0, 476.0, 704.0, 1078.0, 1523.0, 2219.0, 3354.0, 5134.0, 7638.0, 11394.0, 17996.0, 27866.0, 42665.0, 65263.0, 94957.0, 130306.0, 155633.0, 143966.0, 110372.0, 77138.0, 51185.0, 33603.0, 21663.0, 13969.0, 9035.0, 5962.0, 4189.0, 2601.0, 1817.0, 1196.0, 843.0, 568.0, 349.0, 285.0, 173.0, 130.0, 96.0, 65.0, 42.0, 22.0, 19.0, 16.0, 9.0, 8.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.98583984375, -0.9537429809570312, -0.9216461181640625, -0.8895492553710938, -0.857452392578125, -0.8253555297851562, -0.7932586669921875, -0.7611618041992188, -0.72906494140625, -0.6969680786132812, -0.6648712158203125, -0.6327743530273438, -0.600677490234375, -0.5685806274414062, -0.5364837646484375, -0.5043869018554688, -0.4722900390625, -0.44019317626953125, -0.4080963134765625, -0.37599945068359375, -0.343902587890625, -0.31180572509765625, -0.2797088623046875, -0.24761199951171875, -0.21551513671875, -0.18341827392578125, -0.1513214111328125, -0.11922454833984375, -0.087127685546875, -0.05503082275390625, -0.0229339599609375, 0.00916290283203125, 0.041259765625, 0.07335662841796875, 0.1054534912109375, 0.13755035400390625, 0.169647216796875, 0.20174407958984375, 0.2338409423828125, 0.26593780517578125, 0.29803466796875, 0.33013153076171875, 0.3622283935546875, 0.39432525634765625, 0.426422119140625, 0.45851898193359375, 0.4906158447265625, 0.5227127075195312, 0.5548095703125, 0.5869064331054688, 0.6190032958984375, 0.6511001586914062, 0.683197021484375, 0.7152938842773438, 0.7473907470703125, 0.7794876098632812, 0.81158447265625, 0.8436813354492188, 0.8757781982421875, 0.9078750610351562, 0.939971923828125, 0.9720687866210938, 1.0041656494140625, 1.0362625122070312, 1.068359375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 8.0, 2.0, 2.0, 7.0, 14.0, 12.0, 13.0, 12.0, 13.0, 13.0, 18.0, 17.0, 11.0, 27.0, 24.0, 14.0, 28.0, 28.0, 28.0, 31.0, 38.0, 34.0, 29.0, 49.0, 37.0, 1057.0, 39.0, 37.0, 25.0, 37.0, 24.0, 33.0, 25.0, 26.0, 33.0, 19.0, 25.0, 15.0, 27.0, 10.0, 20.0, 14.0, 10.0, 8.0, 9.0, 7.0, 5.0, 6.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.390625, -12.9595947265625, -12.528564453125, -12.0975341796875, -11.66650390625, -11.2354736328125, -10.804443359375, -10.3734130859375, -9.9423828125, -9.5113525390625, -9.080322265625, -8.6492919921875, -8.21826171875, -7.7872314453125, -7.356201171875, -6.9251708984375, -6.494140625, -6.0631103515625, -5.632080078125, -5.2010498046875, -4.77001953125, -4.3389892578125, -3.907958984375, -3.4769287109375, -3.0458984375, -2.6148681640625, -2.183837890625, -1.7528076171875, -1.32177734375, -0.8907470703125, -0.459716796875, -0.0286865234375, 0.40234375, 0.8333740234375, 1.264404296875, 1.6954345703125, 2.12646484375, 2.5574951171875, 2.988525390625, 3.4195556640625, 3.8505859375, 4.2816162109375, 4.712646484375, 5.1436767578125, 5.57470703125, 6.0057373046875, 6.436767578125, 6.8677978515625, 7.298828125, 7.7298583984375, 8.160888671875, 8.5919189453125, 9.02294921875, 9.4539794921875, 9.885009765625, 10.3160400390625, 10.7470703125, 11.1781005859375, 11.609130859375, 12.0401611328125, 12.47119140625, 12.9022216796875, 13.333251953125, 13.7642822265625, 14.1953125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 4.0, 10.0, 13.0, 12.0, 20.0, 47.0, 70.0, 121.0, 154.0, 278.0, 434.0, 763.0, 1280.0, 2035.0, 3555.0, 6081.0, 10597.0, 18392.0, 31506.0, 54191.0, 90058.0, 143948.0, 975016.0, 429378.0, 130914.0, 81755.0, 48934.0, 28227.0, 16524.0, 9362.0, 5389.0, 3226.0, 1872.0, 1154.0, 718.0, 426.0, 245.0, 148.0, 104.0, 63.0, 39.0, 24.0, 16.0, 12.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.0947265625, -1.0604095458984375, -1.026092529296875, -0.9917755126953125, -0.95745849609375, -0.9231414794921875, -0.888824462890625, -0.8545074462890625, -0.8201904296875, -0.7858734130859375, -0.751556396484375, -0.7172393798828125, -0.68292236328125, -0.6486053466796875, -0.614288330078125, -0.5799713134765625, -0.545654296875, -0.5113372802734375, -0.477020263671875, -0.4427032470703125, -0.40838623046875, -0.3740692138671875, -0.339752197265625, -0.3054351806640625, -0.2711181640625, -0.2368011474609375, -0.202484130859375, -0.1681671142578125, -0.13385009765625, -0.0995330810546875, -0.065216064453125, -0.0308990478515625, 0.00341796875, 0.0377349853515625, 0.072052001953125, 0.1063690185546875, 0.14068603515625, 0.1750030517578125, 0.209320068359375, 0.2436370849609375, 0.2779541015625, 0.3122711181640625, 0.346588134765625, 0.3809051513671875, 0.41522216796875, 0.4495391845703125, 0.483856201171875, 0.5181732177734375, 0.552490234375, 0.5868072509765625, 0.621124267578125, 0.6554412841796875, 0.68975830078125, 0.7240753173828125, 0.758392333984375, 0.7927093505859375, 0.8270263671875, 0.8613433837890625, 0.895660400390625, 0.9299774169921875, 0.96429443359375, 0.9986114501953125, 1.032928466796875, 1.0672454833984375, 1.1015625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 9.0, 17.0, 37.0, 70.0, 93.0, 118.0, 119.0, 111.0, 108.0, 97.0, 59.0, 56.0, 25.0, 28.0, 9.0, 2.0, 3.0, 3.0, 1.0, 0.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07275390625, -0.0700836181640625, -0.067413330078125, -0.0647430419921875, -0.06207275390625, -0.0594024658203125, -0.056732177734375, -0.0540618896484375, -0.0513916015625, -0.0487213134765625, -0.046051025390625, -0.0433807373046875, -0.04071044921875, -0.0380401611328125, -0.035369873046875, -0.0326995849609375, -0.030029296875, -0.0273590087890625, -0.024688720703125, -0.0220184326171875, -0.01934814453125, -0.0166778564453125, -0.014007568359375, -0.0113372802734375, -0.0086669921875, -0.0059967041015625, -0.003326416015625, -0.0006561279296875, 0.00201416015625, 0.0046844482421875, 0.007354736328125, 0.0100250244140625, 0.0126953125, 0.0153656005859375, 0.018035888671875, 0.0207061767578125, 0.02337646484375, 0.0260467529296875, 0.028717041015625, 0.0313873291015625, 0.0340576171875, 0.0367279052734375, 0.039398193359375, 0.0420684814453125, 0.04473876953125, 0.0474090576171875, 0.050079345703125, 0.0527496337890625, 0.055419921875, 0.0580902099609375, 0.060760498046875, 0.0634307861328125, 0.06610107421875, 0.0687713623046875, 0.071441650390625, 0.0741119384765625, 0.0767822265625, 0.0794525146484375, 0.082122802734375, 0.0847930908203125, 0.08746337890625, 0.0901336669921875, 0.092803955078125, 0.0954742431640625, 0.09814453125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 6.0, 21.0, 28.0, 35.0, 33.0, 53.0, 83.0, 107.0, 152.0, 202.0, 284.0, 458.0, 623.0, 889.0, 1261.0, 1973.0, 3101.0, 5385.0, 12102.0, 45103.0, 291832.0, 544991.0, 100572.0, 20455.0, 7598.0, 3832.0, 2380.0, 1559.0, 974.0, 707.0, 508.0, 348.0, 263.0, 186.0, 107.0, 96.0, 67.0, 44.0, 38.0, 29.0, 21.0, 13.0, 8.0, 9.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.315185546875, -0.30509185791015625, -0.2949981689453125, -0.28490447998046875, -0.274810791015625, -0.26471710205078125, -0.2546234130859375, -0.24452972412109375, -0.23443603515625, -0.22434234619140625, -0.2142486572265625, -0.20415496826171875, -0.194061279296875, -0.18396759033203125, -0.1738739013671875, -0.16378021240234375, -0.1536865234375, -0.14359283447265625, -0.1334991455078125, -0.12340545654296875, -0.113311767578125, -0.10321807861328125, -0.0931243896484375, -0.08303070068359375, -0.07293701171875, -0.06284332275390625, -0.0527496337890625, -0.04265594482421875, -0.032562255859375, -0.02246856689453125, -0.0123748779296875, -0.00228118896484375, 0.0078125, 0.01790618896484375, 0.0279998779296875, 0.03809356689453125, 0.048187255859375, 0.05828094482421875, 0.0683746337890625, 0.07846832275390625, 0.08856201171875, 0.09865570068359375, 0.1087493896484375, 0.11884307861328125, 0.128936767578125, 0.13903045654296875, 0.1491241455078125, 0.15921783447265625, 0.1693115234375, 0.17940521240234375, 0.1894989013671875, 0.19959259033203125, 0.209686279296875, 0.21977996826171875, 0.2298736572265625, 0.23996734619140625, 0.25006103515625, 0.26015472412109375, 0.2702484130859375, 0.28034210205078125, 0.290435791015625, 0.30052947998046875, 0.3106231689453125, 0.32071685791015625, 0.330810546875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 2.0, 11.0, 14.0, 27.0, 31.0, 58.0, 105.0, 157.0, 142.0, 118.0, 100.0, 57.0, 49.0, 32.0, 22.0, 12.0, 15.0, 11.0, 6.0, 6.0, 3.0, 1.0, 6.0, 2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10929163545370102, -0.10388729721307755, -0.09848296642303467, -0.0930786281824112, -0.08767428994178772, -0.08226995170116425, -0.07686561346054077, -0.0714612826704979, -0.06605694442987442, -0.060652606189250946, -0.05524827167391777, -0.049843937158584595, -0.04443959891796112, -0.039035260677337646, -0.03363092616200447, -0.028226591646671295, -0.02282225340604782, -0.017417917028069496, -0.012013580650091171, -0.006609244272112846, -0.0012049078941345215, 0.004199428483843803, 0.009603764861822128, 0.015008099377155304, 0.020412437617778778, 0.025816773995757103, 0.031221110373735428, 0.036625444889068604, 0.04202978312969208, 0.04743412137031555, 0.05283845588564873, 0.0582427904009819, 0.06364713609218597, 0.06905147433280945, 0.07445581257343292, 0.0798601433634758, 0.08526448160409927, 0.09066881984472275, 0.09607315063476562, 0.1014774888753891, 0.10688182711601257, 0.11228616535663605, 0.11769050359725952, 0.1230948343873024, 0.12849918007850647, 0.13390350341796875, 0.13930784165859222, 0.1447121798992157, 0.15011651813983917, 0.15552085638046265, 0.16092519462108612, 0.1663295328617096, 0.17173385620117188, 0.17713819444179535, 0.18254253268241882, 0.1879468709230423, 0.19335120916366577, 0.19875554740428925, 0.20415988564491272, 0.2095642238855362, 0.21496856212615967, 0.22037288546562195, 0.22577722370624542, 0.2311815619468689, 0.23658590018749237]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 5.0, 7.0, 6.0, 8.0, 13.0, 15.0, 17.0, 30.0, 17.0, 33.0, 21.0, 16.0, 31.0, 34.0, 33.0, 27.0, 33.0, 32.0, 46.0, 41.0, 40.0, 46.0, 31.0, 40.0, 31.0, 33.0, 30.0, 32.0, 31.0, 24.0, 24.0, 25.0, 17.0, 18.0, 14.0, 19.0, 10.0, 16.0, 13.0, 7.0, 17.0, 6.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.08956396579742432, -0.08706812560558319, -0.08457228541374207, -0.08207644522190094, -0.07958060503005981, -0.07708476483821869, -0.07458892464637756, -0.07209308445453644, -0.06959724426269531, -0.06710140407085419, -0.06460556387901306, -0.062109723687171936, -0.05961388349533081, -0.057118043303489685, -0.05462220311164856, -0.052126362919807434, -0.04963052272796631, -0.04713468253612518, -0.04463884234428406, -0.04214300215244293, -0.03964716196060181, -0.03715132176876068, -0.034655481576919556, -0.03215964138507843, -0.029663801193237305, -0.02716796100139618, -0.024672120809555054, -0.022176280617713928, -0.019680440425872803, -0.017184600234031677, -0.014688760042190552, -0.012192919850349426, -0.0096970796585083, -0.007201239466667175, -0.00470539927482605, -0.0022095590829849243, 0.00028628110885620117, 0.0027821213006973267, 0.005277961492538452, 0.007773801684379578, 0.010269641876220703, 0.012765482068061829, 0.015261322259902954, 0.01775716245174408, 0.020253002643585205, 0.02274884283542633, 0.025244683027267456, 0.02774052321910858, 0.030236363410949707, 0.03273220360279083, 0.03522804379463196, 0.037723883986473083, 0.04021972417831421, 0.042715564370155334, 0.04521140456199646, 0.047707244753837585, 0.05020308494567871, 0.052698925137519836, 0.05519476532936096, 0.05769060552120209, 0.06018644571304321, 0.06268228590488434, 0.06517812609672546, 0.06767396628856659, 0.07016980648040771]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 5.0, 7.0, 8.0, 16.0, 13.0, 17.0, 13.0, 19.0, 24.0, 14.0, 24.0, 29.0, 29.0, 38.0, 36.0, 35.0, 35.0, 37.0, 42.0, 44.0, 39.0, 48.0, 38.0, 42.0, 28.0, 31.0, 30.0, 27.0, 27.0, 28.0, 23.0, 15.0, 17.0, 18.0, 14.0, 11.0, 14.0, 6.0, 9.0, 13.0, 9.0, 5.0, 4.0, 5.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.296875, -23.494873046875, -22.69287109375, -21.890869140625, -21.0888671875, -20.286865234375, -19.48486328125, -18.682861328125, -17.880859375, -17.078857421875, -16.27685546875, -15.474853515625, -14.6728515625, -13.870849609375, -13.06884765625, -12.266845703125, -11.46484375, -10.662841796875, -9.86083984375, -9.058837890625, -8.2568359375, -7.454833984375, -6.65283203125, -5.850830078125, -5.048828125, -4.246826171875, -3.44482421875, -2.642822265625, -1.8408203125, -1.038818359375, -0.23681640625, 0.565185546875, 1.3671875, 2.169189453125, 2.97119140625, 3.773193359375, 4.5751953125, 5.377197265625, 6.17919921875, 6.981201171875, 7.783203125, 8.585205078125, 9.38720703125, 10.189208984375, 10.9912109375, 11.793212890625, 12.59521484375, 13.397216796875, 14.19921875, 15.001220703125, 15.80322265625, 16.605224609375, 17.4072265625, 18.209228515625, 19.01123046875, 19.813232421875, 20.615234375, 21.417236328125, 22.21923828125, 23.021240234375, 23.8232421875, 24.625244140625, 25.42724609375, 26.229248046875, 27.03125]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 10.0, 13.0, 12.0, 21.0, 24.0, 24.0, 31.0, 49.0, 55.0, 68.0, 98.0, 120.0, 205.0, 316.0, 571.0, 1241.0, 3950.0, 23176.0, 252985.0, 666884.0, 84373.0, 9871.0, 2315.0, 850.0, 372.0, 243.0, 177.0, 110.0, 87.0, 58.0, 37.0, 41.0, 30.0, 27.0, 21.0, 19.0, 8.0, 10.0, 13.0, 9.0, 2.0, 6.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5078125, -5.325927734375, -5.14404296875, -4.962158203125, -4.7802734375, -4.598388671875, -4.41650390625, -4.234619140625, -4.052734375, -3.870849609375, -3.68896484375, -3.507080078125, -3.3251953125, -3.143310546875, -2.96142578125, -2.779541015625, -2.59765625, -2.415771484375, -2.23388671875, -2.052001953125, -1.8701171875, -1.688232421875, -1.50634765625, -1.324462890625, -1.142578125, -0.960693359375, -0.77880859375, -0.596923828125, -0.4150390625, -0.233154296875, -0.05126953125, 0.130615234375, 0.3125, 0.494384765625, 0.67626953125, 0.858154296875, 1.0400390625, 1.221923828125, 1.40380859375, 1.585693359375, 1.767578125, 1.949462890625, 2.13134765625, 2.313232421875, 2.4951171875, 2.677001953125, 2.85888671875, 3.040771484375, 3.22265625, 3.404541015625, 3.58642578125, 3.768310546875, 3.9501953125, 4.132080078125, 4.31396484375, 4.495849609375, 4.677734375, 4.859619140625, 5.04150390625, 5.223388671875, 5.4052734375, 5.587158203125, 5.76904296875, 5.950927734375, 6.1328125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 4.0, 5.0, 10.0, 13.0, 9.0, 7.0, 14.0, 18.0, 19.0, 29.0, 28.0, 24.0, 43.0, 43.0, 59.0, 42.0, 38.0, 69.0, 213.0, 1948.0, 45.0, 51.0, 38.0, 38.0, 48.0, 35.0, 34.0, 34.0, 27.0, 23.0, 12.0, 6.0, 5.0, 10.0, 2.0, 5.0, 4.0, 1.0, 5.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.140625, -28.835205078125, -27.52978515625, -26.224365234375, -24.9189453125, -23.613525390625, -22.30810546875, -21.002685546875, -19.697265625, -18.391845703125, -17.08642578125, -15.781005859375, -14.4755859375, -13.170166015625, -11.86474609375, -10.559326171875, -9.25390625, -7.948486328125, -6.64306640625, -5.337646484375, -4.0322265625, -2.726806640625, -1.42138671875, -0.115966796875, 1.189453125, 2.494873046875, 3.80029296875, 5.105712890625, 6.4111328125, 7.716552734375, 9.02197265625, 10.327392578125, 11.6328125, 12.938232421875, 14.24365234375, 15.549072265625, 16.8544921875, 18.159912109375, 19.46533203125, 20.770751953125, 22.076171875, 23.381591796875, 24.68701171875, 25.992431640625, 27.2978515625, 28.603271484375, 29.90869140625, 31.214111328125, 32.51953125, 33.824951171875, 35.13037109375, 36.435791015625, 37.7412109375, 39.046630859375, 40.35205078125, 41.657470703125, 42.962890625, 44.268310546875, 45.57373046875, 46.879150390625, 48.1845703125, 49.489990234375, 50.79541015625, 52.100830078125, 53.40625]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 4.0, 5.0, 8.0, 9.0, 16.0, 15.0, 12.0, 22.0, 31.0, 49.0, 88.0, 149.0, 245.0, 459.0, 996.0, 2358.0, 7108.0, 39681.0, 398712.0, 2615578.0, 64795.0, 10202.0, 2801.0, 1093.0, 561.0, 281.0, 153.0, 86.0, 60.0, 37.0, 30.0, 13.0, 16.0, 7.0, 6.0, 9.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.18359375, -4.04913330078125, -3.9146728515625, -3.78021240234375, -3.645751953125, -3.51129150390625, -3.3768310546875, -3.24237060546875, -3.10791015625, -2.97344970703125, -2.8389892578125, -2.70452880859375, -2.570068359375, -2.43560791015625, -2.3011474609375, -2.16668701171875, -2.0322265625, -1.89776611328125, -1.7633056640625, -1.62884521484375, -1.494384765625, -1.35992431640625, -1.2254638671875, -1.09100341796875, -0.95654296875, -0.82208251953125, -0.6876220703125, -0.55316162109375, -0.418701171875, -0.28424072265625, -0.1497802734375, -0.01531982421875, 0.119140625, 0.25360107421875, 0.3880615234375, 0.52252197265625, 0.656982421875, 0.79144287109375, 0.9259033203125, 1.06036376953125, 1.19482421875, 1.32928466796875, 1.4637451171875, 1.59820556640625, 1.732666015625, 1.86712646484375, 2.0015869140625, 2.13604736328125, 2.2705078125, 2.40496826171875, 2.5394287109375, 2.67388916015625, 2.808349609375, 2.94281005859375, 3.0772705078125, 3.21173095703125, 3.34619140625, 3.48065185546875, 3.6151123046875, 3.74957275390625, 3.884033203125, 4.01849365234375, 4.1529541015625, 4.28741455078125, 4.421875]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 4.0, 22.0, 35.0, 101.0, 165.0, 237.0, 203.0, 102.0, 51.0, 13.0, 25.0, 4.0, 5.0, 5.0, 2.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-77.57614135742188, -74.96520233154297, -72.35425567626953, -69.74331665039062, -67.13237762451172, -64.52143859863281, -61.910491943359375, -59.29955291748047, -56.68861389160156, -54.07767105102539, -51.466732025146484, -48.85578918457031, -46.244850158691406, -43.633907318115234, -41.02296447753906, -38.412025451660156, -35.801082611083984, -33.19013977050781, -30.579200744628906, -27.968257904052734, -25.357318878173828, -22.746376037597656, -20.135435104370117, -17.524494171142578, -14.913553237915039, -12.3026123046875, -9.691671371459961, -7.0807294845581055, -4.469788551330566, -1.8588476181030273, 0.7520942687988281, 3.363035202026367, 5.973976135253906, 8.584917068481445, 11.195858001708984, 13.80679988861084, 16.417739868164062, 19.028682708740234, 21.639623641967773, 24.250564575195312, 26.86150550842285, 29.47244644165039, 32.08338928222656, 34.69432830810547, 37.30527114868164, 39.91621017456055, 42.52715301513672, 45.138092041015625, 47.7490348815918, 50.35997772216797, 52.970916748046875, 55.58185958862305, 58.19279861450195, 60.803741455078125, 63.41468048095703, 66.02561950683594, 68.63656616210938, 71.24750518798828, 73.85845184326172, 76.46939086914062, 79.08032989501953, 81.69126892089844, 84.30221557617188, 86.91315460205078, 89.52409362792969]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 10.0, 7.0, 6.0, 11.0, 9.0, 19.0, 18.0, 17.0, 22.0, 20.0, 19.0, 32.0, 43.0, 24.0, 51.0, 39.0, 49.0, 59.0, 52.0, 51.0, 52.0, 49.0, 48.0, 43.0, 40.0, 42.0, 22.0, 22.0, 30.0, 22.0, 14.0, 16.0, 10.0, 12.0, 7.0, 7.0, 4.0, 6.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-65.85429382324219, -64.00669860839844, -62.15910339355469, -60.31150817871094, -58.46390914916992, -56.61631393432617, -54.76871871948242, -52.92112350463867, -51.073524475097656, -49.225929260253906, -47.378334045410156, -45.530738830566406, -43.68313980102539, -41.83554458618164, -39.98794937133789, -38.14035415649414, -36.29275894165039, -34.44516372680664, -32.59756851196289, -30.749971389770508, -28.902374267578125, -27.054779052734375, -25.207183837890625, -23.359588623046875, -21.511991500854492, -19.664396286010742, -17.81679916381836, -15.96920394897461, -14.121607780456543, -12.274011611938477, -10.426416397094727, -8.57882022857666, -6.731227874755859, -4.883631706237793, -3.0360360145568848, -1.1884403228759766, 0.6591558456420898, 2.5067520141601562, 4.354347229003906, 6.201943397521973, 8.049539566040039, 9.897135734558105, 11.744731903076172, 13.592327117919922, 15.439923286437988, 17.287519454956055, 19.135114669799805, 20.982711791992188, 22.830307006835938, 24.677902221679688, 26.52549934387207, 28.37309455871582, 30.220691680908203, 32.06828689575195, 33.9158821105957, 35.76347732543945, 37.61107635498047, 39.45867156982422, 41.30626678466797, 43.15386199951172, 45.001461029052734, 46.849056243896484, 48.696651458740234, 50.544246673583984, 52.391841888427734]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 1.0, 3.0, 8.0, 12.0, 11.0, 10.0, 14.0, 12.0, 23.0, 23.0, 30.0, 42.0, 47.0, 67.0, 114.0, 191.0, 370.0, 826.0, 2074.0, 6655.0, 1016666.0, 14385.0, 4121.0, 1483.0, 587.0, 271.0, 142.0, 75.0, 62.0, 44.0, 27.0, 26.0, 19.0, 26.0, 16.0, 12.0, 11.0, 8.0, 7.0, 8.0, 9.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.988386154174805, -18.409578323364258, -17.830772399902344, -17.251964569091797, -16.67315673828125, -16.094348907470703, -15.515542984008789, -14.936735153198242, -14.357927322387695, -13.779120445251465, -13.200312614440918, -12.621505737304688, -12.04269790649414, -11.46389102935791, -10.88508415222168, -10.306276321411133, -9.727469444274902, -9.148662567138672, -8.569854736328125, -7.9910478591918945, -7.412240028381348, -6.833433151245117, -6.2546257972717285, -5.67581844329834, -5.097011089324951, -4.5182037353515625, -3.939396381378174, -3.3605892658233643, -2.7817819118499756, -2.202974557876587, -1.6241674423217773, -1.0453600883483887, -0.466552734375, 0.1122545599937439, 0.6910618543624878, 1.269869089126587, 1.8486764430999756, 2.4274837970733643, 3.006290912628174, 3.5850982666015625, 4.163905620574951, 4.74271297454834, 5.3215203285217285, 5.900327682495117, 6.479134559631348, 7.0579423904418945, 7.636749267578125, 8.215557098388672, 8.794363975524902, 9.373170852661133, 9.95197868347168, 10.53078556060791, 11.109593391418457, 11.688400268554688, 12.267208099365234, 12.846014976501465, 13.424821853637695, 14.003628730773926, 14.582436561584473, 15.161243438720703, 15.74005126953125, 16.318859100341797, 16.89766502380371, 17.476472854614258, 18.055280685424805]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 10.0, 87.0, 51461816.0, 1197.0, 19.0, 8.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1335.000244140625, -1276.30078125, -1217.6014404296875, -1158.9019775390625, -1100.20263671875, -1041.503173828125, -982.8037719726562, -924.1043701171875, -865.4049072265625, -806.7055053710938, -748.006103515625, -689.306640625, -630.6072387695312, -571.9078369140625, -513.2084350585938, -454.5090026855469, -395.80963134765625, -337.1102294921875, -278.4107971191406, -219.71139526367188, -161.01197814941406, -102.31256103515625, -43.6131591796875, 15.086273193359375, 73.78567504882812, 132.48509216308594, 191.18450927734375, 249.8839111328125, 308.58331298828125, 367.2827453613281, 425.9821472167969, 484.68157958984375, 543.3809814453125, 602.0803833007812, 660.77978515625, 719.479248046875, 778.1786499023438, 836.8780517578125, 895.5774536132812, 954.27685546875, 1012.976318359375, 1071.67578125, 1130.3751220703125, 1189.0745849609375, 1247.77392578125, 1306.473388671875, 1365.1728515625, 1423.8721923828125, 1482.571533203125, 1541.27099609375, 1599.9703369140625, 1658.6697998046875, 1717.369140625, 1776.068603515625, 1834.76806640625, 1893.4674072265625, 1952.1668701171875, 2010.8663330078125, 2069.565673828125, 2128.26513671875, 2186.964599609375, 2245.6640625, 2304.36328125, 2363.062744140625, 2421.76220703125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 10.0, 11.0, 10.0, 24.0, 43.0, 47.0, 84.0, 125.0, 177.0, 298.0, 449.0, 815.0, 1377.0, 2332.0, 4187.0, 7696.0, 14654.0, 28518.0, 59813.0, 131520.0, 310315.0, 1021609.0, 3542184.0, 706612.0, 248623.0, 108088.0, 50265.0, 24216.0, 12263.0, 6542.0, 3581.0, 1963.0, 1145.0, 712.0, 435.0, 253.0, 157.0, 96.0, 65.0, 42.0, 25.0, 23.0, 10.0, 11.0, 8.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.87109375, -4.72515869140625, -4.5792236328125, -4.43328857421875, -4.287353515625, -4.14141845703125, -3.9954833984375, -3.84954833984375, -3.70361328125, -3.55767822265625, -3.4117431640625, -3.26580810546875, -3.119873046875, -2.97393798828125, -2.8280029296875, -2.68206787109375, -2.5361328125, -2.39019775390625, -2.2442626953125, -2.09832763671875, -1.952392578125, -1.80645751953125, -1.6605224609375, -1.51458740234375, -1.36865234375, -1.22271728515625, -1.0767822265625, -0.93084716796875, -0.784912109375, -0.63897705078125, -0.4930419921875, -0.34710693359375, -0.201171875, -0.05523681640625, 0.0906982421875, 0.23663330078125, 0.382568359375, 0.52850341796875, 0.6744384765625, 0.82037353515625, 0.96630859375, 1.11224365234375, 1.2581787109375, 1.40411376953125, 1.550048828125, 1.69598388671875, 1.8419189453125, 1.98785400390625, 2.1337890625, 2.27972412109375, 2.4256591796875, 2.57159423828125, 2.717529296875, 2.86346435546875, 3.0093994140625, 3.15533447265625, 3.30126953125, 3.44720458984375, 3.5931396484375, 3.73907470703125, 3.885009765625, 4.03094482421875, 4.1768798828125, 4.32281494140625, 4.46875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 6.0, 12.0, 5.0, 14.0, 17.0, 9.0, 16.0, 31.0, 30.0, 34.0, 36.0, 37.0, 35.0, 42.0, 40.0, 79.0, 280.0, 487.0, 274.0, 102.0, 48.0, 44.0, 46.0, 45.0, 26.0, 29.0, 25.0, 30.0, 23.0, 22.0, 23.0, 16.0, 11.0, 9.0, 8.0, 10.0, 5.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.33984375, -6.10955810546875, -5.8792724609375, -5.64898681640625, -5.418701171875, -5.18841552734375, -4.9581298828125, -4.72784423828125, -4.49755859375, -4.26727294921875, -4.0369873046875, -3.80670166015625, -3.576416015625, -3.34613037109375, -3.1158447265625, -2.88555908203125, -2.6552734375, -2.42498779296875, -2.1947021484375, -1.96441650390625, -1.734130859375, -1.50384521484375, -1.2735595703125, -1.04327392578125, -0.81298828125, -0.58270263671875, -0.3524169921875, -0.12213134765625, 0.108154296875, 0.33843994140625, 0.5687255859375, 0.79901123046875, 1.029296875, 1.25958251953125, 1.4898681640625, 1.72015380859375, 1.950439453125, 2.18072509765625, 2.4110107421875, 2.64129638671875, 2.87158203125, 3.10186767578125, 3.3321533203125, 3.56243896484375, 3.792724609375, 4.02301025390625, 4.2532958984375, 4.48358154296875, 4.7138671875, 4.94415283203125, 5.1744384765625, 5.40472412109375, 5.635009765625, 5.86529541015625, 6.0955810546875, 6.32586669921875, 6.55615234375, 6.78643798828125, 7.0167236328125, 7.24700927734375, 7.477294921875, 7.70758056640625, 7.9378662109375, 8.16815185546875, 8.3984375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 8.0, 16.0, 21.0, 20.0, 43.0, 51.0, 92.0, 158.0, 223.0, 331.0, 454.0, 654.0, 978.0, 1440.0, 2154.0, 3228.0, 4785.0, 7104.0, 11025.0, 16581.0, 25305.0, 38813.0, 59218.0, 90009.0, 134882.0, 202849.0, 301098.0, 566323.0, 2260727.0, 1370734.0, 418436.0, 258387.0, 174413.0, 116574.0, 76945.0, 50599.0, 33117.0, 21623.0, 13806.0, 9409.0, 6063.0, 4143.0, 2809.0, 1928.0, 1237.0, 895.0, 563.0, 396.0, 265.0, 178.0, 117.0, 79.0, 48.0, 31.0, 23.0, 14.0, 7.0, 7.0, 3.0, 2.0, 5.0], "bins": [-1.7314453125, -1.6770172119140625, -1.622589111328125, -1.5681610107421875, -1.51373291015625, -1.4593048095703125, -1.404876708984375, -1.3504486083984375, -1.2960205078125, -1.2415924072265625, -1.187164306640625, -1.1327362060546875, -1.07830810546875, -1.0238800048828125, -0.969451904296875, -0.9150238037109375, -0.860595703125, -0.8061676025390625, -0.751739501953125, -0.6973114013671875, -0.64288330078125, -0.5884552001953125, -0.534027099609375, -0.4795989990234375, -0.4251708984375, -0.3707427978515625, -0.316314697265625, -0.2618865966796875, -0.20745849609375, -0.1530303955078125, -0.098602294921875, -0.0441741943359375, 0.01025390625, 0.0646820068359375, 0.119110107421875, 0.1735382080078125, 0.22796630859375, 0.2823944091796875, 0.336822509765625, 0.3912506103515625, 0.4456787109375, 0.5001068115234375, 0.554534912109375, 0.6089630126953125, 0.66339111328125, 0.7178192138671875, 0.772247314453125, 0.8266754150390625, 0.881103515625, 0.9355316162109375, 0.989959716796875, 1.0443878173828125, 1.09881591796875, 1.1532440185546875, 1.207672119140625, 1.2621002197265625, 1.3165283203125, 1.3709564208984375, 1.425384521484375, 1.4798126220703125, 1.53424072265625, 1.5886688232421875, 1.643096923828125, 1.6975250244140625, 1.751953125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 4.0, 10.0, 8.0, 9.0, 9.0, 6.0, 15.0, 17.0, 16.0, 28.0, 14.0, 23.0, 27.0, 26.0, 24.0, 35.0, 38.0, 48.0, 45.0, 97.0, 246.0, 433.0, 310.0, 112.0, 61.0, 34.0, 35.0, 31.0, 34.0, 47.0, 20.0, 24.0, 19.0, 22.0, 11.0, 16.0, 14.0, 11.0, 8.0, 10.0, 11.0, 6.0, 4.0, 3.0, 5.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-9.8515625, -9.55859375, -9.265625, -8.97265625, -8.6796875, -8.38671875, -8.09375, -7.80078125, -7.5078125, -7.21484375, -6.921875, -6.62890625, -6.3359375, -6.04296875, -5.75, -5.45703125, -5.1640625, -4.87109375, -4.578125, -4.28515625, -3.9921875, -3.69921875, -3.40625, -3.11328125, -2.8203125, -2.52734375, -2.234375, -1.94140625, -1.6484375, -1.35546875, -1.0625, -0.76953125, -0.4765625, -0.18359375, 0.109375, 0.40234375, 0.6953125, 0.98828125, 1.28125, 1.57421875, 1.8671875, 2.16015625, 2.453125, 2.74609375, 3.0390625, 3.33203125, 3.625, 3.91796875, 4.2109375, 4.50390625, 4.796875, 5.08984375, 5.3828125, 5.67578125, 5.96875, 6.26171875, 6.5546875, 6.84765625, 7.140625, 7.43359375, 7.7265625, 8.01953125, 8.3125, 8.60546875, 8.8984375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 7.0, 6.0, 1.0, 5.0, 10.0, 17.0, 13.0, 23.0, 40.0, 43.0, 66.0, 71.0, 113.0, 148.0, 247.0, 349.0, 486.0, 775.0, 1119.0, 1715.0, 2859.0, 4711.0, 11190.0, 38291.0, 171082.0, 5878814.0, 127870.0, 30051.0, 9683.0, 4226.0, 2419.0, 1593.0, 1058.0, 723.0, 503.0, 349.0, 231.0, 178.0, 95.0, 77.0, 36.0, 28.0, 37.0, 27.0, 11.0, 10.0, 8.0, 7.0, 3.0, 4.0, 7.0, 2.0, 5.0, 1.0, 1.0, 2.0], "bins": [-18.890625, -18.3251953125, -17.759765625, -17.1943359375, -16.62890625, -16.0634765625, -15.498046875, -14.9326171875, -14.3671875, -13.8017578125, -13.236328125, -12.6708984375, -12.10546875, -11.5400390625, -10.974609375, -10.4091796875, -9.84375, -9.2783203125, -8.712890625, -8.1474609375, -7.58203125, -7.0166015625, -6.451171875, -5.8857421875, -5.3203125, -4.7548828125, -4.189453125, -3.6240234375, -3.05859375, -2.4931640625, -1.927734375, -1.3623046875, -0.796875, -0.2314453125, 0.333984375, 0.8994140625, 1.46484375, 2.0302734375, 2.595703125, 3.1611328125, 3.7265625, 4.2919921875, 4.857421875, 5.4228515625, 5.98828125, 6.5537109375, 7.119140625, 7.6845703125, 8.25, 8.8154296875, 9.380859375, 9.9462890625, 10.51171875, 11.0771484375, 11.642578125, 12.2080078125, 12.7734375, 13.3388671875, 13.904296875, 14.4697265625, 15.03515625, 15.6005859375, 16.166015625, 16.7314453125, 17.296875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 3.0, 4.0, 7.0, 6.0, 11.0, 14.0, 12.0, 11.0, 17.0, 15.0, 28.0, 19.0, 34.0, 23.0, 37.0, 27.0, 36.0, 42.0, 34.0, 73.0, 219.0, 631.0, 236.0, 71.0, 38.0, 44.0, 29.0, 40.0, 27.0, 26.0, 29.0, 24.0, 34.0, 23.0, 13.0, 15.0, 17.0, 9.0, 7.0, 9.0, 3.0, 10.0, 6.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.453125, -16.8818359375, -16.310546875, -15.7392578125, -15.16796875, -14.5966796875, -14.025390625, -13.4541015625, -12.8828125, -12.3115234375, -11.740234375, -11.1689453125, -10.59765625, -10.0263671875, -9.455078125, -8.8837890625, -8.3125, -7.7412109375, -7.169921875, -6.5986328125, -6.02734375, -5.4560546875, -4.884765625, -4.3134765625, -3.7421875, -3.1708984375, -2.599609375, -2.0283203125, -1.45703125, -0.8857421875, -0.314453125, 0.2568359375, 0.828125, 1.3994140625, 1.970703125, 2.5419921875, 3.11328125, 3.6845703125, 4.255859375, 4.8271484375, 5.3984375, 5.9697265625, 6.541015625, 7.1123046875, 7.68359375, 8.2548828125, 8.826171875, 9.3974609375, 9.96875, 10.5400390625, 11.111328125, 11.6826171875, 12.25390625, 12.8251953125, 13.396484375, 13.9677734375, 14.5390625, 15.1103515625, 15.681640625, 16.2529296875, 16.82421875, 17.3955078125, 17.966796875, 18.5380859375, 19.109375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 9.0, 11.0, 28.0, 291.0, 585.0, 43.0, 9.0, 6.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-258.67364501953125, -251.8963623046875, -245.11907958984375, -238.341796875, -231.5644989013672, -224.78721618652344, -218.0099334716797, -211.23265075683594, -204.4553680419922, -197.67808532714844, -190.9008026123047, -184.12350463867188, -177.34622192382812, -170.56893920898438, -163.79165649414062, -157.01437377929688, -150.23709106445312, -143.45980834960938, -136.68252563476562, -129.90524291992188, -123.1279525756836, -116.35066223144531, -109.57337951660156, -102.79609680175781, -96.018798828125, -89.24151611328125, -82.46422576904297, -75.68694305419922, -68.90966033935547, -62.13237380981445, -55.35508728027344, -48.57780456542969, -41.80052185058594, -35.02323532104492, -28.245952606201172, -21.468666076660156, -14.691381454467773, -7.914096832275391, -1.136810302734375, 5.640472412109375, 12.41775894165039, 19.195043563842773, 25.972328186035156, 32.74961471557617, 39.52690124511719, 46.30418395996094, 53.08147048950195, 59.8587532043457, 66.63603973388672, 73.41332244873047, 80.19061279296875, 86.9678955078125, 93.74517822265625, 100.5224609375, 107.29975128173828, 114.07703399658203, 120.85432434082031, 127.63160705566406, 134.4088897705078, 141.18618774414062, 147.96347045898438, 154.74075317382812, 161.51803588867188, 168.29531860351562, 175.07260131835938]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 0.0, 5.0, 3.0, 5.0, 8.0, 6.0, 17.0, 17.0, 21.0, 42.0, 123.0, 290.0, 232.0, 101.0, 32.0, 25.0, 15.0, 5.0, 10.0, 8.0, 10.0, 4.0, 1.0, 3.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-148.1147918701172, -144.09844970703125, -140.08209228515625, -136.0657501220703, -132.04940795898438, -128.03306579589844, -124.01671600341797, -120.0003662109375, -115.98402404785156, -111.96768188476562, -107.95133209228516, -103.93498229980469, -99.91864013671875, -95.90229797363281, -91.88594818115234, -87.86959838867188, -83.85325622558594, -79.8369140625, -75.82056427001953, -71.80421447753906, -67.78787231445312, -63.77152633666992, -59.75518035888672, -55.738834381103516, -51.72248840332031, -47.70614242553711, -43.689796447753906, -39.6734504699707, -35.6571044921875, -31.640758514404297, -27.624412536621094, -23.60806655883789, -19.591705322265625, -15.575359344482422, -11.559013366699219, -7.542667388916016, -3.5263214111328125, 0.4900245666503906, 4.506370544433594, 8.522716522216797, 12.5390625, 16.555408477783203, 20.571754455566406, 24.58810043334961, 28.604446411132812, 32.620792388916016, 36.63713836669922, 40.65348434448242, 44.669830322265625, 48.68617630004883, 52.70252227783203, 56.718868255615234, 60.73521423339844, 64.75155639648438, 68.76790618896484, 72.78425598144531, 76.80059814453125, 80.81694030761719, 84.83329010009766, 88.84963989257812, 92.86598205566406, 96.88232421875, 100.89867401123047, 104.91502380371094, 108.93136596679688]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 12.0, 9.0, 16.0, 24.0, 49.0, 71.0, 102.0, 219.0, 393.0, 947.0, 2457.0, 7724.0, 79848.0, 4079062.0, 16416.0, 3991.0, 1553.0, 633.0, 376.0, 165.0, 97.0, 36.0, 30.0, 18.0, 12.0, 11.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5166015625, -1.4735260009765625, -1.430450439453125, -1.3873748779296875, -1.34429931640625, -1.3012237548828125, -1.258148193359375, -1.2150726318359375, -1.1719970703125, -1.1289215087890625, -1.085845947265625, -1.0427703857421875, -0.99969482421875, -0.9566192626953125, -0.913543701171875, -0.8704681396484375, -0.827392578125, -0.7843170166015625, -0.741241455078125, -0.6981658935546875, -0.65509033203125, -0.6120147705078125, -0.568939208984375, -0.5258636474609375, -0.4827880859375, -0.4397125244140625, -0.396636962890625, -0.3535614013671875, -0.31048583984375, -0.2674102783203125, -0.224334716796875, -0.1812591552734375, -0.13818359375, -0.0951080322265625, -0.052032470703125, -0.0089569091796875, 0.03411865234375, 0.0771942138671875, 0.120269775390625, 0.1633453369140625, 0.2064208984375, 0.2494964599609375, 0.292572021484375, 0.3356475830078125, 0.37872314453125, 0.4217987060546875, 0.464874267578125, 0.5079498291015625, 0.551025390625, 0.5941009521484375, 0.637176513671875, 0.6802520751953125, 0.72332763671875, 0.7664031982421875, 0.809478759765625, 0.8525543212890625, 0.8956298828125, 0.9387054443359375, 0.981781005859375, 1.0248565673828125, 1.06793212890625, 1.1110076904296875, 1.154083251953125, 1.1971588134765625, 1.240234375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 2.0, 4.0, 8.0, 8.0, 5.0, 5.0, 4.0, 12.0, 3.0, 8.0, 18.0, 14.0, 19.0, 750.0, 28.0, 18.0, 13.0, 7.0, 9.0, 7.0, 3.0, 8.0, 11.0, 7.0, 4.0, 2.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2491455078125, -0.2404499053955078, -0.23175430297851562, -0.22305870056152344, -0.21436309814453125, -0.20566749572753906, -0.19697189331054688, -0.1882762908935547, -0.1795806884765625, -0.1708850860595703, -0.16218948364257812, -0.15349388122558594, -0.14479827880859375, -0.13610267639160156, -0.12740707397460938, -0.11871147155761719, -0.110015869140625, -0.10132026672363281, -0.09262466430664062, -0.08392906188964844, -0.07523345947265625, -0.06653785705566406, -0.057842254638671875, -0.04914665222167969, -0.0404510498046875, -0.03175544738769531, -0.023059844970703125, -0.014364242553710938, -0.00566864013671875, 0.0030269622802734375, 0.011722564697265625, 0.020418167114257812, 0.02911376953125, 0.03780937194824219, 0.046504974365234375, 0.05520057678222656, 0.06389617919921875, 0.07259178161621094, 0.08128738403320312, 0.08998298645019531, 0.0986785888671875, 0.10737419128417969, 0.11606979370117188, 0.12476539611816406, 0.13346099853515625, 0.14215660095214844, 0.15085220336914062, 0.1595478057861328, 0.168243408203125, 0.1769390106201172, 0.18563461303710938, 0.19433021545410156, 0.20302581787109375, 0.21172142028808594, 0.22041702270507812, 0.2291126251220703, 0.2378082275390625, 0.2465038299560547, 0.2551994323730469, 0.26389503479003906, 0.27259063720703125, 0.28128623962402344, 0.2899818420410156, 0.2986774444580078, 0.307373046875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 5.0, 9.0, 11.0, 17.0, 25.0, 24.0, 56.0, 100.0, 221.0, 432.0, 1110.0, 3044.0, 10591.0, 61708.0, 3844999.0, 243853.0, 21365.0, 4485.0, 1263.0, 524.0, 213.0, 97.0, 58.0, 30.0, 16.0, 7.0, 6.0, 4.0, 1.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8505859375, -1.801544189453125, -1.75250244140625, -1.703460693359375, -1.6544189453125, -1.605377197265625, -1.55633544921875, -1.507293701171875, -1.458251953125, -1.409210205078125, -1.36016845703125, -1.311126708984375, -1.2620849609375, -1.213043212890625, -1.16400146484375, -1.114959716796875, -1.06591796875, -1.016876220703125, -0.96783447265625, -0.918792724609375, -0.8697509765625, -0.820709228515625, -0.77166748046875, -0.722625732421875, -0.673583984375, -0.624542236328125, -0.57550048828125, -0.526458740234375, -0.4774169921875, -0.428375244140625, -0.37933349609375, -0.330291748046875, -0.28125, -0.232208251953125, -0.18316650390625, -0.134124755859375, -0.0850830078125, -0.036041259765625, 0.01300048828125, 0.062042236328125, 0.111083984375, 0.160125732421875, 0.20916748046875, 0.258209228515625, 0.3072509765625, 0.356292724609375, 0.40533447265625, 0.454376220703125, 0.50341796875, 0.552459716796875, 0.60150146484375, 0.650543212890625, 0.6995849609375, 0.748626708984375, 0.79766845703125, 0.846710205078125, 0.895751953125, 0.944793701171875, 0.99383544921875, 1.042877197265625, 1.0919189453125, 1.140960693359375, 1.19000244140625, 1.239044189453125, 1.2880859375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 7.0, 4.0, 12.0, 16.0, 19.0, 28.0, 33.0, 34.0, 41.0, 54.0, 110.0, 203.0, 630.0, 1726.0, 568.0, 203.0, 111.0, 76.0, 43.0, 28.0, 36.0, 15.0, 16.0, 13.0, 9.0, 4.0, 5.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3544921875, -0.34549903869628906, -0.3365058898925781, -0.3275127410888672, -0.31851959228515625, -0.3095264434814453, -0.3005332946777344, -0.29154014587402344, -0.2825469970703125, -0.27355384826660156, -0.2645606994628906, -0.2555675506591797, -0.24657440185546875, -0.2375812530517578, -0.22858810424804688, -0.21959495544433594, -0.210601806640625, -0.20160865783691406, -0.19261550903320312, -0.1836223602294922, -0.17462921142578125, -0.1656360626220703, -0.15664291381835938, -0.14764976501464844, -0.1386566162109375, -0.12966346740722656, -0.12067031860351562, -0.11167716979980469, -0.10268402099609375, -0.09369087219238281, -0.08469772338867188, -0.07570457458496094, -0.06671142578125, -0.05771827697753906, -0.048725128173828125, -0.03973197937011719, -0.03073883056640625, -0.021745681762695312, -0.012752532958984375, -0.0037593841552734375, 0.0052337646484375, 0.014226913452148438, 0.023220062255859375, 0.03221321105957031, 0.04120635986328125, 0.05019950866699219, 0.059192657470703125, 0.06818580627441406, 0.077178955078125, 0.08617210388183594, 0.09516525268554688, 0.10415840148925781, 0.11315155029296875, 0.12214469909667969, 0.13113784790039062, 0.14013099670410156, 0.1491241455078125, 0.15811729431152344, 0.16711044311523438, 0.1761035919189453, 0.18509674072265625, 0.1940898895263672, 0.20308303833007812, 0.21207618713378906, 0.2210693359375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 8.0, 11.0, 32.0, 76.0, 180.0, 256.0, 215.0, 108.0, 60.0, 28.0, 11.0, 3.0, 6.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.00081205368042, -1.925870418548584, -1.850928783416748, -1.7759872674942017, -1.7010456323623657, -1.6261039972305298, -1.5511624813079834, -1.4762208461761475, -1.4012792110443115, -1.3263375759124756, -1.2513959407806396, -1.1764544248580933, -1.1015127897262573, -1.0265711545944214, -0.9516295790672302, -0.8766880035400391, -0.8017463684082031, -0.7268047332763672, -0.651863157749176, -0.5769215822219849, -0.5019799470901489, -0.4270383417606354, -0.3520967364311218, -0.27715516090393066, -0.20221352577209473, -0.12727192044258118, -0.05233031511306763, 0.022611290216445923, 0.09755289554595947, 0.17249450087547302, 0.24743610620498657, 0.32237768173217773, 0.39731931686401367, 0.4722609221935272, 0.5472025275230408, 0.6221441030502319, 0.6970857381820679, 0.7720273733139038, 0.846968948841095, 0.9219105243682861, 0.9968521595001221, 1.071793794631958, 1.146735429763794, 1.2216769456863403, 1.2966185808181763, 1.3715602159500122, 1.4465017318725586, 1.5214433670043945, 1.5963850021362305, 1.6713266372680664, 1.7462682723999023, 1.8212097883224487, 1.8961514234542847, 1.9710930585861206, 2.046034574508667, 2.120976209640503, 2.195917844772339, 2.270859479904175, 2.3458011150360107, 2.4207427501678467, 2.4956841468811035, 2.5706257820129395, 2.6455674171447754, 2.7205090522766113, 2.7954506874084473]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 6.0, 11.0, 18.0, 19.0, 28.0, 40.0, 67.0, 76.0, 78.0, 82.0, 85.0, 84.0, 93.0, 80.0, 63.0, 53.0, 36.0, 26.0, 14.0, 15.0, 10.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.716309905052185, -1.6665451526641846, -1.616780400276184, -1.5670156478881836, -1.5172507762908936, -1.467486023902893, -1.4177212715148926, -1.367956519126892, -1.3181917667388916, -1.2684270143508911, -1.2186622619628906, -1.1688973903656006, -1.1191326379776, -1.0693678855895996, -1.0196031332015991, -0.9698383808135986, -0.9200735688209534, -0.8703088164329529, -0.8205440044403076, -0.7707792520523071, -0.7210144996643066, -0.6712497472763062, -0.6214849352836609, -0.5717201828956604, -0.5219553709030151, -0.47219058871269226, -0.4224258363246918, -0.3726610541343689, -0.3228963017463684, -0.27313151955604553, -0.22336673736572266, -0.17360198497772217, -0.12383723258972168, -0.07407246530056, -0.02430769056081772, 0.02545708417892456, 0.07522185146808624, 0.12498661875724792, 0.1747514009475708, 0.2245161533355713, 0.27428093552589417, 0.32404571771621704, 0.37381047010421753, 0.4235752522945404, 0.4733400344848633, 0.5231047868728638, 0.5728695392608643, 0.6226342916488647, 0.67239910364151, 0.7221638560295105, 0.7719286680221558, 0.8216934204101562, 0.8714581727981567, 0.9212229251861572, 0.9709877371788025, 1.0207524299621582, 1.0705173015594482, 1.1202820539474487, 1.1700468063354492, 1.2198116779327393, 1.2695764303207397, 1.3193411827087402, 1.3691059350967407, 1.4188706874847412, 1.4686354398727417]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 14.0, 4.0, 12.0, 29.0, 35.0, 50.0, 60.0, 79.0, 113.0, 169.0, 227.0, 299.0, 440.0, 590.0, 893.0, 1319.0, 1845.0, 2737.0, 3982.0, 6030.0, 9198.0, 14417.0, 22742.0, 37925.0, 822959.0, 49878.0, 25406.0, 15994.0, 10187.0, 6561.0, 4431.0, 3039.0, 2146.0, 1435.0, 976.0, 664.0, 448.0, 355.0, 270.0, 167.0, 130.0, 97.0, 53.0, 47.0, 27.0, 29.0, 15.0, 9.0, 9.0, 3.0, 6.0, 4.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.5537109375, -0.5367355346679688, -0.5197601318359375, -0.5027847290039062, -0.485809326171875, -0.46883392333984375, -0.4518585205078125, -0.43488311767578125, -0.41790771484375, -0.40093231201171875, -0.3839569091796875, -0.36698150634765625, -0.350006103515625, -0.33303070068359375, -0.3160552978515625, -0.29907989501953125, -0.2821044921875, -0.26512908935546875, -0.2481536865234375, -0.23117828369140625, -0.214202880859375, -0.19722747802734375, -0.1802520751953125, -0.16327667236328125, -0.14630126953125, -0.12932586669921875, -0.1123504638671875, -0.09537506103515625, -0.078399658203125, -0.06142425537109375, -0.0444488525390625, -0.02747344970703125, -0.010498046875, 0.00647735595703125, 0.0234527587890625, 0.04042816162109375, 0.057403564453125, 0.07437896728515625, 0.0913543701171875, 0.10832977294921875, 0.12530517578125, 0.14228057861328125, 0.1592559814453125, 0.17623138427734375, 0.193206787109375, 0.21018218994140625, 0.2271575927734375, 0.24413299560546875, 0.2611083984375, 0.27808380126953125, 0.2950592041015625, 0.31203460693359375, 0.329010009765625, 0.34598541259765625, 0.3629608154296875, 0.37993621826171875, 0.39691162109375, 0.41388702392578125, 0.4308624267578125, 0.44783782958984375, 0.464813232421875, 0.48178863525390625, 0.4987640380859375, 0.5157394409179688, 0.53271484375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 1.0, 4.0, 8.0, 8.0, 7.0, 4.0, 6.0, 6.0, 5.0, 9.0, 15.0, 11.0, 18.0, 360.0, 417.0, 19.0, 15.0, 10.0, 10.0, 7.0, 4.0, 8.0, 9.0, 7.0, 6.0, 1.0, 6.0, 4.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2469482421875, -0.2384662628173828, -0.22998428344726562, -0.22150230407714844, -0.21302032470703125, -0.20453834533691406, -0.19605636596679688, -0.1875743865966797, -0.1790924072265625, -0.1706104278564453, -0.16212844848632812, -0.15364646911621094, -0.14516448974609375, -0.13668251037597656, -0.12820053100585938, -0.11971855163574219, -0.111236572265625, -0.10275459289550781, -0.09427261352539062, -0.08579063415527344, -0.07730865478515625, -0.06882667541503906, -0.060344696044921875, -0.05186271667480469, -0.0433807373046875, -0.03489875793457031, -0.026416778564453125, -0.017934799194335938, -0.00945281982421875, -0.0009708404541015625, 0.007511138916015625, 0.015993118286132812, 0.02447509765625, 0.03295707702636719, 0.041439056396484375, 0.04992103576660156, 0.05840301513671875, 0.06688499450683594, 0.07536697387695312, 0.08384895324707031, 0.0923309326171875, 0.10081291198730469, 0.10929489135742188, 0.11777687072753906, 0.12625885009765625, 0.13474082946777344, 0.14322280883789062, 0.1517047882080078, 0.160186767578125, 0.1686687469482422, 0.17715072631835938, 0.18563270568847656, 0.19411468505859375, 0.20259666442871094, 0.21107864379882812, 0.2195606231689453, 0.2280426025390625, 0.2365245819091797, 0.24500656127929688, 0.25348854064941406, 0.26197052001953125, 0.27045249938964844, 0.2789344787597656, 0.2874164581298828, 0.2958984375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 6.0, 9.0, 12.0, 17.0, 14.0, 19.0, 28.0, 36.0, 52.0, 58.0, 98.0, 122.0, 188.0, 313.0, 511.0, 1047.0, 2475.0, 7013.0, 25563.0, 121080.0, 509790.0, 299266.0, 59060.0, 13878.0, 4222.0, 1640.0, 751.0, 446.0, 234.0, 169.0, 115.0, 68.0, 54.0, 45.0, 30.0, 18.0, 20.0, 19.0, 7.0, 9.0, 10.0, 6.0, 4.0, 5.0, 8.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8369140625, -0.810577392578125, -0.78424072265625, -0.757904052734375, -0.7315673828125, -0.705230712890625, -0.67889404296875, -0.652557373046875, -0.626220703125, -0.599884033203125, -0.57354736328125, -0.547210693359375, -0.5208740234375, -0.494537353515625, -0.46820068359375, -0.441864013671875, -0.41552734375, -0.389190673828125, -0.36285400390625, -0.336517333984375, -0.3101806640625, -0.283843994140625, -0.25750732421875, -0.231170654296875, -0.204833984375, -0.178497314453125, -0.15216064453125, -0.125823974609375, -0.0994873046875, -0.073150634765625, -0.04681396484375, -0.020477294921875, 0.005859375, 0.032196044921875, 0.05853271484375, 0.084869384765625, 0.1112060546875, 0.137542724609375, 0.16387939453125, 0.190216064453125, 0.216552734375, 0.242889404296875, 0.26922607421875, 0.295562744140625, 0.3218994140625, 0.348236083984375, 0.37457275390625, 0.400909423828125, 0.42724609375, 0.453582763671875, 0.47991943359375, 0.506256103515625, 0.5325927734375, 0.558929443359375, 0.58526611328125, 0.611602783203125, 0.637939453125, 0.664276123046875, 0.69061279296875, 0.716949462890625, 0.7432861328125, 0.769622802734375, 0.79595947265625, 0.822296142578125, 0.8486328125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 4.0, 4.0, 11.0, 11.0, 9.0, 14.0, 16.0, 22.0, 25.0, 26.0, 21.0, 30.0, 44.0, 37.0, 49.0, 44.0, 42.0, 52.0, 32.0, 43.0, 41.0, 51.0, 33.0, 34.0, 41.0, 29.0, 33.0, 27.0, 28.0, 19.0, 20.0, 21.0, 16.0, 18.0, 13.0, 9.0, 6.0, 6.0, 5.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.98193359375, -0.9507675170898438, -0.9196014404296875, -0.8884353637695312, -0.857269287109375, -0.8261032104492188, -0.7949371337890625, -0.7637710571289062, -0.73260498046875, -0.7014389038085938, -0.6702728271484375, -0.6391067504882812, -0.607940673828125, -0.5767745971679688, -0.5456085205078125, -0.5144424438476562, -0.4832763671875, -0.45211029052734375, -0.4209442138671875, -0.38977813720703125, -0.358612060546875, -0.32744598388671875, -0.2962799072265625, -0.26511383056640625, -0.23394775390625, -0.20278167724609375, -0.1716156005859375, -0.14044952392578125, -0.109283447265625, -0.07811737060546875, -0.0469512939453125, -0.01578521728515625, 0.015380859375, 0.04654693603515625, 0.0777130126953125, 0.10887908935546875, 0.140045166015625, 0.17121124267578125, 0.2023773193359375, 0.23354339599609375, 0.26470947265625, 0.29587554931640625, 0.3270416259765625, 0.35820770263671875, 0.389373779296875, 0.42053985595703125, 0.4517059326171875, 0.48287200927734375, 0.5140380859375, 0.5452041625976562, 0.5763702392578125, 0.6075363159179688, 0.638702392578125, 0.6698684692382812, 0.7010345458984375, 0.7322006225585938, 0.76336669921875, 0.7945327758789062, 0.8256988525390625, 0.8568649291992188, 0.888031005859375, 0.9191970825195312, 0.9503631591796875, 0.9815292358398438, 1.0126953125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 7.0, 8.0, 9.0, 20.0, 13.0, 21.0, 27.0, 38.0, 84.0, 167.0, 247.0, 515.0, 1071.0, 2743.0, 8807.0, 43967.0, 489382.0, 447009.0, 41344.0, 8256.0, 2668.0, 1069.0, 449.0, 264.0, 142.0, 79.0, 42.0, 33.0, 19.0, 18.0, 10.0, 5.0, 2.0, 4.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.736328125, -0.7117691040039062, -0.6872100830078125, -0.6626510620117188, -0.638092041015625, -0.6135330200195312, -0.5889739990234375, -0.5644149780273438, -0.53985595703125, -0.5152969360351562, -0.4907379150390625, -0.46617889404296875, -0.441619873046875, -0.41706085205078125, -0.3925018310546875, -0.36794281005859375, -0.3433837890625, -0.31882476806640625, -0.2942657470703125, -0.26970672607421875, -0.245147705078125, -0.22058868408203125, -0.1960296630859375, -0.17147064208984375, -0.14691162109375, -0.12235260009765625, -0.0977935791015625, -0.07323455810546875, -0.048675537109375, -0.02411651611328125, 0.0004425048828125, 0.02500152587890625, 0.049560546875, 0.07411956787109375, 0.0986785888671875, 0.12323760986328125, 0.147796630859375, 0.17235565185546875, 0.1969146728515625, 0.22147369384765625, 0.24603271484375, 0.27059173583984375, 0.2951507568359375, 0.31970977783203125, 0.344268798828125, 0.36882781982421875, 0.3933868408203125, 0.41794586181640625, 0.4425048828125, 0.46706390380859375, 0.4916229248046875, 0.5161819458007812, 0.540740966796875, 0.5652999877929688, 0.5898590087890625, 0.6144180297851562, 0.63897705078125, 0.6635360717773438, 0.6880950927734375, 0.7126541137695312, 0.737213134765625, 0.7617721557617188, 0.7863311767578125, 0.8108901977539062, 0.83544921875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 7.0, 6.0, 11.0, 23.0, 17.0, 29.0, 30.0, 44.0, 94.0, 87.0, 98.0, 102.0, 112.0, 89.0, 68.0, 51.0, 40.0, 21.0, 15.0, 14.0, 6.0, 9.0, 8.0, 5.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.289648056030273e-05, -7.070787250995636e-05, -6.851926445960999e-05, -6.633065640926361e-05, -6.414204835891724e-05, -6.195344030857086e-05, -5.976483225822449e-05, -5.757622420787811e-05, -5.538761615753174e-05, -5.3199008107185364e-05, -5.101040005683899e-05, -4.8821792006492615e-05, -4.663318395614624e-05, -4.4444575905799866e-05, -4.225596785545349e-05, -4.006735980510712e-05, -3.787875175476074e-05, -3.569014370441437e-05, -3.350153565406799e-05, -3.131292760372162e-05, -2.9124319553375244e-05, -2.693571150302887e-05, -2.4747103452682495e-05, -2.255849540233612e-05, -2.0369887351989746e-05, -1.818127930164337e-05, -1.5992671251296997e-05, -1.3804063200950623e-05, -1.1615455150604248e-05, -9.426847100257874e-06, -7.238239049911499e-06, -5.0496309995651245e-06, -2.86102294921875e-06, -6.724148988723755e-07, 1.516193151473999e-06, 3.7048012018203735e-06, 5.893409252166748e-06, 8.082017302513123e-06, 1.0270625352859497e-05, 1.2459233403205872e-05, 1.4647841453552246e-05, 1.683644950389862e-05, 1.9025057554244995e-05, 2.121366560459137e-05, 2.3402273654937744e-05, 2.559088170528412e-05, 2.7779489755630493e-05, 2.9968097805976868e-05, 3.215670585632324e-05, 3.434531390666962e-05, 3.653392195701599e-05, 3.8722530007362366e-05, 4.091113805770874e-05, 4.3099746108055115e-05, 4.528835415840149e-05, 4.7476962208747864e-05, 4.966557025909424e-05, 5.185417830944061e-05, 5.404278635978699e-05, 5.623139441013336e-05, 5.8420002460479736e-05, 6.060861051082611e-05, 6.279721856117249e-05, 6.498582661151886e-05, 6.717443466186523e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 3.0, 8.0, 4.0, 5.0, 15.0, 16.0, 13.0, 28.0, 39.0, 62.0, 105.0, 169.0, 290.0, 535.0, 1350.0, 3568.0, 13945.0, 94183.0, 703066.0, 199195.0, 23429.0, 5250.0, 1756.0, 688.0, 320.0, 200.0, 105.0, 60.0, 54.0, 32.0, 18.0, 15.0, 7.0, 4.0, 8.0, 4.0, 3.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.85498046875, -0.82879638671875, -0.8026123046875, -0.77642822265625, -0.750244140625, -0.72406005859375, -0.6978759765625, -0.67169189453125, -0.6455078125, -0.61932373046875, -0.5931396484375, -0.56695556640625, -0.540771484375, -0.51458740234375, -0.4884033203125, -0.46221923828125, -0.43603515625, -0.40985107421875, -0.3836669921875, -0.35748291015625, -0.331298828125, -0.30511474609375, -0.2789306640625, -0.25274658203125, -0.2265625, -0.20037841796875, -0.1741943359375, -0.14801025390625, -0.121826171875, -0.09564208984375, -0.0694580078125, -0.04327392578125, -0.01708984375, 0.00909423828125, 0.0352783203125, 0.06146240234375, 0.087646484375, 0.11383056640625, 0.1400146484375, 0.16619873046875, 0.1923828125, 0.21856689453125, 0.2447509765625, 0.27093505859375, 0.297119140625, 0.32330322265625, 0.3494873046875, 0.37567138671875, 0.40185546875, 0.42803955078125, 0.4542236328125, 0.48040771484375, 0.506591796875, 0.53277587890625, 0.5589599609375, 0.58514404296875, 0.611328125, 0.63751220703125, 0.6636962890625, 0.68988037109375, 0.716064453125, 0.74224853515625, 0.7684326171875, 0.79461669921875, 0.82080078125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 4.0, 2.0, 6.0, 13.0, 7.0, 11.0, 11.0, 26.0, 31.0, 44.0, 42.0, 47.0, 67.0, 71.0, 70.0, 69.0, 69.0, 74.0, 60.0, 50.0, 48.0, 38.0, 34.0, 23.0, 25.0, 18.0, 7.0, 11.0, 8.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5361328125, -0.5211143493652344, -0.5060958862304688, -0.4910774230957031, -0.4760589599609375, -0.4610404968261719, -0.44602203369140625, -0.4310035705566406, -0.415985107421875, -0.4009666442871094, -0.38594818115234375, -0.3709297180175781, -0.3559112548828125, -0.3408927917480469, -0.32587432861328125, -0.3108558654785156, -0.29583740234375, -0.2808189392089844, -0.26580047607421875, -0.2507820129394531, -0.2357635498046875, -0.22074508666992188, -0.20572662353515625, -0.19070816040039062, -0.175689697265625, -0.16067123413085938, -0.14565277099609375, -0.13063430786132812, -0.1156158447265625, -0.10059738159179688, -0.08557891845703125, -0.07056045532226562, -0.0555419921875, -0.040523529052734375, -0.02550506591796875, -0.010486602783203125, 0.0045318603515625, 0.019550323486328125, 0.03456878662109375, 0.049587249755859375, 0.064605712890625, 0.07962417602539062, 0.09464263916015625, 0.10966110229492188, 0.1246795654296875, 0.13969802856445312, 0.15471649169921875, 0.16973495483398438, 0.18475341796875, 0.19977188110351562, 0.21479034423828125, 0.22980880737304688, 0.2448272705078125, 0.2598457336425781, 0.27486419677734375, 0.2898826599121094, 0.304901123046875, 0.3199195861816406, 0.33493804931640625, 0.3499565124511719, 0.3649749755859375, 0.3799934387207031, 0.39501190185546875, 0.4100303649902344, 0.425048828125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 14.0, 78.0, 614.0, 238.0, 39.0, 14.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.327211380004883, -23.34517478942871, -22.363140106201172, -21.381103515625, -20.399066925048828, -19.41703224182129, -18.434995651245117, -17.452960968017578, -16.470924377441406, -15.48888874053955, -14.506853103637695, -13.524816513061523, -12.542780876159668, -11.560745239257812, -10.57870864868164, -9.596673011779785, -8.61463737487793, -7.632601737976074, -6.6505656242370605, -5.668529510498047, -4.686493873596191, -3.704458236694336, -2.7224221229553223, -1.7403860092163086, -0.7583503723144531, 0.22368550300598145, 1.205721378326416, 2.1877572536468506, 3.169793128967285, 4.151828765869141, 5.133864879608154, 6.115900993347168, 7.097938537597656, 8.079974174499512, 9.062009811401367, 10.044046401977539, 11.026082038879395, 12.00811767578125, 12.990154266357422, 13.972189903259277, 14.954225540161133, 15.936261177062988, 16.918296813964844, 17.900333404541016, 18.882369995117188, 19.864404678344727, 20.8464412689209, 21.828475952148438, 22.81051254272461, 23.79254913330078, 24.77458381652832, 25.756620407104492, 26.73865509033203, 27.720691680908203, 28.702728271484375, 29.684764862060547, 30.666799545288086, 31.648836135864258, 32.6308708190918, 33.61290740966797, 34.59494400024414, 35.57698059082031, 36.55901336669922, 37.54104995727539, 38.52308654785156]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 5.0, 0.0, 4.0, 5.0, 2.0, 5.0, 9.0, 7.0, 6.0, 11.0, 15.0, 29.0, 27.0, 66.0, 78.0, 127.0, 136.0, 125.0, 110.0, 64.0, 48.0, 24.0, 13.0, 14.0, 8.0, 8.0, 6.0, 7.0, 6.0, 8.0, 3.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.706003189086914, -16.194644927978516, -15.6832857131958, -15.171926498413086, -14.660568237304688, -14.149209022521973, -13.637849807739258, -13.12649154663086, -12.615132331848145, -12.10377311706543, -11.592414855957031, -11.081055641174316, -10.569696426391602, -10.058338165283203, -9.546978950500488, -9.035619735717773, -8.524261474609375, -8.01290225982666, -7.501543998718262, -6.990184783935547, -6.47882604598999, -5.967467308044434, -5.456108093261719, -4.944749355316162, -4.4333906173706055, -3.922031879425049, -3.410672903060913, -2.8993139266967773, -2.3879551887512207, -1.876596450805664, -1.3652374744415283, -0.8538784980773926, -0.34252166748046875, 0.16883718967437744, 0.6801960468292236, 1.1915549039840698, 1.702913761138916, 2.2142724990844727, 2.7256314754486084, 3.236990451812744, 3.748349189758301, 4.259707927703857, 4.771066665649414, 5.282425880432129, 5.7937846183776855, 6.305143356323242, 6.816502571105957, 7.327861309051514, 7.83922004699707, 8.350579261779785, 8.861937522888184, 9.373296737670898, 9.884654998779297, 10.396014213562012, 10.907373428344727, 11.418731689453125, 11.93009090423584, 12.441450119018555, 12.952808380126953, 13.464167594909668, 13.975526809692383, 14.486885070800781, 14.998244285583496, 15.509603500366211, 16.02096176147461]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 10.0, 8.0, 13.0, 10.0, 19.0, 27.0, 23.0, 56.0, 72.0, 128.0, 210.0, 323.0, 586.0, 1206.0, 2648.0, 6695.0, 20409.0, 250547.0, 3872040.0, 25236.0, 7618.0, 3151.0, 1515.0, 741.0, 414.0, 251.0, 128.0, 90.0, 41.0, 22.0, 17.0, 10.0, 10.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.55859375, -3.457183837890625, -3.35577392578125, -3.254364013671875, -3.1529541015625, -3.051544189453125, -2.95013427734375, -2.848724365234375, -2.747314453125, -2.645904541015625, -2.54449462890625, -2.443084716796875, -2.3416748046875, -2.240264892578125, -2.13885498046875, -2.037445068359375, -1.93603515625, -1.834625244140625, -1.73321533203125, -1.631805419921875, -1.5303955078125, -1.428985595703125, -1.32757568359375, -1.226165771484375, -1.124755859375, -1.023345947265625, -0.92193603515625, -0.820526123046875, -0.7191162109375, -0.617706298828125, -0.51629638671875, -0.414886474609375, -0.3134765625, -0.212066650390625, -0.11065673828125, -0.009246826171875, 0.0921630859375, 0.193572998046875, 0.29498291015625, 0.396392822265625, 0.497802734375, 0.599212646484375, 0.70062255859375, 0.802032470703125, 0.9034423828125, 1.004852294921875, 1.10626220703125, 1.207672119140625, 1.30908203125, 1.410491943359375, 1.51190185546875, 1.613311767578125, 1.7147216796875, 1.816131591796875, 1.91754150390625, 2.018951416015625, 2.120361328125, 2.221771240234375, 2.32318115234375, 2.424591064453125, 2.5260009765625, 2.627410888671875, 2.72882080078125, 2.830230712890625, 2.931640625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 6.0, 7.0, 5.0, 11.0, 12.0, 10.0, 15.0, 16.0, 47.0, 264.0, 391.0, 111.0, 18.0, 16.0, 12.0, 12.0, 6.0, 8.0, 11.0, 4.0, 4.0, 5.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2222900390625, -0.21440696716308594, -0.20652389526367188, -0.1986408233642578, -0.19075775146484375, -0.1828746795654297, -0.17499160766601562, -0.16710853576660156, -0.1592254638671875, -0.15134239196777344, -0.14345932006835938, -0.1355762481689453, -0.12769317626953125, -0.11981010437011719, -0.11192703247070312, -0.10404396057128906, -0.096160888671875, -0.08827781677246094, -0.08039474487304688, -0.07251167297363281, -0.06462860107421875, -0.05674552917480469, -0.048862457275390625, -0.04097938537597656, -0.0330963134765625, -0.025213241577148438, -0.017330169677734375, -0.009447097778320312, -0.00156402587890625, 0.0063190460205078125, 0.014202117919921875, 0.022085189819335938, 0.02996826171875, 0.03785133361816406, 0.045734405517578125, 0.05361747741699219, 0.06150054931640625, 0.06938362121582031, 0.07726669311523438, 0.08514976501464844, 0.0930328369140625, 0.10091590881347656, 0.10879898071289062, 0.11668205261230469, 0.12456512451171875, 0.1324481964111328, 0.14033126831054688, 0.14821434020996094, 0.156097412109375, 0.16398048400878906, 0.17186355590820312, 0.1797466278076172, 0.18762969970703125, 0.1955127716064453, 0.20339584350585938, 0.21127891540527344, 0.2191619873046875, 0.22704505920410156, 0.23492813110351562, 0.2428112030029297, 0.25069427490234375, 0.2585773468017578, 0.2664604187011719, 0.27434349060058594, 0.2822265625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 4.0, 9.0, 10.0, 13.0, 18.0, 17.0, 27.0, 45.0, 54.0, 81.0, 122.0, 210.0, 350.0, 582.0, 1071.0, 2248.0, 5551.0, 14886.0, 50656.0, 315576.0, 3622006.0, 133197.0, 30208.0, 9741.0, 3978.0, 1619.0, 794.0, 461.0, 257.0, 158.0, 96.0, 70.0, 47.0, 33.0, 18.0, 13.0, 11.0, 7.0, 9.0, 6.0, 5.0, 5.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.107421875, -2.045989990234375, -1.98455810546875, -1.923126220703125, -1.8616943359375, -1.800262451171875, -1.73883056640625, -1.677398681640625, -1.615966796875, -1.554534912109375, -1.49310302734375, -1.431671142578125, -1.3702392578125, -1.308807373046875, -1.24737548828125, -1.185943603515625, -1.12451171875, -1.063079833984375, -1.00164794921875, -0.940216064453125, -0.8787841796875, -0.817352294921875, -0.75592041015625, -0.694488525390625, -0.633056640625, -0.571624755859375, -0.51019287109375, -0.448760986328125, -0.3873291015625, -0.325897216796875, -0.26446533203125, -0.203033447265625, -0.1416015625, -0.080169677734375, -0.01873779296875, 0.042694091796875, 0.1041259765625, 0.165557861328125, 0.22698974609375, 0.288421630859375, 0.349853515625, 0.411285400390625, 0.47271728515625, 0.534149169921875, 0.5955810546875, 0.657012939453125, 0.71844482421875, 0.779876708984375, 0.84130859375, 0.902740478515625, 0.96417236328125, 1.025604248046875, 1.0870361328125, 1.148468017578125, 1.20989990234375, 1.271331787109375, 1.332763671875, 1.394195556640625, 1.45562744140625, 1.517059326171875, 1.5784912109375, 1.639923095703125, 1.70135498046875, 1.762786865234375, 1.82421875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 8.0, 5.0, 12.0, 10.0, 14.0, 25.0, 40.0, 30.0, 71.0, 94.0, 166.0, 294.0, 2073.0, 600.0, 217.0, 126.0, 96.0, 55.0, 46.0, 33.0, 17.0, 14.0, 11.0, 3.0, 4.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.275634765625, -0.2663764953613281, -0.25711822509765625, -0.24785995483398438, -0.2386016845703125, -0.22934341430664062, -0.22008514404296875, -0.21082687377929688, -0.201568603515625, -0.19231033325195312, -0.18305206298828125, -0.17379379272460938, -0.1645355224609375, -0.15527725219726562, -0.14601898193359375, -0.13676071166992188, -0.12750244140625, -0.11824417114257812, -0.10898590087890625, -0.09972763061523438, -0.0904693603515625, -0.08121109008789062, -0.07195281982421875, -0.06269454956054688, -0.053436279296875, -0.044178009033203125, -0.03491973876953125, -0.025661468505859375, -0.0164031982421875, -0.007144927978515625, 0.00211334228515625, 0.011371612548828125, 0.0206298828125, 0.029888153076171875, 0.03914642333984375, 0.048404693603515625, 0.0576629638671875, 0.06692123413085938, 0.07617950439453125, 0.08543777465820312, 0.094696044921875, 0.10395431518554688, 0.11321258544921875, 0.12247085571289062, 0.1317291259765625, 0.14098739624023438, 0.15024566650390625, 0.15950393676757812, 0.16876220703125, 0.17802047729492188, 0.18727874755859375, 0.19653701782226562, 0.2057952880859375, 0.21505355834960938, 0.22431182861328125, 0.23357009887695312, 0.242828369140625, 0.2520866394042969, 0.26134490966796875, 0.2706031799316406, 0.2798614501953125, 0.2891197204589844, 0.29837799072265625, 0.3076362609863281, 0.31689453125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 11.0, 42.0, 137.0, 303.0, 320.0, 125.0, 34.0, 13.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.385256767272949, -2.270970106124878, -2.1566836833953857, -2.0423970222473145, -1.9281104803085327, -1.813823938369751, -1.6995373964309692, -1.5852508544921875, -1.4709641933441162, -1.3566776514053345, -1.2423911094665527, -1.1281044483184814, -1.0138179063796997, -0.899531364440918, -0.7852448225021362, -0.6709582209587097, -0.5566717386245728, -0.44238516688346863, -0.3280985951423645, -0.21381205320358276, -0.09952548146247864, 0.014761090278625488, 0.12904763221740723, 0.24333423376083374, 0.3576207756996155, 0.4719073474407196, 0.5861939191818237, 0.7004804611206055, 0.8147670030593872, 0.9290536046028137, 1.0433402061462402, 1.157626748085022, 1.2719132900238037, 1.3861998319625854, 1.5004863739013672, 1.6147730350494385, 1.7290595769882202, 1.843346118927002, 1.9576326608657837, 2.0719192028045654, 2.1862058639526367, 2.300492525100708, 2.4147789478302, 2.5290656089782715, 2.6433520317077637, 2.757638692855835, 2.8719253540039062, 2.9862117767333984, 3.1004981994628906, 3.214784860610962, 3.329071283340454, 3.4433579444885254, 3.5576443672180176, 3.671931028366089, 3.78621768951416, 3.9005041122436523, 4.014791011810303, 4.129077434539795, 4.243364334106445, 4.3576507568359375, 4.47193717956543, 4.586223602294922, 4.700510501861572, 4.8147969245910645, 4.929083347320557]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 3.0, 10.0, 8.0, 10.0, 19.0, 35.0, 36.0, 55.0, 72.0, 101.0, 90.0, 101.0, 107.0, 70.0, 91.0, 58.0, 34.0, 29.0, 31.0, 13.0, 10.0, 6.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9932358264923096, -1.944029450416565, -1.8948231935501099, -1.8456168174743652, -1.7964105606079102, -1.7472041845321655, -1.697997808456421, -1.6487915515899658, -1.5995852947235107, -1.5503789186477661, -1.501172661781311, -1.4519662857055664, -1.4027600288391113, -1.3535536527633667, -1.304347276687622, -1.255141019821167, -1.2059346437454224, -1.1567282676696777, -1.1075220108032227, -1.058315634727478, -1.009109377861023, -0.9599030017852783, -0.9106966853141785, -0.8614903688430786, -0.8122840523719788, -0.7630777359008789, -0.713871419429779, -0.6646651029586792, -0.6154587268829346, -0.5662524700164795, -0.5170460939407349, -0.467839777469635, -0.4186335802078247, -0.36942726373672485, -0.320220947265625, -0.27101460099220276, -0.2218082845211029, -0.17260196805000305, -0.12339562177658081, -0.07418930530548096, -0.024982988834381104, 0.024223335087299347, 0.0734296590089798, 0.12263599038124084, 0.1718423068523407, 0.22104862332344055, 0.2702549695968628, 0.31946128606796265, 0.3686676025390625, 0.41787391901016235, 0.4670802354812622, 0.5162866115570068, 0.5654928684234619, 0.6146992444992065, 0.6639055609703064, 0.7131118774414062, 0.7623181939125061, 0.811524510383606, 0.8607308268547058, 0.9099371433258057, 0.9591435194015503, 1.0083497762680054, 1.05755615234375, 1.106762409210205, 1.1559687852859497]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 2.0, 4.0, 10.0, 11.0, 11.0, 15.0, 27.0, 29.0, 44.0, 46.0, 74.0, 124.0, 206.0, 307.0, 453.0, 677.0, 1208.0, 2026.0, 3832.0, 8142.0, 18957.0, 58138.0, 798609.0, 109656.0, 24833.0, 10277.0, 4721.0, 2480.0, 1314.0, 799.0, 513.0, 325.0, 198.0, 139.0, 99.0, 69.0, 44.0, 33.0, 20.0, 17.0, 15.0, 10.0, 11.0, 7.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.521484375, -1.47015380859375, -1.4188232421875, -1.36749267578125, -1.316162109375, -1.26483154296875, -1.2135009765625, -1.16217041015625, -1.11083984375, -1.05950927734375, -1.0081787109375, -0.95684814453125, -0.905517578125, -0.85418701171875, -0.8028564453125, -0.75152587890625, -0.7001953125, -0.64886474609375, -0.5975341796875, -0.54620361328125, -0.494873046875, -0.44354248046875, -0.3922119140625, -0.34088134765625, -0.28955078125, -0.23822021484375, -0.1868896484375, -0.13555908203125, -0.084228515625, -0.03289794921875, 0.0184326171875, 0.06976318359375, 0.12109375, 0.17242431640625, 0.2237548828125, 0.27508544921875, 0.326416015625, 0.37774658203125, 0.4290771484375, 0.48040771484375, 0.53173828125, 0.58306884765625, 0.6343994140625, 0.68572998046875, 0.737060546875, 0.78839111328125, 0.8397216796875, 0.89105224609375, 0.9423828125, 0.99371337890625, 1.0450439453125, 1.09637451171875, 1.147705078125, 1.19903564453125, 1.2503662109375, 1.30169677734375, 1.35302734375, 1.40435791015625, 1.4556884765625, 1.50701904296875, 1.558349609375, 1.60968017578125, 1.6610107421875, 1.71234130859375, 1.763671875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 11.0, 9.0, 9.0, 11.0, 15.0, 30.0, 79.0, 252.0, 315.0, 140.0, 37.0, 17.0, 9.0, 20.0, 8.0, 8.0, 4.0, 2.0, 1.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2186279296875, -0.2108631134033203, -0.20309829711914062, -0.19533348083496094, -0.18756866455078125, -0.17980384826660156, -0.17203903198242188, -0.1642742156982422, -0.1565093994140625, -0.1487445831298828, -0.14097976684570312, -0.13321495056152344, -0.12545013427734375, -0.11768531799316406, -0.10992050170898438, -0.10215568542480469, -0.094390869140625, -0.08662605285644531, -0.07886123657226562, -0.07109642028808594, -0.06333160400390625, -0.05556678771972656, -0.047801971435546875, -0.04003715515136719, -0.0322723388671875, -0.024507522583007812, -0.016742706298828125, -0.008977890014648438, -0.00121307373046875, 0.0065517425537109375, 0.014316558837890625, 0.022081375122070312, 0.02984619140625, 0.03761100769042969, 0.045375823974609375, 0.05314064025878906, 0.06090545654296875, 0.06867027282714844, 0.07643508911132812, 0.08419990539550781, 0.0919647216796875, 0.09972953796386719, 0.10749435424804688, 0.11525917053222656, 0.12302398681640625, 0.13078880310058594, 0.13855361938476562, 0.1463184356689453, 0.154083251953125, 0.1618480682373047, 0.16961288452148438, 0.17737770080566406, 0.18514251708984375, 0.19290733337402344, 0.20067214965820312, 0.2084369659423828, 0.2162017822265625, 0.2239665985107422, 0.23173141479492188, 0.23949623107910156, 0.24726104736328125, 0.25502586364746094, 0.2627906799316406, 0.2705554962158203, 0.2783203125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 6.0, 9.0, 7.0, 11.0, 11.0, 30.0, 30.0, 54.0, 89.0, 140.0, 317.0, 728.0, 1744.0, 5565.0, 30453.0, 598249.0, 383357.0, 20781.0, 4411.0, 1364.0, 547.0, 278.0, 145.0, 86.0, 51.0, 33.0, 25.0, 11.0, 10.0, 2.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8623046875, -1.7978973388671875, -1.733489990234375, -1.6690826416015625, -1.60467529296875, -1.5402679443359375, -1.475860595703125, -1.4114532470703125, -1.3470458984375, -1.2826385498046875, -1.218231201171875, -1.1538238525390625, -1.08941650390625, -1.0250091552734375, -0.960601806640625, -0.8961944580078125, -0.831787109375, -0.7673797607421875, -0.702972412109375, -0.6385650634765625, -0.57415771484375, -0.5097503662109375, -0.445343017578125, -0.3809356689453125, -0.3165283203125, -0.2521209716796875, -0.187713623046875, -0.1233062744140625, -0.05889892578125, 0.0055084228515625, 0.069915771484375, 0.1343231201171875, 0.19873046875, 0.2631378173828125, 0.327545166015625, 0.3919525146484375, 0.45635986328125, 0.5207672119140625, 0.585174560546875, 0.6495819091796875, 0.7139892578125, 0.7783966064453125, 0.842803955078125, 0.9072113037109375, 0.97161865234375, 1.0360260009765625, 1.100433349609375, 1.1648406982421875, 1.229248046875, 1.2936553955078125, 1.358062744140625, 1.4224700927734375, 1.48687744140625, 1.5512847900390625, 1.615692138671875, 1.6800994873046875, 1.7445068359375, 1.8089141845703125, 1.873321533203125, 1.9377288818359375, 2.00213623046875, 2.0665435791015625, 2.130950927734375, 2.1953582763671875, 2.259765625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 4.0, 1.0, 6.0, 4.0, 6.0, 12.0, 11.0, 18.0, 19.0, 26.0, 22.0, 38.0, 30.0, 28.0, 33.0, 39.0, 35.0, 42.0, 43.0, 54.0, 44.0, 57.0, 56.0, 43.0, 45.0, 34.0, 23.0, 31.0, 40.0, 23.0, 29.0, 18.0, 20.0, 14.0, 9.0, 9.0, 9.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.57177734375, -0.5554237365722656, -0.5390701293945312, -0.5227165222167969, -0.5063629150390625, -0.4900093078613281, -0.47365570068359375, -0.4573020935058594, -0.440948486328125, -0.4245948791503906, -0.40824127197265625, -0.3918876647949219, -0.3755340576171875, -0.3591804504394531, -0.34282684326171875, -0.3264732360839844, -0.31011962890625, -0.2937660217285156, -0.27741241455078125, -0.2610588073730469, -0.2447052001953125, -0.22835159301757812, -0.21199798583984375, -0.19564437866210938, -0.179290771484375, -0.16293716430664062, -0.14658355712890625, -0.13022994995117188, -0.1138763427734375, -0.09752273559570312, -0.08116912841796875, -0.06481552124023438, -0.0484619140625, -0.032108306884765625, -0.01575469970703125, 0.000598907470703125, 0.0169525146484375, 0.033306121826171875, 0.04965972900390625, 0.06601333618164062, 0.082366943359375, 0.09872055053710938, 0.11507415771484375, 0.13142776489257812, 0.1477813720703125, 0.16413497924804688, 0.18048858642578125, 0.19684219360351562, 0.21319580078125, 0.22954940795898438, 0.24590301513671875, 0.2622566223144531, 0.2786102294921875, 0.2949638366699219, 0.31131744384765625, 0.3276710510253906, 0.344024658203125, 0.3603782653808594, 0.37673187255859375, 0.3930854797363281, 0.4094390869140625, 0.4257926940917969, 0.44214630126953125, 0.4584999084472656, 0.474853515625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 9.0, 15.0, 15.0, 18.0, 44.0, 68.0, 89.0, 156.0, 310.0, 754.0, 1784.0, 5421.0, 23811.0, 214677.0, 694930.0, 87260.0, 13292.0, 3499.0, 1230.0, 569.0, 260.0, 136.0, 71.0, 42.0, 25.0, 26.0, 16.0, 8.0, 4.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.251953125, -1.210662841796875, -1.16937255859375, -1.128082275390625, -1.0867919921875, -1.045501708984375, -1.00421142578125, -0.962921142578125, -0.921630859375, -0.880340576171875, -0.83905029296875, -0.797760009765625, -0.7564697265625, -0.715179443359375, -0.67388916015625, -0.632598876953125, -0.59130859375, -0.550018310546875, -0.50872802734375, -0.467437744140625, -0.4261474609375, -0.384857177734375, -0.34356689453125, -0.302276611328125, -0.260986328125, -0.219696044921875, -0.17840576171875, -0.137115478515625, -0.0958251953125, -0.054534912109375, -0.01324462890625, 0.028045654296875, 0.0693359375, 0.110626220703125, 0.15191650390625, 0.193206787109375, 0.2344970703125, 0.275787353515625, 0.31707763671875, 0.358367919921875, 0.399658203125, 0.440948486328125, 0.48223876953125, 0.523529052734375, 0.5648193359375, 0.606109619140625, 0.64739990234375, 0.688690185546875, 0.72998046875, 0.771270751953125, 0.81256103515625, 0.853851318359375, 0.8951416015625, 0.936431884765625, 0.97772216796875, 1.019012451171875, 1.060302734375, 1.101593017578125, 1.14288330078125, 1.184173583984375, 1.2254638671875, 1.266754150390625, 1.30804443359375, 1.349334716796875, 1.390625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 5.0, 4.0, 10.0, 17.0, 13.0, 23.0, 39.0, 59.0, 79.0, 113.0, 115.0, 133.0, 115.0, 80.0, 55.0, 33.0, 23.0, 17.0, 15.0, 9.0, 9.0, 3.0, 3.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00013375282287597656, -0.00013005267828702927, -0.00012635253369808197, -0.00012265238910913467, -0.00011895224452018738, -0.00011525209993124008, -0.00011155195534229279, -0.00010785181075334549, -0.0001041516661643982, -0.0001004515215754509, -9.67513769865036e-05, -9.30512323975563e-05, -8.935108780860901e-05, -8.565094321966171e-05, -8.195079863071442e-05, -7.825065404176712e-05, -7.455050945281982e-05, -7.085036486387253e-05, -6.715022027492523e-05, -6.345007568597794e-05, -5.974993109703064e-05, -5.6049786508083344e-05, -5.234964191913605e-05, -4.864949733018875e-05, -4.4949352741241455e-05, -4.124920815229416e-05, -3.754906356334686e-05, -3.384891897439957e-05, -3.014877438545227e-05, -2.6448629796504974e-05, -2.2748485207557678e-05, -1.9048340618610382e-05, -1.5348196029663086e-05, -1.164805144071579e-05, -7.947906851768494e-06, -4.2477622628211975e-06, -5.476176738739014e-07, 3.1525269150733948e-06, 6.852671504020691e-06, 1.0552816092967987e-05, 1.4252960681915283e-05, 1.795310527086258e-05, 2.1653249859809875e-05, 2.535339444875717e-05, 2.9053539037704468e-05, 3.2753683626651764e-05, 3.645382821559906e-05, 4.0153972804546356e-05, 4.385411739349365e-05, 4.755426198244095e-05, 5.1254406571388245e-05, 5.495455116033554e-05, 5.865469574928284e-05, 6.235484033823013e-05, 6.605498492717743e-05, 6.975512951612473e-05, 7.345527410507202e-05, 7.715541869401932e-05, 8.085556328296661e-05, 8.455570787191391e-05, 8.82558524608612e-05, 9.19559970498085e-05, 9.56561416387558e-05, 9.93562862277031e-05, 0.00010305643081665039]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 7.0, 8.0, 8.0, 14.0, 18.0, 14.0, 30.0, 47.0, 68.0, 123.0, 161.0, 351.0, 687.0, 1481.0, 4368.0, 15915.0, 95080.0, 607491.0, 273982.0, 36002.0, 7909.0, 2502.0, 1034.0, 524.0, 261.0, 161.0, 88.0, 66.0, 49.0, 25.0, 17.0, 19.0, 15.0, 7.0, 5.0, 4.0, 0.0, 5.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1494140625, -1.1132049560546875, -1.076995849609375, -1.0407867431640625, -1.00457763671875, -0.9683685302734375, -0.932159423828125, -0.8959503173828125, -0.8597412109375, -0.8235321044921875, -0.787322998046875, -0.7511138916015625, -0.71490478515625, -0.6786956787109375, -0.642486572265625, -0.6062774658203125, -0.570068359375, -0.5338592529296875, -0.497650146484375, -0.4614410400390625, -0.42523193359375, -0.3890228271484375, -0.352813720703125, -0.3166046142578125, -0.2803955078125, -0.2441864013671875, -0.207977294921875, -0.1717681884765625, -0.13555908203125, -0.0993499755859375, -0.063140869140625, -0.0269317626953125, 0.00927734375, 0.0454864501953125, 0.081695556640625, 0.1179046630859375, 0.15411376953125, 0.1903228759765625, 0.226531982421875, 0.2627410888671875, 0.2989501953125, 0.3351593017578125, 0.371368408203125, 0.4075775146484375, 0.44378662109375, 0.4799957275390625, 0.516204833984375, 0.5524139404296875, 0.588623046875, 0.6248321533203125, 0.661041259765625, 0.6972503662109375, 0.73345947265625, 0.7696685791015625, 0.805877685546875, 0.8420867919921875, 0.8782958984375, 0.9145050048828125, 0.950714111328125, 0.9869232177734375, 1.02313232421875, 1.0593414306640625, 1.095550537109375, 1.1317596435546875, 1.16796875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 8.0, 4.0, 7.0, 14.0, 9.0, 18.0, 11.0, 13.0, 16.0, 24.0, 48.0, 33.0, 48.0, 64.0, 52.0, 51.0, 65.0, 65.0, 57.0, 59.0, 60.0, 51.0, 40.0, 29.0, 28.0, 28.0, 17.0, 12.0, 15.0, 8.0, 10.0, 10.0, 3.0, 8.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.332275390625, -0.320404052734375, -0.30853271484375, -0.296661376953125, -0.2847900390625, -0.272918701171875, -0.26104736328125, -0.249176025390625, -0.2373046875, -0.225433349609375, -0.21356201171875, -0.201690673828125, -0.1898193359375, -0.177947998046875, -0.16607666015625, -0.154205322265625, -0.142333984375, -0.130462646484375, -0.11859130859375, -0.106719970703125, -0.0948486328125, -0.082977294921875, -0.07110595703125, -0.059234619140625, -0.04736328125, -0.035491943359375, -0.02362060546875, -0.011749267578125, 0.0001220703125, 0.011993408203125, 0.02386474609375, 0.035736083984375, 0.047607421875, 0.059478759765625, 0.07135009765625, 0.083221435546875, 0.0950927734375, 0.106964111328125, 0.11883544921875, 0.130706787109375, 0.142578125, 0.154449462890625, 0.16632080078125, 0.178192138671875, 0.1900634765625, 0.201934814453125, 0.21380615234375, 0.225677490234375, 0.237548828125, 0.249420166015625, 0.26129150390625, 0.273162841796875, 0.2850341796875, 0.296905517578125, 0.30877685546875, 0.320648193359375, 0.33251953125, 0.344390869140625, 0.35626220703125, 0.368133544921875, 0.3800048828125, 0.391876220703125, 0.40374755859375, 0.415618896484375, 0.427490234375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 14.0, 49.0, 143.0, 282.0, 318.0, 140.0, 32.0, 7.0, 0.0, 5.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.96417999267578, -19.573678970336914, -19.183177947998047, -18.79267692565918, -18.402175903320312, -18.011674880981445, -17.621173858642578, -17.23067283630371, -16.840171813964844, -16.449670791625977, -16.05916976928711, -15.668668746948242, -15.278167724609375, -14.887666702270508, -14.49716567993164, -14.106664657592773, -13.716163635253906, -13.325662612915039, -12.935161590576172, -12.544660568237305, -12.154159545898438, -11.76365852355957, -11.373157501220703, -10.982656478881836, -10.592156410217285, -10.201655387878418, -9.81115436553955, -9.420653343200684, -9.030152320861816, -8.63965129852295, -8.249150276184082, -7.858649253845215, -7.468148231506348, -7.0776472091674805, -6.687146186828613, -6.296645164489746, -5.906144142150879, -5.515643119812012, -5.1251420974731445, -4.734641075134277, -4.34414005279541, -3.953639030456543, -3.563138008117676, -3.1726369857788086, -2.7821359634399414, -2.391634941101074, -2.001134157180786, -1.610633134841919, -1.2201323509216309, -0.8296313285827637, -0.43913036584854126, -0.04862940311431885, 0.34187161922454834, 0.7323726415634155, 1.1228735446929932, 1.5133745670318604, 1.9038755893707275, 2.2943766117095947, 2.684877634048462, 3.07537841796875, 3.465879440307617, 3.8563804626464844, 4.246881484985352, 4.637382507324219, 5.027883529663086]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 7.0, 6.0, 8.0, 5.0, 11.0, 10.0, 18.0, 27.0, 32.0, 38.0, 54.0, 77.0, 86.0, 92.0, 87.0, 93.0, 72.0, 59.0, 49.0, 48.0, 31.0, 23.0, 22.0, 6.0, 10.0, 4.0, 10.0, 6.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.99021053314209, -5.81521463394165, -5.640218257904053, -5.465222358703613, -5.290225982666016, -5.115230083465576, -4.940234184265137, -4.765237808227539, -4.5902419090271, -4.41524600982666, -4.2402496337890625, -4.065253734588623, -3.8902575969696045, -3.715261459350586, -3.5402655601501465, -3.365269422531128, -3.1902732849121094, -3.015277147293091, -2.8402810096740723, -2.665285110473633, -2.4902889728546143, -2.3152928352355957, -2.1402969360351562, -1.9653007984161377, -1.7903046607971191, -1.6153085231781006, -1.4403125047683716, -1.2653164863586426, -1.090320348739624, -0.9153242707252502, -0.7403281927108765, -0.5653321743011475, -0.3903355598449707, -0.21533948183059692, -0.040343403816223145, 0.13465267419815063, 0.3096487522125244, 0.4846448302268982, 0.659640908241272, 0.834636926651001, 1.0096330642700195, 1.184629201889038, 1.359625220298767, 1.534621238708496, 1.7096173763275146, 1.8846135139465332, 2.0596094131469727, 2.234605550765991, 2.4096016883850098, 2.5845978260040283, 2.759593963623047, 2.9345898628234863, 3.109586000442505, 3.2845821380615234, 3.459578037261963, 3.6345741748809814, 3.8095703125, 3.9845664501190186, 4.159562587738037, 4.334558486938477, 4.509554862976074, 4.684550762176514, 4.859546661376953, 5.034543037414551, 5.20953893661499]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 13.0, 12.0, 16.0, 19.0, 23.0, 35.0, 51.0, 63.0, 47.0, 96.0, 155.0, 200.0, 288.0, 452.0, 860.0, 1494.0, 2979.0, 6528.0, 20507.0, 262529.0, 3850464.0, 31730.0, 8152.0, 3438.0, 1638.0, 941.0, 482.0, 380.0, 235.0, 109.0, 97.0, 60.0, 47.0, 40.0, 17.0, 22.0, 9.0, 14.0, 7.0, 3.0, 9.0, 6.0, 7.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.37109375, -3.259246826171875, -3.14739990234375, -3.035552978515625, -2.9237060546875, -2.811859130859375, -2.70001220703125, -2.588165283203125, -2.476318359375, -2.364471435546875, -2.25262451171875, -2.140777587890625, -2.0289306640625, -1.917083740234375, -1.80523681640625, -1.693389892578125, -1.58154296875, -1.469696044921875, -1.35784912109375, -1.246002197265625, -1.1341552734375, -1.022308349609375, -0.91046142578125, -0.798614501953125, -0.686767578125, -0.574920654296875, -0.46307373046875, -0.351226806640625, -0.2393798828125, -0.127532958984375, -0.01568603515625, 0.096160888671875, 0.2080078125, 0.319854736328125, 0.43170166015625, 0.543548583984375, 0.6553955078125, 0.767242431640625, 0.87908935546875, 0.990936279296875, 1.102783203125, 1.214630126953125, 1.32647705078125, 1.438323974609375, 1.5501708984375, 1.662017822265625, 1.77386474609375, 1.885711669921875, 1.99755859375, 2.109405517578125, 2.22125244140625, 2.333099365234375, 2.4449462890625, 2.556793212890625, 2.66864013671875, 2.780487060546875, 2.892333984375, 3.004180908203125, 3.11602783203125, 3.227874755859375, 3.3397216796875, 3.451568603515625, 3.56341552734375, 3.675262451171875, 3.787109375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 6.0, 0.0, 4.0, 7.0, 7.0, 10.0, 10.0, 21.0, 17.0, 58.0, 164.0, 287.0, 232.0, 88.0, 28.0, 22.0, 16.0, 6.0, 3.0, 6.0, 1.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2244873046875, -0.21636009216308594, -0.20823287963867188, -0.2001056671142578, -0.19197845458984375, -0.1838512420654297, -0.17572402954101562, -0.16759681701660156, -0.1594696044921875, -0.15134239196777344, -0.14321517944335938, -0.1350879669189453, -0.12696075439453125, -0.11883354187011719, -0.11070632934570312, -0.10257911682128906, -0.094451904296875, -0.08632469177246094, -0.07819747924804688, -0.07007026672363281, -0.06194305419921875, -0.05381584167480469, -0.045688629150390625, -0.03756141662597656, -0.0294342041015625, -0.021306991577148438, -0.013179779052734375, -0.0050525665283203125, 0.00307464599609375, 0.011201858520507812, 0.019329071044921875, 0.027456283569335938, 0.03558349609375, 0.04371070861816406, 0.051837921142578125, 0.05996513366699219, 0.06809234619140625, 0.07621955871582031, 0.08434677124023438, 0.09247398376464844, 0.1006011962890625, 0.10872840881347656, 0.11685562133789062, 0.12498283386230469, 0.13311004638671875, 0.1412372589111328, 0.14936447143554688, 0.15749168395996094, 0.165618896484375, 0.17374610900878906, 0.18187332153320312, 0.1900005340576172, 0.19812774658203125, 0.2062549591064453, 0.21438217163085938, 0.22250938415527344, 0.2306365966796875, 0.23876380920410156, 0.24689102172851562, 0.2550182342529297, 0.26314544677734375, 0.2712726593017578, 0.2793998718261719, 0.28752708435058594, 0.295654296875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 8.0, 6.0, 4.0, 14.0, 17.0, 24.0, 40.0, 54.0, 70.0, 112.0, 196.0, 328.0, 649.0, 1482.0, 3408.0, 8825.0, 26339.0, 105512.0, 3308619.0, 638412.0, 69155.0, 19211.0, 6703.0, 2695.0, 1117.0, 544.0, 266.0, 145.0, 91.0, 53.0, 41.0, 28.0, 25.0, 19.0, 15.0, 9.0, 7.0, 12.0, 2.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.17578125, -2.102935791015625, -2.03009033203125, -1.957244873046875, -1.8843994140625, -1.811553955078125, -1.73870849609375, -1.665863037109375, -1.593017578125, -1.520172119140625, -1.44732666015625, -1.374481201171875, -1.3016357421875, -1.228790283203125, -1.15594482421875, -1.083099365234375, -1.01025390625, -0.937408447265625, -0.86456298828125, -0.791717529296875, -0.7188720703125, -0.646026611328125, -0.57318115234375, -0.500335693359375, -0.427490234375, -0.354644775390625, -0.28179931640625, -0.208953857421875, -0.1361083984375, -0.063262939453125, 0.00958251953125, 0.082427978515625, 0.1552734375, 0.228118896484375, 0.30096435546875, 0.373809814453125, 0.4466552734375, 0.519500732421875, 0.59234619140625, 0.665191650390625, 0.738037109375, 0.810882568359375, 0.88372802734375, 0.956573486328125, 1.0294189453125, 1.102264404296875, 1.17510986328125, 1.247955322265625, 1.32080078125, 1.393646240234375, 1.46649169921875, 1.539337158203125, 1.6121826171875, 1.685028076171875, 1.75787353515625, 1.830718994140625, 1.903564453125, 1.976409912109375, 2.04925537109375, 2.122100830078125, 2.1949462890625, 2.267791748046875, 2.34063720703125, 2.413482666015625, 2.486328125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 4.0, 6.0, 5.0, 5.0, 4.0, 5.0, 6.0, 15.0, 21.0, 28.0, 30.0, 43.0, 43.0, 68.0, 102.0, 166.0, 302.0, 1744.0, 764.0, 230.0, 152.0, 99.0, 68.0, 54.0, 29.0, 24.0, 22.0, 9.0, 5.0, 6.0, 3.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.37060546875, -0.3610725402832031, -0.35153961181640625, -0.3420066833496094, -0.3324737548828125, -0.3229408264160156, -0.31340789794921875, -0.3038749694824219, -0.294342041015625, -0.2848091125488281, -0.27527618408203125, -0.2657432556152344, -0.2562103271484375, -0.24667739868164062, -0.23714447021484375, -0.22761154174804688, -0.21807861328125, -0.20854568481445312, -0.19901275634765625, -0.18947982788085938, -0.1799468994140625, -0.17041397094726562, -0.16088104248046875, -0.15134811401367188, -0.141815185546875, -0.13228225708007812, -0.12274932861328125, -0.11321640014648438, -0.1036834716796875, -0.09415054321289062, -0.08461761474609375, -0.07508468627929688, -0.0655517578125, -0.056018829345703125, -0.04648590087890625, -0.036952972412109375, -0.0274200439453125, -0.017887115478515625, -0.00835418701171875, 0.001178741455078125, 0.010711669921875, 0.020244598388671875, 0.02977752685546875, 0.039310455322265625, 0.0488433837890625, 0.058376312255859375, 0.06790924072265625, 0.07744216918945312, 0.08697509765625, 0.09650802612304688, 0.10604095458984375, 0.11557388305664062, 0.1251068115234375, 0.13463973999023438, 0.14417266845703125, 0.15370559692382812, 0.163238525390625, 0.17277145385742188, 0.18230438232421875, 0.19183731079101562, 0.2013702392578125, 0.21090316772460938, 0.22043609619140625, 0.22996902465820312, 0.239501953125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 13.0, 52.0, 257.0, 456.0, 174.0, 38.0, 10.0, 7.0, 2.0, 1.0, 3.0], "bins": [-11.521320343017578, -11.316832542419434, -11.112343788146973, -10.907855987548828, -10.703367233276367, -10.498879432678223, -10.294390678405762, -10.089902877807617, -9.885414123535156, -9.680926322937012, -9.47643756866455, -9.271949768066406, -9.067461013793945, -8.8629732131958, -8.65848445892334, -8.453996658325195, -8.249507904052734, -8.04502010345459, -7.840531349182129, -7.636043071746826, -7.431554794311523, -7.227066516876221, -7.022578239440918, -6.818090438842773, -6.613602638244629, -6.409114360809326, -6.204626083374023, -6.000137805938721, -5.795649528503418, -5.591161251068115, -5.3866729736328125, -5.182185173034668, -4.977696895599365, -4.7732086181640625, -4.56872034072876, -4.364232063293457, -4.159743785858154, -3.9552555084228516, -3.750767469406128, -3.546279191970825, -3.3417909145355225, -3.1373026371002197, -2.932814359664917, -2.7283263206481934, -2.5238380432128906, -2.319349765777588, -2.114861488342285, -1.9103732109069824, -1.7058849334716797, -1.501396656036377, -1.2969083786010742, -1.092420220375061, -0.8879319429397583, -0.6834436655044556, -0.4789555072784424, -0.27446722984313965, -0.06997895240783691, 0.13450929522514343, 0.3389975428581238, 0.5434857606887817, 0.7479740381240845, 0.9524623155593872, 1.1569504737854004, 1.3614387512207031, 1.5659270286560059]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 8.0, 11.0, 18.0, 32.0, 63.0, 72.0, 95.0, 102.0, 104.0, 110.0, 110.0, 79.0, 61.0, 58.0, 34.0, 19.0, 18.0, 7.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2115280628204346, -3.132556438446045, -3.053584575653076, -2.9746129512786865, -2.895641326904297, -2.816669464111328, -2.7376978397369385, -2.658726215362549, -2.57975435256958, -2.5007827281951904, -2.4218108654022217, -2.342839241027832, -2.2638676166534424, -2.1848959922790527, -2.105924129486084, -2.0269525051116943, -1.9479808807373047, -1.8690091371536255, -1.7900375127792358, -1.7110657691955566, -1.632094144821167, -1.5531224012374878, -1.4741506576538086, -1.395179033279419, -1.3162072896957397, -1.2372355461120605, -1.158263921737671, -1.0792921781539917, -1.0003204345703125, -0.9213488101959229, -0.8423770666122437, -0.7634053826332092, -0.6844336986541748, -0.6054620146751404, -0.526490330696106, -0.44751858711242676, -0.36854690313339233, -0.2895752191543579, -0.2106035053730011, -0.1316317915916443, -0.05266010761260986, 0.026311591267585754, 0.10528329014778137, 0.184254989027977, 0.2632266879081726, 0.34219837188720703, 0.42117008566856384, 0.5001417994499207, 0.5791134834289551, 0.6580851674079895, 0.7370568513870239, 0.8160285949707031, 0.8950002789497375, 0.973971962928772, 1.0529437065124512, 1.1319153308868408, 1.21088707447052, 1.2898588180541992, 1.3688304424285889, 1.447802186012268, 1.5267739295959473, 1.605745553970337, 1.6847172975540161, 1.7636890411376953, 1.842660665512085]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 1.0, 7.0, 7.0, 18.0, 21.0, 26.0, 30.0, 46.0, 53.0, 79.0, 112.0, 128.0, 225.0, 321.0, 470.0, 740.0, 1092.0, 1963.0, 3819.0, 8903.0, 28029.0, 196030.0, 693608.0, 81703.0, 17297.0, 6227.0, 3069.0, 1617.0, 996.0, 539.0, 428.0, 294.0, 178.0, 130.0, 83.0, 69.0, 44.0, 37.0, 36.0, 22.0, 12.0, 12.0, 5.0, 6.0, 9.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.3671875, -2.291595458984375, -2.21600341796875, -2.140411376953125, -2.0648193359375, -1.989227294921875, -1.91363525390625, -1.838043212890625, -1.762451171875, -1.686859130859375, -1.61126708984375, -1.535675048828125, -1.4600830078125, -1.384490966796875, -1.30889892578125, -1.233306884765625, -1.15771484375, -1.082122802734375, -1.00653076171875, -0.930938720703125, -0.8553466796875, -0.779754638671875, -0.70416259765625, -0.628570556640625, -0.552978515625, -0.477386474609375, -0.40179443359375, -0.326202392578125, -0.2506103515625, -0.175018310546875, -0.09942626953125, -0.023834228515625, 0.0517578125, 0.127349853515625, 0.20294189453125, 0.278533935546875, 0.3541259765625, 0.429718017578125, 0.50531005859375, 0.580902099609375, 0.656494140625, 0.732086181640625, 0.80767822265625, 0.883270263671875, 0.9588623046875, 1.034454345703125, 1.11004638671875, 1.185638427734375, 1.26123046875, 1.336822509765625, 1.41241455078125, 1.488006591796875, 1.5635986328125, 1.639190673828125, 1.71478271484375, 1.790374755859375, 1.865966796875, 1.941558837890625, 2.01715087890625, 2.092742919921875, 2.1683349609375, 2.243927001953125, 2.31951904296875, 2.395111083984375, 2.470703125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 6.0, 3.0, 4.0, 2.0, 6.0, 13.0, 17.0, 40.0, 84.0, 147.0, 215.0, 210.0, 112.0, 74.0, 27.0, 15.0, 9.0, 5.0, 2.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2271728515625, -0.21928977966308594, -0.21140670776367188, -0.2035236358642578, -0.19564056396484375, -0.1877574920654297, -0.17987442016601562, -0.17199134826660156, -0.1641082763671875, -0.15622520446777344, -0.14834213256835938, -0.1404590606689453, -0.13257598876953125, -0.12469291687011719, -0.11680984497070312, -0.10892677307128906, -0.101043701171875, -0.09316062927246094, -0.08527755737304688, -0.07739448547363281, -0.06951141357421875, -0.06162834167480469, -0.053745269775390625, -0.04586219787597656, -0.0379791259765625, -0.030096054077148438, -0.022212982177734375, -0.014329910278320312, -0.00644683837890625, 0.0014362335205078125, 0.009319305419921875, 0.017202377319335938, 0.02508544921875, 0.03296852111816406, 0.040851593017578125, 0.04873466491699219, 0.05661773681640625, 0.06450080871582031, 0.07238388061523438, 0.08026695251464844, 0.0881500244140625, 0.09603309631347656, 0.10391616821289062, 0.11179924011230469, 0.11968231201171875, 0.1275653839111328, 0.13544845581054688, 0.14333152770996094, 0.151214599609375, 0.15909767150878906, 0.16698074340820312, 0.1748638153076172, 0.18274688720703125, 0.1906299591064453, 0.19851303100585938, 0.20639610290527344, 0.2142791748046875, 0.22216224670410156, 0.23004531860351562, 0.2379283905029297, 0.24581146240234375, 0.2536945343017578, 0.2615776062011719, 0.26946067810058594, 0.27734375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 0.0, 3.0, 3.0, 5.0, 1.0, 2.0, 11.0, 9.0, 12.0, 15.0, 22.0, 32.0, 47.0, 68.0, 130.0, 187.0, 347.0, 610.0, 1092.0, 2342.0, 7638.0, 39663.0, 330655.0, 568448.0, 78042.0, 12504.0, 3399.0, 1426.0, 760.0, 410.0, 261.0, 150.0, 90.0, 40.0, 41.0, 20.0, 17.0, 13.0, 12.0, 14.0, 4.0, 3.0, 1.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.822265625, -2.731719970703125, -2.64117431640625, -2.550628662109375, -2.4600830078125, -2.369537353515625, -2.27899169921875, -2.188446044921875, -2.097900390625, -2.007354736328125, -1.91680908203125, -1.826263427734375, -1.7357177734375, -1.645172119140625, -1.55462646484375, -1.464080810546875, -1.37353515625, -1.282989501953125, -1.19244384765625, -1.101898193359375, -1.0113525390625, -0.920806884765625, -0.83026123046875, -0.739715576171875, -0.649169921875, -0.558624267578125, -0.46807861328125, -0.377532958984375, -0.2869873046875, -0.196441650390625, -0.10589599609375, -0.015350341796875, 0.0751953125, 0.165740966796875, 0.25628662109375, 0.346832275390625, 0.4373779296875, 0.527923583984375, 0.61846923828125, 0.709014892578125, 0.799560546875, 0.890106201171875, 0.98065185546875, 1.071197509765625, 1.1617431640625, 1.252288818359375, 1.34283447265625, 1.433380126953125, 1.52392578125, 1.614471435546875, 1.70501708984375, 1.795562744140625, 1.8861083984375, 1.976654052734375, 2.06719970703125, 2.157745361328125, 2.248291015625, 2.338836669921875, 2.42938232421875, 2.519927978515625, 2.6104736328125, 2.701019287109375, 2.79156494140625, 2.882110595703125, 2.97265625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 1.0, 3.0, 6.0, 6.0, 9.0, 14.0, 10.0, 11.0, 15.0, 17.0, 10.0, 9.0, 32.0, 25.0, 32.0, 29.0, 39.0, 23.0, 35.0, 25.0, 40.0, 49.0, 46.0, 28.0, 30.0, 46.0, 29.0, 32.0, 42.0, 32.0, 33.0, 21.0, 28.0, 36.0, 24.0, 16.0, 25.0, 9.0, 11.0, 13.0, 12.0, 9.0, 9.0, 5.0, 6.0, 6.0, 7.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.51318359375, -0.49681854248046875, -0.4804534912109375, -0.46408843994140625, -0.447723388671875, -0.43135833740234375, -0.4149932861328125, -0.39862823486328125, -0.38226318359375, -0.36589813232421875, -0.3495330810546875, -0.33316802978515625, -0.316802978515625, -0.30043792724609375, -0.2840728759765625, -0.26770782470703125, -0.2513427734375, -0.23497772216796875, -0.2186126708984375, -0.20224761962890625, -0.185882568359375, -0.16951751708984375, -0.1531524658203125, -0.13678741455078125, -0.12042236328125, -0.10405731201171875, -0.0876922607421875, -0.07132720947265625, -0.054962158203125, -0.03859710693359375, -0.0222320556640625, -0.00586700439453125, 0.010498046875, 0.02686309814453125, 0.0432281494140625, 0.05959320068359375, 0.075958251953125, 0.09232330322265625, 0.1086883544921875, 0.12505340576171875, 0.14141845703125, 0.15778350830078125, 0.1741485595703125, 0.19051361083984375, 0.206878662109375, 0.22324371337890625, 0.2396087646484375, 0.25597381591796875, 0.2723388671875, 0.28870391845703125, 0.3050689697265625, 0.32143402099609375, 0.337799072265625, 0.35416412353515625, 0.3705291748046875, 0.38689422607421875, 0.40325927734375, 0.41962432861328125, 0.4359893798828125, 0.45235443115234375, 0.468719482421875, 0.48508453369140625, 0.5014495849609375, 0.5178146362304688, 0.5341796875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 8.0, 7.0, 11.0, 27.0, 31.0, 45.0, 108.0, 166.0, 294.0, 829.0, 2297.0, 8671.0, 52925.0, 464836.0, 454031.0, 51959.0, 8523.0, 2265.0, 785.0, 313.0, 155.0, 109.0, 54.0, 29.0, 23.0, 20.0, 11.0, 10.0, 4.0, 2.0, 1.0, 4.0, 0.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.568359375, -1.5142669677734375, -1.460174560546875, -1.4060821533203125, -1.35198974609375, -1.2978973388671875, -1.243804931640625, -1.1897125244140625, -1.1356201171875, -1.0815277099609375, -1.027435302734375, -0.9733428955078125, -0.91925048828125, -0.8651580810546875, -0.811065673828125, -0.7569732666015625, -0.702880859375, -0.6487884521484375, -0.594696044921875, -0.5406036376953125, -0.48651123046875, -0.4324188232421875, -0.378326416015625, -0.3242340087890625, -0.2701416015625, -0.2160491943359375, -0.161956787109375, -0.1078643798828125, -0.05377197265625, 0.0003204345703125, 0.054412841796875, 0.1085052490234375, 0.16259765625, 0.2166900634765625, 0.270782470703125, 0.3248748779296875, 0.37896728515625, 0.4330596923828125, 0.487152099609375, 0.5412445068359375, 0.5953369140625, 0.6494293212890625, 0.703521728515625, 0.7576141357421875, 0.81170654296875, 0.8657989501953125, 0.919891357421875, 0.9739837646484375, 1.028076171875, 1.0821685791015625, 1.136260986328125, 1.1903533935546875, 1.24444580078125, 1.2985382080078125, 1.352630615234375, 1.4067230224609375, 1.4608154296875, 1.5149078369140625, 1.569000244140625, 1.6230926513671875, 1.67718505859375, 1.7312774658203125, 1.785369873046875, 1.8394622802734375, 1.8935546875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 11.0, 9.0, 16.0, 19.0, 24.0, 33.0, 33.0, 58.0, 105.0, 112.0, 120.0, 93.0, 96.0, 67.0, 67.0, 56.0, 35.0, 14.0, 12.0, 12.0, 4.0, 5.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0001455545425415039, -0.00013820268213748932, -0.00013085082173347473, -0.00012349896132946014, -0.00011614710092544556, -0.00010879524052143097, -0.00010144338011741638, -9.40915197134018e-05, -8.673965930938721e-05, -7.938779890537262e-05, -7.203593850135803e-05, -6.468407809734344e-05, -5.733221769332886e-05, -4.998035728931427e-05, -4.262849688529968e-05, -3.5276636481285095e-05, -2.7924776077270508e-05, -2.057291567325592e-05, -1.3221055269241333e-05, -5.869194865226746e-06, 1.4826655387878418e-06, 8.83452594280243e-06, 1.6186386346817017e-05, 2.3538246750831604e-05, 3.089010715484619e-05, 3.824196755886078e-05, 4.5593827962875366e-05, 5.2945688366889954e-05, 6.029754877090454e-05, 6.764940917491913e-05, 7.500126957893372e-05, 8.23531299829483e-05, 8.970499038696289e-05, 9.705685079097748e-05, 0.00010440871119499207, 0.00011176057159900665, 0.00011911243200302124, 0.00012646429240703583, 0.00013381615281105042, 0.000141168013215065, 0.0001485198736190796, 0.00015587173402309418, 0.00016322359442710876, 0.00017057545483112335, 0.00017792731523513794, 0.00018527917563915253, 0.00019263103604316711, 0.0001999828964471817, 0.0002073347568511963, 0.00021468661725521088, 0.00022203847765922546, 0.00022939033806324005, 0.00023674219846725464, 0.00024409405887126923, 0.0002514459192752838, 0.0002587977796792984, 0.000266149640083313, 0.0002735015004873276, 0.00028085336089134216, 0.00028820522129535675, 0.00029555708169937134, 0.0003029089421033859, 0.0003102608025074005, 0.0003176126629114151, 0.0003249645233154297]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 7.0, 4.0, 11.0, 17.0, 18.0, 22.0, 43.0, 73.0, 103.0, 166.0, 335.0, 640.0, 1244.0, 3110.0, 11339.0, 76908.0, 607259.0, 303552.0, 33164.0, 6370.0, 2041.0, 939.0, 491.0, 272.0, 161.0, 94.0, 51.0, 37.0, 27.0, 18.0, 11.0, 6.0, 8.0, 9.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2900390625, -1.2380218505859375, -1.186004638671875, -1.1339874267578125, -1.08197021484375, -1.0299530029296875, -0.977935791015625, -0.9259185791015625, -0.8739013671875, -0.8218841552734375, -0.769866943359375, -0.7178497314453125, -0.66583251953125, -0.6138153076171875, -0.561798095703125, -0.5097808837890625, -0.457763671875, -0.4057464599609375, -0.353729248046875, -0.3017120361328125, -0.24969482421875, -0.1976776123046875, -0.145660400390625, -0.0936431884765625, -0.0416259765625, 0.0103912353515625, 0.062408447265625, 0.1144256591796875, 0.16644287109375, 0.2184600830078125, 0.270477294921875, 0.3224945068359375, 0.37451171875, 0.4265289306640625, 0.478546142578125, 0.5305633544921875, 0.58258056640625, 0.6345977783203125, 0.686614990234375, 0.7386322021484375, 0.7906494140625, 0.8426666259765625, 0.894683837890625, 0.9467010498046875, 0.99871826171875, 1.0507354736328125, 1.102752685546875, 1.1547698974609375, 1.206787109375, 1.2588043212890625, 1.310821533203125, 1.3628387451171875, 1.41485595703125, 1.4668731689453125, 1.518890380859375, 1.5709075927734375, 1.6229248046875, 1.6749420166015625, 1.726959228515625, 1.7789764404296875, 1.83099365234375, 1.8830108642578125, 1.935028076171875, 1.9870452880859375, 2.0390625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 6.0, 9.0, 9.0, 13.0, 21.0, 32.0, 19.0, 41.0, 39.0, 49.0, 46.0, 69.0, 76.0, 50.0, 80.0, 67.0, 72.0, 49.0, 53.0, 32.0, 28.0, 21.0, 19.0, 15.0, 23.0, 13.0, 10.0, 12.0, 4.0, 2.0, 5.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.468994140625, -0.4524269104003906, -0.43585968017578125, -0.4192924499511719, -0.4027252197265625, -0.3861579895019531, -0.36959075927734375, -0.3530235290527344, -0.336456298828125, -0.3198890686035156, -0.30332183837890625, -0.2867546081542969, -0.2701873779296875, -0.2536201477050781, -0.23705291748046875, -0.22048568725585938, -0.20391845703125, -0.18735122680664062, -0.17078399658203125, -0.15421676635742188, -0.1376495361328125, -0.12108230590820312, -0.10451507568359375, -0.08794784545898438, -0.071380615234375, -0.054813385009765625, -0.03824615478515625, -0.021678924560546875, -0.0051116943359375, 0.011455535888671875, 0.02802276611328125, 0.044589996337890625, 0.0611572265625, 0.07772445678710938, 0.09429168701171875, 0.11085891723632812, 0.1274261474609375, 0.14399337768554688, 0.16056060791015625, 0.17712783813476562, 0.193695068359375, 0.21026229858398438, 0.22682952880859375, 0.24339675903320312, 0.2599639892578125, 0.2765312194824219, 0.29309844970703125, 0.3096656799316406, 0.32623291015625, 0.3428001403808594, 0.35936737060546875, 0.3759346008300781, 0.3925018310546875, 0.4090690612792969, 0.42563629150390625, 0.4422035217285156, 0.458770751953125, 0.4753379821777344, 0.49190521240234375, 0.5084724426269531, 0.5250396728515625, 0.5416069030761719, 0.5581741333007812, 0.5747413635253906, 0.59130859375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 28.0, 165.0, 457.0, 270.0, 55.0, 12.0, 7.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.622913360595703, -26.4532527923584, -25.283594131469727, -24.113933563232422, -22.94427490234375, -21.774614334106445, -20.60495376586914, -19.43529510498047, -18.265634536743164, -17.09597396850586, -15.926315307617188, -14.756654739379883, -13.586995124816895, -12.417335510253906, -11.247674942016602, -10.078015327453613, -8.908355712890625, -7.738696098327637, -6.56903600692749, -5.399375915527344, -4.2297163009643555, -3.060056686401367, -1.8903965950012207, -0.7207365036010742, 0.44892311096191406, 1.6185829639434814, 2.788242816925049, 3.957902669906616, 5.127562522888184, 6.297222137451172, 7.466882228851318, 8.636542320251465, 9.806198120117188, 10.975857734680176, 12.145517349243164, 13.315177917480469, 14.484837532043457, 15.654497146606445, 16.82415771484375, 17.993816375732422, 19.163476943969727, 20.33313751220703, 21.502796173095703, 22.672456741333008, 23.842117309570312, 25.011775970458984, 26.18143653869629, 27.351097106933594, 28.520755767822266, 29.69041633605957, 30.860074996948242, 32.02973556518555, 33.19939422607422, 34.369056701660156, 35.53871536254883, 36.7083740234375, 37.87803649902344, 39.04769515991211, 40.21735763549805, 41.38701629638672, 42.55667495727539, 43.72633361816406, 44.89599609375, 46.06565475463867, 47.235313415527344]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 10.0, 11.0, 9.0, 17.0, 17.0, 29.0, 34.0, 34.0, 28.0, 47.0, 38.0, 51.0, 62.0, 62.0, 63.0, 53.0, 63.0, 47.0, 54.0, 54.0, 54.0, 34.0, 23.0, 25.0, 20.0, 21.0, 12.0, 10.0, 3.0, 9.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.230874538421631, -6.020956993103027, -5.811038970947266, -5.601121425628662, -5.391203880310059, -5.181285858154297, -4.971368312835693, -4.76145076751709, -4.551532745361328, -4.341615200042725, -4.131697177886963, -3.9217796325683594, -3.7118618488311768, -3.501944065093994, -3.2920265197753906, -3.082108736038208, -2.8721909523010254, -2.6622731685638428, -2.45235538482666, -2.2424378395080566, -2.032520055770874, -1.8226022720336914, -1.6126846075057983, -1.4027669429779053, -1.1928491592407227, -0.9829314351081848, -0.773013710975647, -0.5630959868431091, -0.3531782627105713, -0.14326047897338867, 0.0666571855545044, 0.27657485008239746, 0.4864921569824219, 0.6964098811149597, 0.9063276052474976, 1.1162452697753906, 1.3261630535125732, 1.5360808372497559, 1.745998501777649, 1.955916166305542, 2.1658339500427246, 2.3757517337799072, 2.58566951751709, 2.7955870628356934, 3.005504846572876, 3.2154226303100586, 3.425340175628662, 3.6352579593658447, 3.8451757431030273, 4.055093288421631, 4.265011310577393, 4.474928855895996, 4.684846878051758, 4.894764423370361, 5.104681968688965, 5.314599990844727, 5.52451753616333, 5.734435081481934, 5.944353103637695, 6.154270648956299, 6.364188194274902, 6.574106216430664, 6.784023761749268, 6.993941307067871, 7.203859329223633]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 8.0, 4.0, 19.0, 37.0, 65.0, 173.0, 357.0, 994.0, 5403.0, 730282.0, 3449324.0, 6044.0, 1047.0, 286.0, 112.0, 57.0, 29.0, 11.0, 7.0, 1.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8828125, -9.57421875, -9.265625, -8.95703125, -8.6484375, -8.33984375, -8.03125, -7.72265625, -7.4140625, -7.10546875, -6.796875, -6.48828125, -6.1796875, -5.87109375, -5.5625, -5.25390625, -4.9453125, -4.63671875, -4.328125, -4.01953125, -3.7109375, -3.40234375, -3.09375, -2.78515625, -2.4765625, -2.16796875, -1.859375, -1.55078125, -1.2421875, -0.93359375, -0.625, -0.31640625, -0.0078125, 0.30078125, 0.609375, 0.91796875, 1.2265625, 1.53515625, 1.84375, 2.15234375, 2.4609375, 2.76953125, 3.078125, 3.38671875, 3.6953125, 4.00390625, 4.3125, 4.62109375, 4.9296875, 5.23828125, 5.546875, 5.85546875, 6.1640625, 6.47265625, 6.78125, 7.08984375, 7.3984375, 7.70703125, 8.015625, 8.32421875, 8.6328125, 8.94140625, 9.25, 9.55859375, 9.8671875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 9.0, 22.0, 31.0, 79.0, 102.0, 158.0, 151.0, 138.0, 124.0, 67.0, 43.0, 22.0, 14.0, 8.0, 3.0, 1.0, 4.0, 3.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.281494140625, -0.2725791931152344, -0.26366424560546875, -0.2547492980957031, -0.2458343505859375, -0.23691940307617188, -0.22800445556640625, -0.21908950805664062, -0.210174560546875, -0.20125961303710938, -0.19234466552734375, -0.18342971801757812, -0.1745147705078125, -0.16559982299804688, -0.15668487548828125, -0.14776992797851562, -0.13885498046875, -0.12994003295898438, -0.12102508544921875, -0.11211013793945312, -0.1031951904296875, -0.09428024291992188, -0.08536529541015625, -0.07645034790039062, -0.067535400390625, -0.058620452880859375, -0.04970550537109375, -0.040790557861328125, -0.0318756103515625, -0.022960662841796875, -0.01404571533203125, -0.005130767822265625, 0.0037841796875, 0.012699127197265625, 0.02161407470703125, 0.030529022216796875, 0.0394439697265625, 0.048358917236328125, 0.05727386474609375, 0.06618881225585938, 0.075103759765625, 0.08401870727539062, 0.09293365478515625, 0.10184860229492188, 0.1107635498046875, 0.11967849731445312, 0.12859344482421875, 0.13750839233398438, 0.14642333984375, 0.15533828735351562, 0.16425323486328125, 0.17316818237304688, 0.1820831298828125, 0.19099807739257812, 0.19991302490234375, 0.20882797241210938, 0.217742919921875, 0.22665786743164062, 0.23557281494140625, 0.24448776245117188, 0.2534027099609375, 0.2623176574707031, 0.27123260498046875, 0.2801475524902344, 0.2890625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 10.0, 9.0, 15.0, 19.0, 34.0, 61.0, 107.0, 219.0, 441.0, 1056.0, 2870.0, 10065.0, 52386.0, 2814799.0, 1250811.0, 47363.0, 9431.0, 2714.0, 992.0, 460.0, 180.0, 99.0, 64.0, 30.0, 12.0, 10.0, 12.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7890625, -3.65826416015625, -3.5274658203125, -3.39666748046875, -3.265869140625, -3.13507080078125, -3.0042724609375, -2.87347412109375, -2.74267578125, -2.61187744140625, -2.4810791015625, -2.35028076171875, -2.219482421875, -2.08868408203125, -1.9578857421875, -1.82708740234375, -1.6962890625, -1.56549072265625, -1.4346923828125, -1.30389404296875, -1.173095703125, -1.04229736328125, -0.9114990234375, -0.78070068359375, -0.64990234375, -0.51910400390625, -0.3883056640625, -0.25750732421875, -0.126708984375, 0.00408935546875, 0.1348876953125, 0.26568603515625, 0.396484375, 0.52728271484375, 0.6580810546875, 0.78887939453125, 0.919677734375, 1.05047607421875, 1.1812744140625, 1.31207275390625, 1.44287109375, 1.57366943359375, 1.7044677734375, 1.83526611328125, 1.966064453125, 2.09686279296875, 2.2276611328125, 2.35845947265625, 2.4892578125, 2.62005615234375, 2.7508544921875, 2.88165283203125, 3.012451171875, 3.14324951171875, 3.2740478515625, 3.40484619140625, 3.53564453125, 3.66644287109375, 3.7972412109375, 3.92803955078125, 4.058837890625, 4.18963623046875, 4.3204345703125, 4.45123291015625, 4.58203125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 6.0, 3.0, 8.0, 9.0, 10.0, 16.0, 28.0, 22.0, 38.0, 76.0, 127.0, 190.0, 497.0, 1864.0, 519.0, 238.0, 132.0, 91.0, 69.0, 38.0, 20.0, 15.0, 11.0, 18.0, 11.0, 7.0, 2.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.367919921875, -0.3515892028808594, -0.33525848388671875, -0.3189277648925781, -0.3025970458984375, -0.2862663269042969, -0.26993560791015625, -0.2536048889160156, -0.237274169921875, -0.22094345092773438, -0.20461273193359375, -0.18828201293945312, -0.1719512939453125, -0.15562057495117188, -0.13928985595703125, -0.12295913696289062, -0.10662841796875, -0.09029769897460938, -0.07396697998046875, -0.057636260986328125, -0.0413055419921875, -0.024974822998046875, -0.00864410400390625, 0.007686614990234375, 0.024017333984375, 0.040348052978515625, 0.05667877197265625, 0.07300949096679688, 0.0893402099609375, 0.10567092895507812, 0.12200164794921875, 0.13833236694335938, 0.1546630859375, 0.17099380493164062, 0.18732452392578125, 0.20365524291992188, 0.2199859619140625, 0.23631668090820312, 0.25264739990234375, 0.2689781188964844, 0.285308837890625, 0.3016395568847656, 0.31797027587890625, 0.3343009948730469, 0.3506317138671875, 0.3669624328613281, 0.38329315185546875, 0.3996238708496094, 0.41595458984375, 0.4322853088378906, 0.44861602783203125, 0.4649467468261719, 0.4812774658203125, 0.4976081848144531, 0.5139389038085938, 0.5302696228027344, 0.546600341796875, 0.5629310607910156, 0.5792617797851562, 0.5955924987792969, 0.6119232177734375, 0.6282539367675781, 0.6445846557617188, 0.6609153747558594, 0.67724609375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 8.0, 31.0, 44.0, 98.0, 190.0, 224.0, 175.0, 103.0, 70.0, 26.0, 15.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.266778945922852, -7.095783710479736, -6.924788951873779, -6.753793716430664, -6.582798480987549, -6.411803722381592, -6.240808486938477, -6.0698137283325195, -5.898818492889404, -5.727823257446289, -5.556828498840332, -5.385833263397217, -5.214838027954102, -5.0438432693481445, -4.872848033905029, -4.701852798461914, -4.530858039855957, -4.359862804412842, -4.188868045806885, -4.0178728103637695, -3.8468778133392334, -3.6758828163146973, -3.504887580871582, -3.333892583847046, -3.1628971099853516, -2.9919021129608154, -2.8209068775177, -2.649911880493164, -2.478916883468628, -2.307921886444092, -2.1369266510009766, -1.9659316539764404, -1.7949368953704834, -1.6239417791366577, -1.4529467821121216, -1.281951665878296, -1.1109566688537598, -0.9399615526199341, -0.7689664363861084, -0.5979714393615723, -0.4269763231277466, -0.2559812664985657, -0.08498618006706238, 0.08600890636444092, 0.2570039629936218, 0.42799901962280273, 0.5989941358566284, 0.7699891328811646, 0.9409842491149902, 1.111979365348816, 1.282974362373352, 1.4539694786071777, 1.6249644756317139, 1.7959595918655396, 1.9669547080993652, 2.1379497051239014, 2.3089447021484375, 2.4799396991729736, 2.650934934616089, 2.821929931640625, 2.992924928665161, 3.1639199256896973, 3.3349151611328125, 3.5059101581573486, 3.676905393600464]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 3.0, 2.0, 4.0, 1.0, 13.0, 15.0, 5.0, 6.0, 13.0, 16.0, 14.0, 9.0, 21.0, 25.0, 28.0, 26.0, 35.0, 38.0, 42.0, 36.0, 44.0, 47.0, 41.0, 40.0, 40.0, 28.0, 47.0, 34.0, 41.0, 27.0, 36.0, 36.0, 30.0, 19.0, 17.0, 20.0, 19.0, 14.0, 15.0, 10.0, 10.0, 4.0, 2.0, 7.0, 12.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2932707071304321, -1.2474721670150757, -1.2016737461090088, -1.1558752059936523, -1.110076665878296, -1.064278244972229, -1.0184797048568726, -0.9726812243461609, -0.9268827438354492, -0.8810842633247375, -0.8352857828140259, -0.7894872426986694, -0.7436887621879578, -0.6978902816772461, -0.6520917415618896, -0.606293261051178, -0.5604947805404663, -0.5146963000297546, -0.4688977897167206, -0.4230992794036865, -0.37730079889297485, -0.3315023183822632, -0.2857038080692291, -0.23990529775619507, -0.1941068172454834, -0.14830832183361053, -0.10250982642173767, -0.05671133100986481, -0.010912835597991943, 0.03488565981388092, 0.08068415522575378, 0.12648266553878784, 0.1722811460494995, 0.21807964146137238, 0.26387813687324524, 0.3096766471862793, 0.35547512769699097, 0.40127360820770264, 0.4470721185207367, 0.49287062883377075, 0.5386691093444824, 0.5844675898551941, 0.6302660703659058, 0.6760646104812622, 0.7218630909919739, 0.7676615715026855, 0.813460111618042, 0.8592585921287537, 0.9050570726394653, 0.950855553150177, 0.9966540336608887, 1.0424525737762451, 1.0882511138916016, 1.1340495347976685, 1.179848074913025, 1.2256464958190918, 1.2714450359344482, 1.3172435760498047, 1.3630419969558716, 1.408840537071228, 1.454638957977295, 1.5004374980926514, 1.5462360382080078, 1.5920345783233643, 1.6378329992294312]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 11.0, 3.0, 6.0, 9.0, 8.0, 17.0, 28.0, 43.0, 54.0, 55.0, 118.0, 130.0, 181.0, 258.0, 368.0, 542.0, 811.0, 1408.0, 2422.0, 5592.0, 15646.0, 58280.0, 295171.0, 506774.0, 117035.0, 26846.0, 8367.0, 3510.0, 1760.0, 950.0, 621.0, 449.0, 306.0, 216.0, 156.0, 102.0, 92.0, 62.0, 37.0, 28.0, 23.0, 16.0, 14.0, 10.0, 5.0, 7.0, 5.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.287109375, -2.22027587890625, -2.1534423828125, -2.08660888671875, -2.019775390625, -1.95294189453125, -1.8861083984375, -1.81927490234375, -1.75244140625, -1.68560791015625, -1.6187744140625, -1.55194091796875, -1.485107421875, -1.41827392578125, -1.3514404296875, -1.28460693359375, -1.2177734375, -1.15093994140625, -1.0841064453125, -1.01727294921875, -0.950439453125, -0.88360595703125, -0.8167724609375, -0.74993896484375, -0.68310546875, -0.61627197265625, -0.5494384765625, -0.48260498046875, -0.415771484375, -0.34893798828125, -0.2821044921875, -0.21527099609375, -0.1484375, -0.08160400390625, -0.0147705078125, 0.05206298828125, 0.118896484375, 0.18572998046875, 0.2525634765625, 0.31939697265625, 0.38623046875, 0.45306396484375, 0.5198974609375, 0.58673095703125, 0.653564453125, 0.72039794921875, 0.7872314453125, 0.85406494140625, 0.9208984375, 0.98773193359375, 1.0545654296875, 1.12139892578125, 1.188232421875, 1.25506591796875, 1.3218994140625, 1.38873291015625, 1.45556640625, 1.52239990234375, 1.5892333984375, 1.65606689453125, 1.722900390625, 1.78973388671875, 1.8565673828125, 1.92340087890625, 1.990234375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 4.0, 8.0, 16.0, 19.0, 43.0, 58.0, 91.0, 110.0, 125.0, 144.0, 120.0, 80.0, 69.0, 47.0, 18.0, 20.0, 7.0, 8.0, 6.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.258056640625, -0.24919509887695312, -0.24033355712890625, -0.23147201538085938, -0.2226104736328125, -0.21374893188476562, -0.20488739013671875, -0.19602584838867188, -0.187164306640625, -0.17830276489257812, -0.16944122314453125, -0.16057968139648438, -0.1517181396484375, -0.14285659790039062, -0.13399505615234375, -0.12513351440429688, -0.11627197265625, -0.10741043090820312, -0.09854888916015625, -0.08968734741210938, -0.0808258056640625, -0.07196426391601562, -0.06310272216796875, -0.054241180419921875, -0.045379638671875, -0.036518096923828125, -0.02765655517578125, -0.018795013427734375, -0.0099334716796875, -0.001071929931640625, 0.00778961181640625, 0.016651153564453125, 0.0255126953125, 0.034374237060546875, 0.04323577880859375, 0.052097320556640625, 0.0609588623046875, 0.06982040405273438, 0.07868194580078125, 0.08754348754882812, 0.096405029296875, 0.10526657104492188, 0.11412811279296875, 0.12298965454101562, 0.1318511962890625, 0.14071273803710938, 0.14957427978515625, 0.15843582153320312, 0.16729736328125, 0.17615890502929688, 0.18502044677734375, 0.19388198852539062, 0.2027435302734375, 0.21160507202148438, 0.22046661376953125, 0.22932815551757812, 0.238189697265625, 0.24705123901367188, 0.25591278076171875, 0.2647743225097656, 0.2736358642578125, 0.2824974060058594, 0.29135894775390625, 0.3002204895019531, 0.30908203125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 1.0, 4.0, 7.0, 4.0, 5.0, 8.0, 10.0, 15.0, 29.0, 34.0, 42.0, 90.0, 140.0, 234.0, 450.0, 913.0, 2025.0, 6109.0, 31378.0, 291275.0, 628410.0, 70958.0, 10832.0, 3027.0, 1112.0, 575.0, 340.0, 190.0, 107.0, 79.0, 45.0, 25.0, 22.0, 12.0, 15.0, 8.0, 7.0, 5.0, 6.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.484375, -3.3726806640625, -3.260986328125, -3.1492919921875, -3.03759765625, -2.9259033203125, -2.814208984375, -2.7025146484375, -2.5908203125, -2.4791259765625, -2.367431640625, -2.2557373046875, -2.14404296875, -2.0323486328125, -1.920654296875, -1.8089599609375, -1.697265625, -1.5855712890625, -1.473876953125, -1.3621826171875, -1.25048828125, -1.1387939453125, -1.027099609375, -0.9154052734375, -0.8037109375, -0.6920166015625, -0.580322265625, -0.4686279296875, -0.35693359375, -0.2452392578125, -0.133544921875, -0.0218505859375, 0.08984375, 0.2015380859375, 0.313232421875, 0.4249267578125, 0.53662109375, 0.6483154296875, 0.760009765625, 0.8717041015625, 0.9833984375, 1.0950927734375, 1.206787109375, 1.3184814453125, 1.43017578125, 1.5418701171875, 1.653564453125, 1.7652587890625, 1.876953125, 1.9886474609375, 2.100341796875, 2.2120361328125, 2.32373046875, 2.4354248046875, 2.547119140625, 2.6588134765625, 2.7705078125, 2.8822021484375, 2.993896484375, 3.1055908203125, 3.21728515625, 3.3289794921875, 3.440673828125, 3.5523681640625, 3.6640625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 8.0, 18.0, 8.0, 15.0, 11.0, 15.0, 21.0, 18.0, 23.0, 34.0, 22.0, 40.0, 39.0, 37.0, 39.0, 40.0, 38.0, 50.0, 53.0, 37.0, 57.0, 39.0, 36.0, 41.0, 44.0, 32.0, 21.0, 26.0, 23.0, 14.0, 15.0, 9.0, 8.0, 10.0, 12.0, 7.0, 8.0, 8.0, 5.0, 1.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.7041015625, -0.6799468994140625, -0.655792236328125, -0.6316375732421875, -0.60748291015625, -0.5833282470703125, -0.559173583984375, -0.5350189208984375, -0.5108642578125, -0.4867095947265625, -0.462554931640625, -0.4384002685546875, -0.41424560546875, -0.3900909423828125, -0.365936279296875, -0.3417816162109375, -0.317626953125, -0.2934722900390625, -0.269317626953125, -0.2451629638671875, -0.22100830078125, -0.1968536376953125, -0.172698974609375, -0.1485443115234375, -0.1243896484375, -0.1002349853515625, -0.076080322265625, -0.0519256591796875, -0.02777099609375, -0.0036163330078125, 0.020538330078125, 0.0446929931640625, 0.06884765625, 0.0930023193359375, 0.117156982421875, 0.1413116455078125, 0.16546630859375, 0.1896209716796875, 0.213775634765625, 0.2379302978515625, 0.2620849609375, 0.2862396240234375, 0.310394287109375, 0.3345489501953125, 0.35870361328125, 0.3828582763671875, 0.407012939453125, 0.4311676025390625, 0.455322265625, 0.4794769287109375, 0.503631591796875, 0.5277862548828125, 0.55194091796875, 0.5760955810546875, 0.600250244140625, 0.6244049072265625, 0.6485595703125, 0.6727142333984375, 0.696868896484375, 0.7210235595703125, 0.74517822265625, 0.7693328857421875, 0.793487548828125, 0.8176422119140625, 0.841796875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 7.0, 13.0, 24.0, 34.0, 50.0, 92.0, 146.0, 350.0, 701.0, 1736.0, 4906.0, 17258.0, 83832.0, 464829.0, 387335.0, 65934.0, 14176.0, 4293.0, 1509.0, 651.0, 302.0, 172.0, 81.0, 57.0, 29.0, 14.0, 9.0, 4.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3095703125, -1.2720794677734375, -1.234588623046875, -1.1970977783203125, -1.15960693359375, -1.1221160888671875, -1.084625244140625, -1.0471343994140625, -1.0096435546875, -0.9721527099609375, -0.934661865234375, -0.8971710205078125, -0.85968017578125, -0.8221893310546875, -0.784698486328125, -0.7472076416015625, -0.709716796875, -0.6722259521484375, -0.634735107421875, -0.5972442626953125, -0.55975341796875, -0.5222625732421875, -0.484771728515625, -0.4472808837890625, -0.4097900390625, -0.3722991943359375, -0.334808349609375, -0.2973175048828125, -0.25982666015625, -0.2223358154296875, -0.184844970703125, -0.1473541259765625, -0.10986328125, -0.0723724365234375, -0.034881591796875, 0.0026092529296875, 0.04010009765625, 0.0775909423828125, 0.115081787109375, 0.1525726318359375, 0.1900634765625, 0.2275543212890625, 0.265045166015625, 0.3025360107421875, 0.34002685546875, 0.3775177001953125, 0.415008544921875, 0.4524993896484375, 0.489990234375, 0.5274810791015625, 0.564971923828125, 0.6024627685546875, 0.63995361328125, 0.6774444580078125, 0.714935302734375, 0.7524261474609375, 0.7899169921875, 0.8274078369140625, 0.864898681640625, 0.9023895263671875, 0.93988037109375, 0.9773712158203125, 1.014862060546875, 1.0523529052734375, 1.08984375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 7.0, 12.0, 18.0, 34.0, 40.0, 64.0, 112.0, 136.0, 144.0, 112.0, 95.0, 63.0, 46.0, 34.0, 21.0, 13.0, 12.0, 6.0, 9.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002906322479248047, -0.0002824142575263977, -0.0002741962671279907, -0.00026597827672958374, -0.00025776028633117676, -0.0002495422959327698, -0.0002413243055343628, -0.0002331063151359558, -0.00022488832473754883, -0.00021667033433914185, -0.00020845234394073486, -0.00020023435354232788, -0.0001920163631439209, -0.00018379837274551392, -0.00017558038234710693, -0.00016736239194869995, -0.00015914440155029297, -0.00015092641115188599, -0.000142708420753479, -0.00013449043035507202, -0.00012627243995666504, -0.00011805444955825806, -0.00010983645915985107, -0.00010161846876144409, -9.340047836303711e-05, -8.518248796463013e-05, -7.696449756622314e-05, -6.874650716781616e-05, -6.052851676940918e-05, -5.23105263710022e-05, -4.4092535972595215e-05, -3.587454557418823e-05, -2.765655517578125e-05, -1.9438564777374268e-05, -1.1220574378967285e-05, -3.0025839805603027e-06, 5.21540641784668e-06, 1.3433396816253662e-05, 2.1651387214660645e-05, 2.9869377613067627e-05, 3.808736801147461e-05, 4.630535840988159e-05, 5.4523348808288574e-05, 6.274133920669556e-05, 7.095932960510254e-05, 7.917732000350952e-05, 8.73953104019165e-05, 9.561330080032349e-05, 0.00010383129119873047, 0.00011204928159713745, 0.00012026727199554443, 0.00012848526239395142, 0.0001367032527923584, 0.00014492124319076538, 0.00015313923358917236, 0.00016135722398757935, 0.00016957521438598633, 0.0001777932047843933, 0.0001860111951828003, 0.00019422918558120728, 0.00020244717597961426, 0.00021066516637802124, 0.00021888315677642822, 0.0002271011471748352, 0.0002353191375732422]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 6.0, 12.0, 26.0, 52.0, 101.0, 241.0, 791.0, 4232.0, 101104.0, 915192.0, 23867.0, 2140.0, 487.0, 175.0, 63.0, 35.0, 11.0, 7.0, 9.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.171875, -4.0657958984375, -3.959716796875, -3.8536376953125, -3.74755859375, -3.6414794921875, -3.535400390625, -3.4293212890625, -3.3232421875, -3.2171630859375, -3.111083984375, -3.0050048828125, -2.89892578125, -2.7928466796875, -2.686767578125, -2.5806884765625, -2.474609375, -2.3685302734375, -2.262451171875, -2.1563720703125, -2.05029296875, -1.9442138671875, -1.838134765625, -1.7320556640625, -1.6259765625, -1.5198974609375, -1.413818359375, -1.3077392578125, -1.20166015625, -1.0955810546875, -0.989501953125, -0.8834228515625, -0.77734375, -0.6712646484375, -0.565185546875, -0.4591064453125, -0.35302734375, -0.2469482421875, -0.140869140625, -0.0347900390625, 0.0712890625, 0.1773681640625, 0.283447265625, 0.3895263671875, 0.49560546875, 0.6016845703125, 0.707763671875, 0.8138427734375, 0.919921875, 1.0260009765625, 1.132080078125, 1.2381591796875, 1.34423828125, 1.4503173828125, 1.556396484375, 1.6624755859375, 1.7685546875, 1.8746337890625, 1.980712890625, 2.0867919921875, 2.19287109375, 2.2989501953125, 2.405029296875, 2.5111083984375, 2.6171875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 5.0, 2.0, 15.0, 18.0, 11.0, 24.0, 34.0, 37.0, 46.0, 59.0, 68.0, 74.0, 83.0, 86.0, 73.0, 71.0, 74.0, 49.0, 33.0, 38.0, 25.0, 20.0, 14.0, 16.0, 9.0, 4.0, 1.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.80078125, -0.7814712524414062, -0.7621612548828125, -0.7428512573242188, -0.723541259765625, -0.7042312622070312, -0.6849212646484375, -0.6656112670898438, -0.64630126953125, -0.6269912719726562, -0.6076812744140625, -0.5883712768554688, -0.569061279296875, -0.5497512817382812, -0.5304412841796875, -0.5111312866210938, -0.4918212890625, -0.47251129150390625, -0.4532012939453125, -0.43389129638671875, -0.414581298828125, -0.39527130126953125, -0.3759613037109375, -0.35665130615234375, -0.33734130859375, -0.31803131103515625, -0.2987213134765625, -0.27941131591796875, -0.260101318359375, -0.24079132080078125, -0.2214813232421875, -0.20217132568359375, -0.182861328125, -0.16355133056640625, -0.1442413330078125, -0.12493133544921875, -0.105621337890625, -0.08631134033203125, -0.0670013427734375, -0.04769134521484375, -0.02838134765625, -0.00907135009765625, 0.0102386474609375, 0.02954864501953125, 0.048858642578125, 0.06816864013671875, 0.0874786376953125, 0.10678863525390625, 0.1260986328125, 0.14540863037109375, 0.1647186279296875, 0.18402862548828125, 0.203338623046875, 0.22264862060546875, 0.2419586181640625, 0.26126861572265625, 0.28057861328125, 0.29988861083984375, 0.3191986083984375, 0.33850860595703125, 0.357818603515625, 0.37712860107421875, 0.3964385986328125, 0.41574859619140625, 0.43505859375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 8.0, 21.0, 48.0, 75.0, 128.0, 196.0, 202.0, 150.0, 88.0, 45.0, 14.0, 14.0, 8.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.611410140991211, -10.024029731750488, -9.436649322509766, -8.84926986694336, -8.261889457702637, -7.674509048461914, -7.08712911605835, -6.499749183654785, -5.9123687744140625, -5.32498836517334, -4.737608432769775, -4.150228500366211, -3.5628480911254883, -2.9754679203033447, -2.388087749481201, -1.8007078170776367, -1.213327407836914, -0.6259472370147705, -0.03856706619262695, 0.5488131046295166, 1.1361932754516602, 1.7235734462738037, 2.3109536170959473, 2.8983335494995117, 3.4857139587402344, 4.073094367980957, 4.6604743003845215, 5.247854232788086, 5.835234642028809, 6.422615051269531, 7.009994983673096, 7.59737491607666, 8.18475341796875, 8.772133827209473, 9.359514236450195, 9.946893692016602, 10.534274101257324, 11.121654510498047, 11.709033966064453, 12.296414375305176, 12.883794784545898, 13.471175193786621, 14.058555603027344, 14.64593505859375, 15.233315467834473, 15.820695877075195, 16.4080753326416, 16.99545669555664, 17.582836151123047, 18.170215606689453, 18.757596969604492, 19.3449764251709, 19.932357788085938, 20.519737243652344, 21.10711669921875, 21.694496154785156, 22.281877517700195, 22.8692569732666, 23.45663833618164, 24.044017791748047, 24.631397247314453, 25.218778610229492, 25.8061580657959, 26.393539428710938, 26.980918884277344]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 6.0, 3.0, 2.0, 4.0, 6.0, 3.0, 15.0, 7.0, 6.0, 15.0, 16.0, 17.0, 17.0, 23.0, 30.0, 26.0, 30.0, 32.0, 30.0, 35.0, 22.0, 36.0, 41.0, 37.0, 48.0, 34.0, 40.0, 27.0, 49.0, 38.0, 28.0, 36.0, 27.0, 26.0, 27.0, 20.0, 17.0, 23.0, 15.0, 12.0, 16.0, 11.0, 7.0, 12.0, 8.0, 10.0, 4.0, 2.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0], "bins": [-4.424734115600586, -4.280102252960205, -4.135470390319824, -3.9908382892608643, -3.8462064266204834, -3.7015743255615234, -3.5569424629211426, -3.4123106002807617, -3.267678737640381, -3.123046875, -2.97841477394104, -2.833782911300659, -2.6891510486602783, -2.5445189476013184, -2.3998870849609375, -2.2552552223205566, -2.1106231212615967, -1.9659911394119263, -1.8213592767715454, -1.676727294921875, -1.5320954322814941, -1.3874634504318237, -1.2428314685821533, -1.0981996059417725, -0.953567624092102, -0.8089357018470764, -0.6643037796020508, -0.5196717977523804, -0.37503987550735474, -0.2304079532623291, -0.08577597141265869, 0.05885589122772217, 0.20348787307739258, 0.3481197953224182, 0.49275174736976624, 0.6373836994171143, 0.7820156216621399, 0.9266475439071655, 1.071279525756836, 1.2159113883972168, 1.3605433702468872, 1.5051753520965576, 1.6498072147369385, 1.7944391965866089, 1.9390711784362793, 2.08370304107666, 2.228334903717041, 2.372966766357422, 2.517598867416382, 2.6622307300567627, 2.8068628311157227, 2.9514946937561035, 3.0961265563964844, 3.2407584190368652, 3.385390520095825, 3.530022382736206, 3.674654483795166, 3.819286346435547, 3.963918447494507, 4.108550071716309, 4.253182411193848, 4.3978142738342285, 4.542446136474609, 4.68707799911499, 4.831709861755371]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 7.0, 11.0, 5.0, 12.0, 21.0, 37.0, 47.0, 52.0, 71.0, 121.0, 169.0, 328.0, 608.0, 1236.0, 2869.0, 8878.0, 40626.0, 747841.0, 3320244.0, 54016.0, 10885.0, 3279.0, 1354.0, 653.0, 346.0, 204.0, 132.0, 81.0, 44.0, 30.0, 21.0, 17.0, 13.0, 12.0, 7.0, 1.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.099609375, -3.01123046875, -2.9228515625, -2.83447265625, -2.74609375, -2.65771484375, -2.5693359375, -2.48095703125, -2.392578125, -2.30419921875, -2.2158203125, -2.12744140625, -2.0390625, -1.95068359375, -1.8623046875, -1.77392578125, -1.685546875, -1.59716796875, -1.5087890625, -1.42041015625, -1.33203125, -1.24365234375, -1.1552734375, -1.06689453125, -0.978515625, -0.89013671875, -0.8017578125, -0.71337890625, -0.625, -0.53662109375, -0.4482421875, -0.35986328125, -0.271484375, -0.18310546875, -0.0947265625, -0.00634765625, 0.08203125, 0.17041015625, 0.2587890625, 0.34716796875, 0.435546875, 0.52392578125, 0.6123046875, 0.70068359375, 0.7890625, 0.87744140625, 0.9658203125, 1.05419921875, 1.142578125, 1.23095703125, 1.3193359375, 1.40771484375, 1.49609375, 1.58447265625, 1.6728515625, 1.76123046875, 1.849609375, 1.93798828125, 2.0263671875, 2.11474609375, 2.203125, 2.29150390625, 2.3798828125, 2.46826171875, 2.556640625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 5.0, 4.0, 10.0, 13.0, 16.0, 28.0, 35.0, 52.0, 81.0, 77.0, 109.0, 115.0, 95.0, 91.0, 75.0, 55.0, 46.0, 31.0, 20.0, 22.0, 6.0, 5.0, 3.0, 3.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25048828125, -0.24203109741210938, -0.23357391357421875, -0.22511672973632812, -0.2166595458984375, -0.20820236206054688, -0.19974517822265625, -0.19128799438476562, -0.182830810546875, -0.17437362670898438, -0.16591644287109375, -0.15745925903320312, -0.1490020751953125, -0.14054489135742188, -0.13208770751953125, -0.12363052368164062, -0.11517333984375, -0.10671615600585938, -0.09825897216796875, -0.08980178833007812, -0.0813446044921875, -0.07288742065429688, -0.06443023681640625, -0.055973052978515625, -0.047515869140625, -0.039058685302734375, -0.03060150146484375, -0.022144317626953125, -0.0136871337890625, -0.005229949951171875, 0.00322723388671875, 0.011684417724609375, 0.0201416015625, 0.028598785400390625, 0.03705596923828125, 0.045513153076171875, 0.0539703369140625, 0.062427520751953125, 0.07088470458984375, 0.07934188842773438, 0.087799072265625, 0.09625625610351562, 0.10471343994140625, 0.11317062377929688, 0.1216278076171875, 0.13008499145507812, 0.13854217529296875, 0.14699935913085938, 0.15545654296875, 0.16391372680664062, 0.17237091064453125, 0.18082809448242188, 0.1892852783203125, 0.19774246215820312, 0.20619964599609375, 0.21465682983398438, 0.223114013671875, 0.23157119750976562, 0.24002838134765625, 0.24848556518554688, 0.2569427490234375, 0.2653999328613281, 0.27385711669921875, 0.2823143005371094, 0.290771484375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 10.0, 6.0, 15.0, 29.0, 37.0, 71.0, 114.0, 255.0, 544.0, 1393.0, 4375.0, 19542.0, 193373.0, 3867898.0, 89150.0, 12452.0, 3109.0, 1094.0, 426.0, 180.0, 91.0, 55.0, 28.0, 16.0, 10.0, 3.0, 6.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.03125, -4.88897705078125, -4.7467041015625, -4.60443115234375, -4.462158203125, -4.31988525390625, -4.1776123046875, -4.03533935546875, -3.89306640625, -3.75079345703125, -3.6085205078125, -3.46624755859375, -3.323974609375, -3.18170166015625, -3.0394287109375, -2.89715576171875, -2.7548828125, -2.61260986328125, -2.4703369140625, -2.32806396484375, -2.185791015625, -2.04351806640625, -1.9012451171875, -1.75897216796875, -1.61669921875, -1.47442626953125, -1.3321533203125, -1.18988037109375, -1.047607421875, -0.90533447265625, -0.7630615234375, -0.62078857421875, -0.478515625, -0.33624267578125, -0.1939697265625, -0.05169677734375, 0.090576171875, 0.23284912109375, 0.3751220703125, 0.51739501953125, 0.65966796875, 0.80194091796875, 0.9442138671875, 1.08648681640625, 1.228759765625, 1.37103271484375, 1.5133056640625, 1.65557861328125, 1.7978515625, 1.94012451171875, 2.0823974609375, 2.22467041015625, 2.366943359375, 2.50921630859375, 2.6514892578125, 2.79376220703125, 2.93603515625, 3.07830810546875, 3.2205810546875, 3.36285400390625, 3.505126953125, 3.64739990234375, 3.7896728515625, 3.93194580078125, 4.07421875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 1.0, 4.0, 7.0, 10.0, 7.0, 9.0, 9.0, 20.0, 26.0, 43.0, 60.0, 83.0, 162.0, 361.0, 1876.0, 727.0, 271.0, 127.0, 92.0, 49.0, 34.0, 32.0, 20.0, 14.0, 10.0, 10.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69384765625, -0.6738967895507812, -0.6539459228515625, -0.6339950561523438, -0.614044189453125, -0.5940933227539062, -0.5741424560546875, -0.5541915893554688, -0.53424072265625, -0.5142898559570312, -0.4943389892578125, -0.47438812255859375, -0.454437255859375, -0.43448638916015625, -0.4145355224609375, -0.39458465576171875, -0.3746337890625, -0.35468292236328125, -0.3347320556640625, -0.31478118896484375, -0.294830322265625, -0.27487945556640625, -0.2549285888671875, -0.23497772216796875, -0.21502685546875, -0.19507598876953125, -0.1751251220703125, -0.15517425537109375, -0.135223388671875, -0.11527252197265625, -0.0953216552734375, -0.07537078857421875, -0.055419921875, -0.03546905517578125, -0.0155181884765625, 0.00443267822265625, 0.024383544921875, 0.04433441162109375, 0.0642852783203125, 0.08423614501953125, 0.10418701171875, 0.12413787841796875, 0.1440887451171875, 0.16403961181640625, 0.183990478515625, 0.20394134521484375, 0.2238922119140625, 0.24384307861328125, 0.2637939453125, 0.28374481201171875, 0.3036956787109375, 0.32364654541015625, 0.343597412109375, 0.36354827880859375, 0.3834991455078125, 0.40345001220703125, 0.42340087890625, 0.44335174560546875, 0.4633026123046875, 0.48325347900390625, 0.503204345703125, 0.5231552124023438, 0.5431060791015625, 0.5630569458007812, 0.5830078125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 4.0, 16.0, 23.0, 55.0, 98.0, 168.0, 212.0, 177.0, 112.0, 69.0, 28.0, 11.0, 12.0, 6.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.842047691345215, -6.660569190979004, -6.479090213775635, -6.297611713409424, -6.116132736206055, -5.934654235839844, -5.753175735473633, -5.571696758270264, -5.3902177810668945, -5.208739280700684, -5.0272603034973145, -4.8457818031311035, -4.664302825927734, -4.482824325561523, -4.3013458251953125, -4.119866847991943, -3.9383883476257324, -3.7569096088409424, -3.5754308700561523, -3.3939523696899414, -3.2124733924865723, -3.0309948921203613, -2.8495161533355713, -2.6680374145507812, -2.486558675765991, -2.305079936981201, -2.123601198196411, -1.9421225786209106, -1.7606438398361206, -1.5791651010513306, -1.39768648147583, -1.21620774269104, -1.03472900390625, -0.85325026512146, -0.6717715859413147, -0.49029290676116943, -0.3088141679763794, -0.12733542919158936, 0.05414319038391113, 0.23562192916870117, 0.4171006679534912, 0.5985794067382812, 0.7800580859184265, 0.9615367650985718, 1.1430155038833618, 1.3244942426681519, 1.5059728622436523, 1.6874516010284424, 1.8689303398132324, 2.0504090785980225, 2.2318878173828125, 2.4133663177490234, 2.5948452949523926, 2.7763237953186035, 2.9578025341033936, 3.1392812728881836, 3.3207600116729736, 3.5022387504577637, 3.6837174892425537, 3.8651962280273438, 4.046674728393555, 4.228153705596924, 4.409632205963135, 4.591111183166504, 4.772589683532715]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 4.0, 4.0, 6.0, 9.0, 2.0, 10.0, 17.0, 18.0, 16.0, 18.0, 12.0, 29.0, 31.0, 28.0, 38.0, 47.0, 28.0, 31.0, 40.0, 52.0, 61.0, 50.0, 40.0, 48.0, 28.0, 39.0, 32.0, 41.0, 28.0, 27.0, 22.0, 22.0, 22.0, 19.0, 18.0, 18.0, 4.0, 12.0, 8.0, 5.0, 3.0, 3.0, 7.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.9606208801269531, -1.9014036655426025, -1.8421863317489624, -1.7829689979553223, -1.7237517833709717, -1.664534568786621, -1.605317234992981, -1.5460999011993408, -1.4868826866149902, -1.4276654720306396, -1.3684481382369995, -1.3092308044433594, -1.2500135898590088, -1.1907963752746582, -1.131579041481018, -1.072361707687378, -1.0131444931030273, -0.953927218914032, -0.8947099447250366, -0.8354926705360413, -0.7762753963470459, -0.7170581221580505, -0.6578408479690552, -0.5986235737800598, -0.5394062995910645, -0.4801890254020691, -0.42097175121307373, -0.36175447702407837, -0.302537202835083, -0.24331992864608765, -0.18410265445709229, -0.12488538026809692, -0.06566810607910156, -0.006450831890106201, 0.05276644229888916, 0.11198371648788452, 0.17120099067687988, 0.23041826486587524, 0.2896355390548706, 0.34885281324386597, 0.40807008743286133, 0.4672873616218567, 0.526504635810852, 0.5857219099998474, 0.6449391841888428, 0.7041564583778381, 0.7633737325668335, 0.8225910067558289, 0.8818082809448242, 0.9410255551338196, 1.000242829322815, 1.059460163116455, 1.1186773777008057, 1.1778945922851562, 1.2371119260787964, 1.2963292598724365, 1.355546474456787, 1.4147636890411377, 1.4739810228347778, 1.533198356628418, 1.5924155712127686, 1.6516327857971191, 1.7108501195907593, 1.7700674533843994, 1.82928466796875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 6.0, 7.0, 9.0, 16.0, 17.0, 34.0, 40.0, 43.0, 64.0, 83.0, 118.0, 149.0, 225.0, 341.0, 560.0, 890.0, 1731.0, 3300.0, 8127.0, 22808.0, 73386.0, 246537.0, 441682.0, 169417.0, 50533.0, 16185.0, 6050.0, 2638.0, 1266.0, 716.0, 472.0, 291.0, 211.0, 153.0, 117.0, 93.0, 55.0, 42.0, 41.0, 33.0, 17.0, 13.0, 8.0, 8.0, 8.0, 8.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6005859375, -1.5478363037109375, -1.495086669921875, -1.4423370361328125, -1.38958740234375, -1.3368377685546875, -1.284088134765625, -1.2313385009765625, -1.1785888671875, -1.1258392333984375, -1.073089599609375, -1.0203399658203125, -0.96759033203125, -0.9148406982421875, -0.862091064453125, -0.8093414306640625, -0.756591796875, -0.7038421630859375, -0.651092529296875, -0.5983428955078125, -0.54559326171875, -0.4928436279296875, -0.440093994140625, -0.3873443603515625, -0.3345947265625, -0.2818450927734375, -0.229095458984375, -0.1763458251953125, -0.12359619140625, -0.0708465576171875, -0.018096923828125, 0.0346527099609375, 0.08740234375, 0.1401519775390625, 0.192901611328125, 0.2456512451171875, 0.29840087890625, 0.3511505126953125, 0.403900146484375, 0.4566497802734375, 0.5093994140625, 0.5621490478515625, 0.614898681640625, 0.6676483154296875, 0.72039794921875, 0.7731475830078125, 0.825897216796875, 0.8786468505859375, 0.931396484375, 0.9841461181640625, 1.036895751953125, 1.0896453857421875, 1.14239501953125, 1.1951446533203125, 1.247894287109375, 1.3006439208984375, 1.3533935546875, 1.4061431884765625, 1.458892822265625, 1.5116424560546875, 1.56439208984375, 1.6171417236328125, 1.669891357421875, 1.7226409912109375, 1.775390625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 8.0, 10.0, 20.0, 19.0, 19.0, 38.0, 53.0, 71.0, 78.0, 87.0, 83.0, 99.0, 84.0, 70.0, 72.0, 56.0, 36.0, 30.0, 22.0, 15.0, 8.0, 7.0, 4.0, 8.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.254150390625, -0.2459564208984375, -0.237762451171875, -0.2295684814453125, -0.22137451171875, -0.2131805419921875, -0.204986572265625, -0.1967926025390625, -0.1885986328125, -0.1804046630859375, -0.172210693359375, -0.1640167236328125, -0.15582275390625, -0.1476287841796875, -0.139434814453125, -0.1312408447265625, -0.123046875, -0.1148529052734375, -0.106658935546875, -0.0984649658203125, -0.09027099609375, -0.0820770263671875, -0.073883056640625, -0.0656890869140625, -0.0574951171875, -0.0493011474609375, -0.041107177734375, -0.0329132080078125, -0.02471923828125, -0.0165252685546875, -0.008331298828125, -0.0001373291015625, 0.008056640625, 0.0162506103515625, 0.024444580078125, 0.0326385498046875, 0.04083251953125, 0.0490264892578125, 0.057220458984375, 0.0654144287109375, 0.0736083984375, 0.0818023681640625, 0.089996337890625, 0.0981903076171875, 0.10638427734375, 0.1145782470703125, 0.122772216796875, 0.1309661865234375, 0.13916015625, 0.1473541259765625, 0.155548095703125, 0.1637420654296875, 0.17193603515625, 0.1801300048828125, 0.188323974609375, 0.1965179443359375, 0.2047119140625, 0.2129058837890625, 0.221099853515625, 0.2292938232421875, 0.23748779296875, 0.2456817626953125, 0.253875732421875, 0.2620697021484375, 0.270263671875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 8.0, 7.0, 14.0, 14.0, 42.0, 50.0, 70.0, 113.0, 172.0, 328.0, 513.0, 929.0, 1851.0, 4737.0, 18742.0, 117746.0, 595068.0, 258056.0, 36951.0, 7645.0, 2650.0, 1208.0, 636.0, 357.0, 242.0, 136.0, 93.0, 58.0, 40.0, 25.0, 19.0, 13.0, 15.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.20703125, -2.130126953125, -2.05322265625, -1.976318359375, -1.8994140625, -1.822509765625, -1.74560546875, -1.668701171875, -1.591796875, -1.514892578125, -1.43798828125, -1.361083984375, -1.2841796875, -1.207275390625, -1.13037109375, -1.053466796875, -0.9765625, -0.899658203125, -0.82275390625, -0.745849609375, -0.6689453125, -0.592041015625, -0.51513671875, -0.438232421875, -0.361328125, -0.284423828125, -0.20751953125, -0.130615234375, -0.0537109375, 0.023193359375, 0.10009765625, 0.177001953125, 0.25390625, 0.330810546875, 0.40771484375, 0.484619140625, 0.5615234375, 0.638427734375, 0.71533203125, 0.792236328125, 0.869140625, 0.946044921875, 1.02294921875, 1.099853515625, 1.1767578125, 1.253662109375, 1.33056640625, 1.407470703125, 1.484375, 1.561279296875, 1.63818359375, 1.715087890625, 1.7919921875, 1.868896484375, 1.94580078125, 2.022705078125, 2.099609375, 2.176513671875, 2.25341796875, 2.330322265625, 2.4072265625, 2.484130859375, 2.56103515625, 2.637939453125, 2.71484375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 3.0, 4.0, 6.0, 9.0, 12.0, 9.0, 11.0, 14.0, 22.0, 19.0, 21.0, 23.0, 22.0, 20.0, 30.0, 39.0, 38.0, 42.0, 34.0, 50.0, 45.0, 42.0, 43.0, 52.0, 37.0, 26.0, 51.0, 39.0, 31.0, 36.0, 30.0, 21.0, 19.0, 18.0, 12.0, 17.0, 16.0, 6.0, 6.0, 6.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.75146484375, -0.7276077270507812, -0.7037506103515625, -0.6798934936523438, -0.656036376953125, -0.6321792602539062, -0.6083221435546875, -0.5844650268554688, -0.56060791015625, -0.5367507934570312, -0.5128936767578125, -0.48903656005859375, -0.465179443359375, -0.44132232666015625, -0.4174652099609375, -0.39360809326171875, -0.3697509765625, -0.34589385986328125, -0.3220367431640625, -0.29817962646484375, -0.274322509765625, -0.25046539306640625, -0.2266082763671875, -0.20275115966796875, -0.17889404296875, -0.15503692626953125, -0.1311798095703125, -0.10732269287109375, -0.083465576171875, -0.05960845947265625, -0.0357513427734375, -0.01189422607421875, 0.011962890625, 0.03582000732421875, 0.0596771240234375, 0.08353424072265625, 0.107391357421875, 0.13124847412109375, 0.1551055908203125, 0.17896270751953125, 0.20281982421875, 0.22667694091796875, 0.2505340576171875, 0.27439117431640625, 0.298248291015625, 0.32210540771484375, 0.3459625244140625, 0.36981964111328125, 0.3936767578125, 0.41753387451171875, 0.4413909912109375, 0.46524810791015625, 0.489105224609375, 0.5129623413085938, 0.5368194580078125, 0.5606765747070312, 0.58453369140625, 0.6083908081054688, 0.6322479248046875, 0.6561050415039062, 0.679962158203125, 0.7038192749023438, 0.7276763916015625, 0.7515335083007812, 0.775390625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 12.0, 11.0, 16.0, 13.0, 30.0, 37.0, 65.0, 118.0, 200.0, 370.0, 795.0, 2018.0, 6248.0, 24840.0, 157995.0, 638881.0, 178851.0, 27442.0, 6739.0, 2130.0, 826.0, 411.0, 199.0, 127.0, 57.0, 39.0, 27.0, 18.0, 10.0, 8.0, 5.0, 6.0, 0.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76025390625, -0.7279434204101562, -0.6956329345703125, -0.6633224487304688, -0.631011962890625, -0.5987014770507812, -0.5663909912109375, -0.5340805053710938, -0.50177001953125, -0.46945953369140625, -0.4371490478515625, -0.40483856201171875, -0.372528076171875, -0.34021759033203125, -0.3079071044921875, -0.27559661865234375, -0.2432861328125, -0.21097564697265625, -0.1786651611328125, -0.14635467529296875, -0.114044189453125, -0.08173370361328125, -0.0494232177734375, -0.01711273193359375, 0.01519775390625, 0.04750823974609375, 0.0798187255859375, 0.11212921142578125, 0.144439697265625, 0.17675018310546875, 0.2090606689453125, 0.24137115478515625, 0.273681640625, 0.30599212646484375, 0.3383026123046875, 0.37061309814453125, 0.402923583984375, 0.43523406982421875, 0.4675445556640625, 0.49985504150390625, 0.53216552734375, 0.5644760131835938, 0.5967864990234375, 0.6290969848632812, 0.661407470703125, 0.6937179565429688, 0.7260284423828125, 0.7583389282226562, 0.7906494140625, 0.8229598999023438, 0.8552703857421875, 0.8875808715820312, 0.919891357421875, 0.9522018432617188, 0.9845123291015625, 1.0168228149414062, 1.04913330078125, 1.0814437866210938, 1.1137542724609375, 1.1460647583007812, 1.178375244140625, 1.2106857299804688, 1.2429962158203125, 1.2753067016601562, 1.3076171875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 8.0, 10.0, 6.0, 9.0, 18.0, 18.0, 23.0, 28.0, 37.0, 34.0, 51.0, 50.0, 66.0, 78.0, 74.0, 73.0, 74.0, 60.0, 57.0, 35.0, 39.0, 33.0, 24.0, 20.0, 14.0, 17.0, 5.0, 10.0, 7.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00010961294174194336, -0.00010579172521829605, -0.00010197050869464874, -9.814929217100143e-05, -9.432807564735413e-05, -9.050685912370682e-05, -8.668564260005951e-05, -8.28644260764122e-05, -7.904320955276489e-05, -7.522199302911758e-05, -7.140077650547028e-05, -6.757955998182297e-05, -6.375834345817566e-05, -5.993712693452835e-05, -5.611591041088104e-05, -5.2294693887233734e-05, -4.8473477363586426e-05, -4.465226083993912e-05, -4.083104431629181e-05, -3.70098277926445e-05, -3.318861126899719e-05, -2.9367394745349884e-05, -2.5546178221702576e-05, -2.1724961698055267e-05, -1.790374517440796e-05, -1.408252865076065e-05, -1.0261312127113342e-05, -6.440095603466034e-06, -2.6188790798187256e-06, 1.2023374438285828e-06, 5.023553967475891e-06, 8.8447704911232e-06, 1.2665987014770508e-05, 1.6487203538417816e-05, 2.0308420062065125e-05, 2.4129636585712433e-05, 2.795085310935974e-05, 3.177206963300705e-05, 3.559328615665436e-05, 3.9414502680301666e-05, 4.3235719203948975e-05, 4.705693572759628e-05, 5.087815225124359e-05, 5.46993687748909e-05, 5.852058529853821e-05, 6.234180182218552e-05, 6.616301834583282e-05, 6.998423486948013e-05, 7.380545139312744e-05, 7.762666791677475e-05, 8.144788444042206e-05, 8.526910096406937e-05, 8.909031748771667e-05, 9.291153401136398e-05, 9.673275053501129e-05, 0.0001005539670586586, 0.00010437518358230591, 0.00010819640010595322, 0.00011201761662960052, 0.00011583883315324783, 0.00011966004967689514, 0.00012348126620054245, 0.00012730248272418976, 0.00013112369924783707, 0.00013494491577148438]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 8.0, 10.0, 11.0, 23.0, 34.0, 56.0, 90.0, 159.0, 263.0, 581.0, 1206.0, 3270.0, 11251.0, 56623.0, 490776.0, 421164.0, 47765.0, 9926.0, 3068.0, 1141.0, 508.0, 248.0, 149.0, 88.0, 50.0, 29.0, 21.0, 12.0, 7.0, 12.0, 1.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.947265625, -0.9121246337890625, -0.876983642578125, -0.8418426513671875, -0.80670166015625, -0.7715606689453125, -0.736419677734375, -0.7012786865234375, -0.6661376953125, -0.6309967041015625, -0.595855712890625, -0.5607147216796875, -0.52557373046875, -0.4904327392578125, -0.455291748046875, -0.4201507568359375, -0.385009765625, -0.3498687744140625, -0.314727783203125, -0.2795867919921875, -0.24444580078125, -0.2093048095703125, -0.174163818359375, -0.1390228271484375, -0.1038818359375, -0.0687408447265625, -0.033599853515625, 0.0015411376953125, 0.03668212890625, 0.0718231201171875, 0.106964111328125, 0.1421051025390625, 0.17724609375, 0.2123870849609375, 0.247528076171875, 0.2826690673828125, 0.31781005859375, 0.3529510498046875, 0.388092041015625, 0.4232330322265625, 0.4583740234375, 0.4935150146484375, 0.528656005859375, 0.5637969970703125, 0.59893798828125, 0.6340789794921875, 0.669219970703125, 0.7043609619140625, 0.739501953125, 0.7746429443359375, 0.809783935546875, 0.8449249267578125, 0.88006591796875, 0.9152069091796875, 0.950347900390625, 0.9854888916015625, 1.0206298828125, 1.0557708740234375, 1.090911865234375, 1.1260528564453125, 1.16119384765625, 1.1963348388671875, 1.231475830078125, 1.2666168212890625, 1.3017578125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 11.0, 6.0, 3.0, 12.0, 13.0, 21.0, 25.0, 43.0, 39.0, 52.0, 81.0, 84.0, 73.0, 83.0, 80.0, 74.0, 70.0, 56.0, 38.0, 25.0, 23.0, 13.0, 17.0, 17.0, 13.0, 7.0, 9.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.578125, -0.5622215270996094, -0.5463180541992188, -0.5304145812988281, -0.5145111083984375, -0.4986076354980469, -0.48270416259765625, -0.4668006896972656, -0.450897216796875, -0.4349937438964844, -0.41909027099609375, -0.4031867980957031, -0.3872833251953125, -0.3713798522949219, -0.35547637939453125, -0.3395729064941406, -0.32366943359375, -0.3077659606933594, -0.29186248779296875, -0.2759590148925781, -0.2600555419921875, -0.24415206909179688, -0.22824859619140625, -0.21234512329101562, -0.196441650390625, -0.18053817749023438, -0.16463470458984375, -0.14873123168945312, -0.1328277587890625, -0.11692428588867188, -0.10102081298828125, -0.08511734008789062, -0.0692138671875, -0.053310394287109375, -0.03740692138671875, -0.021503448486328125, -0.0055999755859375, 0.010303497314453125, 0.02620697021484375, 0.042110443115234375, 0.058013916015625, 0.07391738891601562, 0.08982086181640625, 0.10572433471679688, 0.1216278076171875, 0.13753128051757812, 0.15343475341796875, 0.16933822631835938, 0.18524169921875, 0.20114517211914062, 0.21704864501953125, 0.23295211791992188, 0.2488555908203125, 0.2647590637207031, 0.28066253662109375, 0.2965660095214844, 0.312469482421875, 0.3283729553222656, 0.34427642822265625, 0.3601799011230469, 0.3760833740234375, 0.3919868469238281, 0.40789031982421875, 0.4237937927246094, 0.439697265625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 11.0, 37.0, 91.0, 196.0, 270.0, 236.0, 106.0, 31.0, 13.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.984037399291992, -9.29964542388916, -8.615253448486328, -7.93086051940918, -7.246468544006348, -6.562076568603516, -5.877684116363525, -5.193291664123535, -4.508899688720703, -3.824507474899292, -3.140115261077881, -2.4557230472564697, -1.7713308334350586, -1.0869386196136475, -0.40254640579223633, 0.2818460464477539, 0.9662380218505859, 1.650630235671997, 2.335022449493408, 3.0194146633148193, 3.7038068771362305, 4.3881988525390625, 5.072591304779053, 5.756983757019043, 6.441375732421875, 7.125767707824707, 7.810160160064697, 8.494552612304688, 9.17894458770752, 9.863336563110352, 10.5477294921875, 11.232121467590332, 11.916511535644531, 12.600903511047363, 13.285295486450195, 13.969688415527344, 14.654080390930176, 15.338472366333008, 16.022865295410156, 16.707256317138672, 17.39164924621582, 18.07604217529297, 18.760433197021484, 19.444826126098633, 20.12921905517578, 20.813610076904297, 21.498003005981445, 22.182395935058594, 22.86678695678711, 23.551179885864258, 24.235570907592773, 24.919963836669922, 25.604354858398438, 26.288747787475586, 26.973140716552734, 27.65753173828125, 28.3419246673584, 29.026317596435547, 29.710708618164062, 30.39510154724121, 31.07949447631836, 31.763885498046875, 32.44827651977539, 33.13267135620117, 33.81706237792969]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 9.0, 2.0, 4.0, 5.0, 5.0, 5.0, 6.0, 11.0, 7.0, 12.0, 13.0, 14.0, 14.0, 20.0, 32.0, 37.0, 32.0, 32.0, 35.0, 35.0, 37.0, 55.0, 47.0, 34.0, 48.0, 52.0, 44.0, 40.0, 43.0, 31.0, 26.0, 35.0, 32.0, 21.0, 20.0, 21.0, 16.0, 20.0, 10.0, 8.0, 8.0, 6.0, 9.0, 8.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.82372522354126, -4.681885242462158, -4.540044784545898, -4.398204803466797, -4.256364822387695, -4.114524841308594, -3.972684621810913, -3.8308444023132324, -3.689004421234131, -3.5471644401550293, -3.4053242206573486, -3.263484001159668, -3.1216440200805664, -2.979804039001465, -2.837963819503784, -2.6961236000061035, -2.554283618927002, -2.4124436378479004, -2.2706034183502197, -2.128763198852539, -1.9869232177734375, -1.8450831174850464, -1.7032430171966553, -1.5614029169082642, -1.419562816619873, -1.277722716331482, -1.1358826160430908, -0.9940425157546997, -0.8522024154663086, -0.7103623151779175, -0.5685222148895264, -0.42668211460113525, -0.28484201431274414, -0.14300191402435303, -0.001161813735961914, 0.1406782865524292, 0.2825183868408203, 0.4243584871292114, 0.5661985874176025, 0.7080386877059937, 0.8498787879943848, 0.9917188882827759, 1.133558988571167, 1.275399088859558, 1.4172391891479492, 1.5590792894363403, 1.7009193897247314, 1.8427594900131226, 1.9845995903015137, 2.1264395713806152, 2.268279790878296, 2.4101200103759766, 2.551959991455078, 2.6937999725341797, 2.8356401920318604, 2.977480411529541, 3.1193203926086426, 3.261160373687744, 3.403000593185425, 3.5448408126831055, 3.686680793762207, 3.8285207748413086, 3.9703609943389893, 4.11220121383667, 4.2540411949157715]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 4.0, 3.0, 3.0, 6.0, 7.0, 10.0, 13.0, 16.0, 34.0, 41.0, 78.0, 117.0, 175.0, 334.0, 601.0, 1174.0, 2953.0, 8677.0, 34810.0, 357436.0, 3700758.0, 65907.0, 13633.0, 4080.0, 1696.0, 733.0, 397.0, 216.0, 135.0, 73.0, 54.0, 33.0, 26.0, 12.0, 9.0, 8.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.74609375, -2.670196533203125, -2.59429931640625, -2.518402099609375, -2.4425048828125, -2.366607666015625, -2.29071044921875, -2.214813232421875, -2.138916015625, -2.063018798828125, -1.98712158203125, -1.911224365234375, -1.8353271484375, -1.759429931640625, -1.68353271484375, -1.607635498046875, -1.53173828125, -1.455841064453125, -1.37994384765625, -1.304046630859375, -1.2281494140625, -1.152252197265625, -1.07635498046875, -1.000457763671875, -0.924560546875, -0.848663330078125, -0.77276611328125, -0.696868896484375, -0.6209716796875, -0.545074462890625, -0.46917724609375, -0.393280029296875, -0.3173828125, -0.241485595703125, -0.16558837890625, -0.089691162109375, -0.0137939453125, 0.062103271484375, 0.13800048828125, 0.213897705078125, 0.289794921875, 0.365692138671875, 0.44158935546875, 0.517486572265625, 0.5933837890625, 0.669281005859375, 0.74517822265625, 0.821075439453125, 0.89697265625, 0.972869873046875, 1.04876708984375, 1.124664306640625, 1.2005615234375, 1.276458740234375, 1.35235595703125, 1.428253173828125, 1.504150390625, 1.580047607421875, 1.65594482421875, 1.731842041015625, 1.8077392578125, 1.883636474609375, 1.95953369140625, 2.035430908203125, 2.111328125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 8.0, 5.0, 10.0, 13.0, 18.0, 31.0, 42.0, 53.0, 58.0, 78.0, 75.0, 97.0, 73.0, 98.0, 74.0, 63.0, 52.0, 40.0, 24.0, 27.0, 18.0, 20.0, 9.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2646484375, -0.2566509246826172, -0.24865341186523438, -0.24065589904785156, -0.23265838623046875, -0.22466087341308594, -0.21666336059570312, -0.2086658477783203, -0.2006683349609375, -0.1926708221435547, -0.18467330932617188, -0.17667579650878906, -0.16867828369140625, -0.16068077087402344, -0.15268325805664062, -0.1446857452392578, -0.136688232421875, -0.1286907196044922, -0.12069320678710938, -0.11269569396972656, -0.10469818115234375, -0.09670066833496094, -0.08870315551757812, -0.08070564270019531, -0.0727081298828125, -0.06471061706542969, -0.056713104248046875, -0.04871559143066406, -0.04071807861328125, -0.03272056579589844, -0.024723052978515625, -0.016725540161132812, -0.00872802734375, -0.0007305145263671875, 0.007266998291015625, 0.015264511108398438, 0.02326202392578125, 0.03125953674316406, 0.039257049560546875, 0.04725456237792969, 0.0552520751953125, 0.06324958801269531, 0.07124710083007812, 0.07924461364746094, 0.08724212646484375, 0.09523963928222656, 0.10323715209960938, 0.11123466491699219, 0.119232177734375, 0.1272296905517578, 0.13522720336914062, 0.14322471618652344, 0.15122222900390625, 0.15921974182128906, 0.16721725463867188, 0.1752147674560547, 0.1832122802734375, 0.1912097930908203, 0.19920730590820312, 0.20720481872558594, 0.21520233154296875, 0.22319984436035156, 0.23119735717773438, 0.2391948699951172, 0.2471923828125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 8.0, 7.0, 10.0, 15.0, 45.0, 41.0, 77.0, 138.0, 223.0, 390.0, 802.0, 1530.0, 3752.0, 12121.0, 70025.0, 3829548.0, 243298.0, 21760.0, 6018.0, 2203.0, 1046.0, 526.0, 286.0, 163.0, 80.0, 64.0, 37.0, 28.0, 11.0, 15.0, 6.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0078125, -2.899261474609375, -2.79071044921875, -2.682159423828125, -2.5736083984375, -2.465057373046875, -2.35650634765625, -2.247955322265625, -2.139404296875, -2.030853271484375, -1.92230224609375, -1.813751220703125, -1.7052001953125, -1.596649169921875, -1.48809814453125, -1.379547119140625, -1.27099609375, -1.162445068359375, -1.05389404296875, -0.945343017578125, -0.8367919921875, -0.728240966796875, -0.61968994140625, -0.511138916015625, -0.402587890625, -0.294036865234375, -0.18548583984375, -0.076934814453125, 0.0316162109375, 0.140167236328125, 0.24871826171875, 0.357269287109375, 0.4658203125, 0.574371337890625, 0.68292236328125, 0.791473388671875, 0.9000244140625, 1.008575439453125, 1.11712646484375, 1.225677490234375, 1.334228515625, 1.442779541015625, 1.55133056640625, 1.659881591796875, 1.7684326171875, 1.876983642578125, 1.98553466796875, 2.094085693359375, 2.20263671875, 2.311187744140625, 2.41973876953125, 2.528289794921875, 2.6368408203125, 2.745391845703125, 2.85394287109375, 2.962493896484375, 3.071044921875, 3.179595947265625, 3.28814697265625, 3.396697998046875, 3.5052490234375, 3.613800048828125, 3.72235107421875, 3.830902099609375, 3.939453125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 8.0, 9.0, 17.0, 22.0, 34.0, 67.0, 129.0, 304.0, 2247.0, 808.0, 205.0, 91.0, 48.0, 27.0, 16.0, 11.0, 4.0, 10.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81591796875, -0.7910385131835938, -0.7661590576171875, -0.7412796020507812, -0.716400146484375, -0.6915206909179688, -0.6666412353515625, -0.6417617797851562, -0.61688232421875, -0.5920028686523438, -0.5671234130859375, -0.5422439575195312, -0.517364501953125, -0.49248504638671875, -0.4676055908203125, -0.44272613525390625, -0.4178466796875, -0.39296722412109375, -0.3680877685546875, -0.34320831298828125, -0.318328857421875, -0.29344940185546875, -0.2685699462890625, -0.24369049072265625, -0.21881103515625, -0.19393157958984375, -0.1690521240234375, -0.14417266845703125, -0.119293212890625, -0.09441375732421875, -0.0695343017578125, -0.04465484619140625, -0.019775390625, 0.00510406494140625, 0.0299835205078125, 0.05486297607421875, 0.079742431640625, 0.10462188720703125, 0.1295013427734375, 0.15438079833984375, 0.17926025390625, 0.20413970947265625, 0.2290191650390625, 0.25389862060546875, 0.278778076171875, 0.30365753173828125, 0.3285369873046875, 0.35341644287109375, 0.3782958984375, 0.40317535400390625, 0.4280548095703125, 0.45293426513671875, 0.477813720703125, 0.5026931762695312, 0.5275726318359375, 0.5524520874023438, 0.57733154296875, 0.6022109985351562, 0.6270904541015625, 0.6519699096679688, 0.676849365234375, 0.7017288208007812, 0.7266082763671875, 0.7514877319335938, 0.7763671875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 13.0, 13.0, 24.0, 52.0, 71.0, 105.0, 172.0, 182.0, 151.0, 102.0, 49.0, 24.0, 16.0, 11.0, 11.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.9491071701049805, -4.785512924194336, -4.621918201446533, -4.458323955535889, -4.294729709625244, -4.131134986877441, -3.967540740966797, -3.8039464950561523, -3.6403520107269287, -3.476757526397705, -3.3131632804870605, -3.149568796157837, -2.9859743118286133, -2.8223800659179688, -2.658785581588745, -2.4951910972595215, -2.331596851348877, -2.1680023670196533, -2.004408121109009, -1.8408136367797852, -1.677219271659851, -1.513624906539917, -1.3500304222106934, -1.1864360570907593, -1.0228416919708252, -0.8592473268508911, -0.6956529021263123, -0.5320584774017334, -0.3684641122817993, -0.20486974716186523, -0.04127532243728638, 0.12231910228729248, 0.28591394424438477, 0.44950833916664124, 0.6131027340888977, 0.7766971588134766, 0.9402915239334106, 1.1038858890533447, 1.2674803733825684, 1.4310747385025024, 1.5946691036224365, 1.7582634687423706, 1.9218578338623047, 2.0854523181915283, 2.249046802520752, 2.4126410484313965, 2.57623553276062, 2.7398300170898438, 2.9034242630004883, 3.067018747329712, 3.2306129932403564, 3.39420747756958, 3.5578017234802246, 3.7213962078094482, 3.884990692138672, 4.048584938049316, 4.212179183959961, 4.3757734298706055, 4.539368152618408, 4.702962398529053, 4.866556644439697, 5.0301513671875, 5.1937456130981445, 5.357339859008789, 5.520934581756592]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 5.0, 0.0, 6.0, 3.0, 3.0, 6.0, 12.0, 7.0, 14.0, 11.0, 18.0, 18.0, 23.0, 20.0, 32.0, 26.0, 25.0, 27.0, 56.0, 29.0, 42.0, 51.0, 36.0, 51.0, 43.0, 43.0, 53.0, 41.0, 37.0, 29.0, 28.0, 15.0, 32.0, 32.0, 19.0, 21.0, 28.0, 17.0, 9.0, 10.0, 9.0, 10.0, 3.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.544095754623413, -1.4880732297897339, -1.4320507049560547, -1.3760281801223755, -1.3200056552886963, -1.2639830112457275, -1.207960605621338, -1.1519379615783691, -1.09591543674469, -1.0398929119110107, -0.9838703870773315, -0.9278478622436523, -0.8718252778053284, -0.8158027529716492, -0.75978022813797, -0.703757643699646, -0.6477351784706116, -0.5917126536369324, -0.5356901288032532, -0.4796675741672516, -0.42364501953125, -0.3676224946975708, -0.3115999698638916, -0.25557741522789, -0.19955489039421082, -0.14353235065937042, -0.08750981837511063, -0.03148728609085083, 0.024535253643989563, 0.08055779337882996, 0.13658031821250916, 0.19260287284851074, 0.24862539768218994, 0.30464792251586914, 0.3606704771518707, 0.4166930019855499, 0.4727155566215515, 0.5287380814552307, 0.5847606062889099, 0.6407831907272339, 0.6968057155609131, 0.7528282403945923, 0.8088507652282715, 0.8648732900619507, 0.9208958745002747, 0.9769183993339539, 1.0329408645629883, 1.088963508605957, 1.1449859142303467, 1.2010084390640259, 1.257030963897705, 1.3130534887313843, 1.3690760135650635, 1.4250986576080322, 1.4811210632324219, 1.5371437072753906, 1.5931662321090698, 1.649188756942749, 1.7052112817764282, 1.7612338066101074, 1.8172563314437866, 1.8732788562774658, 1.9293015003204346, 1.9853240251541138, 2.041346549987793]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 5.0, 2.0, 3.0, 0.0, 2.0, 4.0, 2.0, 9.0, 9.0, 9.0, 11.0, 15.0, 18.0, 19.0, 24.0, 31.0, 47.0, 77.0, 145.0, 206.0, 356.0, 634.0, 1164.0, 2354.0, 5347.0, 13738.0, 43025.0, 161581.0, 462087.0, 256612.0, 67352.0, 19911.0, 7233.0, 3109.0, 1483.0, 784.0, 426.0, 264.0, 129.0, 81.0, 64.0, 51.0, 38.0, 23.0, 17.0, 14.0, 15.0, 8.0, 5.0, 10.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7373046875, -1.6787567138671875, -1.620208740234375, -1.5616607666015625, -1.50311279296875, -1.4445648193359375, -1.386016845703125, -1.3274688720703125, -1.2689208984375, -1.2103729248046875, -1.151824951171875, -1.0932769775390625, -1.03472900390625, -0.9761810302734375, -0.917633056640625, -0.8590850830078125, -0.800537109375, -0.7419891357421875, -0.683441162109375, -0.6248931884765625, -0.56634521484375, -0.5077972412109375, -0.449249267578125, -0.3907012939453125, -0.3321533203125, -0.2736053466796875, -0.215057373046875, -0.1565093994140625, -0.09796142578125, -0.0394134521484375, 0.019134521484375, 0.0776824951171875, 0.13623046875, 0.1947784423828125, 0.253326416015625, 0.3118743896484375, 0.37042236328125, 0.4289703369140625, 0.487518310546875, 0.5460662841796875, 0.6046142578125, 0.6631622314453125, 0.721710205078125, 0.7802581787109375, 0.83880615234375, 0.8973541259765625, 0.955902099609375, 1.0144500732421875, 1.072998046875, 1.1315460205078125, 1.190093994140625, 1.2486419677734375, 1.30718994140625, 1.3657379150390625, 1.424285888671875, 1.4828338623046875, 1.5413818359375, 1.5999298095703125, 1.658477783203125, 1.7170257568359375, 1.77557373046875, 1.8341217041015625, 1.892669677734375, 1.9512176513671875, 2.009765625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 5.0, 11.0, 5.0, 15.0, 16.0, 23.0, 20.0, 40.0, 53.0, 51.0, 61.0, 74.0, 79.0, 75.0, 63.0, 90.0, 59.0, 60.0, 61.0, 35.0, 25.0, 25.0, 11.0, 13.0, 8.0, 2.0, 12.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.263671875, -0.25578880310058594, -0.24790573120117188, -0.2400226593017578, -0.23213958740234375, -0.2242565155029297, -0.21637344360351562, -0.20849037170410156, -0.2006072998046875, -0.19272422790527344, -0.18484115600585938, -0.1769580841064453, -0.16907501220703125, -0.1611919403076172, -0.15330886840820312, -0.14542579650878906, -0.137542724609375, -0.12965965270996094, -0.12177658081054688, -0.11389350891113281, -0.10601043701171875, -0.09812736511230469, -0.09024429321289062, -0.08236122131347656, -0.0744781494140625, -0.06659507751464844, -0.058712005615234375, -0.05082893371582031, -0.04294586181640625, -0.03506278991699219, -0.027179718017578125, -0.019296646118164062, -0.01141357421875, -0.0035305023193359375, 0.004352569580078125, 0.012235641479492188, 0.02011871337890625, 0.028001785278320312, 0.035884857177734375, 0.04376792907714844, 0.0516510009765625, 0.05953407287597656, 0.06741714477539062, 0.07530021667480469, 0.08318328857421875, 0.09106636047363281, 0.09894943237304688, 0.10683250427246094, 0.114715576171875, 0.12259864807128906, 0.13048171997070312, 0.1383647918701172, 0.14624786376953125, 0.1541309356689453, 0.16201400756835938, 0.16989707946777344, 0.1777801513671875, 0.18566322326660156, 0.19354629516601562, 0.2014293670654297, 0.20931243896484375, 0.2171955108642578, 0.22507858276367188, 0.23296165466308594, 0.2408447265625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 4.0, 6.0, 10.0, 9.0, 14.0, 21.0, 36.0, 39.0, 60.0, 117.0, 133.0, 269.0, 375.0, 621.0, 1148.0, 2415.0, 6077.0, 21454.0, 101755.0, 470124.0, 350555.0, 68314.0, 15571.0, 4906.0, 2006.0, 935.0, 557.0, 352.0, 216.0, 141.0, 96.0, 65.0, 47.0, 38.0, 17.0, 16.0, 8.0, 10.0, 6.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.619140625, -1.55657958984375, -1.4940185546875, -1.43145751953125, -1.368896484375, -1.30633544921875, -1.2437744140625, -1.18121337890625, -1.11865234375, -1.05609130859375, -0.9935302734375, -0.93096923828125, -0.868408203125, -0.80584716796875, -0.7432861328125, -0.68072509765625, -0.6181640625, -0.55560302734375, -0.4930419921875, -0.43048095703125, -0.367919921875, -0.30535888671875, -0.2427978515625, -0.18023681640625, -0.11767578125, -0.05511474609375, 0.0074462890625, 0.07000732421875, 0.132568359375, 0.19512939453125, 0.2576904296875, 0.32025146484375, 0.3828125, 0.44537353515625, 0.5079345703125, 0.57049560546875, 0.633056640625, 0.69561767578125, 0.7581787109375, 0.82073974609375, 0.88330078125, 0.94586181640625, 1.0084228515625, 1.07098388671875, 1.133544921875, 1.19610595703125, 1.2586669921875, 1.32122802734375, 1.3837890625, 1.44635009765625, 1.5089111328125, 1.57147216796875, 1.634033203125, 1.69659423828125, 1.7591552734375, 1.82171630859375, 1.88427734375, 1.94683837890625, 2.0093994140625, 2.07196044921875, 2.134521484375, 2.19708251953125, 2.2596435546875, 2.32220458984375, 2.384765625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 5.0, 9.0, 7.0, 9.0, 11.0, 10.0, 18.0, 22.0, 31.0, 20.0, 25.0, 31.0, 44.0, 36.0, 44.0, 38.0, 32.0, 47.0, 48.0, 54.0, 42.0, 38.0, 45.0, 41.0, 36.0, 32.0, 32.0, 29.0, 18.0, 18.0, 23.0, 14.0, 14.0, 11.0, 19.0, 7.0, 5.0, 2.0, 8.0, 4.0, 2.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70458984375, -0.680511474609375, -0.65643310546875, -0.632354736328125, -0.6082763671875, -0.584197998046875, -0.56011962890625, -0.536041259765625, -0.511962890625, -0.487884521484375, -0.46380615234375, -0.439727783203125, -0.4156494140625, -0.391571044921875, -0.36749267578125, -0.343414306640625, -0.3193359375, -0.295257568359375, -0.27117919921875, -0.247100830078125, -0.2230224609375, -0.198944091796875, -0.17486572265625, -0.150787353515625, -0.126708984375, -0.102630615234375, -0.07855224609375, -0.054473876953125, -0.0303955078125, -0.006317138671875, 0.01776123046875, 0.041839599609375, 0.06591796875, 0.089996337890625, 0.11407470703125, 0.138153076171875, 0.1622314453125, 0.186309814453125, 0.21038818359375, 0.234466552734375, 0.258544921875, 0.282623291015625, 0.30670166015625, 0.330780029296875, 0.3548583984375, 0.378936767578125, 0.40301513671875, 0.427093505859375, 0.451171875, 0.475250244140625, 0.49932861328125, 0.523406982421875, 0.5474853515625, 0.571563720703125, 0.59564208984375, 0.619720458984375, 0.643798828125, 0.667877197265625, 0.69195556640625, 0.716033935546875, 0.7401123046875, 0.764190673828125, 0.78826904296875, 0.812347412109375, 0.83642578125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 6.0, 2.0, 5.0, 6.0, 9.0, 22.0, 27.0, 61.0, 72.0, 125.0, 232.0, 518.0, 1223.0, 3614.0, 12728.0, 61437.0, 411005.0, 464327.0, 72323.0, 14319.0, 3985.0, 1331.0, 551.0, 255.0, 150.0, 70.0, 49.0, 35.0, 18.0, 18.0, 8.0, 8.0, 6.0, 3.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69873046875, -0.6708297729492188, -0.6429290771484375, -0.6150283813476562, -0.587127685546875, -0.5592269897460938, -0.5313262939453125, -0.5034255981445312, -0.47552490234375, -0.44762420654296875, -0.4197235107421875, -0.39182281494140625, -0.363922119140625, -0.33602142333984375, -0.3081207275390625, -0.28022003173828125, -0.2523193359375, -0.22441864013671875, -0.1965179443359375, -0.16861724853515625, -0.140716552734375, -0.11281585693359375, -0.0849151611328125, -0.05701446533203125, -0.02911376953125, -0.00121307373046875, 0.0266876220703125, 0.05458831787109375, 0.082489013671875, 0.11038970947265625, 0.1382904052734375, 0.16619110107421875, 0.194091796875, 0.22199249267578125, 0.2498931884765625, 0.27779388427734375, 0.305694580078125, 0.33359527587890625, 0.3614959716796875, 0.38939666748046875, 0.41729736328125, 0.44519805908203125, 0.4730987548828125, 0.5009994506835938, 0.528900146484375, 0.5568008422851562, 0.5847015380859375, 0.6126022338867188, 0.6405029296875, 0.6684036254882812, 0.6963043212890625, 0.7242050170898438, 0.752105712890625, 0.7800064086914062, 0.8079071044921875, 0.8358078002929688, 0.86370849609375, 0.8916091918945312, 0.9195098876953125, 0.9474105834960938, 0.975311279296875, 1.0032119750976562, 1.0311126708984375, 1.0590133666992188, 1.0869140625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 4.0, 2.0, 7.0, 10.0, 14.0, 17.0, 18.0, 34.0, 20.0, 22.0, 46.0, 53.0, 50.0, 49.0, 46.0, 62.0, 53.0, 70.0, 62.0, 46.0, 65.0, 38.0, 25.0, 31.0, 35.0, 22.0, 10.0, 22.0, 12.0, 11.0, 10.0, 1.0, 8.0, 3.0, 2.0, 0.0, 1.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00011682510375976562, -0.00011335313320159912, -0.00010988116264343262, -0.00010640919208526611, -0.00010293722152709961, -9.94652509689331e-05, -9.59932804107666e-05, -9.25213098526001e-05, -8.90493392944336e-05, -8.557736873626709e-05, -8.210539817810059e-05, -7.863342761993408e-05, -7.516145706176758e-05, -7.168948650360107e-05, -6.821751594543457e-05, -6.474554538726807e-05, -6.127357482910156e-05, -5.780160427093506e-05, -5.4329633712768555e-05, -5.085766315460205e-05, -4.738569259643555e-05, -4.391372203826904e-05, -4.044175148010254e-05, -3.6969780921936035e-05, -3.349781036376953e-05, -3.0025839805603027e-05, -2.6553869247436523e-05, -2.308189868927002e-05, -1.9609928131103516e-05, -1.6137957572937012e-05, -1.2665987014770508e-05, -9.194016456604004e-06, -5.7220458984375e-06, -2.250075340270996e-06, 1.2218952178955078e-06, 4.693865776062012e-06, 8.165836334228516e-06, 1.163780689239502e-05, 1.5109777450561523e-05, 1.8581748008728027e-05, 2.205371856689453e-05, 2.5525689125061035e-05, 2.899765968322754e-05, 3.246963024139404e-05, 3.594160079956055e-05, 3.941357135772705e-05, 4.2885541915893555e-05, 4.635751247406006e-05, 4.982948303222656e-05, 5.3301453590393066e-05, 5.677342414855957e-05, 6.0245394706726074e-05, 6.371736526489258e-05, 6.718933582305908e-05, 7.066130638122559e-05, 7.413327693939209e-05, 7.76052474975586e-05, 8.10772180557251e-05, 8.45491886138916e-05, 8.80211591720581e-05, 9.149312973022461e-05, 9.496510028839111e-05, 9.843707084655762e-05, 0.00010190904140472412, 0.00010538101196289062]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 1.0, 6.0, 7.0, 22.0, 23.0, 36.0, 83.0, 142.0, 314.0, 670.0, 1708.0, 5987.0, 33524.0, 439157.0, 517654.0, 39311.0, 6691.0, 1831.0, 683.0, 301.0, 178.0, 90.0, 48.0, 28.0, 18.0, 8.0, 12.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.046875, -1.0066680908203125, -0.966461181640625, -0.9262542724609375, -0.88604736328125, -0.8458404541015625, -0.805633544921875, -0.7654266357421875, -0.7252197265625, -0.6850128173828125, -0.644805908203125, -0.6045989990234375, -0.56439208984375, -0.5241851806640625, -0.483978271484375, -0.4437713623046875, -0.403564453125, -0.3633575439453125, -0.323150634765625, -0.2829437255859375, -0.24273681640625, -0.2025299072265625, -0.162322998046875, -0.1221160888671875, -0.0819091796875, -0.0417022705078125, -0.001495361328125, 0.0387115478515625, 0.07891845703125, 0.1191253662109375, 0.159332275390625, 0.1995391845703125, 0.23974609375, 0.2799530029296875, 0.320159912109375, 0.3603668212890625, 0.40057373046875, 0.4407806396484375, 0.480987548828125, 0.5211944580078125, 0.5614013671875, 0.6016082763671875, 0.641815185546875, 0.6820220947265625, 0.72222900390625, 0.7624359130859375, 0.802642822265625, 0.8428497314453125, 0.883056640625, 0.9232635498046875, 0.963470458984375, 1.0036773681640625, 1.04388427734375, 1.0840911865234375, 1.124298095703125, 1.1645050048828125, 1.2047119140625, 1.2449188232421875, 1.285125732421875, 1.3253326416015625, 1.36553955078125, 1.4057464599609375, 1.445953369140625, 1.4861602783203125, 1.5263671875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 3.0, 7.0, 7.0, 16.0, 6.0, 18.0, 19.0, 25.0, 34.0, 36.0, 51.0, 49.0, 57.0, 71.0, 72.0, 73.0, 75.0, 55.0, 59.0, 55.0, 41.0, 28.0, 31.0, 22.0, 15.0, 18.0, 14.0, 13.0, 7.0, 7.0, 1.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35595703125, -0.3427162170410156, -0.32947540283203125, -0.3162345886230469, -0.3029937744140625, -0.2897529602050781, -0.27651214599609375, -0.2632713317871094, -0.250030517578125, -0.23678970336914062, -0.22354888916015625, -0.21030807495117188, -0.1970672607421875, -0.18382644653320312, -0.17058563232421875, -0.15734481811523438, -0.14410400390625, -0.13086318969726562, -0.11762237548828125, -0.10438156127929688, -0.0911407470703125, -0.07789993286132812, -0.06465911865234375, -0.051418304443359375, -0.038177490234375, -0.024936676025390625, -0.01169586181640625, 0.001544952392578125, 0.0147857666015625, 0.028026580810546875, 0.04126739501953125, 0.054508209228515625, 0.0677490234375, 0.08098983764648438, 0.09423065185546875, 0.10747146606445312, 0.1207122802734375, 0.13395309448242188, 0.14719390869140625, 0.16043472290039062, 0.173675537109375, 0.18691635131835938, 0.20015716552734375, 0.21339797973632812, 0.2266387939453125, 0.23987960815429688, 0.25312042236328125, 0.2663612365722656, 0.27960205078125, 0.2928428649902344, 0.30608367919921875, 0.3193244934082031, 0.3325653076171875, 0.3458061218261719, 0.35904693603515625, 0.3722877502441406, 0.385528564453125, 0.3987693786621094, 0.41201019287109375, 0.4252510070800781, 0.4384918212890625, 0.4517326354980469, 0.46497344970703125, 0.4782142639160156, 0.491455078125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 7.0, 8.0, 4.0, 18.0, 20.0, 22.0, 43.0, 39.0, 46.0, 66.0, 85.0, 94.0, 75.0, 76.0, 80.0, 70.0, 50.0, 59.0, 36.0, 22.0, 21.0, 14.0, 10.0, 10.0, 6.0, 10.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.951740264892578, -5.75117301940918, -5.550605773925781, -5.350038528442383, -5.149471282958984, -4.948904037475586, -4.7483367919921875, -4.547769546508789, -4.347202301025391, -4.146635055541992, -3.9460678100585938, -3.7455005645751953, -3.544933319091797, -3.3443660736083984, -3.143799066543579, -2.9432318210601807, -2.7426648139953613, -2.542097568511963, -2.3415303230285645, -2.140963077545166, -1.9403959512710571, -1.7398287057876587, -1.5392615795135498, -1.3386943340301514, -1.138127088546753, -0.9375598430633545, -0.7369926571846008, -0.5364254713058472, -0.33585822582244873, -0.1352909803390503, 0.0652761459350586, 0.26584339141845703, 0.46641063690185547, 0.6669778823852539, 0.8675450682640076, 1.0681122541427612, 1.2686794996261597, 1.469246745109558, 1.669813871383667, 1.8703811168670654, 2.070948362350464, 2.2715156078338623, 2.4720828533172607, 2.67264986038208, 2.8732171058654785, 3.073784351348877, 3.2743515968322754, 3.474918842315674, 3.6754860877990723, 3.8760533332824707, 4.076620578765869, 4.277187824249268, 4.477755069732666, 4.6783223152160645, 4.878889083862305, 5.079456329345703, 5.280023574829102, 5.4805908203125, 5.681158065795898, 5.881725311279297, 6.082292556762695, 6.282859802246094, 6.483427047729492, 6.683994293212891, 6.884561538696289]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 4.0, 7.0, 7.0, 5.0, 9.0, 11.0, 16.0, 13.0, 25.0, 25.0, 31.0, 31.0, 33.0, 27.0, 42.0, 42.0, 55.0, 39.0, 49.0, 55.0, 47.0, 38.0, 39.0, 43.0, 38.0, 38.0, 37.0, 33.0, 25.0, 28.0, 16.0, 13.0, 15.0, 10.0, 17.0, 8.0, 4.0, 6.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.936922073364258, -4.794308662414551, -4.651695251464844, -4.509081840515137, -4.36646842956543, -4.2238545417785645, -4.081241130828857, -3.9386277198791504, -3.7960143089294434, -3.6534008979797363, -3.5107874870300293, -3.368173837661743, -3.225560426712036, -3.082947015762329, -2.940333366394043, -2.797719955444336, -2.655106544494629, -2.512493133544922, -2.369879722595215, -2.2272660732269287, -2.0846526622772217, -1.9420392513275146, -1.799425721168518, -1.6568121910095215, -1.5141987800598145, -1.3715853691101074, -1.2289718389511108, -1.0863583087921143, -0.9437448978424072, -0.8011314272880554, -0.6585179567337036, -0.5159044861793518, -0.3732905387878418, -0.23067706823349, -0.08806359767913818, 0.05454987287521362, 0.19716334342956543, 0.33977681398391724, 0.48239028453826904, 0.6250037550926208, 0.7676172256469727, 0.9102306962013245, 1.0528441667556763, 1.1954576969146729, 1.3380711078643799, 1.480684518814087, 1.6232980489730835, 1.76591157913208, 1.908524990081787, 2.051138401031494, 2.193751811981201, 2.3363654613494873, 2.4789788722991943, 2.6215922832489014, 2.7642059326171875, 2.9068193435668945, 3.0494327545166016, 3.1920461654663086, 3.3346595764160156, 3.4772732257843018, 3.619886636734009, 3.762500047683716, 3.905113697052002, 4.047727108001709, 4.190340518951416]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 9.0, 5.0, 8.0, 12.0, 16.0, 26.0, 36.0, 47.0, 65.0, 107.0, 169.0, 246.0, 485.0, 811.0, 1579.0, 3550.0, 8148.0, 22771.0, 91088.0, 3108805.0, 856728.0, 68744.0, 18512.0, 6681.0, 2704.0, 1268.0, 675.0, 359.0, 222.0, 137.0, 89.0, 61.0, 45.0, 19.0, 17.0, 9.0, 10.0, 4.0, 7.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.9296875, -1.875946044921875, -1.82220458984375, -1.768463134765625, -1.7147216796875, -1.660980224609375, -1.60723876953125, -1.553497314453125, -1.499755859375, -1.446014404296875, -1.39227294921875, -1.338531494140625, -1.2847900390625, -1.231048583984375, -1.17730712890625, -1.123565673828125, -1.06982421875, -1.016082763671875, -0.96234130859375, -0.908599853515625, -0.8548583984375, -0.801116943359375, -0.74737548828125, -0.693634033203125, -0.639892578125, -0.586151123046875, -0.53240966796875, -0.478668212890625, -0.4249267578125, -0.371185302734375, -0.31744384765625, -0.263702392578125, -0.2099609375, -0.156219482421875, -0.10247802734375, -0.048736572265625, 0.0050048828125, 0.058746337890625, 0.11248779296875, 0.166229248046875, 0.219970703125, 0.273712158203125, 0.32745361328125, 0.381195068359375, 0.4349365234375, 0.488677978515625, 0.54241943359375, 0.596160888671875, 0.64990234375, 0.703643798828125, 0.75738525390625, 0.811126708984375, 0.8648681640625, 0.918609619140625, 0.97235107421875, 1.026092529296875, 1.079833984375, 1.133575439453125, 1.18731689453125, 1.241058349609375, 1.2947998046875, 1.348541259765625, 1.40228271484375, 1.456024169921875, 1.509765625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 15.0, 6.0, 13.0, 16.0, 34.0, 31.0, 48.0, 62.0, 62.0, 75.0, 77.0, 75.0, 70.0, 77.0, 66.0, 58.0, 45.0, 43.0, 32.0, 24.0, 15.0, 13.0, 11.0, 7.0, 2.0, 5.0, 1.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.26318359375, -0.25535011291503906, -0.24751663208007812, -0.2396831512451172, -0.23184967041015625, -0.2240161895751953, -0.21618270874023438, -0.20834922790527344, -0.2005157470703125, -0.19268226623535156, -0.18484878540039062, -0.1770153045654297, -0.16918182373046875, -0.1613483428955078, -0.15351486206054688, -0.14568138122558594, -0.137847900390625, -0.13001441955566406, -0.12218093872070312, -0.11434745788574219, -0.10651397705078125, -0.09868049621582031, -0.09084701538085938, -0.08301353454589844, -0.0751800537109375, -0.06734657287597656, -0.059513092041015625, -0.05167961120605469, -0.04384613037109375, -0.03601264953613281, -0.028179168701171875, -0.020345687866210938, -0.01251220703125, -0.0046787261962890625, 0.003154754638671875, 0.010988235473632812, 0.01882171630859375, 0.026655197143554688, 0.034488677978515625, 0.04232215881347656, 0.0501556396484375, 0.05798912048339844, 0.06582260131835938, 0.07365608215332031, 0.08148956298828125, 0.08932304382324219, 0.09715652465820312, 0.10499000549316406, 0.112823486328125, 0.12065696716308594, 0.12849044799804688, 0.1363239288330078, 0.14415740966796875, 0.1519908905029297, 0.15982437133789062, 0.16765785217285156, 0.1754913330078125, 0.18332481384277344, 0.19115829467773438, 0.1989917755126953, 0.20682525634765625, 0.2146587371826172, 0.22249221801757812, 0.23032569885253906, 0.2381591796875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 7.0, 4.0, 6.0, 5.0, 7.0, 21.0, 22.0, 35.0, 45.0, 64.0, 118.0, 179.0, 314.0, 621.0, 1374.0, 3282.0, 8679.0, 29351.0, 167016.0, 3594377.0, 325463.0, 43607.0, 11931.0, 4248.0, 1757.0, 799.0, 409.0, 212.0, 133.0, 71.0, 53.0, 32.0, 17.0, 6.0, 4.0, 4.0, 9.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0, -1.9324951171875, -1.864990234375, -1.7974853515625, -1.72998046875, -1.6624755859375, -1.594970703125, -1.5274658203125, -1.4599609375, -1.3924560546875, -1.324951171875, -1.2574462890625, -1.18994140625, -1.1224365234375, -1.054931640625, -0.9874267578125, -0.919921875, -0.8524169921875, -0.784912109375, -0.7174072265625, -0.64990234375, -0.5823974609375, -0.514892578125, -0.4473876953125, -0.3798828125, -0.3123779296875, -0.244873046875, -0.1773681640625, -0.10986328125, -0.0423583984375, 0.025146484375, 0.0926513671875, 0.16015625, 0.2276611328125, 0.295166015625, 0.3626708984375, 0.43017578125, 0.4976806640625, 0.565185546875, 0.6326904296875, 0.7001953125, 0.7677001953125, 0.835205078125, 0.9027099609375, 0.97021484375, 1.0377197265625, 1.105224609375, 1.1727294921875, 1.240234375, 1.3077392578125, 1.375244140625, 1.4427490234375, 1.51025390625, 1.5777587890625, 1.645263671875, 1.7127685546875, 1.7802734375, 1.8477783203125, 1.915283203125, 1.9827880859375, 2.05029296875, 2.1177978515625, 2.185302734375, 2.2528076171875, 2.3203125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 3.0, 3.0, 7.0, 10.0, 12.0, 13.0, 13.0, 34.0, 40.0, 65.0, 85.0, 176.0, 337.0, 862.0, 1375.0, 461.0, 214.0, 104.0, 77.0, 51.0, 35.0, 27.0, 18.0, 9.0, 9.0, 12.0, 10.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.826171875, -0.8056106567382812, -0.7850494384765625, -0.7644882202148438, -0.743927001953125, -0.7233657836914062, -0.7028045654296875, -0.6822433471679688, -0.66168212890625, -0.6411209106445312, -0.6205596923828125, -0.5999984741210938, -0.579437255859375, -0.5588760375976562, -0.5383148193359375, -0.5177536010742188, -0.4971923828125, -0.47663116455078125, -0.4560699462890625, -0.43550872802734375, -0.414947509765625, -0.39438629150390625, -0.3738250732421875, -0.35326385498046875, -0.33270263671875, -0.31214141845703125, -0.2915802001953125, -0.27101898193359375, -0.250457763671875, -0.22989654541015625, -0.2093353271484375, -0.18877410888671875, -0.168212890625, -0.14765167236328125, -0.1270904541015625, -0.10652923583984375, -0.085968017578125, -0.06540679931640625, -0.0448455810546875, -0.02428436279296875, -0.00372314453125, 0.01683807373046875, 0.0373992919921875, 0.05796051025390625, 0.078521728515625, 0.09908294677734375, 0.1196441650390625, 0.14020538330078125, 0.1607666015625, 0.18132781982421875, 0.2018890380859375, 0.22245025634765625, 0.243011474609375, 0.26357269287109375, 0.2841339111328125, 0.30469512939453125, 0.32525634765625, 0.34581756591796875, 0.3663787841796875, 0.38694000244140625, 0.407501220703125, 0.42806243896484375, 0.4486236572265625, 0.46918487548828125, 0.48974609375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 9.0, 11.0, 11.0, 32.0, 39.0, 50.0, 83.0, 79.0, 129.0, 124.0, 114.0, 109.0, 69.0, 51.0, 34.0, 19.0, 12.0, 12.0, 6.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.9397687911987305, -4.799509525299072, -4.659249782562256, -4.518990516662598, -4.378730773925781, -4.238471508026123, -4.098211765289307, -3.9579524993896484, -3.817692756652832, -3.6774332523345947, -3.5371737480163574, -3.39691424369812, -3.256654739379883, -3.1163952350616455, -2.976135730743408, -2.83587646484375, -2.6956169605255127, -2.5553574562072754, -2.415097951889038, -2.274838447570801, -2.1345789432525635, -1.9943194389343262, -1.8540600538253784, -1.7138005495071411, -1.5735410451889038, -1.4332815408706665, -1.2930220365524292, -1.1527626514434814, -1.0125031471252441, -0.8722435832023621, -0.7319841384887695, -0.5917246341705322, -0.4514651298522949, -0.3112056255340576, -0.1709461510181427, -0.030686676502227783, 0.10957282781600952, 0.24983233213424683, 0.39009177684783936, 0.5303512811660767, 0.670610785484314, 0.8108702898025513, 0.9511297941207886, 1.0913891792297363, 1.2316486835479736, 1.371908187866211, 1.5121676921844482, 1.6524271965026855, 1.7926867008209229, 1.9329462051391602, 2.0732057094573975, 2.2134652137756348, 2.353724718093872, 2.4939842224121094, 2.6342434883117676, 2.774503231048584, 2.914762496948242, 3.0550220012664795, 3.195281505584717, 3.335541009902954, 3.4758005142211914, 3.6160600185394287, 3.756319522857666, 3.896578788757324, 4.036838531494141]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 11.0, 7.0, 11.0, 10.0, 13.0, 16.0, 20.0, 27.0, 26.0, 34.0, 31.0, 44.0, 38.0, 35.0, 53.0, 41.0, 55.0, 43.0, 29.0, 44.0, 47.0, 48.0, 41.0, 44.0, 29.0, 18.0, 24.0, 24.0, 25.0, 22.0, 17.0, 12.0, 12.0, 10.0, 8.0, 9.0, 8.0, 4.0, 5.0, 4.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2801971435546875, -2.213913917541504, -2.1476309299468994, -2.081347703933716, -2.0150644779205322, -1.9487813711166382, -1.8824982643127441, -1.8162150382995605, -1.7499319314956665, -1.6836488246917725, -1.6173655986785889, -1.5510824918746948, -1.4847993850708008, -1.4185161590576172, -1.3522330522537231, -1.285949945449829, -1.2196667194366455, -1.1533836126327515, -1.0871003866195679, -1.0208172798156738, -0.954534113407135, -0.8882509469985962, -0.8219678401947021, -0.7556846737861633, -0.6894015073776245, -0.6231183409690857, -0.5568351745605469, -0.49055206775665283, -0.424268901348114, -0.3579857349395752, -0.29170259833335876, -0.22541946172714233, -0.15913617610931396, -0.09285302460193634, -0.026569873094558716, 0.03971327841281891, 0.10599642992019653, 0.17227959632873535, 0.23856273293495178, 0.3048458695411682, 0.37112903594970703, 0.43741220235824585, 0.5036953687667847, 0.5699784755706787, 0.6362616419792175, 0.7025448083877563, 0.7688279151916504, 0.8351110816001892, 0.901394248008728, 0.9676774144172668, 1.0339605808258057, 1.1002436876296997, 1.1665267944335938, 1.2328100204467773, 1.2990931272506714, 1.3653762340545654, 1.431659460067749, 1.497942566871643, 1.5642257928848267, 1.6305088996887207, 1.6967921257019043, 1.7630752325057983, 1.8293583393096924, 1.895641565322876, 1.96192467212677]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 6.0, 5.0, 3.0, 7.0, 5.0, 12.0, 15.0, 18.0, 25.0, 37.0, 31.0, 56.0, 71.0, 107.0, 126.0, 212.0, 354.0, 464.0, 840.0, 1456.0, 2777.0, 5735.0, 12516.0, 29713.0, 78577.0, 236806.0, 436376.0, 149272.0, 53115.0, 20973.0, 9102.0, 4362.0, 2150.0, 1218.0, 670.0, 429.0, 264.0, 174.0, 125.0, 98.0, 64.0, 53.0, 40.0, 26.0, 22.0, 10.0, 8.0, 13.0, 6.0, 8.0, 4.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.3916015625, -1.342437744140625, -1.29327392578125, -1.244110107421875, -1.1949462890625, -1.145782470703125, -1.09661865234375, -1.047454833984375, -0.998291015625, -0.949127197265625, -0.89996337890625, -0.850799560546875, -0.8016357421875, -0.752471923828125, -0.70330810546875, -0.654144287109375, -0.60498046875, -0.555816650390625, -0.50665283203125, -0.457489013671875, -0.4083251953125, -0.359161376953125, -0.30999755859375, -0.260833740234375, -0.211669921875, -0.162506103515625, -0.11334228515625, -0.064178466796875, -0.0150146484375, 0.034149169921875, 0.08331298828125, 0.132476806640625, 0.181640625, 0.230804443359375, 0.27996826171875, 0.329132080078125, 0.3782958984375, 0.427459716796875, 0.47662353515625, 0.525787353515625, 0.574951171875, 0.624114990234375, 0.67327880859375, 0.722442626953125, 0.7716064453125, 0.820770263671875, 0.86993408203125, 0.919097900390625, 0.96826171875, 1.017425537109375, 1.06658935546875, 1.115753173828125, 1.1649169921875, 1.214080810546875, 1.26324462890625, 1.312408447265625, 1.361572265625, 1.410736083984375, 1.45989990234375, 1.509063720703125, 1.5582275390625, 1.607391357421875, 1.65655517578125, 1.705718994140625, 1.7548828125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 4.0, 8.0, 10.0, 16.0, 15.0, 21.0, 14.0, 31.0, 43.0, 53.0, 59.0, 54.0, 52.0, 87.0, 79.0, 67.0, 77.0, 56.0, 71.0, 48.0, 33.0, 27.0, 18.0, 14.0, 13.0, 9.0, 6.0, 4.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2587890625, -0.2509918212890625, -0.243194580078125, -0.2353973388671875, -0.22760009765625, -0.2198028564453125, -0.212005615234375, -0.2042083740234375, -0.1964111328125, -0.1886138916015625, -0.180816650390625, -0.1730194091796875, -0.16522216796875, -0.1574249267578125, -0.149627685546875, -0.1418304443359375, -0.134033203125, -0.1262359619140625, -0.118438720703125, -0.1106414794921875, -0.10284423828125, -0.0950469970703125, -0.087249755859375, -0.0794525146484375, -0.0716552734375, -0.0638580322265625, -0.056060791015625, -0.0482635498046875, -0.04046630859375, -0.0326690673828125, -0.024871826171875, -0.0170745849609375, -0.00927734375, -0.0014801025390625, 0.006317138671875, 0.0141143798828125, 0.02191162109375, 0.0297088623046875, 0.037506103515625, 0.0453033447265625, 0.0531005859375, 0.0608978271484375, 0.068695068359375, 0.0764923095703125, 0.08428955078125, 0.0920867919921875, 0.099884033203125, 0.1076812744140625, 0.115478515625, 0.1232757568359375, 0.131072998046875, 0.1388702392578125, 0.14666748046875, 0.1544647216796875, 0.162261962890625, 0.1700592041015625, 0.1778564453125, 0.1856536865234375, 0.193450927734375, 0.2012481689453125, 0.20904541015625, 0.2168426513671875, 0.224639892578125, 0.2324371337890625, 0.240234375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 6.0, 13.0, 12.0, 19.0, 27.0, 53.0, 50.0, 111.0, 180.0, 264.0, 456.0, 724.0, 1484.0, 2995.0, 7496.0, 22555.0, 85992.0, 442913.0, 376371.0, 74206.0, 19666.0, 6762.0, 2961.0, 1378.0, 726.0, 412.0, 227.0, 166.0, 117.0, 61.0, 39.0, 33.0, 22.0, 17.0, 8.0, 10.0, 6.0, 4.0, 2.0, 1.0, 2.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.03515625, -1.973388671875, -1.91162109375, -1.849853515625, -1.7880859375, -1.726318359375, -1.66455078125, -1.602783203125, -1.541015625, -1.479248046875, -1.41748046875, -1.355712890625, -1.2939453125, -1.232177734375, -1.17041015625, -1.108642578125, -1.046875, -0.985107421875, -0.92333984375, -0.861572265625, -0.7998046875, -0.738037109375, -0.67626953125, -0.614501953125, -0.552734375, -0.490966796875, -0.42919921875, -0.367431640625, -0.3056640625, -0.243896484375, -0.18212890625, -0.120361328125, -0.05859375, 0.003173828125, 0.06494140625, 0.126708984375, 0.1884765625, 0.250244140625, 0.31201171875, 0.373779296875, 0.435546875, 0.497314453125, 0.55908203125, 0.620849609375, 0.6826171875, 0.744384765625, 0.80615234375, 0.867919921875, 0.9296875, 0.991455078125, 1.05322265625, 1.114990234375, 1.1767578125, 1.238525390625, 1.30029296875, 1.362060546875, 1.423828125, 1.485595703125, 1.54736328125, 1.609130859375, 1.6708984375, 1.732666015625, 1.79443359375, 1.856201171875, 1.91796875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 8.0, 4.0, 6.0, 6.0, 6.0, 9.0, 5.0, 12.0, 10.0, 19.0, 16.0, 22.0, 40.0, 31.0, 30.0, 28.0, 29.0, 35.0, 41.0, 32.0, 30.0, 41.0, 25.0, 39.0, 46.0, 44.0, 39.0, 41.0, 32.0, 32.0, 36.0, 29.0, 27.0, 22.0, 17.0, 19.0, 18.0, 19.0, 14.0, 8.0, 9.0, 8.0, 4.0, 8.0, 2.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.861328125, -0.83636474609375, -0.8114013671875, -0.78643798828125, -0.761474609375, -0.73651123046875, -0.7115478515625, -0.68658447265625, -0.66162109375, -0.63665771484375, -0.6116943359375, -0.58673095703125, -0.561767578125, -0.53680419921875, -0.5118408203125, -0.48687744140625, -0.4619140625, -0.43695068359375, -0.4119873046875, -0.38702392578125, -0.362060546875, -0.33709716796875, -0.3121337890625, -0.28717041015625, -0.26220703125, -0.23724365234375, -0.2122802734375, -0.18731689453125, -0.162353515625, -0.13739013671875, -0.1124267578125, -0.08746337890625, -0.0625, -0.03753662109375, -0.0125732421875, 0.01239013671875, 0.037353515625, 0.06231689453125, 0.0872802734375, 0.11224365234375, 0.13720703125, 0.16217041015625, 0.1871337890625, 0.21209716796875, 0.237060546875, 0.26202392578125, 0.2869873046875, 0.31195068359375, 0.3369140625, 0.36187744140625, 0.3868408203125, 0.41180419921875, 0.436767578125, 0.46173095703125, 0.4866943359375, 0.51165771484375, 0.53662109375, 0.56158447265625, 0.5865478515625, 0.61151123046875, 0.636474609375, 0.66143798828125, 0.6864013671875, 0.71136474609375, 0.736328125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 6.0, 8.0, 14.0, 15.0, 17.0, 30.0, 40.0, 73.0, 108.0, 220.0, 447.0, 957.0, 2212.0, 6001.0, 21198.0, 104772.0, 580578.0, 271569.0, 43307.0, 10763.0, 3480.0, 1397.0, 580.0, 290.0, 173.0, 98.0, 65.0, 35.0, 29.0, 17.0, 18.0, 6.0, 8.0, 4.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87548828125, -0.8427505493164062, -0.8100128173828125, -0.7772750854492188, -0.744537353515625, -0.7117996215820312, -0.6790618896484375, -0.6463241577148438, -0.61358642578125, -0.5808486938476562, -0.5481109619140625, -0.5153732299804688, -0.482635498046875, -0.44989776611328125, -0.4171600341796875, -0.38442230224609375, -0.3516845703125, -0.31894683837890625, -0.2862091064453125, -0.25347137451171875, -0.220733642578125, -0.18799591064453125, -0.1552581787109375, -0.12252044677734375, -0.08978271484375, -0.05704498291015625, -0.0243072509765625, 0.00843048095703125, 0.041168212890625, 0.07390594482421875, 0.1066436767578125, 0.13938140869140625, 0.172119140625, 0.20485687255859375, 0.2375946044921875, 0.27033233642578125, 0.303070068359375, 0.33580780029296875, 0.3685455322265625, 0.40128326416015625, 0.43402099609375, 0.46675872802734375, 0.4994964599609375, 0.5322341918945312, 0.564971923828125, 0.5977096557617188, 0.6304473876953125, 0.6631851196289062, 0.6959228515625, 0.7286605834960938, 0.7613983154296875, 0.7941360473632812, 0.826873779296875, 0.8596115112304688, 0.8923492431640625, 0.9250869750976562, 0.95782470703125, 0.9905624389648438, 1.0233001708984375, 1.0560379028320312, 1.088775634765625, 1.1215133666992188, 1.1542510986328125, 1.1869888305664062, 1.2197265625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 3.0, 3.0, 9.0, 5.0, 11.0, 9.0, 24.0, 9.0, 33.0, 47.0, 56.0, 65.0, 86.0, 131.0, 105.0, 93.0, 81.0, 48.0, 43.0, 35.0, 27.0, 17.0, 12.0, 15.0, 9.0, 4.0, 7.0, 4.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001920461654663086, -0.00018587149679660797, -0.00017969682812690735, -0.00017352215945720673, -0.0001673474907875061, -0.00016117282211780548, -0.00015499815344810486, -0.00014882348477840424, -0.0001426488161087036, -0.000136474147439003, -0.00013029947876930237, -0.00012412481009960175, -0.00011795014142990112, -0.0001117754727602005, -0.00010560080409049988, -9.942613542079926e-05, -9.325146675109863e-05, -8.707679808139801e-05, -8.090212941169739e-05, -7.472746074199677e-05, -6.855279207229614e-05, -6.237812340259552e-05, -5.62034547328949e-05, -5.0028786063194275e-05, -4.385411739349365e-05, -3.767944872379303e-05, -3.150478005409241e-05, -2.5330111384391785e-05, -1.9155442714691162e-05, -1.298077404499054e-05, -6.806105375289917e-06, -6.314367055892944e-07, 5.543231964111328e-06, 1.171790063381195e-05, 1.7892569303512573e-05, 2.4067237973213196e-05, 3.024190664291382e-05, 3.641657531261444e-05, 4.2591243982315063e-05, 4.8765912652015686e-05, 5.494058132171631e-05, 6.111524999141693e-05, 6.728991866111755e-05, 7.346458733081818e-05, 7.96392560005188e-05, 8.581392467021942e-05, 9.198859333992004e-05, 9.816326200962067e-05, 0.00010433793067932129, 0.00011051259934902191, 0.00011668726801872253, 0.00012286193668842316, 0.00012903660535812378, 0.0001352112740278244, 0.00014138594269752502, 0.00014756061136722565, 0.00015373528003692627, 0.0001599099487066269, 0.00016608461737632751, 0.00017225928604602814, 0.00017843395471572876, 0.00018460862338542938, 0.00019078329205513, 0.00019695796072483063, 0.00020313262939453125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 12.0, 11.0, 11.0, 23.0, 27.0, 50.0, 88.0, 88.0, 183.0, 293.0, 496.0, 1045.0, 2073.0, 4919.0, 13226.0, 44361.0, 211102.0, 557153.0, 158652.0, 35567.0, 10980.0, 4182.0, 1814.0, 946.0, 473.0, 273.0, 190.0, 100.0, 62.0, 51.0, 32.0, 15.0, 21.0, 16.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.79931640625, -0.7738723754882812, -0.7484283447265625, -0.7229843139648438, -0.697540283203125, -0.6720962524414062, -0.6466522216796875, -0.6212081909179688, -0.59576416015625, -0.5703201293945312, -0.5448760986328125, -0.5194320678710938, -0.493988037109375, -0.46854400634765625, -0.4430999755859375, -0.41765594482421875, -0.3922119140625, -0.36676788330078125, -0.3413238525390625, -0.31587982177734375, -0.290435791015625, -0.26499176025390625, -0.2395477294921875, -0.21410369873046875, -0.18865966796875, -0.16321563720703125, -0.1377716064453125, -0.11232757568359375, -0.086883544921875, -0.06143951416015625, -0.0359954833984375, -0.01055145263671875, 0.014892578125, 0.04033660888671875, 0.0657806396484375, 0.09122467041015625, 0.116668701171875, 0.14211273193359375, 0.1675567626953125, 0.19300079345703125, 0.21844482421875, 0.24388885498046875, 0.2693328857421875, 0.29477691650390625, 0.320220947265625, 0.34566497802734375, 0.3711090087890625, 0.39655303955078125, 0.4219970703125, 0.44744110107421875, 0.4728851318359375, 0.49832916259765625, 0.523773193359375, 0.5492172241210938, 0.5746612548828125, 0.6001052856445312, 0.62554931640625, 0.6509933471679688, 0.6764373779296875, 0.7018814086914062, 0.727325439453125, 0.7527694702148438, 0.7782135009765625, 0.8036575317382812, 0.8291015625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 9.0, 5.0, 9.0, 17.0, 15.0, 26.0, 30.0, 41.0, 52.0, 68.0, 100.0, 96.0, 125.0, 78.0, 91.0, 72.0, 45.0, 27.0, 33.0, 13.0, 17.0, 11.0, 7.0, 7.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.380859375, -0.36128997802734375, -0.3417205810546875, -0.32215118408203125, -0.302581787109375, -0.28301239013671875, -0.2634429931640625, -0.24387359619140625, -0.22430419921875, -0.20473480224609375, -0.1851654052734375, -0.16559600830078125, -0.146026611328125, -0.12645721435546875, -0.1068878173828125, -0.08731842041015625, -0.0677490234375, -0.04817962646484375, -0.0286102294921875, -0.00904083251953125, 0.010528564453125, 0.03009796142578125, 0.0496673583984375, 0.06923675537109375, 0.08880615234375, 0.10837554931640625, 0.1279449462890625, 0.14751434326171875, 0.167083740234375, 0.18665313720703125, 0.2062225341796875, 0.22579193115234375, 0.245361328125, 0.26493072509765625, 0.2845001220703125, 0.30406951904296875, 0.323638916015625, 0.34320831298828125, 0.3627777099609375, 0.38234710693359375, 0.40191650390625, 0.42148590087890625, 0.4410552978515625, 0.46062469482421875, 0.480194091796875, 0.49976348876953125, 0.5193328857421875, 0.5389022827148438, 0.5584716796875, 0.5780410766601562, 0.5976104736328125, 0.6171798706054688, 0.636749267578125, 0.6563186645507812, 0.6758880615234375, 0.6954574584960938, 0.71502685546875, 0.7345962524414062, 0.7541656494140625, 0.7737350463867188, 0.793304443359375, 0.8128738403320312, 0.8324432373046875, 0.8520126342773438, 0.87158203125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 9.0, 15.0, 13.0, 26.0, 46.0, 82.0, 104.0, 132.0, 142.0, 142.0, 104.0, 84.0, 48.0, 24.0, 16.0, 13.0, 5.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.289434432983398, -13.864534378051758, -13.4396333694458, -13.014732360839844, -12.589832305908203, -12.164932250976562, -11.740031242370605, -11.315130233764648, -10.890230178833008, -10.465330123901367, -10.04042911529541, -9.615528106689453, -9.190628051757812, -8.765727996826172, -8.340826988220215, -7.915926456451416, -7.491025924682617, -7.066125392913818, -6.6412248611450195, -6.216324329376221, -5.791423797607422, -5.366523265838623, -4.941622734069824, -4.516722202301025, -4.091821670532227, -3.6669211387634277, -3.242020606994629, -2.81712007522583, -2.3922195434570312, -1.9673190116882324, -1.5424184799194336, -1.1175179481506348, -0.6926183700561523, -0.2677178382873535, 0.1571826934814453, 0.5820832252502441, 1.006983757019043, 1.4318842887878418, 1.8567848205566406, 2.2816853523254395, 2.7065858840942383, 3.131486415863037, 3.556386947631836, 3.9812874794006348, 4.406188011169434, 4.831088542938232, 5.255989074707031, 5.68088960647583, 6.105790138244629, 6.530690670013428, 6.955591201782227, 7.380491733551025, 7.805392265319824, 8.230293273925781, 8.655193328857422, 9.080093383789062, 9.50499439239502, 9.929895401000977, 10.354795455932617, 10.779695510864258, 11.204596519470215, 11.629497528076172, 12.054397583007812, 12.479297637939453, 12.90419864654541]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 3.0, 5.0, 11.0, 10.0, 6.0, 8.0, 20.0, 19.0, 28.0, 24.0, 33.0, 38.0, 47.0, 64.0, 41.0, 49.0, 47.0, 52.0, 55.0, 56.0, 64.0, 54.0, 59.0, 49.0, 29.0, 33.0, 25.0, 19.0, 19.0, 6.0, 9.0, 8.0, 4.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.437862873077393, -5.237143516540527, -5.03642463684082, -4.835705280303955, -4.63498592376709, -4.434267044067383, -4.233547687530518, -4.032828330993652, -3.832109212875366, -3.63139009475708, -3.430670738220215, -3.2299516201019287, -3.0292325019836426, -2.8285131454467773, -2.627794027328491, -2.427074909210205, -2.22635555267334, -2.0256364345550537, -1.8249170780181885, -1.6241979598999023, -1.4234787225723267, -1.222759485244751, -1.0220403671264648, -0.8213211297988892, -0.6206018924713135, -0.4198826849460602, -0.21916347742080688, -0.018444299697875977, 0.1822749376296997, 0.3829941749572754, 0.5837132930755615, 0.7844325304031372, 0.9851522445678711, 1.1858714818954468, 1.3865907192230225, 1.5873098373413086, 1.7880290746688843, 1.98874831199646, 2.189467430114746, 2.3901867866516113, 2.5909059047698975, 2.7916250228881836, 2.992344379425049, 3.193063497543335, 3.393782615661621, 3.5945019721984863, 3.7952210903167725, 3.9959402084350586, 4.196659564971924, 4.397378921508789, 4.598097801208496, 4.798817157745361, 4.999536514282227, 5.200255393981934, 5.400974750518799, 5.601694107055664, 5.802412986755371, 6.003132343292236, 6.203851222991943, 6.404570579528809, 6.605289936065674, 6.806009292602539, 7.006728172302246, 7.207447528839111, 7.408166885375977]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 5.0, 8.0, 6.0, 14.0, 23.0, 28.0, 35.0, 72.0, 79.0, 137.0, 237.0, 364.0, 625.0, 1158.0, 2344.0, 5111.0, 12866.0, 45494.0, 622952.0, 3412498.0, 62778.0, 15823.0, 5863.0, 2679.0, 1322.0, 668.0, 402.0, 247.0, 163.0, 92.0, 54.0, 33.0, 32.0, 17.0, 16.0, 8.0, 5.0, 7.0, 2.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1796875, -2.109588623046875, -2.03948974609375, -1.969390869140625, -1.8992919921875, -1.829193115234375, -1.75909423828125, -1.688995361328125, -1.618896484375, -1.548797607421875, -1.47869873046875, -1.408599853515625, -1.3385009765625, -1.268402099609375, -1.19830322265625, -1.128204345703125, -1.05810546875, -0.988006591796875, -0.91790771484375, -0.847808837890625, -0.7777099609375, -0.707611083984375, -0.63751220703125, -0.567413330078125, -0.497314453125, -0.427215576171875, -0.35711669921875, -0.287017822265625, -0.2169189453125, -0.146820068359375, -0.07672119140625, -0.006622314453125, 0.0634765625, 0.133575439453125, 0.20367431640625, 0.273773193359375, 0.3438720703125, 0.413970947265625, 0.48406982421875, 0.554168701171875, 0.624267578125, 0.694366455078125, 0.76446533203125, 0.834564208984375, 0.9046630859375, 0.974761962890625, 1.04486083984375, 1.114959716796875, 1.18505859375, 1.255157470703125, 1.32525634765625, 1.395355224609375, 1.4654541015625, 1.535552978515625, 1.60565185546875, 1.675750732421875, 1.745849609375, 1.815948486328125, 1.88604736328125, 1.956146240234375, 2.0262451171875, 2.096343994140625, 2.16644287109375, 2.236541748046875, 2.306640625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 1.0, 5.0, 8.0, 10.0, 16.0, 14.0, 16.0, 34.0, 35.0, 39.0, 46.0, 45.0, 54.0, 74.0, 65.0, 75.0, 61.0, 66.0, 59.0, 47.0, 40.0, 46.0, 32.0, 25.0, 21.0, 17.0, 7.0, 16.0, 3.0, 5.0, 8.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.263427734375, -0.25573158264160156, -0.24803543090820312, -0.2403392791748047, -0.23264312744140625, -0.2249469757080078, -0.21725082397460938, -0.20955467224121094, -0.2018585205078125, -0.19416236877441406, -0.18646621704101562, -0.1787700653076172, -0.17107391357421875, -0.1633777618408203, -0.15568161010742188, -0.14798545837402344, -0.140289306640625, -0.13259315490722656, -0.12489700317382812, -0.11720085144042969, -0.10950469970703125, -0.10180854797363281, -0.09411239624023438, -0.08641624450683594, -0.0787200927734375, -0.07102394104003906, -0.06332778930664062, -0.05563163757324219, -0.04793548583984375, -0.04023933410644531, -0.032543182373046875, -0.024847030639648438, -0.01715087890625, -0.009454727172851562, -0.001758575439453125, 0.0059375762939453125, 0.01363372802734375, 0.021329879760742188, 0.029026031494140625, 0.03672218322753906, 0.0444183349609375, 0.05211448669433594, 0.059810638427734375, 0.06750679016113281, 0.07520294189453125, 0.08289909362792969, 0.09059524536132812, 0.09829139709472656, 0.105987548828125, 0.11368370056152344, 0.12137985229492188, 0.1290760040283203, 0.13677215576171875, 0.1444683074951172, 0.15216445922851562, 0.15986061096191406, 0.1675567626953125, 0.17525291442871094, 0.18294906616210938, 0.1906452178955078, 0.19834136962890625, 0.2060375213623047, 0.21373367309570312, 0.22142982482910156, 0.2291259765625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 8.0, 10.0, 11.0, 23.0, 16.0, 21.0, 32.0, 41.0, 65.0, 100.0, 146.0, 296.0, 554.0, 1232.0, 3108.0, 10359.0, 57428.0, 3774256.0, 312609.0, 24270.0, 5880.0, 2008.0, 801.0, 362.0, 210.0, 133.0, 78.0, 61.0, 41.0, 26.0, 22.0, 20.0, 14.0, 8.0, 9.0, 5.0, 4.0, 7.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0], "bins": [-4.11328125, -3.998321533203125, -3.88336181640625, -3.768402099609375, -3.6534423828125, -3.538482666015625, -3.42352294921875, -3.308563232421875, -3.193603515625, -3.078643798828125, -2.96368408203125, -2.848724365234375, -2.7337646484375, -2.618804931640625, -2.50384521484375, -2.388885498046875, -2.27392578125, -2.158966064453125, -2.04400634765625, -1.929046630859375, -1.8140869140625, -1.699127197265625, -1.58416748046875, -1.469207763671875, -1.354248046875, -1.239288330078125, -1.12432861328125, -1.009368896484375, -0.8944091796875, -0.779449462890625, -0.66448974609375, -0.549530029296875, -0.4345703125, -0.319610595703125, -0.20465087890625, -0.089691162109375, 0.0252685546875, 0.140228271484375, 0.25518798828125, 0.370147705078125, 0.485107421875, 0.600067138671875, 0.71502685546875, 0.829986572265625, 0.9449462890625, 1.059906005859375, 1.17486572265625, 1.289825439453125, 1.40478515625, 1.519744873046875, 1.63470458984375, 1.749664306640625, 1.8646240234375, 1.979583740234375, 2.09454345703125, 2.209503173828125, 2.324462890625, 2.439422607421875, 2.55438232421875, 2.669342041015625, 2.7843017578125, 2.899261474609375, 3.01422119140625, 3.129180908203125, 3.244140625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 4.0, 10.0, 12.0, 21.0, 32.0, 70.0, 148.0, 535.0, 2622.0, 366.0, 123.0, 50.0, 33.0, 19.0, 16.0, 3.0, 7.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96630859375, -0.9249649047851562, -0.8836212158203125, -0.8422775268554688, -0.800933837890625, -0.7595901489257812, -0.7182464599609375, -0.6769027709960938, -0.63555908203125, -0.5942153930664062, -0.5528717041015625, -0.5115280151367188, -0.470184326171875, -0.42884063720703125, -0.3874969482421875, -0.34615325927734375, -0.3048095703125, -0.26346588134765625, -0.2221221923828125, -0.18077850341796875, -0.139434814453125, -0.09809112548828125, -0.0567474365234375, -0.01540374755859375, 0.02593994140625, 0.06728363037109375, 0.1086273193359375, 0.14997100830078125, 0.191314697265625, 0.23265838623046875, 0.2740020751953125, 0.31534576416015625, 0.356689453125, 0.39803314208984375, 0.4393768310546875, 0.48072052001953125, 0.522064208984375, 0.5634078979492188, 0.6047515869140625, 0.6460952758789062, 0.68743896484375, 0.7287826538085938, 0.7701263427734375, 0.8114700317382812, 0.852813720703125, 0.8941574096679688, 0.9355010986328125, 0.9768447875976562, 1.0181884765625, 1.0595321655273438, 1.1008758544921875, 1.1422195434570312, 1.183563232421875, 1.2249069213867188, 1.2662506103515625, 1.3075942993164062, 1.34893798828125, 1.3902816772460938, 1.4316253662109375, 1.4729690551757812, 1.514312744140625, 1.5556564331054688, 1.5970001220703125, 1.6383438110351562, 1.6796875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 9.0, 19.0, 37.0, 72.0, 113.0, 179.0, 171.0, 135.0, 114.0, 61.0, 43.0, 17.0, 11.0, 9.0, 6.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.526845455169678, -7.326095104217529, -7.125345230102539, -6.924594879150391, -6.723844528198242, -6.523094177246094, -6.3223443031311035, -6.121593952178955, -5.920843601226807, -5.720093250274658, -5.519343376159668, -5.3185930252075195, -5.117842674255371, -4.917092323303223, -4.716342449188232, -4.515592098236084, -4.314842224121094, -4.114091873168945, -3.913341760635376, -3.7125916481018066, -3.511841297149658, -3.311091184616089, -3.1103410720825195, -2.909590721130371, -2.7088403701782227, -2.5080902576446533, -2.307339906692505, -2.1065897941589355, -1.905839443206787, -1.7050893306732178, -1.5043390989303589, -1.3035888671875, -1.1028385162353516, -0.9020882844924927, -0.7013380527496338, -0.5005878806114197, -0.2998376488685608, -0.09908747673034668, 0.10166275501251221, 0.3024129867553711, 0.50316321849823, 0.7039134502410889, 0.9046636819839478, 1.1054139137268066, 1.306164026260376, 1.5069142580032349, 1.7076644897460938, 1.9084147214889526, 2.1091649532318115, 2.309915065765381, 2.5106654167175293, 2.7114155292510986, 2.912165880203247, 3.1129159927368164, 3.313666343688965, 3.514416456222534, 3.7151665687561035, 3.915916681289673, 4.116666793823242, 4.317417144775391, 4.518167495727539, 4.7189178466796875, 4.919667720794678, 5.120418071746826, 5.321168422698975]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 5.0, 6.0, 4.0, 7.0, 9.0, 12.0, 20.0, 21.0, 18.0, 22.0, 32.0, 27.0, 25.0, 31.0, 40.0, 37.0, 35.0, 52.0, 33.0, 56.0, 44.0, 31.0, 50.0, 41.0, 41.0, 44.0, 31.0, 27.0, 31.0, 33.0, 17.0, 18.0, 21.0, 18.0, 12.0, 15.0, 5.0, 8.0, 11.0, 2.0, 6.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9252784252166748, -1.85677170753479, -1.7882649898529053, -1.7197582721710205, -1.6512515544891357, -1.582744836807251, -1.5142381191253662, -1.4457314014434814, -1.3772246837615967, -1.308717966079712, -1.2402112483978271, -1.1717045307159424, -1.1031978130340576, -1.0346910953521729, -0.9661843776702881, -0.8976776599884033, -0.8291709423065186, -0.7606642246246338, -0.692157506942749, -0.6236507892608643, -0.5551440715789795, -0.4866373538970947, -0.41813063621520996, -0.3496239185333252, -0.28111720085144043, -0.21261048316955566, -0.1441037654876709, -0.07559704780578613, -0.007090330123901367, 0.0614163875579834, 0.12992310523986816, 0.19842982292175293, 0.2669367790222168, 0.33544349670410156, 0.40395021438598633, 0.4724569320678711, 0.5409636497497559, 0.6094703674316406, 0.6779770851135254, 0.7464838027954102, 0.8149905204772949, 0.8834972381591797, 0.9520039558410645, 1.0205106735229492, 1.089017391204834, 1.1575241088867188, 1.2260308265686035, 1.2945375442504883, 1.363044261932373, 1.4315509796142578, 1.5000576972961426, 1.5685644149780273, 1.637071132659912, 1.7055778503417969, 1.7740845680236816, 1.8425912857055664, 1.9110980033874512, 1.979604721069336, 2.0481114387512207, 2.1166181564331055, 2.1851248741149902, 2.253631591796875, 2.3221383094787598, 2.3906450271606445, 2.4591517448425293]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 6.0, 7.0, 17.0, 35.0, 42.0, 51.0, 102.0, 238.0, 473.0, 990.0, 2601.0, 7598.0, 27643.0, 124161.0, 559599.0, 253760.0, 51407.0, 13076.0, 3971.0, 1423.0, 656.0, 305.0, 164.0, 85.0, 63.0, 35.0, 19.0, 7.0, 9.0, 4.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.990234375, -2.898834228515625, -2.80743408203125, -2.716033935546875, -2.6246337890625, -2.533233642578125, -2.44183349609375, -2.350433349609375, -2.259033203125, -2.167633056640625, -2.07623291015625, -1.984832763671875, -1.8934326171875, -1.802032470703125, -1.71063232421875, -1.619232177734375, -1.52783203125, -1.436431884765625, -1.34503173828125, -1.253631591796875, -1.1622314453125, -1.070831298828125, -0.97943115234375, -0.888031005859375, -0.796630859375, -0.705230712890625, -0.61383056640625, -0.522430419921875, -0.4310302734375, -0.339630126953125, -0.24822998046875, -0.156829833984375, -0.0654296875, 0.025970458984375, 0.11737060546875, 0.208770751953125, 0.3001708984375, 0.391571044921875, 0.48297119140625, 0.574371337890625, 0.665771484375, 0.757171630859375, 0.84857177734375, 0.939971923828125, 1.0313720703125, 1.122772216796875, 1.21417236328125, 1.305572509765625, 1.39697265625, 1.488372802734375, 1.57977294921875, 1.671173095703125, 1.7625732421875, 1.853973388671875, 1.94537353515625, 2.036773681640625, 2.128173828125, 2.219573974609375, 2.31097412109375, 2.402374267578125, 2.4937744140625, 2.585174560546875, 2.67657470703125, 2.767974853515625, 2.859375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 2.0, 9.0, 9.0, 11.0, 14.0, 24.0, 26.0, 29.0, 38.0, 40.0, 38.0, 51.0, 64.0, 45.0, 65.0, 73.0, 65.0, 62.0, 53.0, 48.0, 44.0, 39.0, 33.0, 29.0, 17.0, 17.0, 10.0, 7.0, 14.0, 5.0, 4.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.271240234375, -0.26348876953125, -0.2557373046875, -0.24798583984375, -0.240234375, -0.23248291015625, -0.2247314453125, -0.21697998046875, -0.209228515625, -0.20147705078125, -0.1937255859375, -0.18597412109375, -0.17822265625, -0.17047119140625, -0.1627197265625, -0.15496826171875, -0.147216796875, -0.13946533203125, -0.1317138671875, -0.12396240234375, -0.1162109375, -0.10845947265625, -0.1007080078125, -0.09295654296875, -0.085205078125, -0.07745361328125, -0.0697021484375, -0.06195068359375, -0.05419921875, -0.04644775390625, -0.0386962890625, -0.03094482421875, -0.023193359375, -0.01544189453125, -0.0076904296875, 6.103515625e-05, 0.0078125, 0.01556396484375, 0.0233154296875, 0.03106689453125, 0.038818359375, 0.04656982421875, 0.0543212890625, 0.06207275390625, 0.06982421875, 0.07757568359375, 0.0853271484375, 0.09307861328125, 0.100830078125, 0.10858154296875, 0.1163330078125, 0.12408447265625, 0.1318359375, 0.13958740234375, 0.1473388671875, 0.15509033203125, 0.162841796875, 0.17059326171875, 0.1783447265625, 0.18609619140625, 0.19384765625, 0.20159912109375, 0.2093505859375, 0.21710205078125, 0.224853515625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 10.0, 12.0, 13.0, 24.0, 25.0, 28.0, 51.0, 61.0, 73.0, 107.0, 155.0, 200.0, 267.0, 399.0, 598.0, 964.0, 1672.0, 3184.0, 7277.0, 18855.0, 56290.0, 182664.0, 460647.0, 212541.0, 64496.0, 21442.0, 8154.0, 3448.0, 1810.0, 1009.0, 634.0, 391.0, 295.0, 206.0, 143.0, 102.0, 69.0, 59.0, 37.0, 29.0, 29.0, 30.0, 20.0, 10.0, 8.0, 5.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.5048828125, -1.4586639404296875, -1.412445068359375, -1.3662261962890625, -1.32000732421875, -1.2737884521484375, -1.227569580078125, -1.1813507080078125, -1.1351318359375, -1.0889129638671875, -1.042694091796875, -0.9964752197265625, -0.95025634765625, -0.9040374755859375, -0.857818603515625, -0.8115997314453125, -0.765380859375, -0.7191619873046875, -0.672943115234375, -0.6267242431640625, -0.58050537109375, -0.5342864990234375, -0.488067626953125, -0.4418487548828125, -0.3956298828125, -0.3494110107421875, -0.303192138671875, -0.2569732666015625, -0.21075439453125, -0.1645355224609375, -0.118316650390625, -0.0720977783203125, -0.02587890625, 0.0203399658203125, 0.066558837890625, 0.1127777099609375, 0.15899658203125, 0.2052154541015625, 0.251434326171875, 0.2976531982421875, 0.3438720703125, 0.3900909423828125, 0.436309814453125, 0.4825286865234375, 0.52874755859375, 0.5749664306640625, 0.621185302734375, 0.6674041748046875, 0.713623046875, 0.7598419189453125, 0.806060791015625, 0.8522796630859375, 0.89849853515625, 0.9447174072265625, 0.990936279296875, 1.0371551513671875, 1.0833740234375, 1.1295928955078125, 1.175811767578125, 1.2220306396484375, 1.26824951171875, 1.3144683837890625, 1.360687255859375, 1.4069061279296875, 1.453125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 7.0, 11.0, 11.0, 7.0, 14.0, 12.0, 12.0, 15.0, 13.0, 25.0, 30.0, 31.0, 27.0, 36.0, 39.0, 28.0, 36.0, 53.0, 38.0, 38.0, 43.0, 29.0, 40.0, 39.0, 27.0, 44.0, 41.0, 35.0, 29.0, 32.0, 14.0, 24.0, 21.0, 18.0, 16.0, 12.0, 8.0, 7.0, 6.0, 15.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.8447265625, -0.8186492919921875, -0.792572021484375, -0.7664947509765625, -0.74041748046875, -0.7143402099609375, -0.688262939453125, -0.6621856689453125, -0.6361083984375, -0.6100311279296875, -0.583953857421875, -0.5578765869140625, -0.53179931640625, -0.5057220458984375, -0.479644775390625, -0.4535675048828125, -0.427490234375, -0.4014129638671875, -0.375335693359375, -0.3492584228515625, -0.32318115234375, -0.2971038818359375, -0.271026611328125, -0.2449493408203125, -0.2188720703125, -0.1927947998046875, -0.166717529296875, -0.1406402587890625, -0.11456298828125, -0.0884857177734375, -0.062408447265625, -0.0363311767578125, -0.01025390625, 0.0158233642578125, 0.041900634765625, 0.0679779052734375, 0.09405517578125, 0.1201324462890625, 0.146209716796875, 0.1722869873046875, 0.1983642578125, 0.2244415283203125, 0.250518798828125, 0.2765960693359375, 0.30267333984375, 0.3287506103515625, 0.354827880859375, 0.3809051513671875, 0.406982421875, 0.4330596923828125, 0.459136962890625, 0.4852142333984375, 0.51129150390625, 0.5373687744140625, 0.563446044921875, 0.5895233154296875, 0.6156005859375, 0.6416778564453125, 0.667755126953125, 0.6938323974609375, 0.71990966796875, 0.7459869384765625, 0.772064208984375, 0.7981414794921875, 0.82421875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 9.0, 9.0, 11.0, 19.0, 24.0, 37.0, 74.0, 100.0, 187.0, 362.0, 767.0, 2068.0, 6387.0, 27190.0, 243989.0, 677669.0, 71563.0, 12361.0, 3326.0, 1251.0, 522.0, 260.0, 138.0, 83.0, 51.0, 29.0, 18.0, 8.0, 12.0, 7.0, 7.0, 3.0, 4.0, 5.0, 3.0, 0.0, 3.0], "bins": [-2.1640625, -2.1128387451171875, -2.061614990234375, -2.0103912353515625, -1.95916748046875, -1.9079437255859375, -1.856719970703125, -1.8054962158203125, -1.7542724609375, -1.7030487060546875, -1.651824951171875, -1.6006011962890625, -1.54937744140625, -1.4981536865234375, -1.446929931640625, -1.3957061767578125, -1.344482421875, -1.2932586669921875, -1.242034912109375, -1.1908111572265625, -1.13958740234375, -1.0883636474609375, -1.037139892578125, -0.9859161376953125, -0.9346923828125, -0.8834686279296875, -0.832244873046875, -0.7810211181640625, -0.72979736328125, -0.6785736083984375, -0.627349853515625, -0.5761260986328125, -0.52490234375, -0.4736785888671875, -0.422454833984375, -0.3712310791015625, -0.32000732421875, -0.2687835693359375, -0.217559814453125, -0.1663360595703125, -0.1151123046875, -0.0638885498046875, -0.012664794921875, 0.0385589599609375, 0.08978271484375, 0.1410064697265625, 0.192230224609375, 0.2434539794921875, 0.294677734375, 0.3459014892578125, 0.397125244140625, 0.4483489990234375, 0.49957275390625, 0.5507965087890625, 0.602020263671875, 0.6532440185546875, 0.7044677734375, 0.7556915283203125, 0.806915283203125, 0.8581390380859375, 0.90936279296875, 0.9605865478515625, 1.011810302734375, 1.0630340576171875, 1.1142578125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 6.0, 8.0, 12.0, 10.0, 10.0, 11.0, 17.0, 24.0, 46.0, 42.0, 59.0, 70.0, 79.0, 87.0, 87.0, 70.0, 71.0, 55.0, 44.0, 49.0, 35.0, 28.0, 15.0, 14.0, 9.0, 10.0, 9.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00016927719116210938, -0.0001636296510696411, -0.00015798211097717285, -0.0001523345708847046, -0.00014668703079223633, -0.00014103949069976807, -0.0001353919506072998, -0.00012974441051483154, -0.00012409687042236328, -0.00011844933032989502, -0.00011280179023742676, -0.0001071542501449585, -0.00010150671005249023, -9.585916996002197e-05, -9.021162986755371e-05, -8.456408977508545e-05, -7.891654968261719e-05, -7.326900959014893e-05, -6.762146949768066e-05, -6.19739294052124e-05, -5.632638931274414e-05, -5.067884922027588e-05, -4.503130912780762e-05, -3.9383769035339355e-05, -3.3736228942871094e-05, -2.8088688850402832e-05, -2.244114875793457e-05, -1.679360866546631e-05, -1.1146068572998047e-05, -5.498528480529785e-06, 1.4901161193847656e-07, 5.796551704406738e-06, 1.1444091796875e-05, 1.7091631889343262e-05, 2.2739171981811523e-05, 2.8386712074279785e-05, 3.403425216674805e-05, 3.968179225921631e-05, 4.532933235168457e-05, 5.097687244415283e-05, 5.6624412536621094e-05, 6.227195262908936e-05, 6.791949272155762e-05, 7.356703281402588e-05, 7.921457290649414e-05, 8.48621129989624e-05, 9.050965309143066e-05, 9.615719318389893e-05, 0.00010180473327636719, 0.00010745227336883545, 0.00011309981346130371, 0.00011874735355377197, 0.00012439489364624023, 0.0001300424337387085, 0.00013568997383117676, 0.00014133751392364502, 0.00014698505401611328, 0.00015263259410858154, 0.0001582801342010498, 0.00016392767429351807, 0.00016957521438598633, 0.0001752227544784546, 0.00018087029457092285, 0.0001865178346633911, 0.00019216537475585938]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 5.0, 6.0, 7.0, 6.0, 7.0, 10.0, 11.0, 22.0, 21.0, 34.0, 67.0, 103.0, 164.0, 301.0, 498.0, 1041.0, 2211.0, 5862.0, 20897.0, 145685.0, 756667.0, 90018.0, 16205.0, 4785.0, 1951.0, 845.0, 452.0, 245.0, 156.0, 86.0, 64.0, 38.0, 22.0, 20.0, 13.0, 11.0, 2.0, 6.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.59375, -1.542999267578125, -1.49224853515625, -1.441497802734375, -1.3907470703125, -1.339996337890625, -1.28924560546875, -1.238494873046875, -1.187744140625, -1.136993408203125, -1.08624267578125, -1.035491943359375, -0.9847412109375, -0.933990478515625, -0.88323974609375, -0.832489013671875, -0.78173828125, -0.730987548828125, -0.68023681640625, -0.629486083984375, -0.5787353515625, -0.527984619140625, -0.47723388671875, -0.426483154296875, -0.375732421875, -0.324981689453125, -0.27423095703125, -0.223480224609375, -0.1727294921875, -0.121978759765625, -0.07122802734375, -0.020477294921875, 0.0302734375, 0.081024169921875, 0.13177490234375, 0.182525634765625, 0.2332763671875, 0.284027099609375, 0.33477783203125, 0.385528564453125, 0.436279296875, 0.487030029296875, 0.53778076171875, 0.588531494140625, 0.6392822265625, 0.690032958984375, 0.74078369140625, 0.791534423828125, 0.84228515625, 0.893035888671875, 0.94378662109375, 0.994537353515625, 1.0452880859375, 1.096038818359375, 1.14678955078125, 1.197540283203125, 1.248291015625, 1.299041748046875, 1.34979248046875, 1.400543212890625, 1.4512939453125, 1.502044677734375, 1.55279541015625, 1.603546142578125, 1.654296875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 5.0, 6.0, 4.0, 12.0, 12.0, 12.0, 16.0, 23.0, 49.0, 63.0, 87.0, 100.0, 110.0, 123.0, 114.0, 63.0, 50.0, 44.0, 33.0, 11.0, 13.0, 6.0, 9.0, 6.0, 4.0, 8.0, 8.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6611328125, -0.63458251953125, -0.6080322265625, -0.58148193359375, -0.554931640625, -0.52838134765625, -0.5018310546875, -0.47528076171875, -0.44873046875, -0.42218017578125, -0.3956298828125, -0.36907958984375, -0.342529296875, -0.31597900390625, -0.2894287109375, -0.26287841796875, -0.236328125, -0.20977783203125, -0.1832275390625, -0.15667724609375, -0.130126953125, -0.10357666015625, -0.0770263671875, -0.05047607421875, -0.02392578125, 0.00262451171875, 0.0291748046875, 0.05572509765625, 0.082275390625, 0.10882568359375, 0.1353759765625, 0.16192626953125, 0.1884765625, 0.21502685546875, 0.2415771484375, 0.26812744140625, 0.294677734375, 0.32122802734375, 0.3477783203125, 0.37432861328125, 0.40087890625, 0.42742919921875, 0.4539794921875, 0.48052978515625, 0.507080078125, 0.53363037109375, 0.5601806640625, 0.58673095703125, 0.61328125, 0.63983154296875, 0.6663818359375, 0.69293212890625, 0.719482421875, 0.74603271484375, 0.7725830078125, 0.79913330078125, 0.82568359375, 0.85223388671875, 0.8787841796875, 0.90533447265625, 0.931884765625, 0.95843505859375, 0.9849853515625, 1.01153564453125, 1.0380859375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 14.0, 43.0, 123.0, 226.0, 315.0, 164.0, 76.0, 23.0, 9.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-39.48180389404297, -38.68068313598633, -37.87955856323242, -37.07843780517578, -36.277313232421875, -35.476192474365234, -34.675071716308594, -33.87394714355469, -33.07282638549805, -32.271705627441406, -31.4705810546875, -30.66946029663086, -29.868337631225586, -29.067214965820312, -28.26609230041504, -27.464969635009766, -26.663846969604492, -25.86272430419922, -25.061601638793945, -24.260478973388672, -23.45935821533203, -22.658235549926758, -21.857112884521484, -21.05599021911621, -20.254867553710938, -19.453744888305664, -18.65262222290039, -17.85150146484375, -17.050378799438477, -16.249256134033203, -15.44813346862793, -14.647010803222656, -13.845891952514648, -13.044769287109375, -12.243647575378418, -11.442524909973145, -10.641403198242188, -9.840280532836914, -9.03915786743164, -8.238035202026367, -7.43691349029541, -6.635791301727295, -5.83466911315918, -5.033546447753906, -4.232424259185791, -3.431302070617676, -2.6301794052124023, -1.829057216644287, -1.0279350280761719, -0.2268127202987671, 0.5743095874786377, 1.375432014465332, 2.1765542030334473, 2.9776763916015625, 3.778799057006836, 4.579921245574951, 5.381043434143066, 6.182165622711182, 6.983287811279297, 7.78441047668457, 8.585533142089844, 9.3866548538208, 10.187777519226074, 10.988899230957031, 11.790021896362305]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 8.0, 11.0, 13.0, 15.0, 13.0, 20.0, 20.0, 30.0, 29.0, 28.0, 35.0, 46.0, 36.0, 54.0, 50.0, 44.0, 54.0, 46.0, 55.0, 49.0, 45.0, 40.0, 37.0, 32.0, 36.0, 30.0, 21.0, 20.0, 15.0, 22.0, 12.0, 7.0, 10.0, 9.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.447265625, -6.256690979003906, -6.066116809844971, -5.875542640686035, -5.684967994689941, -5.494393348693848, -5.303819179534912, -5.113245010375977, -4.922670364379883, -4.732095718383789, -4.5415215492248535, -4.350947380065918, -4.160372734069824, -3.9697983264923096, -3.779223918914795, -3.5886495113372803, -3.3980751037597656, -3.207500696182251, -3.0169262886047363, -2.8263518810272217, -2.635777473449707, -2.4452030658721924, -2.2546286582946777, -2.064054250717163, -1.8734798431396484, -1.6829054355621338, -1.4923310279846191, -1.3017566204071045, -1.1111822128295898, -0.9206078052520752, -0.7300333976745605, -0.5394589900970459, -0.34888505935668945, -0.1583106517791748, 0.032263755798339844, 0.2228381633758545, 0.41341257095336914, 0.6039869785308838, 0.7945613861083984, 0.9851357936859131, 1.1757102012634277, 1.3662846088409424, 1.556859016418457, 1.7474334239959717, 1.9380078315734863, 2.128582239151001, 2.3191566467285156, 2.5097310543060303, 2.700305461883545, 2.8908798694610596, 3.081454277038574, 3.272028684616089, 3.4626030921936035, 3.653177499771118, 3.843751907348633, 4.034326553344727, 4.224900722503662, 4.415474891662598, 4.606049537658691, 4.796624183654785, 4.987198352813721, 5.177772521972656, 5.36834716796875, 5.558921813964844, 5.749495983123779]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 5.0, 11.0, 6.0, 13.0, 22.0, 38.0, 40.0, 50.0, 93.0, 153.0, 188.0, 313.0, 491.0, 850.0, 1513.0, 2962.0, 5859.0, 12775.0, 33804.0, 139076.0, 3604437.0, 307607.0, 50422.0, 17453.0, 7641.0, 3657.0, 2019.0, 1067.0, 638.0, 380.0, 240.0, 141.0, 96.0, 64.0, 41.0, 30.0, 24.0, 7.0, 18.0, 6.0, 10.0, 6.0, 0.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.9736328125, -1.9132232666015625, -1.852813720703125, -1.7924041748046875, -1.73199462890625, -1.6715850830078125, -1.611175537109375, -1.5507659912109375, -1.4903564453125, -1.4299468994140625, -1.369537353515625, -1.3091278076171875, -1.24871826171875, -1.1883087158203125, -1.127899169921875, -1.0674896240234375, -1.007080078125, -0.9466705322265625, -0.886260986328125, -0.8258514404296875, -0.76544189453125, -0.7050323486328125, -0.644622802734375, -0.5842132568359375, -0.5238037109375, -0.4633941650390625, -0.402984619140625, -0.3425750732421875, -0.28216552734375, -0.2217559814453125, -0.161346435546875, -0.1009368896484375, -0.04052734375, 0.0198822021484375, 0.080291748046875, 0.1407012939453125, 0.20111083984375, 0.2615203857421875, 0.321929931640625, 0.3823394775390625, 0.4427490234375, 0.5031585693359375, 0.563568115234375, 0.6239776611328125, 0.68438720703125, 0.7447967529296875, 0.805206298828125, 0.8656158447265625, 0.926025390625, 0.9864349365234375, 1.046844482421875, 1.1072540283203125, 1.16766357421875, 1.2280731201171875, 1.288482666015625, 1.3488922119140625, 1.4093017578125, 1.4697113037109375, 1.530120849609375, 1.5905303955078125, 1.65093994140625, 1.7113494873046875, 1.771759033203125, 1.8321685791015625, 1.892578125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 11.0, 8.0, 7.0, 23.0, 16.0, 21.0, 21.0, 33.0, 33.0, 42.0, 54.0, 62.0, 68.0, 61.0, 62.0, 71.0, 64.0, 67.0, 46.0, 45.0, 41.0, 36.0, 19.0, 25.0, 20.0, 8.0, 8.0, 6.0, 5.0, 8.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2471923828125, -0.23877525329589844, -0.23035812377929688, -0.2219409942626953, -0.21352386474609375, -0.2051067352294922, -0.19668960571289062, -0.18827247619628906, -0.1798553466796875, -0.17143821716308594, -0.16302108764648438, -0.1546039581298828, -0.14618682861328125, -0.1377696990966797, -0.12935256958007812, -0.12093544006347656, -0.112518310546875, -0.10410118103027344, -0.09568405151367188, -0.08726692199707031, -0.07884979248046875, -0.07043266296386719, -0.062015533447265625, -0.05359840393066406, -0.0451812744140625, -0.03676414489746094, -0.028347015380859375, -0.019929885864257812, -0.01151275634765625, -0.0030956268310546875, 0.005321502685546875, 0.013738632202148438, 0.02215576171875, 0.030572891235351562, 0.038990020751953125, 0.04740715026855469, 0.05582427978515625, 0.06424140930175781, 0.07265853881835938, 0.08107566833496094, 0.0894927978515625, 0.09790992736816406, 0.10632705688476562, 0.11474418640136719, 0.12316131591796875, 0.1315784454345703, 0.13999557495117188, 0.14841270446777344, 0.156829833984375, 0.16524696350097656, 0.17366409301757812, 0.1820812225341797, 0.19049835205078125, 0.1989154815673828, 0.20733261108398438, 0.21574974060058594, 0.2241668701171875, 0.23258399963378906, 0.24100112915039062, 0.2494182586669922, 0.25783538818359375, 0.2662525177001953, 0.2746696472167969, 0.28308677673339844, 0.29150390625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 6.0, 3.0, 10.0, 3.0, 9.0, 13.0, 15.0, 25.0, 26.0, 30.0, 47.0, 69.0, 85.0, 117.0, 173.0, 242.0, 406.0, 613.0, 1157.0, 2098.0, 4512.0, 11415.0, 34471.0, 203964.0, 3714227.0, 169614.0, 31422.0, 10464.0, 4151.0, 2026.0, 1042.0, 615.0, 393.0, 237.0, 148.0, 106.0, 84.0, 62.0, 56.0, 42.0, 20.0, 14.0, 17.0, 14.0, 8.0, 4.0, 2.0, 3.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.6328125, -2.54913330078125, -2.4654541015625, -2.38177490234375, -2.298095703125, -2.21441650390625, -2.1307373046875, -2.04705810546875, -1.96337890625, -1.87969970703125, -1.7960205078125, -1.71234130859375, -1.628662109375, -1.54498291015625, -1.4613037109375, -1.37762451171875, -1.2939453125, -1.21026611328125, -1.1265869140625, -1.04290771484375, -0.959228515625, -0.87554931640625, -0.7918701171875, -0.70819091796875, -0.62451171875, -0.54083251953125, -0.4571533203125, -0.37347412109375, -0.289794921875, -0.20611572265625, -0.1224365234375, -0.03875732421875, 0.044921875, 0.12860107421875, 0.2122802734375, 0.29595947265625, 0.379638671875, 0.46331787109375, 0.5469970703125, 0.63067626953125, 0.71435546875, 0.79803466796875, 0.8817138671875, 0.96539306640625, 1.049072265625, 1.13275146484375, 1.2164306640625, 1.30010986328125, 1.3837890625, 1.46746826171875, 1.5511474609375, 1.63482666015625, 1.718505859375, 1.80218505859375, 1.8858642578125, 1.96954345703125, 2.05322265625, 2.13690185546875, 2.2205810546875, 2.30426025390625, 2.387939453125, 2.47161865234375, 2.5552978515625, 2.63897705078125, 2.72265625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 4.0, 4.0, 11.0, 19.0, 22.0, 41.0, 45.0, 88.0, 221.0, 1189.0, 1852.0, 305.0, 126.0, 49.0, 41.0, 31.0, 5.0, 11.0, 6.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.318359375, -1.273040771484375, -1.22772216796875, -1.182403564453125, -1.1370849609375, -1.091766357421875, -1.04644775390625, -1.001129150390625, -0.955810546875, -0.910491943359375, -0.86517333984375, -0.819854736328125, -0.7745361328125, -0.729217529296875, -0.68389892578125, -0.638580322265625, -0.59326171875, -0.547943115234375, -0.50262451171875, -0.457305908203125, -0.4119873046875, -0.366668701171875, -0.32135009765625, -0.276031494140625, -0.230712890625, -0.185394287109375, -0.14007568359375, -0.094757080078125, -0.0494384765625, -0.004119873046875, 0.04119873046875, 0.086517333984375, 0.1318359375, 0.177154541015625, 0.22247314453125, 0.267791748046875, 0.3131103515625, 0.358428955078125, 0.40374755859375, 0.449066162109375, 0.494384765625, 0.539703369140625, 0.58502197265625, 0.630340576171875, 0.6756591796875, 0.720977783203125, 0.76629638671875, 0.811614990234375, 0.85693359375, 0.902252197265625, 0.94757080078125, 0.992889404296875, 1.0382080078125, 1.083526611328125, 1.12884521484375, 1.174163818359375, 1.219482421875, 1.264801025390625, 1.31011962890625, 1.355438232421875, 1.4007568359375, 1.446075439453125, 1.49139404296875, 1.536712646484375, 1.58203125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 4.0, 3.0, 1.0, 5.0, 7.0, 7.0, 13.0, 20.0, 27.0, 47.0, 53.0, 62.0, 88.0, 107.0, 101.0, 130.0, 74.0, 76.0, 57.0, 42.0, 21.0, 17.0, 19.0, 14.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-7.147331237792969, -6.9830403327941895, -6.818749904632568, -6.654458999633789, -6.49016809463501, -6.3258771896362305, -6.161586761474609, -5.99729585647583, -5.833004951477051, -5.6687140464782715, -5.50442361831665, -5.340132713317871, -5.175841808319092, -5.0115509033203125, -4.847260475158691, -4.682969570159912, -4.518679141998291, -4.354388236999512, -4.190097808837891, -4.025806903839111, -3.861515998840332, -3.697225332260132, -3.5329346656799316, -3.3686437606811523, -3.204353094100952, -3.040062427520752, -2.8757715225219727, -2.7114808559417725, -2.5471901893615723, -2.382899284362793, -2.2186086177825928, -2.0543179512023926, -1.8900272846221924, -1.7257364988327026, -1.561445713043213, -1.3971550464630127, -1.232864260673523, -1.0685734748840332, -0.9042827486991882, -0.7399920225143433, -0.5757012367248535, -0.41141048073768616, -0.2471197247505188, -0.08282896876335144, 0.08146178722381592, 0.24575257301330566, 0.41004329919815063, 0.5743340253829956, 0.7386248111724854, 0.9029155969619751, 1.0672063827514648, 1.231497049331665, 1.3957878351211548, 1.5600786209106445, 1.7243692874908447, 1.8886600732803345, 2.052950859069824, 2.2172415256500244, 2.3815324306488037, 2.545823097229004, 2.710114002227783, 2.8744046688079834, 3.0386953353881836, 3.202986240386963, 3.367276906967163]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 2.0, 8.0, 6.0, 7.0, 9.0, 14.0, 18.0, 16.0, 27.0, 28.0, 28.0, 37.0, 40.0, 39.0, 37.0, 44.0, 40.0, 45.0, 38.0, 51.0, 47.0, 32.0, 44.0, 34.0, 41.0, 32.0, 33.0, 30.0, 32.0, 27.0, 12.0, 22.0, 12.0, 14.0, 9.0, 10.0, 7.0, 7.0, 3.0, 6.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0], "bins": [-3.2771413326263428, -3.188575267791748, -3.1000092029571533, -3.0114431381225586, -2.922877311706543, -2.8343112468719482, -2.7457451820373535, -2.657179117202759, -2.568613052368164, -2.4800469875335693, -2.3914809226989746, -2.302915096282959, -2.2143490314483643, -2.1257829666137695, -2.037216901779175, -1.94865083694458, -1.8600850105285645, -1.7715189456939697, -1.6829530000686646, -1.5943869352340698, -1.5058209896087646, -1.41725492477417, -1.3286888599395752, -1.2401227951049805, -1.1515568494796753, -1.0629907846450806, -0.9744248390197754, -0.8858587741851807, -0.7972927689552307, -0.7087267637252808, -0.620160698890686, -0.5315946936607361, -0.44302845001220703, -0.3544624447822571, -0.26589640974998474, -0.1773303747177124, -0.08876436948776245, -0.0001983642578125, 0.08836770057678223, 0.17693370580673218, 0.26549971103668213, 0.3540657162666321, 0.4426317512989044, 0.5311977863311768, 0.6197637915611267, 0.7083297967910767, 0.7968958616256714, 0.8854618668556213, 0.9740278720855713, 1.062593936920166, 1.1511598825454712, 1.239725947380066, 1.328291893005371, 1.4168579578399658, 1.5054240226745605, 1.5939900875091553, 1.6825560331344604, 1.7711220979690552, 1.8596880435943604, 1.948254108428955, 2.03682017326355, 2.1253862380981445, 2.21395206451416, 2.302518129348755, 2.3910841941833496]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 8.0, 9.0, 13.0, 14.0, 23.0, 31.0, 51.0, 72.0, 112.0, 205.0, 353.0, 650.0, 1338.0, 2901.0, 6290.0, 15960.0, 48803.0, 231779.0, 628917.0, 72715.0, 22623.0, 8567.0, 3529.0, 1703.0, 815.0, 446.0, 237.0, 148.0, 69.0, 59.0, 51.0, 20.0, 17.0, 7.0, 9.0, 3.0, 2.0, 8.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.62109375, -2.5369873046875, -2.452880859375, -2.3687744140625, -2.28466796875, -2.2005615234375, -2.116455078125, -2.0323486328125, -1.9482421875, -1.8641357421875, -1.780029296875, -1.6959228515625, -1.61181640625, -1.5277099609375, -1.443603515625, -1.3594970703125, -1.275390625, -1.1912841796875, -1.107177734375, -1.0230712890625, -0.93896484375, -0.8548583984375, -0.770751953125, -0.6866455078125, -0.6025390625, -0.5184326171875, -0.434326171875, -0.3502197265625, -0.26611328125, -0.1820068359375, -0.097900390625, -0.0137939453125, 0.0703125, 0.1544189453125, 0.238525390625, 0.3226318359375, 0.40673828125, 0.4908447265625, 0.574951171875, 0.6590576171875, 0.7431640625, 0.8272705078125, 0.911376953125, 0.9954833984375, 1.07958984375, 1.1636962890625, 1.247802734375, 1.3319091796875, 1.416015625, 1.5001220703125, 1.584228515625, 1.6683349609375, 1.75244140625, 1.8365478515625, 1.920654296875, 2.0047607421875, 2.0888671875, 2.1729736328125, 2.257080078125, 2.3411865234375, 2.42529296875, 2.5093994140625, 2.593505859375, 2.6776123046875, 2.76171875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 6.0, 9.0, 9.0, 12.0, 12.0, 16.0, 19.0, 11.0, 26.0, 34.0, 36.0, 49.0, 32.0, 54.0, 46.0, 63.0, 41.0, 64.0, 63.0, 53.0, 42.0, 37.0, 36.0, 42.0, 32.0, 30.0, 23.0, 26.0, 13.0, 13.0, 9.0, 7.0, 9.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.25146484375, -0.24406814575195312, -0.23667144775390625, -0.22927474975585938, -0.2218780517578125, -0.21448135375976562, -0.20708465576171875, -0.19968795776367188, -0.192291259765625, -0.18489456176757812, -0.17749786376953125, -0.17010116577148438, -0.1627044677734375, -0.15530776977539062, -0.14791107177734375, -0.14051437377929688, -0.13311767578125, -0.12572097778320312, -0.11832427978515625, -0.11092758178710938, -0.1035308837890625, -0.09613418579101562, -0.08873748779296875, -0.08134078979492188, -0.073944091796875, -0.06654739379882812, -0.05915069580078125, -0.051753997802734375, -0.0443572998046875, -0.036960601806640625, -0.02956390380859375, -0.022167205810546875, -0.0147705078125, -0.007373809814453125, 2.288818359375e-05, 0.007419586181640625, 0.0148162841796875, 0.022212982177734375, 0.02960968017578125, 0.037006378173828125, 0.044403076171875, 0.051799774169921875, 0.05919647216796875, 0.06659317016601562, 0.0739898681640625, 0.08138656616210938, 0.08878326416015625, 0.09617996215820312, 0.10357666015625, 0.11097335815429688, 0.11837005615234375, 0.12576675415039062, 0.1331634521484375, 0.14056015014648438, 0.14795684814453125, 0.15535354614257812, 0.162750244140625, 0.17014694213867188, 0.17754364013671875, 0.18494033813476562, 0.1923370361328125, 0.19973373413085938, 0.20713043212890625, 0.21452713012695312, 0.221923828125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 6.0, 12.0, 9.0, 19.0, 25.0, 46.0, 71.0, 110.0, 189.0, 407.0, 804.0, 1867.0, 5354.0, 22370.0, 191639.0, 764198.0, 47615.0, 8957.0, 2650.0, 1056.0, 498.0, 266.0, 155.0, 79.0, 59.0, 41.0, 20.0, 15.0, 8.0, 3.0, 8.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.716796875, -3.6112060546875, -3.505615234375, -3.4000244140625, -3.29443359375, -3.1888427734375, -3.083251953125, -2.9776611328125, -2.8720703125, -2.7664794921875, -2.660888671875, -2.5552978515625, -2.44970703125, -2.3441162109375, -2.238525390625, -2.1329345703125, -2.02734375, -1.9217529296875, -1.816162109375, -1.7105712890625, -1.60498046875, -1.4993896484375, -1.393798828125, -1.2882080078125, -1.1826171875, -1.0770263671875, -0.971435546875, -0.8658447265625, -0.76025390625, -0.6546630859375, -0.549072265625, -0.4434814453125, -0.337890625, -0.2322998046875, -0.126708984375, -0.0211181640625, 0.08447265625, 0.1900634765625, 0.295654296875, 0.4012451171875, 0.5068359375, 0.6124267578125, 0.718017578125, 0.8236083984375, 0.92919921875, 1.0347900390625, 1.140380859375, 1.2459716796875, 1.3515625, 1.4571533203125, 1.562744140625, 1.6683349609375, 1.77392578125, 1.8795166015625, 1.985107421875, 2.0906982421875, 2.1962890625, 2.3018798828125, 2.407470703125, 2.5130615234375, 2.61865234375, 2.7242431640625, 2.829833984375, 2.9354248046875, 3.041015625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 2.0, 2.0, 6.0, 7.0, 5.0, 4.0, 8.0, 7.0, 10.0, 17.0, 21.0, 16.0, 25.0, 27.0, 27.0, 35.0, 42.0, 40.0, 42.0, 37.0, 45.0, 35.0, 50.0, 52.0, 43.0, 35.0, 34.0, 34.0, 39.0, 23.0, 30.0, 21.0, 19.0, 29.0, 22.0, 11.0, 13.0, 13.0, 6.0, 10.0, 9.0, 13.0, 2.0, 5.0, 7.0, 6.0, 4.0, 4.0, 2.0, 4.0, 3.0, 6.0], "bins": [-1.0263671875, -0.9971084594726562, -0.9678497314453125, -0.9385910034179688, -0.909332275390625, -0.8800735473632812, -0.8508148193359375, -0.8215560913085938, -0.79229736328125, -0.7630386352539062, -0.7337799072265625, -0.7045211791992188, -0.675262451171875, -0.6460037231445312, -0.6167449951171875, -0.5874862670898438, -0.5582275390625, -0.5289688110351562, -0.4997100830078125, -0.47045135498046875, -0.441192626953125, -0.41193389892578125, -0.3826751708984375, -0.35341644287109375, -0.32415771484375, -0.29489898681640625, -0.2656402587890625, -0.23638153076171875, -0.207122802734375, -0.17786407470703125, -0.1486053466796875, -0.11934661865234375, -0.090087890625, -0.06082916259765625, -0.0315704345703125, -0.00231170654296875, 0.026947021484375, 0.05620574951171875, 0.0854644775390625, 0.11472320556640625, 0.14398193359375, 0.17324066162109375, 0.2024993896484375, 0.23175811767578125, 0.261016845703125, 0.29027557373046875, 0.3195343017578125, 0.34879302978515625, 0.3780517578125, 0.40731048583984375, 0.4365692138671875, 0.46582794189453125, 0.495086669921875, 0.5243453979492188, 0.5536041259765625, 0.5828628540039062, 0.61212158203125, 0.6413803100585938, 0.6706390380859375, 0.6998977661132812, 0.729156494140625, 0.7584152221679688, 0.7876739501953125, 0.8169326782226562, 0.84619140625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 9.0, 7.0, 12.0, 10.0, 31.0, 54.0, 67.0, 107.0, 144.0, 263.0, 533.0, 900.0, 1971.0, 5674.0, 21678.0, 139358.0, 753335.0, 98717.0, 17317.0, 4674.0, 1829.0, 801.0, 411.0, 248.0, 154.0, 77.0, 67.0, 38.0, 19.0, 17.0, 11.0, 3.0, 5.0, 3.0, 8.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2802734375, -1.238189697265625, -1.19610595703125, -1.154022216796875, -1.1119384765625, -1.069854736328125, -1.02777099609375, -0.985687255859375, -0.943603515625, -0.901519775390625, -0.85943603515625, -0.817352294921875, -0.7752685546875, -0.733184814453125, -0.69110107421875, -0.649017333984375, -0.60693359375, -0.564849853515625, -0.52276611328125, -0.480682373046875, -0.4385986328125, -0.396514892578125, -0.35443115234375, -0.312347412109375, -0.270263671875, -0.228179931640625, -0.18609619140625, -0.144012451171875, -0.1019287109375, -0.059844970703125, -0.01776123046875, 0.024322509765625, 0.06640625, 0.108489990234375, 0.15057373046875, 0.192657470703125, 0.2347412109375, 0.276824951171875, 0.31890869140625, 0.360992431640625, 0.403076171875, 0.445159912109375, 0.48724365234375, 0.529327392578125, 0.5714111328125, 0.613494873046875, 0.65557861328125, 0.697662353515625, 0.73974609375, 0.781829833984375, 0.82391357421875, 0.865997314453125, 0.9080810546875, 0.950164794921875, 0.99224853515625, 1.034332275390625, 1.076416015625, 1.118499755859375, 1.16058349609375, 1.202667236328125, 1.2447509765625, 1.286834716796875, 1.32891845703125, 1.371002197265625, 1.4130859375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 9.0, 8.0, 10.0, 7.0, 20.0, 32.0, 56.0, 96.0, 171.0, 208.0, 159.0, 93.0, 43.0, 32.0, 18.0, 20.0, 5.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024402141571044922, -0.00023440830409526825, -0.00022479519248008728, -0.0002151820808649063, -0.00020556896924972534, -0.00019595585763454437, -0.0001863427460193634, -0.00017672963440418243, -0.00016711652278900146, -0.0001575034111738205, -0.00014789029955863953, -0.00013827718794345856, -0.0001286640763282776, -0.00011905096471309662, -0.00010943785309791565, -9.982474148273468e-05, -9.021162986755371e-05, -8.059851825237274e-05, -7.098540663719177e-05, -6.13722950220108e-05, -5.1759183406829834e-05, -4.2146071791648865e-05, -3.2532960176467896e-05, -2.2919848561286926e-05, -1.3306736946105957e-05, -3.693625330924988e-06, 5.9194862842559814e-06, 1.553259789943695e-05, 2.514570951461792e-05, 3.475882112979889e-05, 4.437193274497986e-05, 5.398504436016083e-05, 6.35981559753418e-05, 7.321126759052277e-05, 8.282437920570374e-05, 9.24374908208847e-05, 0.00010205060243606567, 0.00011166371405124664, 0.00012127682566642761, 0.00013088993728160858, 0.00014050304889678955, 0.00015011616051197052, 0.0001597292721271515, 0.00016934238374233246, 0.00017895549535751343, 0.0001885686069726944, 0.00019818171858787537, 0.00020779483020305634, 0.0002174079418182373, 0.00022702105343341827, 0.00023663416504859924, 0.0002462472766637802, 0.0002558603882789612, 0.00026547349989414215, 0.0002750866115093231, 0.0002846997231245041, 0.00029431283473968506, 0.00030392594635486603, 0.000313539057970047, 0.00032315216958522797, 0.00033276528120040894, 0.0003423783928155899, 0.0003519915044307709, 0.00036160461604595184, 0.0003712177276611328]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 7.0, 10.0, 10.0, 12.0, 13.0, 18.0, 34.0, 37.0, 64.0, 91.0, 137.0, 231.0, 485.0, 997.0, 2201.0, 5844.0, 21506.0, 137674.0, 748783.0, 103823.0, 17597.0, 5118.0, 1928.0, 825.0, 430.0, 241.0, 140.0, 97.0, 62.0, 48.0, 28.0, 18.0, 15.0, 8.0, 5.0, 4.0, 5.0, 3.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0517578125, -1.0147705078125, -0.977783203125, -0.9407958984375, -0.90380859375, -0.8668212890625, -0.829833984375, -0.7928466796875, -0.755859375, -0.7188720703125, -0.681884765625, -0.6448974609375, -0.60791015625, -0.5709228515625, -0.533935546875, -0.4969482421875, -0.4599609375, -0.4229736328125, -0.385986328125, -0.3489990234375, -0.31201171875, -0.2750244140625, -0.238037109375, -0.2010498046875, -0.1640625, -0.1270751953125, -0.090087890625, -0.0531005859375, -0.01611328125, 0.0208740234375, 0.057861328125, 0.0948486328125, 0.1318359375, 0.1688232421875, 0.205810546875, 0.2427978515625, 0.27978515625, 0.3167724609375, 0.353759765625, 0.3907470703125, 0.427734375, 0.4647216796875, 0.501708984375, 0.5386962890625, 0.57568359375, 0.6126708984375, 0.649658203125, 0.6866455078125, 0.7236328125, 0.7606201171875, 0.797607421875, 0.8345947265625, 0.87158203125, 0.9085693359375, 0.945556640625, 0.9825439453125, 1.01953125, 1.0565185546875, 1.093505859375, 1.1304931640625, 1.16748046875, 1.2044677734375, 1.241455078125, 1.2784423828125, 1.3154296875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 8.0, 5.0, 6.0, 9.0, 13.0, 10.0, 19.0, 17.0, 17.0, 34.0, 53.0, 64.0, 129.0, 142.0, 140.0, 96.0, 58.0, 37.0, 31.0, 21.0, 12.0, 12.0, 9.0, 18.0, 6.0, 7.0, 5.0, 4.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72216796875, -0.7000808715820312, -0.6779937744140625, -0.6559066772460938, -0.633819580078125, -0.6117324829101562, -0.5896453857421875, -0.5675582885742188, -0.54547119140625, -0.5233840942382812, -0.5012969970703125, -0.47920989990234375, -0.457122802734375, -0.43503570556640625, -0.4129486083984375, -0.39086151123046875, -0.3687744140625, -0.34668731689453125, -0.3246002197265625, -0.30251312255859375, -0.280426025390625, -0.25833892822265625, -0.2362518310546875, -0.21416473388671875, -0.19207763671875, -0.16999053955078125, -0.1479034423828125, -0.12581634521484375, -0.103729248046875, -0.08164215087890625, -0.0595550537109375, -0.03746795654296875, -0.015380859375, 0.00670623779296875, 0.0287933349609375, 0.05088043212890625, 0.072967529296875, 0.09505462646484375, 0.1171417236328125, 0.13922882080078125, 0.16131591796875, 0.18340301513671875, 0.2054901123046875, 0.22757720947265625, 0.249664306640625, 0.27175140380859375, 0.2938385009765625, 0.31592559814453125, 0.3380126953125, 0.36009979248046875, 0.3821868896484375, 0.40427398681640625, 0.426361083984375, 0.44844818115234375, 0.4705352783203125, 0.49262237548828125, 0.51470947265625, 0.5367965698242188, 0.5588836669921875, 0.5809707641601562, 0.603057861328125, 0.6251449584960938, 0.6472320556640625, 0.6693191528320312, 0.69140625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 10.0, 14.0, 13.0, 24.0, 43.0, 62.0, 78.0, 103.0, 132.0, 128.0, 103.0, 93.0, 61.0, 62.0, 27.0, 20.0, 11.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.203218460083008, -12.840780258178711, -12.478341102600098, -12.1159029006958, -11.753463745117188, -11.39102554321289, -11.028586387634277, -10.66614818572998, -10.303709030151367, -9.94127082824707, -9.578831672668457, -9.21639347076416, -8.853954315185547, -8.49151611328125, -8.129076957702637, -7.76663875579834, -7.404200077056885, -7.04176139831543, -6.679322719573975, -6.3168840408325195, -5.9544453620910645, -5.592006683349609, -5.2295684814453125, -4.867129325866699, -4.504691123962402, -4.142252445220947, -3.779813766479492, -3.417375087738037, -3.054936408996582, -2.692497730255127, -2.330059289932251, -1.967620611190796, -1.6051816940307617, -1.2427430152893066, -0.8803043961524963, -0.517865777015686, -0.15542709827423096, 0.20701158046722412, 0.5694501399993896, 0.9318888187408447, 1.2943274974822998, 1.6567661762237549, 2.01920485496521, 2.381643295288086, 2.744081974029541, 3.106520652770996, 3.468959331512451, 3.8313980102539062, 4.193836688995361, 4.556275367736816, 4.9187140464782715, 5.281152725219727, 5.643591403961182, 6.006030082702637, 6.368468284606934, 6.730907440185547, 7.093345642089844, 7.455784320831299, 7.818222999572754, 8.18066120147705, 8.543100357055664, 8.905538558959961, 9.267977714538574, 9.630415916442871, 9.992855072021484]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 4.0, 7.0, 8.0, 7.0, 7.0, 3.0, 8.0, 19.0, 15.0, 11.0, 21.0, 22.0, 29.0, 26.0, 30.0, 38.0, 41.0, 32.0, 32.0, 36.0, 42.0, 36.0, 41.0, 37.0, 43.0, 41.0, 35.0, 23.0, 33.0, 28.0, 19.0, 20.0, 22.0, 28.0, 14.0, 19.0, 21.0, 19.0, 9.0, 8.0, 10.0, 18.0, 5.0, 8.0, 4.0, 7.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-4.347520351409912, -4.207920551300049, -4.068320274353027, -3.928720474243164, -3.7891204357147217, -3.6495203971862793, -3.509920597076416, -3.3703205585479736, -3.2307205200195312, -3.091120481491089, -2.9515204429626465, -2.811920642852783, -2.672320604324341, -2.5327205657958984, -2.393120765686035, -2.2535207271575928, -2.1139206886291504, -1.974320650100708, -1.8347207307815552, -1.6951208114624023, -1.55552077293396, -1.4159207344055176, -1.2763208150863647, -1.136720895767212, -0.9971208572387695, -0.8575208783149719, -0.7179208993911743, -0.5783209204673767, -0.4387209415435791, -0.2991209626197815, -0.1595209836959839, -0.01992100477218628, 0.11967897415161133, 0.25927895307540894, 0.39887893199920654, 0.5384789109230042, 0.6780788898468018, 0.8176788687705994, 0.957278847694397, 1.0968787670135498, 1.2364788055419922, 1.3760788440704346, 1.5156787633895874, 1.6552786827087402, 1.7948787212371826, 1.934478759765625, 2.0740785598754883, 2.2136785984039307, 2.353278636932373, 2.4928786754608154, 2.632478713989258, 2.772078514099121, 2.9116785526275635, 3.051278591156006, 3.190878391265869, 3.3304784297943115, 3.470078468322754, 3.6096785068511963, 3.7492785453796387, 3.888878345489502, 4.028478622436523, 4.168078422546387, 4.30767822265625, 4.4472784996032715, 4.586878299713135]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 2.0, 9.0, 17.0, 11.0, 32.0, 52.0, 69.0, 129.0, 303.0, 655.0, 1513.0, 4136.0, 12567.0, 57021.0, 3677438.0, 393514.0, 32838.0, 8627.0, 3083.0, 1209.0, 530.0, 254.0, 115.0, 77.0, 23.0, 25.0, 15.0, 6.0, 9.0, 4.0, 0.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.482421875, -3.3795166015625, -3.276611328125, -3.1737060546875, -3.07080078125, -2.9678955078125, -2.864990234375, -2.7620849609375, -2.6591796875, -2.5562744140625, -2.453369140625, -2.3504638671875, -2.24755859375, -2.1446533203125, -2.041748046875, -1.9388427734375, -1.8359375, -1.7330322265625, -1.630126953125, -1.5272216796875, -1.42431640625, -1.3214111328125, -1.218505859375, -1.1156005859375, -1.0126953125, -0.9097900390625, -0.806884765625, -0.7039794921875, -0.60107421875, -0.4981689453125, -0.395263671875, -0.2923583984375, -0.189453125, -0.0865478515625, 0.016357421875, 0.1192626953125, 0.22216796875, 0.3250732421875, 0.427978515625, 0.5308837890625, 0.6337890625, 0.7366943359375, 0.839599609375, 0.9425048828125, 1.04541015625, 1.1483154296875, 1.251220703125, 1.3541259765625, 1.45703125, 1.5599365234375, 1.662841796875, 1.7657470703125, 1.86865234375, 1.9715576171875, 2.074462890625, 2.1773681640625, 2.2802734375, 2.3831787109375, 2.486083984375, 2.5889892578125, 2.69189453125, 2.7947998046875, 2.897705078125, 3.0006103515625, 3.103515625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 5.0, 7.0, 9.0, 6.0, 15.0, 13.0, 12.0, 19.0, 23.0, 28.0, 22.0, 36.0, 39.0, 33.0, 47.0, 46.0, 50.0, 52.0, 66.0, 47.0, 40.0, 50.0, 44.0, 34.0, 36.0, 37.0, 29.0, 30.0, 19.0, 25.0, 16.0, 13.0, 14.0, 5.0, 6.0, 6.0, 6.0, 1.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2366943359375, -0.2294139862060547, -0.22213363647460938, -0.21485328674316406, -0.20757293701171875, -0.20029258728027344, -0.19301223754882812, -0.1857318878173828, -0.1784515380859375, -0.1711711883544922, -0.16389083862304688, -0.15661048889160156, -0.14933013916015625, -0.14204978942871094, -0.13476943969726562, -0.1274890899658203, -0.120208740234375, -0.11292839050292969, -0.10564804077148438, -0.09836769104003906, -0.09108734130859375, -0.08380699157714844, -0.07652664184570312, -0.06924629211425781, -0.0619659423828125, -0.05468559265136719, -0.047405242919921875, -0.04012489318847656, -0.03284454345703125, -0.025564193725585938, -0.018283843994140625, -0.011003494262695312, -0.00372314453125, 0.0035572052001953125, 0.010837554931640625, 0.018117904663085938, 0.02539825439453125, 0.03267860412597656, 0.039958953857421875, 0.04723930358886719, 0.0545196533203125, 0.06180000305175781, 0.06908035278320312, 0.07636070251464844, 0.08364105224609375, 0.09092140197753906, 0.09820175170898438, 0.10548210144042969, 0.112762451171875, 0.12004280090332031, 0.12732315063476562, 0.13460350036621094, 0.14188385009765625, 0.14916419982910156, 0.15644454956054688, 0.1637248992919922, 0.1710052490234375, 0.1782855987548828, 0.18556594848632812, 0.19284629821777344, 0.20012664794921875, 0.20740699768066406, 0.21468734741210938, 0.2219676971435547, 0.229248046875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 4.0, 11.0, 9.0, 24.0, 30.0, 44.0, 43.0, 75.0, 97.0, 131.0, 170.0, 286.0, 399.0, 555.0, 908.0, 1503.0, 2577.0, 4764.0, 10419.0, 26170.0, 118661.0, 3708240.0, 254017.0, 38201.0, 13108.0, 5967.0, 3026.0, 1702.0, 1024.0, 661.0, 425.0, 305.0, 204.0, 161.0, 100.0, 76.0, 54.0, 33.0, 33.0, 23.0, 13.0, 14.0, 13.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-3.013671875, -2.92913818359375, -2.8446044921875, -2.76007080078125, -2.675537109375, -2.59100341796875, -2.5064697265625, -2.42193603515625, -2.33740234375, -2.25286865234375, -2.1683349609375, -2.08380126953125, -1.999267578125, -1.91473388671875, -1.8302001953125, -1.74566650390625, -1.6611328125, -1.57659912109375, -1.4920654296875, -1.40753173828125, -1.322998046875, -1.23846435546875, -1.1539306640625, -1.06939697265625, -0.98486328125, -0.90032958984375, -0.8157958984375, -0.73126220703125, -0.646728515625, -0.56219482421875, -0.4776611328125, -0.39312744140625, -0.30859375, -0.22406005859375, -0.1395263671875, -0.05499267578125, 0.029541015625, 0.11407470703125, 0.1986083984375, 0.28314208984375, 0.36767578125, 0.45220947265625, 0.5367431640625, 0.62127685546875, 0.705810546875, 0.79034423828125, 0.8748779296875, 0.95941162109375, 1.0439453125, 1.12847900390625, 1.2130126953125, 1.29754638671875, 1.382080078125, 1.46661376953125, 1.5511474609375, 1.63568115234375, 1.72021484375, 1.80474853515625, 1.8892822265625, 1.97381591796875, 2.058349609375, 2.14288330078125, 2.2274169921875, 2.31195068359375, 2.396484375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 7.0, 4.0, 12.0, 22.0, 15.0, 34.0, 50.0, 121.0, 344.0, 2286.0, 775.0, 172.0, 83.0, 42.0, 31.0, 23.0, 18.0, 4.0, 9.0, 6.0, 3.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1064453125, -1.068023681640625, -1.02960205078125, -0.991180419921875, -0.9527587890625, -0.914337158203125, -0.87591552734375, -0.837493896484375, -0.799072265625, -0.760650634765625, -0.72222900390625, -0.683807373046875, -0.6453857421875, -0.606964111328125, -0.56854248046875, -0.530120849609375, -0.49169921875, -0.453277587890625, -0.41485595703125, -0.376434326171875, -0.3380126953125, -0.299591064453125, -0.26116943359375, -0.222747802734375, -0.184326171875, -0.145904541015625, -0.10748291015625, -0.069061279296875, -0.0306396484375, 0.007781982421875, 0.04620361328125, 0.084625244140625, 0.123046875, 0.161468505859375, 0.19989013671875, 0.238311767578125, 0.2767333984375, 0.315155029296875, 0.35357666015625, 0.391998291015625, 0.430419921875, 0.468841552734375, 0.50726318359375, 0.545684814453125, 0.5841064453125, 0.622528076171875, 0.66094970703125, 0.699371337890625, 0.73779296875, 0.776214599609375, 0.81463623046875, 0.853057861328125, 0.8914794921875, 0.929901123046875, 0.96832275390625, 1.006744384765625, 1.045166015625, 1.083587646484375, 1.12200927734375, 1.160430908203125, 1.1988525390625, 1.237274169921875, 1.27569580078125, 1.314117431640625, 1.3525390625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 7.0, 8.0, 13.0, 27.0, 39.0, 53.0, 61.0, 102.0, 136.0, 135.0, 117.0, 108.0, 66.0, 43.0, 31.0, 18.0, 16.0, 5.0, 5.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.593568801879883, -8.387064933776855, -8.180561065673828, -7.974057197570801, -7.767553806304932, -7.561049938201904, -7.354546070098877, -7.14804220199585, -6.941538333892822, -6.735034465789795, -6.528530597686768, -6.322027206420898, -6.115523338317871, -5.909019470214844, -5.702515602111816, -5.496011734008789, -5.289507865905762, -5.083003997802734, -4.876500129699707, -4.66999626159668, -4.4634928703308105, -4.256989002227783, -4.050485134124756, -3.8439812660217285, -3.6374778747558594, -3.430974006652832, -3.224470376968384, -3.0179665088653564, -2.811462640762329, -2.604959011077881, -2.3984551429748535, -2.191951274871826, -1.9854474067687988, -1.778943657875061, -1.5724397897720337, -1.365936040878296, -1.1594321727752686, -0.9529284238815308, -0.746424674987793, -0.5399208068847656, -0.33341705799102783, -0.12691326439380646, 0.07959052920341492, 0.2860943078994751, 0.49259811639785767, 0.6991019248962402, 0.905605673789978, 1.1121095418930054, 1.3186132907867432, 1.525117039680481, 1.7316209077835083, 1.938124656677246, 2.1446285247802734, 2.351132392883301, 2.557636022567749, 2.7641398906707764, 2.9706435203552246, 3.177147388458252, 3.3836510181427, 3.5901548862457275, 3.796658754348755, 4.003162384033203, 4.2096662521362305, 4.416170120239258, 4.622673988342285]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 8.0, 8.0, 17.0, 22.0, 19.0, 30.0, 34.0, 32.0, 47.0, 32.0, 42.0, 39.0, 38.0, 37.0, 40.0, 40.0, 56.0, 47.0, 36.0, 40.0, 38.0, 31.0, 30.0, 27.0, 35.0, 20.0, 26.0, 27.0, 19.0, 15.0, 14.0, 11.0, 10.0, 12.0, 2.0, 1.0, 5.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.7790279388427734, -2.690699338912964, -2.6023707389831543, -2.5140419006347656, -2.425713300704956, -2.3373847007751465, -2.249056100845337, -2.1607275009155273, -2.0723986625671387, -1.984070062637329, -1.89574134349823, -1.8074127435684204, -1.7190840244293213, -1.6307554244995117, -1.5424268245697021, -1.4540982246398926, -1.365769624710083, -1.2774410247802734, -1.1891123056411743, -1.1007837057113647, -1.0124549865722656, -0.924126386642456, -0.8357977867126465, -0.7474691271781921, -0.6591404676437378, -0.5708118081092834, -0.4824831783771515, -0.39415454864501953, -0.3058258891105652, -0.21749722957611084, -0.12916862964630127, -0.040839970111846924, 0.04748892784118652, 0.13581757247447968, 0.22414621710777283, 0.3124748468399048, 0.40080350637435913, 0.4891321659088135, 0.577460765838623, 0.6657894253730774, 0.7541180849075317, 0.8424467444419861, 0.9307754039764404, 1.01910400390625, 1.1074326038360596, 1.1957613229751587, 1.2840899229049683, 1.3724186420440674, 1.460747241973877, 1.5490758419036865, 1.6374045610427856, 1.7257331609725952, 1.8140618801116943, 1.902390480041504, 1.9907190799713135, 2.079047679901123, 2.1673765182495117, 2.2557051181793213, 2.344033718109131, 2.4323625564575195, 2.520691156387329, 2.6090197563171387, 2.6973483562469482, 2.785676956176758, 2.8740055561065674]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 6.0, 4.0, 7.0, 4.0, 13.0, 10.0, 13.0, 28.0, 35.0, 57.0, 81.0, 80.0, 168.0, 240.0, 345.0, 588.0, 967.0, 1796.0, 3108.0, 5421.0, 10012.0, 18774.0, 38241.0, 106435.0, 569413.0, 190702.0, 50631.0, 23645.0, 12167.0, 6576.0, 3744.0, 2038.0, 1209.0, 725.0, 450.0, 261.0, 176.0, 113.0, 86.0, 51.0, 40.0, 26.0, 21.0, 16.0, 8.0, 8.0, 6.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.4619140625, -1.4171600341796875, -1.372406005859375, -1.3276519775390625, -1.28289794921875, -1.2381439208984375, -1.193389892578125, -1.1486358642578125, -1.1038818359375, -1.0591278076171875, -1.014373779296875, -0.9696197509765625, -0.92486572265625, -0.8801116943359375, -0.835357666015625, -0.7906036376953125, -0.745849609375, -0.7010955810546875, -0.656341552734375, -0.6115875244140625, -0.56683349609375, -0.5220794677734375, -0.477325439453125, -0.4325714111328125, -0.3878173828125, -0.3430633544921875, -0.298309326171875, -0.2535552978515625, -0.20880126953125, -0.1640472412109375, -0.119293212890625, -0.0745391845703125, -0.02978515625, 0.0149688720703125, 0.059722900390625, 0.1044769287109375, 0.14923095703125, 0.1939849853515625, 0.238739013671875, 0.2834930419921875, 0.3282470703125, 0.3730010986328125, 0.417755126953125, 0.4625091552734375, 0.50726318359375, 0.5520172119140625, 0.596771240234375, 0.6415252685546875, 0.686279296875, 0.7310333251953125, 0.775787353515625, 0.8205413818359375, 0.86529541015625, 0.9100494384765625, 0.954803466796875, 0.9995574951171875, 1.0443115234375, 1.0890655517578125, 1.133819580078125, 1.1785736083984375, 1.22332763671875, 1.2680816650390625, 1.312835693359375, 1.3575897216796875, 1.40234375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 7.0, 4.0, 10.0, 7.0, 18.0, 18.0, 20.0, 22.0, 28.0, 28.0, 30.0, 43.0, 55.0, 51.0, 46.0, 53.0, 49.0, 54.0, 43.0, 52.0, 54.0, 42.0, 39.0, 34.0, 27.0, 22.0, 31.0, 25.0, 13.0, 16.0, 11.0, 13.0, 6.0, 6.0, 8.0, 6.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.257568359375, -0.24929428100585938, -0.24102020263671875, -0.23274612426757812, -0.2244720458984375, -0.21619796752929688, -0.20792388916015625, -0.19964981079101562, -0.191375732421875, -0.18310165405273438, -0.17482757568359375, -0.16655349731445312, -0.1582794189453125, -0.15000534057617188, -0.14173126220703125, -0.13345718383789062, -0.12518310546875, -0.11690902709960938, -0.10863494873046875, -0.10036087036132812, -0.0920867919921875, -0.08381271362304688, -0.07553863525390625, -0.06726455688476562, -0.058990478515625, -0.050716400146484375, -0.04244232177734375, -0.034168243408203125, -0.0258941650390625, -0.017620086669921875, -0.00934600830078125, -0.001071929931640625, 0.0072021484375, 0.015476226806640625, 0.02375030517578125, 0.032024383544921875, 0.0402984619140625, 0.048572540283203125, 0.05684661865234375, 0.06512069702148438, 0.073394775390625, 0.08166885375976562, 0.08994293212890625, 0.09821701049804688, 0.1064910888671875, 0.11476516723632812, 0.12303924560546875, 0.13131332397460938, 0.13958740234375, 0.14786148071289062, 0.15613555908203125, 0.16440963745117188, 0.1726837158203125, 0.18095779418945312, 0.18923187255859375, 0.19750595092773438, 0.205780029296875, 0.21405410766601562, 0.22232818603515625, 0.23060226440429688, 0.2388763427734375, 0.24715042114257812, 0.25542449951171875, 0.2636985778808594, 0.27197265625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 6.0, 9.0, 9.0, 12.0, 24.0, 35.0, 48.0, 135.0, 179.0, 305.0, 618.0, 1201.0, 2345.0, 5549.0, 13063.0, 35372.0, 159297.0, 726938.0, 65792.0, 21803.0, 8542.0, 3720.0, 1689.0, 827.0, 417.0, 249.0, 129.0, 77.0, 51.0, 29.0, 28.0, 13.0, 17.0, 7.0, 8.0, 6.0, 4.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.78125, -2.704559326171875, -2.62786865234375, -2.551177978515625, -2.4744873046875, -2.397796630859375, -2.32110595703125, -2.244415283203125, -2.167724609375, -2.091033935546875, -2.01434326171875, -1.937652587890625, -1.8609619140625, -1.784271240234375, -1.70758056640625, -1.630889892578125, -1.55419921875, -1.477508544921875, -1.40081787109375, -1.324127197265625, -1.2474365234375, -1.170745849609375, -1.09405517578125, -1.017364501953125, -0.940673828125, -0.863983154296875, -0.78729248046875, -0.710601806640625, -0.6339111328125, -0.557220458984375, -0.48052978515625, -0.403839111328125, -0.3271484375, -0.250457763671875, -0.17376708984375, -0.097076416015625, -0.0203857421875, 0.056304931640625, 0.13299560546875, 0.209686279296875, 0.286376953125, 0.363067626953125, 0.43975830078125, 0.516448974609375, 0.5931396484375, 0.669830322265625, 0.74652099609375, 0.823211669921875, 0.89990234375, 0.976593017578125, 1.05328369140625, 1.129974365234375, 1.2066650390625, 1.283355712890625, 1.36004638671875, 1.436737060546875, 1.513427734375, 1.590118408203125, 1.66680908203125, 1.743499755859375, 1.8201904296875, 1.896881103515625, 1.97357177734375, 2.050262451171875, 2.126953125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 4.0, 8.0, 6.0, 5.0, 6.0, 9.0, 14.0, 11.0, 21.0, 21.0, 31.0, 34.0, 37.0, 46.0, 41.0, 50.0, 65.0, 60.0, 65.0, 64.0, 56.0, 49.0, 49.0, 43.0, 37.0, 35.0, 30.0, 29.0, 21.0, 25.0, 8.0, 9.0, 7.0, 5.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3349609375, -1.29290771484375, -1.2508544921875, -1.20880126953125, -1.166748046875, -1.12469482421875, -1.0826416015625, -1.04058837890625, -0.99853515625, -0.95648193359375, -0.9144287109375, -0.87237548828125, -0.830322265625, -0.78826904296875, -0.7462158203125, -0.70416259765625, -0.662109375, -0.62005615234375, -0.5780029296875, -0.53594970703125, -0.493896484375, -0.45184326171875, -0.4097900390625, -0.36773681640625, -0.32568359375, -0.28363037109375, -0.2415771484375, -0.19952392578125, -0.157470703125, -0.11541748046875, -0.0733642578125, -0.03131103515625, 0.0107421875, 0.05279541015625, 0.0948486328125, 0.13690185546875, 0.178955078125, 0.22100830078125, 0.2630615234375, 0.30511474609375, 0.34716796875, 0.38922119140625, 0.4312744140625, 0.47332763671875, 0.515380859375, 0.55743408203125, 0.5994873046875, 0.64154052734375, 0.68359375, 0.72564697265625, 0.7677001953125, 0.80975341796875, 0.851806640625, 0.89385986328125, 0.9359130859375, 0.97796630859375, 1.02001953125, 1.06207275390625, 1.1041259765625, 1.14617919921875, 1.188232421875, 1.23028564453125, 1.2723388671875, 1.31439208984375, 1.3564453125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 7.0, 7.0, 4.0, 9.0, 13.0, 23.0, 45.0, 48.0, 69.0, 103.0, 169.0, 249.0, 511.0, 876.0, 1733.0, 3825.0, 8405.0, 21991.0, 75382.0, 636692.0, 231639.0, 41330.0, 13994.0, 5766.0, 2701.0, 1283.0, 674.0, 369.0, 240.0, 141.0, 71.0, 44.0, 46.0, 26.0, 26.0, 14.0, 9.0, 8.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0791015625, -1.0480728149414062, -1.0170440673828125, -0.9860153198242188, -0.954986572265625, -0.9239578247070312, -0.8929290771484375, -0.8619003295898438, -0.83087158203125, -0.7998428344726562, -0.7688140869140625, -0.7377853393554688, -0.706756591796875, -0.6757278442382812, -0.6446990966796875, -0.6136703491210938, -0.5826416015625, -0.5516128540039062, -0.5205841064453125, -0.48955535888671875, -0.458526611328125, -0.42749786376953125, -0.3964691162109375, -0.36544036865234375, -0.33441162109375, -0.30338287353515625, -0.2723541259765625, -0.24132537841796875, -0.210296630859375, -0.17926788330078125, -0.1482391357421875, -0.11721038818359375, -0.086181640625, -0.05515289306640625, -0.0241241455078125, 0.00690460205078125, 0.037933349609375, 0.06896209716796875, 0.0999908447265625, 0.13101959228515625, 0.16204833984375, 0.19307708740234375, 0.2241058349609375, 0.25513458251953125, 0.286163330078125, 0.31719207763671875, 0.3482208251953125, 0.37924957275390625, 0.4102783203125, 0.44130706787109375, 0.4723358154296875, 0.5033645629882812, 0.534393310546875, 0.5654220581054688, 0.5964508056640625, 0.6274795532226562, 0.65850830078125, 0.6895370483398438, 0.7205657958984375, 0.7515945434570312, 0.782623291015625, 0.8136520385742188, 0.8446807861328125, 0.8757095336914062, 0.90673828125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 5.0, 4.0, 2.0, 3.0, 2.0, 7.0, 10.0, 11.0, 7.0, 10.0, 15.0, 20.0, 37.0, 76.0, 155.0, 267.0, 182.0, 79.0, 25.0, 24.0, 17.0, 9.0, 5.0, 7.0, 6.0, 7.0, 2.0, 2.0, 4.0, 1.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00029754638671875, -0.00028748810291290283, -0.00027742981910705566, -0.0002673715353012085, -0.00025731325149536133, -0.00024725496768951416, -0.000237196683883667, -0.00022713840007781982, -0.00021708011627197266, -0.0002070218324661255, -0.00019696354866027832, -0.00018690526485443115, -0.00017684698104858398, -0.00016678869724273682, -0.00015673041343688965, -0.00014667212963104248, -0.0001366138458251953, -0.00012655556201934814, -0.00011649727821350098, -0.00010643899440765381, -9.638071060180664e-05, -8.632242679595947e-05, -7.62641429901123e-05, -6.620585918426514e-05, -5.614757537841797e-05, -4.60892915725708e-05, -3.603100776672363e-05, -2.5972723960876465e-05, -1.5914440155029297e-05, -5.856156349182129e-06, 4.202127456665039e-06, 1.4260411262512207e-05, 2.4318695068359375e-05, 3.437697887420654e-05, 4.443526268005371e-05, 5.449354648590088e-05, 6.455183029174805e-05, 7.461011409759521e-05, 8.466839790344238e-05, 9.472668170928955e-05, 0.00010478496551513672, 0.00011484324932098389, 0.00012490153312683105, 0.00013495981693267822, 0.0001450181007385254, 0.00015507638454437256, 0.00016513466835021973, 0.0001751929521560669, 0.00018525123596191406, 0.00019530951976776123, 0.0002053678035736084, 0.00021542608737945557, 0.00022548437118530273, 0.0002355426549911499, 0.00024560093879699707, 0.00025565922260284424, 0.0002657175064086914, 0.0002757757902145386, 0.00028583407402038574, 0.0002958923578262329, 0.0003059506416320801, 0.00031600892543792725, 0.0003260672092437744, 0.0003361254930496216, 0.00034618377685546875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 6.0, 8.0, 6.0, 11.0, 19.0, 36.0, 47.0, 43.0, 94.0, 122.0, 168.0, 249.0, 406.0, 613.0, 1063.0, 1954.0, 3995.0, 8610.0, 23183.0, 93459.0, 688008.0, 171318.0, 33176.0, 11055.0, 5055.0, 2477.0, 1295.0, 741.0, 452.0, 293.0, 200.0, 117.0, 83.0, 48.0, 46.0, 34.0, 23.0, 11.0, 13.0, 5.0, 3.0, 6.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.0439453125, -1.0138168334960938, -0.9836883544921875, -0.9535598754882812, -0.923431396484375, -0.8933029174804688, -0.8631744384765625, -0.8330459594726562, -0.80291748046875, -0.7727890014648438, -0.7426605224609375, -0.7125320434570312, -0.682403564453125, -0.6522750854492188, -0.6221466064453125, -0.5920181274414062, -0.5618896484375, -0.5317611694335938, -0.5016326904296875, -0.47150421142578125, -0.441375732421875, -0.41124725341796875, -0.3811187744140625, -0.35099029541015625, -0.32086181640625, -0.29073333740234375, -0.2606048583984375, -0.23047637939453125, -0.200347900390625, -0.17021942138671875, -0.1400909423828125, -0.10996246337890625, -0.079833984375, -0.04970550537109375, -0.0195770263671875, 0.01055145263671875, 0.040679931640625, 0.07080841064453125, 0.1009368896484375, 0.13106536865234375, 0.16119384765625, 0.19132232666015625, 0.2214508056640625, 0.25157928466796875, 0.281707763671875, 0.31183624267578125, 0.3419647216796875, 0.37209320068359375, 0.4022216796875, 0.43235015869140625, 0.4624786376953125, 0.49260711669921875, 0.522735595703125, 0.5528640747070312, 0.5829925537109375, 0.6131210327148438, 0.64324951171875, 0.6733779907226562, 0.7035064697265625, 0.7336349487304688, 0.763763427734375, 0.7938919067382812, 0.8240203857421875, 0.8541488647460938, 0.88427734375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 3.0, 4.0, 4.0, 5.0, 6.0, 7.0, 13.0, 18.0, 19.0, 30.0, 41.0, 74.0, 124.0, 174.0, 177.0, 110.0, 60.0, 44.0, 21.0, 9.0, 16.0, 10.0, 4.0, 13.0, 7.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68017578125, -0.6517257690429688, -0.6232757568359375, -0.5948257446289062, -0.566375732421875, -0.5379257202148438, -0.5094757080078125, -0.48102569580078125, -0.45257568359375, -0.42412567138671875, -0.3956756591796875, -0.36722564697265625, -0.338775634765625, -0.31032562255859375, -0.2818756103515625, -0.25342559814453125, -0.2249755859375, -0.19652557373046875, -0.1680755615234375, -0.13962554931640625, -0.111175537109375, -0.08272552490234375, -0.0542755126953125, -0.02582550048828125, 0.00262451171875, 0.03107452392578125, 0.0595245361328125, 0.08797454833984375, 0.116424560546875, 0.14487457275390625, 0.1733245849609375, 0.20177459716796875, 0.230224609375, 0.25867462158203125, 0.2871246337890625, 0.31557464599609375, 0.344024658203125, 0.37247467041015625, 0.4009246826171875, 0.42937469482421875, 0.45782470703125, 0.48627471923828125, 0.5147247314453125, 0.5431747436523438, 0.571624755859375, 0.6000747680664062, 0.6285247802734375, 0.6569747924804688, 0.6854248046875, 0.7138748168945312, 0.7423248291015625, 0.7707748413085938, 0.799224853515625, 0.8276748657226562, 0.8561248779296875, 0.8845748901367188, 0.91302490234375, 0.9414749145507812, 0.9699249267578125, 0.9983749389648438, 1.026824951171875, 1.0552749633789062, 1.0837249755859375, 1.1121749877929688, 1.140625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 11.0, 14.0, 30.0, 55.0, 110.0, 187.0, 221.0, 199.0, 111.0, 37.0, 23.0, 10.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.11473083496094, -36.395233154296875, -35.67573547363281, -34.95623779296875, -34.23674011230469, -33.517242431640625, -32.79774475097656, -32.0782470703125, -31.358749389648438, -30.639251708984375, -29.919754028320312, -29.20025634765625, -28.480758666992188, -27.761260986328125, -27.041763305664062, -26.322265625, -25.602766036987305, -24.883268356323242, -24.16377067565918, -23.444272994995117, -22.724775314331055, -22.005277633666992, -21.285778045654297, -20.566280364990234, -19.846782684326172, -19.12728500366211, -18.407787322998047, -17.688289642333984, -16.968791961669922, -16.24929428100586, -15.52979564666748, -14.810297966003418, -14.090799331665039, -13.371301651000977, -12.651803970336914, -11.932306289672852, -11.212808609008789, -10.493310928344727, -9.773812294006348, -9.054314613342285, -8.334816932678223, -7.61531925201416, -6.895821571350098, -6.176323413848877, -5.4568257331848145, -4.737328052520752, -4.017829895019531, -3.2983322143554688, -2.5788345336914062, -1.8593367338180542, -1.1398389339447021, -0.42034101486206055, 0.29915666580200195, 1.0186543464660645, 1.7381525039672852, 2.4576501846313477, 3.17714786529541, 3.8966455459594727, 4.616143226623535, 5.335641384124756, 6.055139064788818, 6.774636745452881, 7.494134902954102, 8.213632583618164, 8.933130264282227]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 3.0, 3.0, 6.0, 9.0, 13.0, 13.0, 15.0, 18.0, 8.0, 21.0, 23.0, 20.0, 34.0, 24.0, 36.0, 28.0, 35.0, 40.0, 30.0, 41.0, 39.0, 48.0, 36.0, 33.0, 37.0, 32.0, 39.0, 26.0, 40.0, 19.0, 26.0, 25.0, 27.0, 24.0, 20.0, 9.0, 17.0, 9.0, 13.0, 13.0, 9.0, 8.0, 14.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0], "bins": [-4.48682975769043, -4.355088233947754, -4.223346710205078, -4.091605186462402, -3.9598639011383057, -3.82812237739563, -3.696380853652954, -3.5646393299102783, -3.4328980445861816, -3.301156520843506, -3.16941499710083, -3.0376734733581543, -2.9059321880340576, -2.774190664291382, -2.642449140548706, -2.5107076168060303, -2.3789660930633545, -2.2472245693206787, -2.115483045578003, -1.9837416410446167, -1.8520002365112305, -1.7202587127685547, -1.588517189025879, -1.4567756652832031, -1.325034260749817, -1.1932927370071411, -1.0615513324737549, -0.9298098087310791, -0.7980683445930481, -0.6663268804550171, -0.5345853567123413, -0.4028438925743103, -0.2711021900177002, -0.139360710978508, -0.007619231939315796, 0.1241222620010376, 0.2558637261390686, 0.3876051902770996, 0.5193467140197754, 0.6510881781578064, 0.7828296422958374, 0.9145711064338684, 1.0463125705718994, 1.1780540943145752, 1.309795618057251, 1.4415370225906372, 1.573278546333313, 1.7050199508666992, 1.836761474609375, 1.9685029983520508, 2.1002445220947266, 2.2319860458374023, 2.363727331161499, 2.495468854904175, 2.6272103786468506, 2.7589519023895264, 2.890693187713623, 3.022434711456299, 3.1541762351989746, 3.2859177589416504, 3.417659044265747, 3.549400568008423, 3.6811420917510986, 3.8128836154937744, 3.94462513923645]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 6.0, 3.0, 7.0, 7.0, 4.0, 13.0, 16.0, 7.0, 17.0, 26.0, 38.0, 68.0, 90.0, 105.0, 188.0, 351.0, 584.0, 979.0, 1864.0, 3675.0, 8293.0, 22644.0, 83709.0, 3618210.0, 378867.0, 46407.0, 15226.0, 6239.0, 2909.0, 1495.0, 829.0, 525.0, 282.0, 184.0, 144.0, 72.0, 51.0, 42.0, 31.0, 23.0, 15.0, 12.0, 8.0, 8.0, 4.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.07421875, -2.977569580078125, -2.88092041015625, -2.784271240234375, -2.6876220703125, -2.590972900390625, -2.49432373046875, -2.397674560546875, -2.301025390625, -2.204376220703125, -2.10772705078125, -2.011077880859375, -1.9144287109375, -1.817779541015625, -1.72113037109375, -1.624481201171875, -1.52783203125, -1.431182861328125, -1.33453369140625, -1.237884521484375, -1.1412353515625, -1.044586181640625, -0.94793701171875, -0.851287841796875, -0.754638671875, -0.657989501953125, -0.56134033203125, -0.464691162109375, -0.3680419921875, -0.271392822265625, -0.17474365234375, -0.078094482421875, 0.0185546875, 0.115203857421875, 0.21185302734375, 0.308502197265625, 0.4051513671875, 0.501800537109375, 0.59844970703125, 0.695098876953125, 0.791748046875, 0.888397216796875, 0.98504638671875, 1.081695556640625, 1.1783447265625, 1.274993896484375, 1.37164306640625, 1.468292236328125, 1.56494140625, 1.661590576171875, 1.75823974609375, 1.854888916015625, 1.9515380859375, 2.048187255859375, 2.14483642578125, 2.241485595703125, 2.338134765625, 2.434783935546875, 2.53143310546875, 2.628082275390625, 2.7247314453125, 2.821380615234375, 2.91802978515625, 3.014678955078125, 3.111328125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 9.0, 4.0, 5.0, 12.0, 12.0, 22.0, 27.0, 25.0, 30.0, 36.0, 37.0, 60.0, 51.0, 41.0, 65.0, 40.0, 76.0, 51.0, 55.0, 53.0, 45.0, 43.0, 43.0, 35.0, 24.0, 24.0, 18.0, 11.0, 16.0, 8.0, 9.0, 8.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2529296875, -0.2436065673828125, -0.234283447265625, -0.2249603271484375, -0.21563720703125, -0.2063140869140625, -0.196990966796875, -0.1876678466796875, -0.1783447265625, -0.1690216064453125, -0.159698486328125, -0.1503753662109375, -0.14105224609375, -0.1317291259765625, -0.122406005859375, -0.1130828857421875, -0.103759765625, -0.0944366455078125, -0.085113525390625, -0.0757904052734375, -0.06646728515625, -0.0571441650390625, -0.047821044921875, -0.0384979248046875, -0.0291748046875, -0.0198516845703125, -0.010528564453125, -0.0012054443359375, 0.00811767578125, 0.0174407958984375, 0.026763916015625, 0.0360870361328125, 0.04541015625, 0.0547332763671875, 0.064056396484375, 0.0733795166015625, 0.08270263671875, 0.0920257568359375, 0.101348876953125, 0.1106719970703125, 0.1199951171875, 0.1293182373046875, 0.138641357421875, 0.1479644775390625, 0.15728759765625, 0.1666107177734375, 0.175933837890625, 0.1852569580078125, 0.194580078125, 0.2039031982421875, 0.213226318359375, 0.2225494384765625, 0.23187255859375, 0.2411956787109375, 0.250518798828125, 0.2598419189453125, 0.2691650390625, 0.2784881591796875, 0.287811279296875, 0.2971343994140625, 0.30645751953125, 0.3157806396484375, 0.325103759765625, 0.3344268798828125, 0.34375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 5.0, 19.0, 13.0, 20.0, 21.0, 46.0, 50.0, 78.0, 112.0, 195.0, 267.0, 493.0, 909.0, 2100.0, 8959.0, 155794.0, 3994952.0, 23649.0, 3809.0, 1205.0, 546.0, 351.0, 216.0, 136.0, 110.0, 68.0, 46.0, 33.0, 27.0, 17.0, 13.0, 9.0, 3.0, 7.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.28125, -9.9893798828125, -9.697509765625, -9.4056396484375, -9.11376953125, -8.8218994140625, -8.530029296875, -8.2381591796875, -7.9462890625, -7.6544189453125, -7.362548828125, -7.0706787109375, -6.77880859375, -6.4869384765625, -6.195068359375, -5.9031982421875, -5.611328125, -5.3194580078125, -5.027587890625, -4.7357177734375, -4.44384765625, -4.1519775390625, -3.860107421875, -3.5682373046875, -3.2763671875, -2.9844970703125, -2.692626953125, -2.4007568359375, -2.10888671875, -1.8170166015625, -1.525146484375, -1.2332763671875, -0.94140625, -0.6495361328125, -0.357666015625, -0.0657958984375, 0.22607421875, 0.5179443359375, 0.809814453125, 1.1016845703125, 1.3935546875, 1.6854248046875, 1.977294921875, 2.2691650390625, 2.56103515625, 2.8529052734375, 3.144775390625, 3.4366455078125, 3.728515625, 4.0203857421875, 4.312255859375, 4.6041259765625, 4.89599609375, 5.1878662109375, 5.479736328125, 5.7716064453125, 6.0634765625, 6.3553466796875, 6.647216796875, 6.9390869140625, 7.23095703125, 7.5228271484375, 7.814697265625, 8.1065673828125, 8.3984375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 8.0, 20.0, 41.0, 129.0, 2118.0, 1575.0, 118.0, 31.0, 21.0, 11.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0390625, -2.934234619140625, -2.82940673828125, -2.724578857421875, -2.6197509765625, -2.514923095703125, -2.41009521484375, -2.305267333984375, -2.200439453125, -2.095611572265625, -1.99078369140625, -1.885955810546875, -1.7811279296875, -1.676300048828125, -1.57147216796875, -1.466644287109375, -1.36181640625, -1.256988525390625, -1.15216064453125, -1.047332763671875, -0.9425048828125, -0.837677001953125, -0.73284912109375, -0.628021240234375, -0.523193359375, -0.418365478515625, -0.31353759765625, -0.208709716796875, -0.1038818359375, 0.000946044921875, 0.10577392578125, 0.210601806640625, 0.3154296875, 0.420257568359375, 0.52508544921875, 0.629913330078125, 0.7347412109375, 0.839569091796875, 0.94439697265625, 1.049224853515625, 1.154052734375, 1.258880615234375, 1.36370849609375, 1.468536376953125, 1.5733642578125, 1.678192138671875, 1.78302001953125, 1.887847900390625, 1.99267578125, 2.097503662109375, 2.20233154296875, 2.307159423828125, 2.4119873046875, 2.516815185546875, 2.62164306640625, 2.726470947265625, 2.831298828125, 2.936126708984375, 3.04095458984375, 3.145782470703125, 3.2506103515625, 3.355438232421875, 3.46026611328125, 3.565093994140625, 3.669921875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 10.0, 12.0, 19.0, 35.0, 25.0, 66.0, 81.0, 111.0, 129.0, 147.0, 110.0, 86.0, 61.0, 41.0, 21.0, 12.0, 13.0, 7.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.782405853271484, -13.469378471374512, -13.156351089477539, -12.84332275390625, -12.530295372009277, -12.217267990112305, -11.904240608215332, -11.59121322631836, -11.27818489074707, -10.965157508850098, -10.652130126953125, -10.339101791381836, -10.026074409484863, -9.71304702758789, -9.400019645690918, -9.086992263793945, -8.773964881896973, -8.4609375, -8.147910118103027, -7.8348822593688965, -7.521854400634766, -7.208827018737793, -6.89579963684082, -6.582772254943848, -6.269744396209717, -5.956717014312744, -5.643689155578613, -5.330661773681641, -5.017634391784668, -4.704606533050537, -4.3915791511535645, -4.078551292419434, -3.765523910522461, -3.452496290206909, -3.1394686698913574, -2.8264412879943848, -2.513413667678833, -2.2003860473632812, -1.887358546257019, -1.5743310451507568, -1.261303424835205, -0.9482758641242981, -0.6352483034133911, -0.32222074270248413, -0.009193181991577148, 0.3038344383239746, 0.6168619394302368, 0.929889440536499, 1.2429170608520508, 1.5559446811676025, 1.8689721822738647, 2.181999683380127, 2.4950273036956787, 2.8080549240112305, 3.121082305908203, 3.434109926223755, 3.7471375465393066, 4.060164928436279, 4.37319278717041, 4.686220169067383, 4.9992475509643555, 5.312275409698486, 5.625302791595459, 5.93833065032959, 6.2513580322265625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 4.0, 9.0, 7.0, 11.0, 9.0, 8.0, 10.0, 14.0, 14.0, 16.0, 17.0, 27.0, 24.0, 30.0, 31.0, 42.0, 37.0, 38.0, 43.0, 45.0, 50.0, 37.0, 44.0, 39.0, 48.0, 48.0, 41.0, 35.0, 32.0, 29.0, 18.0, 22.0, 24.0, 9.0, 17.0, 14.0, 14.0, 10.0, 7.0, 14.0, 4.0, 9.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.6984429359436035, -4.552917957305908, -4.407392978668213, -4.261868000030518, -4.1163434982299805, -3.970818281173706, -3.82529354095459, -3.6797685623168945, -3.534243583679199, -3.388718605041504, -3.2431936264038086, -3.0976688861846924, -2.952143907546997, -2.8066189289093018, -2.6610941886901855, -2.5155692100524902, -2.370044231414795, -2.2245192527770996, -2.0789942741394043, -1.933469533920288, -1.7879445552825928, -1.6424195766448975, -1.4968947172164917, -1.351369857788086, -1.2058448791503906, -1.0603199005126953, -0.9147950410842896, -0.769270122051239, -0.6237452030181885, -0.47822028398513794, -0.3326953649520874, -0.18717050552368164, -0.04164552688598633, 0.10387939214706421, 0.24940431118011475, 0.3949292302131653, 0.5404541492462158, 0.6859790682792664, 0.8315039873123169, 0.9770288467407227, 1.122553825378418, 1.2680788040161133, 1.413603663444519, 1.5591285228729248, 1.7046535015106201, 1.8501784801483154, 1.9957033395767212, 2.141228199005127, 2.2867531776428223, 2.4322781562805176, 2.577803134918213, 2.723327875137329, 2.8688528537750244, 3.0143778324127197, 3.159902572631836, 3.3054275512695312, 3.4509525299072266, 3.596477508544922, 3.742002487182617, 3.8875272274017334, 4.033052444458008, 4.178576946258545, 4.32410192489624, 4.4696269035339355, 4.615151882171631]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 0.0, 3.0, 3.0, 8.0, 3.0, 14.0, 13.0, 29.0, 35.0, 49.0, 74.0, 109.0, 154.0, 226.0, 329.0, 536.0, 943.0, 1549.0, 2749.0, 4634.0, 8452.0, 15681.0, 30055.0, 59021.0, 122496.0, 322834.0, 264410.0, 105240.0, 51439.0, 26147.0, 13618.0, 7600.0, 4022.0, 2383.0, 1434.0, 753.0, 544.0, 338.0, 206.0, 165.0, 89.0, 57.0, 25.0, 34.0, 16.0, 11.0, 13.0, 4.0, 2.0, 3.0, 1.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.5830078125, -1.528228759765625, -1.47344970703125, -1.418670654296875, -1.3638916015625, -1.309112548828125, -1.25433349609375, -1.199554443359375, -1.144775390625, -1.089996337890625, -1.03521728515625, -0.980438232421875, -0.9256591796875, -0.870880126953125, -0.81610107421875, -0.761322021484375, -0.70654296875, -0.651763916015625, -0.59698486328125, -0.542205810546875, -0.4874267578125, -0.432647705078125, -0.37786865234375, -0.323089599609375, -0.268310546875, -0.213531494140625, -0.15875244140625, -0.103973388671875, -0.0491943359375, 0.005584716796875, 0.06036376953125, 0.115142822265625, 0.169921875, 0.224700927734375, 0.27947998046875, 0.334259033203125, 0.3890380859375, 0.443817138671875, 0.49859619140625, 0.553375244140625, 0.608154296875, 0.662933349609375, 0.71771240234375, 0.772491455078125, 0.8272705078125, 0.882049560546875, 0.93682861328125, 0.991607666015625, 1.04638671875, 1.101165771484375, 1.15594482421875, 1.210723876953125, 1.2655029296875, 1.320281982421875, 1.37506103515625, 1.429840087890625, 1.484619140625, 1.539398193359375, 1.59417724609375, 1.648956298828125, 1.7037353515625, 1.758514404296875, 1.81329345703125, 1.868072509765625, 1.9228515625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 5.0, 4.0, 11.0, 10.0, 11.0, 15.0, 12.0, 17.0, 17.0, 16.0, 27.0, 23.0, 29.0, 40.0, 50.0, 43.0, 37.0, 34.0, 47.0, 48.0, 41.0, 45.0, 35.0, 31.0, 36.0, 27.0, 29.0, 31.0, 35.0, 31.0, 23.0, 21.0, 20.0, 19.0, 13.0, 9.0, 10.0, 14.0, 9.0, 2.0, 2.0, 6.0, 6.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.348388671875, -0.33795166015625, -0.3275146484375, -0.31707763671875, -0.306640625, -0.29620361328125, -0.2857666015625, -0.27532958984375, -0.264892578125, -0.25445556640625, -0.2440185546875, -0.23358154296875, -0.22314453125, -0.21270751953125, -0.2022705078125, -0.19183349609375, -0.181396484375, -0.17095947265625, -0.1605224609375, -0.15008544921875, -0.1396484375, -0.12921142578125, -0.1187744140625, -0.10833740234375, -0.097900390625, -0.08746337890625, -0.0770263671875, -0.06658935546875, -0.05615234375, -0.04571533203125, -0.0352783203125, -0.02484130859375, -0.014404296875, -0.00396728515625, 0.0064697265625, 0.01690673828125, 0.02734375, 0.03778076171875, 0.0482177734375, 0.05865478515625, 0.069091796875, 0.07952880859375, 0.0899658203125, 0.10040283203125, 0.11083984375, 0.12127685546875, 0.1317138671875, 0.14215087890625, 0.152587890625, 0.16302490234375, 0.1734619140625, 0.18389892578125, 0.1943359375, 0.20477294921875, 0.2152099609375, 0.22564697265625, 0.236083984375, 0.24652099609375, 0.2569580078125, 0.26739501953125, 0.27783203125, 0.28826904296875, 0.2987060546875, 0.30914306640625, 0.319580078125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 2.0, 9.0, 9.0, 13.0, 12.0, 16.0, 22.0, 32.0, 51.0, 106.0, 182.0, 313.0, 752.0, 2249.0, 11261.0, 178810.0, 809444.0, 38472.0, 4462.0, 1199.0, 506.0, 269.0, 152.0, 68.0, 51.0, 28.0, 17.0, 15.0, 12.0, 7.0, 5.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.30859375, -6.11297607421875, -5.9173583984375, -5.72174072265625, -5.526123046875, -5.33050537109375, -5.1348876953125, -4.93927001953125, -4.74365234375, -4.54803466796875, -4.3524169921875, -4.15679931640625, -3.961181640625, -3.76556396484375, -3.5699462890625, -3.37432861328125, -3.1787109375, -2.98309326171875, -2.7874755859375, -2.59185791015625, -2.396240234375, -2.20062255859375, -2.0050048828125, -1.80938720703125, -1.61376953125, -1.41815185546875, -1.2225341796875, -1.02691650390625, -0.831298828125, -0.63568115234375, -0.4400634765625, -0.24444580078125, -0.048828125, 0.14678955078125, 0.3424072265625, 0.53802490234375, 0.733642578125, 0.92926025390625, 1.1248779296875, 1.32049560546875, 1.51611328125, 1.71173095703125, 1.9073486328125, 2.10296630859375, 2.298583984375, 2.49420166015625, 2.6898193359375, 2.88543701171875, 3.0810546875, 3.27667236328125, 3.4722900390625, 3.66790771484375, 3.863525390625, 4.05914306640625, 4.2547607421875, 4.45037841796875, 4.64599609375, 4.84161376953125, 5.0372314453125, 5.23284912109375, 5.428466796875, 5.62408447265625, 5.8197021484375, 6.01531982421875, 6.2109375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 10.0, 9.0, 23.0, 31.0, 41.0, 52.0, 76.0, 80.0, 92.0, 111.0, 101.0, 95.0, 71.0, 57.0, 36.0, 37.0, 23.0, 15.0, 15.0, 8.0, 6.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.6328125, -3.525421142578125, -3.41802978515625, -3.310638427734375, -3.2032470703125, -3.095855712890625, -2.98846435546875, -2.881072998046875, -2.773681640625, -2.666290283203125, -2.55889892578125, -2.451507568359375, -2.3441162109375, -2.236724853515625, -2.12933349609375, -2.021942138671875, -1.91455078125, -1.807159423828125, -1.69976806640625, -1.592376708984375, -1.4849853515625, -1.377593994140625, -1.27020263671875, -1.162811279296875, -1.055419921875, -0.948028564453125, -0.84063720703125, -0.733245849609375, -0.6258544921875, -0.518463134765625, -0.41107177734375, -0.303680419921875, -0.1962890625, -0.088897705078125, 0.01849365234375, 0.125885009765625, 0.2332763671875, 0.340667724609375, 0.44805908203125, 0.555450439453125, 0.662841796875, 0.770233154296875, 0.87762451171875, 0.985015869140625, 1.0924072265625, 1.199798583984375, 1.30718994140625, 1.414581298828125, 1.52197265625, 1.629364013671875, 1.73675537109375, 1.844146728515625, 1.9515380859375, 2.058929443359375, 2.16632080078125, 2.273712158203125, 2.381103515625, 2.488494873046875, 2.59588623046875, 2.703277587890625, 2.8106689453125, 2.918060302734375, 3.02545166015625, 3.132843017578125, 3.240234375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 5.0, 3.0, 3.0, 4.0, 10.0, 6.0, 14.0, 18.0, 28.0, 29.0, 46.0, 72.0, 117.0, 203.0, 391.0, 763.0, 1558.0, 3154.0, 7325.0, 18431.0, 58191.0, 338281.0, 510286.0, 72421.0, 21400.0, 8653.0, 3644.0, 1615.0, 837.0, 432.0, 242.0, 122.0, 87.0, 53.0, 35.0, 27.0, 6.0, 16.0, 10.0, 5.0, 9.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.30078125, -1.2509002685546875, -1.201019287109375, -1.1511383056640625, -1.10125732421875, -1.0513763427734375, -1.001495361328125, -0.9516143798828125, -0.9017333984375, -0.8518524169921875, -0.801971435546875, -0.7520904541015625, -0.70220947265625, -0.6523284912109375, -0.602447509765625, -0.5525665283203125, -0.502685546875, -0.4528045654296875, -0.402923583984375, -0.3530426025390625, -0.30316162109375, -0.2532806396484375, -0.203399658203125, -0.1535186767578125, -0.1036376953125, -0.0537567138671875, -0.003875732421875, 0.0460052490234375, 0.09588623046875, 0.1457672119140625, 0.195648193359375, 0.2455291748046875, 0.29541015625, 0.3452911376953125, 0.395172119140625, 0.4450531005859375, 0.49493408203125, 0.5448150634765625, 0.594696044921875, 0.6445770263671875, 0.6944580078125, 0.7443389892578125, 0.794219970703125, 0.8441009521484375, 0.89398193359375, 0.9438629150390625, 0.993743896484375, 1.0436248779296875, 1.093505859375, 1.1433868408203125, 1.193267822265625, 1.2431488037109375, 1.29302978515625, 1.3429107666015625, 1.392791748046875, 1.4426727294921875, 1.4925537109375, 1.5424346923828125, 1.592315673828125, 1.6421966552734375, 1.69207763671875, 1.7419586181640625, 1.791839599609375, 1.8417205810546875, 1.8916015625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 8.0, 8.0, 12.0, 18.0, 33.0, 46.0, 77.0, 113.0, 213.0, 196.0, 99.0, 61.0, 33.0, 29.0, 13.0, 14.0, 12.0, 3.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004506111145019531, -0.0004376731812953949, -0.00042473524808883667, -0.00041179731488227844, -0.0003988593816757202, -0.000385921448469162, -0.00037298351526260376, -0.00036004558205604553, -0.0003471076488494873, -0.0003341697156429291, -0.00032123178243637085, -0.0003082938492298126, -0.0002953559160232544, -0.00028241798281669617, -0.00026948004961013794, -0.0002565421164035797, -0.00024360418319702148, -0.00023066624999046326, -0.00021772831678390503, -0.0002047903835773468, -0.00019185245037078857, -0.00017891451716423035, -0.00016597658395767212, -0.0001530386507511139, -0.00014010071754455566, -0.00012716278433799744, -0.00011422485113143921, -0.00010128691792488098, -8.834898471832275e-05, -7.541105151176453e-05, -6.24731183052063e-05, -4.953518509864807e-05, -3.6597251892089844e-05, -2.3659318685531616e-05, -1.0721385478973389e-05, 2.216547727584839e-06, 1.5154480934143066e-05, 2.8092414140701294e-05, 4.103034734725952e-05, 5.396828055381775e-05, 6.690621376037598e-05, 7.98441469669342e-05, 9.278208017349243e-05, 0.00010572001338005066, 0.00011865794658660889, 0.00013159587979316711, 0.00014453381299972534, 0.00015747174620628357, 0.0001704096794128418, 0.00018334761261940002, 0.00019628554582595825, 0.00020922347903251648, 0.0002221614122390747, 0.00023509934544563293, 0.00024803727865219116, 0.0002609752118587494, 0.0002739131450653076, 0.00028685107827186584, 0.00029978901147842407, 0.0003127269446849823, 0.00032566487789154053, 0.00033860281109809875, 0.000351540744304657, 0.0003644786775112152, 0.00037741661071777344]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 8.0, 8.0, 12.0, 19.0, 15.0, 20.0, 29.0, 64.0, 91.0, 196.0, 350.0, 907.0, 2716.0, 10987.0, 68962.0, 811373.0, 130529.0, 16461.0, 3705.0, 1128.0, 450.0, 206.0, 118.0, 57.0, 35.0, 26.0, 26.0, 16.0, 11.0, 5.0, 3.0, 7.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.61328125, -2.5186767578125, -2.424072265625, -2.3294677734375, -2.23486328125, -2.1402587890625, -2.045654296875, -1.9510498046875, -1.8564453125, -1.7618408203125, -1.667236328125, -1.5726318359375, -1.47802734375, -1.3834228515625, -1.288818359375, -1.1942138671875, -1.099609375, -1.0050048828125, -0.910400390625, -0.8157958984375, -0.72119140625, -0.6265869140625, -0.531982421875, -0.4373779296875, -0.3427734375, -0.2481689453125, -0.153564453125, -0.0589599609375, 0.03564453125, 0.1302490234375, 0.224853515625, 0.3194580078125, 0.4140625, 0.5086669921875, 0.603271484375, 0.6978759765625, 0.79248046875, 0.8870849609375, 0.981689453125, 1.0762939453125, 1.1708984375, 1.2655029296875, 1.360107421875, 1.4547119140625, 1.54931640625, 1.6439208984375, 1.738525390625, 1.8331298828125, 1.927734375, 2.0223388671875, 2.116943359375, 2.2115478515625, 2.30615234375, 2.4007568359375, 2.495361328125, 2.5899658203125, 2.6845703125, 2.7791748046875, 2.873779296875, 2.9683837890625, 3.06298828125, 3.1575927734375, 3.252197265625, 3.3468017578125, 3.44140625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 3.0, 4.0, 9.0, 7.0, 10.0, 21.0, 19.0, 25.0, 36.0, 47.0, 65.0, 77.0, 108.0, 134.0, 107.0, 87.0, 64.0, 55.0, 22.0, 19.0, 19.0, 16.0, 11.0, 9.0, 8.0, 4.0, 3.0, 4.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.720703125, -1.670684814453125, -1.62066650390625, -1.570648193359375, -1.5206298828125, -1.470611572265625, -1.42059326171875, -1.370574951171875, -1.320556640625, -1.270538330078125, -1.22052001953125, -1.170501708984375, -1.1204833984375, -1.070465087890625, -1.02044677734375, -0.970428466796875, -0.92041015625, -0.870391845703125, -0.82037353515625, -0.770355224609375, -0.7203369140625, -0.670318603515625, -0.62030029296875, -0.570281982421875, -0.520263671875, -0.470245361328125, -0.42022705078125, -0.370208740234375, -0.3201904296875, -0.270172119140625, -0.22015380859375, -0.170135498046875, -0.1201171875, -0.070098876953125, -0.02008056640625, 0.029937744140625, 0.0799560546875, 0.129974365234375, 0.17999267578125, 0.230010986328125, 0.280029296875, 0.330047607421875, 0.38006591796875, 0.430084228515625, 0.4801025390625, 0.530120849609375, 0.58013916015625, 0.630157470703125, 0.68017578125, 0.730194091796875, 0.78021240234375, 0.830230712890625, 0.8802490234375, 0.930267333984375, 0.98028564453125, 1.030303955078125, 1.080322265625, 1.130340576171875, 1.18035888671875, 1.230377197265625, 1.2803955078125, 1.330413818359375, 1.38043212890625, 1.430450439453125, 1.48046875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 6.0, 3.0, 3.0, 9.0, 10.0, 27.0, 27.0, 54.0, 79.0, 111.0, 108.0, 122.0, 127.0, 91.0, 79.0, 51.0, 38.0, 18.0, 22.0, 6.0, 10.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.558210372924805, -17.9486141204834, -17.33901596069336, -16.729419708251953, -16.119821548461914, -15.510225296020508, -14.900628089904785, -14.291030883789062, -13.681434631347656, -13.071837425231934, -12.462240219116211, -11.852643966674805, -11.243046760559082, -10.63344955444336, -10.023852348327637, -9.414255142211914, -8.804657936096191, -8.195060729980469, -7.585464000701904, -6.975866794586182, -6.366270065307617, -5.7566728591918945, -5.147075653076172, -4.537478923797607, -3.9278817176818848, -3.318284749984741, -2.7086877822875977, -2.099090576171875, -1.4894936084747314, -0.8798966407775879, -0.27029943466186523, 0.3392972946166992, 0.9488945007324219, 1.5584914684295654, 2.168088436126709, 2.7776856422424316, 3.387282609939575, 3.9968795776367188, 4.606476783752441, 5.216073513031006, 5.8256707191467285, 6.435267925262451, 7.044864654541016, 7.654461860656738, 8.264059066772461, 8.873655319213867, 9.483253479003906, 10.092849731445312, 10.702446937561035, 11.312044143676758, 11.92164134979248, 12.531238555908203, 13.14083480834961, 13.750432014465332, 14.360029220581055, 14.969625473022461, 15.5792236328125, 16.188819885253906, 16.798418045043945, 17.40801429748535, 18.01761245727539, 18.627208709716797, 19.236804962158203, 19.846403121948242, 20.45599937438965]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 5.0, 3.0, 1.0, 12.0, 4.0, 14.0, 8.0, 15.0, 7.0, 25.0, 14.0, 31.0, 30.0, 30.0, 36.0, 33.0, 45.0, 51.0, 56.0, 47.0, 46.0, 40.0, 35.0, 37.0, 26.0, 43.0, 40.0, 26.0, 35.0, 32.0, 34.0, 31.0, 24.0, 21.0, 16.0, 11.0, 7.0, 3.0, 4.0, 7.0, 4.0, 6.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.06781005859375, -9.732735633850098, -9.397662162780762, -9.06258773803711, -8.727514266967773, -8.392439842224121, -8.057366371154785, -7.722291946411133, -7.387218475341797, -7.052144527435303, -6.717070579528809, -6.3819966316223145, -6.04692268371582, -5.711848735809326, -5.376774787902832, -5.04170036315918, -4.7066264152526855, -4.371552467346191, -4.036478519439697, -3.701404571533203, -3.366330623626709, -3.031256675720215, -2.6961824893951416, -2.3611085414886475, -2.0260345935821533, -1.6909606456756592, -1.355886697769165, -1.0208126306533813, -0.6857386827468872, -0.35066473484039307, -0.015590667724609375, 0.31948328018188477, 0.6545572280883789, 0.989631175994873, 1.3247051239013672, 1.6597791910171509, 1.994853138923645, 2.3299269676208496, 2.665001153945923, 3.000075101852417, 3.335149049758911, 3.6702229976654053, 4.0052971839904785, 4.340371131896973, 4.675445079803467, 5.010519027709961, 5.345592975616455, 5.680666923522949, 6.015740871429443, 6.3508148193359375, 6.685888767242432, 7.020962715148926, 7.35603666305542, 7.691110610961914, 8.026185035705566, 8.361258506774902, 8.696332931518555, 9.031407356262207, 9.366480827331543, 9.701555252075195, 10.036628723144531, 10.371703147888184, 10.70677661895752, 11.041851043701172, 11.376924514770508]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 9.0, 17.0, 20.0, 35.0, 39.0, 66.0, 90.0, 126.0, 222.0, 342.0, 587.0, 951.0, 1564.0, 2861.0, 5384.0, 11372.0, 27047.0, 86578.0, 3206058.0, 741505.0, 65247.0, 22545.0, 9850.0, 5004.0, 2668.0, 1537.0, 935.0, 566.0, 344.0, 237.0, 158.0, 89.0, 71.0, 53.0, 32.0, 15.0, 13.0, 12.0, 10.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.322265625, -3.2181396484375, -3.114013671875, -3.0098876953125, -2.90576171875, -2.8016357421875, -2.697509765625, -2.5933837890625, -2.4892578125, -2.3851318359375, -2.281005859375, -2.1768798828125, -2.07275390625, -1.9686279296875, -1.864501953125, -1.7603759765625, -1.65625, -1.5521240234375, -1.447998046875, -1.3438720703125, -1.23974609375, -1.1356201171875, -1.031494140625, -0.9273681640625, -0.8232421875, -0.7191162109375, -0.614990234375, -0.5108642578125, -0.40673828125, -0.3026123046875, -0.198486328125, -0.0943603515625, 0.009765625, 0.1138916015625, 0.218017578125, 0.3221435546875, 0.42626953125, 0.5303955078125, 0.634521484375, 0.7386474609375, 0.8427734375, 0.9468994140625, 1.051025390625, 1.1551513671875, 1.25927734375, 1.3634033203125, 1.467529296875, 1.5716552734375, 1.67578125, 1.7799072265625, 1.884033203125, 1.9881591796875, 2.09228515625, 2.1964111328125, 2.300537109375, 2.4046630859375, 2.5087890625, 2.6129150390625, 2.717041015625, 2.8211669921875, 2.92529296875, 3.0294189453125, 3.133544921875, 3.2376708984375, 3.341796875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 0.0, 2.0, 1.0, 6.0, 2.0, 10.0, 7.0, 7.0, 8.0, 22.0, 16.0, 18.0, 19.0, 21.0, 24.0, 34.0, 42.0, 38.0, 39.0, 39.0, 37.0, 46.0, 50.0, 42.0, 35.0, 42.0, 31.0, 23.0, 43.0, 48.0, 34.0, 28.0, 23.0, 26.0, 20.0, 19.0, 17.0, 13.0, 16.0, 17.0, 7.0, 10.0, 4.0, 4.0, 5.0, 0.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.343505859375, -0.3329811096191406, -0.32245635986328125, -0.3119316101074219, -0.3014068603515625, -0.2908821105957031, -0.28035736083984375, -0.2698326110839844, -0.259307861328125, -0.24878311157226562, -0.23825836181640625, -0.22773361206054688, -0.2172088623046875, -0.20668411254882812, -0.19615936279296875, -0.18563461303710938, -0.17510986328125, -0.16458511352539062, -0.15406036376953125, -0.14353561401367188, -0.1330108642578125, -0.12248611450195312, -0.11196136474609375, -0.10143661499023438, -0.090911865234375, -0.08038711547851562, -0.06986236572265625, -0.059337615966796875, -0.0488128662109375, -0.038288116455078125, -0.02776336669921875, -0.017238616943359375, -0.0067138671875, 0.003810882568359375, 0.01433563232421875, 0.024860382080078125, 0.0353851318359375, 0.045909881591796875, 0.05643463134765625, 0.06695938110351562, 0.077484130859375, 0.08800888061523438, 0.09853363037109375, 0.10905838012695312, 0.1195831298828125, 0.13010787963867188, 0.14063262939453125, 0.15115737915039062, 0.16168212890625, 0.17220687866210938, 0.18273162841796875, 0.19325637817382812, 0.2037811279296875, 0.21430587768554688, 0.22483062744140625, 0.23535537719726562, 0.245880126953125, 0.2564048767089844, 0.26692962646484375, 0.2774543762207031, 0.2879791259765625, 0.2985038757324219, 0.30902862548828125, 0.3195533752441406, 0.330078125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 2.0, 4.0, 2.0, 13.0, 9.0, 21.0, 17.0, 32.0, 31.0, 40.0, 52.0, 88.0, 108.0, 217.0, 544.0, 2182.0, 21029.0, 4044913.0, 117899.0, 5287.0, 945.0, 333.0, 141.0, 106.0, 81.0, 47.0, 39.0, 31.0, 22.0, 19.0, 13.0, 6.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.8046875, -14.401611328125, -13.99853515625, -13.595458984375, -13.1923828125, -12.789306640625, -12.38623046875, -11.983154296875, -11.580078125, -11.177001953125, -10.77392578125, -10.370849609375, -9.9677734375, -9.564697265625, -9.16162109375, -8.758544921875, -8.35546875, -7.952392578125, -7.54931640625, -7.146240234375, -6.7431640625, -6.340087890625, -5.93701171875, -5.533935546875, -5.130859375, -4.727783203125, -4.32470703125, -3.921630859375, -3.5185546875, -3.115478515625, -2.71240234375, -2.309326171875, -1.90625, -1.503173828125, -1.10009765625, -0.697021484375, -0.2939453125, 0.109130859375, 0.51220703125, 0.915283203125, 1.318359375, 1.721435546875, 2.12451171875, 2.527587890625, 2.9306640625, 3.333740234375, 3.73681640625, 4.139892578125, 4.54296875, 4.946044921875, 5.34912109375, 5.752197265625, 6.1552734375, 6.558349609375, 6.96142578125, 7.364501953125, 7.767578125, 8.170654296875, 8.57373046875, 8.976806640625, 9.3798828125, 9.782958984375, 10.18603515625, 10.589111328125, 10.9921875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 9.0, 27.0, 51.0, 160.0, 2655.0, 980.0, 129.0, 41.0, 16.0, 11.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.015625, -3.85430908203125, -3.6929931640625, -3.53167724609375, -3.370361328125, -3.20904541015625, -3.0477294921875, -2.88641357421875, -2.72509765625, -2.56378173828125, -2.4024658203125, -2.24114990234375, -2.079833984375, -1.91851806640625, -1.7572021484375, -1.59588623046875, -1.4345703125, -1.27325439453125, -1.1119384765625, -0.95062255859375, -0.789306640625, -0.62799072265625, -0.4666748046875, -0.30535888671875, -0.14404296875, 0.01727294921875, 0.1785888671875, 0.33990478515625, 0.501220703125, 0.66253662109375, 0.8238525390625, 0.98516845703125, 1.146484375, 1.30780029296875, 1.4691162109375, 1.63043212890625, 1.791748046875, 1.95306396484375, 2.1143798828125, 2.27569580078125, 2.43701171875, 2.59832763671875, 2.7596435546875, 2.92095947265625, 3.082275390625, 3.24359130859375, 3.4049072265625, 3.56622314453125, 3.7275390625, 3.88885498046875, 4.0501708984375, 4.21148681640625, 4.372802734375, 4.53411865234375, 4.6954345703125, 4.85675048828125, 5.01806640625, 5.17938232421875, 5.3406982421875, 5.50201416015625, 5.663330078125, 5.82464599609375, 5.9859619140625, 6.14727783203125, 6.30859375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 18.0, 27.0, 75.0, 111.0, 177.0, 201.0, 162.0, 99.0, 46.0, 39.0, 15.0, 12.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-23.39603042602539, -22.84369468688965, -22.291358947753906, -21.739023208618164, -21.186687469482422, -20.634353637695312, -20.08201789855957, -19.529682159423828, -18.977346420288086, -18.425010681152344, -17.8726749420166, -17.32033920288086, -16.76800537109375, -16.215669631958008, -15.663333892822266, -15.110998153686523, -14.558662414550781, -14.006326675415039, -13.453990936279297, -12.901656150817871, -12.349320411682129, -11.796984672546387, -11.244649887084961, -10.692314147949219, -10.139978408813477, -9.587642669677734, -9.035306930541992, -8.482972145080566, -7.930636405944824, -7.378300666809082, -6.825965404510498, -6.273630142211914, -5.721294403076172, -5.16895866394043, -4.616623401641846, -4.064288139343262, -3.5119524002075195, -2.9596168994903564, -2.4072813987731934, -1.8549458980560303, -1.3026103973388672, -0.7502748966217041, -0.19793939590454102, 0.35439610481262207, 0.9067316055297852, 1.4590671062469482, 2.0114026069641113, 2.5637381076812744, 3.1160736083984375, 3.6684091091156006, 4.220744609832764, 4.773079872131348, 5.32541561126709, 5.877751350402832, 6.430086612701416, 6.982421875, 7.534757614135742, 8.087093353271484, 8.639429092407227, 9.191763877868652, 9.744099617004395, 10.296435356140137, 10.848770141601562, 11.401105880737305, 11.953441619873047]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 9.0, 8.0, 9.0, 8.0, 16.0, 16.0, 24.0, 21.0, 30.0, 27.0, 42.0, 39.0, 50.0, 43.0, 48.0, 53.0, 60.0, 46.0, 49.0, 48.0, 53.0, 39.0, 46.0, 38.0, 37.0, 26.0, 22.0, 20.0, 21.0, 15.0, 6.0, 7.0, 8.0, 10.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.642404556274414, -8.420464515686035, -8.198525428771973, -7.976585388183594, -7.754645347595215, -7.532705783843994, -7.310766220092773, -7.0888261795043945, -6.866886138916016, -6.644946575164795, -6.423006534576416, -6.201066970825195, -5.979126930236816, -5.757187366485596, -5.535247802734375, -5.313307762145996, -5.091368198394775, -4.869428634643555, -4.647488594055176, -4.425549030303955, -4.203608989715576, -3.9816694259643555, -3.7597296237945557, -3.537789821624756, -3.315850019454956, -3.0939102172851562, -2.8719704151153564, -2.6500306129455566, -2.428091049194336, -2.206151008605957, -1.9842114448547363, -1.7622716426849365, -1.540332317352295, -1.3183925151824951, -1.0964527130126953, -0.8745130300521851, -0.6525732278823853, -0.43063342571258545, -0.2086937427520752, 0.01324605941772461, 0.23518586158752441, 0.45712563395500183, 0.6790654063224792, 0.9010051488876343, 1.122944951057434, 1.3448847532272339, 1.5668244361877441, 1.788764238357544, 2.0107040405273438, 2.2326438426971436, 2.4545836448669434, 2.676523208618164, 2.898463249206543, 3.1204028129577637, 3.3423426151275635, 3.5642824172973633, 3.786222219467163, 4.008162021636963, 4.230101585388184, 4.4520416259765625, 4.673981189727783, 4.895921230316162, 5.117860794067383, 5.339800834655762, 5.561740398406982]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 6.0, 3.0, 2.0, 6.0, 7.0, 12.0, 23.0, 35.0, 47.0, 95.0, 155.0, 279.0, 465.0, 831.0, 1488.0, 2940.0, 5894.0, 13169.0, 31192.0, 87061.0, 299453.0, 403829.0, 126810.0, 42375.0, 17102.0, 7613.0, 3563.0, 1794.0, 945.0, 570.0, 314.0, 189.0, 110.0, 73.0, 31.0, 25.0, 14.0, 15.0, 3.0, 5.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.78125, -2.68902587890625, -2.5968017578125, -2.50457763671875, -2.412353515625, -2.32012939453125, -2.2279052734375, -2.13568115234375, -2.04345703125, -1.95123291015625, -1.8590087890625, -1.76678466796875, -1.674560546875, -1.58233642578125, -1.4901123046875, -1.39788818359375, -1.3056640625, -1.21343994140625, -1.1212158203125, -1.02899169921875, -0.936767578125, -0.84454345703125, -0.7523193359375, -0.66009521484375, -0.56787109375, -0.47564697265625, -0.3834228515625, -0.29119873046875, -0.198974609375, -0.10675048828125, -0.0145263671875, 0.07769775390625, 0.169921875, 0.26214599609375, 0.3543701171875, 0.44659423828125, 0.538818359375, 0.63104248046875, 0.7232666015625, 0.81549072265625, 0.90771484375, 0.99993896484375, 1.0921630859375, 1.18438720703125, 1.276611328125, 1.36883544921875, 1.4610595703125, 1.55328369140625, 1.6455078125, 1.73773193359375, 1.8299560546875, 1.92218017578125, 2.014404296875, 2.10662841796875, 2.1988525390625, 2.29107666015625, 2.38330078125, 2.47552490234375, 2.5677490234375, 2.65997314453125, 2.752197265625, 2.84442138671875, 2.9366455078125, 3.02886962890625, 3.12109375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 3.0, 7.0, 10.0, 9.0, 10.0, 11.0, 19.0, 18.0, 21.0, 31.0, 39.0, 37.0, 45.0, 38.0, 31.0, 42.0, 44.0, 62.0, 52.0, 51.0, 42.0, 43.0, 36.0, 46.0, 35.0, 40.0, 31.0, 28.0, 26.0, 24.0, 16.0, 13.0, 11.0, 5.0, 11.0, 8.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51123046875, -0.4963264465332031, -0.48142242431640625, -0.4665184020996094, -0.4516143798828125, -0.4367103576660156, -0.42180633544921875, -0.4069023132324219, -0.391998291015625, -0.3770942687988281, -0.36219024658203125, -0.3472862243652344, -0.3323822021484375, -0.3174781799316406, -0.30257415771484375, -0.2876701354980469, -0.27276611328125, -0.2578620910644531, -0.24295806884765625, -0.22805404663085938, -0.2131500244140625, -0.19824600219726562, -0.18334197998046875, -0.16843795776367188, -0.153533935546875, -0.13862991333007812, -0.12372589111328125, -0.10882186889648438, -0.0939178466796875, -0.07901382446289062, -0.06410980224609375, -0.049205780029296875, -0.0343017578125, -0.019397735595703125, -0.00449371337890625, 0.010410308837890625, 0.0253143310546875, 0.040218353271484375, 0.05512237548828125, 0.07002639770507812, 0.084930419921875, 0.09983444213867188, 0.11473846435546875, 0.12964248657226562, 0.1445465087890625, 0.15945053100585938, 0.17435455322265625, 0.18925857543945312, 0.20416259765625, 0.21906661987304688, 0.23397064208984375, 0.24887466430664062, 0.2637786865234375, 0.2786827087402344, 0.29358673095703125, 0.3084907531738281, 0.323394775390625, 0.3382987976074219, 0.35320281982421875, 0.3681068420410156, 0.3830108642578125, 0.3979148864746094, 0.41281890869140625, 0.4277229309082031, 0.442626953125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 9.0, 6.0, 8.0, 9.0, 28.0, 44.0, 61.0, 104.0, 182.0, 342.0, 738.0, 1677.0, 4919.0, 24293.0, 606939.0, 382901.0, 19214.0, 4184.0, 1442.0, 690.0, 302.0, 194.0, 110.0, 54.0, 31.0, 21.0, 14.0, 10.0, 9.0, 2.0, 2.0, 7.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1796875, -7.923583984375, -7.66748046875, -7.411376953125, -7.1552734375, -6.899169921875, -6.64306640625, -6.386962890625, -6.130859375, -5.874755859375, -5.61865234375, -5.362548828125, -5.1064453125, -4.850341796875, -4.59423828125, -4.338134765625, -4.08203125, -3.825927734375, -3.56982421875, -3.313720703125, -3.0576171875, -2.801513671875, -2.54541015625, -2.289306640625, -2.033203125, -1.777099609375, -1.52099609375, -1.264892578125, -1.0087890625, -0.752685546875, -0.49658203125, -0.240478515625, 0.015625, 0.271728515625, 0.52783203125, 0.783935546875, 1.0400390625, 1.296142578125, 1.55224609375, 1.808349609375, 2.064453125, 2.320556640625, 2.57666015625, 2.832763671875, 3.0888671875, 3.344970703125, 3.60107421875, 3.857177734375, 4.11328125, 4.369384765625, 4.62548828125, 4.881591796875, 5.1376953125, 5.393798828125, 5.64990234375, 5.906005859375, 6.162109375, 6.418212890625, 6.67431640625, 6.930419921875, 7.1865234375, 7.442626953125, 7.69873046875, 7.954833984375, 8.2109375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 10.0, 16.0, 11.0, 14.0, 12.0, 23.0, 29.0, 51.0, 49.0, 69.0, 67.0, 67.0, 82.0, 78.0, 72.0, 47.0, 63.0, 55.0, 36.0, 40.0, 27.0, 20.0, 25.0, 6.0, 8.0, 7.0, 3.0, 4.0, 7.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.6640625, -3.546142578125, -3.42822265625, -3.310302734375, -3.1923828125, -3.074462890625, -2.95654296875, -2.838623046875, -2.720703125, -2.602783203125, -2.48486328125, -2.366943359375, -2.2490234375, -2.131103515625, -2.01318359375, -1.895263671875, -1.77734375, -1.659423828125, -1.54150390625, -1.423583984375, -1.3056640625, -1.187744140625, -1.06982421875, -0.951904296875, -0.833984375, -0.716064453125, -0.59814453125, -0.480224609375, -0.3623046875, -0.244384765625, -0.12646484375, -0.008544921875, 0.109375, 0.227294921875, 0.34521484375, 0.463134765625, 0.5810546875, 0.698974609375, 0.81689453125, 0.934814453125, 1.052734375, 1.170654296875, 1.28857421875, 1.406494140625, 1.5244140625, 1.642333984375, 1.76025390625, 1.878173828125, 1.99609375, 2.114013671875, 2.23193359375, 2.349853515625, 2.4677734375, 2.585693359375, 2.70361328125, 2.821533203125, 2.939453125, 3.057373046875, 3.17529296875, 3.293212890625, 3.4111328125, 3.529052734375, 3.64697265625, 3.764892578125, 3.8828125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 7.0, 13.0, 13.0, 16.0, 27.0, 34.0, 40.0, 65.0, 123.0, 188.0, 270.0, 481.0, 775.0, 1570.0, 3411.0, 9175.0, 43897.0, 591988.0, 353207.0, 29917.0, 7238.0, 2859.0, 1347.0, 753.0, 431.0, 251.0, 155.0, 99.0, 56.0, 41.0, 27.0, 18.0, 15.0, 6.0, 13.0, 10.0, 10.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.78515625, -2.697845458984375, -2.61053466796875, -2.523223876953125, -2.4359130859375, -2.348602294921875, -2.26129150390625, -2.173980712890625, -2.086669921875, -1.999359130859375, -1.91204833984375, -1.824737548828125, -1.7374267578125, -1.650115966796875, -1.56280517578125, -1.475494384765625, -1.38818359375, -1.300872802734375, -1.21356201171875, -1.126251220703125, -1.0389404296875, -0.951629638671875, -0.86431884765625, -0.777008056640625, -0.689697265625, -0.602386474609375, -0.51507568359375, -0.427764892578125, -0.3404541015625, -0.253143310546875, -0.16583251953125, -0.078521728515625, 0.0087890625, 0.096099853515625, 0.18341064453125, 0.270721435546875, 0.3580322265625, 0.445343017578125, 0.53265380859375, 0.619964599609375, 0.707275390625, 0.794586181640625, 0.88189697265625, 0.969207763671875, 1.0565185546875, 1.143829345703125, 1.23114013671875, 1.318450927734375, 1.40576171875, 1.493072509765625, 1.58038330078125, 1.667694091796875, 1.7550048828125, 1.842315673828125, 1.92962646484375, 2.016937255859375, 2.104248046875, 2.191558837890625, 2.27886962890625, 2.366180419921875, 2.4534912109375, 2.540802001953125, 2.62811279296875, 2.715423583984375, 2.802734375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 11.0, 9.0, 26.0, 87.0, 202.0, 315.0, 201.0, 85.0, 31.0, 18.0, 2.0, 5.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005521774291992188, -0.0005253404378890991, -0.0004985034465789795, -0.00047166645526885986, -0.00044482946395874023, -0.0004179924726486206, -0.000391155481338501, -0.00036431849002838135, -0.0003374814987182617, -0.0003106445074081421, -0.00028380751609802246, -0.00025697052478790283, -0.0002301335334777832, -0.00020329654216766357, -0.00017645955085754395, -0.00014962255954742432, -0.0001227855682373047, -9.594857692718506e-05, -6.911158561706543e-05, -4.22745943069458e-05, -1.5437602996826172e-05, 1.1399388313293457e-05, 3.8236379623413086e-05, 6.507337093353271e-05, 9.191036224365234e-05, 0.00011874735355377197, 0.0001455843448638916, 0.00017242133617401123, 0.00019925832748413086, 0.0002260953187942505, 0.0002529323101043701, 0.00027976930141448975, 0.0003066062927246094, 0.000333443284034729, 0.00036028027534484863, 0.00038711726665496826, 0.0004139542579650879, 0.0004407912492752075, 0.00046762824058532715, 0.0004944652318954468, 0.0005213022232055664, 0.000548139214515686, 0.0005749762058258057, 0.0006018131971359253, 0.0006286501884460449, 0.0006554871797561646, 0.0006823241710662842, 0.0007091611623764038, 0.0007359981536865234, 0.0007628351449966431, 0.0007896721363067627, 0.0008165091276168823, 0.000843346118927002, 0.0008701831102371216, 0.0008970201015472412, 0.0009238570928573608, 0.0009506940841674805, 0.0009775310754776, 0.0010043680667877197, 0.0010312050580978394, 0.001058042049407959, 0.0010848790407180786, 0.0011117160320281982, 0.0011385530233383179, 0.0011653900146484375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 5.0, 3.0, 7.0, 7.0, 12.0, 22.0, 48.0, 72.0, 150.0, 395.0, 1196.0, 5964.0, 212730.0, 814588.0, 10648.0, 1770.0, 515.0, 191.0, 105.0, 51.0, 26.0, 11.0, 12.0, 10.0, 2.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.72265625, -5.51922607421875, -5.3157958984375, -5.11236572265625, -4.908935546875, -4.70550537109375, -4.5020751953125, -4.29864501953125, -4.09521484375, -3.89178466796875, -3.6883544921875, -3.48492431640625, -3.281494140625, -3.07806396484375, -2.8746337890625, -2.67120361328125, -2.4677734375, -2.26434326171875, -2.0609130859375, -1.85748291015625, -1.654052734375, -1.45062255859375, -1.2471923828125, -1.04376220703125, -0.84033203125, -0.63690185546875, -0.4334716796875, -0.23004150390625, -0.026611328125, 0.17681884765625, 0.3802490234375, 0.58367919921875, 0.787109375, 0.99053955078125, 1.1939697265625, 1.39739990234375, 1.600830078125, 1.80426025390625, 2.0076904296875, 2.21112060546875, 2.41455078125, 2.61798095703125, 2.8214111328125, 3.02484130859375, 3.228271484375, 3.43170166015625, 3.6351318359375, 3.83856201171875, 4.0419921875, 4.24542236328125, 4.4488525390625, 4.65228271484375, 4.855712890625, 5.05914306640625, 5.2625732421875, 5.46600341796875, 5.66943359375, 5.87286376953125, 6.0762939453125, 6.27972412109375, 6.483154296875, 6.68658447265625, 6.8900146484375, 7.09344482421875, 7.296875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 5.0, 11.0, 10.0, 17.0, 21.0, 36.0, 63.0, 119.0, 195.0, 186.0, 136.0, 75.0, 55.0, 25.0, 15.0, 12.0, 7.0, 7.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.236328125, -3.141815185546875, -3.04730224609375, -2.952789306640625, -2.8582763671875, -2.763763427734375, -2.66925048828125, -2.574737548828125, -2.480224609375, -2.385711669921875, -2.29119873046875, -2.196685791015625, -2.1021728515625, -2.007659912109375, -1.91314697265625, -1.818634033203125, -1.72412109375, -1.629608154296875, -1.53509521484375, -1.440582275390625, -1.3460693359375, -1.251556396484375, -1.15704345703125, -1.062530517578125, -0.968017578125, -0.873504638671875, -0.77899169921875, -0.684478759765625, -0.5899658203125, -0.495452880859375, -0.40093994140625, -0.306427001953125, -0.2119140625, -0.117401123046875, -0.02288818359375, 0.071624755859375, 0.1661376953125, 0.260650634765625, 0.35516357421875, 0.449676513671875, 0.544189453125, 0.638702392578125, 0.73321533203125, 0.827728271484375, 0.9222412109375, 1.016754150390625, 1.11126708984375, 1.205780029296875, 1.30029296875, 1.394805908203125, 1.48931884765625, 1.583831787109375, 1.6783447265625, 1.772857666015625, 1.86737060546875, 1.961883544921875, 2.056396484375, 2.150909423828125, 2.24542236328125, 2.339935302734375, 2.4344482421875, 2.528961181640625, 2.62347412109375, 2.717987060546875, 2.8125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 13.0, 21.0, 49.0, 93.0, 168.0, 193.0, 169.0, 112.0, 90.0, 43.0, 20.0, 11.0, 4.0, 8.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.037952423095703, -29.67232322692871, -28.30669403076172, -26.94106674194336, -25.575437545776367, -24.209808349609375, -22.844179153442383, -21.47854995727539, -20.11292266845703, -18.74729347229004, -17.381664276123047, -16.016036987304688, -14.650407791137695, -13.284778594970703, -11.919149398803711, -10.553521156311035, -9.187891006469727, -7.822262287139893, -6.456633567810059, -5.091004371643066, -3.7253756523132324, -2.3597469329833984, -0.9941177368164062, 0.37151050567626953, 1.7371397018432617, 3.1027684211730957, 4.46839714050293, 5.834026336669922, 7.199655055999756, 8.56528377532959, 9.930912971496582, 11.296541213989258, 12.66217041015625, 14.027799606323242, 15.393427848815918, 16.759056091308594, 18.124685287475586, 19.490314483642578, 20.85594367980957, 22.221572875976562, 23.587200164794922, 24.952829360961914, 26.318458557128906, 27.684085845947266, 29.049715042114258, 30.41534423828125, 31.780973434448242, 33.146602630615234, 34.512229919433594, 35.87785720825195, 37.24348831176758, 38.60911560058594, 39.97474670410156, 41.34037399291992, 42.70600128173828, 44.071632385253906, 45.43726348876953, 46.80289077758789, 48.168521881103516, 49.534149169921875, 50.8997802734375, 52.26540756225586, 53.63103485107422, 54.996665954589844, 56.3622932434082]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 5.0, 6.0, 2.0, 6.0, 7.0, 16.0, 18.0, 18.0, 18.0, 23.0, 25.0, 22.0, 26.0, 39.0, 34.0, 42.0, 48.0, 66.0, 47.0, 46.0, 57.0, 51.0, 50.0, 42.0, 42.0, 34.0, 36.0, 33.0, 25.0, 23.0, 16.0, 14.0, 18.0, 11.0, 12.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-19.131568908691406, -18.591711044311523, -18.05185317993164, -17.511993408203125, -16.972135543823242, -16.43227767944336, -15.892419815063477, -15.352561950683594, -14.812703132629395, -14.272845268249512, -13.732986450195312, -13.19312858581543, -12.653270721435547, -12.113411903381348, -11.573554039001465, -11.033695220947266, -10.493837356567383, -9.9539794921875, -9.4141206741333, -8.874262809753418, -8.334403991699219, -7.794546127319336, -7.254688262939453, -6.714829921722412, -6.174971580505371, -5.63511323928833, -5.095254898071289, -4.555397033691406, -4.015538692474365, -3.475680351257324, -2.9358222484588623, -2.3959641456604004, -1.8561058044433594, -1.316247582435608, -0.7763893604278564, -0.23653113842010498, 0.3033270835876465, 0.8431854248046875, 1.3830435276031494, 1.9229016304016113, 2.4627599716186523, 3.0026183128356934, 3.5424764156341553, 4.082334518432617, 4.622192859649658, 5.162051200866699, 5.701909065246582, 6.241767406463623, 6.781625747680664, 7.321484088897705, 7.861342430114746, 8.401200294494629, 8.941059112548828, 9.480916976928711, 10.020774841308594, 10.560632705688477, 11.100491523742676, 11.640349388122559, 12.180208206176758, 12.72006607055664, 13.259923934936523, 13.799782752990723, 14.339640617370605, 14.879499435424805, 15.419357299804688]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 6.0, 3.0, 7.0, 9.0, 23.0, 27.0, 33.0, 43.0, 58.0, 103.0, 153.0, 243.0, 373.0, 572.0, 937.0, 1717.0, 4706.0, 57792.0, 4111317.0, 10405.0, 2493.0, 1200.0, 729.0, 451.0, 294.0, 177.0, 140.0, 83.0, 62.0, 43.0, 33.0, 18.0, 9.0, 13.0, 7.0, 4.0, 2.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8359375, -9.53076171875, -9.2255859375, -8.92041015625, -8.615234375, -8.31005859375, -8.0048828125, -7.69970703125, -7.39453125, -7.08935546875, -6.7841796875, -6.47900390625, -6.173828125, -5.86865234375, -5.5634765625, -5.25830078125, -4.953125, -4.64794921875, -4.3427734375, -4.03759765625, -3.732421875, -3.42724609375, -3.1220703125, -2.81689453125, -2.51171875, -2.20654296875, -1.9013671875, -1.59619140625, -1.291015625, -0.98583984375, -0.6806640625, -0.37548828125, -0.0703125, 0.23486328125, 0.5400390625, 0.84521484375, 1.150390625, 1.45556640625, 1.7607421875, 2.06591796875, 2.37109375, 2.67626953125, 2.9814453125, 3.28662109375, 3.591796875, 3.89697265625, 4.2021484375, 4.50732421875, 4.8125, 5.11767578125, 5.4228515625, 5.72802734375, 6.033203125, 6.33837890625, 6.6435546875, 6.94873046875, 7.25390625, 7.55908203125, 7.8642578125, 8.16943359375, 8.474609375, 8.77978515625, 9.0849609375, 9.39013671875, 9.6953125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 10.0, 7.0, 16.0, 17.0, 13.0, 31.0, 31.0, 34.0, 34.0, 32.0, 49.0, 47.0, 51.0, 43.0, 47.0, 58.0, 49.0, 46.0, 49.0, 46.0, 40.0, 46.0, 38.0, 32.0, 29.0, 19.0, 16.0, 20.0, 15.0, 9.0, 5.0, 7.0, 2.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5654296875, -0.5485076904296875, -0.531585693359375, -0.5146636962890625, -0.49774169921875, -0.4808197021484375, -0.463897705078125, -0.4469757080078125, -0.4300537109375, -0.4131317138671875, -0.396209716796875, -0.3792877197265625, -0.36236572265625, -0.3454437255859375, -0.328521728515625, -0.3115997314453125, -0.294677734375, -0.2777557373046875, -0.260833740234375, -0.2439117431640625, -0.22698974609375, -0.2100677490234375, -0.193145751953125, -0.1762237548828125, -0.1593017578125, -0.1423797607421875, -0.125457763671875, -0.1085357666015625, -0.09161376953125, -0.0746917724609375, -0.057769775390625, -0.0408477783203125, -0.02392578125, -0.0070037841796875, 0.009918212890625, 0.0268402099609375, 0.04376220703125, 0.0606842041015625, 0.077606201171875, 0.0945281982421875, 0.1114501953125, 0.1283721923828125, 0.145294189453125, 0.1622161865234375, 0.17913818359375, 0.1960601806640625, 0.212982177734375, 0.2299041748046875, 0.246826171875, 0.2637481689453125, 0.280670166015625, 0.2975921630859375, 0.31451416015625, 0.3314361572265625, 0.348358154296875, 0.3652801513671875, 0.3822021484375, 0.3991241455078125, 0.416046142578125, 0.4329681396484375, 0.44989013671875, 0.4668121337890625, 0.483734130859375, 0.5006561279296875, 0.517578125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 5.0, 4.0, 11.0, 14.0, 16.0, 41.0, 36.0, 43.0, 67.0, 72.0, 127.0, 146.0, 198.0, 307.0, 417.0, 573.0, 991.0, 1787.0, 3784.0, 13187.0, 512424.0, 3636581.0, 14537.0, 3988.0, 1745.0, 1017.0, 603.0, 429.0, 328.0, 216.0, 165.0, 115.0, 81.0, 69.0, 47.0, 31.0, 28.0, 12.0, 16.0, 10.0, 9.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.97265625, -5.797119140625, -5.62158203125, -5.446044921875, -5.2705078125, -5.094970703125, -4.91943359375, -4.743896484375, -4.568359375, -4.392822265625, -4.21728515625, -4.041748046875, -3.8662109375, -3.690673828125, -3.51513671875, -3.339599609375, -3.1640625, -2.988525390625, -2.81298828125, -2.637451171875, -2.4619140625, -2.286376953125, -2.11083984375, -1.935302734375, -1.759765625, -1.584228515625, -1.40869140625, -1.233154296875, -1.0576171875, -0.882080078125, -0.70654296875, -0.531005859375, -0.35546875, -0.179931640625, -0.00439453125, 0.171142578125, 0.3466796875, 0.522216796875, 0.69775390625, 0.873291015625, 1.048828125, 1.224365234375, 1.39990234375, 1.575439453125, 1.7509765625, 1.926513671875, 2.10205078125, 2.277587890625, 2.453125, 2.628662109375, 2.80419921875, 2.979736328125, 3.1552734375, 3.330810546875, 3.50634765625, 3.681884765625, 3.857421875, 4.032958984375, 4.20849609375, 4.384033203125, 4.5595703125, 4.735107421875, 4.91064453125, 5.086181640625, 5.26171875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 5.0, 6.0, 4.0, 3.0, 14.0, 22.0, 44.0, 136.0, 3528.0, 213.0, 47.0, 22.0, 18.0, 8.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9453125, -0.9122314453125, -0.879150390625, -0.8460693359375, -0.81298828125, -0.7799072265625, -0.746826171875, -0.7137451171875, -0.6806640625, -0.6475830078125, -0.614501953125, -0.5814208984375, -0.54833984375, -0.5152587890625, -0.482177734375, -0.4490966796875, -0.416015625, -0.3829345703125, -0.349853515625, -0.3167724609375, -0.28369140625, -0.2506103515625, -0.217529296875, -0.1844482421875, -0.1513671875, -0.1182861328125, -0.085205078125, -0.0521240234375, -0.01904296875, 0.0140380859375, 0.047119140625, 0.0802001953125, 0.11328125, 0.1463623046875, 0.179443359375, 0.2125244140625, 0.24560546875, 0.2786865234375, 0.311767578125, 0.3448486328125, 0.3779296875, 0.4110107421875, 0.444091796875, 0.4771728515625, 0.51025390625, 0.5433349609375, 0.576416015625, 0.6094970703125, 0.642578125, 0.6756591796875, 0.708740234375, 0.7418212890625, 0.77490234375, 0.8079833984375, 0.841064453125, 0.8741455078125, 0.9072265625, 0.9403076171875, 0.973388671875, 1.0064697265625, 1.03955078125, 1.0726318359375, 1.105712890625, 1.1387939453125, 1.171875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 3.0, 5.0, 10.0, 5.0, 6.0, 8.0, 14.0, 14.0, 26.0, 27.0, 32.0, 42.0, 54.0, 57.0, 78.0, 60.0, 70.0, 64.0, 70.0, 64.0, 63.0, 38.0, 47.0, 33.0, 18.0, 19.0, 15.0, 19.0, 11.0, 8.0, 9.0, 3.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.801316499710083, -1.7369202375411987, -1.6725239753723145, -1.6081278324127197, -1.5437315702438354, -1.4793353080749512, -1.4149391651153564, -1.3505429029464722, -1.286146640777588, -1.2217503786087036, -1.1573541164398193, -1.0929579734802246, -1.0285617113113403, -0.964165449142456, -0.8997692465782166, -0.835373044013977, -0.7709767818450928, -0.7065805196762085, -0.642184317111969, -0.5777881145477295, -0.5133918523788452, -0.4489956200122833, -0.38459938764572144, -0.32020315527915955, -0.25580692291259766, -0.19141069054603577, -0.12701445817947388, -0.06261822581291199, 0.0017780065536499023, 0.06617423892021179, 0.13057047128677368, 0.19496670365333557, 0.25936317443847656, 0.32375940680503845, 0.38815563917160034, 0.45255187153816223, 0.5169481039047241, 0.5813443660736084, 0.6457405686378479, 0.7101367712020874, 0.7745330333709717, 0.838929295539856, 0.9033254981040955, 0.967721700668335, 1.0321179628372192, 1.0965142250061035, 1.1609103679656982, 1.2253066301345825, 1.2897028923034668, 1.354099154472351, 1.4184954166412354, 1.48289155960083, 1.5472878217697144, 1.6116840839385986, 1.6760802268981934, 1.7404764890670776, 1.804872751235962, 1.8692690134048462, 1.9336652755737305, 1.9980614185333252, 2.06245756149292, 2.1268539428710938, 2.1912500858306885, 2.2556464672088623, 2.320042610168457]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 5.0, 2.0, 2.0, 7.0, 11.0, 9.0, 9.0, 16.0, 22.0, 20.0, 16.0, 22.0, 26.0, 24.0, 37.0, 32.0, 34.0, 41.0, 41.0, 34.0, 45.0, 44.0, 52.0, 38.0, 44.0, 42.0, 37.0, 32.0, 40.0, 24.0, 31.0, 34.0, 27.0, 18.0, 19.0, 14.0, 14.0, 10.0, 5.0, 5.0, 4.0, 4.0, 5.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6023173332214355, -1.5578314065933228, -1.5133453607559204, -1.4688594341278076, -1.4243735074996948, -1.379887580871582, -1.3354015350341797, -1.290915608406067, -1.246429681777954, -1.2019437551498413, -1.157457709312439, -1.1129717826843262, -1.0684858560562134, -1.0239999294281006, -0.9795138835906982, -0.9350279569625854, -0.8905419111251831, -0.8460559248924255, -0.8015699982643127, -0.7570840120315552, -0.7125980854034424, -0.6681120991706848, -0.6236261129379272, -0.5791401863098145, -0.5346542000770569, -0.4901682436466217, -0.4456822872161865, -0.40119630098342896, -0.3567103445529938, -0.3122243881225586, -0.267738401889801, -0.22325244545936584, -0.17876648902893066, -0.13428053259849548, -0.08979456126689911, -0.045308589935302734, -0.0008226335048675537, 0.04366332292556763, 0.0881493091583252, 0.13263526558876038, 0.17712122201919556, 0.22160717844963074, 0.2660931348800659, 0.3105791211128235, 0.35506507754325867, 0.39955103397369385, 0.4440370202064514, 0.4885229766368866, 0.5330089330673218, 0.5774949193000793, 0.6219808459281921, 0.6664668321609497, 0.7109527587890625, 0.7554387450218201, 0.7999247312545776, 0.8444106578826904, 0.888896644115448, 0.9333826303482056, 0.9778685569763184, 1.0223546028137207, 1.0668405294418335, 1.1113264560699463, 1.1558125019073486, 1.2002984285354614, 1.2447843551635742]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 7.0, 4.0, 11.0, 26.0, 35.0, 45.0, 84.0, 117.0, 285.0, 487.0, 868.0, 1766.0, 3653.0, 7551.0, 16935.0, 38808.0, 93766.0, 221209.0, 328091.0, 192878.0, 80384.0, 33731.0, 14607.0, 6716.0, 3162.0, 1538.0, 768.0, 443.0, 229.0, 127.0, 76.0, 44.0, 29.0, 25.0, 13.0, 10.0, 2.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.14453125, -2.078369140625, -2.01220703125, -1.946044921875, -1.8798828125, -1.813720703125, -1.74755859375, -1.681396484375, -1.615234375, -1.549072265625, -1.48291015625, -1.416748046875, -1.3505859375, -1.284423828125, -1.21826171875, -1.152099609375, -1.0859375, -1.019775390625, -0.95361328125, -0.887451171875, -0.8212890625, -0.755126953125, -0.68896484375, -0.622802734375, -0.556640625, -0.490478515625, -0.42431640625, -0.358154296875, -0.2919921875, -0.225830078125, -0.15966796875, -0.093505859375, -0.02734375, 0.038818359375, 0.10498046875, 0.171142578125, 0.2373046875, 0.303466796875, 0.36962890625, 0.435791015625, 0.501953125, 0.568115234375, 0.63427734375, 0.700439453125, 0.7666015625, 0.832763671875, 0.89892578125, 0.965087890625, 1.03125, 1.097412109375, 1.16357421875, 1.229736328125, 1.2958984375, 1.362060546875, 1.42822265625, 1.494384765625, 1.560546875, 1.626708984375, 1.69287109375, 1.759033203125, 1.8251953125, 1.891357421875, 1.95751953125, 2.023681640625, 2.08984375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 5.0, 8.0, 11.0, 3.0, 12.0, 13.0, 20.0, 26.0, 23.0, 30.0, 36.0, 35.0, 35.0, 46.0, 32.0, 51.0, 41.0, 58.0, 46.0, 48.0, 50.0, 45.0, 48.0, 39.0, 39.0, 33.0, 40.0, 30.0, 21.0, 20.0, 13.0, 8.0, 9.0, 9.0, 6.0, 9.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55029296875, -0.5336837768554688, -0.5170745849609375, -0.5004653930664062, -0.483856201171875, -0.46724700927734375, -0.4506378173828125, -0.43402862548828125, -0.41741943359375, -0.40081024169921875, -0.3842010498046875, -0.36759185791015625, -0.350982666015625, -0.33437347412109375, -0.3177642822265625, -0.30115509033203125, -0.2845458984375, -0.26793670654296875, -0.2513275146484375, -0.23471832275390625, -0.218109130859375, -0.20149993896484375, -0.1848907470703125, -0.16828155517578125, -0.15167236328125, -0.13506317138671875, -0.1184539794921875, -0.10184478759765625, -0.085235595703125, -0.06862640380859375, -0.0520172119140625, -0.03540802001953125, -0.018798828125, -0.00218963623046875, 0.0144195556640625, 0.03102874755859375, 0.047637939453125, 0.06424713134765625, 0.0808563232421875, 0.09746551513671875, 0.11407470703125, 0.13068389892578125, 0.1472930908203125, 0.16390228271484375, 0.180511474609375, 0.19712066650390625, 0.2137298583984375, 0.23033905029296875, 0.2469482421875, 0.26355743408203125, 0.2801666259765625, 0.29677581787109375, 0.313385009765625, 0.32999420166015625, 0.3466033935546875, 0.36321258544921875, 0.37982177734375, 0.39643096923828125, 0.4130401611328125, 0.42964935302734375, 0.446258544921875, 0.46286773681640625, 0.4794769287109375, 0.49608612060546875, 0.5126953125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 8.0, 7.0, 15.0, 28.0, 37.0, 48.0, 85.0, 134.0, 194.0, 339.0, 609.0, 1138.0, 3264.0, 15895.0, 174602.0, 758395.0, 79928.0, 9331.0, 2408.0, 953.0, 482.0, 242.0, 137.0, 93.0, 63.0, 41.0, 25.0, 16.0, 12.0, 9.0, 1.0, 4.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.37890625, -5.2176513671875, -5.056396484375, -4.8951416015625, -4.73388671875, -4.5726318359375, -4.411376953125, -4.2501220703125, -4.0888671875, -3.9276123046875, -3.766357421875, -3.6051025390625, -3.44384765625, -3.2825927734375, -3.121337890625, -2.9600830078125, -2.798828125, -2.6375732421875, -2.476318359375, -2.3150634765625, -2.15380859375, -1.9925537109375, -1.831298828125, -1.6700439453125, -1.5087890625, -1.3475341796875, -1.186279296875, -1.0250244140625, -0.86376953125, -0.7025146484375, -0.541259765625, -0.3800048828125, -0.21875, -0.0574951171875, 0.103759765625, 0.2650146484375, 0.42626953125, 0.5875244140625, 0.748779296875, 0.9100341796875, 1.0712890625, 1.2325439453125, 1.393798828125, 1.5550537109375, 1.71630859375, 1.8775634765625, 2.038818359375, 2.2000732421875, 2.361328125, 2.5225830078125, 2.683837890625, 2.8450927734375, 3.00634765625, 3.1676025390625, 3.328857421875, 3.4901123046875, 3.6513671875, 3.8126220703125, 3.973876953125, 4.1351318359375, 4.29638671875, 4.4576416015625, 4.618896484375, 4.7801513671875, 4.94140625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 7.0, 4.0, 9.0, 4.0, 16.0, 14.0, 18.0, 21.0, 21.0, 31.0, 21.0, 30.0, 39.0, 42.0, 35.0, 38.0, 37.0, 45.0, 48.0, 56.0, 45.0, 46.0, 42.0, 44.0, 38.0, 29.0, 36.0, 32.0, 28.0, 29.0, 20.0, 16.0, 8.0, 10.0, 10.0, 8.0, 7.0, 5.0, 2.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.76953125, -2.6904296875, -2.611328125, -2.5322265625, -2.453125, -2.3740234375, -2.294921875, -2.2158203125, -2.13671875, -2.0576171875, -1.978515625, -1.8994140625, -1.8203125, -1.7412109375, -1.662109375, -1.5830078125, -1.50390625, -1.4248046875, -1.345703125, -1.2666015625, -1.1875, -1.1083984375, -1.029296875, -0.9501953125, -0.87109375, -0.7919921875, -0.712890625, -0.6337890625, -0.5546875, -0.4755859375, -0.396484375, -0.3173828125, -0.23828125, -0.1591796875, -0.080078125, -0.0009765625, 0.078125, 0.1572265625, 0.236328125, 0.3154296875, 0.39453125, 0.4736328125, 0.552734375, 0.6318359375, 0.7109375, 0.7900390625, 0.869140625, 0.9482421875, 1.02734375, 1.1064453125, 1.185546875, 1.2646484375, 1.34375, 1.4228515625, 1.501953125, 1.5810546875, 1.66015625, 1.7392578125, 1.818359375, 1.8974609375, 1.9765625, 2.0556640625, 2.134765625, 2.2138671875, 2.29296875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 5.0, 3.0, 16.0, 17.0, 25.0, 30.0, 52.0, 67.0, 95.0, 151.0, 226.0, 367.0, 664.0, 1364.0, 3536.0, 13889.0, 177650.0, 801436.0, 38072.0, 6501.0, 2106.0, 962.0, 461.0, 303.0, 173.0, 105.0, 82.0, 61.0, 39.0, 30.0, 17.0, 11.0, 12.0, 10.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.728515625, -3.60919189453125, -3.4898681640625, -3.37054443359375, -3.251220703125, -3.13189697265625, -3.0125732421875, -2.89324951171875, -2.77392578125, -2.65460205078125, -2.5352783203125, -2.41595458984375, -2.296630859375, -2.17730712890625, -2.0579833984375, -1.93865966796875, -1.8193359375, -1.70001220703125, -1.5806884765625, -1.46136474609375, -1.342041015625, -1.22271728515625, -1.1033935546875, -0.98406982421875, -0.86474609375, -0.74542236328125, -0.6260986328125, -0.50677490234375, -0.387451171875, -0.26812744140625, -0.1488037109375, -0.02947998046875, 0.08984375, 0.20916748046875, 0.3284912109375, 0.44781494140625, 0.567138671875, 0.68646240234375, 0.8057861328125, 0.92510986328125, 1.04443359375, 1.16375732421875, 1.2830810546875, 1.40240478515625, 1.521728515625, 1.64105224609375, 1.7603759765625, 1.87969970703125, 1.9990234375, 2.11834716796875, 2.2376708984375, 2.35699462890625, 2.476318359375, 2.59564208984375, 2.7149658203125, 2.83428955078125, 2.95361328125, 3.07293701171875, 3.1922607421875, 3.31158447265625, 3.430908203125, 3.55023193359375, 3.6695556640625, 3.78887939453125, 3.908203125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 11.0, 24.0, 60.0, 103.0, 161.0, 201.0, 185.0, 125.0, 68.0, 32.0, 12.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005893707275390625, -0.0005708262324333191, -0.0005522817373275757, -0.0005337372422218323, -0.0005151927471160889, -0.0004966482520103455, -0.00047810375690460205, -0.00045955926179885864, -0.00044101476669311523, -0.0004224702715873718, -0.0004039257764816284, -0.000385381281375885, -0.0003668367862701416, -0.0003482922911643982, -0.0003297477960586548, -0.0003112033009529114, -0.00029265880584716797, -0.00027411431074142456, -0.00025556981563568115, -0.00023702532052993774, -0.00021848082542419434, -0.00019993633031845093, -0.00018139183521270752, -0.0001628473401069641, -0.0001443028450012207, -0.0001257583498954773, -0.00010721385478973389, -8.866935968399048e-05, -7.012486457824707e-05, -5.158036947250366e-05, -3.3035874366760254e-05, -1.4491379261016846e-05, 4.0531158447265625e-06, 2.259761095046997e-05, 4.114210605621338e-05, 5.968660116195679e-05, 7.82310962677002e-05, 9.67755913734436e-05, 0.00011532008647918701, 0.00013386458158493042, 0.00015240907669067383, 0.00017095357179641724, 0.00018949806690216064, 0.00020804256200790405, 0.00022658705711364746, 0.00024513155221939087, 0.0002636760473251343, 0.0002822205424308777, 0.0003007650375366211, 0.0003193095326423645, 0.0003378540277481079, 0.0003563985228538513, 0.0003749430179595947, 0.00039348751306533813, 0.00041203200817108154, 0.00043057650327682495, 0.00044912099838256836, 0.00046766549348831177, 0.0004862099885940552, 0.0005047544836997986, 0.000523298978805542, 0.0005418434739112854, 0.0005603879690170288, 0.0005789324641227722, 0.0005974769592285156]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 7.0, 0.0, 6.0, 5.0, 10.0, 11.0, 17.0, 42.0, 69.0, 176.0, 367.0, 918.0, 2474.0, 12398.0, 670318.0, 348233.0, 9767.0, 2322.0, 779.0, 322.0, 131.0, 61.0, 30.0, 22.0, 13.0, 6.0, 7.0, 7.0, 7.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 4.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.3359375, -5.15771484375, -4.9794921875, -4.80126953125, -4.623046875, -4.44482421875, -4.2666015625, -4.08837890625, -3.91015625, -3.73193359375, -3.5537109375, -3.37548828125, -3.197265625, -3.01904296875, -2.8408203125, -2.66259765625, -2.484375, -2.30615234375, -2.1279296875, -1.94970703125, -1.771484375, -1.59326171875, -1.4150390625, -1.23681640625, -1.05859375, -0.88037109375, -0.7021484375, -0.52392578125, -0.345703125, -0.16748046875, 0.0107421875, 0.18896484375, 0.3671875, 0.54541015625, 0.7236328125, 0.90185546875, 1.080078125, 1.25830078125, 1.4365234375, 1.61474609375, 1.79296875, 1.97119140625, 2.1494140625, 2.32763671875, 2.505859375, 2.68408203125, 2.8623046875, 3.04052734375, 3.21875, 3.39697265625, 3.5751953125, 3.75341796875, 3.931640625, 4.10986328125, 4.2880859375, 4.46630859375, 4.64453125, 4.82275390625, 5.0009765625, 5.17919921875, 5.357421875, 5.53564453125, 5.7138671875, 5.89208984375, 6.0703125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 7.0, 7.0, 13.0, 19.0, 29.0, 47.0, 62.0, 128.0, 197.0, 191.0, 116.0, 59.0, 39.0, 31.0, 23.0, 5.0, 9.0, 8.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.359375, -3.2633056640625, -3.167236328125, -3.0711669921875, -2.97509765625, -2.8790283203125, -2.782958984375, -2.6868896484375, -2.5908203125, -2.4947509765625, -2.398681640625, -2.3026123046875, -2.20654296875, -2.1104736328125, -2.014404296875, -1.9183349609375, -1.822265625, -1.7261962890625, -1.630126953125, -1.5340576171875, -1.43798828125, -1.3419189453125, -1.245849609375, -1.1497802734375, -1.0537109375, -0.9576416015625, -0.861572265625, -0.7655029296875, -0.66943359375, -0.5733642578125, -0.477294921875, -0.3812255859375, -0.28515625, -0.1890869140625, -0.093017578125, 0.0030517578125, 0.09912109375, 0.1951904296875, 0.291259765625, 0.3873291015625, 0.4833984375, 0.5794677734375, 0.675537109375, 0.7716064453125, 0.86767578125, 0.9637451171875, 1.059814453125, 1.1558837890625, 1.251953125, 1.3480224609375, 1.444091796875, 1.5401611328125, 1.63623046875, 1.7322998046875, 1.828369140625, 1.9244384765625, 2.0205078125, 2.1165771484375, 2.212646484375, 2.3087158203125, 2.40478515625, 2.5008544921875, 2.596923828125, 2.6929931640625, 2.7890625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 27.0, 101.0, 263.0, 344.0, 182.0, 61.0, 20.0, 4.0, 6.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.26325988769531, -36.99250411987305, -34.72174835205078, -32.450992584228516, -30.18023681640625, -27.909481048583984, -25.63872528076172, -23.367969512939453, -21.097213745117188, -18.826457977294922, -16.555702209472656, -14.28494644165039, -12.014190673828125, -9.74343490600586, -7.472679138183594, -5.201923370361328, -2.9311676025390625, -0.6604118347167969, 1.6103439331054688, 3.8810997009277344, 6.15185546875, 8.422611236572266, 10.693367004394531, 12.964122772216797, 15.234878540039062, 17.505634307861328, 19.776390075683594, 22.04714584350586, 24.317901611328125, 26.58865737915039, 28.859413146972656, 31.130168914794922, 33.40093231201172, 35.671688079833984, 37.94244384765625, 40.213199615478516, 42.48395538330078, 44.75471115112305, 47.02546691894531, 49.29622268676758, 51.566978454589844, 53.83773422241211, 56.108489990234375, 58.37924575805664, 60.650001525878906, 62.92075729370117, 65.19151306152344, 67.46226501464844, 69.73302459716797, 72.0037841796875, 74.2745361328125, 76.5452880859375, 78.81604766845703, 81.08680725097656, 83.35755920410156, 85.62831115722656, 87.8990707397461, 90.16983032226562, 92.44058227539062, 94.71133422851562, 96.98209381103516, 99.25285339355469, 101.52360534667969, 103.79435729980469, 106.06511688232422]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 2.0, 4.0, 8.0, 9.0, 6.0, 6.0, 18.0, 20.0, 14.0, 27.0, 16.0, 23.0, 28.0, 26.0, 28.0, 32.0, 32.0, 45.0, 40.0, 45.0, 44.0, 39.0, 41.0, 32.0, 40.0, 48.0, 47.0, 46.0, 24.0, 24.0, 21.0, 21.0, 21.0, 26.0, 17.0, 15.0, 9.0, 13.0, 9.0, 12.0, 9.0, 4.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.883413314819336, -12.461821556091309, -12.040229797363281, -11.618638038635254, -11.197046279907227, -10.775455474853516, -10.353863716125488, -9.932271957397461, -9.510680198669434, -9.089088439941406, -8.667496681213379, -8.245904922485352, -7.824313640594482, -7.402721881866455, -6.981130599975586, -6.559538841247559, -6.137947082519531, -5.716355323791504, -5.294763565063477, -4.873172283172607, -4.45158052444458, -4.029988765716553, -3.6083972454071045, -3.1868057250976562, -2.765213966369629, -2.3436222076416016, -1.9220306873321533, -1.5004390478134155, -1.0788474082946777, -0.6572556495666504, -0.23566412925720215, 0.1859273910522461, 0.6075191497802734, 1.0291107892990112, 1.450702428817749, 1.8722940683364868, 2.2938857078552246, 2.715477466583252, 3.1370689868927, 3.5586605072021484, 3.980252265930176, 4.401844024658203, 4.8234357833862305, 5.2450270652771, 5.666618824005127, 6.088210582733154, 6.509801864624023, 6.931393623352051, 7.352985382080078, 7.7745771408081055, 8.196168899536133, 8.61776065826416, 9.039352416992188, 9.460943222045898, 9.882534980773926, 10.304126739501953, 10.72571849822998, 11.147310256958008, 11.568902015686035, 11.990493774414062, 12.412084579467773, 12.833677291870117, 13.255268096923828, 13.676859855651855, 14.098451614379883]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 8.0, 7.0, 5.0, 19.0, 15.0, 41.0, 58.0, 94.0, 92.0, 189.0, 335.0, 474.0, 916.0, 1867.0, 3779.0, 10652.0, 77823.0, 4064420.0, 21815.0, 6132.0, 2625.0, 1293.0, 640.0, 360.0, 229.0, 138.0, 93.0, 53.0, 31.0, 26.0, 15.0, 14.0, 6.0, 9.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.2109375, -7.97796630859375, -7.7449951171875, -7.51202392578125, -7.279052734375, -7.04608154296875, -6.8131103515625, -6.58013916015625, -6.34716796875, -6.11419677734375, -5.8812255859375, -5.64825439453125, -5.415283203125, -5.18231201171875, -4.9493408203125, -4.71636962890625, -4.4833984375, -4.25042724609375, -4.0174560546875, -3.78448486328125, -3.551513671875, -3.31854248046875, -3.0855712890625, -2.85260009765625, -2.61962890625, -2.38665771484375, -2.1536865234375, -1.92071533203125, -1.687744140625, -1.45477294921875, -1.2218017578125, -0.98883056640625, -0.755859375, -0.52288818359375, -0.2899169921875, -0.05694580078125, 0.176025390625, 0.40899658203125, 0.6419677734375, 0.87493896484375, 1.10791015625, 1.34088134765625, 1.5738525390625, 1.80682373046875, 2.039794921875, 2.27276611328125, 2.5057373046875, 2.73870849609375, 2.9716796875, 3.20465087890625, 3.4376220703125, 3.67059326171875, 3.903564453125, 4.13653564453125, 4.3695068359375, 4.60247802734375, 4.83544921875, 5.06842041015625, 5.3013916015625, 5.53436279296875, 5.767333984375, 6.00030517578125, 6.2332763671875, 6.46624755859375, 6.69921875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 6.0, 6.0, 8.0, 14.0, 15.0, 11.0, 16.0, 23.0, 27.0, 35.0, 26.0, 34.0, 34.0, 45.0, 53.0, 49.0, 52.0, 53.0, 49.0, 59.0, 35.0, 47.0, 35.0, 35.0, 34.0, 24.0, 41.0, 24.0, 22.0, 21.0, 13.0, 6.0, 13.0, 15.0, 7.0, 3.0, 3.0, 0.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.53759765625, -0.5212783813476562, -0.5049591064453125, -0.48863983154296875, -0.472320556640625, -0.45600128173828125, -0.4396820068359375, -0.42336273193359375, -0.40704345703125, -0.39072418212890625, -0.3744049072265625, -0.35808563232421875, -0.341766357421875, -0.32544708251953125, -0.3091278076171875, -0.29280853271484375, -0.2764892578125, -0.26016998291015625, -0.2438507080078125, -0.22753143310546875, -0.211212158203125, -0.19489288330078125, -0.1785736083984375, -0.16225433349609375, -0.14593505859375, -0.12961578369140625, -0.1132965087890625, -0.09697723388671875, -0.080657958984375, -0.06433868408203125, -0.0480194091796875, -0.03170013427734375, -0.015380859375, 0.00093841552734375, 0.0172576904296875, 0.03357696533203125, 0.049896240234375, 0.06621551513671875, 0.0825347900390625, 0.09885406494140625, 0.11517333984375, 0.13149261474609375, 0.1478118896484375, 0.16413116455078125, 0.180450439453125, 0.19676971435546875, 0.2130889892578125, 0.22940826416015625, 0.2457275390625, 0.26204681396484375, 0.2783660888671875, 0.29468536376953125, 0.311004638671875, 0.32732391357421875, 0.3436431884765625, 0.35996246337890625, 0.37628173828125, 0.39260101318359375, 0.4089202880859375, 0.42523956298828125, 0.441558837890625, 0.45787811279296875, 0.4741973876953125, 0.49051666259765625, 0.5068359375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 10.0, 6.0, 9.0, 9.0, 11.0, 27.0, 28.0, 33.0, 52.0, 51.0, 93.0, 141.0, 180.0, 301.0, 449.0, 694.0, 1181.0, 1838.0, 3442.0, 6697.0, 16066.0, 80684.0, 4002873.0, 52427.0, 13500.0, 5840.0, 2931.0, 1762.0, 989.0, 620.0, 402.0, 288.0, 199.0, 126.0, 76.0, 69.0, 42.0, 34.0, 30.0, 15.0, 14.0, 8.0, 11.0, 10.0, 9.0, 2.0, 3.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.0703125, -3.93646240234375, -3.8026123046875, -3.66876220703125, -3.534912109375, -3.40106201171875, -3.2672119140625, -3.13336181640625, -2.99951171875, -2.86566162109375, -2.7318115234375, -2.59796142578125, -2.464111328125, -2.33026123046875, -2.1964111328125, -2.06256103515625, -1.9287109375, -1.79486083984375, -1.6610107421875, -1.52716064453125, -1.393310546875, -1.25946044921875, -1.1256103515625, -0.99176025390625, -0.85791015625, -0.72406005859375, -0.5902099609375, -0.45635986328125, -0.322509765625, -0.18865966796875, -0.0548095703125, 0.07904052734375, 0.212890625, 0.34674072265625, 0.4805908203125, 0.61444091796875, 0.748291015625, 0.88214111328125, 1.0159912109375, 1.14984130859375, 1.28369140625, 1.41754150390625, 1.5513916015625, 1.68524169921875, 1.819091796875, 1.95294189453125, 2.0867919921875, 2.22064208984375, 2.3544921875, 2.48834228515625, 2.6221923828125, 2.75604248046875, 2.889892578125, 3.02374267578125, 3.1575927734375, 3.29144287109375, 3.42529296875, 3.55914306640625, 3.6929931640625, 3.82684326171875, 3.960693359375, 4.09454345703125, 4.2283935546875, 4.36224365234375, 4.49609375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 2.0, 3.0, 3.0, 7.0, 13.0, 12.0, 20.0, 28.0, 72.0, 370.0, 3346.0, 103.0, 40.0, 13.0, 10.0, 6.0, 4.0, 2.0, 5.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1748046875, -1.1359100341796875, -1.097015380859375, -1.0581207275390625, -1.01922607421875, -0.9803314208984375, -0.941436767578125, -0.9025421142578125, -0.8636474609375, -0.8247528076171875, -0.785858154296875, -0.7469635009765625, -0.70806884765625, -0.6691741943359375, -0.630279541015625, -0.5913848876953125, -0.552490234375, -0.5135955810546875, -0.474700927734375, -0.4358062744140625, -0.39691162109375, -0.3580169677734375, -0.319122314453125, -0.2802276611328125, -0.2413330078125, -0.2024383544921875, -0.163543701171875, -0.1246490478515625, -0.08575439453125, -0.0468597412109375, -0.007965087890625, 0.0309295654296875, 0.06982421875, 0.1087188720703125, 0.147613525390625, 0.1865081787109375, 0.22540283203125, 0.2642974853515625, 0.303192138671875, 0.3420867919921875, 0.3809814453125, 0.4198760986328125, 0.458770751953125, 0.4976654052734375, 0.53656005859375, 0.5754547119140625, 0.614349365234375, 0.6532440185546875, 0.692138671875, 0.7310333251953125, 0.769927978515625, 0.8088226318359375, 0.84771728515625, 0.8866119384765625, 0.925506591796875, 0.9644012451171875, 1.0032958984375, 1.0421905517578125, 1.081085205078125, 1.1199798583984375, 1.15887451171875, 1.1977691650390625, 1.236663818359375, 1.2755584716796875, 1.314453125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 6.0, 5.0, 3.0, 8.0, 8.0, 9.0, 16.0, 19.0, 27.0, 25.0, 54.0, 76.0, 84.0, 80.0, 93.0, 74.0, 107.0, 88.0, 60.0, 36.0, 35.0, 19.0, 23.0, 15.0, 16.0, 4.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.379238128662109, -4.276650905609131, -4.174063205718994, -4.071475982666016, -3.968888282775879, -3.8663008213043213, -3.7637133598327637, -3.661125898361206, -3.5585384368896484, -3.455950975418091, -3.353363513946533, -3.2507760524749756, -3.148188591003418, -3.0456011295318604, -2.9430136680603027, -2.840426206588745, -2.7378387451171875, -2.63525128364563, -2.5326638221740723, -2.4300763607025146, -2.327488899230957, -2.2249014377593994, -2.122313976287842, -2.019726514816284, -1.9171392917633057, -1.814551830291748, -1.7119643688201904, -1.6093769073486328, -1.5067894458770752, -1.4042019844055176, -1.30161452293396, -1.1990270614624023, -1.0964395999908447, -0.9938521385192871, -0.8912646770477295, -0.7886772155761719, -0.6860897541046143, -0.5835023522377014, -0.4809148907661438, -0.3783274292945862, -0.27573996782302856, -0.17315250635147095, -0.07056505978107452, 0.0320223867893219, 0.13460984826087952, 0.23719727993011475, 0.33978474140167236, 0.44237220287323, 0.5449596643447876, 0.6475471258163452, 0.7501345872879028, 0.8527220487594604, 0.9553095102310181, 1.0578968524932861, 1.1604843139648438, 1.2630717754364014, 1.365659236907959, 1.4682466983795166, 1.5708341598510742, 1.6734216213226318, 1.7760090827941895, 1.878596544265747, 1.9811840057373047, 2.0837714672088623, 2.18635892868042]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 5.0, 5.0, 11.0, 7.0, 11.0, 15.0, 15.0, 13.0, 22.0, 16.0, 32.0, 19.0, 31.0, 37.0, 35.0, 40.0, 32.0, 41.0, 44.0, 33.0, 39.0, 38.0, 42.0, 36.0, 46.0, 20.0, 27.0, 36.0, 24.0, 36.0, 22.0, 33.0, 21.0, 25.0, 19.0, 19.0, 12.0, 2.0, 10.0, 7.0, 5.0, 4.0, 3.0, 4.0, 0.0, 5.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.192915678024292, -2.130833625793457, -2.068751335144043, -2.006669282913208, -1.9445871114730835, -1.882504940032959, -1.820422887802124, -1.7583407163619995, -1.696258544921875, -1.6341763734817505, -1.572094202041626, -1.510012149810791, -1.4479299783706665, -1.385847806930542, -1.323765754699707, -1.2616835832595825, -1.199601411819458, -1.1375192403793335, -1.075437068939209, -1.013355016708374, -0.9512728452682495, -0.889190673828125, -0.8271085619926453, -0.7650264501571655, -0.702944278717041, -0.6408621072769165, -0.5787799954414368, -0.516697883605957, -0.4546157121658325, -0.3925335705280304, -0.33045142889022827, -0.26836928725242615, -0.20628726482391357, -0.14420512318611145, -0.08212298154830933, -0.020040839910507202, 0.04204130172729492, 0.10412344336509705, 0.16620558500289917, 0.2282877266407013, 0.2903698682785034, 0.35245200991630554, 0.41453415155410767, 0.4766162931919098, 0.5386984348297119, 0.6007806062698364, 0.6628627181053162, 0.7249448299407959, 0.7870270013809204, 0.8491091728210449, 0.9111912846565247, 0.9732733964920044, 1.035355567932129, 1.0974377393722534, 1.159519910812378, 1.221601963043213, 1.2836841344833374, 1.345766305923462, 1.4078483581542969, 1.4699305295944214, 1.532012701034546, 1.5940948724746704, 1.656177043914795, 1.7182590961456299, 1.7803412675857544]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 6.0, 10.0, 13.0, 21.0, 22.0, 35.0, 43.0, 85.0, 120.0, 251.0, 340.0, 651.0, 1056.0, 1977.0, 3517.0, 6850.0, 13370.0, 27327.0, 58009.0, 126107.0, 252785.0, 276126.0, 147798.0, 67835.0, 31786.0, 15484.0, 7757.0, 4068.0, 2098.0, 1229.0, 686.0, 392.0, 246.0, 164.0, 93.0, 53.0, 39.0, 29.0, 16.0, 11.0, 16.0, 10.0, 5.0, 2.0, 3.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4189453125, -1.373321533203125, -1.32769775390625, -1.282073974609375, -1.2364501953125, -1.190826416015625, -1.14520263671875, -1.099578857421875, -1.053955078125, -1.008331298828125, -0.96270751953125, -0.917083740234375, -0.8714599609375, -0.825836181640625, -0.78021240234375, -0.734588623046875, -0.68896484375, -0.643341064453125, -0.59771728515625, -0.552093505859375, -0.5064697265625, -0.460845947265625, -0.41522216796875, -0.369598388671875, -0.323974609375, -0.278350830078125, -0.23272705078125, -0.187103271484375, -0.1414794921875, -0.095855712890625, -0.05023193359375, -0.004608154296875, 0.041015625, 0.086639404296875, 0.13226318359375, 0.177886962890625, 0.2235107421875, 0.269134521484375, 0.31475830078125, 0.360382080078125, 0.406005859375, 0.451629638671875, 0.49725341796875, 0.542877197265625, 0.5885009765625, 0.634124755859375, 0.67974853515625, 0.725372314453125, 0.77099609375, 0.816619873046875, 0.86224365234375, 0.907867431640625, 0.9534912109375, 0.999114990234375, 1.04473876953125, 1.090362548828125, 1.135986328125, 1.181610107421875, 1.22723388671875, 1.272857666015625, 1.3184814453125, 1.364105224609375, 1.40972900390625, 1.455352783203125, 1.5009765625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 4.0, 12.0, 10.0, 21.0, 16.0, 23.0, 20.0, 35.0, 32.0, 44.0, 35.0, 54.0, 37.0, 52.0, 41.0, 39.0, 49.0, 38.0, 52.0, 45.0, 36.0, 32.0, 41.0, 33.0, 28.0, 31.0, 22.0, 23.0, 9.0, 16.0, 11.0, 7.0, 7.0, 8.0, 6.0, 5.0, 8.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.568359375, -0.5512161254882812, -0.5340728759765625, -0.5169296264648438, -0.499786376953125, -0.48264312744140625, -0.4654998779296875, -0.44835662841796875, -0.43121337890625, -0.41407012939453125, -0.3969268798828125, -0.37978363037109375, -0.362640380859375, -0.34549713134765625, -0.3283538818359375, -0.31121063232421875, -0.2940673828125, -0.27692413330078125, -0.2597808837890625, -0.24263763427734375, -0.225494384765625, -0.20835113525390625, -0.1912078857421875, -0.17406463623046875, -0.15692138671875, -0.13977813720703125, -0.1226348876953125, -0.10549163818359375, -0.088348388671875, -0.07120513916015625, -0.0540618896484375, -0.03691864013671875, -0.019775390625, -0.00263214111328125, 0.0145111083984375, 0.03165435791015625, 0.048797607421875, 0.06594085693359375, 0.0830841064453125, 0.10022735595703125, 0.11737060546875, 0.13451385498046875, 0.1516571044921875, 0.16880035400390625, 0.185943603515625, 0.20308685302734375, 0.2202301025390625, 0.23737335205078125, 0.2545166015625, 0.27165985107421875, 0.2888031005859375, 0.30594635009765625, 0.323089599609375, 0.34023284912109375, 0.3573760986328125, 0.37451934814453125, 0.39166259765625, 0.40880584716796875, 0.4259490966796875, 0.44309234619140625, 0.460235595703125, 0.47737884521484375, 0.4945220947265625, 0.5116653442382812, 0.52880859375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 6.0, 3.0, 12.0, 14.0, 16.0, 14.0, 22.0, 53.0, 53.0, 81.0, 128.0, 167.0, 272.0, 405.0, 805.0, 1534.0, 4212.0, 21270.0, 266135.0, 688348.0, 52822.0, 7442.0, 2203.0, 1015.0, 536.0, 313.0, 211.0, 151.0, 97.0, 64.0, 58.0, 32.0, 21.0, 17.0, 14.0, 6.0, 5.0, 8.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.99609375, -3.87200927734375, -3.7479248046875, -3.62384033203125, -3.499755859375, -3.37567138671875, -3.2515869140625, -3.12750244140625, -3.00341796875, -2.87933349609375, -2.7552490234375, -2.63116455078125, -2.507080078125, -2.38299560546875, -2.2589111328125, -2.13482666015625, -2.0107421875, -1.88665771484375, -1.7625732421875, -1.63848876953125, -1.514404296875, -1.39031982421875, -1.2662353515625, -1.14215087890625, -1.01806640625, -0.89398193359375, -0.7698974609375, -0.64581298828125, -0.521728515625, -0.39764404296875, -0.2735595703125, -0.14947509765625, -0.025390625, 0.09869384765625, 0.2227783203125, 0.34686279296875, 0.470947265625, 0.59503173828125, 0.7191162109375, 0.84320068359375, 0.96728515625, 1.09136962890625, 1.2154541015625, 1.33953857421875, 1.463623046875, 1.58770751953125, 1.7117919921875, 1.83587646484375, 1.9599609375, 2.08404541015625, 2.2081298828125, 2.33221435546875, 2.456298828125, 2.58038330078125, 2.7044677734375, 2.82855224609375, 2.95263671875, 3.07672119140625, 3.2008056640625, 3.32489013671875, 3.448974609375, 3.57305908203125, 3.6971435546875, 3.82122802734375, 3.9453125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 8.0, 6.0, 4.0, 4.0, 10.0, 7.0, 4.0, 12.0, 16.0, 18.0, 28.0, 33.0, 33.0, 41.0, 32.0, 51.0, 44.0, 44.0, 47.0, 44.0, 52.0, 70.0, 35.0, 43.0, 44.0, 40.0, 37.0, 32.0, 25.0, 22.0, 24.0, 22.0, 20.0, 14.0, 7.0, 14.0, 6.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.982421875, -2.897247314453125, -2.81207275390625, -2.726898193359375, -2.6417236328125, -2.556549072265625, -2.47137451171875, -2.386199951171875, -2.301025390625, -2.215850830078125, -2.13067626953125, -2.045501708984375, -1.9603271484375, -1.875152587890625, -1.78997802734375, -1.704803466796875, -1.61962890625, -1.534454345703125, -1.44927978515625, -1.364105224609375, -1.2789306640625, -1.193756103515625, -1.10858154296875, -1.023406982421875, -0.938232421875, -0.853057861328125, -0.76788330078125, -0.682708740234375, -0.5975341796875, -0.512359619140625, -0.42718505859375, -0.342010498046875, -0.2568359375, -0.171661376953125, -0.08648681640625, -0.001312255859375, 0.0838623046875, 0.169036865234375, 0.25421142578125, 0.339385986328125, 0.424560546875, 0.509735107421875, 0.59490966796875, 0.680084228515625, 0.7652587890625, 0.850433349609375, 0.93560791015625, 1.020782470703125, 1.10595703125, 1.191131591796875, 1.27630615234375, 1.361480712890625, 1.4466552734375, 1.531829833984375, 1.61700439453125, 1.702178955078125, 1.787353515625, 1.872528076171875, 1.95770263671875, 2.042877197265625, 2.1280517578125, 2.213226318359375, 2.29840087890625, 2.383575439453125, 2.46875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 4.0, 9.0, 16.0, 27.0, 31.0, 51.0, 75.0, 141.0, 306.0, 786.0, 3316.0, 29498.0, 887631.0, 117538.0, 6996.0, 1332.0, 388.0, 163.0, 94.0, 51.0, 30.0, 17.0, 12.0, 8.0, 13.0, 5.0, 4.0, 8.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.919921875, -3.800048828125, -3.68017578125, -3.560302734375, -3.4404296875, -3.320556640625, -3.20068359375, -3.080810546875, -2.9609375, -2.841064453125, -2.72119140625, -2.601318359375, -2.4814453125, -2.361572265625, -2.24169921875, -2.121826171875, -2.001953125, -1.882080078125, -1.76220703125, -1.642333984375, -1.5224609375, -1.402587890625, -1.28271484375, -1.162841796875, -1.04296875, -0.923095703125, -0.80322265625, -0.683349609375, -0.5634765625, -0.443603515625, -0.32373046875, -0.203857421875, -0.083984375, 0.035888671875, 0.15576171875, 0.275634765625, 0.3955078125, 0.515380859375, 0.63525390625, 0.755126953125, 0.875, 0.994873046875, 1.11474609375, 1.234619140625, 1.3544921875, 1.474365234375, 1.59423828125, 1.714111328125, 1.833984375, 1.953857421875, 2.07373046875, 2.193603515625, 2.3134765625, 2.433349609375, 2.55322265625, 2.673095703125, 2.79296875, 2.912841796875, 3.03271484375, 3.152587890625, 3.2724609375, 3.392333984375, 3.51220703125, 3.632080078125, 3.751953125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 8.0, 2.0, 7.0, 8.0, 7.0, 15.0, 24.0, 35.0, 29.0, 44.0, 40.0, 90.0, 94.0, 126.0, 118.0, 79.0, 83.0, 42.0, 49.0, 42.0, 20.0, 14.0, 7.0, 6.0, 8.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.0003390312194824219, -0.00033070705831050873, -0.0003223828971385956, -0.00031405873596668243, -0.0003057345747947693, -0.00029741041362285614, -0.000289086252450943, -0.00028076209127902985, -0.0002724379301071167, -0.00026411376893520355, -0.0002557896077632904, -0.00024746544659137726, -0.0002391412854194641, -0.00023081712424755096, -0.00022249296307563782, -0.00021416880190372467, -0.00020584464073181152, -0.00019752047955989838, -0.00018919631838798523, -0.00018087215721607208, -0.00017254799604415894, -0.0001642238348722458, -0.00015589967370033264, -0.0001475755125284195, -0.00013925135135650635, -0.0001309271901845932, -0.00012260302901268005, -0.0001142788678407669, -0.00010595470666885376, -9.763054549694061e-05, -8.930638432502747e-05, -8.098222315311432e-05, -7.265806198120117e-05, -6.433390080928802e-05, -5.600973963737488e-05, -4.768557846546173e-05, -3.9361417293548584e-05, -3.103725612163544e-05, -2.271309494972229e-05, -1.4388933777809143e-05, -6.064772605895996e-06, 2.259388566017151e-06, 1.0583549737930298e-05, 1.8907710909843445e-05, 2.7231872081756592e-05, 3.555603325366974e-05, 4.3880194425582886e-05, 5.220435559749603e-05, 6.052851676940918e-05, 6.885267794132233e-05, 7.717683911323547e-05, 8.550100028514862e-05, 9.382516145706177e-05, 0.00010214932262897491, 0.00011047348380088806, 0.00011879764497280121, 0.00012712180614471436, 0.0001354459673166275, 0.00014377012848854065, 0.0001520942896604538, 0.00016041845083236694, 0.0001687426120042801, 0.00017706677317619324, 0.00018539093434810638, 0.00019371509552001953]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 2.0, 10.0, 8.0, 14.0, 23.0, 45.0, 96.0, 138.0, 326.0, 771.0, 2540.0, 15770.0, 667916.0, 346142.0, 11461.0, 2048.0, 654.0, 291.0, 131.0, 59.0, 36.0, 23.0, 11.0, 12.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.26171875, -3.13592529296875, -3.0101318359375, -2.88433837890625, -2.758544921875, -2.63275146484375, -2.5069580078125, -2.38116455078125, -2.25537109375, -2.12957763671875, -2.0037841796875, -1.87799072265625, -1.752197265625, -1.62640380859375, -1.5006103515625, -1.37481689453125, -1.2490234375, -1.12322998046875, -0.9974365234375, -0.87164306640625, -0.745849609375, -0.62005615234375, -0.4942626953125, -0.36846923828125, -0.24267578125, -0.11688232421875, 0.0089111328125, 0.13470458984375, 0.260498046875, 0.38629150390625, 0.5120849609375, 0.63787841796875, 0.763671875, 0.88946533203125, 1.0152587890625, 1.14105224609375, 1.266845703125, 1.39263916015625, 1.5184326171875, 1.64422607421875, 1.77001953125, 1.89581298828125, 2.0216064453125, 2.14739990234375, 2.273193359375, 2.39898681640625, 2.5247802734375, 2.65057373046875, 2.7763671875, 2.90216064453125, 3.0279541015625, 3.15374755859375, 3.279541015625, 3.40533447265625, 3.5311279296875, 3.65692138671875, 3.78271484375, 3.90850830078125, 4.0343017578125, 4.16009521484375, 4.285888671875, 4.41168212890625, 4.5374755859375, 4.66326904296875, 4.7890625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 6.0, 24.0, 26.0, 35.0, 63.0, 99.0, 138.0, 172.0, 132.0, 127.0, 61.0, 38.0, 31.0, 11.0, 7.0, 8.0, 5.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.630859375, -2.556915283203125, -2.48297119140625, -2.409027099609375, -2.3350830078125, -2.261138916015625, -2.18719482421875, -2.113250732421875, -2.039306640625, -1.965362548828125, -1.89141845703125, -1.817474365234375, -1.7435302734375, -1.669586181640625, -1.59564208984375, -1.521697998046875, -1.44775390625, -1.373809814453125, -1.29986572265625, -1.225921630859375, -1.1519775390625, -1.078033447265625, -1.00408935546875, -0.930145263671875, -0.856201171875, -0.782257080078125, -0.70831298828125, -0.634368896484375, -0.5604248046875, -0.486480712890625, -0.41253662109375, -0.338592529296875, -0.2646484375, -0.190704345703125, -0.11676025390625, -0.042816162109375, 0.0311279296875, 0.105072021484375, 0.17901611328125, 0.252960205078125, 0.326904296875, 0.400848388671875, 0.47479248046875, 0.548736572265625, 0.6226806640625, 0.696624755859375, 0.77056884765625, 0.844512939453125, 0.91845703125, 0.992401123046875, 1.06634521484375, 1.140289306640625, 1.2142333984375, 1.288177490234375, 1.36212158203125, 1.436065673828125, 1.510009765625, 1.583953857421875, 1.65789794921875, 1.731842041015625, 1.8057861328125, 1.879730224609375, 1.95367431640625, 2.027618408203125, 2.1015625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 6.0, 10.0, 13.0, 18.0, 39.0, 60.0, 137.0, 194.0, 213.0, 149.0, 88.0, 39.0, 16.0, 9.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.158658981323242, -22.020191192626953, -20.88172149658203, -19.743253707885742, -18.60478401184082, -17.46631622314453, -16.32784652709961, -15.18937873840332, -14.050909996032715, -12.91244125366211, -11.773972511291504, -10.635503768920898, -9.49703598022461, -8.358566284179688, -7.220098495483398, -6.081629753112793, -4.9431610107421875, -3.804692268371582, -2.6662237644195557, -1.5277552604675293, -0.38928651809692383, 0.7491822242736816, 1.887650489807129, 3.0261192321777344, 4.16458797454834, 5.303056716918945, 6.441525459289551, 7.579993724822998, 8.718461990356445, 9.856931686401367, 10.995399475097656, 12.133868217468262, 13.272335052490234, 14.41080379486084, 15.549272537231445, 16.687740325927734, 17.826210021972656, 18.964677810668945, 20.103145599365234, 21.241615295410156, 22.380084991455078, 23.518552780151367, 24.65702247619629, 25.795490264892578, 26.9339599609375, 28.07242774963379, 29.210895538330078, 30.349365234375, 31.48783302307129, 32.62630081176758, 33.7647705078125, 34.90324020385742, 36.04170608520508, 37.18017578125, 38.31864547729492, 39.457115173339844, 40.5955810546875, 41.73405075073242, 42.87251663208008, 44.010986328125, 45.14945602416992, 46.287925720214844, 47.4263916015625, 48.56486129760742, 49.703330993652344]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 5.0, 4.0, 6.0, 9.0, 7.0, 7.0, 13.0, 18.0, 14.0, 26.0, 18.0, 27.0, 25.0, 27.0, 39.0, 34.0, 44.0, 48.0, 38.0, 53.0, 55.0, 50.0, 51.0, 61.0, 43.0, 37.0, 39.0, 34.0, 34.0, 22.0, 29.0, 23.0, 11.0, 11.0, 10.0, 10.0, 9.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.63257122039795, -12.218700408935547, -11.804828643798828, -11.39095687866211, -10.977086067199707, -10.563215255737305, -10.149343490600586, -9.735471725463867, -9.321600914001465, -8.907730102539062, -8.493858337402344, -8.079986572265625, -7.666115760803223, -7.252244472503662, -6.838373184204102, -6.424501895904541, -6.0106306076049805, -5.59675931930542, -5.182888031005859, -4.769016742706299, -4.355145454406738, -3.9412741661071777, -3.527402877807617, -3.1135315895080566, -2.699660301208496, -2.2857890129089355, -1.871917724609375, -1.4580464363098145, -1.044175148010254, -0.6303038597106934, -0.2164325714111328, 0.19743871688842773, 0.6113090515136719, 1.0251803398132324, 1.439051628112793, 1.8529229164123535, 2.266794204711914, 2.6806654930114746, 3.094536781311035, 3.5084080696105957, 3.9222793579101562, 4.336150646209717, 4.750021934509277, 5.163893222808838, 5.577764511108398, 5.991635799407959, 6.4055070877075195, 6.81937837600708, 7.233249664306641, 7.647120952606201, 8.060992240905762, 8.474863052368164, 8.888734817504883, 9.302606582641602, 9.716477394104004, 10.130348205566406, 10.544219970703125, 10.958091735839844, 11.371962547302246, 11.785833358764648, 12.199705123901367, 12.613576889038086, 13.027447700500488, 13.44131851196289, 13.85519027709961]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 8.0, 11.0, 10.0, 15.0, 28.0, 24.0, 33.0, 47.0, 69.0, 86.0, 112.0, 187.0, 495.0, 1142.0, 4130.0, 47233.0, 4129711.0, 7726.0, 1886.0, 580.0, 257.0, 140.0, 99.0, 70.0, 47.0, 40.0, 30.0, 23.0, 10.0, 11.0, 9.0, 5.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.6328125, -10.3123779296875, -9.991943359375, -9.6715087890625, -9.35107421875, -9.0306396484375, -8.710205078125, -8.3897705078125, -8.0693359375, -7.7489013671875, -7.428466796875, -7.1080322265625, -6.78759765625, -6.4671630859375, -6.146728515625, -5.8262939453125, -5.505859375, -5.1854248046875, -4.864990234375, -4.5445556640625, -4.22412109375, -3.9036865234375, -3.583251953125, -3.2628173828125, -2.9423828125, -2.6219482421875, -2.301513671875, -1.9810791015625, -1.66064453125, -1.3402099609375, -1.019775390625, -0.6993408203125, -0.37890625, -0.0584716796875, 0.261962890625, 0.5823974609375, 0.90283203125, 1.2232666015625, 1.543701171875, 1.8641357421875, 2.1845703125, 2.5050048828125, 2.825439453125, 3.1458740234375, 3.46630859375, 3.7867431640625, 4.107177734375, 4.4276123046875, 4.748046875, 5.0684814453125, 5.388916015625, 5.7093505859375, 6.02978515625, 6.3502197265625, 6.670654296875, 6.9910888671875, 7.3115234375, 7.6319580078125, 7.952392578125, 8.2728271484375, 8.59326171875, 8.9136962890625, 9.234130859375, 9.5545654296875, 9.875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 8.0, 6.0, 5.0, 10.0, 14.0, 24.0, 30.0, 28.0, 58.0, 56.0, 62.0, 63.0, 67.0, 66.0, 69.0, 87.0, 64.0, 58.0, 51.0, 46.0, 25.0, 28.0, 18.0, 16.0, 13.0, 13.0, 8.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59423828125, -0.5672988891601562, -0.5403594970703125, -0.5134201049804688, -0.486480712890625, -0.45954132080078125, -0.4326019287109375, -0.40566253662109375, -0.37872314453125, -0.35178375244140625, -0.3248443603515625, -0.29790496826171875, -0.270965576171875, -0.24402618408203125, -0.2170867919921875, -0.19014739990234375, -0.1632080078125, -0.13626861572265625, -0.1093292236328125, -0.08238983154296875, -0.055450439453125, -0.02851104736328125, -0.0015716552734375, 0.02536773681640625, 0.05230712890625, 0.07924652099609375, 0.1061859130859375, 0.13312530517578125, 0.160064697265625, 0.18700408935546875, 0.2139434814453125, 0.24088287353515625, 0.267822265625, 0.29476165771484375, 0.3217010498046875, 0.34864044189453125, 0.375579833984375, 0.40251922607421875, 0.4294586181640625, 0.45639801025390625, 0.48333740234375, 0.5102767944335938, 0.5372161865234375, 0.5641555786132812, 0.591094970703125, 0.6180343627929688, 0.6449737548828125, 0.6719131469726562, 0.6988525390625, 0.7257919311523438, 0.7527313232421875, 0.7796707153320312, 0.806610107421875, 0.8335494995117188, 0.8604888916015625, 0.8874282836914062, 0.91436767578125, 0.9413070678710938, 0.9682464599609375, 0.9951858520507812, 1.022125244140625, 1.0490646362304688, 1.0760040283203125, 1.1029434204101562, 1.1298828125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 6.0, 6.0, 7.0, 7.0, 17.0, 20.0, 21.0, 25.0, 39.0, 55.0, 62.0, 105.0, 128.0, 169.0, 314.0, 539.0, 888.0, 2122.0, 7279.0, 4065497.0, 107636.0, 5350.0, 1740.0, 820.0, 469.0, 295.0, 198.0, 131.0, 102.0, 43.0, 46.0, 29.0, 21.0, 16.0, 20.0, 12.0, 11.0, 7.0, 5.0, 7.0, 3.0, 5.0, 3.0, 2.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.97265625, -7.72271728515625, -7.4727783203125, -7.22283935546875, -6.972900390625, -6.72296142578125, -6.4730224609375, -6.22308349609375, -5.97314453125, -5.72320556640625, -5.4732666015625, -5.22332763671875, -4.973388671875, -4.72344970703125, -4.4735107421875, -4.22357177734375, -3.9736328125, -3.72369384765625, -3.4737548828125, -3.22381591796875, -2.973876953125, -2.72393798828125, -2.4739990234375, -2.22406005859375, -1.97412109375, -1.72418212890625, -1.4742431640625, -1.22430419921875, -0.974365234375, -0.72442626953125, -0.4744873046875, -0.22454833984375, 0.025390625, 0.27532958984375, 0.5252685546875, 0.77520751953125, 1.025146484375, 1.27508544921875, 1.5250244140625, 1.77496337890625, 2.02490234375, 2.27484130859375, 2.5247802734375, 2.77471923828125, 3.024658203125, 3.27459716796875, 3.5245361328125, 3.77447509765625, 4.0244140625, 4.27435302734375, 4.5242919921875, 4.77423095703125, 5.024169921875, 5.27410888671875, 5.5240478515625, 5.77398681640625, 6.02392578125, 6.27386474609375, 6.5238037109375, 6.77374267578125, 7.023681640625, 7.27362060546875, 7.5235595703125, 7.77349853515625, 8.0234375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 23.0, 113.0, 3812.0, 73.0, 23.0, 12.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.337890625, -1.28302001953125, -1.2281494140625, -1.17327880859375, -1.118408203125, -1.06353759765625, -1.0086669921875, -0.95379638671875, -0.89892578125, -0.84405517578125, -0.7891845703125, -0.73431396484375, -0.679443359375, -0.62457275390625, -0.5697021484375, -0.51483154296875, -0.4599609375, -0.40509033203125, -0.3502197265625, -0.29534912109375, -0.240478515625, -0.18560791015625, -0.1307373046875, -0.07586669921875, -0.02099609375, 0.03387451171875, 0.0887451171875, 0.14361572265625, 0.198486328125, 0.25335693359375, 0.3082275390625, 0.36309814453125, 0.41796875, 0.47283935546875, 0.5277099609375, 0.58258056640625, 0.637451171875, 0.69232177734375, 0.7471923828125, 0.80206298828125, 0.85693359375, 0.91180419921875, 0.9666748046875, 1.02154541015625, 1.076416015625, 1.13128662109375, 1.1861572265625, 1.24102783203125, 1.2958984375, 1.35076904296875, 1.4056396484375, 1.46051025390625, 1.515380859375, 1.57025146484375, 1.6251220703125, 1.67999267578125, 1.73486328125, 1.78973388671875, 1.8446044921875, 1.89947509765625, 1.954345703125, 2.00921630859375, 2.0640869140625, 2.11895751953125, 2.173828125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 9.0, 14.0, 18.0, 19.0, 42.0, 45.0, 71.0, 76.0, 96.0, 93.0, 110.0, 95.0, 65.0, 54.0, 31.0, 31.0, 28.0, 24.0, 16.0, 15.0, 6.0, 11.0, 4.0, 2.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.1812069416046143, -3.089060068130493, -2.996913194656372, -2.904766321182251, -2.81261944770813, -2.720472574234009, -2.6283257007598877, -2.5361788272857666, -2.4440319538116455, -2.3518850803375244, -2.2597382068634033, -2.1675913333892822, -2.075444459915161, -1.98329758644104, -1.891150712966919, -1.7990038394927979, -1.7068569660186768, -1.6147100925445557, -1.5225632190704346, -1.4304163455963135, -1.3382694721221924, -1.2461225986480713, -1.1539757251739502, -1.061828851699829, -0.969681978225708, -0.8775351047515869, -0.7853882312774658, -0.6932413578033447, -0.6010944843292236, -0.5089476108551025, -0.41680073738098145, -0.32465386390686035, -0.23250722885131836, -0.14036035537719727, -0.04821348190307617, 0.04393339157104492, 0.13608026504516602, 0.2282271385192871, 0.3203740119934082, 0.4125208854675293, 0.5046677589416504, 0.5968146324157715, 0.6889615058898926, 0.7811083793640137, 0.8732552528381348, 0.9654021263122559, 1.057548999786377, 1.149695873260498, 1.2418427467346191, 1.3339896202087402, 1.4261364936828613, 1.5182833671569824, 1.6104302406311035, 1.7025771141052246, 1.7947239875793457, 1.8868708610534668, 1.979017734527588, 2.071164608001709, 2.16331148147583, 2.255458354949951, 2.3476052284240723, 2.4397521018981934, 2.5318989753723145, 2.6240458488464355, 2.7161927223205566]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 5.0, 4.0, 9.0, 7.0, 11.0, 13.0, 17.0, 19.0, 24.0, 22.0, 28.0, 25.0, 32.0, 38.0, 45.0, 36.0, 42.0, 41.0, 42.0, 40.0, 28.0, 32.0, 29.0, 44.0, 35.0, 38.0, 40.0, 26.0, 21.0, 30.0, 23.0, 20.0, 22.0, 18.0, 20.0, 13.0, 18.0, 10.0, 3.0, 10.0, 6.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.8112003803253174, -1.7545509338378906, -1.6979014873504639, -1.6412521600723267, -1.5846027135849, -1.5279532670974731, -1.471303939819336, -1.4146544933319092, -1.3580050468444824, -1.3013556003570557, -1.244706153869629, -1.1880568265914917, -1.131407380104065, -1.0747579336166382, -1.018108606338501, -0.9614591598510742, -0.9048097133636475, -0.8481602668762207, -0.7915108799934387, -0.7348614931106567, -0.67821204662323, -0.6215626001358032, -0.5649132132530212, -0.5082638263702393, -0.4516143798828125, -0.39496496319770813, -0.33831554651260376, -0.2816661298274994, -0.22501671314239502, -0.16836729645729065, -0.11171787977218628, -0.05506846308708191, 0.001580953598022461, 0.05823037028312683, 0.1148797869682312, 0.17152920365333557, 0.22817862033843994, 0.2848280370235443, 0.3414774537086487, 0.39812687039375305, 0.4547762870788574, 0.5114257335662842, 0.5680751204490662, 0.6247245073318481, 0.6813739538192749, 0.7380234003067017, 0.7946727871894836, 0.8513221740722656, 0.9079716205596924, 0.9646210670471191, 1.021270513534546, 1.077919840812683, 1.1345692873001099, 1.1912187337875366, 1.2478680610656738, 1.3045175075531006, 1.3611669540405273, 1.417816400527954, 1.4744658470153809, 1.531115174293518, 1.5877646207809448, 1.6444140672683716, 1.7010633945465088, 1.7577128410339355, 1.8143622875213623]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 7.0, 8.0, 8.0, 13.0, 22.0, 27.0, 72.0, 121.0, 214.0, 445.0, 913.0, 2011.0, 5254.0, 16577.0, 67536.0, 337299.0, 484041.0, 98872.0, 23450.0, 6800.0, 2569.0, 1128.0, 499.0, 294.0, 169.0, 72.0, 46.0, 33.0, 12.0, 20.0, 7.0, 7.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.580078125, -2.4971923828125, -2.414306640625, -2.3314208984375, -2.24853515625, -2.1656494140625, -2.082763671875, -1.9998779296875, -1.9169921875, -1.8341064453125, -1.751220703125, -1.6683349609375, -1.58544921875, -1.5025634765625, -1.419677734375, -1.3367919921875, -1.25390625, -1.1710205078125, -1.088134765625, -1.0052490234375, -0.92236328125, -0.8394775390625, -0.756591796875, -0.6737060546875, -0.5908203125, -0.5079345703125, -0.425048828125, -0.3421630859375, -0.25927734375, -0.1763916015625, -0.093505859375, -0.0106201171875, 0.072265625, 0.1551513671875, 0.238037109375, 0.3209228515625, 0.40380859375, 0.4866943359375, 0.569580078125, 0.6524658203125, 0.7353515625, 0.8182373046875, 0.901123046875, 0.9840087890625, 1.06689453125, 1.1497802734375, 1.232666015625, 1.3155517578125, 1.3984375, 1.4813232421875, 1.564208984375, 1.6470947265625, 1.72998046875, 1.8128662109375, 1.895751953125, 1.9786376953125, 2.0615234375, 2.1444091796875, 2.227294921875, 2.3101806640625, 2.39306640625, 2.4759521484375, 2.558837890625, 2.6417236328125, 2.724609375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 2.0, 6.0, 11.0, 14.0, 13.0, 17.0, 24.0, 41.0, 48.0, 39.0, 63.0, 67.0, 67.0, 62.0, 76.0, 81.0, 75.0, 52.0, 41.0, 47.0, 33.0, 32.0, 19.0, 23.0, 16.0, 6.0, 9.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58203125, -0.553314208984375, -0.52459716796875, -0.495880126953125, -0.4671630859375, -0.438446044921875, -0.40972900390625, -0.381011962890625, -0.352294921875, -0.323577880859375, -0.29486083984375, -0.266143798828125, -0.2374267578125, -0.208709716796875, -0.17999267578125, -0.151275634765625, -0.12255859375, -0.093841552734375, -0.06512451171875, -0.036407470703125, -0.0076904296875, 0.021026611328125, 0.04974365234375, 0.078460693359375, 0.107177734375, 0.135894775390625, 0.16461181640625, 0.193328857421875, 0.2220458984375, 0.250762939453125, 0.27947998046875, 0.308197021484375, 0.3369140625, 0.365631103515625, 0.39434814453125, 0.423065185546875, 0.4517822265625, 0.480499267578125, 0.50921630859375, 0.537933349609375, 0.566650390625, 0.595367431640625, 0.62408447265625, 0.652801513671875, 0.6815185546875, 0.710235595703125, 0.73895263671875, 0.767669677734375, 0.79638671875, 0.825103759765625, 0.85382080078125, 0.882537841796875, 0.9112548828125, 0.939971923828125, 0.96868896484375, 0.997406005859375, 1.026123046875, 1.054840087890625, 1.08355712890625, 1.112274169921875, 1.1409912109375, 1.169708251953125, 1.19842529296875, 1.227142333984375, 1.255859375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 7.0, 8.0, 11.0, 22.0, 21.0, 18.0, 27.0, 49.0, 41.0, 93.0, 99.0, 144.0, 175.0, 229.0, 320.0, 554.0, 914.0, 1683.0, 4357.0, 16305.0, 106430.0, 734049.0, 152354.0, 20838.0, 4920.0, 1911.0, 953.0, 584.0, 410.0, 265.0, 183.0, 142.0, 122.0, 81.0, 61.0, 35.0, 30.0, 30.0, 24.0, 15.0, 9.0, 9.0, 4.0, 1.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.87109375, -2.788055419921875, -2.70501708984375, -2.621978759765625, -2.5389404296875, -2.455902099609375, -2.37286376953125, -2.289825439453125, -2.206787109375, -2.123748779296875, -2.04071044921875, -1.957672119140625, -1.8746337890625, -1.791595458984375, -1.70855712890625, -1.625518798828125, -1.54248046875, -1.459442138671875, -1.37640380859375, -1.293365478515625, -1.2103271484375, -1.127288818359375, -1.04425048828125, -0.961212158203125, -0.878173828125, -0.795135498046875, -0.71209716796875, -0.629058837890625, -0.5460205078125, -0.462982177734375, -0.37994384765625, -0.296905517578125, -0.2138671875, -0.130828857421875, -0.04779052734375, 0.035247802734375, 0.1182861328125, 0.201324462890625, 0.28436279296875, 0.367401123046875, 0.450439453125, 0.533477783203125, 0.61651611328125, 0.699554443359375, 0.7825927734375, 0.865631103515625, 0.94866943359375, 1.031707763671875, 1.11474609375, 1.197784423828125, 1.28082275390625, 1.363861083984375, 1.4468994140625, 1.529937744140625, 1.61297607421875, 1.696014404296875, 1.779052734375, 1.862091064453125, 1.94512939453125, 2.028167724609375, 2.1112060546875, 2.194244384765625, 2.27728271484375, 2.360321044921875, 2.443359375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 1.0, 13.0, 7.0, 22.0, 16.0, 21.0, 23.0, 21.0, 24.0, 40.0, 38.0, 34.0, 27.0, 38.0, 54.0, 57.0, 44.0, 54.0, 39.0, 52.0, 47.0, 51.0, 46.0, 34.0, 40.0, 29.0, 21.0, 15.0, 18.0, 14.0, 10.0, 12.0, 6.0, 6.0, 7.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.6953125, -3.59417724609375, -3.4930419921875, -3.39190673828125, -3.290771484375, -3.18963623046875, -3.0885009765625, -2.98736572265625, -2.88623046875, -2.78509521484375, -2.6839599609375, -2.58282470703125, -2.481689453125, -2.38055419921875, -2.2794189453125, -2.17828369140625, -2.0771484375, -1.97601318359375, -1.8748779296875, -1.77374267578125, -1.672607421875, -1.57147216796875, -1.4703369140625, -1.36920166015625, -1.26806640625, -1.16693115234375, -1.0657958984375, -0.96466064453125, -0.863525390625, -0.76239013671875, -0.6612548828125, -0.56011962890625, -0.458984375, -0.35784912109375, -0.2567138671875, -0.15557861328125, -0.054443359375, 0.04669189453125, 0.1478271484375, 0.24896240234375, 0.35009765625, 0.45123291015625, 0.5523681640625, 0.65350341796875, 0.754638671875, 0.85577392578125, 0.9569091796875, 1.05804443359375, 1.1591796875, 1.26031494140625, 1.3614501953125, 1.46258544921875, 1.563720703125, 1.66485595703125, 1.7659912109375, 1.86712646484375, 1.96826171875, 2.06939697265625, 2.1705322265625, 2.27166748046875, 2.372802734375, 2.47393798828125, 2.5750732421875, 2.67620849609375, 2.77734375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 6.0, 9.0, 8.0, 11.0, 13.0, 22.0, 36.0, 46.0, 48.0, 140.0, 213.0, 517.0, 1185.0, 3870.0, 26776.0, 735623.0, 261634.0, 14068.0, 2575.0, 843.0, 388.0, 203.0, 122.0, 60.0, 51.0, 21.0, 22.0, 11.0, 9.0, 4.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-3.294921875, -3.2078857421875, -3.120849609375, -3.0338134765625, -2.94677734375, -2.8597412109375, -2.772705078125, -2.6856689453125, -2.5986328125, -2.5115966796875, -2.424560546875, -2.3375244140625, -2.25048828125, -2.1634521484375, -2.076416015625, -1.9893798828125, -1.90234375, -1.8153076171875, -1.728271484375, -1.6412353515625, -1.55419921875, -1.4671630859375, -1.380126953125, -1.2930908203125, -1.2060546875, -1.1190185546875, -1.031982421875, -0.9449462890625, -0.85791015625, -0.7708740234375, -0.683837890625, -0.5968017578125, -0.509765625, -0.4227294921875, -0.335693359375, -0.2486572265625, -0.16162109375, -0.0745849609375, 0.012451171875, 0.0994873046875, 0.1865234375, 0.2735595703125, 0.360595703125, 0.4476318359375, 0.53466796875, 0.6217041015625, 0.708740234375, 0.7957763671875, 0.8828125, 0.9698486328125, 1.056884765625, 1.1439208984375, 1.23095703125, 1.3179931640625, 1.405029296875, 1.4920654296875, 1.5791015625, 1.6661376953125, 1.753173828125, 1.8402099609375, 1.92724609375, 2.0142822265625, 2.101318359375, 2.1883544921875, 2.275390625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 7.0, 4.0, 8.0, 8.0, 14.0, 25.0, 28.0, 24.0, 28.0, 59.0, 45.0, 59.0, 92.0, 93.0, 98.0, 80.0, 51.0, 51.0, 33.0, 40.0, 22.0, 32.0, 19.0, 20.0, 10.0, 12.0, 13.0, 5.0, 4.0, 0.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001468658447265625, -0.00014121830463409424, -0.00013557076454162598, -0.00012992322444915771, -0.00012427568435668945, -0.00011862814426422119, -0.00011298060417175293, -0.00010733306407928467, -0.0001016855239868164, -9.603798389434814e-05, -9.039044380187988e-05, -8.474290370941162e-05, -7.909536361694336e-05, -7.34478235244751e-05, -6.780028343200684e-05, -6.215274333953857e-05, -5.650520324707031e-05, -5.085766315460205e-05, -4.521012306213379e-05, -3.956258296966553e-05, -3.3915042877197266e-05, -2.8267502784729004e-05, -2.2619962692260742e-05, -1.697242259979248e-05, -1.1324882507324219e-05, -5.677342414855957e-06, -2.9802322387695312e-08, 5.617737770080566e-06, 1.1265277862548828e-05, 1.691281795501709e-05, 2.256035804748535e-05, 2.8207898139953613e-05, 3.3855438232421875e-05, 3.950297832489014e-05, 4.51505184173584e-05, 5.079805850982666e-05, 5.644559860229492e-05, 6.209313869476318e-05, 6.774067878723145e-05, 7.338821887969971e-05, 7.903575897216797e-05, 8.468329906463623e-05, 9.033083915710449e-05, 9.597837924957275e-05, 0.00010162591934204102, 0.00010727345943450928, 0.00011292099952697754, 0.0001185685396194458, 0.00012421607971191406, 0.00012986361980438232, 0.00013551115989685059, 0.00014115869998931885, 0.0001468062400817871, 0.00015245378017425537, 0.00015810132026672363, 0.0001637488603591919, 0.00016939640045166016, 0.00017504394054412842, 0.00018069148063659668, 0.00018633902072906494, 0.0001919865608215332, 0.00019763410091400146, 0.00020328164100646973, 0.000208929181098938, 0.00021457672119140625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 10.0, 12.0, 25.0, 33.0, 52.0, 83.0, 161.0, 304.0, 713.0, 1876.0, 7490.0, 68639.0, 872459.0, 84695.0, 8417.0, 2099.0, 749.0, 319.0, 169.0, 82.0, 67.0, 38.0, 14.0, 9.0, 12.0, 9.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.556640625, -3.461883544921875, -3.36712646484375, -3.272369384765625, -3.1776123046875, -3.082855224609375, -2.98809814453125, -2.893341064453125, -2.798583984375, -2.703826904296875, -2.60906982421875, -2.514312744140625, -2.4195556640625, -2.324798583984375, -2.23004150390625, -2.135284423828125, -2.04052734375, -1.945770263671875, -1.85101318359375, -1.756256103515625, -1.6614990234375, -1.566741943359375, -1.47198486328125, -1.377227783203125, -1.282470703125, -1.187713623046875, -1.09295654296875, -0.998199462890625, -0.9034423828125, -0.808685302734375, -0.71392822265625, -0.619171142578125, -0.5244140625, -0.429656982421875, -0.33489990234375, -0.240142822265625, -0.1453857421875, -0.050628662109375, 0.04412841796875, 0.138885498046875, 0.233642578125, 0.328399658203125, 0.42315673828125, 0.517913818359375, 0.6126708984375, 0.707427978515625, 0.80218505859375, 0.896942138671875, 0.99169921875, 1.086456298828125, 1.18121337890625, 1.275970458984375, 1.3707275390625, 1.465484619140625, 1.56024169921875, 1.654998779296875, 1.749755859375, 1.844512939453125, 1.93927001953125, 2.034027099609375, 2.1287841796875, 2.223541259765625, 2.31829833984375, 2.413055419921875, 2.5078125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 7.0, 11.0, 26.0, 19.0, 31.0, 46.0, 76.0, 99.0, 117.0, 130.0, 129.0, 95.0, 51.0, 42.0, 33.0, 33.0, 16.0, 9.0, 9.0, 8.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.48828125, -1.42510986328125, -1.3619384765625, -1.29876708984375, -1.235595703125, -1.17242431640625, -1.1092529296875, -1.04608154296875, -0.98291015625, -0.91973876953125, -0.8565673828125, -0.79339599609375, -0.730224609375, -0.66705322265625, -0.6038818359375, -0.54071044921875, -0.4775390625, -0.41436767578125, -0.3511962890625, -0.28802490234375, -0.224853515625, -0.16168212890625, -0.0985107421875, -0.03533935546875, 0.02783203125, 0.09100341796875, 0.1541748046875, 0.21734619140625, 0.280517578125, 0.34368896484375, 0.4068603515625, 0.47003173828125, 0.533203125, 0.59637451171875, 0.6595458984375, 0.72271728515625, 0.785888671875, 0.84906005859375, 0.9122314453125, 0.97540283203125, 1.03857421875, 1.10174560546875, 1.1649169921875, 1.22808837890625, 1.291259765625, 1.35443115234375, 1.4176025390625, 1.48077392578125, 1.5439453125, 1.60711669921875, 1.6702880859375, 1.73345947265625, 1.796630859375, 1.85980224609375, 1.9229736328125, 1.98614501953125, 2.04931640625, 2.11248779296875, 2.1756591796875, 2.23883056640625, 2.302001953125, 2.36517333984375, 2.4283447265625, 2.49151611328125, 2.5546875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 12.0, 39.0, 177.0, 469.0, 256.0, 44.0, 9.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.21088790893555, -45.74945068359375, -43.28800964355469, -40.82657241821289, -38.365135192871094, -35.90369415283203, -33.442256927490234, -30.980819702148438, -28.519380569458008, -26.057941436767578, -23.59650421142578, -21.13506507873535, -18.673625946044922, -16.212188720703125, -13.750749588012695, -11.289312362670898, -8.827873229980469, -6.3664350509643555, -3.904996395111084, -1.4435577392578125, 1.0178804397583008, 3.479318618774414, 5.940757751464844, 8.40219497680664, 10.86363410949707, 13.325072288513184, 15.786510467529297, 18.247949600219727, 20.709388732910156, 23.170825958251953, 25.632265090942383, 28.09370231628418, 30.555137634277344, 33.01657485961914, 35.4780158996582, 37.939453125, 40.4008903503418, 42.862327575683594, 45.323768615722656, 47.78520584106445, 50.24664306640625, 52.70808029174805, 55.16952133178711, 57.630958557128906, 60.0923957824707, 62.5538330078125, 65.01527404785156, 67.47671508789062, 69.93815612792969, 72.39959716796875, 74.86103057861328, 77.32247161865234, 79.7839126586914, 82.24534606933594, 84.706787109375, 87.16822814941406, 89.6296615600586, 92.09110260009766, 94.55253601074219, 97.01397705078125, 99.47541809082031, 101.93685150146484, 104.3982925415039, 106.85972595214844, 109.3211669921875]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 6.0, 6.0, 9.0, 3.0, 5.0, 17.0, 13.0, 18.0, 18.0, 24.0, 21.0, 32.0, 29.0, 44.0, 37.0, 41.0, 42.0, 48.0, 53.0, 56.0, 45.0, 54.0, 46.0, 56.0, 41.0, 38.0, 24.0, 31.0, 19.0, 22.0, 18.0, 20.0, 9.0, 11.0, 9.0, 6.0, 10.0, 5.0, 6.0, 8.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.600112915039062, -14.154204368591309, -13.708295822143555, -13.2623872756958, -12.816478729248047, -12.370570182800293, -11.924661636352539, -11.478754043579102, -11.032844543457031, -10.586935997009277, -10.141027450561523, -9.69511890411377, -9.249210357666016, -8.803301811218262, -8.357393264770508, -7.911485195159912, -7.465577125549316, -7.0196685791015625, -6.573760032653809, -6.127851486206055, -5.681942939758301, -5.236034393310547, -4.790126323699951, -4.344217777252197, -3.8983092308044434, -3.4524006843566895, -3.0064921379089355, -2.5605838298797607, -2.114675283432007, -1.668766736984253, -1.2228584289550781, -0.7769498825073242, -0.3310422897338867, 0.11486619710922241, 0.5607746839523315, 1.006683111190796, 1.4525916576385498, 1.8985002040863037, 2.3444085121154785, 2.7903170585632324, 3.2362256050109863, 3.6821341514587402, 4.128042697906494, 4.57395076751709, 5.019859313964844, 5.465767860412598, 5.911676406860352, 6.3575849533081055, 6.803493499755859, 7.249402046203613, 7.695310592651367, 8.141219139099121, 8.587127685546875, 9.033036231994629, 9.478944778442383, 9.92485237121582, 10.37076187133789, 10.816670417785645, 11.262578964233398, 11.708487510681152, 12.154396057128906, 12.60030460357666, 13.046213150024414, 13.492120742797852, 13.938029289245605]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 5.0, 8.0, 10.0, 16.0, 14.0, 31.0, 45.0, 67.0, 92.0, 131.0, 163.0, 258.0, 465.0, 806.0, 1519.0, 3606.0, 10724.0, 171657.0, 3981052.0, 15035.0, 4362.0, 1832.0, 901.0, 512.0, 290.0, 204.0, 117.0, 100.0, 62.0, 49.0, 41.0, 25.0, 18.0, 20.0, 9.0, 10.0, 11.0, 2.0, 6.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.73828125, -6.5284423828125, -6.318603515625, -6.1087646484375, -5.89892578125, -5.6890869140625, -5.479248046875, -5.2694091796875, -5.0595703125, -4.8497314453125, -4.639892578125, -4.4300537109375, -4.22021484375, -4.0103759765625, -3.800537109375, -3.5906982421875, -3.380859375, -3.1710205078125, -2.961181640625, -2.7513427734375, -2.54150390625, -2.3316650390625, -2.121826171875, -1.9119873046875, -1.7021484375, -1.4923095703125, -1.282470703125, -1.0726318359375, -0.86279296875, -0.6529541015625, -0.443115234375, -0.2332763671875, -0.0234375, 0.1864013671875, 0.396240234375, 0.6060791015625, 0.81591796875, 1.0257568359375, 1.235595703125, 1.4454345703125, 1.6552734375, 1.8651123046875, 2.074951171875, 2.2847900390625, 2.49462890625, 2.7044677734375, 2.914306640625, 3.1241455078125, 3.333984375, 3.5438232421875, 3.753662109375, 3.9635009765625, 4.17333984375, 4.3831787109375, 4.593017578125, 4.8028564453125, 5.0126953125, 5.2225341796875, 5.432373046875, 5.6422119140625, 5.85205078125, 6.0618896484375, 6.271728515625, 6.4815673828125, 6.69140625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 3.0, 11.0, 13.0, 11.0, 27.0, 21.0, 34.0, 46.0, 47.0, 53.0, 72.0, 87.0, 80.0, 80.0, 70.0, 67.0, 55.0, 51.0, 36.0, 32.0, 30.0, 22.0, 15.0, 13.0, 4.0, 3.0, 3.0, 4.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68408203125, -0.6543502807617188, -0.6246185302734375, -0.5948867797851562, -0.565155029296875, -0.5354232788085938, -0.5056915283203125, -0.47595977783203125, -0.44622802734375, -0.41649627685546875, -0.3867645263671875, -0.35703277587890625, -0.327301025390625, -0.29756927490234375, -0.2678375244140625, -0.23810577392578125, -0.2083740234375, -0.17864227294921875, -0.1489105224609375, -0.11917877197265625, -0.089447021484375, -0.05971527099609375, -0.0299835205078125, -0.00025177001953125, 0.02947998046875, 0.05921173095703125, 0.0889434814453125, 0.11867523193359375, 0.148406982421875, 0.17813873291015625, 0.2078704833984375, 0.23760223388671875, 0.267333984375, 0.29706573486328125, 0.3267974853515625, 0.35652923583984375, 0.386260986328125, 0.41599273681640625, 0.4457244873046875, 0.47545623779296875, 0.50518798828125, 0.5349197387695312, 0.5646514892578125, 0.5943832397460938, 0.624114990234375, 0.6538467407226562, 0.6835784912109375, 0.7133102416992188, 0.7430419921875, 0.7727737426757812, 0.8025054931640625, 0.8322372436523438, 0.861968994140625, 0.8917007446289062, 0.9214324951171875, 0.9511642456054688, 0.98089599609375, 1.0106277465820312, 1.0403594970703125, 1.0700912475585938, 1.099822998046875, 1.1295547485351562, 1.1592864990234375, 1.1890182495117188, 1.21875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 5.0, 4.0, 11.0, 9.0, 20.0, 17.0, 26.0, 32.0, 55.0, 69.0, 139.0, 168.0, 331.0, 493.0, 785.0, 1399.0, 3208.0, 16452.0, 4096924.0, 64025.0, 5467.0, 1973.0, 1027.0, 600.0, 360.0, 254.0, 128.0, 109.0, 50.0, 45.0, 27.0, 21.0, 23.0, 9.0, 5.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.22265625, -5.99810791015625, -5.7735595703125, -5.54901123046875, -5.324462890625, -5.09991455078125, -4.8753662109375, -4.65081787109375, -4.42626953125, -4.20172119140625, -3.9771728515625, -3.75262451171875, -3.528076171875, -3.30352783203125, -3.0789794921875, -2.85443115234375, -2.6298828125, -2.40533447265625, -2.1807861328125, -1.95623779296875, -1.731689453125, -1.50714111328125, -1.2825927734375, -1.05804443359375, -0.83349609375, -0.60894775390625, -0.3843994140625, -0.15985107421875, 0.064697265625, 0.28924560546875, 0.5137939453125, 0.73834228515625, 0.962890625, 1.18743896484375, 1.4119873046875, 1.63653564453125, 1.861083984375, 2.08563232421875, 2.3101806640625, 2.53472900390625, 2.75927734375, 2.98382568359375, 3.2083740234375, 3.43292236328125, 3.657470703125, 3.88201904296875, 4.1065673828125, 4.33111572265625, 4.5556640625, 4.78021240234375, 5.0047607421875, 5.22930908203125, 5.453857421875, 5.67840576171875, 5.9029541015625, 6.12750244140625, 6.35205078125, 6.57659912109375, 6.8011474609375, 7.02569580078125, 7.250244140625, 7.47479248046875, 7.6993408203125, 7.92388916015625, 8.1484375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 11.0, 11.0, 29.0, 49.0, 165.0, 3399.0, 290.0, 64.0, 28.0, 8.0, 5.0, 4.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.873046875, -2.8023834228515625, -2.731719970703125, -2.6610565185546875, -2.59039306640625, -2.5197296142578125, -2.449066162109375, -2.3784027099609375, -2.3077392578125, -2.2370758056640625, -2.166412353515625, -2.0957489013671875, -2.02508544921875, -1.9544219970703125, -1.883758544921875, -1.8130950927734375, -1.742431640625, -1.6717681884765625, -1.601104736328125, -1.5304412841796875, -1.45977783203125, -1.3891143798828125, -1.318450927734375, -1.2477874755859375, -1.1771240234375, -1.1064605712890625, -1.035797119140625, -0.9651336669921875, -0.89447021484375, -0.8238067626953125, -0.753143310546875, -0.6824798583984375, -0.61181640625, -0.5411529541015625, -0.470489501953125, -0.3998260498046875, -0.32916259765625, -0.2584991455078125, -0.187835693359375, -0.1171722412109375, -0.0465087890625, 0.0241546630859375, 0.094818115234375, 0.1654815673828125, 0.23614501953125, 0.3068084716796875, 0.377471923828125, 0.4481353759765625, 0.518798828125, 0.5894622802734375, 0.660125732421875, 0.7307891845703125, 0.80145263671875, 0.8721160888671875, 0.942779541015625, 1.0134429931640625, 1.0841064453125, 1.1547698974609375, 1.225433349609375, 1.2960968017578125, 1.36676025390625, 1.4374237060546875, 1.508087158203125, 1.5787506103515625, 1.6494140625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 9.0, 3.0, 13.0, 11.0, 22.0, 25.0, 19.0, 42.0, 40.0, 69.0, 82.0, 110.0, 103.0, 118.0, 112.0, 58.0, 54.0, 29.0, 23.0, 18.0, 10.0, 11.0, 5.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.641951560974121, -5.456475257873535, -5.270999431610107, -5.0855231285095215, -4.900047302246094, -4.714570999145508, -4.529094696044922, -4.343618392944336, -4.158142566680908, -3.9726665019989014, -3.7871904373168945, -3.6017141342163086, -3.4162380695343018, -3.230762004852295, -3.045285701751709, -2.859809637069702, -2.6743335723876953, -2.4888575077056885, -2.3033814430236816, -2.1179051399230957, -1.9324290752410889, -1.746953010559082, -1.5614768266677856, -1.3760006427764893, -1.1905245780944824, -1.0050485134124756, -0.8195723295211792, -0.6340962052345276, -0.448620080947876, -0.26314395666122437, -0.07766783237457275, 0.10780835151672363, 0.29328489303588867, 0.4787610173225403, 0.6642371416091919, 0.8497132658958435, 1.0351893901824951, 1.220665454864502, 1.4061416387557983, 1.5916178226470947, 1.7770938873291016, 1.9625699520111084, 2.1480460166931152, 2.333522319793701, 2.518998384475708, 2.704474449157715, 2.889950752258301, 3.0754268169403076, 3.2609028816223145, 3.4463789463043213, 3.631855010986328, 3.817331314086914, 4.0028076171875, 4.188283443450928, 4.373759746551514, 4.559235572814941, 4.744711875915527, 4.930188179016113, 5.115664005279541, 5.301140308380127, 5.486616134643555, 5.672092437744141, 5.857568740844727, 6.0430450439453125, 6.22852087020874]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 5.0, 2.0, 3.0, 7.0, 5.0, 13.0, 8.0, 8.0, 11.0, 11.0, 17.0, 18.0, 21.0, 20.0, 29.0, 25.0, 43.0, 30.0, 30.0, 36.0, 40.0, 43.0, 39.0, 49.0, 47.0, 50.0, 49.0, 28.0, 32.0, 34.0, 26.0, 43.0, 29.0, 27.0, 23.0, 22.0, 17.0, 18.0, 4.0, 8.0, 9.0, 9.0, 1.0, 3.0, 4.0, 5.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.8901729583740234, -3.772918701171875, -3.6556644439697266, -3.538410186767578, -3.4211559295654297, -3.3039016723632812, -3.186647415161133, -3.0693931579589844, -2.952138900756836, -2.8348846435546875, -2.717630386352539, -2.6003761291503906, -2.483121871948242, -2.3658676147460938, -2.2486133575439453, -2.131359100341797, -2.0141050815582275, -1.896850824356079, -1.7795965671539307, -1.6623423099517822, -1.5450880527496338, -1.4278337955474854, -1.3105796575546265, -1.193325400352478, -1.0760711431503296, -0.9588168859481812, -0.8415626287460327, -0.724308431148529, -0.6070541739463806, -0.4897999167442322, -0.3725457191467285, -0.2552914619445801, -0.13803720474243164, -0.020782962441444397, 0.09647127985954285, 0.2137255072593689, 0.33097976446151733, 0.44823402166366577, 0.5654882192611694, 0.6827424764633179, 0.7999967336654663, 0.9172509908676147, 1.0345052480697632, 1.151759386062622, 1.2690136432647705, 1.386267900466919, 1.5035221576690674, 1.6207764148712158, 1.7380306720733643, 1.8552849292755127, 1.9725391864776611, 2.0897934436798096, 2.207047700881958, 2.3243019580841064, 2.441555976867676, 2.558810234069824, 2.6760644912719727, 2.793318748474121, 2.9105730056762695, 3.027827262878418, 3.1450815200805664, 3.262335777282715, 3.3795900344848633, 3.4968442916870117, 3.61409854888916]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 2.0, 7.0, 6.0, 10.0, 24.0, 17.0, 25.0, 37.0, 45.0, 58.0, 113.0, 166.0, 303.0, 539.0, 1028.0, 1974.0, 4319.0, 9540.0, 23108.0, 60479.0, 171032.0, 457071.0, 202365.0, 69476.0, 26476.0, 10823.0, 4745.0, 2162.0, 1091.0, 587.0, 333.0, 205.0, 104.0, 71.0, 61.0, 39.0, 30.0, 23.0, 15.0, 8.0, 10.0, 11.0, 7.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.525390625, -2.450164794921875, -2.37493896484375, -2.299713134765625, -2.2244873046875, -2.149261474609375, -2.07403564453125, -1.998809814453125, -1.923583984375, -1.848358154296875, -1.77313232421875, -1.697906494140625, -1.6226806640625, -1.547454833984375, -1.47222900390625, -1.397003173828125, -1.32177734375, -1.246551513671875, -1.17132568359375, -1.096099853515625, -1.0208740234375, -0.945648193359375, -0.87042236328125, -0.795196533203125, -0.719970703125, -0.644744873046875, -0.56951904296875, -0.494293212890625, -0.4190673828125, -0.343841552734375, -0.26861572265625, -0.193389892578125, -0.1181640625, -0.042938232421875, 0.03228759765625, 0.107513427734375, 0.1827392578125, 0.257965087890625, 0.33319091796875, 0.408416748046875, 0.483642578125, 0.558868408203125, 0.63409423828125, 0.709320068359375, 0.7845458984375, 0.859771728515625, 0.93499755859375, 1.010223388671875, 1.08544921875, 1.160675048828125, 1.23590087890625, 1.311126708984375, 1.3863525390625, 1.461578369140625, 1.53680419921875, 1.612030029296875, 1.687255859375, 1.762481689453125, 1.83770751953125, 1.912933349609375, 1.9881591796875, 2.063385009765625, 2.13861083984375, 2.213836669921875, 2.2890625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 8.0, 5.0, 10.0, 13.0, 9.0, 17.0, 25.0, 16.0, 49.0, 30.0, 44.0, 58.0, 58.0, 66.0, 66.0, 76.0, 75.0, 60.0, 58.0, 44.0, 46.0, 33.0, 29.0, 20.0, 22.0, 21.0, 14.0, 5.0, 6.0, 8.0, 2.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66650390625, -0.6380233764648438, -0.6095428466796875, -0.5810623168945312, -0.552581787109375, -0.5241012573242188, -0.4956207275390625, -0.46714019775390625, -0.43865966796875, -0.41017913818359375, -0.3816986083984375, -0.35321807861328125, -0.324737548828125, -0.29625701904296875, -0.2677764892578125, -0.23929595947265625, -0.2108154296875, -0.18233489990234375, -0.1538543701171875, -0.12537384033203125, -0.096893310546875, -0.06841278076171875, -0.0399322509765625, -0.01145172119140625, 0.01702880859375, 0.04550933837890625, 0.0739898681640625, 0.10247039794921875, 0.130950927734375, 0.15943145751953125, 0.1879119873046875, 0.21639251708984375, 0.244873046875, 0.27335357666015625, 0.3018341064453125, 0.33031463623046875, 0.358795166015625, 0.38727569580078125, 0.4157562255859375, 0.44423675537109375, 0.47271728515625, 0.5011978149414062, 0.5296783447265625, 0.5581588745117188, 0.586639404296875, 0.6151199340820312, 0.6436004638671875, 0.6720809936523438, 0.7005615234375, 0.7290420532226562, 0.7575225830078125, 0.7860031127929688, 0.814483642578125, 0.8429641723632812, 0.8714447021484375, 0.8999252319335938, 0.92840576171875, 0.9568862915039062, 0.9853668212890625, 1.0138473510742188, 1.042327880859375, 1.0708084106445312, 1.0992889404296875, 1.1277694702148438, 1.15625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 11.0, 20.0, 26.0, 33.0, 37.0, 53.0, 80.0, 123.0, 171.0, 249.0, 375.0, 642.0, 1144.0, 2419.0, 7134.0, 36370.0, 398093.0, 542540.0, 44743.0, 8231.0, 2751.0, 1268.0, 694.0, 425.0, 269.0, 204.0, 135.0, 87.0, 58.0, 45.0, 26.0, 29.0, 15.0, 13.0, 10.0, 7.0, 4.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.16015625, -4.041473388671875, -3.92279052734375, -3.804107666015625, -3.6854248046875, -3.566741943359375, -3.44805908203125, -3.329376220703125, -3.210693359375, -3.092010498046875, -2.97332763671875, -2.854644775390625, -2.7359619140625, -2.617279052734375, -2.49859619140625, -2.379913330078125, -2.26123046875, -2.142547607421875, -2.02386474609375, -1.905181884765625, -1.7864990234375, -1.667816162109375, -1.54913330078125, -1.430450439453125, -1.311767578125, -1.193084716796875, -1.07440185546875, -0.955718994140625, -0.8370361328125, -0.718353271484375, -0.59967041015625, -0.480987548828125, -0.3623046875, -0.243621826171875, -0.12493896484375, -0.006256103515625, 0.1124267578125, 0.231109619140625, 0.34979248046875, 0.468475341796875, 0.587158203125, 0.705841064453125, 0.82452392578125, 0.943206787109375, 1.0618896484375, 1.180572509765625, 1.29925537109375, 1.417938232421875, 1.53662109375, 1.655303955078125, 1.77398681640625, 1.892669677734375, 2.0113525390625, 2.130035400390625, 2.24871826171875, 2.367401123046875, 2.486083984375, 2.604766845703125, 2.72344970703125, 2.842132568359375, 2.9608154296875, 3.079498291015625, 3.19818115234375, 3.316864013671875, 3.435546875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 8.0, 7.0, 4.0, 15.0, 9.0, 18.0, 18.0, 21.0, 24.0, 25.0, 29.0, 29.0, 39.0, 45.0, 42.0, 54.0, 42.0, 49.0, 46.0, 42.0, 48.0, 39.0, 49.0, 47.0, 36.0, 28.0, 32.0, 22.0, 18.0, 29.0, 15.0, 18.0, 9.0, 8.0, 7.0, 3.0, 6.0, 6.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.94140625, -2.849945068359375, -2.75848388671875, -2.667022705078125, -2.5755615234375, -2.484100341796875, -2.39263916015625, -2.301177978515625, -2.209716796875, -2.118255615234375, -2.02679443359375, -1.935333251953125, -1.8438720703125, -1.752410888671875, -1.66094970703125, -1.569488525390625, -1.47802734375, -1.386566162109375, -1.29510498046875, -1.203643798828125, -1.1121826171875, -1.020721435546875, -0.92926025390625, -0.837799072265625, -0.746337890625, -0.654876708984375, -0.56341552734375, -0.471954345703125, -0.3804931640625, -0.289031982421875, -0.19757080078125, -0.106109619140625, -0.0146484375, 0.076812744140625, 0.16827392578125, 0.259735107421875, 0.3511962890625, 0.442657470703125, 0.53411865234375, 0.625579833984375, 0.717041015625, 0.808502197265625, 0.89996337890625, 0.991424560546875, 1.0828857421875, 1.174346923828125, 1.26580810546875, 1.357269287109375, 1.44873046875, 1.540191650390625, 1.63165283203125, 1.723114013671875, 1.8145751953125, 1.906036376953125, 1.99749755859375, 2.088958740234375, 2.180419921875, 2.271881103515625, 2.36334228515625, 2.454803466796875, 2.5462646484375, 2.637725830078125, 2.72918701171875, 2.820648193359375, 2.912109375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 9.0, 12.0, 14.0, 20.0, 32.0, 49.0, 98.0, 146.0, 329.0, 778.0, 2321.0, 11222.0, 116032.0, 841845.0, 64757.0, 7915.0, 1764.0, 612.0, 247.0, 139.0, 84.0, 44.0, 28.0, 18.0, 10.0, 10.0, 7.0, 6.0, 4.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7626953125, -1.7027435302734375, -1.642791748046875, -1.5828399658203125, -1.52288818359375, -1.4629364013671875, -1.402984619140625, -1.3430328369140625, -1.2830810546875, -1.2231292724609375, -1.163177490234375, -1.1032257080078125, -1.04327392578125, -0.9833221435546875, -0.923370361328125, -0.8634185791015625, -0.803466796875, -0.7435150146484375, -0.683563232421875, -0.6236114501953125, -0.56365966796875, -0.5037078857421875, -0.443756103515625, -0.3838043212890625, -0.3238525390625, -0.2639007568359375, -0.203948974609375, -0.1439971923828125, -0.08404541015625, -0.0240936279296875, 0.035858154296875, 0.0958099365234375, 0.15576171875, 0.2157135009765625, 0.275665283203125, 0.3356170654296875, 0.39556884765625, 0.4555206298828125, 0.515472412109375, 0.5754241943359375, 0.6353759765625, 0.6953277587890625, 0.755279541015625, 0.8152313232421875, 0.87518310546875, 0.9351348876953125, 0.995086669921875, 1.0550384521484375, 1.114990234375, 1.1749420166015625, 1.234893798828125, 1.2948455810546875, 1.35479736328125, 1.4147491455078125, 1.474700927734375, 1.5346527099609375, 1.5946044921875, 1.6545562744140625, 1.714508056640625, 1.7744598388671875, 1.83441162109375, 1.8943634033203125, 1.954315185546875, 2.0142669677734375, 2.07421875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 5.0, 8.0, 7.0, 3.0, 10.0, 14.0, 11.0, 19.0, 18.0, 31.0, 47.0, 59.0, 54.0, 65.0, 102.0, 126.0, 92.0, 66.0, 48.0, 50.0, 30.0, 27.0, 19.0, 21.0, 8.0, 16.0, 11.0, 5.0, 0.0, 6.0, 4.0, 6.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0002391338348388672, -0.00023254379630088806, -0.00022595375776290894, -0.0002193637192249298, -0.00021277368068695068, -0.00020618364214897156, -0.00019959360361099243, -0.0001930035650730133, -0.00018641352653503418, -0.00017982348799705505, -0.00017323344945907593, -0.0001666434109210968, -0.00016005337238311768, -0.00015346333384513855, -0.00014687329530715942, -0.0001402832567691803, -0.00013369321823120117, -0.00012710317969322205, -0.00012051314115524292, -0.0001139231026172638, -0.00010733306407928467, -0.00010074302554130554, -9.415298700332642e-05, -8.756294846534729e-05, -8.097290992736816e-05, -7.438287138938904e-05, -6.779283285140991e-05, -6.120279431343079e-05, -5.461275577545166e-05, -4.8022717237472534e-05, -4.143267869949341e-05, -3.484264016151428e-05, -2.8252601623535156e-05, -2.166256308555603e-05, -1.5072524547576904e-05, -8.482486009597778e-06, -1.8924474716186523e-06, 4.697591066360474e-06, 1.12876296043396e-05, 1.7877668142318726e-05, 2.446770668029785e-05, 3.105774521827698e-05, 3.7647783756256104e-05, 4.423782229423523e-05, 5.0827860832214355e-05, 5.741789937019348e-05, 6.400793790817261e-05, 7.059797644615173e-05, 7.718801498413086e-05, 8.377805352210999e-05, 9.036809206008911e-05, 9.695813059806824e-05, 0.00010354816913604736, 0.00011013820767402649, 0.00011672824621200562, 0.00012331828474998474, 0.00012990832328796387, 0.000136498361825943, 0.00014308840036392212, 0.00014967843890190125, 0.00015626847743988037, 0.0001628585159778595, 0.00016944855451583862, 0.00017603859305381775, 0.00018262863159179688]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 8.0, 8.0, 14.0, 10.0, 15.0, 30.0, 27.0, 67.0, 64.0, 134.0, 218.0, 363.0, 753.0, 1762.0, 4918.0, 19247.0, 172441.0, 756537.0, 74190.0, 11693.0, 3360.0, 1281.0, 609.0, 327.0, 153.0, 111.0, 69.0, 44.0, 33.0, 18.0, 16.0, 8.0, 7.0, 7.0, 5.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.462890625, -1.4146728515625, -1.366455078125, -1.3182373046875, -1.27001953125, -1.2218017578125, -1.173583984375, -1.1253662109375, -1.0771484375, -1.0289306640625, -0.980712890625, -0.9324951171875, -0.88427734375, -0.8360595703125, -0.787841796875, -0.7396240234375, -0.69140625, -0.6431884765625, -0.594970703125, -0.5467529296875, -0.49853515625, -0.4503173828125, -0.402099609375, -0.3538818359375, -0.3056640625, -0.2574462890625, -0.209228515625, -0.1610107421875, -0.11279296875, -0.0645751953125, -0.016357421875, 0.0318603515625, 0.080078125, 0.1282958984375, 0.176513671875, 0.2247314453125, 0.27294921875, 0.3211669921875, 0.369384765625, 0.4176025390625, 0.4658203125, 0.5140380859375, 0.562255859375, 0.6104736328125, 0.65869140625, 0.7069091796875, 0.755126953125, 0.8033447265625, 0.8515625, 0.8997802734375, 0.947998046875, 0.9962158203125, 1.04443359375, 1.0926513671875, 1.140869140625, 1.1890869140625, 1.2373046875, 1.2855224609375, 1.333740234375, 1.3819580078125, 1.43017578125, 1.4783935546875, 1.526611328125, 1.5748291015625, 1.623046875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 3.0, 5.0, 17.0, 8.0, 19.0, 33.0, 25.0, 42.0, 60.0, 85.0, 113.0, 106.0, 121.0, 97.0, 83.0, 55.0, 39.0, 19.0, 18.0, 15.0, 10.0, 4.0, 5.0, 7.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.818359375, -1.7757797241210938, -1.7332000732421875, -1.6906204223632812, -1.648040771484375, -1.6054611206054688, -1.5628814697265625, -1.5203018188476562, -1.47772216796875, -1.4351425170898438, -1.3925628662109375, -1.3499832153320312, -1.307403564453125, -1.2648239135742188, -1.2222442626953125, -1.1796646118164062, -1.1370849609375, -1.0945053100585938, -1.0519256591796875, -1.0093460083007812, -0.966766357421875, -0.9241867065429688, -0.8816070556640625, -0.8390274047851562, -0.79644775390625, -0.7538681030273438, -0.7112884521484375, -0.6687088012695312, -0.626129150390625, -0.5835494995117188, -0.5409698486328125, -0.49839019775390625, -0.455810546875, -0.41323089599609375, -0.3706512451171875, -0.32807159423828125, -0.285491943359375, -0.24291229248046875, -0.2003326416015625, -0.15775299072265625, -0.11517333984375, -0.07259368896484375, -0.0300140380859375, 0.01256561279296875, 0.055145263671875, 0.09772491455078125, 0.1403045654296875, 0.18288421630859375, 0.2254638671875, 0.26804351806640625, 0.3106231689453125, 0.35320281982421875, 0.395782470703125, 0.43836212158203125, 0.4809417724609375, 0.5235214233398438, 0.56610107421875, 0.6086807250976562, 0.6512603759765625, 0.6938400268554688, 0.736419677734375, 0.7789993286132812, 0.8215789794921875, 0.8641586303710938, 0.90673828125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 6.0, 21.0, 37.0, 101.0, 258.0, 308.0, 194.0, 62.0, 15.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.943870544433594, -49.31494903564453, -47.6860237121582, -46.05710220336914, -44.42818069458008, -42.79925537109375, -41.17033386230469, -39.541412353515625, -37.91249084472656, -36.2835693359375, -34.65464401245117, -33.02572250366211, -31.396800994873047, -29.76787757873535, -28.138954162597656, -26.510032653808594, -24.8811092376709, -23.252185821533203, -21.62326431274414, -19.994340896606445, -18.365419387817383, -16.736495971679688, -15.107573509216309, -13.47865104675293, -11.84972858428955, -10.220806121826172, -8.591883659362793, -6.962960720062256, -5.334038257598877, -3.70511531829834, -2.076192855834961, -0.44727039337158203, 1.1816520690917969, 2.810574531555176, 4.439496994018555, 6.068419933319092, 7.697342395782471, 9.326265335083008, 10.955187797546387, 12.584110260009766, 14.213032722473145, 15.841955184936523, 17.47087860107422, 19.09980010986328, 20.728723526000977, 22.357646942138672, 23.986568450927734, 25.615489959716797, 27.244413375854492, 28.873336791992188, 30.50225830078125, 32.13117980957031, 33.76010513305664, 35.3890266418457, 37.017948150634766, 38.646873474121094, 40.275794982910156, 41.90471649169922, 43.53364181518555, 45.16256332397461, 46.79148483276367, 48.42041015625, 50.04933166503906, 51.678253173828125, 53.30717468261719]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 3.0, 10.0, 5.0, 13.0, 16.0, 18.0, 28.0, 38.0, 29.0, 39.0, 31.0, 45.0, 60.0, 61.0, 61.0, 54.0, 60.0, 54.0, 59.0, 45.0, 37.0, 45.0, 39.0, 31.0, 18.0, 15.0, 22.0, 11.0, 13.0, 17.0, 8.0, 7.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.00992202758789, -17.520435333251953, -17.030948638916016, -16.54146385192871, -16.051977157592773, -15.562490463256836, -15.073004722595215, -14.583518981933594, -14.094032287597656, -13.604545593261719, -13.115059852600098, -12.625574111938477, -12.136087417602539, -11.646600723266602, -11.15711498260498, -10.66762924194336, -10.178142547607422, -9.688655853271484, -9.199170112609863, -8.709684371948242, -8.220197677612305, -7.730711460113525, -7.241225242614746, -6.751739025115967, -6.2622528076171875, -5.772766590118408, -5.283280372619629, -4.79379415512085, -4.30430793762207, -3.814821720123291, -3.3253355026245117, -2.8358492851257324, -2.346363067626953, -1.8568768501281738, -1.3673906326293945, -0.8779044151306152, -0.38841819763183594, 0.10106801986694336, 0.5905542373657227, 1.080040454864502, 1.5695266723632812, 2.0590128898620605, 2.54849910736084, 3.037985324859619, 3.5274715423583984, 4.016957759857178, 4.506443977355957, 4.995930194854736, 5.485416412353516, 5.974902629852295, 6.464388847351074, 6.9538750648498535, 7.443361282348633, 7.932847499847412, 8.422333717346191, 8.911819458007812, 9.40130615234375, 9.890792846679688, 10.380278587341309, 10.86976432800293, 11.359251022338867, 11.848737716674805, 12.338223457336426, 12.827709197998047, 13.317195892333984]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 5.0, 9.0, 12.0, 12.0, 25.0, 48.0, 65.0, 126.0, 207.0, 374.0, 664.0, 1290.0, 2704.0, 6184.0, 17008.0, 61494.0, 838293.0, 3132455.0, 94776.0, 23119.0, 7905.0, 3616.0, 1697.0, 904.0, 480.0, 328.0, 158.0, 110.0, 84.0, 51.0, 29.0, 14.0, 14.0, 5.0, 8.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.900390625, -2.8154296875, -2.73046875, -2.6455078125, -2.560546875, -2.4755859375, -2.390625, -2.3056640625, -2.220703125, -2.1357421875, -2.05078125, -1.9658203125, -1.880859375, -1.7958984375, -1.7109375, -1.6259765625, -1.541015625, -1.4560546875, -1.37109375, -1.2861328125, -1.201171875, -1.1162109375, -1.03125, -0.9462890625, -0.861328125, -0.7763671875, -0.69140625, -0.6064453125, -0.521484375, -0.4365234375, -0.3515625, -0.2666015625, -0.181640625, -0.0966796875, -0.01171875, 0.0732421875, 0.158203125, 0.2431640625, 0.328125, 0.4130859375, 0.498046875, 0.5830078125, 0.66796875, 0.7529296875, 0.837890625, 0.9228515625, 1.0078125, 1.0927734375, 1.177734375, 1.2626953125, 1.34765625, 1.4326171875, 1.517578125, 1.6025390625, 1.6875, 1.7724609375, 1.857421875, 1.9423828125, 2.02734375, 2.1123046875, 2.197265625, 2.2822265625, 2.3671875, 2.4521484375, 2.537109375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 9.0, 10.0, 12.0, 21.0, 28.0, 34.0, 53.0, 55.0, 90.0, 86.0, 93.0, 96.0, 91.0, 74.0, 76.0, 48.0, 38.0, 27.0, 19.0, 15.0, 17.0, 2.0, 4.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58642578125, -0.5522994995117188, -0.5181732177734375, -0.48404693603515625, -0.449920654296875, -0.41579437255859375, -0.3816680908203125, -0.34754180908203125, -0.31341552734375, -0.27928924560546875, -0.2451629638671875, -0.21103668212890625, -0.176910400390625, -0.14278411865234375, -0.1086578369140625, -0.07453155517578125, -0.0404052734375, -0.00627899169921875, 0.0278472900390625, 0.06197357177734375, 0.096099853515625, 0.13022613525390625, 0.1643524169921875, 0.19847869873046875, 0.23260498046875, 0.26673126220703125, 0.3008575439453125, 0.33498382568359375, 0.369110107421875, 0.40323638916015625, 0.4373626708984375, 0.47148895263671875, 0.505615234375, 0.5397415161132812, 0.5738677978515625, 0.6079940795898438, 0.642120361328125, 0.6762466430664062, 0.7103729248046875, 0.7444992065429688, 0.77862548828125, 0.8127517700195312, 0.8468780517578125, 0.8810043334960938, 0.915130615234375, 0.9492568969726562, 0.9833831787109375, 1.0175094604492188, 1.0516357421875, 1.0857620239257812, 1.1198883056640625, 1.1540145874023438, 1.188140869140625, 1.2222671508789062, 1.2563934326171875, 1.2905197143554688, 1.32464599609375, 1.3587722778320312, 1.3928985595703125, 1.4270248413085938, 1.461151123046875, 1.4952774047851562, 1.5294036865234375, 1.5635299682617188, 1.59765625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 14.0, 13.0, 7.0, 15.0, 33.0, 47.0, 96.0, 155.0, 293.0, 488.0, 904.0, 2142.0, 5465.0, 17036.0, 73014.0, 2275741.0, 1724285.0, 68377.0, 16451.0, 5305.0, 2094.0, 998.0, 532.0, 300.0, 172.0, 106.0, 72.0, 32.0, 21.0, 17.0, 14.0, 11.0, 4.0, 9.0, 4.0, 3.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.19921875, -3.105072021484375, -3.01092529296875, -2.916778564453125, -2.8226318359375, -2.728485107421875, -2.63433837890625, -2.540191650390625, -2.446044921875, -2.351898193359375, -2.25775146484375, -2.163604736328125, -2.0694580078125, -1.975311279296875, -1.88116455078125, -1.787017822265625, -1.69287109375, -1.598724365234375, -1.50457763671875, -1.410430908203125, -1.3162841796875, -1.222137451171875, -1.12799072265625, -1.033843994140625, -0.939697265625, -0.845550537109375, -0.75140380859375, -0.657257080078125, -0.5631103515625, -0.468963623046875, -0.37481689453125, -0.280670166015625, -0.1865234375, -0.092376708984375, 0.00177001953125, 0.095916748046875, 0.1900634765625, 0.284210205078125, 0.37835693359375, 0.472503662109375, 0.566650390625, 0.660797119140625, 0.75494384765625, 0.849090576171875, 0.9432373046875, 1.037384033203125, 1.13153076171875, 1.225677490234375, 1.31982421875, 1.413970947265625, 1.50811767578125, 1.602264404296875, 1.6964111328125, 1.790557861328125, 1.88470458984375, 1.978851318359375, 2.072998046875, 2.167144775390625, 2.26129150390625, 2.355438232421875, 2.4495849609375, 2.543731689453125, 2.63787841796875, 2.732025146484375, 2.826171875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 1.0, 4.0, 7.0, 10.0, 10.0, 14.0, 23.0, 22.0, 36.0, 55.0, 82.0, 135.0, 319.0, 897.0, 1431.0, 497.0, 193.0, 92.0, 77.0, 36.0, 37.0, 22.0, 14.0, 11.0, 16.0, 10.0, 4.0, 6.0, 2.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.572265625, -2.484405517578125, -2.39654541015625, -2.308685302734375, -2.2208251953125, -2.132965087890625, -2.04510498046875, -1.957244873046875, -1.869384765625, -1.781524658203125, -1.69366455078125, -1.605804443359375, -1.5179443359375, -1.430084228515625, -1.34222412109375, -1.254364013671875, -1.16650390625, -1.078643798828125, -0.99078369140625, -0.902923583984375, -0.8150634765625, -0.727203369140625, -0.63934326171875, -0.551483154296875, -0.463623046875, -0.375762939453125, -0.28790283203125, -0.200042724609375, -0.1121826171875, -0.024322509765625, 0.06353759765625, 0.151397705078125, 0.2392578125, 0.327117919921875, 0.41497802734375, 0.502838134765625, 0.5906982421875, 0.678558349609375, 0.76641845703125, 0.854278564453125, 0.942138671875, 1.029998779296875, 1.11785888671875, 1.205718994140625, 1.2935791015625, 1.381439208984375, 1.46929931640625, 1.557159423828125, 1.64501953125, 1.732879638671875, 1.82073974609375, 1.908599853515625, 1.9964599609375, 2.084320068359375, 2.17218017578125, 2.260040283203125, 2.347900390625, 2.435760498046875, 2.52362060546875, 2.611480712890625, 2.6993408203125, 2.787200927734375, 2.87506103515625, 2.962921142578125, 3.05078125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 7.0, 9.0, 24.0, 58.0, 132.0, 250.0, 259.0, 116.0, 65.0, 30.0, 21.0, 12.0, 3.0, 2.0, 3.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.876331329345703, -19.766733169555664, -18.657133102416992, -17.547534942626953, -16.43793487548828, -15.328336715698242, -14.218738555908203, -13.109139442443848, -11.999540328979492, -10.889941215515137, -9.780342102050781, -8.670743942260742, -7.561144828796387, -6.451545715332031, -5.341947078704834, -4.232348442077637, -3.1227493286132812, -2.013150453567505, -0.9035515785217285, 0.20604729652404785, 1.3156461715698242, 2.4252452850341797, 3.534843921661377, 4.644442558288574, 5.75404167175293, 6.863640785217285, 7.973239421844482, 9.08283805847168, 10.192437171936035, 11.30203628540039, 12.41163444519043, 13.521233558654785, 14.630836486816406, 15.740435600280762, 16.850034713745117, 17.959632873535156, 19.069232940673828, 20.178831100463867, 21.288429260253906, 22.398029327392578, 23.507627487182617, 24.617225646972656, 25.726825714111328, 26.836423873901367, 27.946022033691406, 29.055622100830078, 30.165220260620117, 31.274818420410156, 32.38441848754883, 33.4940185546875, 34.603614807128906, 35.71321487426758, 36.82281494140625, 37.932411193847656, 39.04201126098633, 40.151611328125, 41.261207580566406, 42.37080764770508, 43.480403900146484, 44.590003967285156, 45.69960403442383, 46.8092041015625, 47.918800354003906, 49.02840042114258, 50.13800048828125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 6.0, 2.0, 4.0, 11.0, 11.0, 9.0, 11.0, 21.0, 20.0, 24.0, 25.0, 47.0, 41.0, 55.0, 50.0, 53.0, 60.0, 47.0, 53.0, 59.0, 76.0, 60.0, 45.0, 34.0, 31.0, 33.0, 30.0, 18.0, 14.0, 12.0, 6.0, 9.0, 14.0, 7.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.572761535644531, -12.147817611694336, -11.72287368774414, -11.297929763793945, -10.872986793518066, -10.448042869567871, -10.023098945617676, -9.59815502166748, -9.173212051391602, -8.748268127441406, -8.323324203491211, -7.898380756378174, -7.473437309265137, -7.048493385314941, -6.623549461364746, -6.198605537414551, -5.7736616134643555, -5.34871768951416, -4.923774242401123, -4.498830318450928, -4.073886871337891, -3.6489429473876953, -3.2239990234375, -2.799055337905884, -2.3741116523742676, -1.9491679668426514, -1.5242241621017456, -1.0992803573608398, -0.6743366718292236, -0.24939298629760742, 0.1755509376525879, 0.6004946231842041, 1.0254392623901367, 1.450382947921753, 1.8753267526626587, 2.3002705574035645, 2.7252142429351807, 3.150157928466797, 3.575101852416992, 4.0000457763671875, 4.424989223480225, 4.84993314743042, 5.274876594543457, 5.699820518493652, 6.124764442443848, 6.549707889556885, 6.97465181350708, 7.399595260620117, 7.8245391845703125, 8.249483108520508, 8.674427032470703, 9.099370956420898, 9.524313926696777, 9.949257850646973, 10.374201774597168, 10.799145698547363, 11.224088668823242, 11.649032592773438, 12.073976516723633, 12.498920440673828, 12.923863410949707, 13.348807334899902, 13.773751258850098, 14.198695182800293, 14.623639106750488]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 4.0, 10.0, 12.0, 20.0, 32.0, 52.0, 77.0, 164.0, 294.0, 529.0, 1101.0, 2428.0, 5841.0, 15947.0, 51033.0, 254217.0, 577816.0, 96152.0, 26891.0, 9123.0, 3570.0, 1543.0, 754.0, 417.0, 226.0, 107.0, 65.0, 46.0, 34.0, 12.0, 9.0, 8.0, 7.0, 6.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.90234375, -2.809417724609375, -2.71649169921875, -2.623565673828125, -2.5306396484375, -2.437713623046875, -2.34478759765625, -2.251861572265625, -2.158935546875, -2.066009521484375, -1.97308349609375, -1.880157470703125, -1.7872314453125, -1.694305419921875, -1.60137939453125, -1.508453369140625, -1.41552734375, -1.322601318359375, -1.22967529296875, -1.136749267578125, -1.0438232421875, -0.950897216796875, -0.85797119140625, -0.765045166015625, -0.672119140625, -0.579193115234375, -0.48626708984375, -0.393341064453125, -0.3004150390625, -0.207489013671875, -0.11456298828125, -0.021636962890625, 0.0712890625, 0.164215087890625, 0.25714111328125, 0.350067138671875, 0.4429931640625, 0.535919189453125, 0.62884521484375, 0.721771240234375, 0.814697265625, 0.907623291015625, 1.00054931640625, 1.093475341796875, 1.1864013671875, 1.279327392578125, 1.37225341796875, 1.465179443359375, 1.55810546875, 1.651031494140625, 1.74395751953125, 1.836883544921875, 1.9298095703125, 2.022735595703125, 2.11566162109375, 2.208587646484375, 2.301513671875, 2.394439697265625, 2.48736572265625, 2.580291748046875, 2.6732177734375, 2.766143798828125, 2.85906982421875, 2.951995849609375, 3.044921875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 9.0, 13.0, 9.0, 14.0, 14.0, 19.0, 34.0, 39.0, 43.0, 51.0, 57.0, 54.0, 82.0, 74.0, 54.0, 74.0, 62.0, 57.0, 57.0, 37.0, 36.0, 25.0, 21.0, 28.0, 8.0, 16.0, 8.0, 5.0, 0.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75390625, -0.7270126342773438, -0.7001190185546875, -0.6732254028320312, -0.646331787109375, -0.6194381713867188, -0.5925445556640625, -0.5656509399414062, -0.53875732421875, -0.5118637084960938, -0.4849700927734375, -0.45807647705078125, -0.431182861328125, -0.40428924560546875, -0.3773956298828125, -0.35050201416015625, -0.3236083984375, -0.29671478271484375, -0.2698211669921875, -0.24292755126953125, -0.216033935546875, -0.18914031982421875, -0.1622467041015625, -0.13535308837890625, -0.10845947265625, -0.08156585693359375, -0.0546722412109375, -0.02777862548828125, -0.000885009765625, 0.02600860595703125, 0.0529022216796875, 0.07979583740234375, 0.106689453125, 0.13358306884765625, 0.1604766845703125, 0.18737030029296875, 0.214263916015625, 0.24115753173828125, 0.2680511474609375, 0.29494476318359375, 0.32183837890625, 0.34873199462890625, 0.3756256103515625, 0.40251922607421875, 0.429412841796875, 0.45630645751953125, 0.4832000732421875, 0.5100936889648438, 0.5369873046875, 0.5638809204101562, 0.5907745361328125, 0.6176681518554688, 0.644561767578125, 0.6714553833007812, 0.6983489990234375, 0.7252426147460938, 0.75213623046875, 0.7790298461914062, 0.8059234619140625, 0.8328170776367188, 0.859710693359375, 0.8866043090820312, 0.9134979248046875, 0.9403915405273438, 0.96728515625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 8.0, 10.0, 10.0, 13.0, 29.0, 36.0, 62.0, 131.0, 180.0, 369.0, 678.0, 1472.0, 4475.0, 29841.0, 866897.0, 130402.0, 9378.0, 2431.0, 987.0, 483.0, 260.0, 157.0, 92.0, 54.0, 35.0, 26.0, 13.0, 12.0, 7.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.97265625, -5.80072021484375, -5.6287841796875, -5.45684814453125, -5.284912109375, -5.11297607421875, -4.9410400390625, -4.76910400390625, -4.59716796875, -4.42523193359375, -4.2532958984375, -4.08135986328125, -3.909423828125, -3.73748779296875, -3.5655517578125, -3.39361572265625, -3.2216796875, -3.04974365234375, -2.8778076171875, -2.70587158203125, -2.533935546875, -2.36199951171875, -2.1900634765625, -2.01812744140625, -1.84619140625, -1.67425537109375, -1.5023193359375, -1.33038330078125, -1.158447265625, -0.98651123046875, -0.8145751953125, -0.64263916015625, -0.470703125, -0.29876708984375, -0.1268310546875, 0.04510498046875, 0.217041015625, 0.38897705078125, 0.5609130859375, 0.73284912109375, 0.90478515625, 1.07672119140625, 1.2486572265625, 1.42059326171875, 1.592529296875, 1.76446533203125, 1.9364013671875, 2.10833740234375, 2.2802734375, 2.45220947265625, 2.6241455078125, 2.79608154296875, 2.968017578125, 3.13995361328125, 3.3118896484375, 3.48382568359375, 3.65576171875, 3.82769775390625, 3.9996337890625, 4.17156982421875, 4.343505859375, 4.51544189453125, 4.6873779296875, 4.85931396484375, 5.03125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 6.0, 1.0, 2.0, 2.0, 2.0, 8.0, 6.0, 12.0, 9.0, 18.0, 25.0, 20.0, 28.0, 34.0, 46.0, 40.0, 31.0, 49.0, 56.0, 52.0, 60.0, 51.0, 50.0, 49.0, 60.0, 41.0, 44.0, 30.0, 31.0, 35.0, 21.0, 26.0, 10.0, 12.0, 6.0, 8.0, 5.0, 5.0, 6.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.29296875, -3.19537353515625, -3.0977783203125, -3.00018310546875, -2.902587890625, -2.80499267578125, -2.7073974609375, -2.60980224609375, -2.51220703125, -2.41461181640625, -2.3170166015625, -2.21942138671875, -2.121826171875, -2.02423095703125, -1.9266357421875, -1.82904052734375, -1.7314453125, -1.63385009765625, -1.5362548828125, -1.43865966796875, -1.341064453125, -1.24346923828125, -1.1458740234375, -1.04827880859375, -0.95068359375, -0.85308837890625, -0.7554931640625, -0.65789794921875, -0.560302734375, -0.46270751953125, -0.3651123046875, -0.26751708984375, -0.169921875, -0.07232666015625, 0.0252685546875, 0.12286376953125, 0.220458984375, 0.31805419921875, 0.4156494140625, 0.51324462890625, 0.61083984375, 0.70843505859375, 0.8060302734375, 0.90362548828125, 1.001220703125, 1.09881591796875, 1.1964111328125, 1.29400634765625, 1.3916015625, 1.48919677734375, 1.5867919921875, 1.68438720703125, 1.781982421875, 1.87957763671875, 1.9771728515625, 2.07476806640625, 2.17236328125, 2.26995849609375, 2.3675537109375, 2.46514892578125, 2.562744140625, 2.66033935546875, 2.7579345703125, 2.85552978515625, 2.953125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 5.0, 1.0, 5.0, 11.0, 12.0, 6.0, 15.0, 27.0, 31.0, 55.0, 71.0, 116.0, 200.0, 385.0, 837.0, 2462.0, 10700.0, 95969.0, 842149.0, 81883.0, 9593.0, 2284.0, 810.0, 352.0, 190.0, 128.0, 67.0, 50.0, 29.0, 25.0, 32.0, 14.0, 9.0, 6.0, 8.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.7431640625, -1.6910858154296875, -1.639007568359375, -1.5869293212890625, -1.53485107421875, -1.4827728271484375, -1.430694580078125, -1.3786163330078125, -1.3265380859375, -1.2744598388671875, -1.222381591796875, -1.1703033447265625, -1.11822509765625, -1.0661468505859375, -1.014068603515625, -0.9619903564453125, -0.909912109375, -0.8578338623046875, -0.805755615234375, -0.7536773681640625, -0.70159912109375, -0.6495208740234375, -0.597442626953125, -0.5453643798828125, -0.4932861328125, -0.4412078857421875, -0.389129638671875, -0.3370513916015625, -0.28497314453125, -0.2328948974609375, -0.180816650390625, -0.1287384033203125, -0.07666015625, -0.0245819091796875, 0.027496337890625, 0.0795745849609375, 0.13165283203125, 0.1837310791015625, 0.235809326171875, 0.2878875732421875, 0.3399658203125, 0.3920440673828125, 0.444122314453125, 0.4962005615234375, 0.54827880859375, 0.6003570556640625, 0.652435302734375, 0.7045135498046875, 0.756591796875, 0.8086700439453125, 0.860748291015625, 0.9128265380859375, 0.96490478515625, 1.0169830322265625, 1.069061279296875, 1.1211395263671875, 1.1732177734375, 1.2252960205078125, 1.277374267578125, 1.3294525146484375, 1.38153076171875, 1.4336090087890625, 1.485687255859375, 1.5377655029296875, 1.58984375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 3.0, 4.0, 4.0, 6.0, 10.0, 9.0, 12.0, 12.0, 20.0, 34.0, 41.0, 48.0, 75.0, 126.0, 215.0, 126.0, 66.0, 57.0, 36.0, 23.0, 16.0, 13.0, 11.0, 11.0, 5.0, 4.0, 8.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0003428459167480469, -0.0003337189555168152, -0.0003245919942855835, -0.0003154650330543518, -0.0003063380718231201, -0.00029721111059188843, -0.00028808414936065674, -0.00027895718812942505, -0.00026983022689819336, -0.00026070326566696167, -0.00025157630443573, -0.0002424493432044983, -0.0002333223819732666, -0.0002241954207420349, -0.00021506845951080322, -0.00020594149827957153, -0.00019681453704833984, -0.00018768757581710815, -0.00017856061458587646, -0.00016943365335464478, -0.00016030669212341309, -0.0001511797308921814, -0.0001420527696609497, -0.00013292580842971802, -0.00012379884719848633, -0.00011467188596725464, -0.00010554492473602295, -9.641796350479126e-05, -8.729100227355957e-05, -7.816404104232788e-05, -6.903707981109619e-05, -5.99101185798645e-05, -5.078315734863281e-05, -4.165619611740112e-05, -3.2529234886169434e-05, -2.3402273654937744e-05, -1.4275312423706055e-05, -5.148351192474365e-06, 3.978610038757324e-06, 1.3105571269989014e-05, 2.2232532501220703e-05, 3.135949373245239e-05, 4.048645496368408e-05, 4.961341619491577e-05, 5.874037742614746e-05, 6.786733865737915e-05, 7.699429988861084e-05, 8.612126111984253e-05, 9.524822235107422e-05, 0.00010437518358230591, 0.0001135021448135376, 0.0001226291060447693, 0.00013175606727600098, 0.00014088302850723267, 0.00015000998973846436, 0.00015913695096969604, 0.00016826391220092773, 0.00017739087343215942, 0.0001865178346633911, 0.0001956447958946228, 0.0002047717571258545, 0.00021389871835708618, 0.00022302567958831787, 0.00023215264081954956, 0.00024127960205078125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 8.0, 11.0, 5.0, 10.0, 14.0, 19.0, 23.0, 35.0, 51.0, 92.0, 118.0, 235.0, 380.0, 739.0, 1694.0, 4341.0, 15125.0, 122526.0, 801989.0, 82297.0, 12045.0, 3623.0, 1487.0, 706.0, 362.0, 225.0, 117.0, 78.0, 49.0, 32.0, 22.0, 19.0, 18.0, 13.0, 14.0, 7.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.525390625, -1.4783477783203125, -1.431304931640625, -1.3842620849609375, -1.33721923828125, -1.2901763916015625, -1.243133544921875, -1.1960906982421875, -1.1490478515625, -1.1020050048828125, -1.054962158203125, -1.0079193115234375, -0.96087646484375, -0.9138336181640625, -0.866790771484375, -0.8197479248046875, -0.772705078125, -0.7256622314453125, -0.678619384765625, -0.6315765380859375, -0.58453369140625, -0.5374908447265625, -0.490447998046875, -0.4434051513671875, -0.3963623046875, -0.3493194580078125, -0.302276611328125, -0.2552337646484375, -0.20819091796875, -0.1611480712890625, -0.114105224609375, -0.0670623779296875, -0.02001953125, 0.0270233154296875, 0.074066162109375, 0.1211090087890625, 0.16815185546875, 0.2151947021484375, 0.262237548828125, 0.3092803955078125, 0.3563232421875, 0.4033660888671875, 0.450408935546875, 0.4974517822265625, 0.54449462890625, 0.5915374755859375, 0.638580322265625, 0.6856231689453125, 0.732666015625, 0.7797088623046875, 0.826751708984375, 0.8737945556640625, 0.92083740234375, 0.9678802490234375, 1.014923095703125, 1.0619659423828125, 1.1090087890625, 1.1560516357421875, 1.203094482421875, 1.2501373291015625, 1.29718017578125, 1.3442230224609375, 1.391265869140625, 1.4383087158203125, 1.4853515625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 5.0, 9.0, 8.0, 13.0, 13.0, 17.0, 20.0, 29.0, 38.0, 34.0, 51.0, 32.0, 68.0, 67.0, 102.0, 74.0, 72.0, 68.0, 50.0, 38.0, 35.0, 29.0, 25.0, 18.0, 21.0, 15.0, 14.0, 5.0, 5.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91064453125, -0.8798599243164062, -0.8490753173828125, -0.8182907104492188, -0.787506103515625, -0.7567214965820312, -0.7259368896484375, -0.6951522827148438, -0.66436767578125, -0.6335830688476562, -0.6027984619140625, -0.5720138549804688, -0.541229248046875, -0.5104446411132812, -0.4796600341796875, -0.44887542724609375, -0.4180908203125, -0.38730621337890625, -0.3565216064453125, -0.32573699951171875, -0.294952392578125, -0.26416778564453125, -0.2333831787109375, -0.20259857177734375, -0.17181396484375, -0.14102935791015625, -0.1102447509765625, -0.07946014404296875, -0.048675537109375, -0.01789093017578125, 0.0128936767578125, 0.04367828369140625, 0.074462890625, 0.10524749755859375, 0.1360321044921875, 0.16681671142578125, 0.197601318359375, 0.22838592529296875, 0.2591705322265625, 0.28995513916015625, 0.32073974609375, 0.35152435302734375, 0.3823089599609375, 0.41309356689453125, 0.443878173828125, 0.47466278076171875, 0.5054473876953125, 0.5362319946289062, 0.5670166015625, 0.5978012084960938, 0.6285858154296875, 0.6593704223632812, 0.690155029296875, 0.7209396362304688, 0.7517242431640625, 0.7825088500976562, 0.81329345703125, 0.8440780639648438, 0.8748626708984375, 0.9056472778320312, 0.936431884765625, 0.9672164916992188, 0.9980010986328125, 1.0287857055664062, 1.0595703125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 8.0, 4.0, 2.0, 11.0, 21.0, 39.0, 86.0, 149.0, 219.0, 209.0, 117.0, 74.0, 34.0, 18.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-40.18266677856445, -39.324249267578125, -38.46583557128906, -37.607418060302734, -36.749000549316406, -35.890586853027344, -35.032169342041016, -34.17375183105469, -33.315338134765625, -32.4569206237793, -31.5985050201416, -30.740089416503906, -29.88167381286621, -29.023258209228516, -28.164840698242188, -27.306425094604492, -26.448007583618164, -25.58959197998047, -24.73117446899414, -23.872758865356445, -23.01434326171875, -22.155925750732422, -21.297510147094727, -20.43909454345703, -19.580677032470703, -18.722261428833008, -17.86384391784668, -17.005428314208984, -16.14701271057129, -15.288596153259277, -14.430179595947266, -13.57176399230957, -12.713348388671875, -11.854931831359863, -10.996516227722168, -10.138099670410156, -9.279684066772461, -8.42126750946045, -7.5628509521484375, -6.704434871673584, -5.8460187911987305, -4.987602710723877, -4.129186630249023, -3.2707700729370117, -2.412353992462158, -1.5539379119873047, -0.695521354675293, 0.16289472579956055, 1.021310806274414, 1.8797270059585571, 2.7381432056427, 3.596559524536133, 4.454975605010986, 5.31339168548584, 6.171808242797852, 7.030224323272705, 7.888640403747559, 8.74705696105957, 9.605472564697266, 10.463889122009277, 11.322305679321289, 12.180721282958984, 13.039137840270996, 13.897554397583008, 14.755970001220703]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 1.0, 4.0, 5.0, 9.0, 19.0, 13.0, 13.0, 27.0, 22.0, 29.0, 29.0, 39.0, 47.0, 64.0, 47.0, 78.0, 50.0, 67.0, 80.0, 46.0, 51.0, 42.0, 33.0, 32.0, 32.0, 26.0, 20.0, 15.0, 24.0, 20.0, 7.0, 7.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-16.31732940673828, -15.909163475036621, -15.500997543334961, -15.0928316116333, -14.68466567993164, -14.276498794555664, -13.868332862854004, -13.460166931152344, -13.052000999450684, -12.643835067749023, -12.235669136047363, -11.827503204345703, -11.419336318969727, -11.011171340942383, -10.603004455566406, -10.194838523864746, -9.786672592163086, -9.378506660461426, -8.970340728759766, -8.562174797058105, -8.154008865356445, -7.745842456817627, -7.337676048278809, -6.929510116577148, -6.521344184875488, -6.113178253173828, -5.705012321472168, -5.29684591293335, -4.8886799812316895, -4.480514049530029, -4.072347640991211, -3.664181709289551, -3.2560157775878906, -2.8478498458862305, -2.439683675765991, -2.031517505645752, -1.6233515739440918, -1.2151856422424316, -0.8070194721221924, -0.3988533020019531, 0.009312629699707031, 0.41747868061065674, 0.8256447315216064, 1.2338107824325562, 1.6419768333435059, 2.050142765045166, 2.4583089351654053, 2.8664751052856445, 3.2746410369873047, 3.682806968688965, 4.090972900390625, 4.499139308929443, 4.9073052406311035, 5.315471172332764, 5.723637580871582, 6.131803512573242, 6.539969444274902, 6.9481353759765625, 7.356301307678223, 7.764467716217041, 8.17263412475586, 8.580799102783203, 8.98896598815918, 9.39713191986084, 9.8052978515625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 6.0, 6.0, 11.0, 16.0, 18.0, 23.0, 34.0, 59.0, 63.0, 78.0, 163.0, 292.0, 955.0, 5298.0, 167839.0, 3999971.0, 16733.0, 1644.0, 464.0, 231.0, 111.0, 73.0, 51.0, 33.0, 29.0, 17.0, 16.0, 10.0, 12.0, 8.0, 2.0, 5.0, 5.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.8671875, -6.66650390625, -6.4658203125, -6.26513671875, -6.064453125, -5.86376953125, -5.6630859375, -5.46240234375, -5.26171875, -5.06103515625, -4.8603515625, -4.65966796875, -4.458984375, -4.25830078125, -4.0576171875, -3.85693359375, -3.65625, -3.45556640625, -3.2548828125, -3.05419921875, -2.853515625, -2.65283203125, -2.4521484375, -2.25146484375, -2.05078125, -1.85009765625, -1.6494140625, -1.44873046875, -1.248046875, -1.04736328125, -0.8466796875, -0.64599609375, -0.4453125, -0.24462890625, -0.0439453125, 0.15673828125, 0.357421875, 0.55810546875, 0.7587890625, 0.95947265625, 1.16015625, 1.36083984375, 1.5615234375, 1.76220703125, 1.962890625, 2.16357421875, 2.3642578125, 2.56494140625, 2.765625, 2.96630859375, 3.1669921875, 3.36767578125, 3.568359375, 3.76904296875, 3.9697265625, 4.17041015625, 4.37109375, 4.57177734375, 4.7724609375, 4.97314453125, 5.173828125, 5.37451171875, 5.5751953125, 5.77587890625, 5.9765625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 6.0, 6.0, 26.0, 18.0, 24.0, 31.0, 44.0, 39.0, 51.0, 69.0, 65.0, 77.0, 78.0, 74.0, 72.0, 64.0, 57.0, 44.0, 45.0, 24.0, 24.0, 17.0, 17.0, 10.0, 12.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.046875, -1.0189285278320312, -0.9909820556640625, -0.9630355834960938, -0.935089111328125, -0.9071426391601562, -0.8791961669921875, -0.8512496948242188, -0.82330322265625, -0.7953567504882812, -0.7674102783203125, -0.7394638061523438, -0.711517333984375, -0.6835708618164062, -0.6556243896484375, -0.6276779174804688, -0.5997314453125, -0.5717849731445312, -0.5438385009765625, -0.5158920288085938, -0.487945556640625, -0.45999908447265625, -0.4320526123046875, -0.40410614013671875, -0.37615966796875, -0.34821319580078125, -0.3202667236328125, -0.29232025146484375, -0.264373779296875, -0.23642730712890625, -0.2084808349609375, -0.18053436279296875, -0.152587890625, -0.12464141845703125, -0.0966949462890625, -0.06874847412109375, -0.040802001953125, -0.01285552978515625, 0.0150909423828125, 0.04303741455078125, 0.07098388671875, 0.09893035888671875, 0.1268768310546875, 0.15482330322265625, 0.182769775390625, 0.21071624755859375, 0.2386627197265625, 0.26660919189453125, 0.2945556640625, 0.32250213623046875, 0.3504486083984375, 0.37839508056640625, 0.406341552734375, 0.43428802490234375, 0.4622344970703125, 0.49018096923828125, 0.51812744140625, 0.5460739135742188, 0.5740203857421875, 0.6019668579101562, 0.629913330078125, 0.6578598022460938, 0.6858062744140625, 0.7137527465820312, 0.74169921875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 7.0, 4.0, 4.0, 18.0, 20.0, 31.0, 52.0, 72.0, 93.0, 169.0, 297.0, 512.0, 940.0, 2005.0, 5138.0, 16951.0, 89323.0, 3387329.0, 633791.0, 41627.0, 9662.0, 3254.0, 1364.0, 663.0, 379.0, 214.0, 123.0, 72.0, 59.0, 44.0, 27.0, 13.0, 10.0, 7.0, 2.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.302734375, -3.219757080078125, -3.13677978515625, -3.053802490234375, -2.9708251953125, -2.887847900390625, -2.80487060546875, -2.721893310546875, -2.638916015625, -2.555938720703125, -2.47296142578125, -2.389984130859375, -2.3070068359375, -2.224029541015625, -2.14105224609375, -2.058074951171875, -1.97509765625, -1.892120361328125, -1.80914306640625, -1.726165771484375, -1.6431884765625, -1.560211181640625, -1.47723388671875, -1.394256591796875, -1.311279296875, -1.228302001953125, -1.14532470703125, -1.062347412109375, -0.9793701171875, -0.896392822265625, -0.81341552734375, -0.730438232421875, -0.6474609375, -0.564483642578125, -0.48150634765625, -0.398529052734375, -0.3155517578125, -0.232574462890625, -0.14959716796875, -0.066619873046875, 0.016357421875, 0.099334716796875, 0.18231201171875, 0.265289306640625, 0.3482666015625, 0.431243896484375, 0.51422119140625, 0.597198486328125, 0.68017578125, 0.763153076171875, 0.84613037109375, 0.929107666015625, 1.0120849609375, 1.095062255859375, 1.17803955078125, 1.261016845703125, 1.343994140625, 1.426971435546875, 1.50994873046875, 1.592926025390625, 1.6759033203125, 1.758880615234375, 1.84185791015625, 1.924835205078125, 2.0078125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 7.0, 8.0, 11.0, 13.0, 25.0, 43.0, 65.0, 122.0, 337.0, 1074.0, 1487.0, 481.0, 197.0, 79.0, 38.0, 19.0, 24.0, 14.0, 7.0, 5.0, 8.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.919921875, -2.826202392578125, -2.73248291015625, -2.638763427734375, -2.5450439453125, -2.451324462890625, -2.35760498046875, -2.263885498046875, -2.170166015625, -2.076446533203125, -1.98272705078125, -1.889007568359375, -1.7952880859375, -1.701568603515625, -1.60784912109375, -1.514129638671875, -1.42041015625, -1.326690673828125, -1.23297119140625, -1.139251708984375, -1.0455322265625, -0.951812744140625, -0.85809326171875, -0.764373779296875, -0.670654296875, -0.576934814453125, -0.48321533203125, -0.389495849609375, -0.2957763671875, -0.202056884765625, -0.10833740234375, -0.014617919921875, 0.0791015625, 0.172821044921875, 0.26654052734375, 0.360260009765625, 0.4539794921875, 0.547698974609375, 0.64141845703125, 0.735137939453125, 0.828857421875, 0.922576904296875, 1.01629638671875, 1.110015869140625, 1.2037353515625, 1.297454833984375, 1.39117431640625, 1.484893798828125, 1.57861328125, 1.672332763671875, 1.76605224609375, 1.859771728515625, 1.9534912109375, 2.047210693359375, 2.14093017578125, 2.234649658203125, 2.328369140625, 2.422088623046875, 2.51580810546875, 2.609527587890625, 2.7032470703125, 2.796966552734375, 2.89068603515625, 2.984405517578125, 3.078125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 8.0, 8.0, 15.0, 36.0, 82.0, 211.0, 262.0, 191.0, 115.0, 41.0, 8.0, 9.0, 3.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-37.767578125, -36.95790481567383, -36.14822769165039, -35.33855438232422, -34.52887725830078, -33.71920394897461, -32.90953063964844, -32.099853515625, -31.290180206298828, -30.480504989624023, -29.67082977294922, -28.861156463623047, -28.051481246948242, -27.241806030273438, -26.432130813598633, -25.622455596923828, -24.812780380249023, -24.00310516357422, -23.193429946899414, -22.38375473022461, -21.574081420898438, -20.764406204223633, -19.954730987548828, -19.145055770874023, -18.33538055419922, -17.525705337524414, -16.71603012084961, -15.906355857849121, -15.096681594848633, -14.287006378173828, -13.477331161499023, -12.667655944824219, -11.857982635498047, -11.048307418823242, -10.238633155822754, -9.42895793914795, -8.619283676147461, -7.809608459472656, -6.999933242797852, -6.190258502960205, -5.380583763122559, -4.570909023284912, -3.7612340450286865, -2.951559066772461, -2.1418843269348145, -1.332209587097168, -0.5225343704223633, 0.2871403694152832, 1.0968151092529297, 1.9064899682998657, 2.7161648273468018, 3.5258398056030273, 4.335514545440674, 5.14518928527832, 5.954864501953125, 6.7645392417907715, 7.574213981628418, 8.383889198303223, 9.193563461303711, 10.003238677978516, 10.81291389465332, 11.622588157653809, 12.432263374328613, 13.241937637329102, 14.051612854003906]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 9.0, 7.0, 3.0, 6.0, 15.0, 10.0, 19.0, 28.0, 25.0, 24.0, 40.0, 45.0, 47.0, 50.0, 57.0, 50.0, 51.0, 44.0, 49.0, 54.0, 52.0, 46.0, 56.0, 34.0, 39.0, 28.0, 18.0, 23.0, 18.0, 20.0, 10.0, 6.0, 5.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.66554069519043, -8.375518798828125, -8.08549690246582, -7.795474529266357, -7.505452632904053, -7.215430736541748, -6.925408363342285, -6.6353864669799805, -6.345364570617676, -6.055342674255371, -5.765320777893066, -5.4752984046936035, -5.185276508331299, -4.895254611968994, -4.605232238769531, -4.315210342407227, -4.025188446044922, -3.735166549682617, -3.4451444149017334, -3.1551222801208496, -2.865100383758545, -2.5750784873962402, -2.2850563526153564, -1.9950342178344727, -1.705012321472168, -1.4149903059005737, -1.1249682903289795, -0.8349462747573853, -0.544924259185791, -0.2549022436141968, 0.03511977195739746, 0.32514190673828125, 0.6151638031005859, 0.9051858186721802, 1.1952078342437744, 1.4852298498153687, 1.775251865386963, 2.0652737617492676, 2.3552958965301514, 2.645318031311035, 2.93533992767334, 3.2253618240356445, 3.5153839588165283, 3.805406093597412, 4.095427989959717, 4.3854498863220215, 4.675472259521484, 4.965494155883789, 5.255516052246094, 5.545537948608398, 5.835559844970703, 6.125582218170166, 6.415604114532471, 6.705626010894775, 6.995648384094238, 7.285670280456543, 7.575692176818848, 7.865714073181152, 8.155735969543457, 8.445757865905762, 8.735780715942383, 9.025802612304688, 9.315824508666992, 9.605846405029297, 9.895868301391602]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 9.0, 13.0, 25.0, 14.0, 30.0, 47.0, 45.0, 110.0, 182.0, 297.0, 468.0, 888.0, 1552.0, 2916.0, 6083.0, 13085.0, 33025.0, 108769.0, 476115.0, 294388.0, 67701.0, 23327.0, 9735.0, 4537.0, 2221.0, 1199.0, 675.0, 408.0, 249.0, 120.0, 92.0, 65.0, 40.0, 26.0, 20.0, 16.0, 11.0, 16.0, 6.0, 6.0, 1.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.884765625, -1.825531005859375, -1.76629638671875, -1.707061767578125, -1.6478271484375, -1.588592529296875, -1.52935791015625, -1.470123291015625, -1.410888671875, -1.351654052734375, -1.29241943359375, -1.233184814453125, -1.1739501953125, -1.114715576171875, -1.05548095703125, -0.996246337890625, -0.93701171875, -0.877777099609375, -0.81854248046875, -0.759307861328125, -0.7000732421875, -0.640838623046875, -0.58160400390625, -0.522369384765625, -0.463134765625, -0.403900146484375, -0.34466552734375, -0.285430908203125, -0.2261962890625, -0.166961669921875, -0.10772705078125, -0.048492431640625, 0.0107421875, 0.069976806640625, 0.12921142578125, 0.188446044921875, 0.2476806640625, 0.306915283203125, 0.36614990234375, 0.425384521484375, 0.484619140625, 0.543853759765625, 0.60308837890625, 0.662322998046875, 0.7215576171875, 0.780792236328125, 0.84002685546875, 0.899261474609375, 0.95849609375, 1.017730712890625, 1.07696533203125, 1.136199951171875, 1.1954345703125, 1.254669189453125, 1.31390380859375, 1.373138427734375, 1.432373046875, 1.491607666015625, 1.55084228515625, 1.610076904296875, 1.6693115234375, 1.728546142578125, 1.78778076171875, 1.847015380859375, 1.90625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 9.0, 13.0, 15.0, 26.0, 34.0, 46.0, 43.0, 46.0, 70.0, 84.0, 80.0, 75.0, 80.0, 70.0, 69.0, 55.0, 44.0, 43.0, 31.0, 19.0, 18.0, 16.0, 7.0, 9.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1875, -1.155059814453125, -1.12261962890625, -1.090179443359375, -1.0577392578125, -1.025299072265625, -0.99285888671875, -0.960418701171875, -0.927978515625, -0.895538330078125, -0.86309814453125, -0.830657958984375, -0.7982177734375, -0.765777587890625, -0.73333740234375, -0.700897216796875, -0.66845703125, -0.636016845703125, -0.60357666015625, -0.571136474609375, -0.5386962890625, -0.506256103515625, -0.47381591796875, -0.441375732421875, -0.408935546875, -0.376495361328125, -0.34405517578125, -0.311614990234375, -0.2791748046875, -0.246734619140625, -0.21429443359375, -0.181854248046875, -0.1494140625, -0.116973876953125, -0.08453369140625, -0.052093505859375, -0.0196533203125, 0.012786865234375, 0.04522705078125, 0.077667236328125, 0.110107421875, 0.142547607421875, 0.17498779296875, 0.207427978515625, 0.2398681640625, 0.272308349609375, 0.30474853515625, 0.337188720703125, 0.36962890625, 0.402069091796875, 0.43450927734375, 0.466949462890625, 0.4993896484375, 0.531829833984375, 0.56427001953125, 0.596710205078125, 0.629150390625, 0.661590576171875, 0.69403076171875, 0.726470947265625, 0.7589111328125, 0.791351318359375, 0.82379150390625, 0.856231689453125, 0.888671875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 3.0, 11.0, 9.0, 10.0, 10.0, 16.0, 16.0, 31.0, 44.0, 64.0, 64.0, 104.0, 209.0, 297.0, 509.0, 902.0, 1712.0, 4114.0, 12313.0, 51810.0, 598181.0, 323639.0, 37772.0, 9697.0, 3416.0, 1489.0, 797.0, 453.0, 333.0, 159.0, 121.0, 71.0, 48.0, 43.0, 31.0, 20.0, 9.0, 15.0, 4.0, 4.0, 5.0, 4.0, 0.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.15625, -2.069671630859375, -1.98309326171875, -1.896514892578125, -1.8099365234375, -1.723358154296875, -1.63677978515625, -1.550201416015625, -1.463623046875, -1.377044677734375, -1.29046630859375, -1.203887939453125, -1.1173095703125, -1.030731201171875, -0.94415283203125, -0.857574462890625, -0.77099609375, -0.684417724609375, -0.59783935546875, -0.511260986328125, -0.4246826171875, -0.338104248046875, -0.25152587890625, -0.164947509765625, -0.078369140625, 0.008209228515625, 0.09478759765625, 0.181365966796875, 0.2679443359375, 0.354522705078125, 0.44110107421875, 0.527679443359375, 0.6142578125, 0.700836181640625, 0.78741455078125, 0.873992919921875, 0.9605712890625, 1.047149658203125, 1.13372802734375, 1.220306396484375, 1.306884765625, 1.393463134765625, 1.48004150390625, 1.566619873046875, 1.6531982421875, 1.739776611328125, 1.82635498046875, 1.912933349609375, 1.99951171875, 2.086090087890625, 2.17266845703125, 2.259246826171875, 2.3458251953125, 2.432403564453125, 2.51898193359375, 2.605560302734375, 2.692138671875, 2.778717041015625, 2.86529541015625, 2.951873779296875, 3.0384521484375, 3.125030517578125, 3.21160888671875, 3.298187255859375, 3.384765625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 8.0, 12.0, 8.0, 11.0, 17.0, 19.0, 25.0, 28.0, 34.0, 34.0, 49.0, 64.0, 56.0, 56.0, 52.0, 52.0, 52.0, 61.0, 62.0, 46.0, 48.0, 49.0, 29.0, 30.0, 29.0, 20.0, 17.0, 8.0, 8.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.091796875, -2.993621826171875, -2.89544677734375, -2.797271728515625, -2.6990966796875, -2.600921630859375, -2.50274658203125, -2.404571533203125, -2.306396484375, -2.208221435546875, -2.11004638671875, -2.011871337890625, -1.9136962890625, -1.815521240234375, -1.71734619140625, -1.619171142578125, -1.52099609375, -1.422821044921875, -1.32464599609375, -1.226470947265625, -1.1282958984375, -1.030120849609375, -0.93194580078125, -0.833770751953125, -0.735595703125, -0.637420654296875, -0.53924560546875, -0.441070556640625, -0.3428955078125, -0.244720458984375, -0.14654541015625, -0.048370361328125, 0.0498046875, 0.147979736328125, 0.24615478515625, 0.344329833984375, 0.4425048828125, 0.540679931640625, 0.63885498046875, 0.737030029296875, 0.835205078125, 0.933380126953125, 1.03155517578125, 1.129730224609375, 1.2279052734375, 1.326080322265625, 1.42425537109375, 1.522430419921875, 1.62060546875, 1.718780517578125, 1.81695556640625, 1.915130615234375, 2.0133056640625, 2.111480712890625, 2.20965576171875, 2.307830810546875, 2.406005859375, 2.504180908203125, 2.60235595703125, 2.700531005859375, 2.7987060546875, 2.896881103515625, 2.99505615234375, 3.093231201171875, 3.19140625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 7.0, 12.0, 28.0, 41.0, 48.0, 93.0, 218.0, 529.0, 1699.0, 8802.0, 129641.0, 853964.0, 46842.0, 4819.0, 1057.0, 365.0, 164.0, 84.0, 43.0, 23.0, 16.0, 11.0, 8.0, 5.0, 4.0, 2.0, 4.0, 8.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8466796875, -1.791290283203125, -1.73590087890625, -1.680511474609375, -1.6251220703125, -1.569732666015625, -1.51434326171875, -1.458953857421875, -1.403564453125, -1.348175048828125, -1.29278564453125, -1.237396240234375, -1.1820068359375, -1.126617431640625, -1.07122802734375, -1.015838623046875, -0.96044921875, -0.905059814453125, -0.84967041015625, -0.794281005859375, -0.7388916015625, -0.683502197265625, -0.62811279296875, -0.572723388671875, -0.517333984375, -0.461944580078125, -0.40655517578125, -0.351165771484375, -0.2957763671875, -0.240386962890625, -0.18499755859375, -0.129608154296875, -0.07421875, -0.018829345703125, 0.03656005859375, 0.091949462890625, 0.1473388671875, 0.202728271484375, 0.25811767578125, 0.313507080078125, 0.368896484375, 0.424285888671875, 0.47967529296875, 0.535064697265625, 0.5904541015625, 0.645843505859375, 0.70123291015625, 0.756622314453125, 0.81201171875, 0.867401123046875, 0.92279052734375, 0.978179931640625, 1.0335693359375, 1.088958740234375, 1.14434814453125, 1.199737548828125, 1.255126953125, 1.310516357421875, 1.36590576171875, 1.421295166015625, 1.4766845703125, 1.532073974609375, 1.58746337890625, 1.642852783203125, 1.6982421875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 7.0, 5.0, 8.0, 8.0, 10.0, 17.0, 22.0, 26.0, 31.0, 44.0, 70.0, 84.0, 98.0, 119.0, 130.0, 74.0, 55.0, 43.0, 30.0, 31.0, 31.0, 13.0, 7.0, 7.0, 9.0, 8.0, 2.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00018143653869628906, -0.00017583556473255157, -0.0001702345907688141, -0.0001646336168050766, -0.0001590326428413391, -0.00015343166887760162, -0.00014783069491386414, -0.00014222972095012665, -0.00013662874698638916, -0.00013102777302265167, -0.00012542679905891418, -0.0001198258250951767, -0.00011422485113143921, -0.00010862387716770172, -0.00010302290320396423, -9.742192924022675e-05, -9.182095527648926e-05, -8.621998131275177e-05, -8.061900734901428e-05, -7.50180333852768e-05, -6.94170594215393e-05, -6.381608545780182e-05, -5.821511149406433e-05, -5.261413753032684e-05, -4.7013163566589355e-05, -4.141218960285187e-05, -3.581121563911438e-05, -3.0210241675376892e-05, -2.4609267711639404e-05, -1.9008293747901917e-05, -1.3407319784164429e-05, -7.806345820426941e-06, -2.205371856689453e-06, 3.3956021070480347e-06, 8.996576070785522e-06, 1.459755003452301e-05, 2.0198523998260498e-05, 2.5799497961997986e-05, 3.1400471925735474e-05, 3.700144588947296e-05, 4.260241985321045e-05, 4.820339381694794e-05, 5.3804367780685425e-05, 5.940534174442291e-05, 6.50063157081604e-05, 7.060728967189789e-05, 7.620826363563538e-05, 8.180923759937286e-05, 8.741021156311035e-05, 9.301118552684784e-05, 9.861215949058533e-05, 0.00010421313345432281, 0.0001098141074180603, 0.00011541508138179779, 0.00012101605534553528, 0.00012661702930927277, 0.00013221800327301025, 0.00013781897723674774, 0.00014341995120048523, 0.00014902092516422272, 0.0001546218991279602, 0.0001602228730916977, 0.00016582384705543518, 0.00017142482101917267, 0.00017702579498291016]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 7.0, 4.0, 11.0, 17.0, 18.0, 26.0, 58.0, 76.0, 174.0, 326.0, 718.0, 1741.0, 5540.0, 28626.0, 424940.0, 545520.0, 31742.0, 5702.0, 1888.0, 706.0, 319.0, 152.0, 103.0, 46.0, 24.0, 30.0, 14.0, 18.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99365234375, -0.9539413452148438, -0.9142303466796875, -0.8745193481445312, -0.834808349609375, -0.7950973510742188, -0.7553863525390625, -0.7156753540039062, -0.67596435546875, -0.6362533569335938, -0.5965423583984375, -0.5568313598632812, -0.517120361328125, -0.47740936279296875, -0.4376983642578125, -0.39798736572265625, -0.3582763671875, -0.31856536865234375, -0.2788543701171875, -0.23914337158203125, -0.199432373046875, -0.15972137451171875, -0.1200103759765625, -0.08029937744140625, -0.04058837890625, -0.00087738037109375, 0.0388336181640625, 0.07854461669921875, 0.118255615234375, 0.15796661376953125, 0.1976776123046875, 0.23738861083984375, 0.277099609375, 0.31681060791015625, 0.3565216064453125, 0.39623260498046875, 0.435943603515625, 0.47565460205078125, 0.5153656005859375, 0.5550765991210938, 0.59478759765625, 0.6344985961914062, 0.6742095947265625, 0.7139205932617188, 0.753631591796875, 0.7933425903320312, 0.8330535888671875, 0.8727645874023438, 0.9124755859375, 0.9521865844726562, 0.9918975830078125, 1.0316085815429688, 1.071319580078125, 1.1110305786132812, 1.1507415771484375, 1.1904525756835938, 1.23016357421875, 1.2698745727539062, 1.3095855712890625, 1.3492965698242188, 1.389007568359375, 1.4287185668945312, 1.4684295654296875, 1.5081405639648438, 1.5478515625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 6.0, 19.0, 27.0, 27.0, 23.0, 59.0, 62.0, 100.0, 98.0, 129.0, 96.0, 111.0, 64.0, 57.0, 35.0, 23.0, 21.0, 15.0, 6.0, 6.0, 5.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84228515625, -0.8068313598632812, -0.7713775634765625, -0.7359237670898438, -0.700469970703125, -0.6650161743164062, -0.6295623779296875, -0.5941085815429688, -0.55865478515625, -0.5232009887695312, -0.4877471923828125, -0.45229339599609375, -0.416839599609375, -0.38138580322265625, -0.3459320068359375, -0.31047821044921875, -0.2750244140625, -0.23957061767578125, -0.2041168212890625, -0.16866302490234375, -0.133209228515625, -0.09775543212890625, -0.0623016357421875, -0.02684783935546875, 0.00860595703125, 0.04405975341796875, 0.0795135498046875, 0.11496734619140625, 0.150421142578125, 0.18587493896484375, 0.2213287353515625, 0.25678253173828125, 0.292236328125, 0.32769012451171875, 0.3631439208984375, 0.39859771728515625, 0.434051513671875, 0.46950531005859375, 0.5049591064453125, 0.5404129028320312, 0.57586669921875, 0.6113204956054688, 0.6467742919921875, 0.6822280883789062, 0.717681884765625, 0.7531356811523438, 0.7885894775390625, 0.8240432739257812, 0.8594970703125, 0.8949508666992188, 0.9304046630859375, 0.9658584594726562, 1.001312255859375, 1.0367660522460938, 1.0722198486328125, 1.1076736450195312, 1.14312744140625, 1.1785812377929688, 1.2140350341796875, 1.2494888305664062, 1.284942626953125, 1.3203964233398438, 1.3558502197265625, 1.3913040161132812, 1.4267578125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 14.0, 20.0, 68.0, 120.0, 180.0, 231.0, 177.0, 88.0, 49.0, 16.0, 12.0, 3.0, 3.0, 7.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.99929428100586, -22.270612716674805, -21.54193115234375, -20.813247680664062, -20.084566116333008, -19.355884552001953, -18.6272029876709, -17.898521423339844, -17.169837951660156, -16.4411563873291, -15.71247386932373, -14.983792304992676, -14.255109786987305, -13.52642822265625, -12.797746658325195, -12.069064140319824, -11.34038257598877, -10.611701011657715, -9.883018493652344, -9.154336929321289, -8.425654411315918, -7.696972846984863, -6.96829080581665, -6.2396087646484375, -5.510926723480225, -4.782244682312012, -4.053562641143799, -3.324880838394165, -2.596198797225952, -1.8675167560577393, -1.1388349533081055, -0.4101529121398926, 0.3185291290283203, 1.0472111701965332, 1.7758930921554565, 2.50457501411438, 3.2332570552825928, 3.9619390964508057, 4.6906208992004395, 5.419302940368652, 6.147984981536865, 6.876667022705078, 7.605349063873291, 8.334031105041504, 9.062712669372559, 9.79139518737793, 10.520076751708984, 11.248758316040039, 11.97744083404541, 12.706122398376465, 13.434804916381836, 14.16348648071289, 14.892168998718262, 15.620850563049316, 16.349533081054688, 17.078214645385742, 17.806896209716797, 18.53557777404785, 19.264259338378906, 19.992942810058594, 20.72162437438965, 21.450305938720703, 22.178987503051758, 22.907669067382812, 23.6363525390625]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 6.0, 15.0, 14.0, 31.0, 24.0, 26.0, 33.0, 47.0, 65.0, 51.0, 68.0, 81.0, 99.0, 84.0, 61.0, 53.0, 52.0, 33.0, 35.0, 35.0, 23.0, 23.0, 17.0, 5.0, 11.0, 4.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.379646301269531, -10.89124584197998, -10.402846336364746, -9.914445877075195, -9.426045417785645, -8.937644958496094, -8.44924545288086, -7.960844993591309, -7.472444534301758, -6.984044551849365, -6.4956440925598145, -6.007244110107422, -5.518843650817871, -5.0304436683654785, -4.542043685913086, -4.053643226623535, -3.5652432441711426, -3.076843023300171, -2.588442802429199, -2.1000428199768066, -1.6116424798965454, -1.1232423782348633, -0.6348421573638916, -0.14644193649291992, 0.34195828437805176, 0.8303585052490234, 1.3187587261199951, 1.8071588277816772, 2.2955589294433594, 2.783959150314331, 3.2723593711853027, 3.7607595920562744, 4.249159812927246, 4.737559795379639, 5.2259602546691895, 5.714360237121582, 6.202760696411133, 6.691160678863525, 7.179560661315918, 7.667961120605469, 8.15636157989502, 8.64476203918457, 9.133161544799805, 9.621562004089355, 10.109962463378906, 10.59836196899414, 11.086762428283691, 11.575162887573242, 12.063562393188477, 12.551962852478027, 13.040362358093262, 13.528762817382812, 14.017163276672363, 14.505563735961914, 14.993963241577148, 15.4823637008667, 15.97076416015625, 16.459163665771484, 16.94756507873535, 17.435964584350586, 17.92436408996582, 18.412765502929688, 18.901165008544922, 19.389564514160156, 19.877965927124023]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 0.0, 4.0, 7.0, 10.0, 15.0, 25.0, 43.0, 54.0, 84.0, 152.0, 312.0, 601.0, 1515.0, 3873.0, 11833.0, 43641.0, 251594.0, 3113442.0, 665226.0, 73809.0, 18347.0, 5614.0, 2189.0, 949.0, 424.0, 199.0, 128.0, 53.0, 39.0, 33.0, 21.0, 15.0, 5.0, 6.0, 4.0, 8.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6904296875, -1.6370697021484375, -1.583709716796875, -1.5303497314453125, -1.47698974609375, -1.4236297607421875, -1.370269775390625, -1.3169097900390625, -1.2635498046875, -1.2101898193359375, -1.156829833984375, -1.1034698486328125, -1.05010986328125, -0.9967498779296875, -0.943389892578125, -0.8900299072265625, -0.836669921875, -0.7833099365234375, -0.729949951171875, -0.6765899658203125, -0.62322998046875, -0.5698699951171875, -0.516510009765625, -0.4631500244140625, -0.4097900390625, -0.3564300537109375, -0.303070068359375, -0.2497100830078125, -0.19635009765625, -0.1429901123046875, -0.089630126953125, -0.0362701416015625, 0.01708984375, 0.0704498291015625, 0.123809814453125, 0.1771697998046875, 0.23052978515625, 0.2838897705078125, 0.337249755859375, 0.3906097412109375, 0.4439697265625, 0.4973297119140625, 0.550689697265625, 0.6040496826171875, 0.65740966796875, 0.7107696533203125, 0.764129638671875, 0.8174896240234375, 0.870849609375, 0.9242095947265625, 0.977569580078125, 1.0309295654296875, 1.08428955078125, 1.1376495361328125, 1.191009521484375, 1.2443695068359375, 1.2977294921875, 1.3510894775390625, 1.404449462890625, 1.4578094482421875, 1.51116943359375, 1.5645294189453125, 1.617889404296875, 1.6712493896484375, 1.724609375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 8.0, 0.0, 10.0, 10.0, 9.0, 19.0, 23.0, 29.0, 39.0, 41.0, 48.0, 49.0, 54.0, 70.0, 66.0, 76.0, 55.0, 63.0, 55.0, 48.0, 59.0, 28.0, 36.0, 26.0, 29.0, 23.0, 15.0, 5.0, 7.0, 8.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66552734375, -0.64141845703125, -0.6173095703125, -0.59320068359375, -0.569091796875, -0.54498291015625, -0.5208740234375, -0.49676513671875, -0.47265625, -0.44854736328125, -0.4244384765625, -0.40032958984375, -0.376220703125, -0.35211181640625, -0.3280029296875, -0.30389404296875, -0.27978515625, -0.25567626953125, -0.2315673828125, -0.20745849609375, -0.183349609375, -0.15924072265625, -0.1351318359375, -0.11102294921875, -0.0869140625, -0.06280517578125, -0.0386962890625, -0.01458740234375, 0.009521484375, 0.03363037109375, 0.0577392578125, 0.08184814453125, 0.10595703125, 0.13006591796875, 0.1541748046875, 0.17828369140625, 0.202392578125, 0.22650146484375, 0.2506103515625, 0.27471923828125, 0.298828125, 0.32293701171875, 0.3470458984375, 0.37115478515625, 0.395263671875, 0.41937255859375, 0.4434814453125, 0.46759033203125, 0.49169921875, 0.51580810546875, 0.5399169921875, 0.56402587890625, 0.588134765625, 0.61224365234375, 0.6363525390625, 0.66046142578125, 0.6845703125, 0.70867919921875, 0.7327880859375, 0.75689697265625, 0.781005859375, 0.80511474609375, 0.8292236328125, 0.85333251953125, 0.87744140625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 0.0, 4.0, 6.0, 9.0, 19.0, 21.0, 31.0, 56.0, 99.0, 182.0, 348.0, 875.0, 2510.0, 10155.0, 73365.0, 3184223.0, 868373.0, 42226.0, 8045.0, 2299.0, 753.0, 334.0, 152.0, 82.0, 31.0, 22.0, 10.0, 12.0, 6.0, 7.0, 5.0, 7.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.970703125, -2.8712158203125, -2.771728515625, -2.6722412109375, -2.57275390625, -2.4732666015625, -2.373779296875, -2.2742919921875, -2.1748046875, -2.0753173828125, -1.975830078125, -1.8763427734375, -1.77685546875, -1.6773681640625, -1.577880859375, -1.4783935546875, -1.37890625, -1.2794189453125, -1.179931640625, -1.0804443359375, -0.98095703125, -0.8814697265625, -0.781982421875, -0.6824951171875, -0.5830078125, -0.4835205078125, -0.384033203125, -0.2845458984375, -0.18505859375, -0.0855712890625, 0.013916015625, 0.1134033203125, 0.212890625, 0.3123779296875, 0.411865234375, 0.5113525390625, 0.61083984375, 0.7103271484375, 0.809814453125, 0.9093017578125, 1.0087890625, 1.1082763671875, 1.207763671875, 1.3072509765625, 1.40673828125, 1.5062255859375, 1.605712890625, 1.7052001953125, 1.8046875, 1.9041748046875, 2.003662109375, 2.1031494140625, 2.20263671875, 2.3021240234375, 2.401611328125, 2.5010986328125, 2.6005859375, 2.7000732421875, 2.799560546875, 2.8990478515625, 2.99853515625, 3.0980224609375, 3.197509765625, 3.2969970703125, 3.396484375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 7.0, 7.0, 10.0, 14.0, 18.0, 27.0, 43.0, 49.0, 102.0, 173.0, 317.0, 598.0, 996.0, 749.0, 352.0, 198.0, 126.0, 78.0, 53.0, 41.0, 29.0, 13.0, 15.0, 10.0, 10.0, 9.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-2.759765625, -2.682464599609375, -2.60516357421875, -2.527862548828125, -2.4505615234375, -2.373260498046875, -2.29595947265625, -2.218658447265625, -2.141357421875, -2.064056396484375, -1.98675537109375, -1.909454345703125, -1.8321533203125, -1.754852294921875, -1.67755126953125, -1.600250244140625, -1.52294921875, -1.445648193359375, -1.36834716796875, -1.291046142578125, -1.2137451171875, -1.136444091796875, -1.05914306640625, -0.981842041015625, -0.904541015625, -0.827239990234375, -0.74993896484375, -0.672637939453125, -0.5953369140625, -0.518035888671875, -0.44073486328125, -0.363433837890625, -0.2861328125, -0.208831787109375, -0.13153076171875, -0.054229736328125, 0.0230712890625, 0.100372314453125, 0.17767333984375, 0.254974365234375, 0.332275390625, 0.409576416015625, 0.48687744140625, 0.564178466796875, 0.6414794921875, 0.718780517578125, 0.79608154296875, 0.873382568359375, 0.95068359375, 1.027984619140625, 1.10528564453125, 1.182586669921875, 1.2598876953125, 1.337188720703125, 1.41448974609375, 1.491790771484375, 1.569091796875, 1.646392822265625, 1.72369384765625, 1.800994873046875, 1.8782958984375, 1.955596923828125, 2.03289794921875, 2.110198974609375, 2.1875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 2.0, 8.0, 18.0, 46.0, 187.0, 268.0, 253.0, 136.0, 40.0, 17.0, 11.0, 5.0, 1.0, 4.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.34859848022461, -26.282636642456055, -25.216676712036133, -24.150714874267578, -23.084754943847656, -22.0187931060791, -20.952831268310547, -19.886871337890625, -18.82090950012207, -17.754947662353516, -16.688987731933594, -15.623025894165039, -14.5570650100708, -13.491104125976562, -12.425142288208008, -11.35918140411377, -10.293220520019531, -9.227259635925293, -8.161298751831055, -7.0953369140625, -6.029376029968262, -4.963415145874023, -3.897453784942627, -2.8314924240112305, -1.7655315399169922, -0.6995704174041748, 0.3663907051086426, 1.43235182762146, 2.4983129501342773, 3.5642738342285156, 4.630235195159912, 5.696196556091309, 6.762157440185547, 7.828118324279785, 8.894079208374023, 9.960041046142578, 11.026001930236816, 12.091962814331055, 13.15792465209961, 14.223885536193848, 15.289846420288086, 16.35580825805664, 17.421768188476562, 18.487730026245117, 19.553691864013672, 20.619651794433594, 21.68561363220215, 22.751575469970703, 23.817535400390625, 24.88349723815918, 25.9494571685791, 27.015419006347656, 28.081378936767578, 29.147340774536133, 30.213302612304688, 31.27926254272461, 32.34522247314453, 33.41118240356445, 34.47714614868164, 35.54310607910156, 36.609066009521484, 37.675025939941406, 38.740989685058594, 39.806949615478516, 40.8729133605957]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 3.0, 5.0, 6.0, 9.0, 17.0, 16.0, 17.0, 26.0, 40.0, 29.0, 32.0, 42.0, 43.0, 39.0, 65.0, 57.0, 66.0, 53.0, 65.0, 53.0, 54.0, 41.0, 37.0, 42.0, 14.0, 27.0, 35.0, 20.0, 8.0, 15.0, 13.0, 3.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.222214698791504, -9.837581634521484, -9.452949523925781, -9.068316459655762, -8.683683395385742, -8.299050331115723, -7.914417743682861, -7.52978515625, -7.1451520919799805, -6.760519027709961, -6.3758864402771, -5.991253852844238, -5.606620788574219, -5.221987724304199, -4.837355136871338, -4.452722549438477, -4.068089485168457, -3.6834566593170166, -3.298823833465576, -2.9141910076141357, -2.5295581817626953, -2.144925355911255, -1.7602925300598145, -1.375659704208374, -0.9910268783569336, -0.6063940525054932, -0.22176122665405273, 0.1628715991973877, 0.5475044250488281, 0.9321372509002686, 1.316770076751709, 1.7014029026031494, 2.0860366821289062, 2.4706695079803467, 2.855302333831787, 3.2399351596832275, 3.624567985534668, 4.0092010498046875, 4.393833637237549, 4.77846622467041, 5.16309928894043, 5.547732353210449, 5.9323649406433105, 6.316997528076172, 6.701630592346191, 7.086263656616211, 7.470896244049072, 7.855528831481934, 8.240161895751953, 8.624794960021973, 9.009428024291992, 9.394060134887695, 9.778693199157715, 10.163326263427734, 10.547958374023438, 10.932591438293457, 11.317224502563477, 11.701857566833496, 12.086490631103516, 12.471122741699219, 12.855755805969238, 13.240388870239258, 13.625020980834961, 14.00965404510498, 14.394287109375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 6.0, 4.0, 5.0, 12.0, 19.0, 18.0, 23.0, 47.0, 84.0, 131.0, 247.0, 722.0, 1859.0, 5369.0, 17811.0, 73208.0, 414061.0, 431744.0, 75796.0, 18673.0, 5364.0, 1921.0, 759.0, 308.0, 168.0, 63.0, 38.0, 25.0, 30.0, 10.0, 8.0, 9.0, 6.0, 1.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.14453125, -3.054718017578125, -2.96490478515625, -2.875091552734375, -2.7852783203125, -2.695465087890625, -2.60565185546875, -2.515838623046875, -2.426025390625, -2.336212158203125, -2.24639892578125, -2.156585693359375, -2.0667724609375, -1.976959228515625, -1.88714599609375, -1.797332763671875, -1.70751953125, -1.617706298828125, -1.52789306640625, -1.438079833984375, -1.3482666015625, -1.258453369140625, -1.16864013671875, -1.078826904296875, -0.989013671875, -0.899200439453125, -0.80938720703125, -0.719573974609375, -0.6297607421875, -0.539947509765625, -0.45013427734375, -0.360321044921875, -0.2705078125, -0.180694580078125, -0.09088134765625, -0.001068115234375, 0.0887451171875, 0.178558349609375, 0.26837158203125, 0.358184814453125, 0.447998046875, 0.537811279296875, 0.62762451171875, 0.717437744140625, 0.8072509765625, 0.897064208984375, 0.98687744140625, 1.076690673828125, 1.16650390625, 1.256317138671875, 1.34613037109375, 1.435943603515625, 1.5257568359375, 1.615570068359375, 1.70538330078125, 1.795196533203125, 1.885009765625, 1.974822998046875, 2.06463623046875, 2.154449462890625, 2.2442626953125, 2.334075927734375, 2.42388916015625, 2.513702392578125, 2.603515625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 11.0, 10.0, 11.0, 21.0, 24.0, 22.0, 41.0, 46.0, 45.0, 40.0, 58.0, 62.0, 72.0, 82.0, 61.0, 78.0, 51.0, 43.0, 47.0, 30.0, 28.0, 31.0, 25.0, 23.0, 9.0, 4.0, 8.0, 9.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69873046875, -0.6732864379882812, -0.6478424072265625, -0.6223983764648438, -0.596954345703125, -0.5715103149414062, -0.5460662841796875, -0.5206222534179688, -0.49517822265625, -0.46973419189453125, -0.4442901611328125, -0.41884613037109375, -0.393402099609375, -0.36795806884765625, -0.3425140380859375, -0.31707000732421875, -0.2916259765625, -0.26618194580078125, -0.2407379150390625, -0.21529388427734375, -0.189849853515625, -0.16440582275390625, -0.1389617919921875, -0.11351776123046875, -0.08807373046875, -0.06262969970703125, -0.0371856689453125, -0.01174163818359375, 0.013702392578125, 0.03914642333984375, 0.0645904541015625, 0.09003448486328125, 0.115478515625, 0.14092254638671875, 0.1663665771484375, 0.19181060791015625, 0.217254638671875, 0.24269866943359375, 0.2681427001953125, 0.29358673095703125, 0.31903076171875, 0.34447479248046875, 0.3699188232421875, 0.39536285400390625, 0.420806884765625, 0.44625091552734375, 0.4716949462890625, 0.49713897705078125, 0.5225830078125, 0.5480270385742188, 0.5734710693359375, 0.5989151000976562, 0.624359130859375, 0.6498031616210938, 0.6752471923828125, 0.7006912231445312, 0.72613525390625, 0.7515792846679688, 0.7770233154296875, 0.8024673461914062, 0.827911376953125, 0.8533554077148438, 0.8787994384765625, 0.9042434692382812, 0.9296875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 8.0, 3.0, 6.0, 2.0, 16.0, 21.0, 32.0, 45.0, 55.0, 98.0, 122.0, 222.0, 340.0, 536.0, 939.0, 1862.0, 4496.0, 19923.0, 275604.0, 702171.0, 31149.0, 5975.0, 2226.0, 1072.0, 633.0, 341.0, 206.0, 141.0, 96.0, 75.0, 44.0, 29.0, 17.0, 17.0, 11.0, 9.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.09375, -3.953125, -3.8125, -3.671875, -3.53125, -3.390625, -3.25, -3.109375, -2.96875, -2.828125, -2.6875, -2.546875, -2.40625, -2.265625, -2.125, -1.984375, -1.84375, -1.703125, -1.5625, -1.421875, -1.28125, -1.140625, -1.0, -0.859375, -0.71875, -0.578125, -0.4375, -0.296875, -0.15625, -0.015625, 0.125, 0.265625, 0.40625, 0.546875, 0.6875, 0.828125, 0.96875, 1.109375, 1.25, 1.390625, 1.53125, 1.671875, 1.8125, 1.953125, 2.09375, 2.234375, 2.375, 2.515625, 2.65625, 2.796875, 2.9375, 3.078125, 3.21875, 3.359375, 3.5, 3.640625, 3.78125, 3.921875, 4.0625, 4.203125, 4.34375, 4.484375, 4.625, 4.765625, 4.90625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 4.0, 2.0, 4.0, 6.0, 15.0, 9.0, 8.0, 10.0, 13.0, 11.0, 18.0, 25.0, 30.0, 36.0, 32.0, 27.0, 42.0, 50.0, 52.0, 60.0, 60.0, 55.0, 40.0, 50.0, 39.0, 48.0, 31.0, 38.0, 27.0, 34.0, 21.0, 26.0, 17.0, 14.0, 10.0, 10.0, 9.0, 5.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.826171875, -2.7342529296875, -2.642333984375, -2.5504150390625, -2.45849609375, -2.3665771484375, -2.274658203125, -2.1827392578125, -2.0908203125, -1.9989013671875, -1.906982421875, -1.8150634765625, -1.72314453125, -1.6312255859375, -1.539306640625, -1.4473876953125, -1.35546875, -1.2635498046875, -1.171630859375, -1.0797119140625, -0.98779296875, -0.8958740234375, -0.803955078125, -0.7120361328125, -0.6201171875, -0.5281982421875, -0.436279296875, -0.3443603515625, -0.25244140625, -0.1605224609375, -0.068603515625, 0.0233154296875, 0.115234375, 0.2071533203125, 0.299072265625, 0.3909912109375, 0.48291015625, 0.5748291015625, 0.666748046875, 0.7586669921875, 0.8505859375, 0.9425048828125, 1.034423828125, 1.1263427734375, 1.21826171875, 1.3101806640625, 1.402099609375, 1.4940185546875, 1.5859375, 1.6778564453125, 1.769775390625, 1.8616943359375, 1.95361328125, 2.0455322265625, 2.137451171875, 2.2293701171875, 2.3212890625, 2.4132080078125, 2.505126953125, 2.5970458984375, 2.68896484375, 2.7808837890625, 2.872802734375, 2.9647216796875, 3.056640625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 8.0, 8.0, 7.0, 10.0, 12.0, 18.0, 37.0, 39.0, 46.0, 60.0, 72.0, 107.0, 141.0, 290.0, 526.0, 1053.0, 2335.0, 6793.0, 27471.0, 175363.0, 712295.0, 95532.0, 17692.0, 4802.0, 1825.0, 778.0, 421.0, 246.0, 149.0, 98.0, 92.0, 57.0, 44.0, 40.0, 23.0, 19.0, 13.0, 9.0, 5.0, 5.0, 2.0, 0.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.0634765625, -1.0325164794921875, -1.001556396484375, -0.9705963134765625, -0.93963623046875, -0.9086761474609375, -0.877716064453125, -0.8467559814453125, -0.8157958984375, -0.7848358154296875, -0.753875732421875, -0.7229156494140625, -0.69195556640625, -0.6609954833984375, -0.630035400390625, -0.5990753173828125, -0.568115234375, -0.5371551513671875, -0.506195068359375, -0.4752349853515625, -0.44427490234375, -0.4133148193359375, -0.382354736328125, -0.3513946533203125, -0.3204345703125, -0.2894744873046875, -0.258514404296875, -0.2275543212890625, -0.19659423828125, -0.1656341552734375, -0.134674072265625, -0.1037139892578125, -0.07275390625, -0.0417938232421875, -0.010833740234375, 0.0201263427734375, 0.05108642578125, 0.0820465087890625, 0.113006591796875, 0.1439666748046875, 0.1749267578125, 0.2058868408203125, 0.236846923828125, 0.2678070068359375, 0.29876708984375, 0.3297271728515625, 0.360687255859375, 0.3916473388671875, 0.422607421875, 0.4535675048828125, 0.484527587890625, 0.5154876708984375, 0.54644775390625, 0.5774078369140625, 0.608367919921875, 0.6393280029296875, 0.6702880859375, 0.7012481689453125, 0.732208251953125, 0.7631683349609375, 0.79412841796875, 0.8250885009765625, 0.856048583984375, 0.8870086669921875, 0.91796875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 0.0, 6.0, 10.0, 8.0, 9.0, 14.0, 15.0, 19.0, 21.0, 27.0, 37.0, 42.0, 65.0, 67.0, 115.0, 128.0, 89.0, 69.0, 51.0, 39.0, 31.0, 22.0, 27.0, 11.0, 9.0, 24.0, 2.0, 10.0, 7.0, 5.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00020432472229003906, -0.00019773654639720917, -0.00019114837050437927, -0.00018456019461154938, -0.00017797201871871948, -0.0001713838428258896, -0.0001647956669330597, -0.0001582074910402298, -0.0001516193151473999, -0.00014503113925457, -0.0001384429633617401, -0.00013185478746891022, -0.00012526661157608032, -0.00011867843568325043, -0.00011209025979042053, -0.00010550208389759064, -9.891390800476074e-05, -9.232573211193085e-05, -8.573755621910095e-05, -7.914938032627106e-05, -7.256120443344116e-05, -6.597302854061127e-05, -5.938485264778137e-05, -5.279667675495148e-05, -4.620850086212158e-05, -3.962032496929169e-05, -3.303214907646179e-05, -2.6443973183631897e-05, -1.9855797290802002e-05, -1.3267621397972107e-05, -6.679445505142212e-06, -9.12696123123169e-08, 6.496906280517578e-06, 1.3085082173347473e-05, 1.9673258066177368e-05, 2.6261433959007263e-05, 3.284960985183716e-05, 3.943778574466705e-05, 4.602596163749695e-05, 5.261413753032684e-05, 5.920231342315674e-05, 6.579048931598663e-05, 7.237866520881653e-05, 7.896684110164642e-05, 8.555501699447632e-05, 9.214319288730621e-05, 9.873136878013611e-05, 0.000105319544672966, 0.0001119077205657959, 0.0001184958964586258, 0.0001250840723514557, 0.00013167224824428558, 0.00013826042413711548, 0.00014484860002994537, 0.00015143677592277527, 0.00015802495181560516, 0.00016461312770843506, 0.00017120130360126495, 0.00017778947949409485, 0.00018437765538692474, 0.00019096583127975464, 0.00019755400717258453, 0.00020414218306541443, 0.00021073035895824432, 0.00021731853485107422]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 8.0, 5.0, 6.0, 10.0, 14.0, 14.0, 33.0, 44.0, 57.0, 89.0, 131.0, 245.0, 450.0, 843.0, 1866.0, 4513.0, 16779.0, 161697.0, 789208.0, 57151.0, 9332.0, 3079.0, 1342.0, 663.0, 387.0, 207.0, 128.0, 82.0, 50.0, 30.0, 27.0, 19.0, 12.0, 9.0, 6.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.189453125, -1.151458740234375, -1.11346435546875, -1.075469970703125, -1.0374755859375, -0.999481201171875, -0.96148681640625, -0.923492431640625, -0.885498046875, -0.847503662109375, -0.80950927734375, -0.771514892578125, -0.7335205078125, -0.695526123046875, -0.65753173828125, -0.619537353515625, -0.58154296875, -0.543548583984375, -0.50555419921875, -0.467559814453125, -0.4295654296875, -0.391571044921875, -0.35357666015625, -0.315582275390625, -0.277587890625, -0.239593505859375, -0.20159912109375, -0.163604736328125, -0.1256103515625, -0.087615966796875, -0.04962158203125, -0.011627197265625, 0.0263671875, 0.064361572265625, 0.10235595703125, 0.140350341796875, 0.1783447265625, 0.216339111328125, 0.25433349609375, 0.292327880859375, 0.330322265625, 0.368316650390625, 0.40631103515625, 0.444305419921875, 0.4822998046875, 0.520294189453125, 0.55828857421875, 0.596282958984375, 0.63427734375, 0.672271728515625, 0.71026611328125, 0.748260498046875, 0.7862548828125, 0.824249267578125, 0.86224365234375, 0.900238037109375, 0.938232421875, 0.976226806640625, 1.01422119140625, 1.052215576171875, 1.0902099609375, 1.128204345703125, 1.16619873046875, 1.204193115234375, 1.2421875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 10.0, 5.0, 5.0, 11.0, 12.0, 19.0, 16.0, 16.0, 18.0, 20.0, 31.0, 34.0, 53.0, 59.0, 67.0, 76.0, 68.0, 71.0, 62.0, 57.0, 45.0, 40.0, 32.0, 28.0, 27.0, 20.0, 18.0, 14.0, 16.0, 12.0, 8.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.81396484375, -0.7904510498046875, -0.766937255859375, -0.7434234619140625, -0.71990966796875, -0.6963958740234375, -0.672882080078125, -0.6493682861328125, -0.6258544921875, -0.6023406982421875, -0.578826904296875, -0.5553131103515625, -0.53179931640625, -0.5082855224609375, -0.484771728515625, -0.4612579345703125, -0.437744140625, -0.4142303466796875, -0.390716552734375, -0.3672027587890625, -0.34368896484375, -0.3201751708984375, -0.296661376953125, -0.2731475830078125, -0.2496337890625, -0.2261199951171875, -0.202606201171875, -0.1790924072265625, -0.15557861328125, -0.1320648193359375, -0.108551025390625, -0.0850372314453125, -0.0615234375, -0.0380096435546875, -0.014495849609375, 0.0090179443359375, 0.03253173828125, 0.0560455322265625, 0.079559326171875, 0.1030731201171875, 0.1265869140625, 0.1501007080078125, 0.173614501953125, 0.1971282958984375, 0.22064208984375, 0.2441558837890625, 0.267669677734375, 0.2911834716796875, 0.314697265625, 0.3382110595703125, 0.361724853515625, 0.3852386474609375, 0.40875244140625, 0.4322662353515625, 0.455780029296875, 0.4792938232421875, 0.5028076171875, 0.5263214111328125, 0.549835205078125, 0.5733489990234375, 0.59686279296875, 0.6203765869140625, 0.643890380859375, 0.6674041748046875, 0.69091796875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 9.0, 11.0, 16.0, 26.0, 72.0, 106.0, 176.0, 300.0, 139.0, 74.0, 33.0, 19.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.396400451660156, -28.5870361328125, -27.77766990661621, -26.968305587768555, -26.158939361572266, -25.34957504272461, -24.540210723876953, -23.730846405029297, -22.921480178833008, -22.11211585998535, -21.302749633789062, -20.493385314941406, -19.68402099609375, -18.87465476989746, -18.065290451049805, -17.255924224853516, -16.44655990600586, -15.637194633483887, -14.827829360961914, -14.018465042114258, -13.209099769592285, -12.399734497070312, -11.590370178222656, -10.781004905700684, -9.971639633178711, -9.162274360656738, -8.352909088134766, -7.543544769287109, -6.734179496765137, -5.924814224243164, -5.11544942855835, -4.306084632873535, -3.4967174530029297, -2.687352418899536, -1.8779873847961426, -1.068622350692749, -0.25925731658935547, 0.5501079559326172, 1.3594727516174316, 2.168837547302246, 2.9782028198242188, 3.7875678539276123, 4.596932888031006, 5.40629768371582, 6.215662956237793, 7.025028228759766, 7.83439302444458, 8.643757820129395, 9.453123092651367, 10.26248836517334, 11.071853637695312, 11.881217956542969, 12.690583229064941, 13.499948501586914, 14.30931282043457, 15.118678092956543, 15.928043365478516, 16.737407684326172, 17.54677391052246, 18.356138229370117, 19.165504455566406, 19.974868774414062, 20.78423309326172, 21.593597412109375, 22.402963638305664]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 6.0, 7.0, 11.0, 6.0, 8.0, 11.0, 7.0, 10.0, 19.0, 14.0, 22.0, 26.0, 24.0, 31.0, 25.0, 39.0, 35.0, 62.0, 57.0, 58.0, 83.0, 67.0, 44.0, 38.0, 36.0, 36.0, 32.0, 16.0, 21.0, 25.0, 19.0, 19.0, 20.0, 15.0, 20.0, 10.0, 10.0, 7.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.674976348876953, -12.316632270812988, -11.958288192749023, -11.599944114685059, -11.241600036621094, -10.883255958557129, -10.524911880493164, -10.166568756103516, -9.808223724365234, -9.44987964630127, -9.091535568237305, -8.73319149017334, -8.374847412109375, -8.01650333404541, -7.6581597328186035, -7.299815654754639, -6.941472053527832, -6.583127975463867, -6.224783897399902, -5.8664398193359375, -5.508095741271973, -5.149751663208008, -4.791408061981201, -4.433063983917236, -4.0747199058532715, -3.7163758277893066, -3.358031749725342, -2.999687910079956, -2.641343832015991, -2.2829997539520264, -1.9246559143066406, -1.5663118362426758, -1.207967758178711, -0.8496237397193909, -0.4912797212600708, -0.1329357624053955, 0.22540831565856934, 0.5837523937225342, 0.9420962333679199, 1.3004403114318848, 1.6587843894958496, 2.0171284675598145, 2.3754725456237793, 2.733816385269165, 3.09216046333313, 3.4505045413970947, 3.8088483810424805, 4.167192459106445, 4.52553653717041, 4.883880615234375, 5.24222469329834, 5.600568771362305, 5.9589128494262695, 6.317256927490234, 6.675600528717041, 7.033944606781006, 7.392288684844971, 7.7506327629089355, 8.108976364135742, 8.467320442199707, 8.825664520263672, 9.184008598327637, 9.542352676391602, 9.900696754455566, 10.259040832519531]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 6.0, 3.0, 1.0, 4.0, 11.0, 8.0, 17.0, 21.0, 43.0, 72.0, 123.0, 211.0, 455.0, 1073.0, 3003.0, 10737.0, 49780.0, 672155.0, 3268646.0, 155146.0, 23507.0, 5889.0, 2013.0, 743.0, 290.0, 148.0, 67.0, 37.0, 19.0, 10.0, 7.0, 14.0, 5.0, 8.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9443359375, -1.8821563720703125, -1.819976806640625, -1.7577972412109375, -1.69561767578125, -1.6334381103515625, -1.571258544921875, -1.5090789794921875, -1.4468994140625, -1.3847198486328125, -1.322540283203125, -1.2603607177734375, -1.19818115234375, -1.1360015869140625, -1.073822021484375, -1.0116424560546875, -0.949462890625, -0.8872833251953125, -0.825103759765625, -0.7629241943359375, -0.70074462890625, -0.6385650634765625, -0.576385498046875, -0.5142059326171875, -0.4520263671875, -0.3898468017578125, -0.327667236328125, -0.2654876708984375, -0.20330810546875, -0.1411285400390625, -0.078948974609375, -0.0167694091796875, 0.04541015625, 0.1075897216796875, 0.169769287109375, 0.2319488525390625, 0.29412841796875, 0.3563079833984375, 0.418487548828125, 0.4806671142578125, 0.5428466796875, 0.6050262451171875, 0.667205810546875, 0.7293853759765625, 0.79156494140625, 0.8537445068359375, 0.915924072265625, 0.9781036376953125, 1.040283203125, 1.1024627685546875, 1.164642333984375, 1.2268218994140625, 1.28900146484375, 1.3511810302734375, 1.413360595703125, 1.4755401611328125, 1.5377197265625, 1.5998992919921875, 1.662078857421875, 1.7242584228515625, 1.78643798828125, 1.8486175537109375, 1.910797119140625, 1.9729766845703125, 2.03515625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 7.0, 11.0, 11.0, 10.0, 12.0, 24.0, 24.0, 37.0, 31.0, 44.0, 42.0, 55.0, 52.0, 73.0, 74.0, 70.0, 70.0, 41.0, 61.0, 39.0, 43.0, 38.0, 29.0, 24.0, 19.0, 9.0, 13.0, 8.0, 7.0, 7.0, 3.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67919921875, -0.6547927856445312, -0.6303863525390625, -0.6059799194335938, -0.581573486328125, -0.5571670532226562, -0.5327606201171875, -0.5083541870117188, -0.48394775390625, -0.45954132080078125, -0.4351348876953125, -0.41072845458984375, -0.386322021484375, -0.36191558837890625, -0.3375091552734375, -0.31310272216796875, -0.2886962890625, -0.26428985595703125, -0.2398834228515625, -0.21547698974609375, -0.191070556640625, -0.16666412353515625, -0.1422576904296875, -0.11785125732421875, -0.09344482421875, -0.06903839111328125, -0.0446319580078125, -0.02022552490234375, 0.004180908203125, 0.02858734130859375, 0.0529937744140625, 0.07740020751953125, 0.101806640625, 0.12621307373046875, 0.1506195068359375, 0.17502593994140625, 0.199432373046875, 0.22383880615234375, 0.2482452392578125, 0.27265167236328125, 0.29705810546875, 0.32146453857421875, 0.3458709716796875, 0.37027740478515625, 0.394683837890625, 0.41909027099609375, 0.4434967041015625, 0.46790313720703125, 0.4923095703125, 0.5167160034179688, 0.5411224365234375, 0.5655288696289062, 0.589935302734375, 0.6143417358398438, 0.6387481689453125, 0.6631546020507812, 0.68756103515625, 0.7119674682617188, 0.7363739013671875, 0.7607803344726562, 0.785186767578125, 0.8095932006835938, 0.8339996337890625, 0.8584060668945312, 0.8828125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 8.0, 12.0, 20.0, 32.0, 54.0, 115.0, 365.0, 1009.0, 4373.0, 38722.0, 3331925.0, 792442.0, 20633.0, 3075.0, 832.0, 317.0, 164.0, 82.0, 41.0, 22.0, 20.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.84765625, -3.71441650390625, -3.5811767578125, -3.44793701171875, -3.314697265625, -3.18145751953125, -3.0482177734375, -2.91497802734375, -2.78173828125, -2.64849853515625, -2.5152587890625, -2.38201904296875, -2.248779296875, -2.11553955078125, -1.9822998046875, -1.84906005859375, -1.7158203125, -1.58258056640625, -1.4493408203125, -1.31610107421875, -1.182861328125, -1.04962158203125, -0.9163818359375, -0.78314208984375, -0.64990234375, -0.51666259765625, -0.3834228515625, -0.25018310546875, -0.116943359375, 0.01629638671875, 0.1495361328125, 0.28277587890625, 0.416015625, 0.54925537109375, 0.6824951171875, 0.81573486328125, 0.948974609375, 1.08221435546875, 1.2154541015625, 1.34869384765625, 1.48193359375, 1.61517333984375, 1.7484130859375, 1.88165283203125, 2.014892578125, 2.14813232421875, 2.2813720703125, 2.41461181640625, 2.5478515625, 2.68109130859375, 2.8143310546875, 2.94757080078125, 3.080810546875, 3.21405029296875, 3.3472900390625, 3.48052978515625, 3.61376953125, 3.74700927734375, 3.8802490234375, 4.01348876953125, 4.146728515625, 4.27996826171875, 4.4132080078125, 4.54644775390625, 4.6796875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 5.0, 17.0, 8.0, 14.0, 42.0, 46.0, 86.0, 169.0, 269.0, 617.0, 1188.0, 848.0, 362.0, 146.0, 93.0, 50.0, 43.0, 18.0, 18.0, 5.0, 11.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9677734375, -1.8673858642578125, -1.766998291015625, -1.6666107177734375, -1.56622314453125, -1.4658355712890625, -1.365447998046875, -1.2650604248046875, -1.1646728515625, -1.0642852783203125, -0.963897705078125, -0.8635101318359375, -0.76312255859375, -0.6627349853515625, -0.562347412109375, -0.4619598388671875, -0.361572265625, -0.2611846923828125, -0.160797119140625, -0.0604095458984375, 0.03997802734375, 0.1403656005859375, 0.240753173828125, 0.3411407470703125, 0.4415283203125, 0.5419158935546875, 0.642303466796875, 0.7426910400390625, 0.84307861328125, 0.9434661865234375, 1.043853759765625, 1.1442413330078125, 1.24462890625, 1.3450164794921875, 1.445404052734375, 1.5457916259765625, 1.64617919921875, 1.7465667724609375, 1.846954345703125, 1.9473419189453125, 2.0477294921875, 2.1481170654296875, 2.248504638671875, 2.3488922119140625, 2.44927978515625, 2.5496673583984375, 2.650054931640625, 2.7504425048828125, 2.850830078125, 2.9512176513671875, 3.051605224609375, 3.1519927978515625, 3.25238037109375, 3.3527679443359375, 3.453155517578125, 3.5535430908203125, 3.6539306640625, 3.7543182373046875, 3.854705810546875, 3.9550933837890625, 4.05548095703125, 4.1558685302734375, 4.256256103515625, 4.3566436767578125, 4.45703125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 3.0, 30.0, 81.0, 423.0, 377.0, 65.0, 15.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.91976928710938, -72.07032775878906, -70.22089385986328, -68.37145233154297, -66.52201843261719, -64.67257690429688, -62.82313919067383, -60.97370147705078, -59.124263763427734, -57.27482604980469, -55.42538833618164, -53.575950622558594, -51.72650909423828, -49.8770751953125, -48.02763366699219, -46.17819595336914, -44.328758239746094, -42.47932052612305, -40.6298828125, -38.78044509887695, -36.931007385253906, -35.081565856933594, -33.23212814331055, -31.3826904296875, -29.533252716064453, -27.683815002441406, -25.83437728881836, -23.98493766784668, -22.135499954223633, -20.286062240600586, -18.436622619628906, -16.58718490600586, -14.737747192382812, -12.888309478759766, -11.038870811462402, -9.189432144165039, -7.339994430541992, -5.490556716918945, -3.641118049621582, -1.7916793823242188, 0.057758331298828125, 1.9071965217590332, 3.7566347122192383, 5.606072902679443, 7.455511093139648, 9.304948806762695, 11.154387474060059, 13.003826141357422, 14.853263854980469, 16.702701568603516, 18.552139282226562, 20.401578903198242, 22.25101661682129, 24.100454330444336, 25.949893951416016, 27.799331665039062, 29.64876937866211, 31.498207092285156, 33.3476448059082, 35.19708251953125, 37.04652404785156, 38.895957946777344, 40.745399475097656, 42.5948371887207, 44.44427490234375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 8.0, 12.0, 13.0, 21.0, 27.0, 22.0, 25.0, 43.0, 50.0, 64.0, 55.0, 72.0, 79.0, 70.0, 76.0, 65.0, 38.0, 47.0, 37.0, 40.0, 26.0, 24.0, 26.0, 19.0, 12.0, 10.0, 7.0, 6.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.495662689208984, -15.0447416305542, -14.593820571899414, -14.142899513244629, -13.691978454589844, -13.241057395935059, -12.790136337280273, -12.339214324951172, -11.888294219970703, -11.437373161315918, -10.986452102661133, -10.535531044006348, -10.084609985351562, -9.633688926696777, -9.182767868041992, -8.73184585571289, -8.280924797058105, -7.83000373840332, -7.379082679748535, -6.92816162109375, -6.477240562438965, -6.02631950378418, -5.575397968292236, -5.124476909637451, -4.673555850982666, -4.222634792327881, -3.7717137336730957, -3.3207924365997314, -2.8698713779449463, -2.418950319290161, -1.9680290222167969, -1.5171079635620117, -1.0661869049072266, -0.6152657866477966, -0.1643446683883667, 0.286576509475708, 0.7374975681304932, 1.1884186267852783, 1.6393399238586426, 2.0902609825134277, 2.541182041168213, 2.992103099822998, 3.443024158477783, 3.8939454555511475, 4.344866752624512, 4.795787811279297, 5.246708869934082, 5.697629928588867, 6.148550987243652, 6.5994720458984375, 7.050393104553223, 7.501314163208008, 7.952235221862793, 8.403156280517578, 8.85407829284668, 9.304998397827148, 9.75592041015625, 10.206841468811035, 10.65776252746582, 11.108683586120605, 11.55960464477539, 12.010525703430176, 12.461446762084961, 12.912368774414062, 13.363288879394531]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 7.0, 8.0, 11.0, 18.0, 24.0, 42.0, 70.0, 101.0, 187.0, 397.0, 929.0, 2020.0, 4931.0, 13252.0, 46383.0, 274637.0, 579211.0, 91412.0, 22158.0, 7429.0, 2896.0, 1221.0, 580.0, 269.0, 132.0, 88.0, 47.0, 26.0, 16.0, 14.0, 9.0, 11.0, 4.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.88671875, -2.80474853515625, -2.7227783203125, -2.64080810546875, -2.558837890625, -2.47686767578125, -2.3948974609375, -2.31292724609375, -2.23095703125, -2.14898681640625, -2.0670166015625, -1.98504638671875, -1.903076171875, -1.82110595703125, -1.7391357421875, -1.65716552734375, -1.5751953125, -1.49322509765625, -1.4112548828125, -1.32928466796875, -1.247314453125, -1.16534423828125, -1.0833740234375, -1.00140380859375, -0.91943359375, -0.83746337890625, -0.7554931640625, -0.67352294921875, -0.591552734375, -0.50958251953125, -0.4276123046875, -0.34564208984375, -0.263671875, -0.18170166015625, -0.0997314453125, -0.01776123046875, 0.064208984375, 0.14617919921875, 0.2281494140625, 0.31011962890625, 0.39208984375, 0.47406005859375, 0.5560302734375, 0.63800048828125, 0.719970703125, 0.80194091796875, 0.8839111328125, 0.96588134765625, 1.0478515625, 1.12982177734375, 1.2117919921875, 1.29376220703125, 1.375732421875, 1.45770263671875, 1.5396728515625, 1.62164306640625, 1.70361328125, 1.78558349609375, 1.8675537109375, 1.94952392578125, 2.031494140625, 2.11346435546875, 2.1954345703125, 2.27740478515625, 2.359375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 6.0, 8.0, 8.0, 10.0, 10.0, 12.0, 15.0, 11.0, 24.0, 17.0, 31.0, 24.0, 31.0, 27.0, 44.0, 46.0, 38.0, 44.0, 61.0, 55.0, 56.0, 31.0, 47.0, 45.0, 39.0, 42.0, 37.0, 29.0, 24.0, 26.0, 25.0, 15.0, 11.0, 10.0, 12.0, 6.0, 8.0, 7.0, 3.0, 2.0, 2.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.611328125, -0.5906524658203125, -0.569976806640625, -0.5493011474609375, -0.52862548828125, -0.5079498291015625, -0.487274169921875, -0.4665985107421875, -0.4459228515625, -0.4252471923828125, -0.404571533203125, -0.3838958740234375, -0.36322021484375, -0.3425445556640625, -0.321868896484375, -0.3011932373046875, -0.280517578125, -0.2598419189453125, -0.239166259765625, -0.2184906005859375, -0.19781494140625, -0.1771392822265625, -0.156463623046875, -0.1357879638671875, -0.1151123046875, -0.0944366455078125, -0.073760986328125, -0.0530853271484375, -0.03240966796875, -0.0117340087890625, 0.008941650390625, 0.0296173095703125, 0.05029296875, 0.0709686279296875, 0.091644287109375, 0.1123199462890625, 0.13299560546875, 0.1536712646484375, 0.174346923828125, 0.1950225830078125, 0.2156982421875, 0.2363739013671875, 0.257049560546875, 0.2777252197265625, 0.29840087890625, 0.3190765380859375, 0.339752197265625, 0.3604278564453125, 0.381103515625, 0.4017791748046875, 0.422454833984375, 0.4431304931640625, 0.46380615234375, 0.4844818115234375, 0.505157470703125, 0.5258331298828125, 0.5465087890625, 0.5671844482421875, 0.587860107421875, 0.6085357666015625, 0.62921142578125, 0.6498870849609375, 0.670562744140625, 0.6912384033203125, 0.7119140625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 5.0, 8.0, 7.0, 8.0, 17.0, 13.0, 15.0, 30.0, 40.0, 65.0, 85.0, 123.0, 197.0, 290.0, 508.0, 867.0, 1809.0, 5475.0, 28928.0, 655341.0, 324311.0, 22057.0, 4565.0, 1679.0, 798.0, 445.0, 275.0, 181.0, 129.0, 71.0, 65.0, 49.0, 25.0, 24.0, 19.0, 16.0, 4.0, 3.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.84375, -3.719482421875, -3.59521484375, -3.470947265625, -3.3466796875, -3.222412109375, -3.09814453125, -2.973876953125, -2.849609375, -2.725341796875, -2.60107421875, -2.476806640625, -2.3525390625, -2.228271484375, -2.10400390625, -1.979736328125, -1.85546875, -1.731201171875, -1.60693359375, -1.482666015625, -1.3583984375, -1.234130859375, -1.10986328125, -0.985595703125, -0.861328125, -0.737060546875, -0.61279296875, -0.488525390625, -0.3642578125, -0.239990234375, -0.11572265625, 0.008544921875, 0.1328125, 0.257080078125, 0.38134765625, 0.505615234375, 0.6298828125, 0.754150390625, 0.87841796875, 1.002685546875, 1.126953125, 1.251220703125, 1.37548828125, 1.499755859375, 1.6240234375, 1.748291015625, 1.87255859375, 1.996826171875, 2.12109375, 2.245361328125, 2.36962890625, 2.493896484375, 2.6181640625, 2.742431640625, 2.86669921875, 2.990966796875, 3.115234375, 3.239501953125, 3.36376953125, 3.488037109375, 3.6123046875, 3.736572265625, 3.86083984375, 3.985107421875, 4.109375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 1.0, 5.0, 9.0, 9.0, 17.0, 25.0, 25.0, 18.0, 42.0, 39.0, 57.0, 73.0, 71.0, 85.0, 92.0, 72.0, 72.0, 58.0, 56.0, 44.0, 30.0, 22.0, 18.0, 18.0, 13.0, 6.0, 7.0, 10.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3125, -5.180877685546875, -5.04925537109375, -4.917633056640625, -4.7860107421875, -4.654388427734375, -4.52276611328125, -4.391143798828125, -4.259521484375, -4.127899169921875, -3.99627685546875, -3.864654541015625, -3.7330322265625, -3.601409912109375, -3.46978759765625, -3.338165283203125, -3.20654296875, -3.074920654296875, -2.94329833984375, -2.811676025390625, -2.6800537109375, -2.548431396484375, -2.41680908203125, -2.285186767578125, -2.153564453125, -2.021942138671875, -1.89031982421875, -1.758697509765625, -1.6270751953125, -1.495452880859375, -1.36383056640625, -1.232208251953125, -1.1005859375, -0.968963623046875, -0.83734130859375, -0.705718994140625, -0.5740966796875, -0.442474365234375, -0.31085205078125, -0.179229736328125, -0.047607421875, 0.084014892578125, 0.21563720703125, 0.347259521484375, 0.4788818359375, 0.610504150390625, 0.74212646484375, 0.873748779296875, 1.00537109375, 1.136993408203125, 1.26861572265625, 1.400238037109375, 1.5318603515625, 1.663482666015625, 1.79510498046875, 1.926727294921875, 2.058349609375, 2.189971923828125, 2.32159423828125, 2.453216552734375, 2.5848388671875, 2.716461181640625, 2.84808349609375, 2.979705810546875, 3.111328125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 5.0, 8.0, 10.0, 17.0, 45.0, 62.0, 141.0, 383.0, 1562.0, 15273.0, 970727.0, 56496.0, 2836.0, 567.0, 203.0, 95.0, 54.0, 17.0, 9.0, 9.0, 6.0, 4.0, 5.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.974609375, -2.877593994140625, -2.78057861328125, -2.683563232421875, -2.5865478515625, -2.489532470703125, -2.39251708984375, -2.295501708984375, -2.198486328125, -2.101470947265625, -2.00445556640625, -1.907440185546875, -1.8104248046875, -1.713409423828125, -1.61639404296875, -1.519378662109375, -1.42236328125, -1.325347900390625, -1.22833251953125, -1.131317138671875, -1.0343017578125, -0.937286376953125, -0.84027099609375, -0.743255615234375, -0.646240234375, -0.549224853515625, -0.45220947265625, -0.355194091796875, -0.2581787109375, -0.161163330078125, -0.06414794921875, 0.032867431640625, 0.1298828125, 0.226898193359375, 0.32391357421875, 0.420928955078125, 0.5179443359375, 0.614959716796875, 0.71197509765625, 0.808990478515625, 0.906005859375, 1.003021240234375, 1.10003662109375, 1.197052001953125, 1.2940673828125, 1.391082763671875, 1.48809814453125, 1.585113525390625, 1.68212890625, 1.779144287109375, 1.87615966796875, 1.973175048828125, 2.0701904296875, 2.167205810546875, 2.26422119140625, 2.361236572265625, 2.458251953125, 2.555267333984375, 2.65228271484375, 2.749298095703125, 2.8463134765625, 2.943328857421875, 3.04034423828125, 3.137359619140625, 3.234375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 6.0, 14.0, 17.0, 24.0, 38.0, 51.0, 94.0, 153.0, 250.0, 142.0, 74.0, 43.0, 18.0, 26.0, 14.0, 7.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004303455352783203, -0.0004174672067165375, -0.00040458887815475464, -0.0003917105495929718, -0.00037883222103118896, -0.00036595389246940613, -0.0003530755639076233, -0.00034019723534584045, -0.0003273189067840576, -0.0003144405782222748, -0.00030156224966049194, -0.0002886839210987091, -0.00027580559253692627, -0.00026292726397514343, -0.0002500489354133606, -0.00023717060685157776, -0.00022429227828979492, -0.00021141394972801208, -0.00019853562116622925, -0.0001856572926044464, -0.00017277896404266357, -0.00015990063548088074, -0.0001470223069190979, -0.00013414397835731506, -0.00012126564979553223, -0.00010838732123374939, -9.550899267196655e-05, -8.263066411018372e-05, -6.975233554840088e-05, -5.687400698661804e-05, -4.3995678424835205e-05, -3.111734986305237e-05, -1.823902130126953e-05, -5.360692739486694e-06, 7.517635822296143e-06, 2.039596438407898e-05, 3.3274292945861816e-05, 4.615262150764465e-05, 5.903095006942749e-05, 7.190927863121033e-05, 8.478760719299316e-05, 9.7665935754776e-05, 0.00011054426431655884, 0.00012342259287834167, 0.0001363009214401245, 0.00014917925000190735, 0.00016205757856369019, 0.00017493590712547302, 0.00018781423568725586, 0.0002006925642490387, 0.00021357089281082153, 0.00022644922137260437, 0.0002393275499343872, 0.00025220587849617004, 0.0002650842070579529, 0.0002779625356197357, 0.00029084086418151855, 0.0003037191927433014, 0.00031659752130508423, 0.00032947584986686707, 0.0003423541784286499, 0.00035523250699043274, 0.0003681108355522156, 0.0003809891641139984, 0.00039386749267578125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 7.0, 2.0, 3.0, 10.0, 14.0, 22.0, 21.0, 34.0, 49.0, 73.0, 107.0, 192.0, 342.0, 629.0, 1455.0, 3837.0, 15630.0, 182241.0, 788551.0, 43851.0, 7118.0, 2297.0, 923.0, 472.0, 233.0, 131.0, 91.0, 63.0, 31.0, 30.0, 21.0, 17.0, 15.0, 13.0, 11.0, 3.0, 3.0, 8.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.19921875, -1.159576416015625, -1.11993408203125, -1.080291748046875, -1.0406494140625, -1.001007080078125, -0.96136474609375, -0.921722412109375, -0.882080078125, -0.842437744140625, -0.80279541015625, -0.763153076171875, -0.7235107421875, -0.683868408203125, -0.64422607421875, -0.604583740234375, -0.56494140625, -0.525299072265625, -0.48565673828125, -0.446014404296875, -0.4063720703125, -0.366729736328125, -0.32708740234375, -0.287445068359375, -0.247802734375, -0.208160400390625, -0.16851806640625, -0.128875732421875, -0.0892333984375, -0.049591064453125, -0.00994873046875, 0.029693603515625, 0.0693359375, 0.108978271484375, 0.14862060546875, 0.188262939453125, 0.2279052734375, 0.267547607421875, 0.30718994140625, 0.346832275390625, 0.386474609375, 0.426116943359375, 0.46575927734375, 0.505401611328125, 0.5450439453125, 0.584686279296875, 0.62432861328125, 0.663970947265625, 0.70361328125, 0.743255615234375, 0.78289794921875, 0.822540283203125, 0.8621826171875, 0.901824951171875, 0.94146728515625, 0.981109619140625, 1.020751953125, 1.060394287109375, 1.10003662109375, 1.139678955078125, 1.1793212890625, 1.218963623046875, 1.25860595703125, 1.298248291015625, 1.337890625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 6.0, 9.0, 9.0, 8.0, 16.0, 20.0, 23.0, 38.0, 50.0, 56.0, 99.0, 103.0, 113.0, 118.0, 80.0, 63.0, 50.0, 27.0, 25.0, 20.0, 18.0, 15.0, 7.0, 10.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.89111328125, -0.8587417602539062, -0.8263702392578125, -0.7939987182617188, -0.761627197265625, -0.7292556762695312, -0.6968841552734375, -0.6645126342773438, -0.63214111328125, -0.5997695922851562, -0.5673980712890625, -0.5350265502929688, -0.502655029296875, -0.47028350830078125, -0.4379119873046875, -0.40554046630859375, -0.3731689453125, -0.34079742431640625, -0.3084259033203125, -0.27605438232421875, -0.243682861328125, -0.21131134033203125, -0.1789398193359375, -0.14656829833984375, -0.11419677734375, -0.08182525634765625, -0.0494537353515625, -0.01708221435546875, 0.015289306640625, 0.04766082763671875, 0.0800323486328125, 0.11240386962890625, 0.144775390625, 0.17714691162109375, 0.2095184326171875, 0.24188995361328125, 0.274261474609375, 0.30663299560546875, 0.3390045166015625, 0.37137603759765625, 0.40374755859375, 0.43611907958984375, 0.4684906005859375, 0.5008621215820312, 0.533233642578125, 0.5656051635742188, 0.5979766845703125, 0.6303482055664062, 0.6627197265625, 0.6950912475585938, 0.7274627685546875, 0.7598342895507812, 0.792205810546875, 0.8245773315429688, 0.8569488525390625, 0.8893203735351562, 0.92169189453125, 0.9540634155273438, 0.9864349365234375, 1.0188064575195312, 1.051177978515625, 1.0835494995117188, 1.1159210205078125, 1.1482925415039062, 1.1806640625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 6.0, 9.0, 10.0, 20.0, 67.0, 163.0, 368.0, 237.0, 77.0, 24.0, 10.0, 5.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.52988624572754, -30.434688568115234, -29.33949089050293, -28.244293212890625, -27.14909553527832, -26.053897857666016, -24.958702087402344, -23.863502502441406, -22.768306732177734, -21.67310905456543, -20.577911376953125, -19.48271369934082, -18.387516021728516, -17.29231834411621, -16.197120666503906, -15.101923942565918, -14.006725311279297, -12.911527633666992, -11.816329956054688, -10.721132278442383, -9.625934600830078, -8.530736923217773, -7.435540199279785, -6.3403425216674805, -5.245144844055176, -4.149947166442871, -3.0547497272491455, -1.95955228805542, -0.8643546104431152, 0.23084306716918945, 1.326040267944336, 2.4212379455566406, 3.516437530517578, 4.611635208129883, 5.7068328857421875, 6.802030086517334, 7.897227764129639, 8.992425918579102, 10.08762264251709, 11.182820320129395, 12.2780179977417, 13.373215675354004, 14.468413352966309, 15.563610076904297, 16.6588077545166, 17.754005432128906, 18.84920310974121, 19.944400787353516, 21.03959846496582, 22.134796142578125, 23.22999382019043, 24.325191497802734, 25.42038917541504, 26.515586853027344, 27.610782623291016, 28.705982208251953, 29.801177978515625, 30.89637565612793, 31.991573333740234, 33.086769104003906, 34.181968688964844, 35.277164459228516, 36.37236404418945, 37.467559814453125, 38.56275939941406]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 6.0, 3.0, 6.0, 7.0, 11.0, 11.0, 16.0, 12.0, 21.0, 22.0, 21.0, 33.0, 44.0, 43.0, 33.0, 49.0, 73.0, 89.0, 82.0, 63.0, 50.0, 47.0, 32.0, 42.0, 29.0, 26.0, 30.0, 19.0, 11.0, 13.0, 14.0, 11.0, 3.0, 8.0, 2.0, 5.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-14.790928840637207, -14.369871139526367, -13.948813438415527, -13.527755737304688, -13.106697082519531, -12.685639381408691, -12.264581680297852, -11.843523979187012, -11.422466278076172, -11.001408576965332, -10.580350875854492, -10.159292221069336, -9.738234519958496, -9.317176818847656, -8.896119117736816, -8.475061416625977, -8.05400276184082, -7.6329450607299805, -7.211886882781982, -6.790829181671143, -6.3697710037231445, -5.948713302612305, -5.527655601501465, -5.106597900390625, -4.685539722442627, -4.264482021331787, -3.843423843383789, -3.422366142272949, -3.0013082027435303, -2.5802502632141113, -2.1591925621032715, -1.7381346225738525, -1.31707763671875, -0.8960197567939758, -0.47496187686920166, -0.053904056549072266, 0.3671538829803467, 0.7882118225097656, 1.2092695236206055, 1.6303274631500244, 2.0513854026794434, 2.4724433422088623, 2.8935012817382812, 3.314558982849121, 3.73561692237854, 4.156674861907959, 4.577732563018799, 4.998790740966797, 5.419848442077637, 5.840906143188477, 6.261964321136475, 6.6830220222473145, 7.1040802001953125, 7.525137901306152, 7.946195602416992, 8.367253303527832, 8.788311004638672, 9.209368705749512, 9.630426406860352, 10.051485061645508, 10.472542762756348, 10.893600463867188, 11.314658164978027, 11.735715866088867, 12.156774520874023]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 3.0, 3.0, 11.0, 9.0, 7.0, 13.0, 17.0, 33.0, 70.0, 111.0, 245.0, 556.0, 1806.0, 7198.0, 43225.0, 1911442.0, 2171802.0, 46487.0, 7854.0, 2155.0, 705.0, 244.0, 117.0, 60.0, 36.0, 22.0, 18.0, 4.0, 9.0, 7.0, 1.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.771484375, -2.698577880859375, -2.62567138671875, -2.552764892578125, -2.4798583984375, -2.406951904296875, -2.33404541015625, -2.261138916015625, -2.188232421875, -2.115325927734375, -2.04241943359375, -1.969512939453125, -1.8966064453125, -1.823699951171875, -1.75079345703125, -1.677886962890625, -1.60498046875, -1.532073974609375, -1.45916748046875, -1.386260986328125, -1.3133544921875, -1.240447998046875, -1.16754150390625, -1.094635009765625, -1.021728515625, -0.948822021484375, -0.87591552734375, -0.803009033203125, -0.7301025390625, -0.657196044921875, -0.58428955078125, -0.511383056640625, -0.4384765625, -0.365570068359375, -0.29266357421875, -0.219757080078125, -0.1468505859375, -0.073944091796875, -0.00103759765625, 0.071868896484375, 0.144775390625, 0.217681884765625, 0.29058837890625, 0.363494873046875, 0.4364013671875, 0.509307861328125, 0.58221435546875, 0.655120849609375, 0.72802734375, 0.800933837890625, 0.87384033203125, 0.946746826171875, 1.0196533203125, 1.092559814453125, 1.16546630859375, 1.238372802734375, 1.311279296875, 1.384185791015625, 1.45709228515625, 1.529998779296875, 1.6029052734375, 1.675811767578125, 1.74871826171875, 1.821624755859375, 1.89453125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 4.0, 8.0, 6.0, 9.0, 10.0, 22.0, 35.0, 41.0, 32.0, 57.0, 65.0, 80.0, 88.0, 96.0, 60.0, 68.0, 70.0, 69.0, 47.0, 38.0, 31.0, 27.0, 17.0, 11.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.5009765625, -1.4665298461914062, -1.4320831298828125, -1.3976364135742188, -1.363189697265625, -1.3287429809570312, -1.2942962646484375, -1.2598495483398438, -1.22540283203125, -1.1909561157226562, -1.1565093994140625, -1.1220626831054688, -1.087615966796875, -1.0531692504882812, -1.0187225341796875, -0.9842758178710938, -0.9498291015625, -0.9153823852539062, -0.8809356689453125, -0.8464889526367188, -0.812042236328125, -0.7775955200195312, -0.7431488037109375, -0.7087020874023438, -0.67425537109375, -0.6398086547851562, -0.6053619384765625, -0.5709152221679688, -0.536468505859375, -0.5020217895507812, -0.4675750732421875, -0.43312835693359375, -0.398681640625, -0.36423492431640625, -0.3297882080078125, -0.29534149169921875, -0.260894775390625, -0.22644805908203125, -0.1920013427734375, -0.15755462646484375, -0.12310791015625, -0.08866119384765625, -0.0542144775390625, -0.01976776123046875, 0.014678955078125, 0.04912567138671875, 0.0835723876953125, 0.11801910400390625, 0.1524658203125, 0.18691253662109375, 0.2213592529296875, 0.25580596923828125, 0.290252685546875, 0.32469940185546875, 0.3591461181640625, 0.39359283447265625, 0.42803955078125, 0.46248626708984375, 0.4969329833984375, 0.5313796997070312, 0.565826416015625, 0.6002731323242188, 0.6347198486328125, 0.6691665649414062, 0.70361328125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 5.0, 11.0, 13.0, 13.0, 15.0, 12.0, 26.0, 45.0, 78.0, 117.0, 186.0, 380.0, 899.0, 2356.0, 8537.0, 48768.0, 2318152.0, 1754052.0, 46883.0, 8913.0, 2715.0, 1061.0, 471.0, 246.0, 101.0, 64.0, 53.0, 31.0, 15.0, 14.0, 20.0, 9.0, 4.0, 2.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.6875, -2.600738525390625, -2.51397705078125, -2.427215576171875, -2.3404541015625, -2.253692626953125, -2.16693115234375, -2.080169677734375, -1.993408203125, -1.906646728515625, -1.81988525390625, -1.733123779296875, -1.6463623046875, -1.559600830078125, -1.47283935546875, -1.386077880859375, -1.29931640625, -1.212554931640625, -1.12579345703125, -1.039031982421875, -0.9522705078125, -0.865509033203125, -0.77874755859375, -0.691986083984375, -0.605224609375, -0.518463134765625, -0.43170166015625, -0.344940185546875, -0.2581787109375, -0.171417236328125, -0.08465576171875, 0.002105712890625, 0.0888671875, 0.175628662109375, 0.26239013671875, 0.349151611328125, 0.4359130859375, 0.522674560546875, 0.60943603515625, 0.696197509765625, 0.782958984375, 0.869720458984375, 0.95648193359375, 1.043243408203125, 1.1300048828125, 1.216766357421875, 1.30352783203125, 1.390289306640625, 1.47705078125, 1.563812255859375, 1.65057373046875, 1.737335205078125, 1.8240966796875, 1.910858154296875, 1.99761962890625, 2.084381103515625, 2.171142578125, 2.257904052734375, 2.34466552734375, 2.431427001953125, 2.5181884765625, 2.604949951171875, 2.69171142578125, 2.778472900390625, 2.865234375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 9.0, 17.0, 19.0, 24.0, 27.0, 74.0, 108.0, 265.0, 531.0, 1080.0, 1007.0, 405.0, 187.0, 120.0, 59.0, 30.0, 25.0, 16.0, 17.0, 12.0, 1.0, 7.0, 6.0, 4.0, 12.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.234375, -2.154266357421875, -2.07415771484375, -1.994049072265625, -1.9139404296875, -1.833831787109375, -1.75372314453125, -1.673614501953125, -1.593505859375, -1.513397216796875, -1.43328857421875, -1.353179931640625, -1.2730712890625, -1.192962646484375, -1.11285400390625, -1.032745361328125, -0.95263671875, -0.872528076171875, -0.79241943359375, -0.712310791015625, -0.6322021484375, -0.552093505859375, -0.47198486328125, -0.391876220703125, -0.311767578125, -0.231658935546875, -0.15155029296875, -0.071441650390625, 0.0086669921875, 0.088775634765625, 0.16888427734375, 0.248992919921875, 0.3291015625, 0.409210205078125, 0.48931884765625, 0.569427490234375, 0.6495361328125, 0.729644775390625, 0.80975341796875, 0.889862060546875, 0.969970703125, 1.050079345703125, 1.13018798828125, 1.210296630859375, 1.2904052734375, 1.370513916015625, 1.45062255859375, 1.530731201171875, 1.61083984375, 1.690948486328125, 1.77105712890625, 1.851165771484375, 1.9312744140625, 2.011383056640625, 2.09149169921875, 2.171600341796875, 2.251708984375, 2.331817626953125, 2.41192626953125, 2.492034912109375, 2.5721435546875, 2.652252197265625, 2.73236083984375, 2.812469482421875, 2.892578125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 13.0, 8.0, 28.0, 121.0, 311.0, 322.0, 129.0, 38.0, 13.0, 6.0, 3.0, 4.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.79423713684082, -30.83261489868164, -29.870990753173828, -28.90936851501465, -27.94774627685547, -26.98612403869629, -26.02450180053711, -25.062877655029297, -24.101255416870117, -23.139633178710938, -22.178009033203125, -21.216386795043945, -20.254764556884766, -19.293142318725586, -18.331520080566406, -17.369895935058594, -16.408273696899414, -15.446651458740234, -14.485028266906738, -13.523405075073242, -12.561782836914062, -11.600160598754883, -10.638537406921387, -9.67691421508789, -8.715291976928711, -7.753669261932373, -6.792046546936035, -5.830423831939697, -4.868801116943359, -3.9071784019470215, -2.9455556869506836, -1.9839329719543457, -1.0223121643066406, -0.060689449310302734, 0.9009332656860352, 1.862555980682373, 2.824178695678711, 3.785801410675049, 4.747424125671387, 5.709046840667725, 6.6706695556640625, 7.6322922706604, 8.593914985656738, 9.555538177490234, 10.517160415649414, 11.478782653808594, 12.44040584564209, 13.402029037475586, 14.363651275634766, 15.325273513793945, 16.286895751953125, 17.248519897460938, 18.210142135620117, 19.171764373779297, 20.13338851928711, 21.09501075744629, 22.05663299560547, 23.01825523376465, 23.979877471923828, 24.94150161743164, 25.90312385559082, 26.86474609375, 27.826370239257812, 28.787992477416992, 29.749614715576172]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 14.0, 9.0, 17.0, 14.0, 21.0, 22.0, 48.0, 40.0, 49.0, 56.0, 55.0, 60.0, 70.0, 73.0, 73.0, 63.0, 53.0, 52.0, 44.0, 46.0, 32.0, 22.0, 22.0, 9.0, 9.0, 8.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.723822593688965, -10.338404655456543, -9.952986717224121, -9.567567825317383, -9.182149887084961, -8.796731948852539, -8.411314010620117, -8.025896072387695, -7.640477180480957, -7.255059242248535, -6.869640827178955, -6.484222888946533, -6.098804473876953, -5.713386535644531, -5.327968597412109, -4.942550182342529, -4.557132244110107, -4.1717143058776855, -3.7862958908081055, -3.4008779525756836, -3.0154595375061035, -2.6300415992736816, -2.2446234226226807, -1.8592052459716797, -1.4737870693206787, -1.0883688926696777, -0.7029507756233215, -0.31753265857696533, 0.06788551807403564, 0.4533036947250366, 0.838721752166748, 1.224139928817749, 1.60955810546875, 1.994976282119751, 2.380394458770752, 2.765812397003174, 3.151230812072754, 3.536648750305176, 3.9220669269561768, 4.307485103607178, 4.692903518676758, 5.07832145690918, 5.46373987197876, 5.849157810211182, 6.234576225280762, 6.619994163513184, 7.0054121017456055, 7.3908305168151855, 7.776248455047607, 8.161666870117188, 8.54708480834961, 8.932502746582031, 9.317920684814453, 9.703339576721191, 10.088757514953613, 10.474175453186035, 10.859593391418457, 11.245011329650879, 11.6304292678833, 12.015848159790039, 12.401266098022461, 12.786684036254883, 13.172101974487305, 13.557519912719727, 13.942938804626465]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 6.0, 5.0, 8.0, 11.0, 10.0, 19.0, 25.0, 42.0, 74.0, 146.0, 249.0, 481.0, 1095.0, 2686.0, 7348.0, 27181.0, 165786.0, 618004.0, 183295.0, 29149.0, 7981.0, 2742.0, 1084.0, 512.0, 267.0, 138.0, 73.0, 32.0, 29.0, 30.0, 9.0, 8.0, 10.0, 10.0, 2.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6884765625, -1.63128662109375, -1.5740966796875, -1.51690673828125, -1.459716796875, -1.40252685546875, -1.3453369140625, -1.28814697265625, -1.23095703125, -1.17376708984375, -1.1165771484375, -1.05938720703125, -1.002197265625, -0.94500732421875, -0.8878173828125, -0.83062744140625, -0.7734375, -0.71624755859375, -0.6590576171875, -0.60186767578125, -0.544677734375, -0.48748779296875, -0.4302978515625, -0.37310791015625, -0.31591796875, -0.25872802734375, -0.2015380859375, -0.14434814453125, -0.087158203125, -0.02996826171875, 0.0272216796875, 0.08441162109375, 0.1416015625, 0.19879150390625, 0.2559814453125, 0.31317138671875, 0.370361328125, 0.42755126953125, 0.4847412109375, 0.54193115234375, 0.59912109375, 0.65631103515625, 0.7135009765625, 0.77069091796875, 0.827880859375, 0.88507080078125, 0.9422607421875, 0.99945068359375, 1.056640625, 1.11383056640625, 1.1710205078125, 1.22821044921875, 1.285400390625, 1.34259033203125, 1.3997802734375, 1.45697021484375, 1.51416015625, 1.57135009765625, 1.6285400390625, 1.68572998046875, 1.742919921875, 1.80010986328125, 1.8572998046875, 1.91448974609375, 1.9716796875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 11.0, 4.0, 12.0, 19.0, 34.0, 34.0, 42.0, 46.0, 60.0, 91.0, 78.0, 73.0, 80.0, 82.0, 92.0, 70.0, 33.0, 41.0, 27.0, 26.0, 16.0, 11.0, 7.0, 3.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.6396484375, -1.6029586791992188, -1.5662689208984375, -1.5295791625976562, -1.492889404296875, -1.4561996459960938, -1.4195098876953125, -1.3828201293945312, -1.34613037109375, -1.3094406127929688, -1.2727508544921875, -1.2360610961914062, -1.199371337890625, -1.1626815795898438, -1.1259918212890625, -1.0893020629882812, -1.0526123046875, -1.0159225463867188, -0.9792327880859375, -0.9425430297851562, -0.905853271484375, -0.8691635131835938, -0.8324737548828125, -0.7957839965820312, -0.75909423828125, -0.7224044799804688, -0.6857147216796875, -0.6490249633789062, -0.612335205078125, -0.5756454467773438, -0.5389556884765625, -0.5022659301757812, -0.465576171875, -0.42888641357421875, -0.3921966552734375, -0.35550689697265625, -0.318817138671875, -0.28212738037109375, -0.2454376220703125, -0.20874786376953125, -0.17205810546875, -0.13536834716796875, -0.0986785888671875, -0.06198883056640625, -0.025299072265625, 0.01139068603515625, 0.0480804443359375, 0.08477020263671875, 0.1214599609375, 0.15814971923828125, 0.1948394775390625, 0.23152923583984375, 0.268218994140625, 0.30490875244140625, 0.3415985107421875, 0.37828826904296875, 0.41497802734375, 0.45166778564453125, 0.4883575439453125, 0.5250473022460938, 0.561737060546875, 0.5984268188476562, 0.6351165771484375, 0.6718063354492188, 0.70849609375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 7.0, 6.0, 13.0, 11.0, 16.0, 22.0, 38.0, 76.0, 112.0, 205.0, 363.0, 984.0, 3084.0, 14899.0, 194113.0, 779740.0, 45854.0, 6143.0, 1614.0, 588.0, 261.0, 142.0, 83.0, 67.0, 43.0, 26.0, 18.0, 6.0, 5.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.01953125, -1.936248779296875, -1.85296630859375, -1.769683837890625, -1.6864013671875, -1.603118896484375, -1.51983642578125, -1.436553955078125, -1.353271484375, -1.269989013671875, -1.18670654296875, -1.103424072265625, -1.0201416015625, -0.936859130859375, -0.85357666015625, -0.770294189453125, -0.68701171875, -0.603729248046875, -0.52044677734375, -0.437164306640625, -0.3538818359375, -0.270599365234375, -0.18731689453125, -0.104034423828125, -0.020751953125, 0.062530517578125, 0.14581298828125, 0.229095458984375, 0.3123779296875, 0.395660400390625, 0.47894287109375, 0.562225341796875, 0.6455078125, 0.728790283203125, 0.81207275390625, 0.895355224609375, 0.9786376953125, 1.061920166015625, 1.14520263671875, 1.228485107421875, 1.311767578125, 1.395050048828125, 1.47833251953125, 1.561614990234375, 1.6448974609375, 1.728179931640625, 1.81146240234375, 1.894744873046875, 1.97802734375, 2.061309814453125, 2.14459228515625, 2.227874755859375, 2.3111572265625, 2.394439697265625, 2.47772216796875, 2.561004638671875, 2.644287109375, 2.727569580078125, 2.81085205078125, 2.894134521484375, 2.9774169921875, 3.060699462890625, 3.14398193359375, 3.227264404296875, 3.310546875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 7.0, 9.0, 10.0, 14.0, 19.0, 27.0, 23.0, 24.0, 25.0, 45.0, 43.0, 51.0, 50.0, 73.0, 53.0, 70.0, 53.0, 69.0, 48.0, 43.0, 51.0, 39.0, 32.0, 19.0, 33.0, 22.0, 7.0, 15.0, 6.0, 4.0, 8.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.484375, -2.386810302734375, -2.28924560546875, -2.191680908203125, -2.0941162109375, -1.996551513671875, -1.89898681640625, -1.801422119140625, -1.703857421875, -1.606292724609375, -1.50872802734375, -1.411163330078125, -1.3135986328125, -1.216033935546875, -1.11846923828125, -1.020904541015625, -0.92333984375, -0.825775146484375, -0.72821044921875, -0.630645751953125, -0.5330810546875, -0.435516357421875, -0.33795166015625, -0.240386962890625, -0.142822265625, -0.045257568359375, 0.05230712890625, 0.149871826171875, 0.2474365234375, 0.345001220703125, 0.44256591796875, 0.540130615234375, 0.6376953125, 0.735260009765625, 0.83282470703125, 0.930389404296875, 1.0279541015625, 1.125518798828125, 1.22308349609375, 1.320648193359375, 1.418212890625, 1.515777587890625, 1.61334228515625, 1.710906982421875, 1.8084716796875, 1.906036376953125, 2.00360107421875, 2.101165771484375, 2.19873046875, 2.296295166015625, 2.39385986328125, 2.491424560546875, 2.5889892578125, 2.686553955078125, 2.78411865234375, 2.881683349609375, 2.979248046875, 3.076812744140625, 3.17437744140625, 3.271942138671875, 3.3695068359375, 3.467071533203125, 3.56463623046875, 3.662200927734375, 3.759765625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 6.0, 0.0, 8.0, 17.0, 14.0, 22.0, 22.0, 37.0, 61.0, 88.0, 114.0, 184.0, 396.0, 823.0, 1786.0, 4546.0, 14047.0, 56570.0, 331096.0, 548050.0, 66149.0, 15711.0, 4999.0, 1892.0, 861.0, 441.0, 231.0, 136.0, 73.0, 57.0, 32.0, 29.0, 13.0, 17.0, 7.0, 7.0, 8.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.5478515625, -0.5296173095703125, -0.511383056640625, -0.4931488037109375, -0.47491455078125, -0.4566802978515625, -0.438446044921875, -0.4202117919921875, -0.4019775390625, -0.3837432861328125, -0.365509033203125, -0.3472747802734375, -0.32904052734375, -0.3108062744140625, -0.292572021484375, -0.2743377685546875, -0.256103515625, -0.2378692626953125, -0.219635009765625, -0.2014007568359375, -0.18316650390625, -0.1649322509765625, -0.146697998046875, -0.1284637451171875, -0.1102294921875, -0.0919952392578125, -0.073760986328125, -0.0555267333984375, -0.03729248046875, -0.0190582275390625, -0.000823974609375, 0.0174102783203125, 0.03564453125, 0.0538787841796875, 0.072113037109375, 0.0903472900390625, 0.10858154296875, 0.1268157958984375, 0.145050048828125, 0.1632843017578125, 0.1815185546875, 0.1997528076171875, 0.217987060546875, 0.2362213134765625, 0.25445556640625, 0.2726898193359375, 0.290924072265625, 0.3091583251953125, 0.327392578125, 0.3456268310546875, 0.363861083984375, 0.3820953369140625, 0.40032958984375, 0.4185638427734375, 0.436798095703125, 0.4550323486328125, 0.4732666015625, 0.4915008544921875, 0.509735107421875, 0.5279693603515625, 0.54620361328125, 0.5644378662109375, 0.582672119140625, 0.6009063720703125, 0.619140625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 7.0, 0.0, 8.0, 9.0, 5.0, 4.0, 8.0, 10.0, 18.0, 28.0, 50.0, 57.0, 74.0, 96.0, 98.0, 140.0, 106.0, 87.0, 53.0, 40.0, 27.0, 16.0, 12.0, 12.0, 13.0, 7.0, 8.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015652179718017578, -0.00015220511704683304, -0.0001478884369134903, -0.00014357175678014755, -0.0001392550766468048, -0.00013493839651346207, -0.00013062171638011932, -0.00012630503624677658, -0.00012198835611343384, -0.0001176716759800911, -0.00011335499584674835, -0.00010903831571340561, -0.00010472163558006287, -0.00010040495544672012, -9.608827531337738e-05, -9.177159518003464e-05, -8.74549150466919e-05, -8.313823491334915e-05, -7.882155478000641e-05, -7.450487464666367e-05, -7.018819451332092e-05, -6.587151437997818e-05, -6.155483424663544e-05, -5.7238154113292694e-05, -5.292147397994995e-05, -4.860479384660721e-05, -4.4288113713264465e-05, -3.997143357992172e-05, -3.565475344657898e-05, -3.1338073313236237e-05, -2.7021393179893494e-05, -2.270471304655075e-05, -1.8388032913208008e-05, -1.4071352779865265e-05, -9.754672646522522e-06, -5.437992513179779e-06, -1.1213123798370361e-06, 3.1953677535057068e-06, 7.51204788684845e-06, 1.1828728020191193e-05, 1.6145408153533936e-05, 2.046208828687668e-05, 2.477876842021942e-05, 2.9095448553562164e-05, 3.341212868690491e-05, 3.772880882024765e-05, 4.204548895359039e-05, 4.6362169086933136e-05, 5.067884922027588e-05, 5.499552935361862e-05, 5.9312209486961365e-05, 6.362888962030411e-05, 6.794556975364685e-05, 7.22622498869896e-05, 7.657893002033234e-05, 8.089561015367508e-05, 8.521229028701782e-05, 8.952897042036057e-05, 9.384565055370331e-05, 9.816233068704605e-05, 0.0001024790108203888, 0.00010679569095373154, 0.00011111237108707428, 0.00011542905122041702, 0.00011974573135375977]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 8.0, 10.0, 10.0, 20.0, 18.0, 43.0, 76.0, 105.0, 137.0, 282.0, 593.0, 1283.0, 3217.0, 11070.0, 64445.0, 680651.0, 246271.0, 29847.0, 6535.0, 2081.0, 860.0, 398.0, 240.0, 131.0, 82.0, 50.0, 28.0, 21.0, 11.0, 3.0, 12.0, 8.0, 2.0, 6.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.876953125, -0.8517532348632812, -0.8265533447265625, -0.8013534545898438, -0.776153564453125, -0.7509536743164062, -0.7257537841796875, -0.7005538940429688, -0.67535400390625, -0.6501541137695312, -0.6249542236328125, -0.5997543334960938, -0.574554443359375, -0.5493545532226562, -0.5241546630859375, -0.49895477294921875, -0.4737548828125, -0.44855499267578125, -0.4233551025390625, -0.39815521240234375, -0.372955322265625, -0.34775543212890625, -0.3225555419921875, -0.29735565185546875, -0.27215576171875, -0.24695587158203125, -0.2217559814453125, -0.19655609130859375, -0.171356201171875, -0.14615631103515625, -0.1209564208984375, -0.09575653076171875, -0.070556640625, -0.04535675048828125, -0.0201568603515625, 0.00504302978515625, 0.030242919921875, 0.05544281005859375, 0.0806427001953125, 0.10584259033203125, 0.13104248046875, 0.15624237060546875, 0.1814422607421875, 0.20664215087890625, 0.231842041015625, 0.25704193115234375, 0.2822418212890625, 0.30744171142578125, 0.3326416015625, 0.35784149169921875, 0.3830413818359375, 0.40824127197265625, 0.433441162109375, 0.45864105224609375, 0.4838409423828125, 0.5090408325195312, 0.53424072265625, 0.5594406127929688, 0.5846405029296875, 0.6098403930664062, 0.635040283203125, 0.6602401733398438, 0.6854400634765625, 0.7106399536132812, 0.73583984375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 7.0, 2.0, 4.0, 5.0, 18.0, 10.0, 24.0, 25.0, 41.0, 54.0, 61.0, 88.0, 105.0, 93.0, 91.0, 72.0, 81.0, 69.0, 44.0, 34.0, 22.0, 18.0, 12.0, 9.0, 3.0, 0.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.498046875, -0.4770050048828125, -0.455963134765625, -0.4349212646484375, -0.41387939453125, -0.3928375244140625, -0.371795654296875, -0.3507537841796875, -0.3297119140625, -0.3086700439453125, -0.287628173828125, -0.2665863037109375, -0.24554443359375, -0.2245025634765625, -0.203460693359375, -0.1824188232421875, -0.161376953125, -0.1403350830078125, -0.119293212890625, -0.0982513427734375, -0.07720947265625, -0.0561676025390625, -0.035125732421875, -0.0140838623046875, 0.0069580078125, 0.0279998779296875, 0.049041748046875, 0.0700836181640625, 0.09112548828125, 0.1121673583984375, 0.133209228515625, 0.1542510986328125, 0.17529296875, 0.1963348388671875, 0.217376708984375, 0.2384185791015625, 0.25946044921875, 0.2805023193359375, 0.301544189453125, 0.3225860595703125, 0.3436279296875, 0.3646697998046875, 0.385711669921875, 0.4067535400390625, 0.42779541015625, 0.4488372802734375, 0.469879150390625, 0.4909210205078125, 0.511962890625, 0.5330047607421875, 0.554046630859375, 0.5750885009765625, 0.59613037109375, 0.6171722412109375, 0.638214111328125, 0.6592559814453125, 0.6802978515625, 0.7013397216796875, 0.722381591796875, 0.7434234619140625, 0.76446533203125, 0.7855072021484375, 0.806549072265625, 0.8275909423828125, 0.8486328125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 11.0, 30.0, 68.0, 104.0, 223.0, 292.0, 130.0, 57.0, 35.0, 14.0, 9.0, 3.0, 6.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.372516632080078, -24.834980010986328, -24.297443389892578, -23.759906768798828, -23.222370147705078, -22.684833526611328, -22.147296905517578, -21.609758377075195, -21.072221755981445, -20.534685134887695, -19.997148513793945, -19.459611892700195, -18.922075271606445, -18.384536743164062, -17.847000122070312, -17.309463500976562, -16.771926879882812, -16.234390258789062, -15.696853637695312, -15.159317016601562, -14.621779441833496, -14.084242820739746, -13.546706199645996, -13.009169578552246, -12.471633911132812, -11.934097290039062, -11.396560668945312, -10.859024047851562, -10.321486473083496, -9.783949851989746, -9.246413230895996, -8.708876609802246, -8.17133903503418, -7.63380241394043, -7.0962653160095215, -6.5587286949157715, -6.021191596984863, -5.483654975891113, -4.946118354797363, -4.408581733703613, -3.871044635772705, -3.333507776260376, -2.795970916748047, -2.258434295654297, -1.7208974361419678, -1.1833605766296387, -0.6458239555358887, -0.10828709602355957, 0.42924976348876953, 0.9667865633964539, 1.5043233633041382, 2.0418601036071777, 2.579396963119507, 3.116933822631836, 3.654470443725586, 4.192007064819336, 4.729544162750244, 5.267080783843994, 5.804617881774902, 6.342154502868652, 6.879691123962402, 7.4172282218933105, 7.9547648429870605, 8.492301940917969, 9.029838562011719]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 9.0, 7.0, 5.0, 18.0, 29.0, 20.0, 18.0, 21.0, 26.0, 40.0, 36.0, 36.0, 50.0, 68.0, 99.0, 92.0, 65.0, 56.0, 45.0, 45.0, 33.0, 34.0, 30.0, 22.0, 24.0, 18.0, 11.0, 8.0, 8.0, 8.0, 11.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-13.636160850524902, -13.27888298034668, -12.921606063842773, -12.56432819366455, -12.207050323486328, -11.849772453308105, -11.492494583129883, -11.135217666625977, -10.777939796447754, -10.420661926269531, -10.063385009765625, -9.706107139587402, -9.34882926940918, -8.991551399230957, -8.634273529052734, -8.276996612548828, -7.9197187423706055, -7.562440872192383, -7.205163478851318, -6.847886085510254, -6.490608215332031, -6.133330345153809, -5.776052951812744, -5.41877555847168, -5.061497688293457, -4.704219818115234, -4.34694242477417, -3.9896647930145264, -3.632387161254883, -3.2751095294952393, -2.9178318977355957, -2.560554265975952, -2.203275680541992, -1.8459980487823486, -1.488720417022705, -1.1314427852630615, -0.774165153503418, -0.4168875217437744, -0.05960988998413086, 0.2976677417755127, 0.6549453735351562, 1.0122230052947998, 1.3695006370544434, 1.726778268814087, 2.0840559005737305, 2.441333532333374, 2.7986111640930176, 3.155888795852661, 3.5131664276123047, 3.8704440593719482, 4.227721691131592, 4.584999084472656, 4.942276954650879, 5.299554824829102, 5.656832218170166, 6.0141096115112305, 6.371387481689453, 6.728665351867676, 7.08594274520874, 7.443220138549805, 7.800498008728027, 8.15777587890625, 8.515052795410156, 8.872330665588379, 9.229608535766602]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 8.0, 16.0, 22.0, 33.0, 59.0, 148.0, 402.0, 1448.0, 6303.0, 49917.0, 3065244.0, 1037916.0, 27034.0, 4147.0, 1060.0, 328.0, 95.0, 40.0, 29.0, 14.0, 7.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.068359375, -1.999114990234375, -1.92987060546875, -1.860626220703125, -1.7913818359375, -1.722137451171875, -1.65289306640625, -1.583648681640625, -1.514404296875, -1.445159912109375, -1.37591552734375, -1.306671142578125, -1.2374267578125, -1.168182373046875, -1.09893798828125, -1.029693603515625, -0.96044921875, -0.891204833984375, -0.82196044921875, -0.752716064453125, -0.6834716796875, -0.614227294921875, -0.54498291015625, -0.475738525390625, -0.406494140625, -0.337249755859375, -0.26800537109375, -0.198760986328125, -0.1295166015625, -0.060272216796875, 0.00897216796875, 0.078216552734375, 0.1474609375, 0.216705322265625, 0.28594970703125, 0.355194091796875, 0.4244384765625, 0.493682861328125, 0.56292724609375, 0.632171630859375, 0.701416015625, 0.770660400390625, 0.83990478515625, 0.909149169921875, 0.9783935546875, 1.047637939453125, 1.11688232421875, 1.186126708984375, 1.25537109375, 1.324615478515625, 1.39385986328125, 1.463104248046875, 1.5323486328125, 1.601593017578125, 1.67083740234375, 1.740081787109375, 1.809326171875, 1.878570556640625, 1.94781494140625, 2.017059326171875, 2.0863037109375, 2.155548095703125, 2.22479248046875, 2.294036865234375, 2.36328125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 5.0, 4.0, 14.0, 14.0, 28.0, 35.0, 40.0, 51.0, 61.0, 84.0, 86.0, 94.0, 94.0, 84.0, 84.0, 62.0, 45.0, 36.0, 24.0, 25.0, 20.0, 2.0, 8.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.6240234375, -1.58770751953125, -1.5513916015625, -1.51507568359375, -1.478759765625, -1.44244384765625, -1.4061279296875, -1.36981201171875, -1.33349609375, -1.29718017578125, -1.2608642578125, -1.22454833984375, -1.188232421875, -1.15191650390625, -1.1156005859375, -1.07928466796875, -1.04296875, -1.00665283203125, -0.9703369140625, -0.93402099609375, -0.897705078125, -0.86138916015625, -0.8250732421875, -0.78875732421875, -0.75244140625, -0.71612548828125, -0.6798095703125, -0.64349365234375, -0.607177734375, -0.57086181640625, -0.5345458984375, -0.49822998046875, -0.4619140625, -0.42559814453125, -0.3892822265625, -0.35296630859375, -0.316650390625, -0.28033447265625, -0.2440185546875, -0.20770263671875, -0.17138671875, -0.13507080078125, -0.0987548828125, -0.06243896484375, -0.026123046875, 0.01019287109375, 0.0465087890625, 0.08282470703125, 0.119140625, 0.15545654296875, 0.1917724609375, 0.22808837890625, 0.264404296875, 0.30072021484375, 0.3370361328125, 0.37335205078125, 0.40966796875, 0.44598388671875, 0.4822998046875, 0.51861572265625, 0.554931640625, 0.59124755859375, 0.6275634765625, 0.66387939453125, 0.7001953125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 8.0, 9.0, 12.0, 18.0, 35.0, 84.0, 147.0, 377.0, 1508.0, 10977.0, 606253.0, 3547909.0, 23665.0, 2308.0, 576.0, 208.0, 87.0, 49.0, 23.0, 13.0, 5.0, 4.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.875, -3.758056640625, -3.64111328125, -3.524169921875, -3.4072265625, -3.290283203125, -3.17333984375, -3.056396484375, -2.939453125, -2.822509765625, -2.70556640625, -2.588623046875, -2.4716796875, -2.354736328125, -2.23779296875, -2.120849609375, -2.00390625, -1.886962890625, -1.77001953125, -1.653076171875, -1.5361328125, -1.419189453125, -1.30224609375, -1.185302734375, -1.068359375, -0.951416015625, -0.83447265625, -0.717529296875, -0.6005859375, -0.483642578125, -0.36669921875, -0.249755859375, -0.1328125, -0.015869140625, 0.10107421875, 0.218017578125, 0.3349609375, 0.451904296875, 0.56884765625, 0.685791015625, 0.802734375, 0.919677734375, 1.03662109375, 1.153564453125, 1.2705078125, 1.387451171875, 1.50439453125, 1.621337890625, 1.73828125, 1.855224609375, 1.97216796875, 2.089111328125, 2.2060546875, 2.322998046875, 2.43994140625, 2.556884765625, 2.673828125, 2.790771484375, 2.90771484375, 3.024658203125, 3.1416015625, 3.258544921875, 3.37548828125, 3.492431640625, 3.609375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 6.0, 8.0, 17.0, 12.0, 25.0, 39.0, 75.0, 150.0, 217.0, 549.0, 1106.0, 973.0, 412.0, 194.0, 108.0, 62.0, 39.0, 22.0, 21.0, 9.0, 11.0, 3.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.712890625, -2.6411895751953125, -2.569488525390625, -2.4977874755859375, -2.42608642578125, -2.3543853759765625, -2.282684326171875, -2.2109832763671875, -2.1392822265625, -2.0675811767578125, -1.995880126953125, -1.9241790771484375, -1.85247802734375, -1.7807769775390625, -1.709075927734375, -1.6373748779296875, -1.565673828125, -1.4939727783203125, -1.422271728515625, -1.3505706787109375, -1.27886962890625, -1.2071685791015625, -1.135467529296875, -1.0637664794921875, -0.9920654296875, -0.9203643798828125, -0.848663330078125, -0.7769622802734375, -0.70526123046875, -0.6335601806640625, -0.561859130859375, -0.4901580810546875, -0.41845703125, -0.3467559814453125, -0.275054931640625, -0.2033538818359375, -0.13165283203125, -0.0599517822265625, 0.011749267578125, 0.0834503173828125, 0.1551513671875, 0.2268524169921875, 0.298553466796875, 0.3702545166015625, 0.44195556640625, 0.5136566162109375, 0.585357666015625, 0.6570587158203125, 0.728759765625, 0.8004608154296875, 0.872161865234375, 0.9438629150390625, 1.01556396484375, 1.0872650146484375, 1.158966064453125, 1.2306671142578125, 1.3023681640625, 1.3740692138671875, 1.445770263671875, 1.5174713134765625, 1.58917236328125, 1.6608734130859375, 1.732574462890625, 1.8042755126953125, 1.8759765625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 11.0, 28.0, 97.0, 207.0, 310.0, 207.0, 79.0, 30.0, 17.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.83171844482422, -24.132568359375, -23.43341636657715, -22.73426628112793, -22.035114288330078, -21.33596420288086, -20.63681411743164, -19.937664031982422, -19.23851203918457, -18.53936195373535, -17.8402099609375, -17.14105987548828, -16.441909790039062, -15.742757797241211, -15.043607711791992, -14.344456672668457, -13.645305633544922, -12.946154594421387, -12.247003555297852, -11.547853469848633, -10.848702430725098, -10.149551391601562, -9.450401306152344, -8.751250267028809, -8.052099227905273, -7.352948188781738, -6.653797626495361, -5.954647064208984, -5.255496025085449, -4.556344985961914, -3.857194423675537, -3.15804386138916, -2.458892822265625, -1.759742021560669, -1.060591220855713, -0.36144042015075684, 0.3377103805541992, 1.0368611812591553, 1.7360119819641113, 2.4351625442504883, 3.1343135833740234, 3.8334643840789795, 4.5326151847839355, 5.2317657470703125, 5.930916786193848, 6.630067825317383, 7.32921838760376, 8.028368949890137, 8.727519989013672, 9.426671028137207, 10.125822067260742, 10.824972152709961, 11.524123191833496, 12.223274230957031, 12.92242431640625, 13.621575355529785, 14.32072639465332, 15.019877433776855, 15.71902847290039, 16.41817855834961, 17.117328643798828, 17.81648063659668, 18.5156307220459, 19.21478271484375, 19.91393280029297]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 3.0, 11.0, 3.0, 7.0, 9.0, 16.0, 13.0, 13.0, 30.0, 20.0, 28.0, 25.0, 31.0, 36.0, 45.0, 41.0, 46.0, 45.0, 54.0, 63.0, 58.0, 50.0, 52.0, 39.0, 36.0, 38.0, 26.0, 21.0, 15.0, 15.0, 24.0, 17.0, 12.0, 14.0, 6.0, 9.0, 9.0, 4.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.208372592926025, -5.996061325073242, -5.783749580383301, -5.571438312530518, -5.359126567840576, -5.146815299987793, -4.934503555297852, -4.722192287445068, -4.509881019592285, -4.297569751739502, -4.0852580070495605, -3.8729467391967773, -3.660634994506836, -3.4483237266540527, -3.2360122203826904, -3.023700714111328, -2.8113889694213867, -2.5990774631500244, -2.386765956878662, -2.174454689025879, -1.962143063545227, -1.7498315572738647, -1.537520170211792, -1.3252086639404297, -1.1128971576690674, -0.9005856513977051, -0.6882742047309875, -0.47596275806427, -0.2636512517929077, -0.05133974552154541, 0.16097164154052734, 0.37328314781188965, 0.5855951309204102, 0.7979066371917725, 1.0102181434631348, 1.2225295305252075, 1.4348410367965698, 1.6471525430679321, 1.8594639301300049, 2.071775436401367, 2.2840869426727295, 2.496398448944092, 2.708709955215454, 2.9210214614868164, 3.1333327293395996, 3.345644474029541, 3.557955741882324, 3.7702672481536865, 3.982578754425049, 4.194890022277832, 4.407201766967773, 4.619513034820557, 4.831824779510498, 5.044136047363281, 5.256447792053223, 5.468759059906006, 5.681070327758789, 5.893381595611572, 6.105693340301514, 6.318004608154297, 6.530316352844238, 6.7426276206970215, 6.954938888549805, 7.167250633239746, 7.3795623779296875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 7.0, 6.0, 10.0, 20.0, 28.0, 34.0, 59.0, 116.0, 180.0, 333.0, 671.0, 1544.0, 4083.0, 13745.0, 70110.0, 502157.0, 386160.0, 52175.0, 11043.0, 3409.0, 1351.0, 597.0, 287.0, 192.0, 95.0, 49.0, 30.0, 18.0, 16.0, 10.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.453125, -1.4010772705078125, -1.349029541015625, -1.2969818115234375, -1.24493408203125, -1.1928863525390625, -1.140838623046875, -1.0887908935546875, -1.0367431640625, -0.9846954345703125, -0.932647705078125, -0.8805999755859375, -0.82855224609375, -0.7765045166015625, -0.724456787109375, -0.6724090576171875, -0.620361328125, -0.5683135986328125, -0.516265869140625, -0.4642181396484375, -0.41217041015625, -0.3601226806640625, -0.308074951171875, -0.2560272216796875, -0.2039794921875, -0.1519317626953125, -0.099884033203125, -0.0478363037109375, 0.00421142578125, 0.0562591552734375, 0.108306884765625, 0.1603546142578125, 0.21240234375, 0.2644500732421875, 0.316497802734375, 0.3685455322265625, 0.42059326171875, 0.4726409912109375, 0.524688720703125, 0.5767364501953125, 0.6287841796875, 0.6808319091796875, 0.732879638671875, 0.7849273681640625, 0.83697509765625, 0.8890228271484375, 0.941070556640625, 0.9931182861328125, 1.045166015625, 1.0972137451171875, 1.149261474609375, 1.2013092041015625, 1.25335693359375, 1.3054046630859375, 1.357452392578125, 1.4095001220703125, 1.4615478515625, 1.5135955810546875, 1.565643310546875, 1.6176910400390625, 1.66973876953125, 1.7217864990234375, 1.773834228515625, 1.8258819580078125, 1.8779296875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 1.0, 10.0, 15.0, 22.0, 23.0, 32.0, 49.0, 46.0, 65.0, 84.0, 77.0, 92.0, 87.0, 100.0, 71.0, 47.0, 47.0, 31.0, 29.0, 28.0, 19.0, 11.0, 5.0, 8.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.626953125, -1.5906143188476562, -1.5542755126953125, -1.5179367065429688, -1.481597900390625, -1.4452590942382812, -1.4089202880859375, -1.3725814819335938, -1.33624267578125, -1.2999038696289062, -1.2635650634765625, -1.2272262573242188, -1.190887451171875, -1.1545486450195312, -1.1182098388671875, -1.0818710327148438, -1.0455322265625, -1.0091934204101562, -0.9728546142578125, -0.9365158081054688, -0.900177001953125, -0.8638381958007812, -0.8274993896484375, -0.7911605834960938, -0.75482177734375, -0.7184829711914062, -0.6821441650390625, -0.6458053588867188, -0.609466552734375, -0.5731277465820312, -0.5367889404296875, -0.5004501342773438, -0.464111328125, -0.42777252197265625, -0.3914337158203125, -0.35509490966796875, -0.318756103515625, -0.28241729736328125, -0.2460784912109375, -0.20973968505859375, -0.17340087890625, -0.13706207275390625, -0.1007232666015625, -0.06438446044921875, -0.028045654296875, 0.00829315185546875, 0.0446319580078125, 0.08097076416015625, 0.1173095703125, 0.15364837646484375, 0.1899871826171875, 0.22632598876953125, 0.262664794921875, 0.29900360107421875, 0.3353424072265625, 0.37168121337890625, 0.40802001953125, 0.44435882568359375, 0.4806976318359375, 0.5170364379882812, 0.553375244140625, 0.5897140502929688, 0.6260528564453125, 0.6623916625976562, 0.69873046875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 1.0, 7.0, 6.0, 15.0, 19.0, 12.0, 18.0, 40.0, 54.0, 90.0, 144.0, 219.0, 395.0, 892.0, 2438.0, 11048.0, 138580.0, 845923.0, 39948.0, 5647.0, 1604.0, 607.0, 317.0, 176.0, 106.0, 70.0, 48.0, 34.0, 23.0, 20.0, 21.0, 11.0, 6.0, 2.0, 7.0, 7.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.90625, -2.82391357421875, -2.7415771484375, -2.65924072265625, -2.576904296875, -2.49456787109375, -2.4122314453125, -2.32989501953125, -2.24755859375, -2.16522216796875, -2.0828857421875, -2.00054931640625, -1.918212890625, -1.83587646484375, -1.7535400390625, -1.67120361328125, -1.5888671875, -1.50653076171875, -1.4241943359375, -1.34185791015625, -1.259521484375, -1.17718505859375, -1.0948486328125, -1.01251220703125, -0.93017578125, -0.84783935546875, -0.7655029296875, -0.68316650390625, -0.600830078125, -0.51849365234375, -0.4361572265625, -0.35382080078125, -0.271484375, -0.18914794921875, -0.1068115234375, -0.02447509765625, 0.057861328125, 0.14019775390625, 0.2225341796875, 0.30487060546875, 0.38720703125, 0.46954345703125, 0.5518798828125, 0.63421630859375, 0.716552734375, 0.79888916015625, 0.8812255859375, 0.96356201171875, 1.0458984375, 1.12823486328125, 1.2105712890625, 1.29290771484375, 1.375244140625, 1.45758056640625, 1.5399169921875, 1.62225341796875, 1.70458984375, 1.78692626953125, 1.8692626953125, 1.95159912109375, 2.033935546875, 2.11627197265625, 2.1986083984375, 2.28094482421875, 2.36328125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 1.0, 8.0, 7.0, 4.0, 11.0, 11.0, 19.0, 25.0, 34.0, 52.0, 46.0, 62.0, 76.0, 96.0, 76.0, 84.0, 81.0, 75.0, 55.0, 46.0, 32.0, 29.0, 17.0, 20.0, 8.0, 7.0, 4.0, 3.0, 9.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.62890625, -4.506317138671875, -4.38372802734375, -4.261138916015625, -4.1385498046875, -4.015960693359375, -3.89337158203125, -3.770782470703125, -3.648193359375, -3.525604248046875, -3.40301513671875, -3.280426025390625, -3.1578369140625, -3.035247802734375, -2.91265869140625, -2.790069580078125, -2.66748046875, -2.544891357421875, -2.42230224609375, -2.299713134765625, -2.1771240234375, -2.054534912109375, -1.93194580078125, -1.809356689453125, -1.686767578125, -1.564178466796875, -1.44158935546875, -1.319000244140625, -1.1964111328125, -1.073822021484375, -0.95123291015625, -0.828643798828125, -0.7060546875, -0.583465576171875, -0.46087646484375, -0.338287353515625, -0.2156982421875, -0.093109130859375, 0.02947998046875, 0.152069091796875, 0.274658203125, 0.397247314453125, 0.51983642578125, 0.642425537109375, 0.7650146484375, 0.887603759765625, 1.01019287109375, 1.132781982421875, 1.25537109375, 1.377960205078125, 1.50054931640625, 1.623138427734375, 1.7457275390625, 1.868316650390625, 1.99090576171875, 2.113494873046875, 2.236083984375, 2.358673095703125, 2.48126220703125, 2.603851318359375, 2.7264404296875, 2.849029541015625, 2.97161865234375, 3.094207763671875, 3.216796875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 6.0, 8.0, 5.0, 8.0, 16.0, 33.0, 48.0, 74.0, 175.0, 371.0, 826.0, 2669.0, 10972.0, 90396.0, 877903.0, 53699.0, 7928.0, 2077.0, 727.0, 301.0, 138.0, 71.0, 49.0, 16.0, 12.0, 10.0, 5.0, 3.0, 4.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.91796875, -0.8896408081054688, -0.8613128662109375, -0.8329849243164062, -0.804656982421875, -0.7763290405273438, -0.7480010986328125, -0.7196731567382812, -0.69134521484375, -0.6630172729492188, -0.6346893310546875, -0.6063613891601562, -0.578033447265625, -0.5497055053710938, -0.5213775634765625, -0.49304962158203125, -0.4647216796875, -0.43639373779296875, -0.4080657958984375, -0.37973785400390625, -0.351409912109375, -0.32308197021484375, -0.2947540283203125, -0.26642608642578125, -0.23809814453125, -0.20977020263671875, -0.1814422607421875, -0.15311431884765625, -0.124786376953125, -0.09645843505859375, -0.0681304931640625, -0.03980255126953125, -0.011474609375, 0.01685333251953125, 0.0451812744140625, 0.07350921630859375, 0.101837158203125, 0.13016510009765625, 0.1584930419921875, 0.18682098388671875, 0.21514892578125, 0.24347686767578125, 0.2718048095703125, 0.30013275146484375, 0.328460693359375, 0.35678863525390625, 0.3851165771484375, 0.41344451904296875, 0.4417724609375, 0.47010040283203125, 0.4984283447265625, 0.5267562866210938, 0.555084228515625, 0.5834121704101562, 0.6117401123046875, 0.6400680541992188, 0.66839599609375, 0.6967239379882812, 0.7250518798828125, 0.7533798217773438, 0.781707763671875, 0.8100357055664062, 0.8383636474609375, 0.8666915893554688, 0.89501953125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 9.0, 14.0, 10.0, 9.0, 28.0, 35.0, 60.0, 81.0, 128.0, 147.0, 132.0, 114.0, 78.0, 35.0, 33.0, 16.0, 13.0, 9.0, 5.0, 12.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0001671314239501953, -0.00016231834888458252, -0.00015750527381896973, -0.00015269219875335693, -0.00014787912368774414, -0.00014306604862213135, -0.00013825297355651855, -0.00013343989849090576, -0.00012862682342529297, -0.00012381374835968018, -0.00011900067329406738, -0.00011418759822845459, -0.0001093745231628418, -0.000104561448097229, -9.974837303161621e-05, -9.493529796600342e-05, -9.012222290039062e-05, -8.530914783477783e-05, -8.049607276916504e-05, -7.568299770355225e-05, -7.086992263793945e-05, -6.605684757232666e-05, -6.124377250671387e-05, -5.6430697441101074e-05, -5.161762237548828e-05, -4.680454730987549e-05, -4.1991472244262695e-05, -3.71783971786499e-05, -3.236532211303711e-05, -2.7552247047424316e-05, -2.2739171981811523e-05, -1.792609691619873e-05, -1.3113021850585938e-05, -8.299946784973145e-06, -3.4868717193603516e-06, 1.3262033462524414e-06, 6.139278411865234e-06, 1.0952353477478027e-05, 1.576542854309082e-05, 2.0578503608703613e-05, 2.5391578674316406e-05, 3.02046537399292e-05, 3.501772880554199e-05, 3.9830803871154785e-05, 4.464387893676758e-05, 4.945695400238037e-05, 5.4270029067993164e-05, 5.908310413360596e-05, 6.389617919921875e-05, 6.870925426483154e-05, 7.352232933044434e-05, 7.833540439605713e-05, 8.314847946166992e-05, 8.796155452728271e-05, 9.277462959289551e-05, 9.75877046585083e-05, 0.0001024007797241211, 0.00010721385478973389, 0.00011202692985534668, 0.00011684000492095947, 0.00012165307998657227, 0.00012646615505218506, 0.00013127923011779785, 0.00013609230518341064, 0.00014090538024902344]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 1.0, 3.0, 6.0, 8.0, 8.0, 3.0, 17.0, 8.0, 20.0, 27.0, 24.0, 57.0, 61.0, 131.0, 197.0, 282.0, 441.0, 855.0, 1625.0, 3658.0, 9184.0, 28298.0, 127960.0, 699160.0, 130671.0, 29112.0, 9088.0, 3710.0, 1669.0, 871.0, 519.0, 267.0, 196.0, 122.0, 86.0, 66.0, 33.0, 33.0, 24.0, 17.0, 5.0, 9.0, 10.0, 7.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.5419921875, -0.5275421142578125, -0.513092041015625, -0.4986419677734375, -0.48419189453125, -0.4697418212890625, -0.455291748046875, -0.4408416748046875, -0.4263916015625, -0.4119415283203125, -0.397491455078125, -0.3830413818359375, -0.36859130859375, -0.3541412353515625, -0.339691162109375, -0.3252410888671875, -0.310791015625, -0.2963409423828125, -0.281890869140625, -0.2674407958984375, -0.25299072265625, -0.2385406494140625, -0.224090576171875, -0.2096405029296875, -0.1951904296875, -0.1807403564453125, -0.166290283203125, -0.1518402099609375, -0.13739013671875, -0.1229400634765625, -0.108489990234375, -0.0940399169921875, -0.07958984375, -0.0651397705078125, -0.050689697265625, -0.0362396240234375, -0.02178955078125, -0.0073394775390625, 0.007110595703125, 0.0215606689453125, 0.0360107421875, 0.0504608154296875, 0.064910888671875, 0.0793609619140625, 0.09381103515625, 0.1082611083984375, 0.122711181640625, 0.1371612548828125, 0.151611328125, 0.1660614013671875, 0.180511474609375, 0.1949615478515625, 0.20941162109375, 0.2238616943359375, 0.238311767578125, 0.2527618408203125, 0.2672119140625, 0.2816619873046875, 0.296112060546875, 0.3105621337890625, 0.32501220703125, 0.3394622802734375, 0.353912353515625, 0.3683624267578125, 0.3828125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 6.0, 7.0, 5.0, 5.0, 2.0, 7.0, 6.0, 8.0, 14.0, 18.0, 12.0, 33.0, 38.0, 46.0, 81.0, 82.0, 97.0, 116.0, 80.0, 92.0, 71.0, 46.0, 31.0, 29.0, 15.0, 16.0, 8.0, 11.0, 4.0, 8.0, 5.0, 2.0, 0.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5439453125, -0.527618408203125, -0.51129150390625, -0.494964599609375, -0.4786376953125, -0.462310791015625, -0.44598388671875, -0.429656982421875, -0.413330078125, -0.397003173828125, -0.38067626953125, -0.364349365234375, -0.3480224609375, -0.331695556640625, -0.31536865234375, -0.299041748046875, -0.28271484375, -0.266387939453125, -0.25006103515625, -0.233734130859375, -0.2174072265625, -0.201080322265625, -0.18475341796875, -0.168426513671875, -0.152099609375, -0.135772705078125, -0.11944580078125, -0.103118896484375, -0.0867919921875, -0.070465087890625, -0.05413818359375, -0.037811279296875, -0.021484375, -0.005157470703125, 0.01116943359375, 0.027496337890625, 0.0438232421875, 0.060150146484375, 0.07647705078125, 0.092803955078125, 0.109130859375, 0.125457763671875, 0.14178466796875, 0.158111572265625, 0.1744384765625, 0.190765380859375, 0.20709228515625, 0.223419189453125, 0.23974609375, 0.256072998046875, 0.27239990234375, 0.288726806640625, 0.3050537109375, 0.321380615234375, 0.33770751953125, 0.354034423828125, 0.370361328125, 0.386688232421875, 0.40301513671875, 0.419342041015625, 0.4356689453125, 0.451995849609375, 0.46832275390625, 0.484649658203125, 0.5009765625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 8.0, 10.0, 13.0, 26.0, 48.0, 103.0, 159.0, 319.0, 141.0, 84.0, 43.0, 21.0, 9.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.255863189697266, -8.824491500854492, -8.393118858337402, -7.961747169494629, -7.5303754806518555, -7.099003314971924, -6.667631149291992, -6.236259460449219, -5.804887294769287, -5.3735151290893555, -4.942143440246582, -4.51077127456665, -4.079399108886719, -3.6480274200439453, -3.2166552543640137, -2.785283327102661, -2.3539113998413086, -1.922539472579956, -1.491167426109314, -1.0597953796386719, -0.6284234523773193, -0.1970515251159668, 0.23432064056396484, 0.6656925678253174, 1.09706449508667, 1.5284364223480225, 1.9598084688186646, 2.3911805152893066, 2.822552442550659, 3.2539243698120117, 3.6852965354919434, 4.116668701171875, 4.548040390014648, 4.97941255569458, 5.4107842445373535, 5.842156410217285, 6.273528099060059, 6.70490026473999, 7.136272430419922, 7.567644119262695, 7.999016284942627, 8.430388450622559, 8.861760139465332, 9.293132781982422, 9.724504470825195, 10.155876159667969, 10.587247848510742, 11.018620491027832, 11.449992179870605, 11.881363868713379, 12.312736511230469, 12.744108200073242, 13.175479888916016, 13.606851577758789, 14.038224220275879, 14.469595909118652, 14.900968551635742, 15.332340240478516, 15.763712882995605, 16.195083618164062, 16.62645721435547, 17.057828903198242, 17.489200592041016, 17.92057228088379, 18.351943969726562]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 5.0, 3.0, 9.0, 12.0, 9.0, 22.0, 11.0, 21.0, 23.0, 23.0, 22.0, 25.0, 38.0, 35.0, 44.0, 66.0, 77.0, 101.0, 85.0, 62.0, 39.0, 37.0, 36.0, 27.0, 23.0, 26.0, 15.0, 20.0, 15.0, 11.0, 13.0, 13.0, 3.0, 8.0, 3.0, 7.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.976898193359375, -8.682901382446289, -8.388904571533203, -8.094907760620117, -7.8009114265441895, -7.5069146156311035, -7.212918281555176, -6.91892147064209, -6.624924659729004, -6.330927848815918, -6.036931037902832, -5.742934703826904, -5.448937892913818, -5.154941082000732, -4.860944747924805, -4.566947937011719, -4.272951126098633, -3.978954315185547, -3.68495774269104, -3.390961170196533, -3.0969643592834473, -2.8029675483703613, -2.5089709758758545, -2.2149744033813477, -1.9209775924682617, -1.6269809007644653, -1.332984209060669, -1.0389875173568726, -0.7449908256530762, -0.4509941339492798, -0.1569974422454834, 0.13699913024902344, 0.4309959411621094, 0.7249926328659058, 1.0189893245697021, 1.3129860162734985, 1.606982707977295, 1.9009793996810913, 2.1949760913848877, 2.4889726638793945, 2.7829694747924805, 3.0769662857055664, 3.3709628582000732, 3.66495943069458, 3.958956241607666, 4.252953052520752, 4.54694938659668, 4.840946197509766, 5.134943008422852, 5.4289398193359375, 5.722936630249023, 6.016932964324951, 6.310929775238037, 6.604926586151123, 6.898922920227051, 7.192919731140137, 7.486916542053223, 7.780913352966309, 8.074910163879395, 8.36890697479248, 8.66290283203125, 8.956899642944336, 9.250896453857422, 9.544893264770508, 9.838890075683594]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 4.0, 14.0, 30.0, 43.0, 70.0, 162.0, 422.0, 1502.0, 6300.0, 52671.0, 2888212.0, 1207862.0, 30589.0, 4663.0, 1128.0, 355.0, 122.0, 56.0, 29.0, 17.0, 6.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.345703125, -2.2803497314453125, -2.214996337890625, -2.1496429443359375, -2.08428955078125, -2.0189361572265625, -1.953582763671875, -1.8882293701171875, -1.8228759765625, -1.7575225830078125, -1.692169189453125, -1.6268157958984375, -1.56146240234375, -1.4961090087890625, -1.430755615234375, -1.3654022216796875, -1.300048828125, -1.2346954345703125, -1.169342041015625, -1.1039886474609375, -1.03863525390625, -0.9732818603515625, -0.907928466796875, -0.8425750732421875, -0.7772216796875, -0.7118682861328125, -0.646514892578125, -0.5811614990234375, -0.51580810546875, -0.4504547119140625, -0.385101318359375, -0.3197479248046875, -0.25439453125, -0.1890411376953125, -0.123687744140625, -0.0583343505859375, 0.00701904296875, 0.0723724365234375, 0.137725830078125, 0.2030792236328125, 0.2684326171875, 0.3337860107421875, 0.399139404296875, 0.4644927978515625, 0.52984619140625, 0.5951995849609375, 0.660552978515625, 0.7259063720703125, 0.791259765625, 0.8566131591796875, 0.921966552734375, 0.9873199462890625, 1.05267333984375, 1.1180267333984375, 1.183380126953125, 1.2487335205078125, 1.3140869140625, 1.3794403076171875, 1.444793701171875, 1.5101470947265625, 1.57550048828125, 1.6408538818359375, 1.706207275390625, 1.7715606689453125, 1.8369140625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 5.0, 7.0, 6.0, 11.0, 9.0, 16.0, 12.0, 19.0, 21.0, 34.0, 32.0, 36.0, 57.0, 58.0, 56.0, 64.0, 70.0, 51.0, 52.0, 55.0, 62.0, 43.0, 40.0, 44.0, 24.0, 34.0, 23.0, 17.0, 17.0, 8.0, 7.0, 6.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.98974609375, -0.9650192260742188, -0.9402923583984375, -0.9155654907226562, -0.890838623046875, -0.8661117553710938, -0.8413848876953125, -0.8166580200195312, -0.79193115234375, -0.7672042846679688, -0.7424774169921875, -0.7177505493164062, -0.693023681640625, -0.6682968139648438, -0.6435699462890625, -0.6188430786132812, -0.5941162109375, -0.5693893432617188, -0.5446624755859375, -0.5199356079101562, -0.495208740234375, -0.47048187255859375, -0.4457550048828125, -0.42102813720703125, -0.39630126953125, -0.37157440185546875, -0.3468475341796875, -0.32212066650390625, -0.297393798828125, -0.27266693115234375, -0.2479400634765625, -0.22321319580078125, -0.198486328125, -0.17375946044921875, -0.1490325927734375, -0.12430572509765625, -0.099578857421875, -0.07485198974609375, -0.0501251220703125, -0.02539825439453125, -0.00067138671875, 0.02405548095703125, 0.0487823486328125, 0.07350921630859375, 0.098236083984375, 0.12296295166015625, 0.1476898193359375, 0.17241668701171875, 0.1971435546875, 0.22187042236328125, 0.2465972900390625, 0.27132415771484375, 0.296051025390625, 0.32077789306640625, 0.3455047607421875, 0.37023162841796875, 0.39495849609375, 0.41968536376953125, 0.4444122314453125, 0.46913909912109375, 0.493865966796875, 0.5185928344726562, 0.5433197021484375, 0.5680465698242188, 0.5927734375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 6.0, 2.0, 14.0, 20.0, 16.0, 16.0, 22.0, 30.0, 59.0, 90.0, 175.0, 364.0, 1084.0, 4082.0, 21062.0, 248814.0, 3736659.0, 159731.0, 16942.0, 3429.0, 905.0, 312.0, 150.0, 81.0, 64.0, 29.0, 30.0, 14.0, 19.0, 16.0, 6.0, 9.0, 5.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.970703125, -1.9117584228515625, -1.852813720703125, -1.7938690185546875, -1.73492431640625, -1.6759796142578125, -1.617034912109375, -1.5580902099609375, -1.4991455078125, -1.4402008056640625, -1.381256103515625, -1.3223114013671875, -1.26336669921875, -1.2044219970703125, -1.145477294921875, -1.0865325927734375, -1.027587890625, -0.9686431884765625, -0.909698486328125, -0.8507537841796875, -0.79180908203125, -0.7328643798828125, -0.673919677734375, -0.6149749755859375, -0.5560302734375, -0.4970855712890625, -0.438140869140625, -0.3791961669921875, -0.32025146484375, -0.2613067626953125, -0.202362060546875, -0.1434173583984375, -0.08447265625, -0.0255279541015625, 0.033416748046875, 0.0923614501953125, 0.15130615234375, 0.2102508544921875, 0.269195556640625, 0.3281402587890625, 0.3870849609375, 0.4460296630859375, 0.504974365234375, 0.5639190673828125, 0.62286376953125, 0.6818084716796875, 0.740753173828125, 0.7996978759765625, 0.858642578125, 0.9175872802734375, 0.976531982421875, 1.0354766845703125, 1.09442138671875, 1.1533660888671875, 1.212310791015625, 1.2712554931640625, 1.3302001953125, 1.3891448974609375, 1.448089599609375, 1.5070343017578125, 1.56597900390625, 1.6249237060546875, 1.683868408203125, 1.7428131103515625, 1.8017578125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 7.0, 8.0, 5.0, 6.0, 8.0, 10.0, 7.0, 20.0, 26.0, 25.0, 42.0, 55.0, 78.0, 137.0, 217.0, 342.0, 551.0, 743.0, 587.0, 408.0, 251.0, 170.0, 95.0, 58.0, 56.0, 37.0, 24.0, 18.0, 12.0, 12.0, 11.0, 7.0, 6.0, 10.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.125, -1.0869598388671875, -1.048919677734375, -1.0108795166015625, -0.97283935546875, -0.9347991943359375, -0.896759033203125, -0.8587188720703125, -0.8206787109375, -0.7826385498046875, -0.744598388671875, -0.7065582275390625, -0.66851806640625, -0.6304779052734375, -0.592437744140625, -0.5543975830078125, -0.516357421875, -0.4783172607421875, -0.440277099609375, -0.4022369384765625, -0.36419677734375, -0.3261566162109375, -0.288116455078125, -0.2500762939453125, -0.2120361328125, -0.1739959716796875, -0.135955810546875, -0.0979156494140625, -0.05987548828125, -0.0218353271484375, 0.016204833984375, 0.0542449951171875, 0.09228515625, 0.1303253173828125, 0.168365478515625, 0.2064056396484375, 0.24444580078125, 0.2824859619140625, 0.320526123046875, 0.3585662841796875, 0.3966064453125, 0.4346466064453125, 0.472686767578125, 0.5107269287109375, 0.54876708984375, 0.5868072509765625, 0.624847412109375, 0.6628875732421875, 0.700927734375, 0.7389678955078125, 0.777008056640625, 0.8150482177734375, 0.85308837890625, 0.8911285400390625, 0.929168701171875, 0.9672088623046875, 1.0052490234375, 1.0432891845703125, 1.081329345703125, 1.1193695068359375, 1.15740966796875, 1.1954498291015625, 1.233489990234375, 1.2715301513671875, 1.3095703125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 8.0, 12.0, 12.0, 30.0, 52.0, 87.0, 108.0, 138.0, 165.0, 111.0, 89.0, 68.0, 34.0, 20.0, 12.0, 12.0, 8.0, 5.0, 4.0, 4.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.272780895233154, -7.011215686798096, -6.749650478363037, -6.488085746765137, -6.226520538330078, -5.9649553298950195, -5.703390121459961, -5.441824913024902, -5.180259704589844, -4.918694496154785, -4.657129287719727, -4.395564079284668, -4.133999347686768, -3.872434139251709, -3.6108689308166504, -3.349303722381592, -3.0877389907836914, -2.826173782348633, -2.5646088123321533, -2.3030436038970947, -2.0414786338806152, -1.7799134254455566, -1.518348217010498, -1.256783127784729, -0.99521803855896, -0.7336529493331909, -0.4720878005027771, -0.21052265167236328, 0.05104243755340576, 0.3126075267791748, 0.5741727352142334, 0.8357378244400024, 1.0973024368286133, 1.3588675260543823, 1.6204326152801514, 1.88199782371521, 2.1435627937316895, 2.405128002166748, 2.6666932106018066, 2.9282584190368652, 3.1898233890533447, 3.4513885974884033, 3.712953567504883, 3.9745187759399414, 4.236083984375, 4.497649192810059, 4.759214401245117, 5.020779132843018, 5.282344341278076, 5.543909549713135, 5.805474758148193, 6.067039489746094, 6.328604698181152, 6.590169906616211, 6.8517351150512695, 7.113300323486328, 7.374865531921387, 7.636430740356445, 7.897995948791504, 8.159561157226562, 8.421126365661621, 8.68269157409668, 8.944255828857422, 9.20582103729248, 9.467386245727539]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 5.0, 13.0, 8.0, 17.0, 20.0, 30.0, 17.0, 28.0, 30.0, 32.0, 42.0, 44.0, 73.0, 54.0, 58.0, 58.0, 54.0, 55.0, 41.0, 50.0, 55.0, 31.0, 33.0, 26.0, 22.0, 21.0, 23.0, 20.0, 11.0, 5.0, 8.0, 7.0, 6.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.614980697631836, -5.408015251159668, -5.201049327850342, -4.994083881378174, -4.787118434906006, -4.58015251159668, -4.373187065124512, -4.166221618652344, -3.9592559337615967, -3.7522902488708496, -3.5453248023986816, -3.3383591175079346, -3.1313934326171875, -2.9244279861450195, -2.7174623012542725, -2.5104966163635254, -2.3035311698913574, -2.0965654850006104, -1.8896000385284424, -1.6826343536376953, -1.4756687879562378, -1.2687032222747803, -1.0617375373840332, -0.8547719717025757, -0.6478064060211182, -0.44084081053733826, -0.23387521505355835, -0.026909589767456055, 0.18005597591400146, 0.387021541595459, 0.593987226486206, 0.8009527921676636, 1.007918357849121, 1.2148839235305786, 1.4218494892120361, 1.6288151741027832, 1.8357807397842407, 2.0427463054656982, 2.2497119903564453, 2.4566774368286133, 2.6636431217193604, 2.8706088066101074, 3.0775742530822754, 3.2845399379730225, 3.4915056228637695, 3.6984710693359375, 3.9054367542266846, 4.112402439117432, 4.3193678855896, 4.526333332061768, 4.733299255371094, 4.940264701843262, 5.14723014831543, 5.354195594787598, 5.561161518096924, 5.768126964569092, 5.975092887878418, 6.182058334350586, 6.389024257659912, 6.59598970413208, 6.802955150604248, 7.009921073913574, 7.216886520385742, 7.42385196685791, 7.630817413330078]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 13.0, 7.0, 12.0, 9.0, 27.0, 37.0, 55.0, 66.0, 124.0, 213.0, 352.0, 723.0, 1495.0, 3263.0, 8229.0, 25478.0, 107178.0, 536820.0, 286022.0, 53448.0, 15040.0, 5331.0, 2282.0, 1054.0, 515.0, 301.0, 152.0, 94.0, 65.0, 45.0, 34.0, 11.0, 11.0, 14.0, 4.0, 8.0, 8.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-1.390625, -1.34686279296875, -1.3031005859375, -1.25933837890625, -1.215576171875, -1.17181396484375, -1.1280517578125, -1.08428955078125, -1.04052734375, -0.99676513671875, -0.9530029296875, -0.90924072265625, -0.865478515625, -0.82171630859375, -0.7779541015625, -0.73419189453125, -0.6904296875, -0.64666748046875, -0.6029052734375, -0.55914306640625, -0.515380859375, -0.47161865234375, -0.4278564453125, -0.38409423828125, -0.34033203125, -0.29656982421875, -0.2528076171875, -0.20904541015625, -0.165283203125, -0.12152099609375, -0.0777587890625, -0.03399658203125, 0.009765625, 0.05352783203125, 0.0972900390625, 0.14105224609375, 0.184814453125, 0.22857666015625, 0.2723388671875, 0.31610107421875, 0.35986328125, 0.40362548828125, 0.4473876953125, 0.49114990234375, 0.534912109375, 0.57867431640625, 0.6224365234375, 0.66619873046875, 0.7099609375, 0.75372314453125, 0.7974853515625, 0.84124755859375, 0.885009765625, 0.92877197265625, 0.9725341796875, 1.01629638671875, 1.06005859375, 1.10382080078125, 1.1475830078125, 1.19134521484375, 1.235107421875, 1.27886962890625, 1.3226318359375, 1.36639404296875, 1.41015625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 8.0, 9.0, 9.0, 15.0, 14.0, 15.0, 28.0, 25.0, 36.0, 39.0, 41.0, 47.0, 60.0, 67.0, 46.0, 57.0, 52.0, 51.0, 63.0, 43.0, 46.0, 36.0, 29.0, 35.0, 34.0, 19.0, 18.0, 10.0, 9.0, 11.0, 12.0, 4.0, 6.0, 3.0, 1.0, 5.0, 3.0, 0.0, 1.0], "bins": [-0.9951171875, -0.9706878662109375, -0.946258544921875, -0.9218292236328125, -0.89739990234375, -0.8729705810546875, -0.848541259765625, -0.8241119384765625, -0.7996826171875, -0.7752532958984375, -0.750823974609375, -0.7263946533203125, -0.70196533203125, -0.6775360107421875, -0.653106689453125, -0.6286773681640625, -0.604248046875, -0.5798187255859375, -0.555389404296875, -0.5309600830078125, -0.50653076171875, -0.4821014404296875, -0.457672119140625, -0.4332427978515625, -0.4088134765625, -0.3843841552734375, -0.359954833984375, -0.3355255126953125, -0.31109619140625, -0.2866668701171875, -0.262237548828125, -0.2378082275390625, -0.21337890625, -0.1889495849609375, -0.164520263671875, -0.1400909423828125, -0.11566162109375, -0.0912322998046875, -0.066802978515625, -0.0423736572265625, -0.0179443359375, 0.0064849853515625, 0.030914306640625, 0.0553436279296875, 0.07977294921875, 0.1042022705078125, 0.128631591796875, 0.1530609130859375, 0.177490234375, 0.2019195556640625, 0.226348876953125, 0.2507781982421875, 0.27520751953125, 0.2996368408203125, 0.324066162109375, 0.3484954833984375, 0.3729248046875, 0.3973541259765625, 0.421783447265625, 0.4462127685546875, 0.47064208984375, 0.4950714111328125, 0.519500732421875, 0.5439300537109375, 0.568359375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 9.0, 5.0, 12.0, 9.0, 19.0, 20.0, 33.0, 49.0, 84.0, 122.0, 222.0, 422.0, 907.0, 2367.0, 9635.0, 130428.0, 871896.0, 25318.0, 4241.0, 1368.0, 575.0, 322.0, 168.0, 98.0, 66.0, 44.0, 30.0, 24.0, 9.0, 9.0, 13.0, 4.0, 6.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.12890625, -2.033172607421875, -1.93743896484375, -1.841705322265625, -1.7459716796875, -1.650238037109375, -1.55450439453125, -1.458770751953125, -1.363037109375, -1.267303466796875, -1.17156982421875, -1.075836181640625, -0.9801025390625, -0.884368896484375, -0.78863525390625, -0.692901611328125, -0.59716796875, -0.501434326171875, -0.40570068359375, -0.309967041015625, -0.2142333984375, -0.118499755859375, -0.02276611328125, 0.072967529296875, 0.168701171875, 0.264434814453125, 0.36016845703125, 0.455902099609375, 0.5516357421875, 0.647369384765625, 0.74310302734375, 0.838836669921875, 0.9345703125, 1.030303955078125, 1.12603759765625, 1.221771240234375, 1.3175048828125, 1.413238525390625, 1.50897216796875, 1.604705810546875, 1.700439453125, 1.796173095703125, 1.89190673828125, 1.987640380859375, 2.0833740234375, 2.179107666015625, 2.27484130859375, 2.370574951171875, 2.46630859375, 2.562042236328125, 2.65777587890625, 2.753509521484375, 2.8492431640625, 2.944976806640625, 3.04071044921875, 3.136444091796875, 3.232177734375, 3.327911376953125, 3.42364501953125, 3.519378662109375, 3.6151123046875, 3.710845947265625, 3.80657958984375, 3.902313232421875, 3.998046875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 9.0, 12.0, 7.0, 10.0, 21.0, 25.0, 40.0, 37.0, 62.0, 64.0, 81.0, 90.0, 86.0, 98.0, 78.0, 73.0, 38.0, 36.0, 31.0, 26.0, 23.0, 15.0, 10.0, 11.0, 4.0, 5.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.783203125, -3.658966064453125, -3.53472900390625, -3.410491943359375, -3.2862548828125, -3.162017822265625, -3.03778076171875, -2.913543701171875, -2.789306640625, -2.665069580078125, -2.54083251953125, -2.416595458984375, -2.2923583984375, -2.168121337890625, -2.04388427734375, -1.919647216796875, -1.79541015625, -1.671173095703125, -1.54693603515625, -1.422698974609375, -1.2984619140625, -1.174224853515625, -1.04998779296875, -0.925750732421875, -0.801513671875, -0.677276611328125, -0.55303955078125, -0.428802490234375, -0.3045654296875, -0.180328369140625, -0.05609130859375, 0.068145751953125, 0.1923828125, 0.316619873046875, 0.44085693359375, 0.565093994140625, 0.6893310546875, 0.813568115234375, 0.93780517578125, 1.062042236328125, 1.186279296875, 1.310516357421875, 1.43475341796875, 1.558990478515625, 1.6832275390625, 1.807464599609375, 1.93170166015625, 2.055938720703125, 2.18017578125, 2.304412841796875, 2.42864990234375, 2.552886962890625, 2.6771240234375, 2.801361083984375, 2.92559814453125, 3.049835205078125, 3.174072265625, 3.298309326171875, 3.42254638671875, 3.546783447265625, 3.6710205078125, 3.795257568359375, 3.91949462890625, 4.043731689453125, 4.16796875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 5.0, 8.0, 10.0, 9.0, 15.0, 11.0, 19.0, 22.0, 26.0, 40.0, 63.0, 111.0, 230.0, 509.0, 1277.0, 4029.0, 19115.0, 673309.0, 326652.0, 17102.0, 3764.0, 1188.0, 450.0, 226.0, 117.0, 56.0, 37.0, 27.0, 26.0, 17.0, 13.0, 12.0, 7.0, 8.0, 2.0, 11.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70703125, -0.683441162109375, -0.65985107421875, -0.636260986328125, -0.6126708984375, -0.589080810546875, -0.56549072265625, -0.541900634765625, -0.518310546875, -0.494720458984375, -0.47113037109375, -0.447540283203125, -0.4239501953125, -0.400360107421875, -0.37677001953125, -0.353179931640625, -0.32958984375, -0.305999755859375, -0.28240966796875, -0.258819580078125, -0.2352294921875, -0.211639404296875, -0.18804931640625, -0.164459228515625, -0.140869140625, -0.117279052734375, -0.09368896484375, -0.070098876953125, -0.0465087890625, -0.022918701171875, 0.00067138671875, 0.024261474609375, 0.0478515625, 0.071441650390625, 0.09503173828125, 0.118621826171875, 0.1422119140625, 0.165802001953125, 0.18939208984375, 0.212982177734375, 0.236572265625, 0.260162353515625, 0.28375244140625, 0.307342529296875, 0.3309326171875, 0.354522705078125, 0.37811279296875, 0.401702880859375, 0.42529296875, 0.448883056640625, 0.47247314453125, 0.496063232421875, 0.5196533203125, 0.543243408203125, 0.56683349609375, 0.590423583984375, 0.614013671875, 0.637603759765625, 0.66119384765625, 0.684783935546875, 0.7083740234375, 0.731964111328125, 0.75555419921875, 0.779144287109375, 0.802734375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 4.0, 6.0, 10.0, 20.0, 25.0, 58.0, 162.0, 360.0, 172.0, 74.0, 27.0, 21.0, 9.0, 11.0, 7.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00028586387634277344, -0.0002778284251689911, -0.00026979297399520874, -0.0002617575228214264, -0.00025372207164764404, -0.0002456866204738617, -0.00023765116930007935, -0.000229615718126297, -0.00022158026695251465, -0.0002135448157787323, -0.00020550936460494995, -0.0001974739134311676, -0.00018943846225738525, -0.0001814030110836029, -0.00017336755990982056, -0.0001653321087360382, -0.00015729665756225586, -0.0001492612063884735, -0.00014122575521469116, -0.0001331903040409088, -0.00012515485286712646, -0.00011711940169334412, -0.00010908395051956177, -0.00010104849934577942, -9.301304817199707e-05, -8.497759699821472e-05, -7.694214582443237e-05, -6.890669465065002e-05, -6.0871243476867676e-05, -5.283579230308533e-05, -4.480034112930298e-05, -3.676488995552063e-05, -2.872943878173828e-05, -2.0693987607955933e-05, -1.2658536434173584e-05, -4.623085260391235e-06, 3.4123659133911133e-06, 1.1447817087173462e-05, 1.948326826095581e-05, 2.751871943473816e-05, 3.555417060852051e-05, 4.3589621782302856e-05, 5.1625072956085205e-05, 5.9660524129867554e-05, 6.76959753036499e-05, 7.573142647743225e-05, 8.37668776512146e-05, 9.180232882499695e-05, 9.98377799987793e-05, 0.00010787323117256165, 0.000115908682346344, 0.00012394413352012634, 0.0001319795846939087, 0.00014001503586769104, 0.0001480504870414734, 0.00015608593821525574, 0.00016412138938903809, 0.00017215684056282043, 0.00018019229173660278, 0.00018822774291038513, 0.00019626319408416748, 0.00020429864525794983, 0.00021233409643173218, 0.00022036954760551453, 0.00022840499877929688]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 3.0, 10.0, 4.0, 12.0, 17.0, 21.0, 38.0, 38.0, 84.0, 127.0, 230.0, 394.0, 768.0, 1701.0, 4439.0, 16496.0, 124386.0, 817724.0, 64968.0, 10908.0, 3389.0, 1321.0, 616.0, 337.0, 190.0, 121.0, 63.0, 44.0, 34.0, 19.0, 11.0, 6.0, 13.0, 4.0, 2.0, 9.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.57958984375, -0.5636520385742188, -0.5477142333984375, -0.5317764282226562, -0.515838623046875, -0.49990081787109375, -0.4839630126953125, -0.46802520751953125, -0.45208740234375, -0.43614959716796875, -0.4202117919921875, -0.40427398681640625, -0.388336181640625, -0.37239837646484375, -0.3564605712890625, -0.34052276611328125, -0.3245849609375, -0.30864715576171875, -0.2927093505859375, -0.27677154541015625, -0.260833740234375, -0.24489593505859375, -0.2289581298828125, -0.21302032470703125, -0.19708251953125, -0.18114471435546875, -0.1652069091796875, -0.14926910400390625, -0.133331298828125, -0.11739349365234375, -0.1014556884765625, -0.08551788330078125, -0.069580078125, -0.05364227294921875, -0.0377044677734375, -0.02176666259765625, -0.005828857421875, 0.01010894775390625, 0.0260467529296875, 0.04198455810546875, 0.05792236328125, 0.07386016845703125, 0.0897979736328125, 0.10573577880859375, 0.121673583984375, 0.13761138916015625, 0.1535491943359375, 0.16948699951171875, 0.1854248046875, 0.20136260986328125, 0.2173004150390625, 0.23323822021484375, 0.249176025390625, 0.26511383056640625, 0.2810516357421875, 0.29698944091796875, 0.31292724609375, 0.32886505126953125, 0.3448028564453125, 0.36074066162109375, 0.376678466796875, 0.39261627197265625, 0.4085540771484375, 0.42449188232421875, 0.4404296875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 1.0, 3.0, 5.0, 5.0, 9.0, 9.0, 16.0, 15.0, 17.0, 28.0, 21.0, 39.0, 44.0, 53.0, 88.0, 111.0, 81.0, 90.0, 71.0, 65.0, 58.0, 38.0, 32.0, 20.0, 19.0, 14.0, 13.0, 11.0, 5.0, 1.0, 3.0, 1.0, 6.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.31591796875, -0.304046630859375, -0.29217529296875, -0.280303955078125, -0.2684326171875, -0.256561279296875, -0.24468994140625, -0.232818603515625, -0.220947265625, -0.209075927734375, -0.19720458984375, -0.185333251953125, -0.1734619140625, -0.161590576171875, -0.14971923828125, -0.137847900390625, -0.1259765625, -0.114105224609375, -0.10223388671875, -0.090362548828125, -0.0784912109375, -0.066619873046875, -0.05474853515625, -0.042877197265625, -0.031005859375, -0.019134521484375, -0.00726318359375, 0.004608154296875, 0.0164794921875, 0.028350830078125, 0.04022216796875, 0.052093505859375, 0.06396484375, 0.075836181640625, 0.08770751953125, 0.099578857421875, 0.1114501953125, 0.123321533203125, 0.13519287109375, 0.147064208984375, 0.158935546875, 0.170806884765625, 0.18267822265625, 0.194549560546875, 0.2064208984375, 0.218292236328125, 0.23016357421875, 0.242034912109375, 0.25390625, 0.265777587890625, 0.27764892578125, 0.289520263671875, 0.3013916015625, 0.313262939453125, 0.32513427734375, 0.337005615234375, 0.348876953125, 0.360748291015625, 0.37261962890625, 0.384490966796875, 0.3963623046875, 0.408233642578125, 0.42010498046875, 0.431976318359375, 0.44384765625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 5.0, 13.0, 21.0, 48.0, 140.0, 479.0, 170.0, 68.0, 13.0, 17.0, 5.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.29620361328125, -22.6197566986084, -21.943309783935547, -21.266862869262695, -20.590415954589844, -19.91396713256836, -19.23752212524414, -18.561073303222656, -17.884626388549805, -17.208179473876953, -16.5317325592041, -15.85528564453125, -15.178837776184082, -14.50239086151123, -13.825943946838379, -13.149496078491211, -12.473050117492676, -11.796603202819824, -11.120156288146973, -10.443708419799805, -9.767261505126953, -9.090814590454102, -8.41436767578125, -7.73792028427124, -7.061473369598389, -6.385026454925537, -5.708579063415527, -5.032132148742676, -4.355685234069824, -3.6792378425598145, -3.002790927886963, -2.326343536376953, -1.6498966217041016, -0.9734495282173157, -0.2970024347305298, 0.37944459915161133, 1.055891752243042, 1.7323389053344727, 2.408785820007324, 3.085233211517334, 3.7616801261901855, 4.438127040863037, 5.114574432373047, 5.791021347045898, 6.46746826171875, 7.14391565322876, 7.820362567901611, 8.496809959411621, 9.173256874084473, 9.849703788757324, 10.526150703430176, 11.202598571777344, 11.879045486450195, 12.555492401123047, 13.231939315795898, 13.90838623046875, 14.584833145141602, 15.261280059814453, 15.937726974487305, 16.614173889160156, 17.290620803833008, 17.96706771850586, 18.643516540527344, 19.319963455200195, 19.996410369873047]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 7.0, 8.0, 9.0, 8.0, 10.0, 15.0, 18.0, 19.0, 27.0, 32.0, 35.0, 39.0, 62.0, 69.0, 125.0, 116.0, 79.0, 65.0, 47.0, 37.0, 26.0, 24.0, 28.0, 33.0, 12.0, 11.0, 12.0, 10.0, 3.0, 2.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.97336196899414, -10.620179176330566, -10.266995429992676, -9.913812637329102, -9.560629844665527, -9.207447052001953, -8.854263305664062, -8.501080513000488, -8.147897720336914, -7.794714450836182, -7.441531658172607, -7.088348388671875, -6.735165596008301, -6.381982326507568, -6.028799057006836, -5.675616264343262, -5.322432518005371, -4.969249248504639, -4.6160664558410645, -4.262883186340332, -3.9097001552581787, -3.5565171241760254, -3.203333854675293, -2.8501508235931396, -2.4969677925109863, -2.143784761428833, -1.7906016111373901, -1.4374184608459473, -1.084235429763794, -0.7310523986816406, -0.3778691291809082, -0.024686098098754883, 0.32849788665771484, 0.6816809773445129, 1.034864068031311, 1.388047218322754, 1.7412302494049072, 2.0944132804870605, 2.447596549987793, 2.8007795810699463, 3.1539626121520996, 3.507145643234253, 3.8603286743164062, 4.213511943817139, 4.566695213317871, 4.919878005981445, 5.273061275482178, 5.62624454498291, 5.979427337646484, 6.332610607147217, 6.685793399810791, 7.038976669311523, 7.392159461975098, 7.74534273147583, 8.098526000976562, 8.451708793640137, 8.804891586303711, 9.158074378967285, 9.511258125305176, 9.86444091796875, 10.217623710632324, 10.570806503295898, 10.923990249633789, 11.277173042297363, 11.630356788635254]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 4.0, 5.0, 7.0, 21.0, 24.0, 28.0, 56.0, 58.0, 121.0, 221.0, 426.0, 791.0, 1953.0, 5681.0, 24462.0, 342477.0, 3341802.0, 437772.0, 28131.0, 6294.0, 2071.0, 890.0, 424.0, 234.0, 131.0, 74.0, 41.0, 28.0, 21.0, 14.0, 10.0, 5.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.607421875, -2.5360565185546875, -2.464691162109375, -2.3933258056640625, -2.32196044921875, -2.2505950927734375, -2.179229736328125, -2.1078643798828125, -2.0364990234375, -1.9651336669921875, -1.893768310546875, -1.8224029541015625, -1.75103759765625, -1.6796722412109375, -1.608306884765625, -1.5369415283203125, -1.465576171875, -1.3942108154296875, -1.322845458984375, -1.2514801025390625, -1.18011474609375, -1.1087493896484375, -1.037384033203125, -0.9660186767578125, -0.8946533203125, -0.8232879638671875, -0.751922607421875, -0.6805572509765625, -0.60919189453125, -0.5378265380859375, -0.466461181640625, -0.3950958251953125, -0.32373046875, -0.2523651123046875, -0.180999755859375, -0.1096343994140625, -0.03826904296875, 0.0330963134765625, 0.104461669921875, 0.1758270263671875, 0.2471923828125, 0.3185577392578125, 0.389923095703125, 0.4612884521484375, 0.53265380859375, 0.6040191650390625, 0.675384521484375, 0.7467498779296875, 0.818115234375, 0.8894805908203125, 0.960845947265625, 1.0322113037109375, 1.10357666015625, 1.1749420166015625, 1.246307373046875, 1.3176727294921875, 1.3890380859375, 1.4604034423828125, 1.531768798828125, 1.6031341552734375, 1.67449951171875, 1.7458648681640625, 1.817230224609375, 1.8885955810546875, 1.9599609375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 1.0, 3.0, 6.0, 3.0, 6.0, 7.0, 7.0, 19.0, 4.0, 17.0, 9.0, 19.0, 27.0, 15.0, 23.0, 23.0, 34.0, 32.0, 45.0, 52.0, 36.0, 39.0, 40.0, 43.0, 39.0, 35.0, 34.0, 39.0, 47.0, 37.0, 36.0, 25.0, 23.0, 29.0, 20.0, 11.0, 22.0, 19.0, 8.0, 9.0, 7.0, 12.0, 11.0, 6.0, 11.0, 6.0, 2.0, 0.0, 6.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.54833984375, -0.5317153930664062, -0.5150909423828125, -0.49846649169921875, -0.481842041015625, -0.46521759033203125, -0.4485931396484375, -0.43196868896484375, -0.41534423828125, -0.39871978759765625, -0.3820953369140625, -0.36547088623046875, -0.348846435546875, -0.33222198486328125, -0.3155975341796875, -0.29897308349609375, -0.2823486328125, -0.26572418212890625, -0.2490997314453125, -0.23247528076171875, -0.215850830078125, -0.19922637939453125, -0.1826019287109375, -0.16597747802734375, -0.14935302734375, -0.13272857666015625, -0.1161041259765625, -0.09947967529296875, -0.082855224609375, -0.06623077392578125, -0.0496063232421875, -0.03298187255859375, -0.016357421875, 0.00026702880859375, 0.0168914794921875, 0.03351593017578125, 0.050140380859375, 0.06676483154296875, 0.0833892822265625, 0.10001373291015625, 0.11663818359375, 0.13326263427734375, 0.1498870849609375, 0.16651153564453125, 0.183135986328125, 0.19976043701171875, 0.2163848876953125, 0.23300933837890625, 0.2496337890625, 0.26625823974609375, 0.2828826904296875, 0.29950714111328125, 0.316131591796875, 0.33275604248046875, 0.3493804931640625, 0.36600494384765625, 0.38262939453125, 0.39925384521484375, 0.4158782958984375, 0.43250274658203125, 0.449127197265625, 0.46575164794921875, 0.4823760986328125, 0.49900054931640625, 0.515625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 9.0, 4.0, 12.0, 18.0, 27.0, 41.0, 53.0, 80.0, 169.0, 249.0, 478.0, 1027.0, 2628.0, 10369.0, 186457.0, 3921676.0, 61015.0, 6362.0, 1847.0, 740.0, 361.0, 238.0, 134.0, 98.0, 51.0, 47.0, 22.0, 15.0, 10.0, 17.0, 6.0, 3.0, 5.0, 5.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.171875, -4.05047607421875, -3.9290771484375, -3.80767822265625, -3.686279296875, -3.56488037109375, -3.4434814453125, -3.32208251953125, -3.20068359375, -3.07928466796875, -2.9578857421875, -2.83648681640625, -2.715087890625, -2.59368896484375, -2.4722900390625, -2.35089111328125, -2.2294921875, -2.10809326171875, -1.9866943359375, -1.86529541015625, -1.743896484375, -1.62249755859375, -1.5010986328125, -1.37969970703125, -1.25830078125, -1.13690185546875, -1.0155029296875, -0.89410400390625, -0.772705078125, -0.65130615234375, -0.5299072265625, -0.40850830078125, -0.287109375, -0.16571044921875, -0.0443115234375, 0.07708740234375, 0.198486328125, 0.31988525390625, 0.4412841796875, 0.56268310546875, 0.68408203125, 0.80548095703125, 0.9268798828125, 1.04827880859375, 1.169677734375, 1.29107666015625, 1.4124755859375, 1.53387451171875, 1.6552734375, 1.77667236328125, 1.8980712890625, 2.01947021484375, 2.140869140625, 2.26226806640625, 2.3836669921875, 2.50506591796875, 2.62646484375, 2.74786376953125, 2.8692626953125, 2.99066162109375, 3.112060546875, 3.23345947265625, 3.3548583984375, 3.47625732421875, 3.59765625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 5.0, 1.0, 4.0, 9.0, 5.0, 9.0, 15.0, 36.0, 42.0, 53.0, 73.0, 83.0, 144.0, 197.0, 313.0, 429.0, 619.0, 633.0, 442.0, 300.0, 220.0, 155.0, 86.0, 54.0, 38.0, 34.0, 28.0, 14.0, 11.0, 7.0, 6.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6943359375, -1.6239776611328125, -1.553619384765625, -1.4832611083984375, -1.41290283203125, -1.3425445556640625, -1.272186279296875, -1.2018280029296875, -1.1314697265625, -1.0611114501953125, -0.990753173828125, -0.9203948974609375, -0.85003662109375, -0.7796783447265625, -0.709320068359375, -0.6389617919921875, -0.568603515625, -0.4982452392578125, -0.427886962890625, -0.3575286865234375, -0.28717041015625, -0.2168121337890625, -0.146453857421875, -0.0760955810546875, -0.0057373046875, 0.0646209716796875, 0.134979248046875, 0.2053375244140625, 0.27569580078125, 0.3460540771484375, 0.416412353515625, 0.4867706298828125, 0.55712890625, 0.6274871826171875, 0.697845458984375, 0.7682037353515625, 0.83856201171875, 0.9089202880859375, 0.979278564453125, 1.0496368408203125, 1.1199951171875, 1.1903533935546875, 1.260711669921875, 1.3310699462890625, 1.40142822265625, 1.4717864990234375, 1.542144775390625, 1.6125030517578125, 1.682861328125, 1.7532196044921875, 1.823577880859375, 1.8939361572265625, 1.96429443359375, 2.0346527099609375, 2.105010986328125, 2.1753692626953125, 2.2457275390625, 2.3160858154296875, 2.386444091796875, 2.4568023681640625, 2.52716064453125, 2.5975189208984375, 2.667877197265625, 2.7382354736328125, 2.80859375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 6.0, 9.0, 17.0, 30.0, 57.0, 125.0, 238.0, 235.0, 137.0, 59.0, 29.0, 18.0, 8.0, 8.0, 9.0, 6.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.02146911621094, -42.04667663574219, -41.07188034057617, -40.097084045410156, -39.122291564941406, -38.147499084472656, -37.17270278930664, -36.197906494140625, -35.223114013671875, -34.248321533203125, -33.27352523803711, -32.298728942871094, -31.323936462402344, -30.34914207458496, -29.374347686767578, -28.399553298950195, -27.424758911132812, -26.44996452331543, -25.475170135498047, -24.500375747680664, -23.52558135986328, -22.5507869720459, -21.575992584228516, -20.601198196411133, -19.62640380859375, -18.651609420776367, -17.676815032958984, -16.7020206451416, -15.727226257324219, -14.752431869506836, -13.777637481689453, -12.80284309387207, -11.828048706054688, -10.853254318237305, -9.878459930419922, -8.903665542602539, -7.928871154785156, -6.954076766967773, -5.979282379150391, -5.004487991333008, -4.029693603515625, -3.054899215698242, -2.0801048278808594, -1.1053104400634766, -0.13051605224609375, 0.8442783355712891, 1.8190727233886719, 2.7938671112060547, 3.7686614990234375, 4.74345588684082, 5.718250274658203, 6.693044662475586, 7.667839050292969, 8.642633438110352, 9.617427825927734, 10.592222213745117, 11.5670166015625, 12.541810989379883, 13.516605377197266, 14.491399765014648, 15.466194152832031, 16.440988540649414, 17.415782928466797, 18.39057731628418, 19.365371704101562]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 5.0, 5.0, 13.0, 13.0, 14.0, 13.0, 26.0, 21.0, 29.0, 33.0, 47.0, 42.0, 38.0, 53.0, 43.0, 60.0, 66.0, 51.0, 57.0, 47.0, 45.0, 38.0, 30.0, 30.0, 31.0, 30.0, 20.0, 19.0, 15.0, 12.0, 8.0, 11.0, 8.0, 1.0, 3.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0], "bins": [-12.217418670654297, -11.84764575958252, -11.477871894836426, -11.108098983764648, -10.738325119018555, -10.368552207946777, -9.998779296875, -9.629005432128906, -9.259232521057129, -8.889459609985352, -8.519685745239258, -8.14991283416748, -7.780139446258545, -7.410366058349609, -7.040592670440674, -6.670819282531738, -6.301045894622803, -5.931272506713867, -5.561499118804932, -5.191725730895996, -4.821952819824219, -4.452179431915283, -4.082406044006348, -3.712632894515991, -3.3428595066070557, -2.97308611869812, -2.6033129692077637, -2.233539581298828, -1.8637663125991821, -1.4939930438995361, -1.1242196559906006, -0.7544465065002441, -0.3846731185913086, -0.01489982008934021, 0.3548734784126282, 0.724646806716919, 1.094420075416565, 1.464193344116211, 1.8339667320251465, 2.203739881515503, 2.5735132694244385, 2.943286657333374, 3.3130598068237305, 3.682833194732666, 4.052606582641602, 4.422379493713379, 4.792153358459473, 5.16192626953125, 5.5316996574401855, 5.901473045349121, 6.271246433258057, 6.641019821166992, 7.0107927322387695, 7.380566120147705, 7.750339508056641, 8.120112419128418, 8.489886283874512, 8.859659194946289, 9.229433059692383, 9.59920597076416, 9.968979835510254, 10.338752746582031, 10.708526611328125, 11.078299522399902, 11.44807243347168]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 9.0, 10.0, 9.0, 14.0, 22.0, 29.0, 39.0, 68.0, 121.0, 179.0, 312.0, 489.0, 902.0, 1716.0, 3411.0, 7348.0, 18793.0, 56365.0, 253942.0, 557122.0, 98248.0, 29165.0, 10628.0, 4553.0, 2273.0, 1139.0, 661.0, 357.0, 229.0, 127.0, 87.0, 48.0, 45.0, 31.0, 17.0, 13.0, 6.0, 7.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.93505859375, -0.9041061401367188, -0.8731536865234375, -0.8422012329101562, -0.811248779296875, -0.7802963256835938, -0.7493438720703125, -0.7183914184570312, -0.68743896484375, -0.6564865112304688, -0.6255340576171875, -0.5945816040039062, -0.563629150390625, -0.5326766967773438, -0.5017242431640625, -0.47077178955078125, -0.4398193359375, -0.40886688232421875, -0.3779144287109375, -0.34696197509765625, -0.316009521484375, -0.28505706787109375, -0.2541046142578125, -0.22315216064453125, -0.19219970703125, -0.16124725341796875, -0.1302947998046875, -0.09934234619140625, -0.068389892578125, -0.03743743896484375, -0.0064849853515625, 0.02446746826171875, 0.055419921875, 0.08637237548828125, 0.1173248291015625, 0.14827728271484375, 0.179229736328125, 0.21018218994140625, 0.2411346435546875, 0.27208709716796875, 0.30303955078125, 0.33399200439453125, 0.3649444580078125, 0.39589691162109375, 0.426849365234375, 0.45780181884765625, 0.4887542724609375, 0.5197067260742188, 0.5506591796875, 0.5816116333007812, 0.6125640869140625, 0.6435165405273438, 0.674468994140625, 0.7054214477539062, 0.7363739013671875, 0.7673263549804688, 0.79827880859375, 0.8292312622070312, 0.8601837158203125, 0.8911361694335938, 0.922088623046875, 0.9530410766601562, 0.9839935302734375, 1.0149459838867188, 1.0458984375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 11.0, 10.0, 13.0, 11.0, 25.0, 16.0, 28.0, 33.0, 31.0, 31.0, 46.0, 61.0, 50.0, 60.0, 63.0, 56.0, 37.0, 47.0, 42.0, 60.0, 33.0, 26.0, 36.0, 33.0, 24.0, 26.0, 13.0, 11.0, 13.0, 11.0, 6.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.712890625, -0.6875839233398438, -0.6622772216796875, -0.6369705200195312, -0.611663818359375, -0.5863571166992188, -0.5610504150390625, -0.5357437133789062, -0.51043701171875, -0.48513031005859375, -0.4598236083984375, -0.43451690673828125, -0.409210205078125, -0.38390350341796875, -0.3585968017578125, -0.33329010009765625, -0.3079833984375, -0.28267669677734375, -0.2573699951171875, -0.23206329345703125, -0.206756591796875, -0.18144989013671875, -0.1561431884765625, -0.13083648681640625, -0.10552978515625, -0.08022308349609375, -0.0549163818359375, -0.02960968017578125, -0.004302978515625, 0.02100372314453125, 0.0463104248046875, 0.07161712646484375, 0.096923828125, 0.12223052978515625, 0.1475372314453125, 0.17284393310546875, 0.198150634765625, 0.22345733642578125, 0.2487640380859375, 0.27407073974609375, 0.29937744140625, 0.32468414306640625, 0.3499908447265625, 0.37529754638671875, 0.400604248046875, 0.42591094970703125, 0.4512176513671875, 0.47652435302734375, 0.5018310546875, 0.5271377563476562, 0.5524444580078125, 0.5777511596679688, 0.603057861328125, 0.6283645629882812, 0.6536712646484375, 0.6789779663085938, 0.70428466796875, 0.7295913696289062, 0.7548980712890625, 0.7802047729492188, 0.805511474609375, 0.8308181762695312, 0.8561248779296875, 0.8814315795898438, 0.90673828125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 8.0, 2.0, 6.0, 9.0, 15.0, 12.0, 21.0, 34.0, 49.0, 93.0, 135.0, 256.0, 421.0, 985.0, 3511.0, 26762.0, 948079.0, 60203.0, 5288.0, 1352.0, 523.0, 282.0, 181.0, 116.0, 62.0, 43.0, 29.0, 25.0, 19.0, 7.0, 6.0, 11.0, 6.0, 8.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.04296875, -1.97161865234375, -1.9002685546875, -1.82891845703125, -1.757568359375, -1.68621826171875, -1.6148681640625, -1.54351806640625, -1.47216796875, -1.40081787109375, -1.3294677734375, -1.25811767578125, -1.186767578125, -1.11541748046875, -1.0440673828125, -0.97271728515625, -0.9013671875, -0.83001708984375, -0.7586669921875, -0.68731689453125, -0.615966796875, -0.54461669921875, -0.4732666015625, -0.40191650390625, -0.33056640625, -0.25921630859375, -0.1878662109375, -0.11651611328125, -0.045166015625, 0.02618408203125, 0.0975341796875, 0.16888427734375, 0.240234375, 0.31158447265625, 0.3829345703125, 0.45428466796875, 0.525634765625, 0.59698486328125, 0.6683349609375, 0.73968505859375, 0.81103515625, 0.88238525390625, 0.9537353515625, 1.02508544921875, 1.096435546875, 1.16778564453125, 1.2391357421875, 1.31048583984375, 1.3818359375, 1.45318603515625, 1.5245361328125, 1.59588623046875, 1.667236328125, 1.73858642578125, 1.8099365234375, 1.88128662109375, 1.95263671875, 2.02398681640625, 2.0953369140625, 2.16668701171875, 2.238037109375, 2.30938720703125, 2.3807373046875, 2.45208740234375, 2.5234375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 7.0, 7.0, 8.0, 7.0, 12.0, 18.0, 11.0, 17.0, 20.0, 18.0, 35.0, 53.0, 55.0, 59.0, 83.0, 90.0, 90.0, 74.0, 68.0, 62.0, 41.0, 38.0, 17.0, 25.0, 11.0, 10.0, 16.0, 11.0, 5.0, 5.0, 9.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.369140625, -3.251556396484375, -3.13397216796875, -3.016387939453125, -2.8988037109375, -2.781219482421875, -2.66363525390625, -2.546051025390625, -2.428466796875, -2.310882568359375, -2.19329833984375, -2.075714111328125, -1.9581298828125, -1.840545654296875, -1.72296142578125, -1.605377197265625, -1.48779296875, -1.370208740234375, -1.25262451171875, -1.135040283203125, -1.0174560546875, -0.899871826171875, -0.78228759765625, -0.664703369140625, -0.547119140625, -0.429534912109375, -0.31195068359375, -0.194366455078125, -0.0767822265625, 0.040802001953125, 0.15838623046875, 0.275970458984375, 0.3935546875, 0.511138916015625, 0.62872314453125, 0.746307373046875, 0.8638916015625, 0.981475830078125, 1.09906005859375, 1.216644287109375, 1.334228515625, 1.451812744140625, 1.56939697265625, 1.686981201171875, 1.8045654296875, 1.922149658203125, 2.03973388671875, 2.157318115234375, 2.27490234375, 2.392486572265625, 2.51007080078125, 2.627655029296875, 2.7452392578125, 2.862823486328125, 2.98040771484375, 3.097991943359375, 3.215576171875, 3.333160400390625, 3.45074462890625, 3.568328857421875, 3.6859130859375, 3.803497314453125, 3.92108154296875, 4.038665771484375, 4.15625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 6.0, 9.0, 21.0, 34.0, 45.0, 77.0, 165.0, 366.0, 922.0, 2475.0, 9795.0, 70095.0, 903377.0, 49757.0, 7861.0, 2128.0, 773.0, 313.0, 152.0, 70.0, 43.0, 19.0, 13.0, 9.0, 7.0, 7.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30029296875, -0.2897300720214844, -0.27916717529296875, -0.2686042785644531, -0.2580413818359375, -0.24747848510742188, -0.23691558837890625, -0.22635269165039062, -0.215789794921875, -0.20522689819335938, -0.19466400146484375, -0.18410110473632812, -0.1735382080078125, -0.16297531127929688, -0.15241241455078125, -0.14184951782226562, -0.13128662109375, -0.12072372436523438, -0.11016082763671875, -0.09959793090820312, -0.0890350341796875, -0.07847213745117188, -0.06790924072265625, -0.057346343994140625, -0.046783447265625, -0.036220550537109375, -0.02565765380859375, -0.015094757080078125, -0.0045318603515625, 0.006031036376953125, 0.01659393310546875, 0.027156829833984375, 0.0377197265625, 0.048282623291015625, 0.05884552001953125, 0.06940841674804688, 0.0799713134765625, 0.09053421020507812, 0.10109710693359375, 0.11166000366210938, 0.122222900390625, 0.13278579711914062, 0.14334869384765625, 0.15391159057617188, 0.1644744873046875, 0.17503738403320312, 0.18560028076171875, 0.19616317749023438, 0.20672607421875, 0.21728897094726562, 0.22785186767578125, 0.23841476440429688, 0.2489776611328125, 0.2595405578613281, 0.27010345458984375, 0.2806663513183594, 0.291229248046875, 0.3017921447753906, 0.31235504150390625, 0.3229179382324219, 0.3334808349609375, 0.3440437316894531, 0.35460662841796875, 0.3651695251464844, 0.375732421875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 8.0, 7.0, 12.0, 10.0, 18.0, 22.0, 39.0, 50.0, 57.0, 77.0, 132.0, 138.0, 97.0, 87.0, 62.0, 46.0, 30.0, 28.0, 14.0, 14.0, 9.0, 11.0, 8.0, 7.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.059906005859375e-05, -8.781347423791885e-05, -8.502788841724396e-05, -8.224230259656906e-05, -7.945671677589417e-05, -7.667113095521927e-05, -7.388554513454437e-05, -7.109995931386948e-05, -6.831437349319458e-05, -6.552878767251968e-05, -6.274320185184479e-05, -5.995761603116989e-05, -5.7172030210494995e-05, -5.43864443898201e-05, -5.16008585691452e-05, -4.8815272748470306e-05, -4.602968692779541e-05, -4.3244101107120514e-05, -4.045851528644562e-05, -3.767292946577072e-05, -3.4887343645095825e-05, -3.210175782442093e-05, -2.9316172003746033e-05, -2.6530586183071136e-05, -2.374500036239624e-05, -2.0959414541721344e-05, -1.8173828721046448e-05, -1.538824290037155e-05, -1.2602657079696655e-05, -9.817071259021759e-06, -7.031485438346863e-06, -4.2458996176719666e-06, -1.4603137969970703e-06, 1.325272023677826e-06, 4.110857844352722e-06, 6.896443665027618e-06, 9.682029485702515e-06, 1.2467615306377411e-05, 1.5253201127052307e-05, 1.8038786947727203e-05, 2.08243727684021e-05, 2.3609958589076996e-05, 2.6395544409751892e-05, 2.918113023042679e-05, 3.1966716051101685e-05, 3.475230187177658e-05, 3.753788769245148e-05, 4.032347351312637e-05, 4.310905933380127e-05, 4.5894645154476166e-05, 4.868023097515106e-05, 5.146581679582596e-05, 5.4251402616500854e-05, 5.703698843717575e-05, 5.982257425785065e-05, 6.260816007852554e-05, 6.539374589920044e-05, 6.817933171987534e-05, 7.096491754055023e-05, 7.375050336122513e-05, 7.653608918190002e-05, 7.932167500257492e-05, 8.210726082324982e-05, 8.489284664392471e-05, 8.767843246459961e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 2.0, 4.0, 12.0, 19.0, 36.0, 57.0, 85.0, 224.0, 397.0, 950.0, 2341.0, 7115.0, 29059.0, 219939.0, 737801.0, 37170.0, 8580.0, 2730.0, 1076.0, 482.0, 235.0, 91.0, 58.0, 36.0, 26.0, 10.0, 11.0, 2.0, 6.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.322998046875, -0.3142852783203125, -0.305572509765625, -0.2968597412109375, -0.28814697265625, -0.2794342041015625, -0.270721435546875, -0.2620086669921875, -0.2532958984375, -0.2445831298828125, -0.235870361328125, -0.2271575927734375, -0.21844482421875, -0.2097320556640625, -0.201019287109375, -0.1923065185546875, -0.18359375, -0.1748809814453125, -0.166168212890625, -0.1574554443359375, -0.14874267578125, -0.1400299072265625, -0.131317138671875, -0.1226043701171875, -0.1138916015625, -0.1051788330078125, -0.096466064453125, -0.0877532958984375, -0.07904052734375, -0.0703277587890625, -0.061614990234375, -0.0529022216796875, -0.044189453125, -0.0354766845703125, -0.026763916015625, -0.0180511474609375, -0.00933837890625, -0.0006256103515625, 0.008087158203125, 0.0167999267578125, 0.0255126953125, 0.0342254638671875, 0.042938232421875, 0.0516510009765625, 0.06036376953125, 0.0690765380859375, 0.077789306640625, 0.0865020751953125, 0.09521484375, 0.1039276123046875, 0.112640380859375, 0.1213531494140625, 0.13006591796875, 0.1387786865234375, 0.147491455078125, 0.1562042236328125, 0.1649169921875, 0.1736297607421875, 0.182342529296875, 0.1910552978515625, 0.19976806640625, 0.2084808349609375, 0.217193603515625, 0.2259063720703125, 0.234619140625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 5.0, 8.0, 7.0, 14.0, 12.0, 10.0, 14.0, 17.0, 20.0, 30.0, 38.0, 63.0, 66.0, 89.0, 114.0, 94.0, 86.0, 65.0, 56.0, 32.0, 26.0, 15.0, 20.0, 17.0, 12.0, 17.0, 7.0, 6.0, 11.0, 9.0, 2.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.317626953125, -0.3096809387207031, -0.30173492431640625, -0.2937889099121094, -0.2858428955078125, -0.2778968811035156, -0.26995086669921875, -0.2620048522949219, -0.254058837890625, -0.24611282348632812, -0.23816680908203125, -0.23022079467773438, -0.2222747802734375, -0.21432876586914062, -0.20638275146484375, -0.19843673706054688, -0.19049072265625, -0.18254470825195312, -0.17459869384765625, -0.16665267944335938, -0.1587066650390625, -0.15076065063476562, -0.14281463623046875, -0.13486862182617188, -0.126922607421875, -0.11897659301757812, -0.11103057861328125, -0.10308456420898438, -0.0951385498046875, -0.08719253540039062, -0.07924652099609375, -0.07130050659179688, -0.0633544921875, -0.055408477783203125, -0.04746246337890625, -0.039516448974609375, -0.0315704345703125, -0.023624420166015625, -0.01567840576171875, -0.007732391357421875, 0.000213623046875, 0.008159637451171875, 0.01610565185546875, 0.024051666259765625, 0.0319976806640625, 0.039943695068359375, 0.04788970947265625, 0.055835723876953125, 0.06378173828125, 0.07172775268554688, 0.07967376708984375, 0.08761978149414062, 0.0955657958984375, 0.10351181030273438, 0.11145782470703125, 0.11940383911132812, 0.127349853515625, 0.13529586791992188, 0.14324188232421875, 0.15118789672851562, 0.1591339111328125, 0.16707992553710938, 0.17502593994140625, 0.18297195434570312, 0.19091796875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 10.0, 7.0, 12.0, 14.0, 29.0, 36.0, 59.0, 190.0, 397.0, 109.0, 56.0, 33.0, 13.0, 14.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.249752044677734, -4.905951976776123, -4.562151908874512, -4.218351364135742, -3.87455153465271, -3.5307514667510986, -3.186951160430908, -2.843151092529297, -2.4993510246276855, -2.155550956726074, -1.8117507696151733, -1.4679505825042725, -1.1241505146026611, -0.7803504467010498, -0.4365501403808594, -0.09275007247924805, 0.2510499954223633, 0.5948501229286194, 0.9386502504348755, 1.2824504375457764, 1.6262505054473877, 1.970050573348999, 2.3138508796691895, 2.657650947570801, 3.001451015472412, 3.3452510833740234, 3.6890511512756348, 4.032851219177246, 4.376651763916016, 4.720451354980469, 5.064251899719238, 5.40805196762085, 5.751852035522461, 6.095652103424072, 6.439452171325684, 6.783252716064453, 7.127052307128906, 7.470852851867676, 7.814652919769287, 8.158452987670898, 8.502252578735352, 8.846053123474121, 9.189852714538574, 9.533653259277344, 9.877452850341797, 10.221253395080566, 10.565053939819336, 10.908853530883789, 11.252654075622559, 11.596454620361328, 11.940254211425781, 12.28405475616455, 12.627854347229004, 12.971654891967773, 13.315454483032227, 13.659255027770996, 14.003055572509766, 14.346856117248535, 14.690655708312988, 15.034456253051758, 15.378255844116211, 15.72205638885498, 16.06585693359375, 16.409656524658203, 16.753456115722656]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 2.0, 4.0, 8.0, 12.0, 13.0, 14.0, 14.0, 22.0, 20.0, 22.0, 26.0, 29.0, 63.0, 162.0, 218.0, 125.0, 44.0, 34.0, 31.0, 23.0, 28.0, 21.0, 9.0, 14.0, 11.0, 11.0, 4.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.462679862976074, -8.098509788513184, -7.734339237213135, -7.370168685913086, -7.005998611450195, -6.641828536987305, -6.277657985687256, -5.913487434387207, -5.549317359924316, -5.185147285461426, -4.820976734161377, -4.456806182861328, -4.0926361083984375, -3.7284657955169678, -3.364295482635498, -3.0001251697540283, -2.6359548568725586, -2.271784543991089, -1.9076142311096191, -1.5434439182281494, -1.1792736053466797, -0.81510329246521, -0.45093297958374023, -0.08676266670227051, 0.2774076461791992, 0.641577959060669, 1.0057482719421387, 1.3699185848236084, 1.7340888977050781, 2.098259210586548, 2.4624295234680176, 2.8265998363494873, 3.1907691955566406, 3.5549395084381104, 3.91910982131958, 4.283280372619629, 4.6474504470825195, 5.01162052154541, 5.375791072845459, 5.739961624145508, 6.104131698608398, 6.468301773071289, 6.832472324371338, 7.196642875671387, 7.560812950134277, 7.924983024597168, 8.289154052734375, 8.653324127197266, 9.017494201660156, 9.381664276123047, 9.745834350585938, 10.110005378723145, 10.474175453186035, 10.838345527648926, 11.202516555786133, 11.566686630249023, 11.930856704711914, 12.295026779174805, 12.659196853637695, 13.023367881774902, 13.387537956237793, 13.751708030700684, 14.11587905883789, 14.480049133300781, 14.844219207763672]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 8.0, 8.0, 6.0, 11.0, 14.0, 9.0, 16.0, 27.0, 22.0, 27.0, 34.0, 36.0, 52.0, 66.0, 230.0, 142.0, 62.0, 39.0, 27.0, 22.0, 22.0, 20.0, 19.0, 17.0, 11.0, 11.0, 10.0, 8.0, 10.0, 4.0, 7.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7275390625, -0.7023162841796875, -0.677093505859375, -0.6518707275390625, -0.62664794921875, -0.6014251708984375, -0.576202392578125, -0.5509796142578125, -0.5257568359375, -0.5005340576171875, -0.475311279296875, -0.4500885009765625, -0.42486572265625, -0.3996429443359375, -0.374420166015625, -0.3491973876953125, -0.323974609375, -0.2987518310546875, -0.273529052734375, -0.2483062744140625, -0.22308349609375, -0.1978607177734375, -0.172637939453125, -0.1474151611328125, -0.1221923828125, -0.0969696044921875, -0.071746826171875, -0.0465240478515625, -0.02130126953125, 0.0039215087890625, 0.029144287109375, 0.0543670654296875, 0.07958984375, 0.1048126220703125, 0.130035400390625, 0.1552581787109375, 0.18048095703125, 0.2057037353515625, 0.230926513671875, 0.2561492919921875, 0.2813720703125, 0.3065948486328125, 0.331817626953125, 0.3570404052734375, 0.38226318359375, 0.4074859619140625, 0.432708740234375, 0.4579315185546875, 0.483154296875, 0.5083770751953125, 0.533599853515625, 0.5588226318359375, 0.58404541015625, 0.6092681884765625, 0.634490966796875, 0.6597137451171875, 0.6849365234375, 0.7101593017578125, 0.735382080078125, 0.7606048583984375, 0.78582763671875, 0.8110504150390625, 0.836273193359375, 0.8614959716796875, 0.88671875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 5.0, 7.0, 9.0, 8.0, 8.0, 24.0, 95.0, 201.0, 679.0, 6284.0, 8370505.0, 9552.0, 835.0, 209.0, 79.0, 33.0, 20.0, 8.0, 11.0, 4.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.76881217956543, -11.247289657592773, -10.725768089294434, -10.204246520996094, -9.682723999023438, -9.161201477050781, -8.639679908752441, -8.118158340454102, -7.596635818481445, -7.075113773345947, -6.553591728210449, -6.032069683074951, -5.510547637939453, -4.989025592803955, -4.467503547668457, -3.945981502532959, -3.424459457397461, -2.902937412261963, -2.381415367126465, -1.8598933219909668, -1.3383712768554688, -0.8168492317199707, -0.29532718658447266, 0.2261948585510254, 0.7477169036865234, 1.2692389488220215, 1.7907609939575195, 2.3122830390930176, 2.8338050842285156, 3.3553271293640137, 3.8768491744995117, 4.39837121963501, 4.919893264770508, 5.441415309906006, 5.962937355041504, 6.484459400177002, 7.0059814453125, 7.527503490447998, 8.049025535583496, 8.570547103881836, 9.092069625854492, 9.613592147827148, 10.135113716125488, 10.656635284423828, 11.178157806396484, 11.69968032836914, 12.22120189666748, 12.74272346496582, 13.264245986938477, 13.785768508911133, 14.307290077209473, 14.828811645507812, 15.350334167480469, 15.871856689453125, 16.39337921142578, 16.914899826049805, 17.43642234802246, 17.957944869995117, 18.47946548461914, 19.000988006591797, 19.522510528564453, 20.04403305053711, 20.565555572509766, 21.08707618713379, 21.608598709106445]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 2.0, 4.0, 8.0, 6.0, 16.0, 14.0, 7.0, 4.0, 7.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-26.55813217163086, -25.723434448242188, -24.88873863220215, -24.054040908813477, -23.219343185424805, -22.384647369384766, -21.549949645996094, -20.715251922607422, -19.880556106567383, -19.04585838317871, -18.211162567138672, -17.37646484375, -16.541767120361328, -15.707071304321289, -14.872373580932617, -14.037676811218262, -13.20297908782959, -12.368282318115234, -11.533584594726562, -10.698887825012207, -9.864191055297852, -9.02949333190918, -8.194796562194824, -7.360099792480469, -6.525402545928955, -5.690705299377441, -4.856008529663086, -4.021311283111572, -3.1866142749786377, -2.351917266845703, -1.5172200202941895, -0.682523250579834, 0.1521739959716797, 0.986871063709259, 1.8215681314468384, 2.6562652587890625, 3.490962266921997, 4.325659275054932, 5.160356521606445, 5.995053291320801, 6.8297505378723145, 7.664447784423828, 8.499144554138184, 9.333841323852539, 10.168539047241211, 11.003235816955566, 11.837932586669922, 12.672630310058594, 13.50732707977295, 14.342023849487305, 15.176721572875977, 16.011417388916016, 16.846115112304688, 17.68081283569336, 18.51551055908203, 19.35020637512207, 20.184904098510742, 21.019601821899414, 21.854297637939453, 22.688995361328125, 23.523693084716797, 24.358388900756836, 25.193086624145508, 26.027782440185547, 26.86248016357422]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 8.0, 10.0, 15.0, 16.0, 20.0, 29.0, 52.0, 111.0, 141.0, 356.0, 823.0, 2987.0, 14777.0, 101737.0, 318769.0, 69132.0, 11343.0, 2456.0, 806.0, 327.0, 167.0, 74.0, 42.0, 22.0, 11.0, 11.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-15.09375, -14.7200927734375, -14.346435546875, -13.9727783203125, -13.59912109375, -13.2254638671875, -12.851806640625, -12.4781494140625, -12.1044921875, -11.7308349609375, -11.357177734375, -10.9835205078125, -10.60986328125, -10.2362060546875, -9.862548828125, -9.4888916015625, -9.115234375, -8.7415771484375, -8.367919921875, -7.9942626953125, -7.62060546875, -7.2469482421875, -6.873291015625, -6.4996337890625, -6.1259765625, -5.7523193359375, -5.378662109375, -5.0050048828125, -4.63134765625, -4.2576904296875, -3.884033203125, -3.5103759765625, -3.13671875, -2.7630615234375, -2.389404296875, -2.0157470703125, -1.64208984375, -1.2684326171875, -0.894775390625, -0.5211181640625, -0.1474609375, 0.2261962890625, 0.599853515625, 0.9735107421875, 1.34716796875, 1.7208251953125, 2.094482421875, 2.4681396484375, 2.841796875, 3.2154541015625, 3.589111328125, 3.9627685546875, 4.33642578125, 4.7100830078125, 5.083740234375, 5.4573974609375, 5.8310546875, 6.2047119140625, 6.578369140625, 6.9520263671875, 7.32568359375, 7.6993408203125, 8.072998046875, 8.4466552734375, 8.8203125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 5.0, 4.0, 5.0, 10.0, 6.0, 7.0, 13.0, 19.0, 18.0, 24.0, 26.0, 44.0, 41.0, 57.0, 70.0, 69.0, 63.0, 66.0, 72.0, 71.0, 67.0, 50.0, 45.0, 32.0, 26.0, 16.0, 20.0, 14.0, 12.0, 7.0, 9.0, 2.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7119140625, -0.6813812255859375, -0.650848388671875, -0.6203155517578125, -0.58978271484375, -0.5592498779296875, -0.528717041015625, -0.4981842041015625, -0.4676513671875, -0.4371185302734375, -0.406585693359375, -0.3760528564453125, -0.34552001953125, -0.3149871826171875, -0.284454345703125, -0.2539215087890625, -0.223388671875, -0.1928558349609375, -0.162322998046875, -0.1317901611328125, -0.10125732421875, -0.0707244873046875, -0.040191650390625, -0.0096588134765625, 0.0208740234375, 0.0514068603515625, 0.081939697265625, 0.1124725341796875, 0.14300537109375, 0.1735382080078125, 0.204071044921875, 0.2346038818359375, 0.26513671875, 0.2956695556640625, 0.326202392578125, 0.3567352294921875, 0.38726806640625, 0.4178009033203125, 0.448333740234375, 0.4788665771484375, 0.5093994140625, 0.5399322509765625, 0.570465087890625, 0.6009979248046875, 0.63153076171875, 0.6620635986328125, 0.692596435546875, 0.7231292724609375, 0.753662109375, 0.7841949462890625, 0.814727783203125, 0.8452606201171875, 0.87579345703125, 0.9063262939453125, 0.936859130859375, 0.9673919677734375, 0.9979248046875, 1.0284576416015625, 1.058990478515625, 1.0895233154296875, 1.12005615234375, 1.1505889892578125, 1.181121826171875, 1.2116546630859375, 1.2421875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 4.0, 8.0, 9.0, 7.0, 16.0, 24.0, 42.0, 56.0, 73.0, 71.0, 62.0, 35.0, 25.0, 15.0, 11.0, 6.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.150140762329102, -6.939509391784668, -6.728878021240234, -6.518246650695801, -6.307615756988525, -6.096984386444092, -5.886353015899658, -5.675721645355225, -5.465090751647949, -5.254459381103516, -5.043828010559082, -4.833196640014648, -4.622565746307373, -4.4119343757629395, -4.201303005218506, -3.9906716346740723, -3.7800402641296387, -3.569408893585205, -3.3587777614593506, -3.148146390914917, -2.9375152587890625, -2.726883888244629, -2.5162525177001953, -2.3056211471557617, -2.0949900150299072, -1.8843587636947632, -1.6737275123596191, -1.4630961418151855, -1.2524648904800415, -1.0418336391448975, -0.8312022686004639, -0.6205710172653198, -0.4099392890930176, -0.19930800795555115, 0.011323273181915283, 0.2219545841217041, 0.43258583545684814, 0.6432170867919922, 0.8538484573364258, 1.0644797086715698, 1.2751109600067139, 1.485742211341858, 1.696373462677002, 1.9070048332214355, 2.117636203765869, 2.3282673358917236, 2.5388987064361572, 2.7495298385620117, 2.9601612091064453, 3.170792579650879, 3.3814237117767334, 3.592055082321167, 3.8026862144470215, 4.013317584991455, 4.223948955535889, 4.434580326080322, 4.645211219787598, 4.855842590332031, 5.066473960876465, 5.277105331420898, 5.487736225128174, 5.698367595672607, 5.908998966217041, 6.119630336761475, 6.330261707305908]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 8.0, 5.0, 6.0, 8.0, 11.0, 10.0, 26.0, 27.0, 50.0, 60.0, 75.0, 61.0, 48.0, 23.0, 14.0, 15.0, 11.0, 1.0, 6.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.011608600616455, -4.856748580932617, -4.7018890380859375, -4.5470290184021, -4.392168998718262, -4.237309455871582, -4.082449436187744, -3.9275896549224854, -3.7727298736572266, -3.6178700923919678, -3.463010311126709, -3.308150291442871, -3.1532905101776123, -2.9984307289123535, -2.8435707092285156, -2.688710927963257, -2.533851146697998, -2.3789913654327393, -2.2241315841674805, -2.0692715644836426, -1.9144117832183838, -1.759552001953125, -1.6046921014785767, -1.4498322010040283, -1.2949724197387695, -1.1401126384735107, -0.9852527379989624, -0.8303928971290588, -0.6755330562591553, -0.5206732153892517, -0.36581337451934814, -0.2109534740447998, -0.05609416961669922, 0.09876567125320435, 0.2536255121231079, 0.4084853529930115, 0.563345193862915, 0.7182050347328186, 0.8730648756027222, 1.0279247760772705, 1.1827845573425293, 1.337644338607788, 1.4925042390823364, 1.6473641395568848, 1.8022239208221436, 1.9570837020874023, 2.1119437217712402, 2.266803503036499, 2.421663284301758, 2.5765230655670166, 2.7313828468322754, 2.8862428665161133, 3.041102647781372, 3.195962429046631, 3.3508224487304688, 3.5056822299957275, 3.6605420112609863, 3.815401792526245, 3.970261573791504, 4.125121593475342, 4.27998161315918, 4.434841156005859, 4.589701175689697, 4.744561195373535, 4.899420738220215]}, "eval/loss": 1.8155099153518677, "eval/wer": 1.0577746925823086, "eval/runtime": 923.6212, "eval/samples_per_second": 2.86, "eval/steps_per_second": 0.358} \ No newline at end of file +{"train/loss": 0.0081, "train/learning_rate": 4.658551068883611e-05, "train/epoch": 11.21, "train/global_step": 10000, "_runtime": 61682, "_timestamp": 1646643229, "_step": 10003, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 37.0, 117.0, 352.0, 363.0, 110.0, 30.0, 7.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.77510070800781, -60.67342758178711, -59.571754455566406, -58.47008514404297, -57.368412017822266, -56.26673889160156, -55.16506576538086, -54.063392639160156, -52.96172332763672, -51.860050201416016, -50.75837707519531, -49.656707763671875, -48.55503463745117, -47.45336151123047, -46.351688385009766, -45.25001525878906, -44.14834213256836, -43.046669006347656, -41.94499588012695, -40.843326568603516, -39.74165344238281, -38.63998031616211, -37.538307189941406, -36.4366340637207, -35.3349609375, -34.2332878112793, -33.131614685058594, -32.029945373535156, -30.928272247314453, -29.82659912109375, -28.724925994873047, -27.623252868652344, -26.521587371826172, -25.41991424560547, -24.3182430267334, -23.216569900512695, -22.114898681640625, -21.013225555419922, -19.91155242919922, -18.809879302978516, -17.708206176757812, -16.60653305053711, -15.504861831665039, -14.403188705444336, -13.30151653289795, -12.199844360351562, -11.09817123413086, -9.996499061584473, -8.894827842712402, -7.793155670166016, -6.691483020782471, -5.589810371398926, -4.488138198852539, -3.3864660263061523, -2.2847933769226074, -1.1831207275390625, -0.08144855499267578, 1.02022385597229, 2.121896266937256, 3.2235686779022217, 4.3252410888671875, 5.426913261413574, 6.528585910797119, 7.630258560180664, 8.73193073272705]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 7.0, 7.0, 13.0, 10.0, 17.0, 34.0, 29.0, 30.0, 49.0, 54.0, 52.0, 76.0, 74.0, 69.0, 72.0, 51.0, 74.0, 66.0, 54.0, 42.0, 30.0, 25.0, 20.0, 18.0, 16.0, 11.0, 8.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0779619216918945, -3.8481321334838867, -3.6183021068573, -3.388472080230713, -3.158642292022705, -2.9288125038146973, -2.6989824771881104, -2.4691524505615234, -2.2393226623535156, -2.009492874145508, -1.779662847518921, -1.5498329401016235, -1.3200030326843262, -1.0901731252670288, -0.8603432178497314, -0.6305133104324341, -0.4006834030151367, -0.17085349559783936, 0.05897641181945801, 0.28880631923675537, 0.5186362266540527, 0.7484661340713501, 0.9782960414886475, 1.2081259489059448, 1.4379558563232422, 1.6677857637405396, 1.897615671157837, 2.127445697784424, 2.3572754859924316, 2.5871052742004395, 2.8169353008270264, 3.0467653274536133, 3.276595115661621, 3.506424903869629, 3.736254930496216, 3.9660849571228027, 4.1959147453308105, 4.425744533538818, 4.655574798583984, 4.885404586791992, 5.115234375, 5.345064163208008, 5.574893951416016, 5.804724216461182, 6.0345540046691895, 6.264383792877197, 6.494214057922363, 6.724043846130371, 6.953873634338379, 7.183703422546387, 7.4135332107543945, 7.6433634757995605, 7.873193264007568, 8.103023529052734, 8.332853317260742, 8.56268310546875, 8.792512893676758, 9.022342681884766, 9.252172470092773, 9.482002258300781, 9.711832046508789, 9.941662788391113, 10.171492576599121, 10.401322364807129, 10.631152153015137]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 10.0, 4.0, 5.0, 13.0, 10.0, 13.0, 14.0, 21.0, 19.0, 27.0, 26.0, 40.0, 45.0, 37.0, 34.0, 59.0, 49.0, 51.0, 43.0, 46.0, 49.0, 40.0, 51.0, 51.0, 30.0, 38.0, 32.0, 28.0, 25.0, 17.0, 16.0, 14.0, 19.0, 10.0, 7.0, 3.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.398681640625, -0.3836631774902344, -0.36864471435546875, -0.3536262512207031, -0.3386077880859375, -0.3235893249511719, -0.30857086181640625, -0.2935523986816406, -0.278533935546875, -0.2635154724121094, -0.24849700927734375, -0.23347854614257812, -0.2184600830078125, -0.20344161987304688, -0.18842315673828125, -0.17340469360351562, -0.15838623046875, -0.14336776733398438, -0.12834930419921875, -0.11333084106445312, -0.0983123779296875, -0.08329391479492188, -0.06827545166015625, -0.053256988525390625, -0.038238525390625, -0.023220062255859375, -0.00820159912109375, 0.006816864013671875, 0.0218353271484375, 0.036853790283203125, 0.05187225341796875, 0.06689071655273438, 0.0819091796875, 0.09692764282226562, 0.11194610595703125, 0.12696456909179688, 0.1419830322265625, 0.15700149536132812, 0.17201995849609375, 0.18703842163085938, 0.202056884765625, 0.21707534790039062, 0.23209381103515625, 0.24711227416992188, 0.2621307373046875, 0.2771492004394531, 0.29216766357421875, 0.3071861267089844, 0.32220458984375, 0.3372230529785156, 0.35224151611328125, 0.3672599792480469, 0.3822784423828125, 0.3972969055175781, 0.41231536865234375, 0.4273338317871094, 0.442352294921875, 0.4573707580566406, 0.47238922119140625, 0.4874076843261719, 0.5024261474609375, 0.5174446105957031, 0.5324630737304688, 0.5474815368652344, 0.5625]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 5.0, 6.0, 13.0, 19.0, 21.0, 15.0, 24.0, 27.0, 44.0, 59.0, 53.0, 71.0, 85.0, 125.0, 182.0, 263.0, 437.0, 767.0, 1844.0, 5313.0, 20728.0, 113288.0, 2925715.0, 1023462.0, 78213.0, 15533.0, 4258.0, 1518.0, 701.0, 386.0, 291.0, 193.0, 132.0, 102.0, 82.0, 65.0, 54.0, 54.0, 28.0, 29.0, 23.0, 14.0, 9.0, 12.0, 7.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.31640625, -4.18109130859375, -4.0457763671875, -3.91046142578125, -3.775146484375, -3.63983154296875, -3.5045166015625, -3.36920166015625, -3.23388671875, -3.09857177734375, -2.9632568359375, -2.82794189453125, -2.692626953125, -2.55731201171875, -2.4219970703125, -2.28668212890625, -2.1513671875, -2.01605224609375, -1.8807373046875, -1.74542236328125, -1.610107421875, -1.47479248046875, -1.3394775390625, -1.20416259765625, -1.06884765625, -0.93353271484375, -0.7982177734375, -0.66290283203125, -0.527587890625, -0.39227294921875, -0.2569580078125, -0.12164306640625, 0.013671875, 0.14898681640625, 0.2843017578125, 0.41961669921875, 0.554931640625, 0.69024658203125, 0.8255615234375, 0.96087646484375, 1.09619140625, 1.23150634765625, 1.3668212890625, 1.50213623046875, 1.637451171875, 1.77276611328125, 1.9080810546875, 2.04339599609375, 2.1787109375, 2.31402587890625, 2.4493408203125, 2.58465576171875, 2.719970703125, 2.85528564453125, 2.9906005859375, 3.12591552734375, 3.26123046875, 3.39654541015625, 3.5318603515625, 3.66717529296875, 3.802490234375, 3.93780517578125, 4.0731201171875, 4.20843505859375, 4.34375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 11.0, 19.0, 41.0, 43.0, 81.0, 132.0, 195.0, 328.0, 666.0, 1174.0, 545.0, 313.0, 187.0, 129.0, 88.0, 36.0, 26.0, 22.0, 11.0, 7.0, 5.0, 5.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2265625, -2.135284423828125, -2.04400634765625, -1.952728271484375, -1.8614501953125, -1.770172119140625, -1.67889404296875, -1.587615966796875, -1.496337890625, -1.405059814453125, -1.31378173828125, -1.222503662109375, -1.1312255859375, -1.039947509765625, -0.94866943359375, -0.857391357421875, -0.76611328125, -0.674835205078125, -0.58355712890625, -0.492279052734375, -0.4010009765625, -0.309722900390625, -0.21844482421875, -0.127166748046875, -0.035888671875, 0.055389404296875, 0.14666748046875, 0.237945556640625, 0.3292236328125, 0.420501708984375, 0.51177978515625, 0.603057861328125, 0.6943359375, 0.785614013671875, 0.87689208984375, 0.968170166015625, 1.0594482421875, 1.150726318359375, 1.24200439453125, 1.333282470703125, 1.424560546875, 1.515838623046875, 1.60711669921875, 1.698394775390625, 1.7896728515625, 1.880950927734375, 1.97222900390625, 2.063507080078125, 2.15478515625, 2.246063232421875, 2.33734130859375, 2.428619384765625, 2.5198974609375, 2.611175537109375, 2.70245361328125, 2.793731689453125, 2.885009765625, 2.976287841796875, 3.06756591796875, 3.158843994140625, 3.2501220703125, 3.341400146484375, 3.43267822265625, 3.523956298828125, 3.615234375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 10.0, 14.0, 21.0, 56.0, 71.0, 139.0, 262.0, 551.0, 1431.0, 5996.0, 43828.0, 838772.0, 3197180.0, 92146.0, 10179.0, 2178.0, 703.0, 311.0, 182.0, 114.0, 54.0, 28.0, 20.0, 9.0, 11.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.8046875, -8.491943359375, -8.17919921875, -7.866455078125, -7.5537109375, -7.240966796875, -6.92822265625, -6.615478515625, -6.302734375, -5.989990234375, -5.67724609375, -5.364501953125, -5.0517578125, -4.739013671875, -4.42626953125, -4.113525390625, -3.80078125, -3.488037109375, -3.17529296875, -2.862548828125, -2.5498046875, -2.237060546875, -1.92431640625, -1.611572265625, -1.298828125, -0.986083984375, -0.67333984375, -0.360595703125, -0.0478515625, 0.264892578125, 0.57763671875, 0.890380859375, 1.203125, 1.515869140625, 1.82861328125, 2.141357421875, 2.4541015625, 2.766845703125, 3.07958984375, 3.392333984375, 3.705078125, 4.017822265625, 4.33056640625, 4.643310546875, 4.9560546875, 5.268798828125, 5.58154296875, 5.894287109375, 6.20703125, 6.519775390625, 6.83251953125, 7.145263671875, 7.4580078125, 7.770751953125, 8.08349609375, 8.396240234375, 8.708984375, 9.021728515625, 9.33447265625, 9.647216796875, 9.9599609375, 10.272705078125, 10.58544921875, 10.898193359375, 11.2109375]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 12.0, 48.0, 107.0, 215.0, 256.0, 183.0, 100.0, 44.0, 27.0, 11.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.49657440185547, -22.79437255859375, -22.0921688079834, -21.38996696472168, -20.687763214111328, -19.98556137084961, -19.28335952758789, -18.581157684326172, -17.87895393371582, -17.1767520904541, -16.47454833984375, -15.772346496582031, -15.070143699645996, -14.367940902709961, -13.665739059448242, -12.963536262512207, -12.261333465576172, -11.559130668640137, -10.856927871704102, -10.154726028442383, -9.452523231506348, -8.750320434570312, -8.048118591308594, -7.345915794372559, -6.643712997436523, -5.941510200500488, -5.239307880401611, -4.537105560302734, -3.834902763366699, -3.132700204849243, -2.430497646331787, -1.7282953262329102, -1.0260944366455078, -0.32389187812805176, 0.3783106803894043, 1.0805132389068604, 1.7827157974243164, 2.4849183559417725, 3.1871209144592285, 3.8893232345581055, 4.591526031494141, 5.293728828430176, 5.995931148529053, 6.69813346862793, 7.400336265563965, 8.1025390625, 8.804740905761719, 9.506943702697754, 10.209146499633789, 10.911349296569824, 11.61355209350586, 12.315753936767578, 13.017956733703613, 13.720159530639648, 14.422361373901367, 15.124564170837402, 15.826766967773438, 16.528968811035156, 17.231172561645508, 17.933374404907227, 18.635578155517578, 19.337779998779297, 20.039981842041016, 20.742183685302734, 21.444387435913086]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 14.0, 16.0, 15.0, 25.0, 25.0, 41.0, 44.0, 38.0, 48.0, 69.0, 67.0, 77.0, 56.0, 54.0, 57.0, 53.0, 54.0, 46.0, 57.0, 42.0, 23.0, 31.0, 13.0, 14.0, 13.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.123873710632324, -11.831490516662598, -11.539107322692871, -11.246724128723145, -10.954339981079102, -10.661956787109375, -10.369573593139648, -10.077190399169922, -9.784807205200195, -9.492424011230469, -9.200040817260742, -8.907657623291016, -8.615274429321289, -8.322890281677246, -8.03050708770752, -7.738123893737793, -7.445740699768066, -7.15335750579834, -6.860974311828613, -6.5685906410217285, -6.276207447052002, -5.983824253082275, -5.691440582275391, -5.399057388305664, -5.1066741943359375, -4.814291000366211, -4.521907806396484, -4.2295241355896, -3.937140941619873, -3.6447577476501465, -3.352374315261841, -3.059990882873535, -2.767608642578125, -2.4752254486083984, -2.1828420162200928, -1.8904587030410767, -1.5980753898620605, -1.3056920766830444, -1.0133087635040283, -0.7209253311157227, -0.4285421371459961, -0.13615882396697998, 0.15622448921203613, 0.44860780239105225, 0.7409911155700684, 1.0333744287490845, 1.3257577419281006, 1.6181411743164062, 1.9105243682861328, 2.2029075622558594, 2.495290994644165, 2.7876744270324707, 3.0800576210021973, 3.372440814971924, 3.6648242473602295, 3.957207679748535, 4.249590873718262, 4.541974067687988, 4.834357261657715, 5.1267409324646, 5.419124126434326, 5.711507320404053, 6.0038909912109375, 6.296274185180664, 6.588657379150391]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 2.0, 5.0, 5.0, 6.0, 7.0, 8.0, 17.0, 13.0, 21.0, 21.0, 26.0, 27.0, 25.0, 33.0, 38.0, 38.0, 43.0, 48.0, 31.0, 42.0, 40.0, 35.0, 44.0, 51.0, 38.0, 33.0, 34.0, 39.0, 49.0, 29.0, 24.0, 14.0, 23.0, 24.0, 11.0, 10.0, 11.0, 14.0, 3.0, 6.0, 7.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.479248046875, -0.4646568298339844, -0.45006561279296875, -0.4354743957519531, -0.4208831787109375, -0.4062919616699219, -0.39170074462890625, -0.3771095275878906, -0.362518310546875, -0.3479270935058594, -0.33333587646484375, -0.3187446594238281, -0.3041534423828125, -0.2895622253417969, -0.27497100830078125, -0.2603797912597656, -0.24578857421875, -0.23119735717773438, -0.21660614013671875, -0.20201492309570312, -0.1874237060546875, -0.17283248901367188, -0.15824127197265625, -0.14365005493164062, -0.129058837890625, -0.11446762084960938, -0.09987640380859375, -0.08528518676757812, -0.0706939697265625, -0.056102752685546875, -0.04151153564453125, -0.026920318603515625, -0.0123291015625, 0.002262115478515625, 0.01685333251953125, 0.031444549560546875, 0.0460357666015625, 0.060626983642578125, 0.07521820068359375, 0.08980941772460938, 0.104400634765625, 0.11899185180664062, 0.13358306884765625, 0.14817428588867188, 0.1627655029296875, 0.17735671997070312, 0.19194793701171875, 0.20653915405273438, 0.22113037109375, 0.23572158813476562, 0.25031280517578125, 0.2649040222167969, 0.2794952392578125, 0.2940864562988281, 0.30867767333984375, 0.3232688903808594, 0.337860107421875, 0.3524513244628906, 0.36704254150390625, 0.3816337585449219, 0.3962249755859375, 0.4108161926269531, 0.42540740966796875, 0.4399986267089844, 0.45458984375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 6.0, 3.0, 9.0, 15.0, 25.0, 41.0, 78.0, 150.0, 260.0, 541.0, 1173.0, 2475.0, 5615.0, 13835.0, 39941.0, 144488.0, 448955.0, 279631.0, 72693.0, 22911.0, 8665.0, 3776.0, 1662.0, 774.0, 376.0, 202.0, 108.0, 49.0, 33.0, 14.0, 11.0, 13.0, 6.0, 4.0, 3.0, 1.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.45703125, -0.44055938720703125, -0.4240875244140625, -0.40761566162109375, -0.391143798828125, -0.37467193603515625, -0.3582000732421875, -0.34172821044921875, -0.32525634765625, -0.30878448486328125, -0.2923126220703125, -0.27584075927734375, -0.259368896484375, -0.24289703369140625, -0.2264251708984375, -0.20995330810546875, -0.1934814453125, -0.17700958251953125, -0.1605377197265625, -0.14406585693359375, -0.127593994140625, -0.11112213134765625, -0.0946502685546875, -0.07817840576171875, -0.06170654296875, -0.04523468017578125, -0.0287628173828125, -0.01229095458984375, 0.004180908203125, 0.02065277099609375, 0.0371246337890625, 0.05359649658203125, 0.070068359375, 0.08654022216796875, 0.1030120849609375, 0.11948394775390625, 0.135955810546875, 0.15242767333984375, 0.1688995361328125, 0.18537139892578125, 0.20184326171875, 0.21831512451171875, 0.2347869873046875, 0.25125885009765625, 0.267730712890625, 0.28420257568359375, 0.3006744384765625, 0.31714630126953125, 0.3336181640625, 0.35009002685546875, 0.3665618896484375, 0.38303375244140625, 0.399505615234375, 0.41597747802734375, 0.4324493408203125, 0.44892120361328125, 0.46539306640625, 0.48186492919921875, 0.4983367919921875, 0.5148086547851562, 0.531280517578125, 0.5477523803710938, 0.5642242431640625, 0.5806961059570312, 0.59716796875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 6.0, 6.0, 8.0, 6.0, 6.0, 11.0, 10.0, 16.0, 15.0, 20.0, 19.0, 25.0, 22.0, 25.0, 28.0, 34.0, 34.0, 34.0, 35.0, 46.0, 47.0, 36.0, 1069.0, 45.0, 38.0, 35.0, 35.0, 31.0, 37.0, 30.0, 28.0, 28.0, 26.0, 29.0, 21.0, 13.0, 14.0, 15.0, 12.0, 4.0, 10.0, 7.0, 10.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.485595703125, -0.4719963073730469, -0.45839691162109375, -0.4447975158691406, -0.4311981201171875, -0.4175987243652344, -0.40399932861328125, -0.3903999328613281, -0.376800537109375, -0.3632011413574219, -0.34960174560546875, -0.3360023498535156, -0.3224029541015625, -0.3088035583496094, -0.29520416259765625, -0.2816047668457031, -0.26800537109375, -0.2544059753417969, -0.24080657958984375, -0.22720718383789062, -0.2136077880859375, -0.20000839233398438, -0.18640899658203125, -0.17280960083007812, -0.159210205078125, -0.14561080932617188, -0.13201141357421875, -0.11841201782226562, -0.1048126220703125, -0.09121322631835938, -0.07761383056640625, -0.06401443481445312, -0.0504150390625, -0.036815643310546875, -0.02321624755859375, -0.009616851806640625, 0.0039825439453125, 0.017581939697265625, 0.03118133544921875, 0.044780731201171875, 0.058380126953125, 0.07197952270507812, 0.08557891845703125, 0.09917831420898438, 0.1127777099609375, 0.12637710571289062, 0.13997650146484375, 0.15357589721679688, 0.16717529296875, 0.18077468872070312, 0.19437408447265625, 0.20797348022460938, 0.2215728759765625, 0.23517227172851562, 0.24877166748046875, 0.2623710632324219, 0.275970458984375, 0.2895698547363281, 0.30316925048828125, 0.3167686462402344, 0.3303680419921875, 0.3439674377441406, 0.35756683349609375, 0.3711662292480469, 0.384765625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 8.0, 3.0, 9.0, 12.0, 17.0, 24.0, 35.0, 61.0, 70.0, 111.0, 178.0, 324.0, 541.0, 1038.0, 2061.0, 4297.0, 10658.0, 33149.0, 203895.0, 1621687.0, 171018.0, 29803.0, 9735.0, 4210.0, 1831.0, 1003.0, 536.0, 271.0, 187.0, 113.0, 71.0, 53.0, 33.0, 23.0, 15.0, 11.0, 8.0, 7.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.462158203125, -0.4469871520996094, -0.43181610107421875, -0.4166450500488281, -0.4014739990234375, -0.3863029479980469, -0.37113189697265625, -0.3559608459472656, -0.340789794921875, -0.3256187438964844, -0.31044769287109375, -0.2952766418457031, -0.2801055908203125, -0.2649345397949219, -0.24976348876953125, -0.23459243774414062, -0.21942138671875, -0.20425033569335938, -0.18907928466796875, -0.17390823364257812, -0.1587371826171875, -0.14356613159179688, -0.12839508056640625, -0.11322402954101562, -0.098052978515625, -0.08288192749023438, -0.06771087646484375, -0.052539825439453125, -0.0373687744140625, -0.022197723388671875, -0.00702667236328125, 0.008144378662109375, 0.0233154296875, 0.038486480712890625, 0.05365753173828125, 0.06882858276367188, 0.0839996337890625, 0.09917068481445312, 0.11434173583984375, 0.12951278686523438, 0.144683837890625, 0.15985488891601562, 0.17502593994140625, 0.19019699096679688, 0.2053680419921875, 0.22053909301757812, 0.23571014404296875, 0.2508811950683594, 0.26605224609375, 0.2812232971191406, 0.29639434814453125, 0.3115653991699219, 0.3267364501953125, 0.3419075012207031, 0.35707855224609375, 0.3722496032714844, 0.387420654296875, 0.4025917053222656, 0.41776275634765625, 0.4329338073730469, 0.4481048583984375, 0.4632759094238281, 0.47844696044921875, 0.4936180114746094, 0.5087890625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 4.0, 3.0, 3.0, 6.0, 11.0, 7.0, 14.0, 15.0, 9.0, 6.0, 18.0, 32.0, 56.0, 156.0, 246.0, 157.0, 99.0, 39.0, 20.0, 11.0, 12.0, 7.0, 11.0, 4.0, 4.0, 3.0, 1.0, 4.0, 4.0, 6.0, 8.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1343994140625, -0.13028717041015625, -0.1261749267578125, -0.12206268310546875, -0.117950439453125, -0.11383819580078125, -0.1097259521484375, -0.10561370849609375, -0.10150146484375, -0.09738922119140625, -0.0932769775390625, -0.08916473388671875, -0.085052490234375, -0.08094024658203125, -0.0768280029296875, -0.07271575927734375, -0.068603515625, -0.06449127197265625, -0.0603790283203125, -0.05626678466796875, -0.052154541015625, -0.04804229736328125, -0.0439300537109375, -0.03981781005859375, -0.03570556640625, -0.03159332275390625, -0.0274810791015625, -0.02336883544921875, -0.019256591796875, -0.01514434814453125, -0.0110321044921875, -0.00691986083984375, -0.0028076171875, 0.00130462646484375, 0.0054168701171875, 0.00952911376953125, 0.013641357421875, 0.01775360107421875, 0.0218658447265625, 0.02597808837890625, 0.03009033203125, 0.03420257568359375, 0.0383148193359375, 0.04242706298828125, 0.046539306640625, 0.05065155029296875, 0.0547637939453125, 0.05887603759765625, 0.06298828125, 0.06710052490234375, 0.0712127685546875, 0.07532501220703125, 0.079437255859375, 0.08354949951171875, 0.0876617431640625, 0.09177398681640625, 0.09588623046875, 0.09999847412109375, 0.1041107177734375, 0.10822296142578125, 0.112335205078125, 0.11644744873046875, 0.1205596923828125, 0.12467193603515625, 0.1287841796875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 9.0, 8.0, 7.0, 7.0, 4.0, 6.0, 9.0, 13.0, 9.0, 23.0, 34.0, 25.0, 25.0, 51.0, 76.0, 85.0, 202.0, 814.0, 12426.0, 981176.0, 50717.0, 2108.0, 284.0, 113.0, 85.0, 46.0, 34.0, 21.0, 19.0, 9.0, 13.0, 11.0, 11.0, 13.0, 15.0, 12.0, 10.0, 3.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.28125, -2.21148681640625, -2.1417236328125, -2.07196044921875, -2.002197265625, -1.93243408203125, -1.8626708984375, -1.79290771484375, -1.72314453125, -1.65338134765625, -1.5836181640625, -1.51385498046875, -1.444091796875, -1.37432861328125, -1.3045654296875, -1.23480224609375, -1.1650390625, -1.09527587890625, -1.0255126953125, -0.95574951171875, -0.885986328125, -0.81622314453125, -0.7464599609375, -0.67669677734375, -0.60693359375, -0.53717041015625, -0.4674072265625, -0.39764404296875, -0.327880859375, -0.25811767578125, -0.1883544921875, -0.11859130859375, -0.048828125, 0.02093505859375, 0.0906982421875, 0.16046142578125, 0.230224609375, 0.29998779296875, 0.3697509765625, 0.43951416015625, 0.50927734375, 0.57904052734375, 0.6488037109375, 0.71856689453125, 0.788330078125, 0.85809326171875, 0.9278564453125, 0.99761962890625, 1.0673828125, 1.13714599609375, 1.2069091796875, 1.27667236328125, 1.346435546875, 1.41619873046875, 1.4859619140625, 1.55572509765625, 1.62548828125, 1.69525146484375, 1.7650146484375, 1.83477783203125, 1.904541015625, 1.97430419921875, 2.0440673828125, 2.11383056640625, 2.18359375]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 8.0, 9.0, 29.0, 76.0, 234.0, 399.0, 160.0, 67.0, 15.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9286573529243469, -0.8999905586242676, -0.8713237047195435, -0.8426569104194641, -0.8139901161193848, -0.7853232622146606, -0.7566564679145813, -0.727989673614502, -0.6993228197097778, -0.6706560254096985, -0.6419891715049744, -0.613322377204895, -0.5846555829048157, -0.5559887886047363, -0.5273219347000122, -0.49865514039993286, -0.4699883460998535, -0.4413215219974518, -0.41265472769737244, -0.3839879035949707, -0.35532110929489136, -0.3266542851924896, -0.2979874610900879, -0.26932066679000854, -0.2406538426876068, -0.21198703348636627, -0.18332022428512573, -0.154653400182724, -0.12598659098148346, -0.09731978178024292, -0.06865295767784119, -0.03998614847660065, -0.011319339275360107, 0.01734747365117073, 0.04601428657770157, 0.0746811032295227, 0.10334791243076324, 0.13201472163200378, 0.16068154573440552, 0.18934835493564606, 0.2180151641368866, 0.24668197333812714, 0.2753487825393677, 0.3040156066417694, 0.33268243074417114, 0.3613492250442505, 0.3900160491466522, 0.41868287324905396, 0.4473496675491333, 0.47601649165153503, 0.5046833157539368, 0.5333501100540161, 0.5620169043540955, 0.5906836986541748, 0.6193505525588989, 0.6480173468589783, 0.6766841411590576, 0.705350935459137, 0.7340177893638611, 0.7626845836639404, 0.7913513779640198, 0.8200181722640991, 0.8486850261688232, 0.8773518204689026, 0.9060186743736267]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 1.0, 2.0, 7.0, 6.0, 7.0, 9.0, 13.0, 14.0, 10.0, 13.0, 19.0, 21.0, 19.0, 25.0, 23.0, 24.0, 32.0, 29.0, 38.0, 43.0, 47.0, 51.0, 37.0, 43.0, 40.0, 49.0, 53.0, 39.0, 32.0, 32.0, 37.0, 23.0, 29.0, 27.0, 20.0, 20.0, 13.0, 13.0, 8.0, 5.0, 2.0, 6.0, 5.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22881704568862915, -0.22143736481666565, -0.21405768394470215, -0.20667800307273865, -0.19929832220077515, -0.19191864132881165, -0.18453896045684814, -0.17715927958488464, -0.16977959871292114, -0.16239991784095764, -0.15502023696899414, -0.14764055609703064, -0.14026087522506714, -0.13288119435310364, -0.12550151348114014, -0.11812182515859604, -0.11074213683605194, -0.10336245596408844, -0.09598277509212494, -0.08860309422016144, -0.08122341334819794, -0.07384373247623444, -0.06646404415369034, -0.05908436328172684, -0.051704682409763336, -0.044325001537799835, -0.036945320665836334, -0.029565636068582535, -0.022185955196619034, -0.014806274324655533, -0.007426589727401733, -4.690885543823242e-05, 0.0073327720165252686, 0.014712453819811344, 0.02209213562309742, 0.02947181835770607, 0.03685149922966957, 0.04423118010163307, 0.05161086469888687, 0.05899054557085037, 0.06637022644281387, 0.07374990731477737, 0.08112958818674088, 0.08850927650928497, 0.09588895738124847, 0.10326863825321198, 0.11064831912517548, 0.11802799999713898, 0.12540768086910248, 0.13278736174106598, 0.14016704261302948, 0.14754672348499298, 0.15492640435695648, 0.16230608522891998, 0.16968578100204468, 0.17706546187400818, 0.18444514274597168, 0.19182482361793518, 0.19920450448989868, 0.20658418536186218, 0.21396386623382568, 0.22134354710578918, 0.22872322797775269, 0.2361029088497162, 0.2434825897216797]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 4.0, 6.0, 4.0, 10.0, 6.0, 12.0, 17.0, 16.0, 21.0, 30.0, 24.0, 30.0, 30.0, 42.0, 35.0, 47.0, 45.0, 30.0, 47.0, 41.0, 35.0, 43.0, 52.0, 39.0, 33.0, 36.0, 39.0, 44.0, 29.0, 27.0, 13.0, 27.0, 22.0, 12.0, 6.0, 13.0, 10.0, 6.0, 6.0, 4.0, 0.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.485595703125, -0.4707984924316406, -0.45600128173828125, -0.4412040710449219, -0.4264068603515625, -0.4116096496582031, -0.39681243896484375, -0.3820152282714844, -0.367218017578125, -0.3524208068847656, -0.33762359619140625, -0.3228263854980469, -0.3080291748046875, -0.2932319641113281, -0.27843475341796875, -0.2636375427246094, -0.24884033203125, -0.23404312133789062, -0.21924591064453125, -0.20444869995117188, -0.1896514892578125, -0.17485427856445312, -0.16005706787109375, -0.14525985717773438, -0.130462646484375, -0.11566543579101562, -0.10086822509765625, -0.08607101440429688, -0.0712738037109375, -0.056476593017578125, -0.04167938232421875, -0.026882171630859375, -0.0120849609375, 0.002712249755859375, 0.01750946044921875, 0.032306671142578125, 0.0471038818359375, 0.061901092529296875, 0.07669830322265625, 0.09149551391601562, 0.106292724609375, 0.12108993530273438, 0.13588714599609375, 0.15068435668945312, 0.1654815673828125, 0.18027877807617188, 0.19507598876953125, 0.20987319946289062, 0.22467041015625, 0.23946762084960938, 0.25426483154296875, 0.2690620422363281, 0.2838592529296875, 0.2986564636230469, 0.31345367431640625, 0.3282508850097656, 0.343048095703125, 0.3578453063964844, 0.37264251708984375, 0.3874397277832031, 0.4022369384765625, 0.4170341491699219, 0.43183135986328125, 0.4466285705566406, 0.46142578125]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 9.0, 9.0, 18.0, 17.0, 25.0, 32.0, 28.0, 72.0, 100.0, 123.0, 182.0, 254.0, 384.0, 467.0, 666.0, 1070.0, 1507.0, 2412.0, 3668.0, 5840.0, 9400.0, 16332.0, 28343.0, 51993.0, 97930.0, 179779.0, 252603.0, 177671.0, 95908.0, 51421.0, 28243.0, 16141.0, 9393.0, 5673.0, 3651.0, 2320.0, 1517.0, 1013.0, 714.0, 489.0, 363.0, 213.0, 161.0, 114.0, 78.0, 47.0, 50.0, 33.0, 23.0, 27.0, 15.0, 10.0, 7.0, 4.0, 5.0, 1.0, 1.0], "bins": [-1.2421875, -1.2050933837890625, -1.167999267578125, -1.1309051513671875, -1.09381103515625, -1.0567169189453125, -1.019622802734375, -0.9825286865234375, -0.9454345703125, -0.9083404541015625, -0.871246337890625, -0.8341522216796875, -0.79705810546875, -0.7599639892578125, -0.722869873046875, -0.6857757568359375, -0.648681640625, -0.6115875244140625, -0.574493408203125, -0.5373992919921875, -0.50030517578125, -0.4632110595703125, -0.426116943359375, -0.3890228271484375, -0.3519287109375, -0.3148345947265625, -0.277740478515625, -0.2406463623046875, -0.20355224609375, -0.1664581298828125, -0.129364013671875, -0.0922698974609375, -0.05517578125, -0.0180816650390625, 0.019012451171875, 0.0561065673828125, 0.09320068359375, 0.1302947998046875, 0.167388916015625, 0.2044830322265625, 0.2415771484375, 0.2786712646484375, 0.315765380859375, 0.3528594970703125, 0.38995361328125, 0.4270477294921875, 0.464141845703125, 0.5012359619140625, 0.538330078125, 0.5754241943359375, 0.612518310546875, 0.6496124267578125, 0.68670654296875, 0.7238006591796875, 0.760894775390625, 0.7979888916015625, 0.8350830078125, 0.8721771240234375, 0.909271240234375, 0.9463653564453125, 0.98345947265625, 1.0205535888671875, 1.057647705078125, 1.0947418212890625, 1.1318359375]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 6.0, 2.0, 4.0, 6.0, 9.0, 6.0, 7.0, 14.0, 16.0, 14.0, 26.0, 23.0, 26.0, 30.0, 36.0, 53.0, 43.0, 60.0, 87.0, 140.0, 178.0, 1320.0, 248.0, 162.0, 83.0, 82.0, 60.0, 46.0, 47.0, 34.0, 42.0, 17.0, 36.0, 23.0, 16.0, 9.0, 10.0, 13.0, 4.0, 4.0, 4.0, 1.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.724609375, -1.6748809814453125, -1.625152587890625, -1.5754241943359375, -1.52569580078125, -1.4759674072265625, -1.426239013671875, -1.3765106201171875, -1.3267822265625, -1.2770538330078125, -1.227325439453125, -1.1775970458984375, -1.12786865234375, -1.0781402587890625, -1.028411865234375, -0.9786834716796875, -0.928955078125, -0.8792266845703125, -0.829498291015625, -0.7797698974609375, -0.73004150390625, -0.6803131103515625, -0.630584716796875, -0.5808563232421875, -0.5311279296875, -0.4813995361328125, -0.431671142578125, -0.3819427490234375, -0.33221435546875, -0.2824859619140625, -0.232757568359375, -0.1830291748046875, -0.13330078125, -0.0835723876953125, -0.033843994140625, 0.0158843994140625, 0.06561279296875, 0.1153411865234375, 0.165069580078125, 0.2147979736328125, 0.2645263671875, 0.3142547607421875, 0.363983154296875, 0.4137115478515625, 0.46343994140625, 0.5131683349609375, 0.562896728515625, 0.6126251220703125, 0.662353515625, 0.7120819091796875, 0.761810302734375, 0.8115386962890625, 0.86126708984375, 0.9109954833984375, 0.960723876953125, 1.0104522705078125, 1.0601806640625, 1.1099090576171875, 1.159637451171875, 1.2093658447265625, 1.25909423828125, 1.3088226318359375, 1.358551025390625, 1.4082794189453125, 1.4580078125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 5.0, 1.0, 10.0, 11.0, 7.0, 15.0, 20.0, 11.0, 18.0, 19.0, 30.0, 33.0, 44.0, 58.0, 104.0, 230.0, 981.0, 12737.0, 542430.0, 2539170.0, 46595.0, 2350.0, 373.0, 131.0, 65.0, 46.0, 38.0, 32.0, 15.0, 22.0, 11.0, 11.0, 15.0, 10.0, 8.0, 9.0, 11.0, 4.0, 6.0, 5.0, 4.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.33984375, -6.1365966796875, -5.933349609375, -5.7301025390625, -5.52685546875, -5.3236083984375, -5.120361328125, -4.9171142578125, -4.7138671875, -4.5106201171875, -4.307373046875, -4.1041259765625, -3.90087890625, -3.6976318359375, -3.494384765625, -3.2911376953125, -3.087890625, -2.8846435546875, -2.681396484375, -2.4781494140625, -2.27490234375, -2.0716552734375, -1.868408203125, -1.6651611328125, -1.4619140625, -1.2586669921875, -1.055419921875, -0.8521728515625, -0.64892578125, -0.4456787109375, -0.242431640625, -0.0391845703125, 0.1640625, 0.3673095703125, 0.570556640625, 0.7738037109375, 0.97705078125, 1.1802978515625, 1.383544921875, 1.5867919921875, 1.7900390625, 1.9932861328125, 2.196533203125, 2.3997802734375, 2.60302734375, 2.8062744140625, 3.009521484375, 3.2127685546875, 3.416015625, 3.6192626953125, 3.822509765625, 4.0257568359375, 4.22900390625, 4.4322509765625, 4.635498046875, 4.8387451171875, 5.0419921875, 5.2452392578125, 5.448486328125, 5.6517333984375, 5.85498046875, 6.0582275390625, 6.261474609375, 6.4647216796875, 6.66796875]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [2.0, 2.0, 12.0, 23.0, 103.0, 195.0, 270.0, 230.0, 103.0, 59.0, 11.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2421860694885254, -1.8986618518829346, -1.5551377534866333, -1.211613655090332, -0.8680894374847412, -0.5245652198791504, -0.18104124069213867, 0.16248297691345215, 0.506007194519043, 0.849531352519989, 1.193055510520935, 1.5365796089172363, 1.8801038265228271, 2.223628044128418, 2.5671520233154297, 2.9106762409210205, 3.2542004585266113, 3.597724676132202, 3.941248893737793, 4.284772872924805, 4.628296852111816, 4.971821308135986, 5.315345287322998, 5.658869743347168, 6.00239372253418, 6.345917701721191, 6.689442157745361, 7.032966136932373, 7.376490592956543, 7.720014572143555, 8.063538551330566, 8.407062530517578, 8.750587463378906, 9.094111442565918, 9.43763542175293, 9.781160354614258, 10.12468433380127, 10.468208312988281, 10.811732292175293, 11.155256271362305, 11.498781204223633, 11.842305183410645, 12.185829162597656, 12.529354095458984, 12.872878074645996, 13.216402053833008, 13.55992603302002, 13.903450012207031, 14.246973991394043, 14.590497970581055, 14.934021949768066, 15.277545928955078, 15.621070861816406, 15.964594841003418, 16.30811882019043, 16.651643753051758, 16.995166778564453, 17.33869171142578, 17.682214736938477, 18.025739669799805, 18.3692626953125, 18.712787628173828, 19.056312561035156, 19.39983558654785, 19.74336051940918]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 9.0, 4.0, 4.0, 7.0, 10.0, 8.0, 14.0, 15.0, 14.0, 15.0, 22.0, 19.0, 15.0, 29.0, 43.0, 26.0, 30.0, 32.0, 35.0, 44.0, 34.0, 37.0, 44.0, 39.0, 42.0, 36.0, 33.0, 25.0, 38.0, 30.0, 30.0, 29.0, 25.0, 32.0, 26.0, 11.0, 22.0, 18.0, 11.0, 7.0, 9.0, 10.0, 6.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0], "bins": [-5.0485663414001465, -4.901350975036621, -4.754136085510254, -4.6069207191467285, -4.459705352783203, -4.312490463256836, -4.1652750968933105, -4.018059730529785, -3.870844602584839, -3.7236294746398926, -3.576414108276367, -3.429198980331421, -3.2819838523864746, -3.134768486022949, -2.987553358078003, -2.8403382301330566, -2.6931228637695312, -2.545907735824585, -2.3986923694610596, -2.2514772415161133, -2.104261875152588, -1.9570467472076416, -1.8098316192626953, -1.6626163721084595, -1.5154011249542236, -1.3681858777999878, -1.220970630645752, -1.0737555027008057, -0.9265402555465698, -0.779325008392334, -0.6321098208427429, -0.48489463329315186, -0.3376789093017578, -0.19046369194984436, -0.04324847459793091, 0.10396674275398254, 0.251181960105896, 0.39839720726013184, 0.5456123948097229, 0.692827582359314, 0.8400428295135498, 0.9872580766677856, 1.1344733238220215, 1.2816884517669678, 1.4289036989212036, 1.5761189460754395, 1.7233340740203857, 1.8705493211746216, 2.0177645683288574, 2.1649796962738037, 2.312195062637329, 2.4594101905822754, 2.606625556945801, 2.753840684890747, 2.9010558128356934, 3.0482711791992188, 3.195486307144165, 3.3427014350891113, 3.4899168014526367, 3.637131929397583, 3.7843470573425293, 3.9315624237060547, 4.07877779006958, 4.225992679595947, 4.373208045959473]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 3.0, 9.0, 4.0, 7.0, 16.0, 11.0, 17.0, 21.0, 17.0, 17.0, 22.0, 34.0, 24.0, 46.0, 21.0, 32.0, 40.0, 39.0, 47.0, 32.0, 30.0, 40.0, 44.0, 40.0, 40.0, 41.0, 33.0, 23.0, 39.0, 34.0, 26.0, 26.0, 15.0, 20.0, 23.0, 11.0, 7.0, 13.0, 5.0, 11.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.490966796875, -0.4763832092285156, -0.46179962158203125, -0.4472160339355469, -0.4326324462890625, -0.4180488586425781, -0.40346527099609375, -0.3888816833496094, -0.374298095703125, -0.3597145080566406, -0.34513092041015625, -0.3305473327636719, -0.3159637451171875, -0.3013801574707031, -0.28679656982421875, -0.2722129821777344, -0.25762939453125, -0.24304580688476562, -0.22846221923828125, -0.21387863159179688, -0.1992950439453125, -0.18471145629882812, -0.17012786865234375, -0.15554428100585938, -0.140960693359375, -0.12637710571289062, -0.11179351806640625, -0.09720993041992188, -0.0826263427734375, -0.06804275512695312, -0.05345916748046875, -0.038875579833984375, -0.0242919921875, -0.009708404541015625, 0.00487518310546875, 0.019458770751953125, 0.0340423583984375, 0.048625946044921875, 0.06320953369140625, 0.07779312133789062, 0.092376708984375, 0.10696029663085938, 0.12154388427734375, 0.13612747192382812, 0.1507110595703125, 0.16529464721679688, 0.17987823486328125, 0.19446182250976562, 0.20904541015625, 0.22362899780273438, 0.23821258544921875, 0.2527961730957031, 0.2673797607421875, 0.2819633483886719, 0.29654693603515625, 0.3111305236816406, 0.325714111328125, 0.3402976989746094, 0.35488128662109375, 0.3694648742675781, 0.3840484619140625, 0.3986320495605469, 0.41321563720703125, 0.4277992248535156, 0.4423828125]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 9.0, 4.0, 5.0, 10.0, 11.0, 13.0, 34.0, 39.0, 42.0, 72.0, 92.0, 159.0, 247.0, 415.0, 752.0, 1299.0, 2518.0, 5056.0, 10628.0, 23481.0, 56962.0, 170592.0, 1219573.0, 2320151.0, 248265.0, 75776.0, 30645.0, 13989.0, 6651.0, 3188.0, 1570.0, 890.0, 414.0, 247.0, 171.0, 101.0, 52.0, 46.0, 26.0, 22.0, 13.0, 17.0, 17.0, 9.0, 4.0, 1.0, 8.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8955078125, -1.8365325927734375, -1.777557373046875, -1.7185821533203125, -1.65960693359375, -1.6006317138671875, -1.541656494140625, -1.4826812744140625, -1.4237060546875, -1.3647308349609375, -1.305755615234375, -1.2467803955078125, -1.18780517578125, -1.1288299560546875, -1.069854736328125, -1.0108795166015625, -0.951904296875, -0.8929290771484375, -0.833953857421875, -0.7749786376953125, -0.71600341796875, -0.6570281982421875, -0.598052978515625, -0.5390777587890625, -0.4801025390625, -0.4211273193359375, -0.362152099609375, -0.3031768798828125, -0.24420166015625, -0.1852264404296875, -0.126251220703125, -0.0672760009765625, -0.00830078125, 0.0506744384765625, 0.109649658203125, 0.1686248779296875, 0.22760009765625, 0.2865753173828125, 0.345550537109375, 0.4045257568359375, 0.4635009765625, 0.5224761962890625, 0.581451416015625, 0.6404266357421875, 0.69940185546875, 0.7583770751953125, 0.817352294921875, 0.8763275146484375, 0.935302734375, 0.9942779541015625, 1.053253173828125, 1.1122283935546875, 1.17120361328125, 1.2301788330078125, 1.289154052734375, 1.3481292724609375, 1.4071044921875, 1.4660797119140625, 1.525054931640625, 1.5840301513671875, 1.64300537109375, 1.7019805908203125, 1.760955810546875, 1.8199310302734375, 1.87890625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 19.0, 29.0, 64.0, 97.0, 192.0, 371.0, 887.0, 1311.0, 552.0, 257.0, 150.0, 80.0, 36.0, 15.0, 7.0, 3.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.435546875, -3.304595947265625, -3.17364501953125, -3.042694091796875, -2.9117431640625, -2.780792236328125, -2.64984130859375, -2.518890380859375, -2.387939453125, -2.256988525390625, -2.12603759765625, -1.995086669921875, -1.8641357421875, -1.733184814453125, -1.60223388671875, -1.471282958984375, -1.34033203125, -1.209381103515625, -1.07843017578125, -0.947479248046875, -0.8165283203125, -0.685577392578125, -0.55462646484375, -0.423675537109375, -0.292724609375, -0.161773681640625, -0.03082275390625, 0.100128173828125, 0.2310791015625, 0.362030029296875, 0.49298095703125, 0.623931884765625, 0.7548828125, 0.885833740234375, 1.01678466796875, 1.147735595703125, 1.2786865234375, 1.409637451171875, 1.54058837890625, 1.671539306640625, 1.802490234375, 1.933441162109375, 2.06439208984375, 2.195343017578125, 2.3262939453125, 2.457244873046875, 2.58819580078125, 2.719146728515625, 2.85009765625, 2.981048583984375, 3.11199951171875, 3.242950439453125, 3.3739013671875, 3.504852294921875, 3.63580322265625, 3.766754150390625, 3.897705078125, 4.028656005859375, 4.15960693359375, 4.290557861328125, 4.4215087890625, 4.552459716796875, 4.68341064453125, 4.814361572265625, 4.9453125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 8.0, 5.0, 11.0, 14.0, 19.0, 29.0, 29.0, 38.0, 63.0, 104.0, 207.0, 469.0, 1345.0, 5061.0, 27540.0, 270347.0, 3532265.0, 317876.0, 30655.0, 5653.0, 1480.0, 483.0, 226.0, 112.0, 66.0, 41.0, 26.0, 25.0, 15.0, 18.0, 16.0, 11.0, 4.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.81640625, -5.58856201171875, -5.3607177734375, -5.13287353515625, -4.905029296875, -4.67718505859375, -4.4493408203125, -4.22149658203125, -3.99365234375, -3.76580810546875, -3.5379638671875, -3.31011962890625, -3.082275390625, -2.85443115234375, -2.6265869140625, -2.39874267578125, -2.1708984375, -1.94305419921875, -1.7152099609375, -1.48736572265625, -1.259521484375, -1.03167724609375, -0.8038330078125, -0.57598876953125, -0.34814453125, -0.12030029296875, 0.1075439453125, 0.33538818359375, 0.563232421875, 0.79107666015625, 1.0189208984375, 1.24676513671875, 1.474609375, 1.70245361328125, 1.9302978515625, 2.15814208984375, 2.385986328125, 2.61383056640625, 2.8416748046875, 3.06951904296875, 3.29736328125, 3.52520751953125, 3.7530517578125, 3.98089599609375, 4.208740234375, 4.43658447265625, 4.6644287109375, 4.89227294921875, 5.1201171875, 5.34796142578125, 5.5758056640625, 5.80364990234375, 6.031494140625, 6.25933837890625, 6.4871826171875, 6.71502685546875, 6.94287109375, 7.17071533203125, 7.3985595703125, 7.62640380859375, 7.854248046875, 8.08209228515625, 8.3099365234375, 8.53778076171875, 8.765625]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 2.0, 6.0, 6.0, 19.0, 26.0, 49.0, 60.0, 71.0, 103.0, 123.0, 131.0, 118.0, 105.0, 64.0, 45.0, 30.0, 18.0, 12.0, 10.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.885873794555664, -8.532870292663574, -8.179866790771484, -7.826864242553711, -7.473860740661621, -7.120857238769531, -6.7678542137146, -6.414851188659668, -6.061847686767578, -5.708844184875488, -5.355841159820557, -5.002838134765625, -4.649834632873535, -4.296831130981445, -3.9438281059265137, -3.590824842453003, -3.237821578979492, -2.8848183155059814, -2.5318150520324707, -2.17881178855896, -1.8258085250854492, -1.4728052616119385, -1.1198019981384277, -0.766798734664917, -0.41379547119140625, -0.06079220771789551, 0.29221105575561523, 0.645214319229126, 0.9982175827026367, 1.3512208461761475, 1.7042241096496582, 2.057227373123169, 2.4102306365966797, 2.7632339000701904, 3.116237163543701, 3.469240427017212, 3.8222436904907227, 4.1752471923828125, 4.528250217437744, 4.881253242492676, 5.234256744384766, 5.5872602462768555, 5.940263271331787, 6.293266296386719, 6.646269798278809, 6.999273300170898, 7.35227632522583, 7.705279350280762, 8.058282852172852, 8.411286354064941, 8.764289855957031, 9.117292404174805, 9.470295906066895, 9.823299407958984, 10.176301956176758, 10.529305458068848, 10.882308959960938, 11.235312461853027, 11.588315963745117, 11.94131851196289, 12.29432201385498, 12.64732551574707, 13.000328063964844, 13.353331565856934, 13.706335067749023]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 8.0, 4.0, 2.0, 4.0, 10.0, 12.0, 7.0, 18.0, 15.0, 8.0, 30.0, 19.0, 17.0, 32.0, 46.0, 32.0, 33.0, 42.0, 54.0, 39.0, 42.0, 47.0, 43.0, 52.0, 34.0, 46.0, 27.0, 27.0, 33.0, 33.0, 16.0, 26.0, 35.0, 21.0, 19.0, 16.0, 12.0, 8.0, 9.0, 6.0, 7.0, 4.0, 4.0, 7.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.796862602233887, -5.603631496429443, -5.410400390625, -5.217169761657715, -5.0239386558532715, -4.830707550048828, -4.637476444244385, -4.444245338439941, -4.251014709472656, -4.057783603668213, -3.8645527362823486, -3.6713216304779053, -3.478090763092041, -3.2848596572875977, -3.0916285514831543, -2.898397445678711, -2.7051663398742676, -2.511935234069824, -2.31870436668396, -2.1254732608795166, -1.9322422742843628, -1.739011287689209, -1.5457801818847656, -1.3525491952896118, -1.159318208694458, -0.9660872220993042, -0.7728561758995056, -0.579625129699707, -0.3863941431045532, -0.19316315650939941, 6.794929504394531e-05, 0.19329893589019775, 0.38652944564819336, 0.5797604322433472, 0.7729914784431458, 0.9662225246429443, 1.1594535112380981, 1.352684497833252, 1.5459156036376953, 1.7391465902328491, 1.932377576828003, 2.1256086826324463, 2.3188395500183105, 2.512070655822754, 2.7053017616271973, 2.8985326290130615, 3.091763734817505, 3.284994602203369, 3.4782257080078125, 3.671456813812256, 3.86468768119812, 4.057918548583984, 4.251149654388428, 4.444380760192871, 4.6376118659973145, 4.830842971801758, 5.024073600769043, 5.217304706573486, 5.41053581237793, 5.603766441345215, 5.796997547149658, 5.990228652954102, 6.183459758758545, 6.376690864562988, 6.569921970367432]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 5.0, 5.0, 7.0, 7.0, 11.0, 13.0, 12.0, 19.0, 17.0, 22.0, 22.0, 29.0, 27.0, 28.0, 28.0, 41.0, 26.0, 42.0, 33.0, 36.0, 49.0, 42.0, 30.0, 44.0, 40.0, 52.0, 39.0, 40.0, 33.0, 23.0, 26.0, 20.0, 14.0, 19.0, 19.0, 15.0, 10.0, 15.0, 5.0, 5.0, 5.0, 4.0, 7.0, 6.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5009765625, -0.4853935241699219, -0.46981048583984375, -0.4542274475097656, -0.4386444091796875, -0.4230613708496094, -0.40747833251953125, -0.3918952941894531, -0.376312255859375, -0.3607292175292969, -0.34514617919921875, -0.3295631408691406, -0.3139801025390625, -0.2983970642089844, -0.28281402587890625, -0.2672309875488281, -0.25164794921875, -0.23606491088867188, -0.22048187255859375, -0.20489883422851562, -0.1893157958984375, -0.17373275756835938, -0.15814971923828125, -0.14256668090820312, -0.126983642578125, -0.11140060424804688, -0.09581756591796875, -0.08023452758789062, -0.0646514892578125, -0.049068450927734375, -0.03348541259765625, -0.017902374267578125, -0.0023193359375, 0.013263702392578125, 0.02884674072265625, 0.044429779052734375, 0.0600128173828125, 0.07559585571289062, 0.09117889404296875, 0.10676193237304688, 0.122344970703125, 0.13792800903320312, 0.15351104736328125, 0.16909408569335938, 0.1846771240234375, 0.20026016235351562, 0.21584320068359375, 0.23142623901367188, 0.24700927734375, 0.2625923156738281, 0.27817535400390625, 0.2937583923339844, 0.3093414306640625, 0.3249244689941406, 0.34050750732421875, 0.3560905456542969, 0.371673583984375, 0.3872566223144531, 0.40283966064453125, 0.4184226989746094, 0.4340057373046875, 0.4495887756347656, 0.46517181396484375, 0.4807548522949219, 0.496337890625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 5.0, 2.0, 7.0, 7.0, 19.0, 16.0, 24.0, 32.0, 68.0, 81.0, 136.0, 203.0, 299.0, 406.0, 554.0, 916.0, 1282.0, 1828.0, 2843.0, 4065.0, 5928.0, 8872.0, 13149.0, 19876.0, 30667.0, 47379.0, 76207.0, 124814.0, 215619.0, 190839.0, 109778.0, 67550.0, 42849.0, 27271.0, 17974.0, 11934.0, 8046.0, 5394.0, 3771.0, 2496.0, 1672.0, 1183.0, 780.0, 550.0, 341.0, 274.0, 164.0, 130.0, 89.0, 52.0, 44.0, 28.0, 18.0, 12.0, 6.0, 5.0, 7.0, 4.0, 1.0, 3.0], "bins": [-0.88818359375, -0.8611679077148438, -0.8341522216796875, -0.8071365356445312, -0.780120849609375, -0.7531051635742188, -0.7260894775390625, -0.6990737915039062, -0.67205810546875, -0.6450424194335938, -0.6180267333984375, -0.5910110473632812, -0.563995361328125, -0.5369796752929688, -0.5099639892578125, -0.48294830322265625, -0.4559326171875, -0.42891693115234375, -0.4019012451171875, -0.37488555908203125, -0.347869873046875, -0.32085418701171875, -0.2938385009765625, -0.26682281494140625, -0.23980712890625, -0.21279144287109375, -0.1857757568359375, -0.15876007080078125, -0.131744384765625, -0.10472869873046875, -0.0777130126953125, -0.05069732666015625, -0.023681640625, 0.00333404541015625, 0.0303497314453125, 0.05736541748046875, 0.084381103515625, 0.11139678955078125, 0.1384124755859375, 0.16542816162109375, 0.19244384765625, 0.21945953369140625, 0.2464752197265625, 0.27349090576171875, 0.300506591796875, 0.32752227783203125, 0.3545379638671875, 0.38155364990234375, 0.4085693359375, 0.43558502197265625, 0.4626007080078125, 0.48961639404296875, 0.516632080078125, 0.5436477661132812, 0.5706634521484375, 0.5976791381835938, 0.62469482421875, 0.6517105102539062, 0.6787261962890625, 0.7057418823242188, 0.732757568359375, 0.7597732543945312, 0.7867889404296875, 0.8138046264648438, 0.8408203125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 7.0, 10.0, 6.0, 12.0, 19.0, 16.0, 15.0, 25.0, 19.0, 31.0, 25.0, 35.0, 37.0, 36.0, 26.0, 37.0, 40.0, 47.0, 34.0, 1071.0, 41.0, 43.0, 23.0, 38.0, 37.0, 36.0, 28.0, 27.0, 29.0, 25.0, 25.0, 17.0, 17.0, 20.0, 8.0, 12.0, 10.0, 9.0, 3.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.50244140625, -0.4882659912109375, -0.474090576171875, -0.4599151611328125, -0.44573974609375, -0.4315643310546875, -0.417388916015625, -0.4032135009765625, -0.3890380859375, -0.3748626708984375, -0.360687255859375, -0.3465118408203125, -0.33233642578125, -0.3181610107421875, -0.303985595703125, -0.2898101806640625, -0.275634765625, -0.2614593505859375, -0.247283935546875, -0.2331085205078125, -0.21893310546875, -0.2047576904296875, -0.190582275390625, -0.1764068603515625, -0.1622314453125, -0.1480560302734375, -0.133880615234375, -0.1197052001953125, -0.10552978515625, -0.0913543701171875, -0.077178955078125, -0.0630035400390625, -0.048828125, -0.0346527099609375, -0.020477294921875, -0.0063018798828125, 0.00787353515625, 0.0220489501953125, 0.036224365234375, 0.0503997802734375, 0.0645751953125, 0.0787506103515625, 0.092926025390625, 0.1071014404296875, 0.12127685546875, 0.1354522705078125, 0.149627685546875, 0.1638031005859375, 0.177978515625, 0.1921539306640625, 0.206329345703125, 0.2205047607421875, 0.23468017578125, 0.2488555908203125, 0.263031005859375, 0.2772064208984375, 0.2913818359375, 0.3055572509765625, 0.319732666015625, 0.3339080810546875, 0.34808349609375, 0.3622589111328125, 0.376434326171875, 0.3906097412109375, 0.40478515625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 10.0, 6.0, 14.0, 12.0, 25.0, 28.0, 40.0, 76.0, 122.0, 168.0, 283.0, 396.0, 689.0, 1029.0, 1627.0, 2685.0, 4826.0, 8938.0, 17484.0, 37356.0, 93927.0, 325245.0, 1154469.0, 289887.0, 86412.0, 34915.0, 16478.0, 8391.0, 4600.0, 2709.0, 1616.0, 965.0, 592.0, 387.0, 241.0, 164.0, 127.0, 74.0, 37.0, 28.0, 20.0, 16.0, 5.0, 4.0, 7.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8125, -0.7866744995117188, -0.7608489990234375, -0.7350234985351562, -0.709197998046875, -0.6833724975585938, -0.6575469970703125, -0.6317214965820312, -0.60589599609375, -0.5800704956054688, -0.5542449951171875, -0.5284194946289062, -0.502593994140625, -0.47676849365234375, -0.4509429931640625, -0.42511749267578125, -0.3992919921875, -0.37346649169921875, -0.3476409912109375, -0.32181549072265625, -0.295989990234375, -0.27016448974609375, -0.2443389892578125, -0.21851348876953125, -0.19268798828125, -0.16686248779296875, -0.1410369873046875, -0.11521148681640625, -0.089385986328125, -0.06356048583984375, -0.0377349853515625, -0.01190948486328125, 0.013916015625, 0.03974151611328125, 0.0655670166015625, 0.09139251708984375, 0.117218017578125, 0.14304351806640625, 0.1688690185546875, 0.19469451904296875, 0.22052001953125, 0.24634552001953125, 0.2721710205078125, 0.29799652099609375, 0.323822021484375, 0.34964752197265625, 0.3754730224609375, 0.40129852294921875, 0.4271240234375, 0.45294952392578125, 0.4787750244140625, 0.5046005249023438, 0.530426025390625, 0.5562515258789062, 0.5820770263671875, 0.6079025268554688, 0.63372802734375, 0.6595535278320312, 0.6853790283203125, 0.7112045288085938, 0.737030029296875, 0.7628555297851562, 0.7886810302734375, 0.8145065307617188, 0.84033203125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 3.0, 3.0, 6.0, 6.0, 9.0, 5.0, 15.0, 16.0, 21.0, 30.0, 31.0, 47.0, 75.0, 92.0, 139.0, 131.0, 86.0, 80.0, 55.0, 27.0, 27.0, 20.0, 14.0, 14.0, 7.0, 11.0, 8.0, 4.0, 7.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.381103515625, -0.3695182800292969, -0.35793304443359375, -0.3463478088378906, -0.3347625732421875, -0.3231773376464844, -0.31159210205078125, -0.3000068664550781, -0.288421630859375, -0.2768363952636719, -0.26525115966796875, -0.2536659240722656, -0.2420806884765625, -0.23049545288085938, -0.21891021728515625, -0.20732498168945312, -0.19573974609375, -0.18415451049804688, -0.17256927490234375, -0.16098403930664062, -0.1493988037109375, -0.13781356811523438, -0.12622833251953125, -0.11464309692382812, -0.103057861328125, -0.09147262573242188, -0.07988739013671875, -0.06830215454101562, -0.0567169189453125, -0.045131683349609375, -0.03354644775390625, -0.021961212158203125, -0.0103759765625, 0.001209259033203125, 0.01279449462890625, 0.024379730224609375, 0.0359649658203125, 0.047550201416015625, 0.05913543701171875, 0.07072067260742188, 0.082305908203125, 0.09389114379882812, 0.10547637939453125, 0.11706161499023438, 0.1286468505859375, 0.14023208618164062, 0.15181732177734375, 0.16340255737304688, 0.17498779296875, 0.18657302856445312, 0.19815826416015625, 0.20974349975585938, 0.2213287353515625, 0.23291397094726562, 0.24449920654296875, 0.2560844421386719, 0.267669677734375, 0.2792549133300781, 0.29084014892578125, 0.3024253845214844, 0.3140106201171875, 0.3255958557128906, 0.33718109130859375, 0.3487663269042969, 0.3603515625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 9.0, 5.0, 10.0, 13.0, 13.0, 20.0, 18.0, 17.0, 22.0, 32.0, 53.0, 59.0, 99.0, 138.0, 266.0, 664.0, 1877.0, 14154.0, 930854.0, 94097.0, 4045.0, 1038.0, 435.0, 173.0, 113.0, 73.0, 57.0, 41.0, 30.0, 19.0, 27.0, 11.0, 18.0, 11.0, 13.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0], "bins": [-4.9140625, -4.76397705078125, -4.6138916015625, -4.46380615234375, -4.313720703125, -4.16363525390625, -4.0135498046875, -3.86346435546875, -3.71337890625, -3.56329345703125, -3.4132080078125, -3.26312255859375, -3.113037109375, -2.96295166015625, -2.8128662109375, -2.66278076171875, -2.5126953125, -2.36260986328125, -2.2125244140625, -2.06243896484375, -1.912353515625, -1.76226806640625, -1.6121826171875, -1.46209716796875, -1.31201171875, -1.16192626953125, -1.0118408203125, -0.86175537109375, -0.711669921875, -0.56158447265625, -0.4114990234375, -0.26141357421875, -0.111328125, 0.03875732421875, 0.1888427734375, 0.33892822265625, 0.489013671875, 0.63909912109375, 0.7891845703125, 0.93927001953125, 1.08935546875, 1.23944091796875, 1.3895263671875, 1.53961181640625, 1.689697265625, 1.83978271484375, 1.9898681640625, 2.13995361328125, 2.2900390625, 2.44012451171875, 2.5902099609375, 2.74029541015625, 2.890380859375, 3.04046630859375, 3.1905517578125, 3.34063720703125, 3.49072265625, 3.64080810546875, 3.7908935546875, 3.94097900390625, 4.091064453125, 4.24114990234375, 4.3912353515625, 4.54132080078125, 4.69140625]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 8.0, 21.0, 48.0, 89.0, 206.0, 297.0, 205.0, 94.0, 27.0, 13.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7928172945976257, -0.7447412610054016, -0.6966651678085327, -0.6485891342163086, -0.6005131006240845, -0.5524370670318604, -0.5043609738349915, -0.45628494024276733, -0.4082088768482208, -0.3601328134536743, -0.3120567798614502, -0.2639807164669037, -0.21590466797351837, -0.16782861948013306, -0.11975255608558655, -0.07167652249336243, -0.023600459098815918, 0.024475593119859695, 0.07255164533853531, 0.12062770128250122, 0.16870374977588654, 0.21677979826927185, 0.26485586166381836, 0.3129318952560425, 0.361007958650589, 0.4090840220451355, 0.4571600556373596, 0.5052361488342285, 0.5533121824264526, 0.6013882160186768, 0.6494642496109009, 0.697540283203125, 0.7456163167953491, 0.7936923503875732, 0.8417684435844421, 0.8898444771766663, 0.9379205107688904, 0.9859966039657593, 1.0340726375579834, 1.0821486711502075, 1.1302247047424316, 1.1783007383346558, 1.2263767719268799, 1.2744529247283936, 1.3225289583206177, 1.3706049919128418, 1.418681025505066, 1.46675705909729, 1.5148332118988037, 1.5629092454910278, 1.610985279083252, 1.6590614318847656, 1.7071374654769897, 1.7552134990692139, 1.803289532661438, 1.851365566253662, 1.8994415998458862, 1.9475176334381104, 1.9955936670303345, 2.0436697006225586, 2.0917458534240723, 2.139821767807007, 2.1878979206085205, 2.235973834991455, 2.2840499877929688]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 9.0, 6.0, 13.0, 11.0, 13.0, 23.0, 19.0, 14.0, 21.0, 39.0, 30.0, 23.0, 40.0, 30.0, 46.0, 38.0, 44.0, 35.0, 38.0, 44.0, 38.0, 37.0, 46.0, 34.0, 40.0, 25.0, 37.0, 37.0, 33.0, 26.0, 14.0, 18.0, 14.0, 15.0, 8.0, 13.0, 9.0, 5.0, 6.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3175188899040222, -0.3081035017967224, -0.298688143491745, -0.2892727553844452, -0.2798573970794678, -0.27044200897216797, -0.26102662086486816, -0.25161126255989075, -0.24219587445259094, -0.23278050124645233, -0.22336512804031372, -0.21394973993301392, -0.2045343667268753, -0.1951189935207367, -0.18570362031459808, -0.17628824710845947, -0.16687287390232086, -0.15745750069618225, -0.14804212749004364, -0.13862675428390503, -0.12921136617660522, -0.11979599297046661, -0.110380619764328, -0.1009652391076088, -0.09154986590147018, -0.08213449269533157, -0.07271911203861237, -0.06330373883247375, -0.053888361901044846, -0.044472984969615936, -0.035057611763477325, -0.025642231106758118, -0.016226857900619507, -0.006811481900513172, 0.0026038940995931625, 0.012019269168376923, 0.021434646099805832, 0.03085002303123474, 0.04026539623737335, 0.04968077689409256, 0.05909615010023117, 0.06851152330636978, 0.07792690396308899, 0.0873422771692276, 0.09675765037536621, 0.10617303103208542, 0.11558840423822403, 0.12500378489494324, 0.13441915810108185, 0.14383453130722046, 0.15324990451335907, 0.16266527771949768, 0.17208066582679749, 0.1814960390329361, 0.1909114122390747, 0.2003268003463745, 0.20974215865135193, 0.21915753185749054, 0.22857290506362915, 0.23798829317092896, 0.24740366637706757, 0.2568190395832062, 0.2662343978881836, 0.2756497859954834, 0.2850651741027832]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 8.0, 4.0, 5.0, 7.0, 7.0, 10.0, 14.0, 11.0, 20.0, 16.0, 17.0, 25.0, 27.0, 25.0, 27.0, 29.0, 41.0, 25.0, 44.0, 32.0, 31.0, 42.0, 48.0, 36.0, 37.0, 41.0, 47.0, 47.0, 39.0, 35.0, 26.0, 21.0, 28.0, 12.0, 18.0, 22.0, 15.0, 13.0, 12.0, 6.0, 6.0, 4.0, 6.0, 6.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.50390625, -0.4883689880371094, -0.47283172607421875, -0.4572944641113281, -0.4417572021484375, -0.4262199401855469, -0.41068267822265625, -0.3951454162597656, -0.379608154296875, -0.3640708923339844, -0.34853363037109375, -0.3329963684082031, -0.3174591064453125, -0.3019218444824219, -0.28638458251953125, -0.2708473205566406, -0.25531005859375, -0.23977279663085938, -0.22423553466796875, -0.20869827270507812, -0.1931610107421875, -0.17762374877929688, -0.16208648681640625, -0.14654922485351562, -0.131011962890625, -0.11547470092773438, -0.09993743896484375, -0.08440017700195312, -0.0688629150390625, -0.053325653076171875, -0.03778839111328125, -0.022251129150390625, -0.0067138671875, 0.008823394775390625, 0.02436065673828125, 0.039897918701171875, 0.0554351806640625, 0.07097244262695312, 0.08650970458984375, 0.10204696655273438, 0.117584228515625, 0.13312149047851562, 0.14865875244140625, 0.16419601440429688, 0.1797332763671875, 0.19527053833007812, 0.21080780029296875, 0.22634506225585938, 0.24188232421875, 0.2574195861816406, 0.27295684814453125, 0.2884941101074219, 0.3040313720703125, 0.3195686340332031, 0.33510589599609375, 0.3506431579589844, 0.366180419921875, 0.3817176818847656, 0.39725494384765625, 0.4127922058105469, 0.4283294677734375, 0.4438667297363281, 0.45940399169921875, 0.4749412536621094, 0.490478515625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 2.0, 4.0, 9.0, 15.0, 14.0, 19.0, 31.0, 46.0, 64.0, 77.0, 115.0, 190.0, 295.0, 378.0, 497.0, 732.0, 1005.0, 1536.0, 2215.0, 3435.0, 5669.0, 9609.0, 18058.0, 36190.0, 79241.0, 178075.0, 299535.0, 216333.0, 99165.0, 44573.0, 21626.0, 11310.0, 6445.0, 3978.0, 2552.0, 1664.0, 1108.0, 825.0, 530.0, 418.0, 268.0, 188.0, 152.0, 102.0, 85.0, 67.0, 33.0, 23.0, 20.0, 14.0, 10.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.8388671875, -0.8131637573242188, -0.7874603271484375, -0.7617568969726562, -0.736053466796875, -0.7103500366210938, -0.6846466064453125, -0.6589431762695312, -0.63323974609375, -0.6075363159179688, -0.5818328857421875, -0.5561294555664062, -0.530426025390625, -0.5047225952148438, -0.4790191650390625, -0.45331573486328125, -0.4276123046875, -0.40190887451171875, -0.3762054443359375, -0.35050201416015625, -0.324798583984375, -0.29909515380859375, -0.2733917236328125, -0.24768829345703125, -0.22198486328125, -0.19628143310546875, -0.1705780029296875, -0.14487457275390625, -0.119171142578125, -0.09346771240234375, -0.0677642822265625, -0.04206085205078125, -0.016357421875, 0.00934600830078125, 0.0350494384765625, 0.06075286865234375, 0.086456298828125, 0.11215972900390625, 0.1378631591796875, 0.16356658935546875, 0.18927001953125, 0.21497344970703125, 0.2406768798828125, 0.26638031005859375, 0.292083740234375, 0.31778717041015625, 0.3434906005859375, 0.36919403076171875, 0.3948974609375, 0.42060089111328125, 0.4463043212890625, 0.47200775146484375, 0.497711181640625, 0.5234146118164062, 0.5491180419921875, 0.5748214721679688, 0.60052490234375, 0.6262283325195312, 0.6519317626953125, 0.6776351928710938, 0.703338623046875, 0.7290420532226562, 0.7547454833984375, 0.7804489135742188, 0.80615234375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 8.0, 7.0, 11.0, 7.0, 6.0, 14.0, 9.0, 19.0, 12.0, 19.0, 33.0, 35.0, 27.0, 35.0, 49.0, 40.0, 60.0, 67.0, 102.0, 192.0, 1290.0, 309.0, 164.0, 106.0, 66.0, 47.0, 51.0, 31.0, 42.0, 20.0, 27.0, 16.0, 24.0, 25.0, 11.0, 13.0, 11.0, 10.0, 10.0, 4.0, 7.0, 5.0, 2.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9755859375, -1.913818359375, -1.85205078125, -1.790283203125, -1.728515625, -1.666748046875, -1.60498046875, -1.543212890625, -1.4814453125, -1.419677734375, -1.35791015625, -1.296142578125, -1.234375, -1.172607421875, -1.11083984375, -1.049072265625, -0.9873046875, -0.925537109375, -0.86376953125, -0.802001953125, -0.740234375, -0.678466796875, -0.61669921875, -0.554931640625, -0.4931640625, -0.431396484375, -0.36962890625, -0.307861328125, -0.24609375, -0.184326171875, -0.12255859375, -0.060791015625, 0.0009765625, 0.062744140625, 0.12451171875, 0.186279296875, 0.248046875, 0.309814453125, 0.37158203125, 0.433349609375, 0.4951171875, 0.556884765625, 0.61865234375, 0.680419921875, 0.7421875, 0.803955078125, 0.86572265625, 0.927490234375, 0.9892578125, 1.051025390625, 1.11279296875, 1.174560546875, 1.236328125, 1.298095703125, 1.35986328125, 1.421630859375, 1.4833984375, 1.545166015625, 1.60693359375, 1.668701171875, 1.73046875, 1.792236328125, 1.85400390625, 1.915771484375, 1.9775390625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 5.0, 5.0, 5.0, 3.0, 7.0, 14.0, 5.0, 8.0, 15.0, 24.0, 28.0, 41.0, 65.0, 85.0, 161.0, 285.0, 637.0, 1550.0, 4291.0, 14570.0, 74941.0, 1125655.0, 1791409.0, 104915.0, 18379.0, 5175.0, 1852.0, 724.0, 347.0, 176.0, 95.0, 66.0, 38.0, 27.0, 24.0, 16.0, 13.0, 10.0, 14.0, 4.0, 8.0, 6.0, 4.0, 5.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.556640625, -3.449127197265625, -3.34161376953125, -3.234100341796875, -3.1265869140625, -3.019073486328125, -2.91156005859375, -2.804046630859375, -2.696533203125, -2.589019775390625, -2.48150634765625, -2.373992919921875, -2.2664794921875, -2.158966064453125, -2.05145263671875, -1.943939208984375, -1.83642578125, -1.728912353515625, -1.62139892578125, -1.513885498046875, -1.4063720703125, -1.298858642578125, -1.19134521484375, -1.083831787109375, -0.976318359375, -0.868804931640625, -0.76129150390625, -0.653778076171875, -0.5462646484375, -0.438751220703125, -0.33123779296875, -0.223724365234375, -0.1162109375, -0.008697509765625, 0.09881591796875, 0.206329345703125, 0.3138427734375, 0.421356201171875, 0.52886962890625, 0.636383056640625, 0.743896484375, 0.851409912109375, 0.95892333984375, 1.066436767578125, 1.1739501953125, 1.281463623046875, 1.38897705078125, 1.496490478515625, 1.60400390625, 1.711517333984375, 1.81903076171875, 1.926544189453125, 2.0340576171875, 2.141571044921875, 2.24908447265625, 2.356597900390625, 2.464111328125, 2.571624755859375, 2.67913818359375, 2.786651611328125, 2.8941650390625, 3.001678466796875, 3.10919189453125, 3.216705322265625, 3.32421875]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [4.0, 11.0, 70.0, 281.0, 452.0, 156.0, 45.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8823583126068115, -2.2170772552490234, -1.5517960786819458, -0.8865149021148682, -0.22123384475708008, 0.444047212600708, 1.1093285083770752, 1.7746093273162842, 2.4398906230926514, 3.1051716804504395, 3.7704529762268066, 4.435733795166016, 5.101015090942383, 5.76629638671875, 6.431577682495117, 7.096858024597168, 7.762139320373535, 8.427420616149902, 9.09270191192627, 9.75798225402832, 10.423263549804688, 11.088544845581055, 11.753826141357422, 12.419107437133789, 13.084388732910156, 13.749670028686523, 14.41495132446289, 15.080232620239258, 15.745512962341309, 16.41079330444336, 17.07607650756836, 17.741355895996094, 18.40663719177246, 19.071918487548828, 19.737199783325195, 20.402481079101562, 21.06776237487793, 21.733043670654297, 22.39832305908203, 23.0636043548584, 23.728885650634766, 24.394166946411133, 25.0594482421875, 25.724729537963867, 26.390010833740234, 27.05529022216797, 27.72057342529297, 28.385852813720703, 29.051136016845703, 29.71641731262207, 30.381698608398438, 31.046979904174805, 31.712261199951172, 32.377540588378906, 33.042823791503906, 33.70810317993164, 34.373382568359375, 35.03866195678711, 35.70394515991211, 36.369224548339844, 37.034507751464844, 37.69978713989258, 38.36507034301758, 39.03034973144531, 39.69563293457031]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 10.0, 7.0, 9.0, 9.0, 13.0, 6.0, 11.0, 18.0, 29.0, 29.0, 36.0, 24.0, 28.0, 31.0, 32.0, 33.0, 25.0, 50.0, 50.0, 37.0, 36.0, 40.0, 46.0, 36.0, 45.0, 37.0, 30.0, 34.0, 21.0, 18.0, 22.0, 22.0, 17.0, 14.0, 16.0, 9.0, 13.0, 11.0, 12.0, 9.0, 7.0, 2.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.019500732421875, -5.821157455444336, -5.622813701629639, -5.424469947814941, -5.226126670837402, -5.027783393859863, -4.829439640045166, -4.631095886230469, -4.43275260925293, -4.234409332275391, -4.036065578460693, -3.837722063064575, -3.639378547668457, -3.441035032272339, -3.2426915168762207, -3.0443480014801025, -2.8460044860839844, -2.647660970687866, -2.449317455291748, -2.25097393989563, -2.0526304244995117, -1.8542869091033936, -1.6559433937072754, -1.4575998783111572, -1.259256362915039, -1.060912847518921, -0.8625693321228027, -0.6642258167266846, -0.4658823013305664, -0.26753878593444824, -0.06919527053833008, 0.12914824485778809, 0.32749223709106445, 0.5258357524871826, 0.7241792678833008, 0.922522783279419, 1.120866298675537, 1.3192098140716553, 1.5175533294677734, 1.7158968448638916, 1.9142403602600098, 2.112583875656128, 2.310927391052246, 2.5092709064483643, 2.7076144218444824, 2.9059579372406006, 3.1043014526367188, 3.302644968032837, 3.500988483428955, 3.6993319988250732, 3.8976755142211914, 4.0960187911987305, 4.294362545013428, 4.492706298828125, 4.691049575805664, 4.889392852783203, 5.0877366065979, 5.286080360412598, 5.484423637390137, 5.682766914367676, 5.881110668182373, 6.07945442199707, 6.277797698974609, 6.476140975952148, 6.674484729766846]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 6.0, 5.0, 11.0, 5.0, 13.0, 10.0, 14.0, 21.0, 22.0, 25.0, 24.0, 22.0, 28.0, 30.0, 30.0, 32.0, 34.0, 34.0, 39.0, 41.0, 39.0, 45.0, 53.0, 49.0, 38.0, 38.0, 41.0, 35.0, 33.0, 25.0, 16.0, 22.0, 15.0, 21.0, 13.0, 17.0, 7.0, 8.0, 8.0, 8.0, 4.0, 1.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.54443359375, -0.5277481079101562, -0.5110626220703125, -0.49437713623046875, -0.477691650390625, -0.46100616455078125, -0.4443206787109375, -0.42763519287109375, -0.41094970703125, -0.39426422119140625, -0.3775787353515625, -0.36089324951171875, -0.344207763671875, -0.32752227783203125, -0.3108367919921875, -0.29415130615234375, -0.2774658203125, -0.26078033447265625, -0.2440948486328125, -0.22740936279296875, -0.210723876953125, -0.19403839111328125, -0.1773529052734375, -0.16066741943359375, -0.14398193359375, -0.12729644775390625, -0.1106109619140625, -0.09392547607421875, -0.077239990234375, -0.06055450439453125, -0.0438690185546875, -0.02718353271484375, -0.010498046875, 0.00618743896484375, 0.0228729248046875, 0.03955841064453125, 0.056243896484375, 0.07292938232421875, 0.0896148681640625, 0.10630035400390625, 0.12298583984375, 0.13967132568359375, 0.1563568115234375, 0.17304229736328125, 0.189727783203125, 0.20641326904296875, 0.2230987548828125, 0.23978424072265625, 0.2564697265625, 0.27315521240234375, 0.2898406982421875, 0.30652618408203125, 0.323211669921875, 0.33989715576171875, 0.3565826416015625, 0.37326812744140625, 0.38995361328125, 0.40663909912109375, 0.4233245849609375, 0.44001007080078125, 0.456695556640625, 0.47338104248046875, 0.4900665283203125, 0.5067520141601562, 0.5234375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 6.0, 7.0, 7.0, 11.0, 11.0, 17.0, 24.0, 23.0, 31.0, 41.0, 71.0, 87.0, 160.0, 322.0, 715.0, 1775.0, 4466.0, 12013.0, 37619.0, 148681.0, 1970938.0, 1818605.0, 144001.0, 35962.0, 11583.0, 4174.0, 1600.0, 616.0, 277.0, 133.0, 78.0, 49.0, 43.0, 33.0, 18.0, 17.0, 17.0, 10.0, 12.0, 9.0, 3.0, 4.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.416015625, -2.340484619140625, -2.26495361328125, -2.189422607421875, -2.1138916015625, -2.038360595703125, -1.96282958984375, -1.887298583984375, -1.811767578125, -1.736236572265625, -1.66070556640625, -1.585174560546875, -1.5096435546875, -1.434112548828125, -1.35858154296875, -1.283050537109375, -1.20751953125, -1.131988525390625, -1.05645751953125, -0.980926513671875, -0.9053955078125, -0.829864501953125, -0.75433349609375, -0.678802490234375, -0.603271484375, -0.527740478515625, -0.45220947265625, -0.376678466796875, -0.3011474609375, -0.225616455078125, -0.15008544921875, -0.074554443359375, 0.0009765625, 0.076507568359375, 0.15203857421875, 0.227569580078125, 0.3031005859375, 0.378631591796875, 0.45416259765625, 0.529693603515625, 0.605224609375, 0.680755615234375, 0.75628662109375, 0.831817626953125, 0.9073486328125, 0.982879638671875, 1.05841064453125, 1.133941650390625, 1.20947265625, 1.285003662109375, 1.36053466796875, 1.436065673828125, 1.5115966796875, 1.587127685546875, 1.66265869140625, 1.738189697265625, 1.813720703125, 1.889251708984375, 1.96478271484375, 2.040313720703125, 2.1158447265625, 2.191375732421875, 2.26690673828125, 2.342437744140625, 2.41796875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 2.0, 13.0, 10.0, 13.0, 12.0, 16.0, 38.0, 41.0, 67.0, 81.0, 114.0, 181.0, 258.0, 420.0, 621.0, 664.0, 505.0, 309.0, 213.0, 159.0, 106.0, 52.0, 51.0, 38.0, 27.0, 19.0, 12.0, 8.0, 7.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.197265625, -2.13299560546875, -2.0687255859375, -2.00445556640625, -1.940185546875, -1.87591552734375, -1.8116455078125, -1.74737548828125, -1.68310546875, -1.61883544921875, -1.5545654296875, -1.49029541015625, -1.426025390625, -1.36175537109375, -1.2974853515625, -1.23321533203125, -1.1689453125, -1.10467529296875, -1.0404052734375, -0.97613525390625, -0.911865234375, -0.84759521484375, -0.7833251953125, -0.71905517578125, -0.65478515625, -0.59051513671875, -0.5262451171875, -0.46197509765625, -0.397705078125, -0.33343505859375, -0.2691650390625, -0.20489501953125, -0.140625, -0.07635498046875, -0.0120849609375, 0.05218505859375, 0.116455078125, 0.18072509765625, 0.2449951171875, 0.30926513671875, 0.37353515625, 0.43780517578125, 0.5020751953125, 0.56634521484375, 0.630615234375, 0.69488525390625, 0.7591552734375, 0.82342529296875, 0.8876953125, 0.95196533203125, 1.0162353515625, 1.08050537109375, 1.144775390625, 1.20904541015625, 1.2733154296875, 1.33758544921875, 1.40185546875, 1.46612548828125, 1.5303955078125, 1.59466552734375, 1.658935546875, 1.72320556640625, 1.7874755859375, 1.85174560546875, 1.916015625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 9.0, 14.0, 11.0, 21.0, 33.0, 58.0, 89.0, 157.0, 261.0, 454.0, 861.0, 1520.0, 2959.0, 6087.0, 13128.0, 32633.0, 98332.0, 404591.0, 2481168.0, 898052.0, 167413.0, 50580.0, 19156.0, 8317.0, 3981.0, 1899.0, 1073.0, 564.0, 347.0, 191.0, 111.0, 78.0, 51.0, 35.0, 18.0, 16.0, 8.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.24609375, -3.1468505859375, -3.047607421875, -2.9483642578125, -2.84912109375, -2.7498779296875, -2.650634765625, -2.5513916015625, -2.4521484375, -2.3529052734375, -2.253662109375, -2.1544189453125, -2.05517578125, -1.9559326171875, -1.856689453125, -1.7574462890625, -1.658203125, -1.5589599609375, -1.459716796875, -1.3604736328125, -1.26123046875, -1.1619873046875, -1.062744140625, -0.9635009765625, -0.8642578125, -0.7650146484375, -0.665771484375, -0.5665283203125, -0.46728515625, -0.3680419921875, -0.268798828125, -0.1695556640625, -0.0703125, 0.0289306640625, 0.128173828125, 0.2274169921875, 0.32666015625, 0.4259033203125, 0.525146484375, 0.6243896484375, 0.7236328125, 0.8228759765625, 0.922119140625, 1.0213623046875, 1.12060546875, 1.2198486328125, 1.319091796875, 1.4183349609375, 1.517578125, 1.6168212890625, 1.716064453125, 1.8153076171875, 1.91455078125, 2.0137939453125, 2.113037109375, 2.2122802734375, 2.3115234375, 2.4107666015625, 2.510009765625, 2.6092529296875, 2.70849609375, 2.8077392578125, 2.906982421875, 3.0062255859375, 3.10546875]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 7.0, 10.0, 10.0, 33.0, 34.0, 57.0, 80.0, 98.0, 118.0, 104.0, 128.0, 105.0, 71.0, 47.0, 36.0, 18.0, 28.0, 12.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.10332489013672, -16.73491668701172, -16.366506576538086, -15.998098373413086, -15.62968921661377, -15.261280059814453, -14.892870903015137, -14.52446174621582, -14.15605354309082, -13.787644386291504, -13.419235229492188, -13.050827026367188, -12.682417869567871, -12.314008712768555, -11.945599555969238, -11.577190399169922, -11.208781242370605, -10.840372085571289, -10.471962928771973, -10.103553771972656, -9.735145568847656, -9.36673641204834, -8.998327255249023, -8.629918098449707, -8.26150894165039, -7.893099784851074, -7.524691104888916, -7.1562819480896, -6.787873268127441, -6.419464111328125, -6.051054954528809, -5.682645797729492, -5.314238548278809, -4.945829391479492, -4.577420711517334, -4.209011554718018, -3.8406026363372803, -3.472193717956543, -3.1037845611572266, -2.7353756427764893, -2.366966724395752, -1.9985578060150146, -1.6301487684249878, -1.261739730834961, -0.8933308124542236, -0.5249218940734863, -0.15651273727416992, 0.21189618110656738, 0.5803050994873047, 0.9487140774726868, 1.3171230554580688, 1.6855320930480957, 2.053941011428833, 2.4223499298095703, 2.7907590866088867, 3.159168004989624, 3.5275769233703613, 3.8959858417510986, 4.264394760131836, 4.632803916931152, 5.001213073730469, 5.369621753692627, 5.738030910491943, 6.106439590454102, 6.474848747253418]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 6.0, 8.0, 6.0, 11.0, 10.0, 4.0, 10.0, 12.0, 26.0, 26.0, 14.0, 29.0, 23.0, 23.0, 24.0, 42.0, 38.0, 36.0, 45.0, 35.0, 37.0, 33.0, 40.0, 57.0, 30.0, 30.0, 32.0, 43.0, 31.0, 30.0, 27.0, 29.0, 18.0, 19.0, 19.0, 17.0, 10.0, 6.0, 12.0, 16.0, 10.0, 10.0, 6.0, 5.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 4.0, 4.0], "bins": [-5.397995948791504, -5.233646392822266, -5.069296836853027, -4.904946804046631, -4.740597248077393, -4.576247692108154, -4.411898136138916, -4.247548580169678, -4.083198547363281, -3.918848991394043, -3.7544991970062256, -3.5901496410369873, -3.42579984664917, -3.2614502906799316, -3.0971007347106934, -2.932751178741455, -2.768401622772217, -2.6040520668029785, -2.439702272415161, -2.275352716445923, -2.1110029220581055, -1.9466533660888672, -1.782303810119629, -1.617954134941101, -1.4536044597625732, -1.2892547845840454, -1.1249051094055176, -0.9605555534362793, -0.7962058782577515, -0.6318562030792236, -0.4675065875053406, -0.3031569719314575, -0.1388077735900879, 0.025541871786117554, 0.189891517162323, 0.35424116253852844, 0.5185908079147339, 0.6829404830932617, 0.8472900986671448, 1.0116397142410278, 1.1759893894195557, 1.3403390645980835, 1.5046887397766113, 1.6690382957458496, 1.8333879709243774, 1.9977376461029053, 2.1620872020721436, 2.326436996459961, 2.490786552429199, 2.6551361083984375, 2.819485902786255, 2.983835458755493, 3.1481852531433105, 3.312534809112549, 3.476884365081787, 3.6412339210510254, 3.8055837154388428, 3.969933271408081, 4.134283065795898, 4.298632621765137, 4.462982177734375, 4.627331733703613, 4.79168176651001, 4.956031322479248, 5.120380878448486]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 5.0, 3.0, 5.0, 1.0, 4.0, 12.0, 9.0, 10.0, 11.0, 16.0, 16.0, 17.0, 15.0, 15.0, 21.0, 22.0, 22.0, 27.0, 34.0, 34.0, 31.0, 45.0, 40.0, 43.0, 42.0, 45.0, 44.0, 40.0, 45.0, 21.0, 45.0, 27.0, 29.0, 26.0, 27.0, 24.0, 14.0, 18.0, 17.0, 13.0, 10.0, 14.0, 5.0, 5.0, 7.0, 6.0, 3.0, 7.0, 5.0, 1.0, 8.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.556640625, -0.5402145385742188, -0.5237884521484375, -0.5073623657226562, -0.490936279296875, -0.47451019287109375, -0.4580841064453125, -0.44165802001953125, -0.42523193359375, -0.40880584716796875, -0.3923797607421875, -0.37595367431640625, -0.359527587890625, -0.34310150146484375, -0.3266754150390625, -0.31024932861328125, -0.2938232421875, -0.27739715576171875, -0.2609710693359375, -0.24454498291015625, -0.228118896484375, -0.21169281005859375, -0.1952667236328125, -0.17884063720703125, -0.16241455078125, -0.14598846435546875, -0.1295623779296875, -0.11313629150390625, -0.096710205078125, -0.08028411865234375, -0.0638580322265625, -0.04743194580078125, -0.031005859375, -0.01457977294921875, 0.0018463134765625, 0.01827239990234375, 0.034698486328125, 0.05112457275390625, 0.0675506591796875, 0.08397674560546875, 0.10040283203125, 0.11682891845703125, 0.1332550048828125, 0.14968109130859375, 0.166107177734375, 0.18253326416015625, 0.1989593505859375, 0.21538543701171875, 0.2318115234375, 0.24823760986328125, 0.2646636962890625, 0.28108978271484375, 0.297515869140625, 0.31394195556640625, 0.3303680419921875, 0.34679412841796875, 0.36322021484375, 0.37964630126953125, 0.3960723876953125, 0.41249847412109375, 0.428924560546875, 0.44535064697265625, 0.4617767333984375, 0.47820281982421875, 0.49462890625]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 6.0, 7.0, 4.0, 15.0, 17.0, 25.0, 42.0, 52.0, 74.0, 104.0, 152.0, 242.0, 320.0, 453.0, 616.0, 882.0, 1243.0, 1791.0, 2551.0, 3594.0, 5502.0, 7694.0, 10835.0, 16095.0, 23682.0, 35320.0, 52549.0, 80611.0, 133252.0, 217587.0, 166530.0, 96524.0, 61264.0, 40945.0, 27589.0, 18641.0, 12863.0, 8826.0, 5968.0, 4293.0, 2999.0, 1988.0, 1375.0, 1073.0, 658.0, 520.0, 360.0, 260.0, 168.0, 128.0, 82.0, 57.0, 58.0, 38.0, 22.0, 11.0, 5.0, 3.0, 4.0, 2.0], "bins": [-1.2265625, -1.190155029296875, -1.15374755859375, -1.117340087890625, -1.0809326171875, -1.044525146484375, -1.00811767578125, -0.971710205078125, -0.935302734375, -0.898895263671875, -0.86248779296875, -0.826080322265625, -0.7896728515625, -0.753265380859375, -0.71685791015625, -0.680450439453125, -0.64404296875, -0.607635498046875, -0.57122802734375, -0.534820556640625, -0.4984130859375, -0.462005615234375, -0.42559814453125, -0.389190673828125, -0.352783203125, -0.316375732421875, -0.27996826171875, -0.243560791015625, -0.2071533203125, -0.170745849609375, -0.13433837890625, -0.097930908203125, -0.0615234375, -0.025115966796875, 0.01129150390625, 0.047698974609375, 0.0841064453125, 0.120513916015625, 0.15692138671875, 0.193328857421875, 0.229736328125, 0.266143798828125, 0.30255126953125, 0.338958740234375, 0.3753662109375, 0.411773681640625, 0.44818115234375, 0.484588623046875, 0.52099609375, 0.557403564453125, 0.59381103515625, 0.630218505859375, 0.6666259765625, 0.703033447265625, 0.73944091796875, 0.775848388671875, 0.812255859375, 0.848663330078125, 0.88507080078125, 0.921478271484375, 0.9578857421875, 0.994293212890625, 1.03070068359375, 1.067108154296875, 1.103515625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 7.0, 3.0, 5.0, 10.0, 8.0, 10.0, 9.0, 22.0, 20.0, 27.0, 14.0, 25.0, 26.0, 30.0, 26.0, 34.0, 38.0, 38.0, 37.0, 41.0, 36.0, 1065.0, 39.0, 38.0, 47.0, 34.0, 41.0, 31.0, 35.0, 33.0, 28.0, 24.0, 36.0, 18.0, 12.0, 17.0, 11.0, 9.0, 7.0, 7.0, 6.0, 6.0, 6.0, 6.0, 2.0, 5.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.5830078125, -0.56671142578125, -0.5504150390625, -0.53411865234375, -0.517822265625, -0.50152587890625, -0.4852294921875, -0.46893310546875, -0.45263671875, -0.43634033203125, -0.4200439453125, -0.40374755859375, -0.387451171875, -0.37115478515625, -0.3548583984375, -0.33856201171875, -0.322265625, -0.30596923828125, -0.2896728515625, -0.27337646484375, -0.257080078125, -0.24078369140625, -0.2244873046875, -0.20819091796875, -0.19189453125, -0.17559814453125, -0.1593017578125, -0.14300537109375, -0.126708984375, -0.11041259765625, -0.0941162109375, -0.07781982421875, -0.0615234375, -0.04522705078125, -0.0289306640625, -0.01263427734375, 0.003662109375, 0.01995849609375, 0.0362548828125, 0.05255126953125, 0.06884765625, 0.08514404296875, 0.1014404296875, 0.11773681640625, 0.134033203125, 0.15032958984375, 0.1666259765625, 0.18292236328125, 0.19921875, 0.21551513671875, 0.2318115234375, 0.24810791015625, 0.264404296875, 0.28070068359375, 0.2969970703125, 0.31329345703125, 0.32958984375, 0.34588623046875, 0.3621826171875, 0.37847900390625, 0.394775390625, 0.41107177734375, 0.4273681640625, 0.44366455078125, 0.4599609375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 9.0, 20.0, 31.0, 45.0, 52.0, 73.0, 132.0, 170.0, 225.0, 327.0, 513.0, 714.0, 1038.0, 1655.0, 2564.0, 3900.0, 6026.0, 10120.0, 17274.0, 30450.0, 59212.0, 134633.0, 428811.0, 943207.0, 254523.0, 95836.0, 44741.0, 24169.0, 13825.0, 8215.0, 5071.0, 3160.0, 2042.0, 1475.0, 953.0, 607.0, 410.0, 310.0, 166.0, 107.0, 116.0, 68.0, 50.0, 24.0, 25.0, 8.0, 11.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 4.0], "bins": [-1.0302734375, -0.9993362426757812, -0.9683990478515625, -0.9374618530273438, -0.906524658203125, -0.8755874633789062, -0.8446502685546875, -0.8137130737304688, -0.78277587890625, -0.7518386840820312, -0.7209014892578125, -0.6899642944335938, -0.659027099609375, -0.6280899047851562, -0.5971527099609375, -0.5662155151367188, -0.5352783203125, -0.5043411254882812, -0.4734039306640625, -0.44246673583984375, -0.411529541015625, -0.38059234619140625, -0.3496551513671875, -0.31871795654296875, -0.28778076171875, -0.25684356689453125, -0.2259063720703125, -0.19496917724609375, -0.164031982421875, -0.13309478759765625, -0.1021575927734375, -0.07122039794921875, -0.040283203125, -0.00934600830078125, 0.0215911865234375, 0.05252838134765625, 0.083465576171875, 0.11440277099609375, 0.1453399658203125, 0.17627716064453125, 0.20721435546875, 0.23815155029296875, 0.2690887451171875, 0.30002593994140625, 0.330963134765625, 0.36190032958984375, 0.3928375244140625, 0.42377471923828125, 0.4547119140625, 0.48564910888671875, 0.5165863037109375, 0.5475234985351562, 0.578460693359375, 0.6093978881835938, 0.6403350830078125, 0.6712722778320312, 0.70220947265625, 0.7331466674804688, 0.7640838623046875, 0.7950210571289062, 0.825958251953125, 0.8568954467773438, 0.8878326416015625, 0.9187698364257812, 0.94970703125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 5.0, 6.0, 1.0, 5.0, 1.0, 4.0, 6.0, 9.0, 4.0, 7.0, 15.0, 13.0, 16.0, 25.0, 40.0, 35.0, 57.0, 71.0, 121.0, 133.0, 95.0, 72.0, 62.0, 34.0, 34.0, 30.0, 16.0, 19.0, 13.0, 7.0, 10.0, 5.0, 3.0, 4.0, 4.0, 1.0, 5.0, 3.0, 6.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.6044921875, -0.587493896484375, -0.57049560546875, -0.553497314453125, -0.5364990234375, -0.519500732421875, -0.50250244140625, -0.485504150390625, -0.468505859375, -0.451507568359375, -0.43450927734375, -0.417510986328125, -0.4005126953125, -0.383514404296875, -0.36651611328125, -0.349517822265625, -0.33251953125, -0.315521240234375, -0.29852294921875, -0.281524658203125, -0.2645263671875, -0.247528076171875, -0.23052978515625, -0.213531494140625, -0.196533203125, -0.179534912109375, -0.16253662109375, -0.145538330078125, -0.1285400390625, -0.111541748046875, -0.09454345703125, -0.077545166015625, -0.060546875, -0.043548583984375, -0.02655029296875, -0.009552001953125, 0.0074462890625, 0.024444580078125, 0.04144287109375, 0.058441162109375, 0.075439453125, 0.092437744140625, 0.10943603515625, 0.126434326171875, 0.1434326171875, 0.160430908203125, 0.17742919921875, 0.194427490234375, 0.21142578125, 0.228424072265625, 0.24542236328125, 0.262420654296875, 0.2794189453125, 0.296417236328125, 0.31341552734375, 0.330413818359375, 0.347412109375, 0.364410400390625, 0.38140869140625, 0.398406982421875, 0.4154052734375, 0.432403564453125, 0.44940185546875, 0.466400146484375, 0.4833984375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 5.0, 5.0, 4.0, 8.0, 10.0, 8.0, 7.0, 9.0, 15.0, 14.0, 17.0, 23.0, 26.0, 24.0, 41.0, 49.0, 80.0, 98.0, 144.0, 315.0, 822.0, 5189.0, 73338.0, 920985.0, 42076.0, 3749.0, 668.0, 244.0, 167.0, 89.0, 67.0, 55.0, 30.0, 29.0, 19.0, 13.0, 18.0, 21.0, 15.0, 7.0, 12.0, 8.0, 5.0, 6.0, 6.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.8671875, -6.64862060546875, -6.4300537109375, -6.21148681640625, -5.992919921875, -5.77435302734375, -5.5557861328125, -5.33721923828125, -5.11865234375, -4.90008544921875, -4.6815185546875, -4.46295166015625, -4.244384765625, -4.02581787109375, -3.8072509765625, -3.58868408203125, -3.3701171875, -3.15155029296875, -2.9329833984375, -2.71441650390625, -2.495849609375, -2.27728271484375, -2.0587158203125, -1.84014892578125, -1.62158203125, -1.40301513671875, -1.1844482421875, -0.96588134765625, -0.747314453125, -0.52874755859375, -0.3101806640625, -0.09161376953125, 0.126953125, 0.34552001953125, 0.5640869140625, 0.78265380859375, 1.001220703125, 1.21978759765625, 1.4383544921875, 1.65692138671875, 1.87548828125, 2.09405517578125, 2.3126220703125, 2.53118896484375, 2.749755859375, 2.96832275390625, 3.1868896484375, 3.40545654296875, 3.6240234375, 3.84259033203125, 4.0611572265625, 4.27972412109375, 4.498291015625, 4.71685791015625, 4.9354248046875, 5.15399169921875, 5.37255859375, 5.59112548828125, 5.8096923828125, 6.02825927734375, 6.246826171875, 6.46539306640625, 6.6839599609375, 6.90252685546875, 7.12109375]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 33.0, 46.0, 177.0, 298.0, 271.0, 114.0, 45.0, 18.0, 7.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9730452299118042, -1.8867396116256714, -1.800433874130249, -1.7141282558441162, -1.6278225183486938, -1.541516900062561, -1.4552111625671387, -1.3689055442810059, -1.282599925994873, -1.1962943077087402, -1.1099885702133179, -1.023682951927185, -0.9373772144317627, -0.8510715961456299, -0.7647659182548523, -0.6784602403640747, -0.5921545028686523, -0.5058488249778748, -0.41954314708709717, -0.33323749899864197, -0.24693182110786438, -0.1606261432170868, -0.07432049512863159, 0.011985182762145996, 0.09829086065292358, 0.18459653854370117, 0.27090221643447876, 0.35720786452293396, 0.44351354241371155, 0.5298192501068115, 0.6161248683929443, 0.7024305462837219, 0.78873610496521, 0.8750417828559875, 0.9613474607467651, 1.047653079032898, 1.1339588165283203, 1.2202644348144531, 1.306570053100586, 1.3928757905960083, 1.4791815280914307, 1.5654871463775635, 1.6517928838729858, 1.7380985021591187, 1.824404239654541, 1.9107098579406738, 1.9970154762268066, 2.0833210945129395, 2.1696267127990723, 2.255932331085205, 2.342237949371338, 2.42854380607605, 2.5148494243621826, 2.6011550426483154, 2.6874606609344482, 2.77376651763916, 2.860072135925293, 2.946377754211426, 3.0326833724975586, 3.1189892292022705, 3.2052948474884033, 3.291600465774536, 3.377906084060669, 3.464211940765381, 3.5505175590515137]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 0.0, 5.0, 5.0, 12.0, 11.0, 14.0, 18.0, 17.0, 14.0, 19.0, 21.0, 30.0, 36.0, 30.0, 34.0, 49.0, 44.0, 50.0, 43.0, 49.0, 48.0, 53.0, 60.0, 38.0, 33.0, 53.0, 26.0, 31.0, 16.0, 22.0, 31.0, 17.0, 21.0, 14.0, 9.0, 8.0, 10.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8940014839172363, -0.8682159185409546, -0.8424303531646729, -0.8166448473930359, -0.7908592820167542, -0.7650737166404724, -0.7392882108688354, -0.7135026454925537, -0.687717080116272, -0.6619315147399902, -0.6361459493637085, -0.6103604435920715, -0.5845748782157898, -0.5587893128395081, -0.5330038070678711, -0.5072182416915894, -0.4814326763153076, -0.4556471109390259, -0.42986157536506653, -0.4040760397911072, -0.37829047441482544, -0.3525049090385437, -0.32671937346458435, -0.300933837890625, -0.27514827251434326, -0.24936272203922272, -0.22357717156410217, -0.19779162108898163, -0.17200607061386108, -0.14622052013874054, -0.12043496966362, -0.09464941918849945, -0.06886392831802368, -0.04307837784290314, -0.017292827367782593, 0.008492723107337952, 0.034278273582458496, 0.06006382405757904, 0.08584937453269958, 0.11163492500782013, 0.13742047548294067, 0.16320602595806122, 0.18899157643318176, 0.2147771269083023, 0.24056267738342285, 0.2663482427597046, 0.29213377833366394, 0.3179193139076233, 0.34370487928390503, 0.36949044466018677, 0.3952759802341461, 0.42106151580810547, 0.4468470811843872, 0.47263264656066895, 0.4984181821346283, 0.5242037177085876, 0.5499892830848694, 0.5757748484611511, 0.6015603542327881, 0.6273459196090698, 0.6531314849853516, 0.6789170503616333, 0.704702615737915, 0.730488121509552, 0.7562736868858337]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 1.0, 6.0, 4.0, 3.0, 1.0, 5.0, 7.0, 13.0, 6.0, 13.0, 17.0, 11.0, 11.0, 13.0, 22.0, 20.0, 18.0, 31.0, 22.0, 21.0, 39.0, 37.0, 38.0, 42.0, 41.0, 41.0, 44.0, 47.0, 50.0, 33.0, 31.0, 34.0, 41.0, 33.0, 19.0, 26.0, 20.0, 20.0, 22.0, 19.0, 13.0, 11.0, 15.0, 8.0, 3.0, 5.0, 6.0, 6.0, 3.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.55078125, -0.5342330932617188, -0.5176849365234375, -0.5011367797851562, -0.484588623046875, -0.46804046630859375, -0.4514923095703125, -0.43494415283203125, -0.41839599609375, -0.40184783935546875, -0.3852996826171875, -0.36875152587890625, -0.352203369140625, -0.33565521240234375, -0.3191070556640625, -0.30255889892578125, -0.2860107421875, -0.26946258544921875, -0.2529144287109375, -0.23636627197265625, -0.219818115234375, -0.20326995849609375, -0.1867218017578125, -0.17017364501953125, -0.15362548828125, -0.13707733154296875, -0.1205291748046875, -0.10398101806640625, -0.087432861328125, -0.07088470458984375, -0.0543365478515625, -0.03778839111328125, -0.021240234375, -0.00469207763671875, 0.0118560791015625, 0.02840423583984375, 0.044952392578125, 0.06150054931640625, 0.0780487060546875, 0.09459686279296875, 0.11114501953125, 0.12769317626953125, 0.1442413330078125, 0.16078948974609375, 0.177337646484375, 0.19388580322265625, 0.2104339599609375, 0.22698211669921875, 0.2435302734375, 0.26007843017578125, 0.2766265869140625, 0.29317474365234375, 0.309722900390625, 0.32627105712890625, 0.3428192138671875, 0.35936737060546875, 0.37591552734375, 0.39246368408203125, 0.4090118408203125, 0.42555999755859375, 0.442108154296875, 0.45865631103515625, 0.4752044677734375, 0.49175262451171875, 0.50830078125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 3.0, 4.0, 12.0, 11.0, 16.0, 27.0, 25.0, 43.0, 51.0, 81.0, 113.0, 180.0, 240.0, 329.0, 476.0, 780.0, 1053.0, 1722.0, 2854.0, 4943.0, 9696.0, 22938.0, 73045.0, 301968.0, 445426.0, 120348.0, 33728.0, 12815.0, 6225.0, 3428.0, 1997.0, 1291.0, 834.0, 521.0, 394.0, 261.0, 207.0, 117.0, 91.0, 71.0, 48.0, 31.0, 33.0, 21.0, 20.0, 7.0, 9.0, 6.0, 5.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.56640625, -1.519195556640625, -1.47198486328125, -1.424774169921875, -1.3775634765625, -1.330352783203125, -1.28314208984375, -1.235931396484375, -1.188720703125, -1.141510009765625, -1.09429931640625, -1.047088623046875, -0.9998779296875, -0.952667236328125, -0.90545654296875, -0.858245849609375, -0.81103515625, -0.763824462890625, -0.71661376953125, -0.669403076171875, -0.6221923828125, -0.574981689453125, -0.52777099609375, -0.480560302734375, -0.433349609375, -0.386138916015625, -0.33892822265625, -0.291717529296875, -0.2445068359375, -0.197296142578125, -0.15008544921875, -0.102874755859375, -0.0556640625, -0.008453369140625, 0.03875732421875, 0.085968017578125, 0.1331787109375, 0.180389404296875, 0.22760009765625, 0.274810791015625, 0.322021484375, 0.369232177734375, 0.41644287109375, 0.463653564453125, 0.5108642578125, 0.558074951171875, 0.60528564453125, 0.652496337890625, 0.69970703125, 0.746917724609375, 0.79412841796875, 0.841339111328125, 0.8885498046875, 0.935760498046875, 0.98297119140625, 1.030181884765625, 1.077392578125, 1.124603271484375, 1.17181396484375, 1.219024658203125, 1.2662353515625, 1.313446044921875, 1.36065673828125, 1.407867431640625, 1.455078125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 4.0, 11.0, 7.0, 13.0, 7.0, 13.0, 18.0, 19.0, 16.0, 21.0, 23.0, 37.0, 50.0, 37.0, 53.0, 58.0, 73.0, 130.0, 201.0, 1288.0, 250.0, 151.0, 111.0, 74.0, 40.0, 46.0, 33.0, 27.0, 35.0, 33.0, 32.0, 21.0, 12.0, 23.0, 8.0, 14.0, 14.0, 8.0, 9.0, 5.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.9453125, -1.882049560546875, -1.81878662109375, -1.755523681640625, -1.6922607421875, -1.628997802734375, -1.56573486328125, -1.502471923828125, -1.439208984375, -1.375946044921875, -1.31268310546875, -1.249420166015625, -1.1861572265625, -1.122894287109375, -1.05963134765625, -0.996368408203125, -0.93310546875, -0.869842529296875, -0.80657958984375, -0.743316650390625, -0.6800537109375, -0.616790771484375, -0.55352783203125, -0.490264892578125, -0.427001953125, -0.363739013671875, -0.30047607421875, -0.237213134765625, -0.1739501953125, -0.110687255859375, -0.04742431640625, 0.015838623046875, 0.0791015625, 0.142364501953125, 0.20562744140625, 0.268890380859375, 0.3321533203125, 0.395416259765625, 0.45867919921875, 0.521942138671875, 0.585205078125, 0.648468017578125, 0.71173095703125, 0.774993896484375, 0.8382568359375, 0.901519775390625, 0.96478271484375, 1.028045654296875, 1.09130859375, 1.154571533203125, 1.21783447265625, 1.281097412109375, 1.3443603515625, 1.407623291015625, 1.47088623046875, 1.534149169921875, 1.597412109375, 1.660675048828125, 1.72393798828125, 1.787200927734375, 1.8504638671875, 1.913726806640625, 1.97698974609375, 2.040252685546875, 2.103515625]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 8.0, 10.0, 17.0, 20.0, 31.0, 27.0, 48.0, 64.0, 106.0, 171.0, 240.0, 444.0, 792.0, 1507.0, 3021.0, 7069.0, 19982.0, 92467.0, 1276830.0, 1596395.0, 110026.0, 22298.0, 7481.0, 3127.0, 1566.0, 754.0, 460.0, 258.0, 147.0, 101.0, 74.0, 45.0, 25.0, 20.0, 18.0, 10.0, 12.0, 10.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.0625, -2.9669189453125, -2.871337890625, -2.7757568359375, -2.68017578125, -2.5845947265625, -2.489013671875, -2.3934326171875, -2.2978515625, -2.2022705078125, -2.106689453125, -2.0111083984375, -1.91552734375, -1.8199462890625, -1.724365234375, -1.6287841796875, -1.533203125, -1.4376220703125, -1.342041015625, -1.2464599609375, -1.15087890625, -1.0552978515625, -0.959716796875, -0.8641357421875, -0.7685546875, -0.6729736328125, -0.577392578125, -0.4818115234375, -0.38623046875, -0.2906494140625, -0.195068359375, -0.0994873046875, -0.00390625, 0.0916748046875, 0.187255859375, 0.2828369140625, 0.37841796875, 0.4739990234375, 0.569580078125, 0.6651611328125, 0.7607421875, 0.8563232421875, 0.951904296875, 1.0474853515625, 1.14306640625, 1.2386474609375, 1.334228515625, 1.4298095703125, 1.525390625, 1.6209716796875, 1.716552734375, 1.8121337890625, 1.90771484375, 2.0032958984375, 2.098876953125, 2.1944580078125, 2.2900390625, 2.3856201171875, 2.481201171875, 2.5767822265625, 2.67236328125, 2.7679443359375, 2.863525390625, 2.9591064453125, 3.0546875]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 13.0, 160.0, 516.0, 297.0, 31.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-48.6098747253418, -47.610504150390625, -46.61112976074219, -45.611759185791016, -44.61238479614258, -43.613014221191406, -42.613643646240234, -41.6142692565918, -40.614898681640625, -39.61552810668945, -38.616153717041016, -37.616783142089844, -36.617408752441406, -35.618038177490234, -34.61866760253906, -33.619293212890625, -32.61992263793945, -31.62055015563965, -30.621177673339844, -29.621807098388672, -28.622434616088867, -27.623062133789062, -26.623689651489258, -25.624317169189453, -24.62494468688965, -23.625572204589844, -22.62619972229004, -21.626829147338867, -20.627456665039062, -19.628084182739258, -18.628711700439453, -17.62934112548828, -16.629968643188477, -15.630596160888672, -14.631224632263184, -13.631852149963379, -12.63248062133789, -11.633108139038086, -10.633735656738281, -9.634364128112793, -8.634992599487305, -7.635620594024658, -6.636248588562012, -5.636876106262207, -4.637504577636719, -3.638132095336914, -2.6387600898742676, -1.639388084411621, -0.6400156021118164, 0.35935646295547485, 1.3587285280227661, 2.358100652694702, 3.3574726581573486, 4.356844902038574, 5.356216907501221, 6.355588912963867, 7.354960918426514, 8.35433292388916, 9.353705406188965, 10.353076934814453, 11.352449417114258, 12.351821899414062, 13.35119342803955, 14.350564956665039, 15.349937438964844]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 5.0, 2.0, 8.0, 2.0, 10.0, 10.0, 4.0, 24.0, 9.0, 20.0, 20.0, 23.0, 35.0, 33.0, 32.0, 35.0, 38.0, 37.0, 30.0, 51.0, 44.0, 36.0, 48.0, 43.0, 30.0, 53.0, 44.0, 30.0, 34.0, 42.0, 35.0, 24.0, 22.0, 14.0, 19.0, 12.0, 12.0, 11.0, 8.0, 7.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-7.972020149230957, -7.7430925369262695, -7.514164924621582, -7.285237789154053, -7.056310176849365, -6.827382564544678, -6.598455429077148, -6.369527816772461, -6.140600204467773, -5.911672592163086, -5.682744979858398, -5.453817844390869, -5.224890232086182, -4.995962619781494, -4.767035484313965, -4.538107872009277, -4.30918025970459, -4.080252647399902, -3.851325273513794, -3.6223978996276855, -3.393470287322998, -3.1645426750183105, -2.935615301132202, -2.7066879272460938, -2.4777603149414062, -2.2488327026367188, -2.0199053287506104, -1.7909778356552124, -1.5620503425598145, -1.3331228494644165, -1.1041953563690186, -0.8752678632736206, -0.6463403701782227, -0.4174128770828247, -0.18848538398742676, 0.04044210910797119, 0.26936960220336914, 0.4982970952987671, 0.727224588394165, 0.956152081489563, 1.185079574584961, 1.4140070676803589, 1.6429345607757568, 1.8718620538711548, 2.1007895469665527, 2.3297171592712402, 2.5586445331573486, 2.787571907043457, 3.0164995193481445, 3.245427131652832, 3.4743545055389404, 3.703281879425049, 3.9322094917297363, 4.161137104034424, 4.390064239501953, 4.618991851806641, 4.847919464111328, 5.076847076416016, 5.305774688720703, 5.534701824188232, 5.76362943649292, 5.992557048797607, 6.221484184265137, 6.450411796569824, 6.679339408874512]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 1.0, 4.0, 5.0, 5.0, 9.0, 10.0, 12.0, 9.0, 17.0, 13.0, 22.0, 6.0, 34.0, 14.0, 24.0, 25.0, 27.0, 32.0, 30.0, 31.0, 48.0, 35.0, 31.0, 56.0, 43.0, 40.0, 28.0, 46.0, 35.0, 28.0, 26.0, 28.0, 27.0, 25.0, 28.0, 17.0, 28.0, 18.0, 11.0, 12.0, 11.0, 14.0, 9.0, 1.0, 2.0, 5.0, 5.0, 7.0, 1.0, 0.0, 4.0, 2.0, 5.0, 1.0, 0.0, 2.0], "bins": [-0.5556640625, -0.538330078125, -0.52099609375, -0.503662109375, -0.486328125, -0.468994140625, -0.45166015625, -0.434326171875, -0.4169921875, -0.399658203125, -0.38232421875, -0.364990234375, -0.34765625, -0.330322265625, -0.31298828125, -0.295654296875, -0.2783203125, -0.260986328125, -0.24365234375, -0.226318359375, -0.208984375, -0.191650390625, -0.17431640625, -0.156982421875, -0.1396484375, -0.122314453125, -0.10498046875, -0.087646484375, -0.0703125, -0.052978515625, -0.03564453125, -0.018310546875, -0.0009765625, 0.016357421875, 0.03369140625, 0.051025390625, 0.068359375, 0.085693359375, 0.10302734375, 0.120361328125, 0.1376953125, 0.155029296875, 0.17236328125, 0.189697265625, 0.20703125, 0.224365234375, 0.24169921875, 0.259033203125, 0.2763671875, 0.293701171875, 0.31103515625, 0.328369140625, 0.345703125, 0.363037109375, 0.38037109375, 0.397705078125, 0.4150390625, 0.432373046875, 0.44970703125, 0.467041015625, 0.484375, 0.501708984375, 0.51904296875, 0.536376953125, 0.5537109375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 3.0, 3.0, 3.0, 6.0, 5.0, 6.0, 11.0, 19.0, 14.0, 20.0, 33.0, 47.0, 46.0, 89.0, 121.0, 219.0, 336.0, 597.0, 998.0, 1798.0, 3433.0, 6564.0, 14003.0, 31969.0, 93755.0, 525400.0, 2793148.0, 562655.0, 97644.0, 33453.0, 14036.0, 6470.0, 3350.0, 1707.0, 947.0, 515.0, 276.0, 191.0, 130.0, 68.0, 51.0, 26.0, 32.0, 23.0, 13.0, 13.0, 14.0, 4.0, 8.0, 3.0, 2.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-1.6328125, -1.5792999267578125, -1.525787353515625, -1.4722747802734375, -1.41876220703125, -1.3652496337890625, -1.311737060546875, -1.2582244873046875, -1.2047119140625, -1.1511993408203125, -1.097686767578125, -1.0441741943359375, -0.99066162109375, -0.9371490478515625, -0.883636474609375, -0.8301239013671875, -0.776611328125, -0.7230987548828125, -0.669586181640625, -0.6160736083984375, -0.56256103515625, -0.5090484619140625, -0.455535888671875, -0.4020233154296875, -0.3485107421875, -0.2949981689453125, -0.241485595703125, -0.1879730224609375, -0.13446044921875, -0.0809478759765625, -0.027435302734375, 0.0260772705078125, 0.07958984375, 0.1331024169921875, 0.186614990234375, 0.2401275634765625, 0.29364013671875, 0.3471527099609375, 0.400665283203125, 0.4541778564453125, 0.5076904296875, 0.5612030029296875, 0.614715576171875, 0.6682281494140625, 0.72174072265625, 0.7752532958984375, 0.828765869140625, 0.8822784423828125, 0.935791015625, 0.9893035888671875, 1.042816162109375, 1.0963287353515625, 1.14984130859375, 1.2033538818359375, 1.256866455078125, 1.3103790283203125, 1.3638916015625, 1.4174041748046875, 1.470916748046875, 1.5244293212890625, 1.57794189453125, 1.6314544677734375, 1.684967041015625, 1.7384796142578125, 1.7919921875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 2.0, 10.0, 15.0, 10.0, 31.0, 32.0, 47.0, 49.0, 64.0, 113.0, 178.0, 230.0, 365.0, 568.0, 718.0, 557.0, 331.0, 210.0, 167.0, 107.0, 78.0, 47.0, 35.0, 31.0, 20.0, 11.0, 14.0, 13.0, 3.0, 2.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-2.626953125, -2.5620574951171875, -2.497161865234375, -2.4322662353515625, -2.36737060546875, -2.3024749755859375, -2.237579345703125, -2.1726837158203125, -2.1077880859375, -2.0428924560546875, -1.977996826171875, -1.9131011962890625, -1.84820556640625, -1.7833099365234375, -1.718414306640625, -1.6535186767578125, -1.588623046875, -1.5237274169921875, -1.458831787109375, -1.3939361572265625, -1.32904052734375, -1.2641448974609375, -1.199249267578125, -1.1343536376953125, -1.0694580078125, -1.0045623779296875, -0.939666748046875, -0.8747711181640625, -0.80987548828125, -0.7449798583984375, -0.680084228515625, -0.6151885986328125, -0.55029296875, -0.4853973388671875, -0.420501708984375, -0.3556060791015625, -0.29071044921875, -0.2258148193359375, -0.160919189453125, -0.0960235595703125, -0.0311279296875, 0.0337677001953125, 0.098663330078125, 0.1635589599609375, 0.22845458984375, 0.2933502197265625, 0.358245849609375, 0.4231414794921875, 0.488037109375, 0.5529327392578125, 0.617828369140625, 0.6827239990234375, 0.74761962890625, 0.8125152587890625, 0.877410888671875, 0.9423065185546875, 1.0072021484375, 1.0720977783203125, 1.136993408203125, 1.2018890380859375, 1.26678466796875, 1.3316802978515625, 1.396575927734375, 1.4614715576171875, 1.5263671875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 4.0, 6.0, 9.0, 13.0, 11.0, 18.0, 23.0, 40.0, 60.0, 69.0, 131.0, 226.0, 416.0, 830.0, 1762.0, 3629.0, 8510.0, 23255.0, 74160.0, 359721.0, 2816297.0, 736175.0, 115591.0, 32548.0, 11682.0, 4674.0, 2105.0, 1003.0, 499.0, 292.0, 174.0, 99.0, 61.0, 42.0, 38.0, 32.0, 22.0, 14.0, 6.0, 6.0, 6.0, 7.0, 5.0, 3.0, 0.0, 2.0, 0.0, 3.0], "bins": [-4.1328125, -4.02008056640625, -3.9073486328125, -3.79461669921875, -3.681884765625, -3.56915283203125, -3.4564208984375, -3.34368896484375, -3.23095703125, -3.11822509765625, -3.0054931640625, -2.89276123046875, -2.780029296875, -2.66729736328125, -2.5545654296875, -2.44183349609375, -2.3291015625, -2.21636962890625, -2.1036376953125, -1.99090576171875, -1.878173828125, -1.76544189453125, -1.6527099609375, -1.53997802734375, -1.42724609375, -1.31451416015625, -1.2017822265625, -1.08905029296875, -0.976318359375, -0.86358642578125, -0.7508544921875, -0.63812255859375, -0.525390625, -0.41265869140625, -0.2999267578125, -0.18719482421875, -0.074462890625, 0.03826904296875, 0.1510009765625, 0.26373291015625, 0.37646484375, 0.48919677734375, 0.6019287109375, 0.71466064453125, 0.827392578125, 0.94012451171875, 1.0528564453125, 1.16558837890625, 1.2783203125, 1.39105224609375, 1.5037841796875, 1.61651611328125, 1.729248046875, 1.84197998046875, 1.9547119140625, 2.06744384765625, 2.18017578125, 2.29290771484375, 2.4056396484375, 2.51837158203125, 2.631103515625, 2.74383544921875, 2.8565673828125, 2.96929931640625, 3.08203125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 8.0, 12.0, 14.0, 40.0, 82.0, 122.0, 172.0, 180.0, 140.0, 110.0, 61.0, 32.0, 18.0, 15.0, 1.0, 3.0, 1.0, 1.0], "bins": [-29.702730178833008, -29.145294189453125, -28.587860107421875, -28.030424118041992, -27.47298812866211, -26.91555404663086, -26.358118057250977, -25.800682067871094, -25.243247985839844, -24.68581199645996, -24.12837791442871, -23.570941925048828, -23.013505935668945, -22.456071853637695, -21.898635864257812, -21.34119987487793, -20.783763885498047, -20.226327896118164, -19.668893814086914, -19.11145782470703, -18.55402183532715, -17.9965877532959, -17.439151763916016, -16.881715774536133, -16.324281692504883, -15.766846656799316, -15.209410667419434, -14.651975631713867, -14.0945405960083, -13.537105560302734, -12.979669570922852, -12.422234535217285, -11.864800453186035, -11.307365417480469, -10.749929428100586, -10.19249439239502, -9.635059356689453, -9.07762336730957, -8.520188331604004, -7.9627532958984375, -7.405317783355713, -6.847882270812988, -6.290447235107422, -5.733011722564697, -5.175576210021973, -4.618141174316406, -4.060705661773682, -3.503270387649536, -2.9458351135253906, -2.388399839401245, -1.83096444606781, -1.273529052734375, -0.7160937786102295, -0.15865850448608398, 0.3987770080566406, 0.9562122821807861, 1.5136475563049316, 2.071082830429077, 2.6285181045532227, 3.1859536170959473, 3.7433888912200928, 4.300824165344238, 4.858259677886963, 5.4156951904296875, 5.973130226135254]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 5.0, 4.0, 6.0, 8.0, 9.0, 16.0, 13.0, 19.0, 12.0, 17.0, 21.0, 17.0, 26.0, 35.0, 38.0, 35.0, 30.0, 44.0, 35.0, 36.0, 39.0, 42.0, 39.0, 40.0, 38.0, 37.0, 29.0, 30.0, 31.0, 30.0, 39.0, 23.0, 27.0, 24.0, 27.0, 12.0, 10.0, 7.0, 9.0, 12.0, 5.0, 6.0, 8.0, 0.0, 5.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0], "bins": [-5.700688362121582, -5.527646064758301, -5.3546037673950195, -5.181561470031738, -5.008519172668457, -4.835476875305176, -4.6624345779418945, -4.489392280578613, -4.316349983215332, -4.143307685852051, -3.9702653884887695, -3.7972230911254883, -3.624180793762207, -3.451138496398926, -3.2780964374542236, -3.1050541400909424, -2.9320120811462402, -2.758969783782959, -2.5859274864196777, -2.4128851890563965, -2.2398428916931152, -2.066800594329834, -1.8937585353851318, -1.7207162380218506, -1.5476739406585693, -1.374631643295288, -1.2015893459320068, -1.0285471677780151, -0.8555048704147339, -0.6824625730514526, -0.5094203948974609, -0.3363780975341797, -0.16333532333374023, 0.009706944227218628, 0.1827492117881775, 0.35579144954681396, 0.5288337469100952, 0.7018760442733765, 0.8749182224273682, 1.0479605197906494, 1.2210028171539307, 1.394045114517212, 1.5670874118804932, 1.7401295900344849, 1.9131718873977661, 2.086214065551758, 2.259256362915039, 2.4322986602783203, 2.6053409576416016, 2.778383255004883, 2.951425552368164, 3.1244678497314453, 3.2975101470947266, 3.470552444458008, 3.64359450340271, 3.816636800765991, 3.9896790981292725, 4.162721157073975, 4.335763454437256, 4.508805751800537, 4.681848049163818, 4.8548903465271, 5.027932643890381, 5.200974941253662, 5.374017238616943]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 4.0, 2.0, 7.0, 8.0, 10.0, 6.0, 9.0, 15.0, 14.0, 9.0, 21.0, 18.0, 21.0, 31.0, 32.0, 34.0, 32.0, 27.0, 37.0, 32.0, 38.0, 40.0, 41.0, 48.0, 29.0, 28.0, 25.0, 30.0, 41.0, 31.0, 31.0, 31.0, 27.0, 22.0, 26.0, 20.0, 16.0, 13.0, 14.0, 13.0, 8.0, 8.0, 8.0, 7.0, 9.0, 3.0, 4.0, 6.0, 4.0, 2.0, 3.0, 2.0, 4.0], "bins": [-0.609375, -0.5915985107421875, -0.573822021484375, -0.5560455322265625, -0.53826904296875, -0.5204925537109375, -0.502716064453125, -0.4849395751953125, -0.4671630859375, -0.4493865966796875, -0.431610107421875, -0.4138336181640625, -0.39605712890625, -0.3782806396484375, -0.360504150390625, -0.3427276611328125, -0.324951171875, -0.3071746826171875, -0.289398193359375, -0.2716217041015625, -0.25384521484375, -0.2360687255859375, -0.218292236328125, -0.2005157470703125, -0.1827392578125, -0.1649627685546875, -0.147186279296875, -0.1294097900390625, -0.11163330078125, -0.0938568115234375, -0.076080322265625, -0.0583038330078125, -0.04052734375, -0.0227508544921875, -0.004974365234375, 0.0128021240234375, 0.03057861328125, 0.0483551025390625, 0.066131591796875, 0.0839080810546875, 0.1016845703125, 0.1194610595703125, 0.137237548828125, 0.1550140380859375, 0.17279052734375, 0.1905670166015625, 0.208343505859375, 0.2261199951171875, 0.243896484375, 0.2616729736328125, 0.279449462890625, 0.2972259521484375, 0.31500244140625, 0.3327789306640625, 0.350555419921875, 0.3683319091796875, 0.3861083984375, 0.4038848876953125, 0.421661376953125, 0.4394378662109375, 0.45721435546875, 0.4749908447265625, 0.492767333984375, 0.5105438232421875, 0.5283203125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 15.0, 24.0, 32.0, 38.0, 58.0, 97.0, 119.0, 174.0, 230.0, 356.0, 537.0, 737.0, 1104.0, 1681.0, 2337.0, 3638.0, 5558.0, 8490.0, 13441.0, 22065.0, 36307.0, 61827.0, 103913.0, 168785.0, 236645.0, 148566.0, 91301.0, 54167.0, 32191.0, 19273.0, 12092.0, 7674.0, 4985.0, 3161.0, 2271.0, 1471.0, 1013.0, 652.0, 463.0, 294.0, 239.0, 176.0, 110.0, 75.0, 55.0, 38.0, 29.0, 17.0, 13.0, 7.0, 6.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0], "bins": [-1.3955078125, -1.3510284423828125, -1.306549072265625, -1.2620697021484375, -1.21759033203125, -1.1731109619140625, -1.128631591796875, -1.0841522216796875, -1.0396728515625, -0.9951934814453125, -0.950714111328125, -0.9062347412109375, -0.86175537109375, -0.8172760009765625, -0.772796630859375, -0.7283172607421875, -0.683837890625, -0.6393585205078125, -0.594879150390625, -0.5503997802734375, -0.50592041015625, -0.4614410400390625, -0.416961669921875, -0.3724822998046875, -0.3280029296875, -0.2835235595703125, -0.239044189453125, -0.1945648193359375, -0.15008544921875, -0.1056060791015625, -0.061126708984375, -0.0166473388671875, 0.02783203125, 0.0723114013671875, 0.116790771484375, 0.1612701416015625, 0.20574951171875, 0.2502288818359375, 0.294708251953125, 0.3391876220703125, 0.3836669921875, 0.4281463623046875, 0.472625732421875, 0.5171051025390625, 0.56158447265625, 0.6060638427734375, 0.650543212890625, 0.6950225830078125, 0.739501953125, 0.7839813232421875, 0.828460693359375, 0.8729400634765625, 0.91741943359375, 0.9618988037109375, 1.006378173828125, 1.0508575439453125, 1.0953369140625, 1.1398162841796875, 1.184295654296875, 1.2287750244140625, 1.27325439453125, 1.3177337646484375, 1.362213134765625, 1.4066925048828125, 1.451171875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 6.0, 4.0, 4.0, 5.0, 8.0, 14.0, 7.0, 11.0, 18.0, 10.0, 30.0, 27.0, 32.0, 31.0, 33.0, 34.0, 35.0, 42.0, 57.0, 37.0, 37.0, 1067.0, 56.0, 34.0, 57.0, 45.0, 43.0, 39.0, 32.0, 26.0, 40.0, 18.0, 27.0, 11.0, 5.0, 11.0, 10.0, 7.0, 7.0, 3.0, 4.0, 0.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.556640625, -0.5361862182617188, -0.5157318115234375, -0.49527740478515625, -0.474822998046875, -0.45436859130859375, -0.4339141845703125, -0.41345977783203125, -0.39300537109375, -0.37255096435546875, -0.3520965576171875, -0.33164215087890625, -0.311187744140625, -0.29073333740234375, -0.2702789306640625, -0.24982452392578125, -0.2293701171875, -0.20891571044921875, -0.1884613037109375, -0.16800689697265625, -0.147552490234375, -0.12709808349609375, -0.1066436767578125, -0.08618927001953125, -0.06573486328125, -0.04528045654296875, -0.0248260498046875, -0.00437164306640625, 0.016082763671875, 0.03653717041015625, 0.0569915771484375, 0.07744598388671875, 0.097900390625, 0.11835479736328125, 0.1388092041015625, 0.15926361083984375, 0.179718017578125, 0.20017242431640625, 0.2206268310546875, 0.24108123779296875, 0.26153564453125, 0.28199005126953125, 0.3024444580078125, 0.32289886474609375, 0.343353271484375, 0.36380767822265625, 0.3842620849609375, 0.40471649169921875, 0.4251708984375, 0.44562530517578125, 0.4660797119140625, 0.48653411865234375, 0.506988525390625, 0.5274429321289062, 0.5478973388671875, 0.5683517456054688, 0.58880615234375, 0.6092605590820312, 0.6297149658203125, 0.6501693725585938, 0.670623779296875, 0.6910781860351562, 0.7115325927734375, 0.7319869995117188, 0.75244140625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 2.0, 4.0, 1.0, 11.0, 6.0, 13.0, 15.0, 24.0, 37.0, 39.0, 69.0, 93.0, 150.0, 198.0, 339.0, 491.0, 792.0, 1246.0, 2029.0, 3418.0, 5747.0, 10337.0, 19361.0, 39588.0, 89547.0, 263337.0, 1069807.0, 376755.0, 113632.0, 47734.0, 23239.0, 12139.0, 6687.0, 3943.0, 2338.0, 1364.0, 912.0, 540.0, 357.0, 241.0, 158.0, 110.0, 87.0, 58.0, 37.0, 30.0, 29.0, 9.0, 15.0, 6.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-1.302734375, -1.2639923095703125, -1.225250244140625, -1.1865081787109375, -1.14776611328125, -1.1090240478515625, -1.070281982421875, -1.0315399169921875, -0.9927978515625, -0.9540557861328125, -0.915313720703125, -0.8765716552734375, -0.83782958984375, -0.7990875244140625, -0.760345458984375, -0.7216033935546875, -0.682861328125, -0.6441192626953125, -0.605377197265625, -0.5666351318359375, -0.52789306640625, -0.4891510009765625, -0.450408935546875, -0.4116668701171875, -0.3729248046875, -0.3341827392578125, -0.295440673828125, -0.2566986083984375, -0.21795654296875, -0.1792144775390625, -0.140472412109375, -0.1017303466796875, -0.06298828125, -0.0242462158203125, 0.014495849609375, 0.0532379150390625, 0.09197998046875, 0.1307220458984375, 0.169464111328125, 0.2082061767578125, 0.2469482421875, 0.2856903076171875, 0.324432373046875, 0.3631744384765625, 0.40191650390625, 0.4406585693359375, 0.479400634765625, 0.5181427001953125, 0.556884765625, 0.5956268310546875, 0.634368896484375, 0.6731109619140625, 0.71185302734375, 0.7505950927734375, 0.789337158203125, 0.8280792236328125, 0.8668212890625, 0.9055633544921875, 0.944305419921875, 0.9830474853515625, 1.02178955078125, 1.0605316162109375, 1.099273681640625, 1.1380157470703125, 1.1767578125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 6.0, 7.0, 8.0, 10.0, 13.0, 15.0, 19.0, 19.0, 43.0, 36.0, 49.0, 52.0, 88.0, 167.0, 106.0, 90.0, 61.0, 46.0, 36.0, 30.0, 23.0, 15.0, 15.0, 10.0, 8.0, 7.0, 5.0, 7.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51904296875, -0.5036392211914062, -0.4882354736328125, -0.47283172607421875, -0.457427978515625, -0.44202423095703125, -0.4266204833984375, -0.41121673583984375, -0.39581298828125, -0.38040924072265625, -0.3650054931640625, -0.34960174560546875, -0.334197998046875, -0.31879425048828125, -0.3033905029296875, -0.28798675537109375, -0.2725830078125, -0.25717926025390625, -0.2417755126953125, -0.22637176513671875, -0.210968017578125, -0.19556427001953125, -0.1801605224609375, -0.16475677490234375, -0.14935302734375, -0.13394927978515625, -0.1185455322265625, -0.10314178466796875, -0.087738037109375, -0.07233428955078125, -0.0569305419921875, -0.04152679443359375, -0.026123046875, -0.01071929931640625, 0.0046844482421875, 0.02008819580078125, 0.035491943359375, 0.05089569091796875, 0.0662994384765625, 0.08170318603515625, 0.09710693359375, 0.11251068115234375, 0.1279144287109375, 0.14331817626953125, 0.158721923828125, 0.17412567138671875, 0.1895294189453125, 0.20493316650390625, 0.2203369140625, 0.23574066162109375, 0.2511444091796875, 0.26654815673828125, 0.281951904296875, 0.29735565185546875, 0.3127593994140625, 0.32816314697265625, 0.34356689453125, 0.35897064208984375, 0.3743743896484375, 0.38977813720703125, 0.405181884765625, 0.42058563232421875, 0.4359893798828125, 0.45139312744140625, 0.466796875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 6.0, 6.0, 14.0, 16.0, 15.0, 22.0, 31.0, 40.0, 53.0, 100.0, 103.0, 202.0, 309.0, 852.0, 4756.0, 80259.0, 918941.0, 38201.0, 3084.0, 659.0, 274.0, 156.0, 120.0, 76.0, 61.0, 41.0, 31.0, 25.0, 27.0, 20.0, 10.0, 10.0, 6.0, 5.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.77734375, -5.5872802734375, -5.397216796875, -5.2071533203125, -5.01708984375, -4.8270263671875, -4.636962890625, -4.4468994140625, -4.2568359375, -4.0667724609375, -3.876708984375, -3.6866455078125, -3.49658203125, -3.3065185546875, -3.116455078125, -2.9263916015625, -2.736328125, -2.5462646484375, -2.356201171875, -2.1661376953125, -1.97607421875, -1.7860107421875, -1.595947265625, -1.4058837890625, -1.2158203125, -1.0257568359375, -0.835693359375, -0.6456298828125, -0.45556640625, -0.2655029296875, -0.075439453125, 0.1146240234375, 0.3046875, 0.4947509765625, 0.684814453125, 0.8748779296875, 1.06494140625, 1.2550048828125, 1.445068359375, 1.6351318359375, 1.8251953125, 2.0152587890625, 2.205322265625, 2.3953857421875, 2.58544921875, 2.7755126953125, 2.965576171875, 3.1556396484375, 3.345703125, 3.5357666015625, 3.725830078125, 3.9158935546875, 4.10595703125, 4.2960205078125, 4.486083984375, 4.6761474609375, 4.8662109375, 5.0562744140625, 5.246337890625, 5.4364013671875, 5.62646484375, 5.8165283203125, 6.006591796875, 6.1966552734375, 6.38671875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 8.0, 6.0, 21.0, 33.0, 71.0, 110.0, 174.0, 207.0, 168.0, 110.0, 46.0, 24.0, 16.0, 7.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2841310501098633, -1.2372486591339111, -1.190366268157959, -1.1434838771820068, -1.0966014862060547, -1.0497190952301025, -1.0028367042541504, -0.9559541940689087, -0.9090718030929565, -0.8621894121170044, -0.8153070211410522, -0.7684246301651001, -0.7215421795845032, -0.674659788608551, -0.6277773976325989, -0.580894947052002, -0.5340126156806946, -0.48713022470474243, -0.4402478039264679, -0.39336541295051575, -0.3464829921722412, -0.29960060119628906, -0.2527182102203369, -0.20583578944206238, -0.15895339846611023, -0.11207099258899689, -0.06518859416246414, -0.018306195735931396, 0.028576210141181946, 0.07545861601829529, 0.12234100699424744, 0.16922342777252197, 0.21610581874847412, 0.26298820972442627, 0.3098706305027008, 0.35675302147865295, 0.4036354422569275, 0.45051783323287964, 0.4974002242088318, 0.5442826747894287, 0.5911650657653809, 0.638047456741333, 0.6849298477172852, 0.7318122386932373, 0.7786946892738342, 0.8255770802497864, 0.8724594712257385, 0.9193419218063354, 0.9662242531776428, 1.0131067037582397, 1.059989094734192, 1.106871485710144, 1.1537538766860962, 1.2006362676620483, 1.2475186586380005, 1.2944010496139526, 1.3412834405899048, 1.388165831565857, 1.435048222541809, 1.4819306135177612, 1.5288130044937134, 1.575695514678955, 1.6225779056549072, 1.6694602966308594, 1.7163426876068115]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 3.0, 6.0, 3.0, 1.0, 13.0, 8.0, 12.0, 16.0, 19.0, 23.0, 28.0, 18.0, 29.0, 34.0, 36.0, 34.0, 35.0, 45.0, 55.0, 33.0, 53.0, 42.0, 52.0, 51.0, 35.0, 32.0, 25.0, 23.0, 45.0, 28.0, 17.0, 28.0, 27.0, 17.0, 15.0, 8.0, 10.0, 9.0, 6.0, 12.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5162479877471924, -0.4997146427631378, -0.48318129777908325, -0.4666479527950287, -0.4501146078109741, -0.43358129262924194, -0.4170479476451874, -0.4005146026611328, -0.38398125767707825, -0.3674479126930237, -0.3509145677089691, -0.33438122272491455, -0.3178479075431824, -0.3013145327568054, -0.28478121757507324, -0.2682478725910187, -0.2517145276069641, -0.23518118262290955, -0.21864783763885498, -0.2021145075559616, -0.18558116257190704, -0.16904781758785248, -0.1525144875049591, -0.13598114252090454, -0.11944779753684998, -0.10291445255279541, -0.08638111501932144, -0.06984777748584747, -0.05331443250179291, -0.03678108751773834, -0.020247749984264374, -0.0037144124507904053, 0.01281893253326416, 0.029352273792028427, 0.045885615050792694, 0.06241895630955696, 0.07895229756832123, 0.0954856425523758, 0.11201898008584976, 0.12855231761932373, 0.1450856626033783, 0.16161900758743286, 0.17815235257148743, 0.1946856826543808, 0.21121902763843536, 0.22775237262248993, 0.2442857027053833, 0.26081904768943787, 0.27735239267349243, 0.293885737657547, 0.31041908264160156, 0.32695242762565613, 0.3434857726097107, 0.36001908779144287, 0.37655243277549744, 0.393085777759552, 0.40961912274360657, 0.42615246772766113, 0.4426858127117157, 0.45921915769577026, 0.47575247287750244, 0.4922858476638794, 0.5088191628456116, 0.5253524780273438, 0.5418858528137207]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 4.0, 1.0, 9.0, 0.0, 6.0, 4.0, 12.0, 7.0, 6.0, 15.0, 12.0, 9.0, 13.0, 19.0, 20.0, 25.0, 27.0, 29.0, 31.0, 34.0, 32.0, 37.0, 29.0, 44.0, 35.0, 46.0, 36.0, 36.0, 25.0, 24.0, 33.0, 31.0, 40.0, 26.0, 36.0, 22.0, 26.0, 21.0, 27.0, 14.0, 12.0, 20.0, 9.0, 3.0, 10.0, 10.0, 6.0, 8.0, 6.0, 3.0, 9.0, 1.0, 2.0, 5.0, 2.0, 3.0], "bins": [-0.6064453125, -0.5887527465820312, -0.5710601806640625, -0.5533676147460938, -0.535675048828125, -0.5179824829101562, -0.5002899169921875, -0.48259735107421875, -0.46490478515625, -0.44721221923828125, -0.4295196533203125, -0.41182708740234375, -0.394134521484375, -0.37644195556640625, -0.3587493896484375, -0.34105682373046875, -0.3233642578125, -0.30567169189453125, -0.2879791259765625, -0.27028656005859375, -0.252593994140625, -0.23490142822265625, -0.2172088623046875, -0.19951629638671875, -0.18182373046875, -0.16413116455078125, -0.1464385986328125, -0.12874603271484375, -0.111053466796875, -0.09336090087890625, -0.0756683349609375, -0.05797576904296875, -0.040283203125, -0.02259063720703125, -0.0048980712890625, 0.01279449462890625, 0.030487060546875, 0.04817962646484375, 0.0658721923828125, 0.08356475830078125, 0.10125732421875, 0.11894989013671875, 0.1366424560546875, 0.15433502197265625, 0.172027587890625, 0.18972015380859375, 0.2074127197265625, 0.22510528564453125, 0.2427978515625, 0.26049041748046875, 0.2781829833984375, 0.29587554931640625, 0.313568115234375, 0.33126068115234375, 0.3489532470703125, 0.36664581298828125, 0.38433837890625, 0.40203094482421875, 0.4197235107421875, 0.43741607666015625, 0.455108642578125, 0.47280120849609375, 0.4904937744140625, 0.5081863403320312, 0.52587890625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 7.0, 9.0, 5.0, 13.0, 21.0, 21.0, 44.0, 56.0, 79.0, 117.0, 166.0, 206.0, 279.0, 392.0, 563.0, 751.0, 1059.0, 1529.0, 2200.0, 3282.0, 5330.0, 8702.0, 14807.0, 27328.0, 57994.0, 134099.0, 314829.0, 263244.0, 106035.0, 47106.0, 23408.0, 12737.0, 7610.0, 4645.0, 3029.0, 1984.0, 1429.0, 980.0, 683.0, 501.0, 353.0, 265.0, 186.0, 142.0, 95.0, 71.0, 47.0, 39.0, 27.0, 18.0, 12.0, 11.0, 7.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.69384765625, -0.6713714599609375, -0.648895263671875, -0.6264190673828125, -0.60394287109375, -0.5814666748046875, -0.558990478515625, -0.5365142822265625, -0.5140380859375, -0.4915618896484375, -0.469085693359375, -0.4466094970703125, -0.42413330078125, -0.4016571044921875, -0.379180908203125, -0.3567047119140625, -0.334228515625, -0.3117523193359375, -0.289276123046875, -0.2667999267578125, -0.24432373046875, -0.2218475341796875, -0.199371337890625, -0.1768951416015625, -0.1544189453125, -0.1319427490234375, -0.109466552734375, -0.0869903564453125, -0.06451416015625, -0.0420379638671875, -0.019561767578125, 0.0029144287109375, 0.025390625, 0.0478668212890625, 0.070343017578125, 0.0928192138671875, 0.11529541015625, 0.1377716064453125, 0.160247802734375, 0.1827239990234375, 0.2052001953125, 0.2276763916015625, 0.250152587890625, 0.2726287841796875, 0.29510498046875, 0.3175811767578125, 0.340057373046875, 0.3625335693359375, 0.385009765625, 0.4074859619140625, 0.429962158203125, 0.4524383544921875, 0.47491455078125, 0.4973907470703125, 0.519866943359375, 0.5423431396484375, 0.5648193359375, 0.5872955322265625, 0.609771728515625, 0.6322479248046875, 0.65472412109375, 0.6772003173828125, 0.699676513671875, 0.7221527099609375, 0.74462890625]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 1.0, 5.0, 3.0, 10.0, 4.0, 8.0, 7.0, 7.0, 17.0, 12.0, 22.0, 31.0, 20.0, 24.0, 27.0, 36.0, 29.0, 31.0, 37.0, 55.0, 70.0, 115.0, 197.0, 1422.0, 211.0, 128.0, 73.0, 79.0, 39.0, 58.0, 41.0, 31.0, 29.0, 21.0, 27.0, 17.0, 14.0, 12.0, 11.0, 9.0, 18.0, 9.0, 11.0, 7.0, 4.0, 1.0, 4.0, 2.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.986328125, -1.921478271484375, -1.85662841796875, -1.791778564453125, -1.7269287109375, -1.662078857421875, -1.59722900390625, -1.532379150390625, -1.467529296875, -1.402679443359375, -1.33782958984375, -1.272979736328125, -1.2081298828125, -1.143280029296875, -1.07843017578125, -1.013580322265625, -0.94873046875, -0.883880615234375, -0.81903076171875, -0.754180908203125, -0.6893310546875, -0.624481201171875, -0.55963134765625, -0.494781494140625, -0.429931640625, -0.365081787109375, -0.30023193359375, -0.235382080078125, -0.1705322265625, -0.105682373046875, -0.04083251953125, 0.024017333984375, 0.0888671875, 0.153717041015625, 0.21856689453125, 0.283416748046875, 0.3482666015625, 0.413116455078125, 0.47796630859375, 0.542816162109375, 0.607666015625, 0.672515869140625, 0.73736572265625, 0.802215576171875, 0.8670654296875, 0.931915283203125, 0.99676513671875, 1.061614990234375, 1.12646484375, 1.191314697265625, 1.25616455078125, 1.321014404296875, 1.3858642578125, 1.450714111328125, 1.51556396484375, 1.580413818359375, 1.645263671875, 1.710113525390625, 1.77496337890625, 1.839813232421875, 1.9046630859375, 1.969512939453125, 2.03436279296875, 2.099212646484375, 2.1640625]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 7.0, 4.0, 7.0, 8.0, 13.0, 10.0, 13.0, 22.0, 26.0, 28.0, 38.0, 57.0, 66.0, 106.0, 185.0, 305.0, 544.0, 1133.0, 2635.0, 7504.0, 28439.0, 165045.0, 2071851.0, 764591.0, 78193.0, 16342.0, 4762.0, 1773.0, 835.0, 396.0, 244.0, 156.0, 96.0, 70.0, 45.0, 31.0, 36.0, 25.0, 15.0, 12.0, 4.0, 7.0, 4.0, 6.0, 6.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.498046875, -2.421905517578125, -2.34576416015625, -2.269622802734375, -2.1934814453125, -2.117340087890625, -2.04119873046875, -1.965057373046875, -1.888916015625, -1.812774658203125, -1.73663330078125, -1.660491943359375, -1.5843505859375, -1.508209228515625, -1.43206787109375, -1.355926513671875, -1.27978515625, -1.203643798828125, -1.12750244140625, -1.051361083984375, -0.9752197265625, -0.899078369140625, -0.82293701171875, -0.746795654296875, -0.670654296875, -0.594512939453125, -0.51837158203125, -0.442230224609375, -0.3660888671875, -0.289947509765625, -0.21380615234375, -0.137664794921875, -0.0615234375, 0.014617919921875, 0.09075927734375, 0.166900634765625, 0.2430419921875, 0.319183349609375, 0.39532470703125, 0.471466064453125, 0.547607421875, 0.623748779296875, 0.69989013671875, 0.776031494140625, 0.8521728515625, 0.928314208984375, 1.00445556640625, 1.080596923828125, 1.15673828125, 1.232879638671875, 1.30902099609375, 1.385162353515625, 1.4613037109375, 1.537445068359375, 1.61358642578125, 1.689727783203125, 1.765869140625, 1.842010498046875, 1.91815185546875, 1.994293212890625, 2.0704345703125, 2.146575927734375, 2.22271728515625, 2.298858642578125, 2.375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 4.0, 63.0, 337.0, 444.0, 153.0, 13.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.971606492996216, -2.269253730773926, -1.5669008493423462, -0.8645479679107666, -0.16219520568847656, 0.5401575565338135, 1.2425105571746826, 1.9448630809783936, 2.6472160816192627, 3.3495688438415527, 4.051921844482422, 4.754274368286133, 5.456627368927002, 6.158980369567871, 6.861332893371582, 7.563685417175293, 8.26603889465332, 8.968391418457031, 9.670744895935059, 10.37309741973877, 11.07544994354248, 11.777803421020508, 12.480155944824219, 13.18250846862793, 13.88486099243164, 14.587213516235352, 15.289566993713379, 15.99191951751709, 16.694272994995117, 17.396625518798828, 18.09897804260254, 18.80133056640625, 19.50368309020996, 20.206035614013672, 20.908388137817383, 21.610740661621094, 22.313095092773438, 23.01544761657715, 23.71780014038086, 24.42015266418457, 25.12250518798828, 25.824857711791992, 26.527210235595703, 27.229564666748047, 27.931917190551758, 28.63426971435547, 29.33662223815918, 30.03897476196289, 30.741329193115234, 31.443681716918945, 32.146034240722656, 32.848388671875, 33.55073928833008, 34.25309371948242, 34.9554443359375, 35.657798767089844, 36.36014938354492, 37.062503814697266, 37.764854431152344, 38.46720886230469, 39.169559478759766, 39.87191390991211, 40.57426452636719, 41.27661895751953, 41.978973388671875]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 5.0, 4.0, 8.0, 7.0, 12.0, 14.0, 21.0, 17.0, 20.0, 21.0, 23.0, 31.0, 37.0, 23.0, 29.0, 29.0, 39.0, 33.0, 38.0, 40.0, 44.0, 32.0, 48.0, 57.0, 42.0, 36.0, 36.0, 34.0, 24.0, 26.0, 27.0, 28.0, 28.0, 16.0, 17.0, 16.0, 6.0, 11.0, 11.0, 7.0, 2.0, 5.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.071586608886719, -7.83027982711792, -7.588973045349121, -7.3476667404174805, -7.106359958648682, -6.865053176879883, -6.623746395111084, -6.382439613342285, -6.1411333084106445, -5.899826526641846, -5.658519744873047, -5.417213439941406, -5.175906658172607, -4.934599876403809, -4.69329309463501, -4.451986312866211, -4.210679531097412, -3.9693727493286133, -3.7280662059783936, -3.4867594242095947, -3.245452880859375, -3.004146099090576, -2.7628393173217773, -2.5215325355529785, -2.280225992202759, -2.03891921043396, -1.7976126670837402, -1.5563058853149414, -1.3149992227554321, -1.0736925601959229, -0.832385778427124, -0.5910791158676147, -0.34977245330810547, -0.1084657609462738, 0.13284093141555786, 0.3741476535797119, 0.6154543161392212, 0.8567609786987305, 1.0980677604675293, 1.3393744230270386, 1.5806810855865479, 1.8219877481460571, 2.0632944107055664, 2.3046011924743652, 2.545907974243164, 2.787214517593384, 3.0285212993621826, 3.2698278427124023, 3.511134624481201, 3.75244140625, 3.9937479496002197, 4.235054969787598, 4.476361274719238, 4.717668056488037, 4.958974838256836, 5.200281620025635, 5.441588401794434, 5.682895183563232, 5.924201965332031, 6.165508270263672, 6.406815052032471, 6.6481218338012695, 6.889428615570068, 7.130735397338867, 7.372041702270508]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 2.0, 6.0, 5.0, 7.0, 12.0, 10.0, 13.0, 17.0, 10.0, 19.0, 15.0, 21.0, 27.0, 21.0, 35.0, 33.0, 34.0, 35.0, 41.0, 40.0, 34.0, 36.0, 43.0, 32.0, 36.0, 22.0, 41.0, 38.0, 38.0, 25.0, 36.0, 24.0, 21.0, 21.0, 19.0, 21.0, 17.0, 9.0, 11.0, 11.0, 8.0, 10.0, 7.0, 5.0, 12.0, 3.0, 5.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.60302734375, -0.5845184326171875, -0.566009521484375, -0.5475006103515625, -0.52899169921875, -0.5104827880859375, -0.491973876953125, -0.4734649658203125, -0.4549560546875, -0.4364471435546875, -0.417938232421875, -0.3994293212890625, -0.38092041015625, -0.3624114990234375, -0.343902587890625, -0.3253936767578125, -0.306884765625, -0.2883758544921875, -0.269866943359375, -0.2513580322265625, -0.23284912109375, -0.2143402099609375, -0.195831298828125, -0.1773223876953125, -0.1588134765625, -0.1403045654296875, -0.121795654296875, -0.1032867431640625, -0.08477783203125, -0.0662689208984375, -0.047760009765625, -0.0292510986328125, -0.0107421875, 0.0077667236328125, 0.026275634765625, 0.0447845458984375, 0.06329345703125, 0.0818023681640625, 0.100311279296875, 0.1188201904296875, 0.1373291015625, 0.1558380126953125, 0.174346923828125, 0.1928558349609375, 0.21136474609375, 0.2298736572265625, 0.248382568359375, 0.2668914794921875, 0.285400390625, 0.3039093017578125, 0.322418212890625, 0.3409271240234375, 0.35943603515625, 0.3779449462890625, 0.396453857421875, 0.4149627685546875, 0.4334716796875, 0.4519805908203125, 0.470489501953125, 0.4889984130859375, 0.50750732421875, 0.5260162353515625, 0.544525146484375, 0.5630340576171875, 0.58154296875]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 12.0, 7.0, 27.0, 27.0, 30.0, 55.0, 76.0, 102.0, 144.0, 241.0, 271.0, 472.0, 755.0, 1181.0, 1928.0, 3414.0, 6337.0, 12121.0, 26503.0, 66680.0, 259691.0, 1876148.0, 1608059.0, 220138.0, 59731.0, 24532.0, 11401.0, 5877.0, 3148.0, 1840.0, 1126.0, 741.0, 423.0, 300.0, 224.0, 136.0, 121.0, 76.0, 52.0, 34.0, 36.0, 14.0, 10.0, 10.0, 11.0, 7.0, 3.0, 2.0, 2.0, 3.0, 0.0, 5.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3642578125, -1.3187103271484375, -1.273162841796875, -1.2276153564453125, -1.18206787109375, -1.1365203857421875, -1.090972900390625, -1.0454254150390625, -0.9998779296875, -0.9543304443359375, -0.908782958984375, -0.8632354736328125, -0.81768798828125, -0.7721405029296875, -0.726593017578125, -0.6810455322265625, -0.635498046875, -0.5899505615234375, -0.544403076171875, -0.4988555908203125, -0.45330810546875, -0.4077606201171875, -0.362213134765625, -0.3166656494140625, -0.2711181640625, -0.2255706787109375, -0.180023193359375, -0.1344757080078125, -0.08892822265625, -0.0433807373046875, 0.002166748046875, 0.0477142333984375, 0.09326171875, 0.1388092041015625, 0.184356689453125, 0.2299041748046875, 0.27545166015625, 0.3209991455078125, 0.366546630859375, 0.4120941162109375, 0.4576416015625, 0.5031890869140625, 0.548736572265625, 0.5942840576171875, 0.63983154296875, 0.6853790283203125, 0.730926513671875, 0.7764739990234375, 0.822021484375, 0.8675689697265625, 0.913116455078125, 0.9586639404296875, 1.00421142578125, 1.0497589111328125, 1.095306396484375, 1.1408538818359375, 1.1864013671875, 1.2319488525390625, 1.277496337890625, 1.3230438232421875, 1.36859130859375, 1.4141387939453125, 1.459686279296875, 1.5052337646484375, 1.55078125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 6.0, 6.0, 4.0, 8.0, 8.0, 16.0, 13.0, 22.0, 23.0, 38.0, 52.0, 69.0, 102.0, 194.0, 241.0, 397.0, 600.0, 689.0, 557.0, 330.0, 203.0, 150.0, 110.0, 71.0, 50.0, 37.0, 24.0, 17.0, 11.0, 6.0, 6.0, 4.0, 3.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.46875, -2.4060211181640625, -2.343292236328125, -2.2805633544921875, -2.21783447265625, -2.1551055908203125, -2.092376708984375, -2.0296478271484375, -1.9669189453125, -1.9041900634765625, -1.841461181640625, -1.7787322998046875, -1.71600341796875, -1.6532745361328125, -1.590545654296875, -1.5278167724609375, -1.465087890625, -1.4023590087890625, -1.339630126953125, -1.2769012451171875, -1.21417236328125, -1.1514434814453125, -1.088714599609375, -1.0259857177734375, -0.9632568359375, -0.9005279541015625, -0.837799072265625, -0.7750701904296875, -0.71234130859375, -0.6496124267578125, -0.586883544921875, -0.5241546630859375, -0.46142578125, -0.3986968994140625, -0.335968017578125, -0.2732391357421875, -0.21051025390625, -0.1477813720703125, -0.085052490234375, -0.0223236083984375, 0.0404052734375, 0.1031341552734375, 0.165863037109375, 0.2285919189453125, 0.29132080078125, 0.3540496826171875, 0.416778564453125, 0.4795074462890625, 0.542236328125, 0.6049652099609375, 0.667694091796875, 0.7304229736328125, 0.79315185546875, 0.8558807373046875, 0.918609619140625, 0.9813385009765625, 1.0440673828125, 1.1067962646484375, 1.169525146484375, 1.2322540283203125, 1.29498291015625, 1.3577117919921875, 1.420440673828125, 1.4831695556640625, 1.5458984375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 7.0, 9.0, 9.0, 13.0, 23.0, 37.0, 46.0, 64.0, 111.0, 150.0, 212.0, 344.0, 600.0, 1018.0, 1563.0, 2958.0, 5719.0, 11652.0, 26101.0, 68469.0, 245341.0, 1661228.0, 1784862.0, 260539.0, 71222.0, 26682.0, 12006.0, 5869.0, 3078.0, 1774.0, 988.0, 559.0, 360.0, 218.0, 139.0, 92.0, 59.0, 44.0, 35.0, 29.0, 18.0, 14.0, 8.0, 2.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.3671875, -2.285614013671875, -2.20404052734375, -2.122467041015625, -2.0408935546875, -1.959320068359375, -1.87774658203125, -1.796173095703125, -1.714599609375, -1.633026123046875, -1.55145263671875, -1.469879150390625, -1.3883056640625, -1.306732177734375, -1.22515869140625, -1.143585205078125, -1.06201171875, -0.980438232421875, -0.89886474609375, -0.817291259765625, -0.7357177734375, -0.654144287109375, -0.57257080078125, -0.490997314453125, -0.409423828125, -0.327850341796875, -0.24627685546875, -0.164703369140625, -0.0831298828125, -0.001556396484375, 0.08001708984375, 0.161590576171875, 0.2431640625, 0.324737548828125, 0.40631103515625, 0.487884521484375, 0.5694580078125, 0.651031494140625, 0.73260498046875, 0.814178466796875, 0.895751953125, 0.977325439453125, 1.05889892578125, 1.140472412109375, 1.2220458984375, 1.303619384765625, 1.38519287109375, 1.466766357421875, 1.54833984375, 1.629913330078125, 1.71148681640625, 1.793060302734375, 1.8746337890625, 1.956207275390625, 2.03778076171875, 2.119354248046875, 2.200927734375, 2.282501220703125, 2.36407470703125, 2.445648193359375, 2.5272216796875, 2.608795166015625, 2.69036865234375, 2.771942138671875, 2.853515625]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 13.0, 17.0, 44.0, 72.0, 139.0, 205.0, 186.0, 172.0, 86.0, 39.0, 24.0, 11.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.67986488342285, -21.0456485748291, -20.41143226623535, -19.777217864990234, -19.143001556396484, -18.508785247802734, -17.874568939208984, -17.240352630615234, -16.606136322021484, -15.971920013427734, -15.3377046585083, -14.70348834991455, -14.069272994995117, -13.435056686401367, -12.800840377807617, -12.166624069213867, -11.53240966796875, -10.898193359375, -10.263978004455566, -9.629761695861816, -8.995546340942383, -8.361330032348633, -7.727113723754883, -7.092897891998291, -6.458682060241699, -5.824466228485107, -5.190250396728516, -4.556034088134766, -3.921818256378174, -3.287602424621582, -2.653386354446411, -2.0191702842712402, -1.3849544525146484, -0.7507385015487671, -0.11652255058288574, 0.5176934003829956, 1.151909351348877, 1.7861251831054688, 2.4203412532806396, 3.0545573234558105, 3.6887731552124023, 4.322988986968994, 4.957204818725586, 5.591421127319336, 6.225636959075928, 6.8598527908325195, 7.4940690994262695, 8.128284454345703, 8.762500762939453, 9.396717071533203, 10.030932426452637, 10.665148735046387, 11.29936408996582, 11.93358039855957, 12.56779670715332, 13.20201301574707, 13.836228370666504, 14.470444679260254, 15.104660034179688, 15.738876342773438, 16.373092651367188, 17.007308959960938, 17.641523361206055, 18.275739669799805, 18.909955978393555]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 5.0, 4.0, 2.0, 10.0, 4.0, 10.0, 13.0, 17.0, 19.0, 28.0, 25.0, 20.0, 30.0, 35.0, 42.0, 43.0, 32.0, 39.0, 48.0, 34.0, 42.0, 42.0, 31.0, 45.0, 30.0, 44.0, 32.0, 37.0, 35.0, 38.0, 29.0, 31.0, 12.0, 18.0, 14.0, 8.0, 11.0, 9.0, 6.0, 8.0, 6.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.709970951080322, -5.535203456878662, -5.36043643951416, -5.1856689453125, -5.01090145111084, -4.836134433746338, -4.661366939544678, -4.486599922180176, -4.311832427978516, -4.1370649337768555, -3.9622979164123535, -3.7875304222106934, -3.6127631664276123, -3.4379959106445312, -3.263228416442871, -3.08846116065979, -2.913693904876709, -2.738926649093628, -2.564159393310547, -2.3893918991088867, -2.2146246433258057, -2.0398573875427246, -1.865090012550354, -1.6903226375579834, -1.5155553817749023, -1.3407881259918213, -1.1660207509994507, -0.9912534356117249, -0.816486120223999, -0.6417188048362732, -0.46695148944854736, -0.29218411445617676, -0.1174163818359375, 0.05735093355178833, 0.23211824893951416, 0.40688556432724, 0.5816528797149658, 0.7564201951026917, 0.9311875104904175, 1.105954885482788, 1.2807221412658691, 1.4554893970489502, 1.6302567720413208, 1.8050241470336914, 1.9797914028167725, 2.1545586585998535, 2.3293261528015137, 2.5040934085845947, 2.678860664367676, 2.853627920150757, 3.028395175933838, 3.203162670135498, 3.377929925918579, 3.55269718170166, 3.7274646759033203, 3.9022319316864014, 4.076999187469482, 4.251766681671143, 4.4265336990356445, 4.601301193237305, 4.776068687438965, 4.950835704803467, 5.125603199005127, 5.300370216369629, 5.475137710571289]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 5.0, 8.0, 8.0, 3.0, 9.0, 10.0, 6.0, 12.0, 12.0, 12.0, 19.0, 20.0, 27.0, 24.0, 20.0, 25.0, 31.0, 39.0, 45.0, 43.0, 34.0, 37.0, 31.0, 43.0, 41.0, 34.0, 37.0, 35.0, 26.0, 31.0, 21.0, 36.0, 29.0, 31.0, 20.0, 26.0, 12.0, 17.0, 14.0, 9.0, 7.0, 13.0, 6.0, 10.0, 5.0, 7.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56884765625, -0.5495758056640625, -0.530303955078125, -0.5110321044921875, -0.49176025390625, -0.4724884033203125, -0.453216552734375, -0.4339447021484375, -0.4146728515625, -0.3954010009765625, -0.376129150390625, -0.3568572998046875, -0.33758544921875, -0.3183135986328125, -0.299041748046875, -0.2797698974609375, -0.260498046875, -0.2412261962890625, -0.221954345703125, -0.2026824951171875, -0.18341064453125, -0.1641387939453125, -0.144866943359375, -0.1255950927734375, -0.1063232421875, -0.0870513916015625, -0.067779541015625, -0.0485076904296875, -0.02923583984375, -0.0099639892578125, 0.009307861328125, 0.0285797119140625, 0.0478515625, 0.0671234130859375, 0.086395263671875, 0.1056671142578125, 0.12493896484375, 0.1442108154296875, 0.163482666015625, 0.1827545166015625, 0.2020263671875, 0.2212982177734375, 0.240570068359375, 0.2598419189453125, 0.27911376953125, 0.2983856201171875, 0.317657470703125, 0.3369293212890625, 0.356201171875, 0.3754730224609375, 0.394744873046875, 0.4140167236328125, 0.43328857421875, 0.4525604248046875, 0.471832275390625, 0.4911041259765625, 0.5103759765625, 0.5296478271484375, 0.548919677734375, 0.5681915283203125, 0.58746337890625, 0.6067352294921875, 0.626007080078125, 0.6452789306640625, 0.66455078125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 2.0, 12.0, 7.0, 11.0, 25.0, 30.0, 59.0, 77.0, 124.0, 146.0, 231.0, 349.0, 545.0, 890.0, 1353.0, 2123.0, 3293.0, 5354.0, 8456.0, 13622.0, 22529.0, 36028.0, 59649.0, 105900.0, 259524.0, 264777.0, 106758.0, 60821.0, 36506.0, 22218.0, 13677.0, 8486.0, 5535.0, 3431.0, 2111.0, 1389.0, 844.0, 554.0, 366.0, 270.0, 142.0, 94.0, 83.0, 42.0, 30.0, 40.0, 11.0, 11.0, 7.0, 7.0, 4.0, 1.0, 2.0, 2.0, 3.0], "bins": [-1.1572265625, -1.123199462890625, -1.08917236328125, -1.055145263671875, -1.0211181640625, -0.987091064453125, -0.95306396484375, -0.919036865234375, -0.885009765625, -0.850982666015625, -0.81695556640625, -0.782928466796875, -0.7489013671875, -0.714874267578125, -0.68084716796875, -0.646820068359375, -0.61279296875, -0.578765869140625, -0.54473876953125, -0.510711669921875, -0.4766845703125, -0.442657470703125, -0.40863037109375, -0.374603271484375, -0.340576171875, -0.306549072265625, -0.27252197265625, -0.238494873046875, -0.2044677734375, -0.170440673828125, -0.13641357421875, -0.102386474609375, -0.068359375, -0.034332275390625, -0.00030517578125, 0.033721923828125, 0.0677490234375, 0.101776123046875, 0.13580322265625, 0.169830322265625, 0.203857421875, 0.237884521484375, 0.27191162109375, 0.305938720703125, 0.3399658203125, 0.373992919921875, 0.40802001953125, 0.442047119140625, 0.47607421875, 0.510101318359375, 0.54412841796875, 0.578155517578125, 0.6121826171875, 0.646209716796875, 0.68023681640625, 0.714263916015625, 0.748291015625, 0.782318115234375, 0.81634521484375, 0.850372314453125, 0.8843994140625, 0.918426513671875, 0.95245361328125, 0.986480712890625, 1.0205078125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 4.0, 6.0, 7.0, 11.0, 10.0, 10.0, 13.0, 12.0, 16.0, 18.0, 21.0, 18.0, 17.0, 31.0, 31.0, 20.0, 36.0, 30.0, 35.0, 34.0, 39.0, 28.0, 1069.0, 31.0, 29.0, 40.0, 37.0, 24.0, 31.0, 37.0, 27.0, 31.0, 27.0, 24.0, 20.0, 22.0, 15.0, 22.0, 20.0, 12.0, 6.0, 12.0, 9.0, 4.0, 4.0, 10.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0], "bins": [-0.509765625, -0.49430084228515625, -0.4788360595703125, -0.46337127685546875, -0.447906494140625, -0.43244171142578125, -0.4169769287109375, -0.40151214599609375, -0.38604736328125, -0.37058258056640625, -0.3551177978515625, -0.33965301513671875, -0.324188232421875, -0.30872344970703125, -0.2932586669921875, -0.27779388427734375, -0.2623291015625, -0.24686431884765625, -0.2313995361328125, -0.21593475341796875, -0.200469970703125, -0.18500518798828125, -0.1695404052734375, -0.15407562255859375, -0.13861083984375, -0.12314605712890625, -0.1076812744140625, -0.09221649169921875, -0.076751708984375, -0.06128692626953125, -0.0458221435546875, -0.03035736083984375, -0.014892578125, 0.00057220458984375, 0.0160369873046875, 0.03150177001953125, 0.046966552734375, 0.06243133544921875, 0.0778961181640625, 0.09336090087890625, 0.10882568359375, 0.12429046630859375, 0.1397552490234375, 0.15522003173828125, 0.170684814453125, 0.18614959716796875, 0.2016143798828125, 0.21707916259765625, 0.2325439453125, 0.24800872802734375, 0.2634735107421875, 0.27893829345703125, 0.294403076171875, 0.30986785888671875, 0.3253326416015625, 0.34079742431640625, 0.35626220703125, 0.37172698974609375, 0.3871917724609375, 0.40265655517578125, 0.418121337890625, 0.43358612060546875, 0.4490509033203125, 0.46451568603515625, 0.47998046875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 9.0, 12.0, 15.0, 13.0, 20.0, 40.0, 56.0, 78.0, 121.0, 161.0, 193.0, 334.0, 434.0, 596.0, 846.0, 1194.0, 1915.0, 2802.0, 4365.0, 6840.0, 10776.0, 17838.0, 31427.0, 60110.0, 129782.0, 436199.0, 1019696.0, 192121.0, 79812.0, 40338.0, 22176.0, 13170.0, 8056.0, 5001.0, 3440.0, 2175.0, 1562.0, 1056.0, 698.0, 483.0, 322.0, 270.0, 166.0, 123.0, 97.0, 54.0, 47.0, 31.0, 22.0, 12.0, 10.0, 8.0, 9.0, 5.0, 2.0, 0.0, 4.0], "bins": [-0.7490234375, -0.7264633178710938, -0.7039031982421875, -0.6813430786132812, -0.658782958984375, -0.6362228393554688, -0.6136627197265625, -0.5911026000976562, -0.56854248046875, -0.5459823608398438, -0.5234222412109375, -0.5008621215820312, -0.478302001953125, -0.45574188232421875, -0.4331817626953125, -0.41062164306640625, -0.3880615234375, -0.36550140380859375, -0.3429412841796875, -0.32038116455078125, -0.297821044921875, -0.27526092529296875, -0.2527008056640625, -0.23014068603515625, -0.20758056640625, -0.18502044677734375, -0.1624603271484375, -0.13990020751953125, -0.117340087890625, -0.09477996826171875, -0.0722198486328125, -0.04965972900390625, -0.027099609375, -0.00453948974609375, 0.0180206298828125, 0.04058074951171875, 0.063140869140625, 0.08570098876953125, 0.1082611083984375, 0.13082122802734375, 0.15338134765625, 0.17594146728515625, 0.1985015869140625, 0.22106170654296875, 0.243621826171875, 0.26618194580078125, 0.2887420654296875, 0.31130218505859375, 0.3338623046875, 0.35642242431640625, 0.3789825439453125, 0.40154266357421875, 0.424102783203125, 0.44666290283203125, 0.4692230224609375, 0.49178314208984375, 0.51434326171875, 0.5369033813476562, 0.5594635009765625, 0.5820236206054688, 0.604583740234375, 0.6271438598632812, 0.6497039794921875, 0.6722640991210938, 0.69482421875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 4.0, 8.0, 4.0, 10.0, 12.0, 13.0, 7.0, 13.0, 14.0, 26.0, 21.0, 33.0, 55.0, 97.0, 213.0, 180.0, 70.0, 40.0, 34.0, 30.0, 25.0, 21.0, 15.0, 9.0, 10.0, 9.0, 7.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0], "bins": [-0.451416015625, -0.4391937255859375, -0.426971435546875, -0.4147491455078125, -0.40252685546875, -0.3903045654296875, -0.378082275390625, -0.3658599853515625, -0.3536376953125, -0.3414154052734375, -0.329193115234375, -0.3169708251953125, -0.30474853515625, -0.2925262451171875, -0.280303955078125, -0.2680816650390625, -0.255859375, -0.2436370849609375, -0.231414794921875, -0.2191925048828125, -0.20697021484375, -0.1947479248046875, -0.182525634765625, -0.1703033447265625, -0.1580810546875, -0.1458587646484375, -0.133636474609375, -0.1214141845703125, -0.10919189453125, -0.0969696044921875, -0.084747314453125, -0.0725250244140625, -0.060302734375, -0.0480804443359375, -0.035858154296875, -0.0236358642578125, -0.01141357421875, 0.0008087158203125, 0.013031005859375, 0.0252532958984375, 0.0374755859375, 0.0496978759765625, 0.061920166015625, 0.0741424560546875, 0.08636474609375, 0.0985870361328125, 0.110809326171875, 0.1230316162109375, 0.13525390625, 0.1474761962890625, 0.159698486328125, 0.1719207763671875, 0.18414306640625, 0.1963653564453125, 0.208587646484375, 0.2208099365234375, 0.2330322265625, 0.2452545166015625, 0.257476806640625, 0.2696990966796875, 0.28192138671875, 0.2941436767578125, 0.306365966796875, 0.3185882568359375, 0.330810546875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 8.0, 7.0, 6.0, 5.0, 8.0, 15.0, 27.0, 30.0, 48.0, 66.0, 102.0, 175.0, 403.0, 2008.0, 29770.0, 972803.0, 39672.0, 2403.0, 490.0, 174.0, 91.0, 68.0, 45.0, 26.0, 28.0, 18.0, 19.0, 13.0, 5.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4453125, -5.2545166015625, -5.063720703125, -4.8729248046875, -4.68212890625, -4.4913330078125, -4.300537109375, -4.1097412109375, -3.9189453125, -3.7281494140625, -3.537353515625, -3.3465576171875, -3.15576171875, -2.9649658203125, -2.774169921875, -2.5833740234375, -2.392578125, -2.2017822265625, -2.010986328125, -1.8201904296875, -1.62939453125, -1.4385986328125, -1.247802734375, -1.0570068359375, -0.8662109375, -0.6754150390625, -0.484619140625, -0.2938232421875, -0.10302734375, 0.0877685546875, 0.278564453125, 0.4693603515625, 0.66015625, 0.8509521484375, 1.041748046875, 1.2325439453125, 1.42333984375, 1.6141357421875, 1.804931640625, 1.9957275390625, 2.1865234375, 2.3773193359375, 2.568115234375, 2.7589111328125, 2.94970703125, 3.1405029296875, 3.331298828125, 3.5220947265625, 3.712890625, 3.9036865234375, 4.094482421875, 4.2852783203125, 4.47607421875, 4.6668701171875, 4.857666015625, 5.0484619140625, 5.2392578125, 5.4300537109375, 5.620849609375, 5.8116455078125, 6.00244140625, 6.1932373046875, 6.384033203125, 6.5748291015625, 6.765625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 13.0, 14.0, 20.0, 50.0, 103.0, 108.0, 160.0, 158.0, 124.0, 112.0, 58.0, 39.0, 26.0, 8.0, 1.0, 6.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9719031453132629, -0.9457084536552429, -0.9195137023925781, -0.8933190107345581, -0.8671243190765381, -0.8409296274185181, -0.8147348761558533, -0.7885401844978333, -0.7623454332351685, -0.7361507415771484, -0.7099559903144836, -0.6837612986564636, -0.6575666069984436, -0.6313718557357788, -0.6051771640777588, -0.5789824724197388, -0.5527877807617188, -0.5265930891036987, -0.5003983378410339, -0.4742036461830139, -0.4480089545249939, -0.4218142330646515, -0.3956195116043091, -0.36942481994628906, -0.34323009848594666, -0.31703537702560425, -0.29084068536758423, -0.2646459639072418, -0.2384512573480606, -0.2122565507888794, -0.186061829328537, -0.15986712276935577, -0.13367241621017456, -0.10747770965099335, -0.08128299564123154, -0.05508828163146973, -0.028893575072288513, -0.0026988685131073, 0.023495852947235107, 0.04969055950641632, 0.07588526606559753, 0.10207997262477875, 0.12827467918395996, 0.15446940064430237, 0.18066410720348358, 0.2068588137626648, 0.2330535352230072, 0.2592482566833496, 0.28544294834136963, 0.31163766980171204, 0.33783236145973206, 0.36402708292007446, 0.3902217745780945, 0.4164164960384369, 0.4426112174987793, 0.4688059091567993, 0.4950006306171417, 0.5211953520774841, 0.5473900437355042, 0.573584794998169, 0.599779486656189, 0.625974178314209, 0.652168869972229, 0.6783636212348938, 0.7045583128929138]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 6.0, 3.0, 11.0, 10.0, 10.0, 10.0, 23.0, 18.0, 22.0, 17.0, 21.0, 36.0, 30.0, 33.0, 31.0, 50.0, 54.0, 45.0, 39.0, 45.0, 45.0, 39.0, 45.0, 42.0, 27.0, 41.0, 31.0, 32.0, 26.0, 27.0, 28.0, 14.0, 20.0, 12.0, 11.0, 10.0, 8.0, 5.0, 5.0, 3.0, 6.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.3728671073913574, -0.3623582124710083, -0.3518493175506592, -0.34134042263031006, -0.3308315575122833, -0.3203226625919342, -0.3098137676715851, -0.29930487275123596, -0.28879597783088684, -0.2782870829105377, -0.2677781879901886, -0.25726932287216187, -0.24676041305065155, -0.23625153303146362, -0.2257426381111145, -0.21523374319076538, -0.20472486317157745, -0.19421596825122833, -0.1837070882320404, -0.17319819331169128, -0.16268929839134216, -0.15218040347099304, -0.14167152345180511, -0.131162628531456, -0.12065374106168747, -0.11014485359191895, -0.09963595867156982, -0.0891270712018013, -0.07861818373203278, -0.06810928881168365, -0.05760040134191513, -0.04709150642156601, -0.036582618951797485, -0.026073727756738663, -0.01556483842432499, -0.005055949091911316, 0.005452942103147507, 0.01596183329820633, 0.026470720767974854, 0.036979615688323975, 0.0474885031580925, 0.05799739435315132, 0.06850628554821014, 0.07901517301797867, 0.08952406048774719, 0.10003295540809631, 0.11054184287786484, 0.12105073779821396, 0.13155962526798248, 0.1420685201883316, 0.15257740020751953, 0.16308629512786865, 0.17359519004821777, 0.1841040849685669, 0.19461296498775482, 0.20512185990810394, 0.21563073992729187, 0.226139634847641, 0.23664851486682892, 0.24715740978717804, 0.25766628980636597, 0.2681751847267151, 0.2786840796470642, 0.28919297456741333, 0.29970186948776245]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 5.0, 8.0, 5.0, 6.0, 7.0, 11.0, 6.0, 10.0, 13.0, 12.0, 20.0, 19.0, 34.0, 18.0, 24.0, 24.0, 33.0, 36.0, 44.0, 38.0, 29.0, 45.0, 32.0, 43.0, 44.0, 28.0, 42.0, 32.0, 32.0, 26.0, 28.0, 27.0, 34.0, 25.0, 26.0, 26.0, 12.0, 15.0, 15.0, 10.0, 9.0, 11.0, 7.0, 8.0, 5.0, 7.0, 4.0, 2.0, 5.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57373046875, -0.5543212890625, -0.534912109375, -0.5155029296875, -0.49609375, -0.4766845703125, -0.457275390625, -0.4378662109375, -0.41845703125, -0.3990478515625, -0.379638671875, -0.3602294921875, -0.3408203125, -0.3214111328125, -0.302001953125, -0.2825927734375, -0.26318359375, -0.2437744140625, -0.224365234375, -0.2049560546875, -0.185546875, -0.1661376953125, -0.146728515625, -0.1273193359375, -0.10791015625, -0.0885009765625, -0.069091796875, -0.0496826171875, -0.0302734375, -0.0108642578125, 0.008544921875, 0.0279541015625, 0.04736328125, 0.0667724609375, 0.086181640625, 0.1055908203125, 0.125, 0.1444091796875, 0.163818359375, 0.1832275390625, 0.20263671875, 0.2220458984375, 0.241455078125, 0.2608642578125, 0.2802734375, 0.2996826171875, 0.319091796875, 0.3385009765625, 0.35791015625, 0.3773193359375, 0.396728515625, 0.4161376953125, 0.435546875, 0.4549560546875, 0.474365234375, 0.4937744140625, 0.51318359375, 0.5325927734375, 0.552001953125, 0.5714111328125, 0.5908203125, 0.6102294921875, 0.629638671875, 0.6490478515625, 0.66845703125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 9.0, 7.0, 20.0, 17.0, 32.0, 37.0, 41.0, 66.0, 92.0, 146.0, 201.0, 286.0, 398.0, 604.0, 954.0, 1541.0, 2558.0, 4306.0, 7312.0, 13091.0, 25669.0, 56269.0, 146191.0, 325573.0, 267575.0, 105506.0, 42717.0, 20544.0, 10864.0, 6230.0, 3645.0, 2122.0, 1291.0, 867.0, 528.0, 403.0, 255.0, 172.0, 123.0, 85.0, 66.0, 40.0, 28.0, 33.0, 16.0, 12.0, 4.0, 6.0, 2.0, 1.0, 4.0, 0.0, 2.0], "bins": [-0.88134765625, -0.856048583984375, -0.83074951171875, -0.805450439453125, -0.7801513671875, -0.754852294921875, -0.72955322265625, -0.704254150390625, -0.678955078125, -0.653656005859375, -0.62835693359375, -0.603057861328125, -0.5777587890625, -0.552459716796875, -0.52716064453125, -0.501861572265625, -0.4765625, -0.451263427734375, -0.42596435546875, -0.400665283203125, -0.3753662109375, -0.350067138671875, -0.32476806640625, -0.299468994140625, -0.274169921875, -0.248870849609375, -0.22357177734375, -0.198272705078125, -0.1729736328125, -0.147674560546875, -0.12237548828125, -0.097076416015625, -0.07177734375, -0.046478271484375, -0.02117919921875, 0.004119873046875, 0.0294189453125, 0.054718017578125, 0.08001708984375, 0.105316162109375, 0.130615234375, 0.155914306640625, 0.18121337890625, 0.206512451171875, 0.2318115234375, 0.257110595703125, 0.28240966796875, 0.307708740234375, 0.3330078125, 0.358306884765625, 0.38360595703125, 0.408905029296875, 0.4342041015625, 0.459503173828125, 0.48480224609375, 0.510101318359375, 0.535400390625, 0.560699462890625, 0.58599853515625, 0.611297607421875, 0.6365966796875, 0.661895751953125, 0.68719482421875, 0.712493896484375, 0.73779296875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 4.0, 7.0, 11.0, 9.0, 15.0, 19.0, 20.0, 22.0, 36.0, 32.0, 36.0, 44.0, 44.0, 61.0, 60.0, 113.0, 283.0, 1515.0, 210.0, 108.0, 70.0, 54.0, 42.0, 32.0, 44.0, 28.0, 21.0, 22.0, 15.0, 16.0, 11.0, 14.0, 6.0, 9.0, 5.0, 7.0, 2.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.748046875, -2.65753173828125, -2.5670166015625, -2.47650146484375, -2.385986328125, -2.29547119140625, -2.2049560546875, -2.11444091796875, -2.02392578125, -1.93341064453125, -1.8428955078125, -1.75238037109375, -1.661865234375, -1.57135009765625, -1.4808349609375, -1.39031982421875, -1.2998046875, -1.20928955078125, -1.1187744140625, -1.02825927734375, -0.937744140625, -0.84722900390625, -0.7567138671875, -0.66619873046875, -0.57568359375, -0.48516845703125, -0.3946533203125, -0.30413818359375, -0.213623046875, -0.12310791015625, -0.0325927734375, 0.05792236328125, 0.1484375, 0.23895263671875, 0.3294677734375, 0.41998291015625, 0.510498046875, 0.60101318359375, 0.6915283203125, 0.78204345703125, 0.87255859375, 0.96307373046875, 1.0535888671875, 1.14410400390625, 1.234619140625, 1.32513427734375, 1.4156494140625, 1.50616455078125, 1.5966796875, 1.68719482421875, 1.7777099609375, 1.86822509765625, 1.958740234375, 2.04925537109375, 2.1397705078125, 2.23028564453125, 2.32080078125, 2.41131591796875, 2.5018310546875, 2.59234619140625, 2.682861328125, 2.77337646484375, 2.8638916015625, 2.95440673828125, 3.044921875]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 0.0, 1.0, 6.0, 6.0, 6.0, 8.0, 10.0, 10.0, 14.0, 19.0, 25.0, 38.0, 48.0, 58.0, 108.0, 160.0, 290.0, 587.0, 1205.0, 3286.0, 11319.0, 61341.0, 873652.0, 2055208.0, 112677.0, 17782.0, 4594.0, 1597.0, 720.0, 349.0, 189.0, 116.0, 94.0, 52.0, 31.0, 28.0, 19.0, 18.0, 7.0, 6.0, 9.0, 9.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.015625, -2.92181396484375, -2.8280029296875, -2.73419189453125, -2.640380859375, -2.54656982421875, -2.4527587890625, -2.35894775390625, -2.26513671875, -2.17132568359375, -2.0775146484375, -1.98370361328125, -1.889892578125, -1.79608154296875, -1.7022705078125, -1.60845947265625, -1.5146484375, -1.42083740234375, -1.3270263671875, -1.23321533203125, -1.139404296875, -1.04559326171875, -0.9517822265625, -0.85797119140625, -0.76416015625, -0.67034912109375, -0.5765380859375, -0.48272705078125, -0.388916015625, -0.29510498046875, -0.2012939453125, -0.10748291015625, -0.013671875, 0.08013916015625, 0.1739501953125, 0.26776123046875, 0.361572265625, 0.45538330078125, 0.5491943359375, 0.64300537109375, 0.73681640625, 0.83062744140625, 0.9244384765625, 1.01824951171875, 1.112060546875, 1.20587158203125, 1.2996826171875, 1.39349365234375, 1.4873046875, 1.58111572265625, 1.6749267578125, 1.76873779296875, 1.862548828125, 1.95635986328125, 2.0501708984375, 2.14398193359375, 2.23779296875, 2.33160400390625, 2.4254150390625, 2.51922607421875, 2.613037109375, 2.70684814453125, 2.8006591796875, 2.89447021484375, 2.98828125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 83.0, 594.0, 316.0, 22.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-61.26946258544922, -60.17092514038086, -59.072391510009766, -57.973854064941406, -56.87532043457031, -55.77678298950195, -54.67824935913086, -53.5797119140625, -52.481178283691406, -51.38264083862305, -50.28410720825195, -49.185569763183594, -48.0870361328125, -46.98849868774414, -45.88996505737305, -44.79142761230469, -43.692893981933594, -42.594356536865234, -41.49582290649414, -40.39728546142578, -39.29875183105469, -38.20021438598633, -37.101680755615234, -36.003143310546875, -34.904605865478516, -33.806068420410156, -32.70753479003906, -31.608999252319336, -30.51046371459961, -29.411928176879883, -28.313392639160156, -27.214855194091797, -26.116321563720703, -25.017786026000977, -23.91925048828125, -22.820714950561523, -21.722179412841797, -20.62364387512207, -19.525108337402344, -18.426570892333984, -17.328035354614258, -16.22949981689453, -15.130964279174805, -14.032428741455078, -12.933893203735352, -11.835357666015625, -10.736821174621582, -9.638285636901855, -8.539750099182129, -7.441214561462402, -6.342679023742676, -5.244143009185791, -4.1456074714660645, -3.047071933746338, -1.9485359191894531, -0.8500003814697266, 0.24853515625, 1.3470708131790161, 2.4456064701080322, 3.544142246246338, 4.6426777839660645, 5.741213321685791, 6.839749336242676, 7.938284873962402, 9.036820411682129]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 3.0, 6.0, 9.0, 8.0, 3.0, 12.0, 11.0, 13.0, 10.0, 15.0, 16.0, 18.0, 26.0, 26.0, 28.0, 28.0, 39.0, 21.0, 27.0, 44.0, 25.0, 37.0, 32.0, 36.0, 33.0, 27.0, 36.0, 27.0, 34.0, 23.0, 30.0, 25.0, 28.0, 26.0, 23.0, 32.0, 19.0, 18.0, 14.0, 23.0, 14.0, 14.0, 10.0, 6.0, 19.0, 6.0, 5.0, 1.0, 1.0, 4.0, 3.0, 5.0, 1.0, 3.0], "bins": [-6.8649678230285645, -6.663330078125, -6.4616923332214355, -6.260054588317871, -6.058416366577148, -5.856778621673584, -5.6551408767700195, -5.453503131866455, -5.251865386962891, -5.050227642059326, -4.848589897155762, -4.646951675415039, -4.445313930511475, -4.24367618560791, -4.042038440704346, -3.8404006958007812, -3.6387624740600586, -3.437124729156494, -3.2354867458343506, -3.033849000930786, -2.8322110176086426, -2.630573272705078, -2.4289355278015137, -2.227297782897949, -2.0256597995758057, -1.8240219354629517, -1.6223840713500977, -1.4207463264465332, -1.2191084623336792, -1.0174705982208252, -0.8158328533172607, -0.6141949892044067, -0.41255760192871094, -0.21091976761817932, -0.009281933307647705, 0.19235587120056152, 0.3939937353134155, 0.5956315994262695, 0.797269344329834, 0.998907208442688, 1.200545072555542, 1.402182936668396, 1.60382080078125, 1.8054585456848145, 2.007096290588379, 2.2087342739105225, 2.410372018814087, 2.6120100021362305, 2.813647747039795, 3.0152854919433594, 3.216923475265503, 3.4185612201690674, 3.620199203491211, 3.8218369483947754, 4.02347469329834, 4.225112438201904, 4.426750183105469, 4.628387928009033, 4.830025672912598, 5.03166389465332, 5.233301639556885, 5.434939384460449, 5.636577129364014, 5.838214874267578, 6.039853096008301]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 2.0, 3.0, 1.0, 6.0, 4.0, 6.0, 8.0, 7.0, 12.0, 10.0, 8.0, 18.0, 16.0, 20.0, 14.0, 16.0, 29.0, 28.0, 35.0, 32.0, 42.0, 27.0, 32.0, 38.0, 30.0, 36.0, 46.0, 39.0, 33.0, 38.0, 31.0, 32.0, 28.0, 36.0, 25.0, 17.0, 32.0, 23.0, 16.0, 23.0, 19.0, 17.0, 9.0, 10.0, 9.0, 5.0, 11.0, 6.0, 6.0, 6.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.595703125, -0.5762405395507812, -0.5567779541015625, -0.5373153686523438, -0.517852783203125, -0.49839019775390625, -0.4789276123046875, -0.45946502685546875, -0.44000244140625, -0.42053985595703125, -0.4010772705078125, -0.38161468505859375, -0.362152099609375, -0.34268951416015625, -0.3232269287109375, -0.30376434326171875, -0.2843017578125, -0.26483917236328125, -0.2453765869140625, -0.22591400146484375, -0.206451416015625, -0.18698883056640625, -0.1675262451171875, -0.14806365966796875, -0.12860107421875, -0.10913848876953125, -0.0896759033203125, -0.07021331787109375, -0.050750732421875, -0.03128814697265625, -0.0118255615234375, 0.00763702392578125, 0.027099609375, 0.04656219482421875, 0.0660247802734375, 0.08548736572265625, 0.104949951171875, 0.12441253662109375, 0.1438751220703125, 0.16333770751953125, 0.18280029296875, 0.20226287841796875, 0.2217254638671875, 0.24118804931640625, 0.260650634765625, 0.28011322021484375, 0.2995758056640625, 0.31903839111328125, 0.3385009765625, 0.35796356201171875, 0.3774261474609375, 0.39688873291015625, 0.416351318359375, 0.43581390380859375, 0.4552764892578125, 0.47473907470703125, 0.49420166015625, 0.5136642456054688, 0.5331268310546875, 0.5525894165039062, 0.572052001953125, 0.5915145874023438, 0.6109771728515625, 0.6304397583007812, 0.64990234375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 6.0, 7.0, 14.0, 12.0, 24.0, 28.0, 34.0, 69.0, 85.0, 117.0, 209.0, 326.0, 577.0, 972.0, 1690.0, 3113.0, 6058.0, 12572.0, 28731.0, 81166.0, 388681.0, 2389567.0, 1051731.0, 148926.0, 43810.0, 17753.0, 8249.0, 4308.0, 2238.0, 1258.0, 708.0, 447.0, 279.0, 154.0, 104.0, 75.0, 45.0, 43.0, 25.0, 20.0, 17.0, 12.0, 9.0, 4.0, 9.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5146484375, -1.4619293212890625, -1.409210205078125, -1.3564910888671875, -1.30377197265625, -1.2510528564453125, -1.198333740234375, -1.1456146240234375, -1.0928955078125, -1.0401763916015625, -0.987457275390625, -0.9347381591796875, -0.88201904296875, -0.8292999267578125, -0.776580810546875, -0.7238616943359375, -0.671142578125, -0.6184234619140625, -0.565704345703125, -0.5129852294921875, -0.46026611328125, -0.4075469970703125, -0.354827880859375, -0.3021087646484375, -0.2493896484375, -0.1966705322265625, -0.143951416015625, -0.0912322998046875, -0.03851318359375, 0.0142059326171875, 0.066925048828125, 0.1196441650390625, 0.17236328125, 0.2250823974609375, 0.277801513671875, 0.3305206298828125, 0.38323974609375, 0.4359588623046875, 0.488677978515625, 0.5413970947265625, 0.5941162109375, 0.6468353271484375, 0.699554443359375, 0.7522735595703125, 0.80499267578125, 0.8577117919921875, 0.910430908203125, 0.9631500244140625, 1.015869140625, 1.0685882568359375, 1.121307373046875, 1.1740264892578125, 1.22674560546875, 1.2794647216796875, 1.332183837890625, 1.3849029541015625, 1.4376220703125, 1.4903411865234375, 1.543060302734375, 1.5957794189453125, 1.64849853515625, 1.7012176513671875, 1.753936767578125, 1.8066558837890625, 1.859375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 0.0, 2.0, 3.0, 7.0, 3.0, 12.0, 16.0, 14.0, 19.0, 14.0, 24.0, 18.0, 32.0, 49.0, 56.0, 82.0, 102.0, 105.0, 152.0, 214.0, 290.0, 389.0, 461.0, 451.0, 351.0, 287.0, 204.0, 149.0, 123.0, 85.0, 75.0, 52.0, 55.0, 28.0, 27.0, 15.0, 21.0, 21.0, 15.0, 13.0, 9.0, 4.0, 5.0, 6.0, 6.0, 3.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.361328125, -1.31585693359375, -1.2703857421875, -1.22491455078125, -1.179443359375, -1.13397216796875, -1.0885009765625, -1.04302978515625, -0.99755859375, -0.95208740234375, -0.9066162109375, -0.86114501953125, -0.815673828125, -0.77020263671875, -0.7247314453125, -0.67926025390625, -0.6337890625, -0.58831787109375, -0.5428466796875, -0.49737548828125, -0.451904296875, -0.40643310546875, -0.3609619140625, -0.31549072265625, -0.27001953125, -0.22454833984375, -0.1790771484375, -0.13360595703125, -0.088134765625, -0.04266357421875, 0.0028076171875, 0.04827880859375, 0.09375, 0.13922119140625, 0.1846923828125, 0.23016357421875, 0.275634765625, 0.32110595703125, 0.3665771484375, 0.41204833984375, 0.45751953125, 0.50299072265625, 0.5484619140625, 0.59393310546875, 0.639404296875, 0.68487548828125, 0.7303466796875, 0.77581787109375, 0.8212890625, 0.86676025390625, 0.9122314453125, 0.95770263671875, 1.003173828125, 1.04864501953125, 1.0941162109375, 1.13958740234375, 1.18505859375, 1.23052978515625, 1.2760009765625, 1.32147216796875, 1.366943359375, 1.41241455078125, 1.4578857421875, 1.50335693359375, 1.548828125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 5.0, 11.0, 7.0, 12.0, 17.0, 25.0, 28.0, 40.0, 62.0, 106.0, 156.0, 208.0, 327.0, 518.0, 748.0, 1153.0, 1824.0, 2969.0, 5004.0, 8541.0, 16092.0, 31365.0, 68753.0, 174559.0, 625535.0, 2085201.0, 805902.0, 209100.0, 79217.0, 35300.0, 17703.0, 9653.0, 5333.0, 3192.0, 2011.0, 1221.0, 775.0, 477.0, 362.0, 237.0, 153.0, 114.0, 74.0, 59.0, 39.0, 31.0, 22.0, 17.0, 14.0, 10.0, 5.0, 0.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.8515625, -1.788970947265625, -1.72637939453125, -1.663787841796875, -1.6011962890625, -1.538604736328125, -1.47601318359375, -1.413421630859375, -1.350830078125, -1.288238525390625, -1.22564697265625, -1.163055419921875, -1.1004638671875, -1.037872314453125, -0.97528076171875, -0.912689208984375, -0.85009765625, -0.787506103515625, -0.72491455078125, -0.662322998046875, -0.5997314453125, -0.537139892578125, -0.47454833984375, -0.411956787109375, -0.349365234375, -0.286773681640625, -0.22418212890625, -0.161590576171875, -0.0989990234375, -0.036407470703125, 0.02618408203125, 0.088775634765625, 0.1513671875, 0.213958740234375, 0.27655029296875, 0.339141845703125, 0.4017333984375, 0.464324951171875, 0.52691650390625, 0.589508056640625, 0.652099609375, 0.714691162109375, 0.77728271484375, 0.839874267578125, 0.9024658203125, 0.965057373046875, 1.02764892578125, 1.090240478515625, 1.15283203125, 1.215423583984375, 1.27801513671875, 1.340606689453125, 1.4031982421875, 1.465789794921875, 1.52838134765625, 1.590972900390625, 1.653564453125, 1.716156005859375, 1.77874755859375, 1.841339111328125, 1.9039306640625, 1.966522216796875, 2.02911376953125, 2.091705322265625, 2.154296875]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 12.0, 15.0, 28.0, 35.0, 72.0, 135.0, 132.0, 186.0, 133.0, 105.0, 78.0, 34.0, 22.0, 10.0, 2.0, 7.0, 1.0, 3.0, 1.0], "bins": [-27.673194885253906, -27.14453125, -26.615867614746094, -26.087203979492188, -25.55854034423828, -25.029874801635742, -24.501211166381836, -23.97254753112793, -23.443883895874023, -22.915220260620117, -22.38655662536621, -21.857892990112305, -21.329227447509766, -20.80056381225586, -20.271900177001953, -19.743236541748047, -19.21457290649414, -18.685909271240234, -18.157245635986328, -17.628582000732422, -17.099918365478516, -16.571252822875977, -16.04258918762207, -15.513925552368164, -14.985261917114258, -14.456598281860352, -13.927934646606445, -13.399270057678223, -12.870606422424316, -12.34194278717041, -11.813278198242188, -11.284614562988281, -10.755951881408691, -10.227288246154785, -9.698623657226562, -9.169960021972656, -8.64129638671875, -8.112632751464844, -7.583968639373779, -7.055304527282715, -6.526640892028809, -5.997977256774902, -5.469313144683838, -4.940649032592773, -4.411985397338867, -3.883321523666382, -3.3546576499938965, -2.825993776321411, -2.297329902648926, -1.7686660289764404, -1.240002155303955, -0.7113382816314697, -0.18267440795898438, 0.345989465713501, 0.8746533393859863, 1.4033172130584717, 1.931981086730957, 2.4606449604034424, 2.9893088340759277, 3.517972707748413, 4.046636581420898, 4.575300216674805, 5.103964328765869, 5.632628440856934, 6.16129207611084]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 8.0, 6.0, 6.0, 12.0, 14.0, 10.0, 10.0, 19.0, 16.0, 23.0, 30.0, 23.0, 31.0, 53.0, 36.0, 32.0, 47.0, 37.0, 42.0, 45.0, 39.0, 35.0, 53.0, 40.0, 29.0, 27.0, 30.0, 42.0, 26.0, 30.0, 25.0, 16.0, 13.0, 16.0, 17.0, 15.0, 8.0, 7.0, 8.0, 5.0, 3.0, 7.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.795123100280762, -5.619701385498047, -5.44428014755249, -5.268858432769775, -5.0934367179870605, -4.918015480041504, -4.742593765258789, -4.567172050476074, -4.391750335693359, -4.2163286209106445, -4.040907382965088, -3.865485668182373, -3.690063953399658, -3.5146424770355225, -3.3392210006713867, -3.163799285888672, -2.9883780479431152, -2.8129565715789795, -2.6375348567962646, -2.462113380432129, -2.286691665649414, -2.1112701892852783, -1.9358487129211426, -1.7604271173477173, -1.585005521774292, -1.4095839262008667, -1.2341623306274414, -1.0587408542633057, -0.8833192586898804, -0.7078976631164551, -0.5324761867523193, -0.35705459117889404, -0.18163347244262695, -0.006211906671524048, 0.16920965909957886, 0.3446311950683594, 0.5200527906417847, 0.69547438621521, 0.8708958625793457, 1.046317458152771, 1.2217390537261963, 1.3971606492996216, 1.5725822448730469, 1.7480037212371826, 1.923425316810608, 2.098846912384033, 2.274268388748169, 2.4496898651123047, 2.6251115798950195, 2.8005330562591553, 2.97595477104187, 3.151376247406006, 3.3267979621887207, 3.5022194385528564, 3.677640914916992, 3.853062629699707, 4.028484344482422, 4.203906059265137, 4.379327297210693, 4.554749011993408, 4.730170726776123, 4.90559196472168, 5.0810136795043945, 5.256435394287109, 5.431856632232666]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 6.0, 5.0, 4.0, 4.0, 6.0, 7.0, 9.0, 7.0, 15.0, 11.0, 16.0, 14.0, 21.0, 20.0, 22.0, 25.0, 20.0, 27.0, 32.0, 24.0, 34.0, 34.0, 46.0, 49.0, 33.0, 45.0, 33.0, 48.0, 38.0, 32.0, 34.0, 27.0, 30.0, 29.0, 19.0, 29.0, 12.0, 30.0, 11.0, 10.0, 12.0, 14.0, 12.0, 6.0, 9.0, 9.0, 11.0, 7.0, 5.0, 2.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6357421875, -0.6154632568359375, -0.595184326171875, -0.5749053955078125, -0.55462646484375, -0.5343475341796875, -0.514068603515625, -0.4937896728515625, -0.4735107421875, -0.4532318115234375, -0.432952880859375, -0.4126739501953125, -0.39239501953125, -0.3721160888671875, -0.351837158203125, -0.3315582275390625, -0.311279296875, -0.2910003662109375, -0.270721435546875, -0.2504425048828125, -0.23016357421875, -0.2098846435546875, -0.189605712890625, -0.1693267822265625, -0.1490478515625, -0.1287689208984375, -0.108489990234375, -0.0882110595703125, -0.06793212890625, -0.0476531982421875, -0.027374267578125, -0.0070953369140625, 0.01318359375, 0.0334625244140625, 0.053741455078125, 0.0740203857421875, 0.09429931640625, 0.1145782470703125, 0.134857177734375, 0.1551361083984375, 0.1754150390625, 0.1956939697265625, 0.215972900390625, 0.2362518310546875, 0.25653076171875, 0.2768096923828125, 0.297088623046875, 0.3173675537109375, 0.337646484375, 0.3579254150390625, 0.378204345703125, 0.3984832763671875, 0.41876220703125, 0.4390411376953125, 0.459320068359375, 0.4795989990234375, 0.4998779296875, 0.5201568603515625, 0.540435791015625, 0.5607147216796875, 0.58099365234375, 0.6012725830078125, 0.621551513671875, 0.6418304443359375, 0.662109375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 7.0, 5.0, 8.0, 10.0, 22.0, 17.0, 41.0, 66.0, 83.0, 126.0, 171.0, 326.0, 444.0, 688.0, 915.0, 1320.0, 2029.0, 2818.0, 4290.0, 6273.0, 8933.0, 13009.0, 18629.0, 26938.0, 38148.0, 53639.0, 77365.0, 135951.0, 337347.0, 97865.0, 66719.0, 46580.0, 32961.0, 23037.0, 16027.0, 11291.0, 7740.0, 5231.0, 3619.0, 2471.0, 1635.0, 1195.0, 824.0, 524.0, 388.0, 276.0, 166.0, 146.0, 82.0, 57.0, 39.0, 26.0, 19.0, 15.0, 4.0, 9.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1884765625, -1.1492462158203125, -1.110015869140625, -1.0707855224609375, -1.03155517578125, -0.9923248291015625, -0.953094482421875, -0.9138641357421875, -0.8746337890625, -0.8354034423828125, -0.796173095703125, -0.7569427490234375, -0.71771240234375, -0.6784820556640625, -0.639251708984375, -0.6000213623046875, -0.560791015625, -0.5215606689453125, -0.482330322265625, -0.4430999755859375, -0.40386962890625, -0.3646392822265625, -0.325408935546875, -0.2861785888671875, -0.2469482421875, -0.2077178955078125, -0.168487548828125, -0.1292572021484375, -0.09002685546875, -0.0507965087890625, -0.011566162109375, 0.0276641845703125, 0.06689453125, 0.1061248779296875, 0.145355224609375, 0.1845855712890625, 0.22381591796875, 0.2630462646484375, 0.302276611328125, 0.3415069580078125, 0.3807373046875, 0.4199676513671875, 0.459197998046875, 0.4984283447265625, 0.53765869140625, 0.5768890380859375, 0.616119384765625, 0.6553497314453125, 0.694580078125, 0.7338104248046875, 0.773040771484375, 0.8122711181640625, 0.85150146484375, 0.8907318115234375, 0.929962158203125, 0.9691925048828125, 1.0084228515625, 1.0476531982421875, 1.086883544921875, 1.1261138916015625, 1.16534423828125, 1.2045745849609375, 1.243804931640625, 1.2830352783203125, 1.322265625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 10.0, 10.0, 7.0, 10.0, 6.0, 21.0, 16.0, 13.0, 11.0, 18.0, 24.0, 33.0, 28.0, 35.0, 34.0, 59.0, 42.0, 46.0, 44.0, 1069.0, 27.0, 35.0, 40.0, 35.0, 47.0, 34.0, 28.0, 27.0, 29.0, 26.0, 16.0, 22.0, 18.0, 22.0, 15.0, 13.0, 11.0, 7.0, 6.0, 14.0, 8.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.60986328125, -0.59124755859375, -0.5726318359375, -0.55401611328125, -0.535400390625, -0.51678466796875, -0.4981689453125, -0.47955322265625, -0.4609375, -0.44232177734375, -0.4237060546875, -0.40509033203125, -0.386474609375, -0.36785888671875, -0.3492431640625, -0.33062744140625, -0.31201171875, -0.29339599609375, -0.2747802734375, -0.25616455078125, -0.237548828125, -0.21893310546875, -0.2003173828125, -0.18170166015625, -0.1630859375, -0.14447021484375, -0.1258544921875, -0.10723876953125, -0.088623046875, -0.07000732421875, -0.0513916015625, -0.03277587890625, -0.01416015625, 0.00445556640625, 0.0230712890625, 0.04168701171875, 0.060302734375, 0.07891845703125, 0.0975341796875, 0.11614990234375, 0.134765625, 0.15338134765625, 0.1719970703125, 0.19061279296875, 0.209228515625, 0.22784423828125, 0.2464599609375, 0.26507568359375, 0.28369140625, 0.30230712890625, 0.3209228515625, 0.33953857421875, 0.358154296875, 0.37677001953125, 0.3953857421875, 0.41400146484375, 0.4326171875, 0.45123291015625, 0.4698486328125, 0.48846435546875, 0.507080078125, 0.52569580078125, 0.5443115234375, 0.56292724609375, 0.58154296875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 3.0, 6.0, 16.0, 26.0, 32.0, 51.0, 76.0, 84.0, 129.0, 193.0, 261.0, 357.0, 529.0, 740.0, 1150.0, 1687.0, 2471.0, 3666.0, 5609.0, 8762.0, 14345.0, 23537.0, 41284.0, 77973.0, 184725.0, 1078431.0, 390957.0, 119477.0, 57502.0, 31590.0, 18441.0, 11403.0, 7175.0, 4794.0, 3109.0, 2005.0, 1421.0, 960.0, 667.0, 448.0, 301.0, 218.0, 123.0, 139.0, 90.0, 56.0, 39.0, 32.0, 12.0, 12.0, 8.0, 8.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.95654296875, -0.9244155883789062, -0.8922882080078125, -0.8601608276367188, -0.828033447265625, -0.7959060668945312, -0.7637786865234375, -0.7316513061523438, -0.69952392578125, -0.6673965454101562, -0.6352691650390625, -0.6031417846679688, -0.571014404296875, -0.5388870239257812, -0.5067596435546875, -0.47463226318359375, -0.4425048828125, -0.41037750244140625, -0.3782501220703125, -0.34612274169921875, -0.313995361328125, -0.28186798095703125, -0.2497406005859375, -0.21761322021484375, -0.18548583984375, -0.15335845947265625, -0.1212310791015625, -0.08910369873046875, -0.056976318359375, -0.02484893798828125, 0.0072784423828125, 0.03940582275390625, 0.071533203125, 0.10366058349609375, 0.1357879638671875, 0.16791534423828125, 0.200042724609375, 0.23217010498046875, 0.2642974853515625, 0.29642486572265625, 0.32855224609375, 0.36067962646484375, 0.3928070068359375, 0.42493438720703125, 0.457061767578125, 0.48918914794921875, 0.5213165283203125, 0.5534439086914062, 0.5855712890625, 0.6176986694335938, 0.6498260498046875, 0.6819534301757812, 0.714080810546875, 0.7462081909179688, 0.7783355712890625, 0.8104629516601562, 0.84259033203125, 0.8747177124023438, 0.9068450927734375, 0.9389724731445312, 0.971099853515625, 1.0032272338867188, 1.0353546142578125, 1.0674819946289062, 1.099609375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 8.0, 3.0, 9.0, 10.0, 13.0, 12.0, 16.0, 15.0, 19.0, 23.0, 25.0, 52.0, 51.0, 61.0, 114.0, 197.0, 58.0, 68.0, 51.0, 38.0, 28.0, 26.0, 24.0, 12.0, 11.0, 11.0, 10.0, 8.0, 9.0, 5.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.35009765625, -0.33849334716796875, -0.3268890380859375, -0.31528472900390625, -0.303680419921875, -0.29207611083984375, -0.2804718017578125, -0.26886749267578125, -0.25726318359375, -0.24565887451171875, -0.2340545654296875, -0.22245025634765625, -0.210845947265625, -0.19924163818359375, -0.1876373291015625, -0.17603302001953125, -0.1644287109375, -0.15282440185546875, -0.1412200927734375, -0.12961578369140625, -0.118011474609375, -0.10640716552734375, -0.0948028564453125, -0.08319854736328125, -0.07159423828125, -0.05998992919921875, -0.0483856201171875, -0.03678131103515625, -0.025177001953125, -0.01357269287109375, -0.0019683837890625, 0.00963592529296875, 0.021240234375, 0.03284454345703125, 0.0444488525390625, 0.05605316162109375, 0.067657470703125, 0.07926177978515625, 0.0908660888671875, 0.10247039794921875, 0.11407470703125, 0.12567901611328125, 0.1372833251953125, 0.14888763427734375, 0.160491943359375, 0.17209625244140625, 0.1837005615234375, 0.19530487060546875, 0.2069091796875, 0.21851348876953125, 0.2301177978515625, 0.24172210693359375, 0.253326416015625, 0.26493072509765625, 0.2765350341796875, 0.28813934326171875, 0.29974365234375, 0.31134796142578125, 0.3229522705078125, 0.33455657958984375, 0.346160888671875, 0.35776519775390625, 0.3693695068359375, 0.38097381591796875, 0.392578125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 9.0, 5.0, 4.0, 7.0, 22.0, 16.0, 26.0, 41.0, 30.0, 63.0, 74.0, 113.0, 182.0, 315.0, 1409.0, 13063.0, 356743.0, 658102.0, 15629.0, 1724.0, 397.0, 192.0, 109.0, 66.0, 57.0, 31.0, 32.0, 19.0, 18.0, 10.0, 8.0, 11.0, 11.0, 6.0, 2.0, 6.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.65625, -5.49481201171875, -5.3333740234375, -5.17193603515625, -5.010498046875, -4.84906005859375, -4.6876220703125, -4.52618408203125, -4.36474609375, -4.20330810546875, -4.0418701171875, -3.88043212890625, -3.718994140625, -3.55755615234375, -3.3961181640625, -3.23468017578125, -3.0732421875, -2.91180419921875, -2.7503662109375, -2.58892822265625, -2.427490234375, -2.26605224609375, -2.1046142578125, -1.94317626953125, -1.78173828125, -1.62030029296875, -1.4588623046875, -1.29742431640625, -1.135986328125, -0.97454833984375, -0.8131103515625, -0.65167236328125, -0.490234375, -0.32879638671875, -0.1673583984375, -0.00592041015625, 0.155517578125, 0.31695556640625, 0.4783935546875, 0.63983154296875, 0.80126953125, 0.96270751953125, 1.1241455078125, 1.28558349609375, 1.447021484375, 1.60845947265625, 1.7698974609375, 1.93133544921875, 2.0927734375, 2.25421142578125, 2.4156494140625, 2.57708740234375, 2.738525390625, 2.89996337890625, 3.0614013671875, 3.22283935546875, 3.38427734375, 3.54571533203125, 3.7071533203125, 3.86859130859375, 4.030029296875, 4.19146728515625, 4.3529052734375, 4.51434326171875, 4.67578125]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 5.0, 17.0, 17.0, 35.0, 60.0, 106.0, 163.0, 210.0, 160.0, 104.0, 64.0, 35.0, 21.0, 9.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5971916913986206, -0.5528547167778015, -0.5085177421569824, -0.46418073773384094, -0.41984376311302185, -0.37550678849220276, -0.3311697840690613, -0.2868328094482422, -0.2424958348274231, -0.198158860206604, -0.15382187068462372, -0.10948488116264343, -0.06514790654182434, -0.02081093192100525, 0.02352607250213623, 0.06786304712295532, 0.11220002174377441, 0.1565369963645935, 0.2008739858865738, 0.24521097540855408, 0.28954795002937317, 0.33388492465019226, 0.37822192907333374, 0.42255890369415283, 0.4668958783149719, 0.511232852935791, 0.5555698275566101, 0.5999068021774292, 0.6442438364028931, 0.6885807514190674, 0.7329177856445312, 0.7772547602653503, 0.821591854095459, 0.8659288287162781, 0.9102658033370972, 0.954602837562561, 0.9989397525787354, 1.0432767868041992, 1.087613821029663, 1.1319507360458374, 1.1762876510620117, 1.2206246852874756, 1.26496160030365, 1.3092986345291138, 1.353635549545288, 1.397972583770752, 1.4423096179962158, 1.4866465330123901, 1.530983567237854, 1.5753206014633179, 1.6196575164794922, 1.663994550704956, 1.7083314657211304, 1.7526684999465942, 1.7970054149627686, 1.8413424491882324, 1.8856794834136963, 1.9300165176391602, 1.9743534326553345, 2.018690347671509, 2.0630273818969727, 2.1073644161224365, 2.1517014503479004, 2.196038246154785, 2.240375280380249]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 6.0, 6.0, 3.0, 5.0, 9.0, 15.0, 18.0, 15.0, 13.0, 11.0, 18.0, 26.0, 31.0, 24.0, 27.0, 36.0, 33.0, 32.0, 42.0, 33.0, 47.0, 39.0, 37.0, 41.0, 45.0, 43.0, 25.0, 48.0, 37.0, 39.0, 24.0, 25.0, 14.0, 30.0, 19.0, 18.0, 16.0, 11.0, 6.0, 13.0, 3.0, 5.0, 6.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.40269768238067627, -0.3897084593772888, -0.37671926617622375, -0.3637300729751587, -0.35074084997177124, -0.3377516269683838, -0.3247624337673187, -0.31177324056625366, -0.2987840175628662, -0.28579479455947876, -0.2728056013584137, -0.25981640815734863, -0.24682718515396118, -0.23383797705173492, -0.22084876894950867, -0.2078595608472824, -0.19487035274505615, -0.1818811446428299, -0.16889193654060364, -0.15590272843837738, -0.14291352033615112, -0.12992431223392487, -0.11693510413169861, -0.10394589602947235, -0.0909566879272461, -0.07796747982501984, -0.06497827172279358, -0.05198906362056732, -0.038999855518341064, -0.026010647416114807, -0.01302143931388855, -3.223121166229248e-05, 0.012956976890563965, 0.025946184992790222, 0.03893539309501648, 0.05192460119724274, 0.064913809299469, 0.07790301740169525, 0.09089222550392151, 0.10388143360614777, 0.11687064170837402, 0.12985984981060028, 0.14284905791282654, 0.1558382660150528, 0.16882747411727905, 0.1818166822195053, 0.19480589032173157, 0.20779509842395782, 0.22078430652618408, 0.23377351462841034, 0.2467627227306366, 0.25975191593170166, 0.2727411389350891, 0.28573036193847656, 0.2987195551395416, 0.3117087483406067, 0.32469797134399414, 0.3376871943473816, 0.35067638754844666, 0.3636655807495117, 0.37665480375289917, 0.3896440267562866, 0.4026332199573517, 0.41562241315841675, 0.4286116361618042]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 7.0, 0.0, 6.0, 8.0, 7.0, 9.0, 8.0, 11.0, 13.0, 19.0, 18.0, 21.0, 17.0, 27.0, 26.0, 21.0, 26.0, 22.0, 34.0, 33.0, 44.0, 51.0, 45.0, 27.0, 47.0, 44.0, 46.0, 33.0, 34.0, 20.0, 33.0, 30.0, 25.0, 31.0, 17.0, 23.0, 20.0, 13.0, 12.0, 15.0, 7.0, 8.0, 10.0, 9.0, 11.0, 9.0, 1.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62548828125, -0.604583740234375, -0.58367919921875, -0.562774658203125, -0.5418701171875, -0.520965576171875, -0.50006103515625, -0.479156494140625, -0.458251953125, -0.437347412109375, -0.41644287109375, -0.395538330078125, -0.3746337890625, -0.353729248046875, -0.33282470703125, -0.311920166015625, -0.291015625, -0.270111083984375, -0.24920654296875, -0.228302001953125, -0.2073974609375, -0.186492919921875, -0.16558837890625, -0.144683837890625, -0.123779296875, -0.102874755859375, -0.08197021484375, -0.061065673828125, -0.0401611328125, -0.019256591796875, 0.00164794921875, 0.022552490234375, 0.04345703125, 0.064361572265625, 0.08526611328125, 0.106170654296875, 0.1270751953125, 0.147979736328125, 0.16888427734375, 0.189788818359375, 0.210693359375, 0.231597900390625, 0.25250244140625, 0.273406982421875, 0.2943115234375, 0.315216064453125, 0.33612060546875, 0.357025146484375, 0.3779296875, 0.398834228515625, 0.41973876953125, 0.440643310546875, 0.4615478515625, 0.482452392578125, 0.50335693359375, 0.524261474609375, 0.545166015625, 0.566070556640625, 0.58697509765625, 0.607879638671875, 0.6287841796875, 0.649688720703125, 0.67059326171875, 0.691497802734375, 0.71240234375]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 10.0, 14.0, 23.0, 26.0, 25.0, 61.0, 80.0, 143.0, 205.0, 344.0, 529.0, 838.0, 1369.0, 2487.0, 4261.0, 7503.0, 13308.0, 25473.0, 54100.0, 148231.0, 454110.0, 202086.0, 67085.0, 30385.0, 15491.0, 8571.0, 4775.0, 2759.0, 1654.0, 976.0, 587.0, 404.0, 207.0, 153.0, 100.0, 43.0, 46.0, 27.0, 16.0, 15.0, 14.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95166015625, -0.9195327758789062, -0.8874053955078125, -0.8552780151367188, -0.823150634765625, -0.7910232543945312, -0.7588958740234375, -0.7267684936523438, -0.69464111328125, -0.6625137329101562, -0.6303863525390625, -0.5982589721679688, -0.566131591796875, -0.5340042114257812, -0.5018768310546875, -0.46974945068359375, -0.4376220703125, -0.40549468994140625, -0.3733673095703125, -0.34123992919921875, -0.309112548828125, -0.27698516845703125, -0.2448577880859375, -0.21273040771484375, -0.18060302734375, -0.14847564697265625, -0.1163482666015625, -0.08422088623046875, -0.052093505859375, -0.01996612548828125, 0.0121612548828125, 0.04428863525390625, 0.076416015625, 0.10854339599609375, 0.1406707763671875, 0.17279815673828125, 0.204925537109375, 0.23705291748046875, 0.2691802978515625, 0.30130767822265625, 0.33343505859375, 0.36556243896484375, 0.3976898193359375, 0.42981719970703125, 0.461944580078125, 0.49407196044921875, 0.5261993408203125, 0.5583267211914062, 0.5904541015625, 0.6225814819335938, 0.6547088623046875, 0.6868362426757812, 0.718963623046875, 0.7510910034179688, 0.7832183837890625, 0.8153457641601562, 0.84747314453125, 0.8796005249023438, 0.9117279052734375, 0.9438552856445312, 0.975982666015625, 1.0081100463867188, 1.0402374267578125, 1.0723648071289062, 1.1044921875]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 11.0, 5.0, 5.0, 8.0, 9.0, 9.0, 14.0, 10.0, 18.0, 15.0, 24.0, 19.0, 32.0, 28.0, 31.0, 36.0, 42.0, 54.0, 69.0, 98.0, 209.0, 1445.0, 222.0, 123.0, 83.0, 70.0, 45.0, 42.0, 41.0, 28.0, 27.0, 27.0, 34.0, 24.0, 15.0, 15.0, 18.0, 15.0, 6.0, 5.0, 4.0, 4.0, 3.0, 10.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.18359375, -2.1099853515625, -2.036376953125, -1.9627685546875, -1.88916015625, -1.8155517578125, -1.741943359375, -1.6683349609375, -1.5947265625, -1.5211181640625, -1.447509765625, -1.3739013671875, -1.30029296875, -1.2266845703125, -1.153076171875, -1.0794677734375, -1.005859375, -0.9322509765625, -0.858642578125, -0.7850341796875, -0.71142578125, -0.6378173828125, -0.564208984375, -0.4906005859375, -0.4169921875, -0.3433837890625, -0.269775390625, -0.1961669921875, -0.12255859375, -0.0489501953125, 0.024658203125, 0.0982666015625, 0.171875, 0.2454833984375, 0.319091796875, 0.3927001953125, 0.46630859375, 0.5399169921875, 0.613525390625, 0.6871337890625, 0.7607421875, 0.8343505859375, 0.907958984375, 0.9815673828125, 1.05517578125, 1.1287841796875, 1.202392578125, 1.2760009765625, 1.349609375, 1.4232177734375, 1.496826171875, 1.5704345703125, 1.64404296875, 1.7176513671875, 1.791259765625, 1.8648681640625, 1.9384765625, 2.0120849609375, 2.085693359375, 2.1593017578125, 2.23291015625, 2.3065185546875, 2.380126953125, 2.4537353515625, 2.52734375]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 4.0, 8.0, 9.0, 5.0, 3.0, 12.0, 9.0, 22.0, 22.0, 20.0, 35.0, 47.0, 57.0, 93.0, 118.0, 186.0, 300.0, 709.0, 2081.0, 8202.0, 46852.0, 1203301.0, 1813652.0, 56499.0, 9313.0, 2405.0, 768.0, 363.0, 195.0, 113.0, 68.0, 52.0, 37.0, 34.0, 22.0, 20.0, 11.0, 13.0, 13.0, 4.0, 11.0, 8.0, 1.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.287109375, -3.169891357421875, -3.05267333984375, -2.935455322265625, -2.8182373046875, -2.701019287109375, -2.58380126953125, -2.466583251953125, -2.349365234375, -2.232147216796875, -2.11492919921875, -1.997711181640625, -1.8804931640625, -1.763275146484375, -1.64605712890625, -1.528839111328125, -1.41162109375, -1.294403076171875, -1.17718505859375, -1.059967041015625, -0.9427490234375, -0.825531005859375, -0.70831298828125, -0.591094970703125, -0.473876953125, -0.356658935546875, -0.23944091796875, -0.122222900390625, -0.0050048828125, 0.112213134765625, 0.22943115234375, 0.346649169921875, 0.4638671875, 0.581085205078125, 0.69830322265625, 0.815521240234375, 0.9327392578125, 1.049957275390625, 1.16717529296875, 1.284393310546875, 1.401611328125, 1.518829345703125, 1.63604736328125, 1.753265380859375, 1.8704833984375, 1.987701416015625, 2.10491943359375, 2.222137451171875, 2.33935546875, 2.456573486328125, 2.57379150390625, 2.691009521484375, 2.8082275390625, 2.925445556640625, 3.04266357421875, 3.159881591796875, 3.277099609375, 3.394317626953125, 3.51153564453125, 3.628753662109375, 3.7459716796875, 3.863189697265625, 3.98040771484375, 4.097625732421875, 4.21484375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [52.0, 574.0, 374.0, 15.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2827086448669434, -1.0566604137420654, 0.1693878173828125, 1.3954360485076904, 2.6214842796325684, 3.8475327491760254, 5.073580741882324, 6.299628734588623, 7.52567720413208, 8.751725196838379, 9.977773666381836, 11.203822135925293, 12.42987060546875, 13.65591812133789, 14.881966590881348, 16.108015060424805, 17.334062576293945, 18.560110092163086, 19.78615951538086, 21.01220703125, 22.23825454711914, 23.464303970336914, 24.690351486206055, 25.916400909423828, 27.14244842529297, 28.36849594116211, 29.594545364379883, 30.820592880249023, 32.0466423034668, 33.27268981933594, 34.49873733520508, 35.72478485107422, 36.950836181640625, 38.176883697509766, 39.402931213378906, 40.62898254394531, 41.85503005981445, 43.081077575683594, 44.307125091552734, 45.533172607421875, 46.75922393798828, 47.98527145385742, 49.21131896972656, 50.43737030029297, 51.66341781616211, 52.88946533203125, 54.11551284790039, 55.34156036376953, 56.56760787963867, 57.79365539550781, 59.01970291137695, 60.24575424194336, 61.4718017578125, 62.69784927368164, 63.92389678955078, 65.14994812011719, 66.37599182128906, 67.60204315185547, 68.82808685302734, 70.05413818359375, 71.28018188476562, 72.50623321533203, 73.73228454589844, 74.95832824707031, 76.18437957763672]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 5.0, 9.0, 12.0, 8.0, 10.0, 11.0, 15.0, 21.0, 32.0, 25.0, 28.0, 30.0, 26.0, 43.0, 30.0, 40.0, 37.0, 49.0, 42.0, 41.0, 50.0, 44.0, 39.0, 31.0, 40.0, 24.0, 35.0, 28.0, 21.0, 22.0, 20.0, 26.0, 10.0, 10.0, 17.0, 11.0, 12.0, 8.0, 6.0, 9.0, 5.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.989790439605713, -6.767862796783447, -6.545935153961182, -6.324007034301758, -6.102079391479492, -5.880151748657227, -5.658224105834961, -5.436296463012695, -5.21436882019043, -4.992441177368164, -4.770513534545898, -4.548585891723633, -4.326657772064209, -4.104730129241943, -3.8828024864196777, -3.660874843597412, -3.4389467239379883, -3.2170190811157227, -2.995091199874878, -2.7731635570526123, -2.5512356758117676, -2.329308032989502, -2.1073803901672363, -1.8854526281356812, -1.663524866104126, -1.4415971040725708, -1.2196693420410156, -0.99774169921875, -0.7758139371871948, -0.5538861751556396, -0.331958532333374, -0.11003077030181885, 0.11189746856689453, 0.3338252007961273, 0.5557529330253601, 0.7776806354522705, 0.9996083974838257, 1.2215361595153809, 1.4434638023376465, 1.6653915643692017, 1.8873193264007568, 2.1092469692230225, 2.331174850463867, 2.553102493286133, 2.7750301361083984, 2.996958017349243, 3.218885660171509, 3.4408135414123535, 3.662741184234619, 3.8846688270568848, 4.10659646987915, 4.328524589538574, 4.55045223236084, 4.7723798751831055, 4.994307518005371, 5.216235160827637, 5.438162803649902, 5.660090446472168, 5.882018089294434, 6.103945732116699, 6.325873851776123, 6.547801494598389, 6.769729137420654, 6.99165678024292, 7.213584899902344]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 4.0, 10.0, 9.0, 7.0, 5.0, 9.0, 14.0, 17.0, 25.0, 22.0, 17.0, 16.0, 26.0, 21.0, 30.0, 30.0, 22.0, 34.0, 46.0, 50.0, 42.0, 34.0, 42.0, 43.0, 35.0, 38.0, 36.0, 38.0, 37.0, 26.0, 17.0, 24.0, 18.0, 22.0, 22.0, 17.0, 14.0, 10.0, 10.0, 14.0, 9.0, 10.0, 12.0, 4.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.6904296875, -0.669036865234375, -0.64764404296875, -0.626251220703125, -0.6048583984375, -0.583465576171875, -0.56207275390625, -0.540679931640625, -0.519287109375, -0.497894287109375, -0.47650146484375, -0.455108642578125, -0.4337158203125, -0.412322998046875, -0.39093017578125, -0.369537353515625, -0.34814453125, -0.326751708984375, -0.30535888671875, -0.283966064453125, -0.2625732421875, -0.241180419921875, -0.21978759765625, -0.198394775390625, -0.177001953125, -0.155609130859375, -0.13421630859375, -0.112823486328125, -0.0914306640625, -0.070037841796875, -0.04864501953125, -0.027252197265625, -0.005859375, 0.015533447265625, 0.03692626953125, 0.058319091796875, 0.0797119140625, 0.101104736328125, 0.12249755859375, 0.143890380859375, 0.165283203125, 0.186676025390625, 0.20806884765625, 0.229461669921875, 0.2508544921875, 0.272247314453125, 0.29364013671875, 0.315032958984375, 0.33642578125, 0.357818603515625, 0.37921142578125, 0.400604248046875, 0.4219970703125, 0.443389892578125, 0.46478271484375, 0.486175537109375, 0.507568359375, 0.528961181640625, 0.55035400390625, 0.571746826171875, 0.5931396484375, 0.614532470703125, 0.63592529296875, 0.657318115234375, 0.6787109375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 1.0, 11.0, 7.0, 9.0, 17.0, 24.0, 31.0, 40.0, 69.0, 105.0, 117.0, 199.0, 320.0, 390.0, 589.0, 1012.0, 1492.0, 2471.0, 4155.0, 7161.0, 13473.0, 27307.0, 63121.0, 201068.0, 1010276.0, 2073513.0, 567138.0, 127445.0, 46146.0, 20859.0, 10602.0, 5825.0, 3517.0, 2016.0, 1271.0, 826.0, 525.0, 354.0, 247.0, 158.0, 128.0, 78.0, 41.0, 45.0, 34.0, 17.0, 8.0, 14.0, 5.0, 4.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2421875, -1.1998291015625, -1.157470703125, -1.1151123046875, -1.07275390625, -1.0303955078125, -0.988037109375, -0.9456787109375, -0.9033203125, -0.8609619140625, -0.818603515625, -0.7762451171875, -0.73388671875, -0.6915283203125, -0.649169921875, -0.6068115234375, -0.564453125, -0.5220947265625, -0.479736328125, -0.4373779296875, -0.39501953125, -0.3526611328125, -0.310302734375, -0.2679443359375, -0.2255859375, -0.1832275390625, -0.140869140625, -0.0985107421875, -0.05615234375, -0.0137939453125, 0.028564453125, 0.0709228515625, 0.11328125, 0.1556396484375, 0.197998046875, 0.2403564453125, 0.28271484375, 0.3250732421875, 0.367431640625, 0.4097900390625, 0.4521484375, 0.4945068359375, 0.536865234375, 0.5792236328125, 0.62158203125, 0.6639404296875, 0.706298828125, 0.7486572265625, 0.791015625, 0.8333740234375, 0.875732421875, 0.9180908203125, 0.96044921875, 1.0028076171875, 1.045166015625, 1.0875244140625, 1.1298828125, 1.1722412109375, 1.214599609375, 1.2569580078125, 1.29931640625, 1.3416748046875, 1.384033203125, 1.4263916015625, 1.46875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 9.0, 13.0, 8.0, 18.0, 18.0, 29.0, 26.0, 45.0, 50.0, 62.0, 88.0, 121.0, 171.0, 242.0, 305.0, 405.0, 504.0, 470.0, 375.0, 270.0, 207.0, 156.0, 120.0, 80.0, 67.0, 47.0, 44.0, 21.0, 30.0, 7.0, 19.0, 14.0, 6.0, 2.0, 7.0, 8.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.708984375, -1.657012939453125, -1.60504150390625, -1.553070068359375, -1.5010986328125, -1.449127197265625, -1.39715576171875, -1.345184326171875, -1.293212890625, -1.241241455078125, -1.18927001953125, -1.137298583984375, -1.0853271484375, -1.033355712890625, -0.98138427734375, -0.929412841796875, -0.87744140625, -0.825469970703125, -0.77349853515625, -0.721527099609375, -0.6695556640625, -0.617584228515625, -0.56561279296875, -0.513641357421875, -0.461669921875, -0.409698486328125, -0.35772705078125, -0.305755615234375, -0.2537841796875, -0.201812744140625, -0.14984130859375, -0.097869873046875, -0.0458984375, 0.006072998046875, 0.05804443359375, 0.110015869140625, 0.1619873046875, 0.213958740234375, 0.26593017578125, 0.317901611328125, 0.369873046875, 0.421844482421875, 0.47381591796875, 0.525787353515625, 0.5777587890625, 0.629730224609375, 0.68170166015625, 0.733673095703125, 0.78564453125, 0.837615966796875, 0.88958740234375, 0.941558837890625, 0.9935302734375, 1.045501708984375, 1.09747314453125, 1.149444580078125, 1.201416015625, 1.253387451171875, 1.30535888671875, 1.357330322265625, 1.4093017578125, 1.461273193359375, 1.51324462890625, 1.565216064453125, 1.6171875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 1.0, 3.0, 11.0, 7.0, 12.0, 20.0, 16.0, 25.0, 22.0, 34.0, 36.0, 81.0, 103.0, 127.0, 218.0, 322.0, 493.0, 739.0, 1121.0, 1769.0, 2710.0, 4501.0, 7368.0, 12900.0, 23041.0, 43843.0, 91329.0, 220142.0, 664973.0, 1740329.0, 878759.0, 274769.0, 110015.0, 51208.0, 26574.0, 14755.0, 8470.0, 4913.0, 2973.0, 1904.0, 1196.0, 788.0, 518.0, 367.0, 247.0, 138.0, 123.0, 99.0, 52.0, 37.0, 21.0, 18.0, 16.0, 11.0, 6.0, 7.0, 3.0, 4.0], "bins": [-1.771484375, -1.72174072265625, -1.6719970703125, -1.62225341796875, -1.572509765625, -1.52276611328125, -1.4730224609375, -1.42327880859375, -1.37353515625, -1.32379150390625, -1.2740478515625, -1.22430419921875, -1.174560546875, -1.12481689453125, -1.0750732421875, -1.02532958984375, -0.9755859375, -0.92584228515625, -0.8760986328125, -0.82635498046875, -0.776611328125, -0.72686767578125, -0.6771240234375, -0.62738037109375, -0.57763671875, -0.52789306640625, -0.4781494140625, -0.42840576171875, -0.378662109375, -0.32891845703125, -0.2791748046875, -0.22943115234375, -0.1796875, -0.12994384765625, -0.0802001953125, -0.03045654296875, 0.019287109375, 0.06903076171875, 0.1187744140625, 0.16851806640625, 0.21826171875, 0.26800537109375, 0.3177490234375, 0.36749267578125, 0.417236328125, 0.46697998046875, 0.5167236328125, 0.56646728515625, 0.6162109375, 0.66595458984375, 0.7156982421875, 0.76544189453125, 0.815185546875, 0.86492919921875, 0.9146728515625, 0.96441650390625, 1.01416015625, 1.06390380859375, 1.1136474609375, 1.16339111328125, 1.213134765625, 1.26287841796875, 1.3126220703125, 1.36236572265625, 1.412109375]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 17.0, 23.0, 45.0, 45.0, 86.0, 94.0, 120.0, 116.0, 140.0, 99.0, 82.0, 46.0, 36.0, 18.0, 14.0, 7.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.55085277557373, -13.13388442993164, -12.71691608428955, -12.299947738647461, -11.882979393005371, -11.466011047363281, -11.049042701721191, -10.632074356079102, -10.215106010437012, -9.798137664794922, -9.381169319152832, -8.964200973510742, -8.547232627868652, -8.130264282226562, -7.713295936584473, -7.296327590942383, -6.879358768463135, -6.462390422821045, -6.045422077178955, -5.628453731536865, -5.211485385894775, -4.794516563415527, -4.3775482177734375, -3.9605801105499268, -3.543611764907837, -3.126643419265747, -2.7096750736236572, -2.2927064895629883, -1.875738263130188, -1.4587697982788086, -1.0418014526367188, -0.6248331069946289, -0.20786476135253906, 0.20910361409187317, 0.6260719895362854, 1.04304039478302, 1.4600087404251099, 1.8769772052764893, 2.293945550918579, 2.710913896560669, 3.127882242202759, 3.5448505878448486, 3.9618189334869385, 4.378787517547607, 4.795755863189697, 5.212724208831787, 5.629692554473877, 6.046660900115967, 6.463629245758057, 6.8805975914001465, 7.297565937042236, 7.714534282684326, 8.131503105163574, 8.548471450805664, 8.965439796447754, 9.382408142089844, 9.799376487731934, 10.216344833374023, 10.633313179016113, 11.050281524658203, 11.467249870300293, 11.884218215942383, 12.301186561584473, 12.718154907226562, 13.135123252868652]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 8.0, 7.0, 9.0, 14.0, 17.0, 15.0, 14.0, 13.0, 20.0, 29.0, 25.0, 25.0, 26.0, 40.0, 37.0, 40.0, 44.0, 38.0, 37.0, 55.0, 40.0, 42.0, 50.0, 42.0, 39.0, 38.0, 35.0, 36.0, 40.0, 21.0, 20.0, 18.0, 14.0, 9.0, 12.0, 7.0, 9.0, 3.0, 7.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.6853227615356445, -6.489800453186035, -6.294277667999268, -6.098755359649658, -5.903232574462891, -5.707710266113281, -5.512187480926514, -5.316665172576904, -5.121142387390137, -4.925620079040527, -4.73009729385376, -4.53457498550415, -4.339052200317383, -4.143529891967773, -3.948007106781006, -3.7524847984313965, -3.556962251663208, -3.3614397048950195, -3.165917158126831, -2.9703946113586426, -2.774872064590454, -2.5793495178222656, -2.3838272094726562, -2.1883044242858887, -1.9927819967269897, -1.7972594499588013, -1.6017369031906128, -1.4062144756317139, -1.2106919288635254, -1.015169382095337, -0.8196468353271484, -0.62412428855896, -0.4286017417907715, -0.2330792099237442, -0.03755667805671692, 0.15796583890914917, 0.35348838567733765, 0.5490109324455261, 0.7445334196090698, 0.9400559663772583, 1.1355785131454468, 1.3311010599136353, 1.5266236066818237, 1.7221460342407227, 1.9176685810089111, 2.1131911277770996, 2.308713674545288, 2.5042362213134766, 2.699758768081665, 2.8952813148498535, 3.090803861618042, 3.2863264083862305, 3.481848955154419, 3.6773715019226074, 3.872893810272217, 4.068416595458984, 4.263938903808594, 4.459461212158203, 4.654983997344971, 4.85050630569458, 5.046029090881348, 5.241551399230957, 5.437074184417725, 5.632596492767334, 5.828119277954102]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 5.0, 9.0, 17.0, 8.0, 16.0, 16.0, 20.0, 15.0, 20.0, 23.0, 28.0, 21.0, 30.0, 32.0, 32.0, 28.0, 39.0, 35.0, 39.0, 37.0, 47.0, 36.0, 34.0, 45.0, 43.0, 38.0, 28.0, 27.0, 30.0, 27.0, 19.0, 17.0, 17.0, 18.0, 15.0, 19.0, 15.0, 10.0, 7.0, 9.0, 5.0, 6.0, 5.0, 6.0, 0.0, 4.0, 1.0, 3.0, 2.0, 2.0], "bins": [-0.73046875, -0.7092666625976562, -0.6880645751953125, -0.6668624877929688, -0.645660400390625, -0.6244583129882812, -0.6032562255859375, -0.5820541381835938, -0.56085205078125, -0.5396499633789062, -0.5184478759765625, -0.49724578857421875, -0.476043701171875, -0.45484161376953125, -0.4336395263671875, -0.41243743896484375, -0.3912353515625, -0.37003326416015625, -0.3488311767578125, -0.32762908935546875, -0.306427001953125, -0.28522491455078125, -0.2640228271484375, -0.24282073974609375, -0.22161865234375, -0.20041656494140625, -0.1792144775390625, -0.15801239013671875, -0.136810302734375, -0.11560821533203125, -0.0944061279296875, -0.07320404052734375, -0.052001953125, -0.03079986572265625, -0.0095977783203125, 0.01160430908203125, 0.032806396484375, 0.05400848388671875, 0.0752105712890625, 0.09641265869140625, 0.11761474609375, 0.13881683349609375, 0.1600189208984375, 0.18122100830078125, 0.202423095703125, 0.22362518310546875, 0.2448272705078125, 0.26602935791015625, 0.2872314453125, 0.30843353271484375, 0.3296356201171875, 0.35083770751953125, 0.372039794921875, 0.39324188232421875, 0.4144439697265625, 0.43564605712890625, 0.45684814453125, 0.47805023193359375, 0.4992523193359375, 0.5204544067382812, 0.541656494140625, 0.5628585815429688, 0.5840606689453125, 0.6052627563476562, 0.62646484375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 13.0, 19.0, 16.0, 39.0, 52.0, 93.0, 123.0, 201.0, 313.0, 537.0, 859.0, 1303.0, 2107.0, 3260.0, 5264.0, 8357.0, 13770.0, 22329.0, 36208.0, 58434.0, 93126.0, 143010.0, 245725.0, 151335.0, 98804.0, 62457.0, 38823.0, 23585.0, 14602.0, 8711.0, 5484.0, 3542.0, 2273.0, 1347.0, 873.0, 536.0, 353.0, 253.0, 155.0, 101.0, 63.0, 49.0, 18.0, 22.0, 7.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.517578125, -1.467926025390625, -1.41827392578125, -1.368621826171875, -1.3189697265625, -1.269317626953125, -1.21966552734375, -1.170013427734375, -1.120361328125, -1.070709228515625, -1.02105712890625, -0.971405029296875, -0.9217529296875, -0.872100830078125, -0.82244873046875, -0.772796630859375, -0.72314453125, -0.673492431640625, -0.62384033203125, -0.574188232421875, -0.5245361328125, -0.474884033203125, -0.42523193359375, -0.375579833984375, -0.325927734375, -0.276275634765625, -0.22662353515625, -0.176971435546875, -0.1273193359375, -0.077667236328125, -0.02801513671875, 0.021636962890625, 0.0712890625, 0.120941162109375, 0.17059326171875, 0.220245361328125, 0.2698974609375, 0.319549560546875, 0.36920166015625, 0.418853759765625, 0.468505859375, 0.518157958984375, 0.56781005859375, 0.617462158203125, 0.6671142578125, 0.716766357421875, 0.76641845703125, 0.816070556640625, 0.86572265625, 0.915374755859375, 0.96502685546875, 1.014678955078125, 1.0643310546875, 1.113983154296875, 1.16363525390625, 1.213287353515625, 1.262939453125, 1.312591552734375, 1.36224365234375, 1.411895751953125, 1.4615478515625, 1.511199951171875, 1.56085205078125, 1.610504150390625, 1.66015625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 6.0, 5.0, 11.0, 9.0, 10.0, 20.0, 17.0, 23.0, 18.0, 24.0, 30.0, 27.0, 24.0, 31.0, 31.0, 33.0, 37.0, 34.0, 43.0, 47.0, 1062.0, 38.0, 37.0, 43.0, 44.0, 36.0, 31.0, 24.0, 20.0, 27.0, 24.0, 19.0, 13.0, 22.0, 21.0, 11.0, 9.0, 12.0, 15.0, 7.0, 3.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.595703125, -0.578033447265625, -0.56036376953125, -0.542694091796875, -0.5250244140625, -0.507354736328125, -0.48968505859375, -0.472015380859375, -0.454345703125, -0.436676025390625, -0.41900634765625, -0.401336669921875, -0.3836669921875, -0.365997314453125, -0.34832763671875, -0.330657958984375, -0.31298828125, -0.295318603515625, -0.27764892578125, -0.259979248046875, -0.2423095703125, -0.224639892578125, -0.20697021484375, -0.189300537109375, -0.171630859375, -0.153961181640625, -0.13629150390625, -0.118621826171875, -0.1009521484375, -0.083282470703125, -0.06561279296875, -0.047943115234375, -0.0302734375, -0.012603759765625, 0.00506591796875, 0.022735595703125, 0.0404052734375, 0.058074951171875, 0.07574462890625, 0.093414306640625, 0.111083984375, 0.128753662109375, 0.14642333984375, 0.164093017578125, 0.1817626953125, 0.199432373046875, 0.21710205078125, 0.234771728515625, 0.25244140625, 0.270111083984375, 0.28778076171875, 0.305450439453125, 0.3231201171875, 0.340789794921875, 0.35845947265625, 0.376129150390625, 0.393798828125, 0.411468505859375, 0.42913818359375, 0.446807861328125, 0.4644775390625, 0.482147216796875, 0.49981689453125, 0.517486572265625, 0.53515625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 4.0, 8.0, 2.0, 19.0, 22.0, 38.0, 53.0, 76.0, 97.0, 151.0, 201.0, 347.0, 486.0, 675.0, 1082.0, 1631.0, 2558.0, 3900.0, 6021.0, 9352.0, 14858.0, 24921.0, 42888.0, 78388.0, 163921.0, 499394.0, 809958.0, 213572.0, 95154.0, 50440.0, 29109.0, 17413.0, 10717.0, 6884.0, 4298.0, 2833.0, 1803.0, 1255.0, 815.0, 588.0, 391.0, 257.0, 165.0, 136.0, 74.0, 53.0, 47.0, 23.0, 14.0, 18.0, 12.0, 12.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.9453125, -0.9139556884765625, -0.882598876953125, -0.8512420654296875, -0.81988525390625, -0.7885284423828125, -0.757171630859375, -0.7258148193359375, -0.6944580078125, -0.6631011962890625, -0.631744384765625, -0.6003875732421875, -0.56903076171875, -0.5376739501953125, -0.506317138671875, -0.4749603271484375, -0.443603515625, -0.4122467041015625, -0.380889892578125, -0.3495330810546875, -0.31817626953125, -0.2868194580078125, -0.255462646484375, -0.2241058349609375, -0.1927490234375, -0.1613922119140625, -0.130035400390625, -0.0986785888671875, -0.06732177734375, -0.0359649658203125, -0.004608154296875, 0.0267486572265625, 0.05810546875, 0.0894622802734375, 0.120819091796875, 0.1521759033203125, 0.18353271484375, 0.2148895263671875, 0.246246337890625, 0.2776031494140625, 0.3089599609375, 0.3403167724609375, 0.371673583984375, 0.4030303955078125, 0.43438720703125, 0.4657440185546875, 0.497100830078125, 0.5284576416015625, 0.559814453125, 0.5911712646484375, 0.622528076171875, 0.6538848876953125, 0.68524169921875, 0.7165985107421875, 0.747955322265625, 0.7793121337890625, 0.8106689453125, 0.8420257568359375, 0.873382568359375, 0.9047393798828125, 0.93609619140625, 0.9674530029296875, 0.998809814453125, 1.0301666259765625, 1.0615234375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 2.0, 4.0, 3.0, 9.0, 10.0, 10.0, 11.0, 14.0, 21.0, 16.0, 33.0, 33.0, 66.0, 78.0, 119.0, 155.0, 104.0, 63.0, 59.0, 34.0, 23.0, 25.0, 15.0, 19.0, 15.0, 13.0, 4.0, 5.0, 8.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.40380859375, -0.38848876953125, -0.3731689453125, -0.35784912109375, -0.342529296875, -0.32720947265625, -0.3118896484375, -0.29656982421875, -0.28125, -0.26593017578125, -0.2506103515625, -0.23529052734375, -0.219970703125, -0.20465087890625, -0.1893310546875, -0.17401123046875, -0.15869140625, -0.14337158203125, -0.1280517578125, -0.11273193359375, -0.097412109375, -0.08209228515625, -0.0667724609375, -0.05145263671875, -0.0361328125, -0.02081298828125, -0.0054931640625, 0.00982666015625, 0.025146484375, 0.04046630859375, 0.0557861328125, 0.07110595703125, 0.08642578125, 0.10174560546875, 0.1170654296875, 0.13238525390625, 0.147705078125, 0.16302490234375, 0.1783447265625, 0.19366455078125, 0.208984375, 0.22430419921875, 0.2396240234375, 0.25494384765625, 0.270263671875, 0.28558349609375, 0.3009033203125, 0.31622314453125, 0.33154296875, 0.34686279296875, 0.3621826171875, 0.37750244140625, 0.392822265625, 0.40814208984375, 0.4234619140625, 0.43878173828125, 0.4541015625, 0.46942138671875, 0.4847412109375, 0.50006103515625, 0.515380859375, 0.53070068359375, 0.5460205078125, 0.56134033203125, 0.57666015625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 4.0, 4.0, 4.0, 10.0, 12.0, 7.0, 11.0, 15.0, 27.0, 39.0, 49.0, 63.0, 97.0, 152.0, 370.0, 1332.0, 7918.0, 121909.0, 882379.0, 29289.0, 3480.0, 695.0, 231.0, 121.0, 89.0, 60.0, 50.0, 33.0, 24.0, 16.0, 14.0, 5.0, 9.0, 12.0, 4.0, 7.0, 4.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 2.0], "bins": [-7.546875, -7.3497314453125, -7.152587890625, -6.9554443359375, -6.75830078125, -6.5611572265625, -6.364013671875, -6.1668701171875, -5.9697265625, -5.7725830078125, -5.575439453125, -5.3782958984375, -5.18115234375, -4.9840087890625, -4.786865234375, -4.5897216796875, -4.392578125, -4.1954345703125, -3.998291015625, -3.8011474609375, -3.60400390625, -3.4068603515625, -3.209716796875, -3.0125732421875, -2.8154296875, -2.6182861328125, -2.421142578125, -2.2239990234375, -2.02685546875, -1.8297119140625, -1.632568359375, -1.4354248046875, -1.23828125, -1.0411376953125, -0.843994140625, -0.6468505859375, -0.44970703125, -0.2525634765625, -0.055419921875, 0.1417236328125, 0.3388671875, 0.5360107421875, 0.733154296875, 0.9302978515625, 1.12744140625, 1.3245849609375, 1.521728515625, 1.7188720703125, 1.916015625, 2.1131591796875, 2.310302734375, 2.5074462890625, 2.70458984375, 2.9017333984375, 3.098876953125, 3.2960205078125, 3.4931640625, 3.6903076171875, 3.887451171875, 4.0845947265625, 4.28173828125, 4.4788818359375, 4.676025390625, 4.8731689453125, 5.0703125]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 12.0, 25.0, 78.0, 320.0, 376.0, 156.0, 35.0, 8.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9946963787078857, -2.8759143352508545, -2.757132053375244, -2.638350009918213, -2.5195679664611816, -2.4007856845855713, -2.28200364112854, -2.1632213592529297, -2.0444393157958984, -1.9256571531295776, -1.8068749904632568, -1.6880929470062256, -1.5693107843399048, -1.450528621673584, -1.3317465782165527, -1.212964415550232, -1.0941822528839111, -0.9754000902175903, -0.8566179871559143, -0.7378358840942383, -0.6190537214279175, -0.5002715587615967, -0.38148945569992065, -0.26270735263824463, -0.14392518997192383, -0.025143057107925415, 0.093639075756073, 0.2124212086200714, 0.3312033414840698, 0.4499855041503906, 0.5687676072120667, 0.6875497102737427, 0.8063316345214844, 0.9251137971878052, 1.043895959854126, 1.1626780033111572, 1.281460165977478, 1.4002423286437988, 1.51902437210083, 1.6378065347671509, 1.7565886974334717, 1.8753708600997925, 1.9941530227661133, 2.1129350662231445, 2.231717109680176, 2.350499391555786, 2.4692814350128174, 2.5880637168884277, 2.706845760345459, 2.8256278038024902, 2.9444100856781006, 3.063192129135132, 3.181974411010742, 3.3007564544677734, 3.4195384979248047, 3.538320541381836, 3.6571028232574463, 3.7758848667144775, 3.894667148590088, 4.013449192047119, 4.13223123550415, 4.25101375579834, 4.369795799255371, 4.488577842712402, 4.607359886169434]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 5.0, 4.0, 8.0, 11.0, 16.0, 12.0, 14.0, 13.0, 23.0, 21.0, 29.0, 25.0, 31.0, 44.0, 37.0, 34.0, 35.0, 36.0, 54.0, 41.0, 39.0, 48.0, 27.0, 35.0, 44.0, 40.0, 39.0, 24.0, 33.0, 34.0, 28.0, 19.0, 15.0, 21.0, 13.0, 10.0, 7.0, 8.0, 3.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.593630850315094, -0.5732200741767883, -0.5528092980384827, -0.5323985815048218, -0.5119878053665161, -0.49157702922821045, -0.4711662530899048, -0.4507555067539215, -0.43034476041793823, -0.40993398427963257, -0.3895232379436493, -0.36911246180534363, -0.34870171546936035, -0.3282909393310547, -0.307880163192749, -0.28746941685676575, -0.2670586407184601, -0.2466478794813156, -0.22623711824417114, -0.20582634210586548, -0.1854155957698822, -0.16500481963157654, -0.14459405839443207, -0.1241832971572876, -0.10377253592014313, -0.08336177468299866, -0.06295101344585419, -0.04254024475812912, -0.02212948352098465, -0.0017187222838401794, 0.018692046403884888, 0.03910280764102936, 0.05951356887817383, 0.0799243301153183, 0.10033509135246277, 0.12074586004018784, 0.1411566138267517, 0.16156738996505737, 0.18197815120220184, 0.2023889124393463, 0.22279967367649078, 0.24321043491363525, 0.2636212110519409, 0.2840319573879242, 0.30444273352622986, 0.32485347986221313, 0.3452642560005188, 0.36567503213882446, 0.38608577847480774, 0.4064965546131134, 0.4269073009490967, 0.44731807708740234, 0.4677288234233856, 0.4881395995616913, 0.5085503458976746, 0.5289611220359802, 0.5493718981742859, 0.5697826743125916, 0.5901934504508972, 0.6106041669845581, 0.6310149431228638, 0.6514257192611694, 0.6718364953994751, 0.6922472715377808, 0.7126579880714417]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 10.0, 14.0, 10.0, 8.0, 15.0, 16.0, 23.0, 14.0, 22.0, 25.0, 21.0, 29.0, 29.0, 27.0, 32.0, 30.0, 35.0, 37.0, 40.0, 42.0, 36.0, 35.0, 40.0, 49.0, 36.0, 30.0, 33.0, 27.0, 31.0, 20.0, 17.0, 26.0, 19.0, 13.0, 18.0, 11.0, 18.0, 10.0, 11.0, 6.0, 7.0, 7.0, 5.0, 3.0, 2.0, 1.0, 3.0, 2.0, 5.0, 1.0, 1.0], "bins": [-0.69873046875, -0.6777572631835938, -0.6567840576171875, -0.6358108520507812, -0.614837646484375, -0.5938644409179688, -0.5728912353515625, -0.5519180297851562, -0.53094482421875, -0.5099716186523438, -0.4889984130859375, -0.46802520751953125, -0.447052001953125, -0.42607879638671875, -0.4051055908203125, -0.38413238525390625, -0.3631591796875, -0.34218597412109375, -0.3212127685546875, -0.30023956298828125, -0.279266357421875, -0.25829315185546875, -0.2373199462890625, -0.21634674072265625, -0.19537353515625, -0.17440032958984375, -0.1534271240234375, -0.13245391845703125, -0.111480712890625, -0.09050750732421875, -0.0695343017578125, -0.04856109619140625, -0.027587890625, -0.00661468505859375, 0.0143585205078125, 0.03533172607421875, 0.056304931640625, 0.07727813720703125, 0.0982513427734375, 0.11922454833984375, 0.14019775390625, 0.16117095947265625, 0.1821441650390625, 0.20311737060546875, 0.224090576171875, 0.24506378173828125, 0.2660369873046875, 0.28701019287109375, 0.3079833984375, 0.32895660400390625, 0.3499298095703125, 0.37090301513671875, 0.391876220703125, 0.41284942626953125, 0.4338226318359375, 0.45479583740234375, 0.47576904296875, 0.49674224853515625, 0.5177154541015625, 0.5386886596679688, 0.559661865234375, 0.5806350708007812, 0.6016082763671875, 0.6225814819335938, 0.6435546875]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 9.0, 12.0, 15.0, 16.0, 20.0, 30.0, 52.0, 67.0, 156.0, 202.0, 329.0, 650.0, 1208.0, 2172.0, 4247.0, 8182.0, 17125.0, 37029.0, 88022.0, 223432.0, 354467.0, 180391.0, 70642.0, 30985.0, 14197.0, 7061.0, 3542.0, 1889.0, 1012.0, 536.0, 341.0, 195.0, 119.0, 56.0, 51.0, 30.0, 15.0, 8.0, 15.0, 5.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0], "bins": [-1.0947265625, -1.06463623046875, -1.0345458984375, -1.00445556640625, -0.974365234375, -0.94427490234375, -0.9141845703125, -0.88409423828125, -0.85400390625, -0.82391357421875, -0.7938232421875, -0.76373291015625, -0.733642578125, -0.70355224609375, -0.6734619140625, -0.64337158203125, -0.61328125, -0.58319091796875, -0.5531005859375, -0.52301025390625, -0.492919921875, -0.46282958984375, -0.4327392578125, -0.40264892578125, -0.37255859375, -0.34246826171875, -0.3123779296875, -0.28228759765625, -0.252197265625, -0.22210693359375, -0.1920166015625, -0.16192626953125, -0.1318359375, -0.10174560546875, -0.0716552734375, -0.04156494140625, -0.011474609375, 0.01861572265625, 0.0487060546875, 0.07879638671875, 0.10888671875, 0.13897705078125, 0.1690673828125, 0.19915771484375, 0.229248046875, 0.25933837890625, 0.2894287109375, 0.31951904296875, 0.349609375, 0.37969970703125, 0.4097900390625, 0.43988037109375, 0.469970703125, 0.50006103515625, 0.5301513671875, 0.56024169921875, 0.59033203125, 0.62042236328125, 0.6505126953125, 0.68060302734375, 0.710693359375, 0.74078369140625, 0.7708740234375, 0.80096435546875, 0.8310546875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 7.0, 4.0, 6.0, 7.0, 8.0, 7.0, 10.0, 16.0, 11.0, 17.0, 22.0, 26.0, 39.0, 33.0, 28.0, 54.0, 52.0, 62.0, 86.0, 123.0, 219.0, 1324.0, 235.0, 131.0, 97.0, 66.0, 49.0, 51.0, 43.0, 28.0, 44.0, 20.0, 24.0, 19.0, 15.0, 16.0, 12.0, 7.0, 7.0, 7.0, 7.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.541015625, -2.457916259765625, -2.37481689453125, -2.291717529296875, -2.2086181640625, -2.125518798828125, -2.04241943359375, -1.959320068359375, -1.876220703125, -1.793121337890625, -1.71002197265625, -1.626922607421875, -1.5438232421875, -1.460723876953125, -1.37762451171875, -1.294525146484375, -1.21142578125, -1.128326416015625, -1.04522705078125, -0.962127685546875, -0.8790283203125, -0.795928955078125, -0.71282958984375, -0.629730224609375, -0.546630859375, -0.463531494140625, -0.38043212890625, -0.297332763671875, -0.2142333984375, -0.131134033203125, -0.04803466796875, 0.035064697265625, 0.1181640625, 0.201263427734375, 0.28436279296875, 0.367462158203125, 0.4505615234375, 0.533660888671875, 0.61676025390625, 0.699859619140625, 0.782958984375, 0.866058349609375, 0.94915771484375, 1.032257080078125, 1.1153564453125, 1.198455810546875, 1.28155517578125, 1.364654541015625, 1.44775390625, 1.530853271484375, 1.61395263671875, 1.697052001953125, 1.7801513671875, 1.863250732421875, 1.94635009765625, 2.029449462890625, 2.112548828125, 2.195648193359375, 2.27874755859375, 2.361846923828125, 2.4449462890625, 2.528045654296875, 2.61114501953125, 2.694244384765625, 2.77734375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 6.0, 11.0, 6.0, 9.0, 10.0, 16.0, 21.0, 28.0, 43.0, 59.0, 79.0, 105.0, 165.0, 270.0, 502.0, 963.0, 2584.0, 9976.0, 86907.0, 2343338.0, 658892.0, 32809.0, 5331.0, 1644.0, 781.0, 373.0, 249.0, 161.0, 104.0, 63.0, 44.0, 31.0, 25.0, 24.0, 12.0, 14.0, 9.0, 6.0, 8.0, 6.0, 8.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.22265625, -4.0855712890625, -3.948486328125, -3.8114013671875, -3.67431640625, -3.5372314453125, -3.400146484375, -3.2630615234375, -3.1259765625, -2.9888916015625, -2.851806640625, -2.7147216796875, -2.57763671875, -2.4405517578125, -2.303466796875, -2.1663818359375, -2.029296875, -1.8922119140625, -1.755126953125, -1.6180419921875, -1.48095703125, -1.3438720703125, -1.206787109375, -1.0697021484375, -0.9326171875, -0.7955322265625, -0.658447265625, -0.5213623046875, -0.38427734375, -0.2471923828125, -0.110107421875, 0.0269775390625, 0.1640625, 0.3011474609375, 0.438232421875, 0.5753173828125, 0.71240234375, 0.8494873046875, 0.986572265625, 1.1236572265625, 1.2607421875, 1.3978271484375, 1.534912109375, 1.6719970703125, 1.80908203125, 1.9461669921875, 2.083251953125, 2.2203369140625, 2.357421875, 2.4945068359375, 2.631591796875, 2.7686767578125, 2.90576171875, 3.0428466796875, 3.179931640625, 3.3170166015625, 3.4541015625, 3.5911865234375, 3.728271484375, 3.8653564453125, 4.00244140625, 4.1395263671875, 4.276611328125, 4.4136962890625, 4.55078125]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 35.0, 232.0, 423.0, 247.0, 64.0, 8.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.212492942810059, -8.417913436889648, -7.62333345413208, -6.82875394821167, -6.034173965454102, -5.239594459533691, -4.445014953613281, -3.650434970855713, -2.8558554649353027, -2.0612757205963135, -1.2666960954666138, -0.47211647033691406, 0.3224632740020752, 1.1170430183410645, 1.9116225242614746, 2.706202507019043, 3.500782012939453, 4.295361518859863, 5.089941501617432, 5.884521007537842, 6.67910099029541, 7.47368049621582, 8.26826000213623, 9.06283950805664, 9.857419967651367, 10.651999473571777, 11.446578979492188, 12.241159439086914, 13.035738945007324, 13.830318450927734, 14.624897956848145, 15.419477462768555, 16.21405601501465, 17.008636474609375, 17.80321502685547, 18.597795486450195, 19.39237403869629, 20.186954498291016, 20.98153305053711, 21.776113510131836, 22.570693969726562, 23.36527442932129, 24.159852981567383, 24.95443344116211, 25.749011993408203, 26.54359245300293, 27.338172912597656, 28.13275146484375, 28.927330017089844, 29.72191047668457, 30.516489028930664, 31.31106948852539, 32.105648040771484, 32.900230407714844, 33.69480895996094, 34.48938751220703, 35.28396987915039, 36.078548431396484, 36.873130798339844, 37.66770935058594, 38.46228790283203, 39.256866455078125, 40.051448822021484, 40.84602737426758, 41.64060592651367]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 5.0, 7.0, 6.0, 5.0, 10.0, 8.0, 9.0, 9.0, 16.0, 20.0, 23.0, 26.0, 25.0, 20.0, 21.0, 31.0, 35.0, 32.0, 33.0, 30.0, 31.0, 36.0, 36.0, 40.0, 35.0, 33.0, 32.0, 33.0, 29.0, 24.0, 39.0, 28.0, 38.0, 20.0, 24.0, 22.0, 17.0, 19.0, 15.0, 9.0, 9.0, 14.0, 11.0, 8.0, 5.0, 7.0, 9.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.65683650970459, -5.471185207366943, -5.285534381866455, -5.099883079528809, -4.91423225402832, -4.728580951690674, -4.542929649353027, -4.357278823852539, -4.171627521514893, -3.985976457595825, -3.800325393676758, -3.6146740913391113, -3.429023027420044, -3.2433719635009766, -3.05772066116333, -2.8720695972442627, -2.6864185333251953, -2.500767469406128, -2.3151164054870605, -2.129465103149414, -1.9438140392303467, -1.7581629753112793, -1.5725117921829224, -1.3868606090545654, -1.201209545135498, -1.0155584812164307, -0.8299072980880737, -0.6442561745643616, -0.4586050510406494, -0.27295392751693726, -0.0873028039932251, 0.09834837913513184, 0.283998966217041, 0.4696500897407532, 0.6553012132644653, 0.8409523367881775, 1.0266034603118896, 1.212254524230957, 1.397905707359314, 1.583556890487671, 1.7692079544067383, 1.9548590183258057, 2.140510082244873, 2.3261613845825195, 2.511812448501587, 2.6974635124206543, 2.883114814758301, 3.068765878677368, 3.2544169425964355, 3.440068006515503, 3.6257190704345703, 3.811370372772217, 3.997021436691284, 4.182672500610352, 4.368323802947998, 4.5539751052856445, 4.739625930786133, 4.925277233123779, 5.110928058624268, 5.296579360961914, 5.482230186462402, 5.667881488800049, 5.853532791137695, 6.039183616638184, 6.22483491897583]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 2.0, 0.0, 4.0, 8.0, 5.0, 12.0, 13.0, 8.0, 13.0, 20.0, 21.0, 20.0, 19.0, 21.0, 31.0, 19.0, 26.0, 28.0, 29.0, 26.0, 34.0, 37.0, 43.0, 34.0, 37.0, 45.0, 32.0, 36.0, 49.0, 39.0, 28.0, 24.0, 20.0, 29.0, 23.0, 18.0, 22.0, 10.0, 21.0, 16.0, 11.0, 12.0, 9.0, 11.0, 6.0, 8.0, 4.0, 5.0, 3.0, 2.0, 5.0, 2.0, 4.0, 3.0, 1.0, 2.0], "bins": [-0.6640625, -0.6436843872070312, -0.6233062744140625, -0.6029281616210938, -0.582550048828125, -0.5621719360351562, -0.5417938232421875, -0.5214157104492188, -0.50103759765625, -0.48065948486328125, -0.4602813720703125, -0.43990325927734375, -0.419525146484375, -0.39914703369140625, -0.3787689208984375, -0.35839080810546875, -0.3380126953125, -0.31763458251953125, -0.2972564697265625, -0.27687835693359375, -0.256500244140625, -0.23612213134765625, -0.2157440185546875, -0.19536590576171875, -0.17498779296875, -0.15460968017578125, -0.1342315673828125, -0.11385345458984375, -0.093475341796875, -0.07309722900390625, -0.0527191162109375, -0.03234100341796875, -0.011962890625, 0.00841522216796875, 0.0287933349609375, 0.04917144775390625, 0.069549560546875, 0.08992767333984375, 0.1103057861328125, 0.13068389892578125, 0.15106201171875, 0.17144012451171875, 0.1918182373046875, 0.21219635009765625, 0.232574462890625, 0.25295257568359375, 0.2733306884765625, 0.29370880126953125, 0.3140869140625, 0.33446502685546875, 0.3548431396484375, 0.37522125244140625, 0.395599365234375, 0.41597747802734375, 0.4363555908203125, 0.45673370361328125, 0.47711181640625, 0.49748992919921875, 0.5178680419921875, 0.5382461547851562, 0.558624267578125, 0.5790023803710938, 0.5993804931640625, 0.6197586059570312, 0.64013671875]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 10.0, 7.0, 17.0, 20.0, 29.0, 37.0, 56.0, 68.0, 97.0, 124.0, 156.0, 245.0, 304.0, 495.0, 738.0, 1148.0, 1941.0, 3233.0, 5743.0, 11104.0, 22664.0, 51183.0, 144301.0, 624225.0, 2061370.0, 946879.0, 197685.0, 63768.0, 26951.0, 13003.0, 6714.0, 3769.0, 2164.0, 1317.0, 839.0, 556.0, 380.0, 244.0, 169.0, 150.0, 97.0, 68.0, 51.0, 46.0, 29.0, 29.0, 19.0, 14.0, 6.0, 7.0, 7.0, 3.0, 1.0, 1.0, 2.0], "bins": [-1.4345703125, -1.39190673828125, -1.3492431640625, -1.30657958984375, -1.263916015625, -1.22125244140625, -1.1785888671875, -1.13592529296875, -1.09326171875, -1.05059814453125, -1.0079345703125, -0.96527099609375, -0.922607421875, -0.87994384765625, -0.8372802734375, -0.79461669921875, -0.751953125, -0.70928955078125, -0.6666259765625, -0.62396240234375, -0.581298828125, -0.53863525390625, -0.4959716796875, -0.45330810546875, -0.41064453125, -0.36798095703125, -0.3253173828125, -0.28265380859375, -0.239990234375, -0.19732666015625, -0.1546630859375, -0.11199951171875, -0.0693359375, -0.02667236328125, 0.0159912109375, 0.05865478515625, 0.101318359375, 0.14398193359375, 0.1866455078125, 0.22930908203125, 0.27197265625, 0.31463623046875, 0.3572998046875, 0.39996337890625, 0.442626953125, 0.48529052734375, 0.5279541015625, 0.57061767578125, 0.61328125, 0.65594482421875, 0.6986083984375, 0.74127197265625, 0.783935546875, 0.82659912109375, 0.8692626953125, 0.91192626953125, 0.95458984375, 0.99725341796875, 1.0399169921875, 1.08258056640625, 1.125244140625, 1.16790771484375, 1.2105712890625, 1.25323486328125, 1.2958984375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 10.0, 12.0, 15.0, 25.0, 41.0, 45.0, 92.0, 114.0, 145.0, 227.0, 329.0, 483.0, 618.0, 563.0, 408.0, 301.0, 185.0, 124.0, 91.0, 55.0, 50.0, 30.0, 28.0, 21.0, 12.0, 11.0, 6.0, 7.0, 3.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.25390625, -2.189239501953125, -2.12457275390625, -2.059906005859375, -1.9952392578125, -1.930572509765625, -1.86590576171875, -1.801239013671875, -1.736572265625, -1.671905517578125, -1.60723876953125, -1.542572021484375, -1.4779052734375, -1.413238525390625, -1.34857177734375, -1.283905029296875, -1.21923828125, -1.154571533203125, -1.08990478515625, -1.025238037109375, -0.9605712890625, -0.895904541015625, -0.83123779296875, -0.766571044921875, -0.701904296875, -0.637237548828125, -0.57257080078125, -0.507904052734375, -0.4432373046875, -0.378570556640625, -0.31390380859375, -0.249237060546875, -0.1845703125, -0.119903564453125, -0.05523681640625, 0.009429931640625, 0.0740966796875, 0.138763427734375, 0.20343017578125, 0.268096923828125, 0.332763671875, 0.397430419921875, 0.46209716796875, 0.526763916015625, 0.5914306640625, 0.656097412109375, 0.72076416015625, 0.785430908203125, 0.85009765625, 0.914764404296875, 0.97943115234375, 1.044097900390625, 1.1087646484375, 1.173431396484375, 1.23809814453125, 1.302764892578125, 1.367431640625, 1.432098388671875, 1.49676513671875, 1.561431884765625, 1.6260986328125, 1.690765380859375, 1.75543212890625, 1.820098876953125, 1.884765625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 8.0, 8.0, 14.0, 23.0, 41.0, 83.0, 161.0, 333.0, 759.0, 1922.0, 5320.0, 17952.0, 94770.0, 1201053.0, 2654137.0, 177756.0, 28140.0, 7355.0, 2541.0, 941.0, 479.0, 231.0, 113.0, 64.0, 27.0, 14.0, 11.0, 7.0, 1.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3671875, -4.22698974609375, -4.0867919921875, -3.94659423828125, -3.806396484375, -3.66619873046875, -3.5260009765625, -3.38580322265625, -3.24560546875, -3.10540771484375, -2.9652099609375, -2.82501220703125, -2.684814453125, -2.54461669921875, -2.4044189453125, -2.26422119140625, -2.1240234375, -1.98382568359375, -1.8436279296875, -1.70343017578125, -1.563232421875, -1.42303466796875, -1.2828369140625, -1.14263916015625, -1.00244140625, -0.86224365234375, -0.7220458984375, -0.58184814453125, -0.441650390625, -0.30145263671875, -0.1612548828125, -0.02105712890625, 0.119140625, 0.25933837890625, 0.3995361328125, 0.53973388671875, 0.679931640625, 0.82012939453125, 0.9603271484375, 1.10052490234375, 1.24072265625, 1.38092041015625, 1.5211181640625, 1.66131591796875, 1.801513671875, 1.94171142578125, 2.0819091796875, 2.22210693359375, 2.3623046875, 2.50250244140625, 2.6427001953125, 2.78289794921875, 2.923095703125, 3.06329345703125, 3.2034912109375, 3.34368896484375, 3.48388671875, 3.62408447265625, 3.7642822265625, 3.90447998046875, 4.044677734375, 4.18487548828125, 4.3250732421875, 4.46527099609375, 4.60546875]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 11.0, 26.0, 92.0, 223.0, 277.0, 203.0, 118.0, 42.0, 14.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.19737243652344, -31.208555221557617, -30.219738006591797, -29.23092269897461, -28.24210548400879, -27.25328826904297, -26.26447105407715, -25.275653839111328, -24.28683853149414, -23.29802131652832, -22.3092041015625, -21.320388793945312, -20.331571578979492, -19.342754364013672, -18.35393714904785, -17.36511993408203, -16.37630271911621, -15.38748550415039, -14.398669242858887, -13.409852027893066, -12.421035766601562, -11.432218551635742, -10.443401336669922, -9.454584121704102, -8.465767860412598, -7.4769511222839355, -6.488134384155273, -5.499317169189453, -4.510500431060791, -3.521683692932129, -2.5328664779663086, -1.5440497398376465, -0.5552349090576172, 0.4335819482803345, 1.4223988056182861, 2.4112157821655273, 3.4000325202941895, 4.388849258422852, 5.377666473388672, 6.366483211517334, 7.355299949645996, 8.344117164611816, 9.33293342590332, 10.32175064086914, 11.310567855834961, 12.299384117126465, 13.288201332092285, 14.277017593383789, 15.26583480834961, 16.25465202331543, 17.24346923828125, 18.232284545898438, 19.221101760864258, 20.209918975830078, 21.1987361907959, 22.18755340576172, 23.176368713378906, 24.165185928344727, 25.154003143310547, 26.142818450927734, 27.131635665893555, 28.120452880859375, 29.109270095825195, 30.098087310791016, 31.086904525756836]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 9.0, 6.0, 11.0, 10.0, 15.0, 11.0, 10.0, 20.0, 17.0, 26.0, 15.0, 35.0, 17.0, 31.0, 40.0, 30.0, 44.0, 46.0, 41.0, 37.0, 51.0, 49.0, 34.0, 32.0, 39.0, 48.0, 37.0, 40.0, 29.0, 18.0, 25.0, 21.0, 25.0, 15.0, 15.0, 8.0, 6.0, 9.0, 9.0, 10.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.397795677185059, -5.207033634185791, -5.016271591186523, -4.825509548187256, -4.634747505187988, -4.443985462188721, -4.253223419189453, -4.062460899353027, -3.871699094772339, -3.6809370517730713, -3.4901750087738037, -3.299412727355957, -3.1086506843566895, -2.917888641357422, -2.7271265983581543, -2.5363645553588867, -2.345602512359619, -2.1548404693603516, -1.964078426361084, -1.7733162641525269, -1.5825542211532593, -1.3917921781539917, -1.2010300159454346, -1.010267972946167, -0.8195059299468994, -0.6287438869476318, -0.4379817843437195, -0.24721968173980713, -0.05645763874053955, 0.13430440425872803, 0.32506656646728516, 0.5158286094665527, 0.7065906524658203, 0.8973526954650879, 1.0881147384643555, 1.2788769006729126, 1.4696389436721802, 1.6604009866714478, 1.8511631488800049, 2.0419251918792725, 2.23268723487854, 2.4234492778778076, 2.614211320877075, 2.804973602294922, 2.9957356452941895, 3.186497688293457, 3.3772597312927246, 3.568021774291992, 3.7587838172912598, 3.9495458602905273, 4.140307903289795, 4.3310699462890625, 4.52183198928833, 4.712594032287598, 4.903356552124023, 5.094118118286133, 5.284880638122559, 5.475642681121826, 5.666404724121094, 5.857166767120361, 6.047928810119629, 6.2386908531188965, 6.429452896118164, 6.62021541595459, 6.810976982116699]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 9.0, 4.0, 4.0, 7.0, 12.0, 12.0, 14.0, 18.0, 19.0, 17.0, 24.0, 30.0, 25.0, 30.0, 22.0, 32.0, 43.0, 31.0, 25.0, 31.0, 51.0, 34.0, 46.0, 48.0, 41.0, 40.0, 33.0, 32.0, 29.0, 29.0, 26.0, 29.0, 14.0, 14.0, 25.0, 25.0, 13.0, 15.0, 8.0, 11.0, 6.0, 9.0, 2.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.736328125, -0.7138519287109375, -0.691375732421875, -0.6688995361328125, -0.64642333984375, -0.6239471435546875, -0.601470947265625, -0.5789947509765625, -0.5565185546875, -0.5340423583984375, -0.511566162109375, -0.4890899658203125, -0.46661376953125, -0.4441375732421875, -0.421661376953125, -0.3991851806640625, -0.376708984375, -0.3542327880859375, -0.331756591796875, -0.3092803955078125, -0.28680419921875, -0.2643280029296875, -0.241851806640625, -0.2193756103515625, -0.1968994140625, -0.1744232177734375, -0.151947021484375, -0.1294708251953125, -0.10699462890625, -0.0845184326171875, -0.062042236328125, -0.0395660400390625, -0.01708984375, 0.0053863525390625, 0.027862548828125, 0.0503387451171875, 0.07281494140625, 0.0952911376953125, 0.117767333984375, 0.1402435302734375, 0.1627197265625, 0.1851959228515625, 0.207672119140625, 0.2301483154296875, 0.25262451171875, 0.2751007080078125, 0.297576904296875, 0.3200531005859375, 0.342529296875, 0.3650054931640625, 0.387481689453125, 0.4099578857421875, 0.43243408203125, 0.4549102783203125, 0.477386474609375, 0.4998626708984375, 0.5223388671875, 0.5448150634765625, 0.567291259765625, 0.5897674560546875, 0.61224365234375, 0.6347198486328125, 0.657196044921875, 0.6796722412109375, 0.7021484375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 6.0, 11.0, 8.0, 15.0, 35.0, 56.0, 71.0, 136.0, 244.0, 397.0, 646.0, 1079.0, 1740.0, 2922.0, 4923.0, 7901.0, 13431.0, 22146.0, 35723.0, 57408.0, 90610.0, 153680.0, 346001.0, 116703.0, 73247.0, 46516.0, 28757.0, 17548.0, 10591.0, 6246.0, 3931.0, 2250.0, 1396.0, 864.0, 491.0, 283.0, 201.0, 123.0, 76.0, 51.0, 38.0, 22.0, 13.0, 12.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.033203125, -1.973876953125, -1.91455078125, -1.855224609375, -1.7958984375, -1.736572265625, -1.67724609375, -1.617919921875, -1.55859375, -1.499267578125, -1.43994140625, -1.380615234375, -1.3212890625, -1.261962890625, -1.20263671875, -1.143310546875, -1.083984375, -1.024658203125, -0.96533203125, -0.906005859375, -0.8466796875, -0.787353515625, -0.72802734375, -0.668701171875, -0.609375, -0.550048828125, -0.49072265625, -0.431396484375, -0.3720703125, -0.312744140625, -0.25341796875, -0.194091796875, -0.134765625, -0.075439453125, -0.01611328125, 0.043212890625, 0.1025390625, 0.161865234375, 0.22119140625, 0.280517578125, 0.33984375, 0.399169921875, 0.45849609375, 0.517822265625, 0.5771484375, 0.636474609375, 0.69580078125, 0.755126953125, 0.814453125, 0.873779296875, 0.93310546875, 0.992431640625, 1.0517578125, 1.111083984375, 1.17041015625, 1.229736328125, 1.2890625, 1.348388671875, 1.40771484375, 1.467041015625, 1.5263671875, 1.585693359375, 1.64501953125, 1.704345703125, 1.763671875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 3.0, 1.0, 3.0, 6.0, 11.0, 9.0, 11.0, 18.0, 10.0, 22.0, 19.0, 31.0, 24.0, 25.0, 27.0, 20.0, 26.0, 40.0, 39.0, 26.0, 38.0, 48.0, 1057.0, 46.0, 36.0, 32.0, 43.0, 26.0, 34.0, 39.0, 26.0, 23.0, 26.0, 23.0, 18.0, 22.0, 20.0, 15.0, 13.0, 7.0, 10.0, 4.0, 7.0, 9.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.5537109375, -0.5359954833984375, -0.518280029296875, -0.5005645751953125, -0.48284912109375, -0.4651336669921875, -0.447418212890625, -0.4297027587890625, -0.4119873046875, -0.3942718505859375, -0.376556396484375, -0.3588409423828125, -0.34112548828125, -0.3234100341796875, -0.305694580078125, -0.2879791259765625, -0.270263671875, -0.2525482177734375, -0.234832763671875, -0.2171173095703125, -0.19940185546875, -0.1816864013671875, -0.163970947265625, -0.1462554931640625, -0.1285400390625, -0.1108245849609375, -0.093109130859375, -0.0753936767578125, -0.05767822265625, -0.0399627685546875, -0.022247314453125, -0.0045318603515625, 0.01318359375, 0.0308990478515625, 0.048614501953125, 0.0663299560546875, 0.08404541015625, 0.1017608642578125, 0.119476318359375, 0.1371917724609375, 0.1549072265625, 0.1726226806640625, 0.190338134765625, 0.2080535888671875, 0.22576904296875, 0.2434844970703125, 0.261199951171875, 0.2789154052734375, 0.296630859375, 0.3143463134765625, 0.332061767578125, 0.3497772216796875, 0.36749267578125, 0.3852081298828125, 0.402923583984375, 0.4206390380859375, 0.4383544921875, 0.4560699462890625, 0.473785400390625, 0.4915008544921875, 0.50921630859375, 0.5269317626953125, 0.544647216796875, 0.5623626708984375, 0.580078125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 8.0, 6.0, 13.0, 13.0, 18.0, 36.0, 47.0, 61.0, 85.0, 99.0, 166.0, 236.0, 319.0, 434.0, 662.0, 942.0, 1334.0, 2091.0, 3101.0, 4949.0, 7586.0, 12082.0, 19457.0, 31970.0, 57126.0, 111207.0, 282383.0, 1094716.0, 234617.0, 99266.0, 52047.0, 29884.0, 18083.0, 11200.0, 7114.0, 4582.0, 2976.0, 1964.0, 1334.0, 878.0, 622.0, 431.0, 305.0, 198.0, 139.0, 101.0, 87.0, 47.0, 30.0, 30.0, 23.0, 12.0, 4.0, 6.0, 7.0, 4.0, 7.0, 0.0, 1.0, 1.0], "bins": [-1.0361328125, -1.0031585693359375, -0.970184326171875, -0.9372100830078125, -0.90423583984375, -0.8712615966796875, -0.838287353515625, -0.8053131103515625, -0.7723388671875, -0.7393646240234375, -0.706390380859375, -0.6734161376953125, -0.64044189453125, -0.6074676513671875, -0.574493408203125, -0.5415191650390625, -0.508544921875, -0.4755706787109375, -0.442596435546875, -0.4096221923828125, -0.37664794921875, -0.3436737060546875, -0.310699462890625, -0.2777252197265625, -0.2447509765625, -0.2117767333984375, -0.178802490234375, -0.1458282470703125, -0.11285400390625, -0.0798797607421875, -0.046905517578125, -0.0139312744140625, 0.01904296875, 0.0520172119140625, 0.084991455078125, 0.1179656982421875, 0.15093994140625, 0.1839141845703125, 0.216888427734375, 0.2498626708984375, 0.2828369140625, 0.3158111572265625, 0.348785400390625, 0.3817596435546875, 0.41473388671875, 0.4477081298828125, 0.480682373046875, 0.5136566162109375, 0.546630859375, 0.5796051025390625, 0.612579345703125, 0.6455535888671875, 0.67852783203125, 0.7115020751953125, 0.744476318359375, 0.7774505615234375, 0.8104248046875, 0.8433990478515625, 0.876373291015625, 0.9093475341796875, 0.94232177734375, 0.9752960205078125, 1.008270263671875, 1.0412445068359375, 1.07421875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 6.0, 5.0, 8.0, 6.0, 3.0, 3.0, 7.0, 13.0, 11.0, 14.0, 25.0, 14.0, 22.0, 31.0, 48.0, 49.0, 65.0, 164.0, 164.0, 91.0, 42.0, 29.0, 25.0, 21.0, 24.0, 13.0, 18.0, 8.0, 15.0, 8.0, 9.0, 10.0, 3.0, 7.0, 7.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.416748046875, -0.40579986572265625, -0.3948516845703125, -0.38390350341796875, -0.372955322265625, -0.36200714111328125, -0.3510589599609375, -0.34011077880859375, -0.32916259765625, -0.31821441650390625, -0.3072662353515625, -0.29631805419921875, -0.285369873046875, -0.27442169189453125, -0.2634735107421875, -0.25252532958984375, -0.2415771484375, -0.23062896728515625, -0.2196807861328125, -0.20873260498046875, -0.197784423828125, -0.18683624267578125, -0.1758880615234375, -0.16493988037109375, -0.15399169921875, -0.14304351806640625, -0.1320953369140625, -0.12114715576171875, -0.110198974609375, -0.09925079345703125, -0.0883026123046875, -0.07735443115234375, -0.06640625, -0.05545806884765625, -0.0445098876953125, -0.03356170654296875, -0.022613525390625, -0.01166534423828125, -0.0007171630859375, 0.01023101806640625, 0.02117919921875, 0.03212738037109375, 0.0430755615234375, 0.05402374267578125, 0.064971923828125, 0.07592010498046875, 0.0868682861328125, 0.09781646728515625, 0.1087646484375, 0.11971282958984375, 0.1306610107421875, 0.14160919189453125, 0.152557373046875, 0.16350555419921875, 0.1744537353515625, 0.18540191650390625, 0.19635009765625, 0.20729827880859375, 0.2182464599609375, 0.22919464111328125, 0.240142822265625, 0.25109100341796875, 0.2620391845703125, 0.27298736572265625, 0.283935546875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 4.0, 4.0, 8.0, 5.0, 11.0, 18.0, 14.0, 17.0, 18.0, 28.0, 41.0, 41.0, 65.0, 93.0, 167.0, 328.0, 1073.0, 7356.0, 140094.0, 869087.0, 26536.0, 2366.0, 541.0, 221.0, 128.0, 82.0, 59.0, 34.0, 27.0, 20.0, 13.0, 13.0, 10.0, 6.0, 7.0, 2.0, 4.0, 0.0, 2.0, 2.0, 2.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.328125, -4.16925048828125, -4.0103759765625, -3.85150146484375, -3.692626953125, -3.53375244140625, -3.3748779296875, -3.21600341796875, -3.05712890625, -2.89825439453125, -2.7393798828125, -2.58050537109375, -2.421630859375, -2.26275634765625, -2.1038818359375, -1.94500732421875, -1.7861328125, -1.62725830078125, -1.4683837890625, -1.30950927734375, -1.150634765625, -0.99176025390625, -0.8328857421875, -0.67401123046875, -0.51513671875, -0.35626220703125, -0.1973876953125, -0.03851318359375, 0.120361328125, 0.27923583984375, 0.4381103515625, 0.59698486328125, 0.755859375, 0.91473388671875, 1.0736083984375, 1.23248291015625, 1.391357421875, 1.55023193359375, 1.7091064453125, 1.86798095703125, 2.02685546875, 2.18572998046875, 2.3446044921875, 2.50347900390625, 2.662353515625, 2.82122802734375, 2.9801025390625, 3.13897705078125, 3.2978515625, 3.45672607421875, 3.6156005859375, 3.77447509765625, 3.933349609375, 4.09222412109375, 4.2510986328125, 4.40997314453125, 4.56884765625, 4.72772216796875, 4.8865966796875, 5.04547119140625, 5.204345703125, 5.36322021484375, 5.5220947265625, 5.68096923828125, 5.83984375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 21.0, 98.0, 373.0, 416.0, 86.0, 13.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.602933645248413, -2.4791126251220703, -2.3552916049957275, -2.2314705848693848, -2.107649326324463, -1.9838283061981201, -1.8600072860717773, -1.7361862659454346, -1.6123651266098022, -1.4885441064834595, -1.3647229671478271, -1.2409019470214844, -1.1170809268951416, -0.9932597875595093, -0.8694387674331665, -0.745617687702179, -0.6217966079711914, -0.49797552824020386, -0.3741544783115387, -0.25033342838287354, -0.126512348651886, -0.0026912689208984375, 0.12112975120544434, 0.24495083093643188, 0.36877191066741943, 0.492592990398407, 0.6164140701293945, 0.7402350902557373, 0.8640561699867249, 0.9878772497177124, 1.1116982698440552, 1.2355194091796875, 1.3593401908874512, 1.483161211013794, 1.6069823503494263, 1.730803370475769, 1.8546245098114014, 1.9784455299377441, 2.102266550064087, 2.2260875701904297, 2.3499088287353516, 2.4737298488616943, 2.597550868988037, 2.721372127532959, 2.8451931476593018, 2.9690141677856445, 3.0928351879119873, 3.21665620803833, 3.340477228164673, 3.4642982482910156, 3.5881192684173584, 3.711940288543701, 3.835761547088623, 3.959582567214966, 4.083403587341309, 4.2072248458862305, 4.331045627593994, 4.454866886138916, 4.57868766784668, 4.702508926391602, 4.826329708099365, 4.950150966644287, 5.073971748352051, 5.197793006896973, 5.3216142654418945]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 10.0, 9.0, 15.0, 15.0, 14.0, 20.0, 20.0, 19.0, 29.0, 33.0, 32.0, 35.0, 32.0, 27.0, 30.0, 39.0, 22.0, 46.0, 43.0, 55.0, 44.0, 45.0, 44.0, 37.0, 38.0, 41.0, 33.0, 26.0, 27.0, 16.0, 17.0, 18.0, 14.0, 11.0, 7.0, 8.0, 7.0, 6.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5309973955154419, -0.51319420337677, -0.49539098143577576, -0.4775877594947815, -0.4597845673561096, -0.44198134541511536, -0.4241781234741211, -0.4063749313354492, -0.38857170939445496, -0.3707684874534607, -0.3529652953147888, -0.33516207337379456, -0.3173588514328003, -0.2995556592941284, -0.28175243735313416, -0.2639492154121399, -0.24614602327346802, -0.22834281623363495, -0.21053960919380188, -0.19273638725280762, -0.17493318021297455, -0.15712997317314148, -0.13932675123214722, -0.12152354419231415, -0.10372033715248108, -0.08591713011264801, -0.06811391562223434, -0.05031070485711098, -0.03250749409198761, -0.014704287052154541, 0.0030989274382591248, 0.02090214192867279, 0.038705289363861084, 0.05650850012898445, 0.07431171089410782, 0.09211492538452148, 0.10991813242435455, 0.12772133946418762, 0.14552456140518188, 0.16332776844501495, 0.18113097548484802, 0.1989341825246811, 0.21673738956451416, 0.23454061150550842, 0.2523438334465027, 0.27014702558517456, 0.2879502475261688, 0.3057534694671631, 0.32355666160583496, 0.3413598835468292, 0.3591630756855011, 0.37696629762649536, 0.39476948976516724, 0.4125727117061615, 0.43037593364715576, 0.44817912578582764, 0.4659823477268219, 0.48378556966781616, 0.501588761806488, 0.5193919539451599, 0.5371952056884766, 0.5549983978271484, 0.5728015899658203, 0.590604841709137, 0.6084080338478088]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 7.0, 7.0, 2.0, 7.0, 13.0, 13.0, 17.0, 15.0, 21.0, 22.0, 30.0, 27.0, 17.0, 33.0, 25.0, 40.0, 29.0, 35.0, 26.0, 33.0, 52.0, 41.0, 49.0, 35.0, 50.0, 30.0, 37.0, 35.0, 24.0, 19.0, 29.0, 19.0, 20.0, 22.0, 18.0, 24.0, 15.0, 8.0, 11.0, 11.0, 7.0, 5.0, 5.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7265625, -0.7041091918945312, -0.6816558837890625, -0.6592025756835938, -0.636749267578125, -0.6142959594726562, -0.5918426513671875, -0.5693893432617188, -0.54693603515625, -0.5244827270507812, -0.5020294189453125, -0.47957611083984375, -0.457122802734375, -0.43466949462890625, -0.4122161865234375, -0.38976287841796875, -0.3673095703125, -0.34485626220703125, -0.3224029541015625, -0.29994964599609375, -0.277496337890625, -0.25504302978515625, -0.2325897216796875, -0.21013641357421875, -0.18768310546875, -0.16522979736328125, -0.1427764892578125, -0.12032318115234375, -0.097869873046875, -0.07541656494140625, -0.0529632568359375, -0.03050994873046875, -0.008056640625, 0.01439666748046875, 0.0368499755859375, 0.05930328369140625, 0.081756591796875, 0.10420989990234375, 0.1266632080078125, 0.14911651611328125, 0.17156982421875, 0.19402313232421875, 0.2164764404296875, 0.23892974853515625, 0.261383056640625, 0.28383636474609375, 0.3062896728515625, 0.32874298095703125, 0.3511962890625, 0.37364959716796875, 0.3961029052734375, 0.41855621337890625, 0.441009521484375, 0.46346282958984375, 0.4859161376953125, 0.5083694458007812, 0.53082275390625, 0.5532760620117188, 0.5757293701171875, 0.5981826782226562, 0.620635986328125, 0.6430892944335938, 0.6655426025390625, 0.6879959106445312, 0.71044921875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 6.0, 13.0, 13.0, 13.0, 35.0, 41.0, 64.0, 90.0, 141.0, 171.0, 259.0, 388.0, 524.0, 818.0, 1235.0, 1915.0, 2892.0, 4239.0, 6834.0, 10823.0, 17763.0, 29614.0, 52454.0, 102864.0, 226064.0, 284123.0, 141765.0, 67760.0, 37088.0, 21887.0, 13197.0, 8251.0, 5251.0, 3349.0, 2174.0, 1440.0, 948.0, 583.0, 455.0, 294.0, 241.0, 160.0, 95.0, 68.0, 50.0, 33.0, 18.0, 21.0, 12.0, 10.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.701171875, -0.6771621704101562, -0.6531524658203125, -0.6291427612304688, -0.605133056640625, -0.5811233520507812, -0.5571136474609375, -0.5331039428710938, -0.50909423828125, -0.48508453369140625, -0.4610748291015625, -0.43706512451171875, -0.413055419921875, -0.38904571533203125, -0.3650360107421875, -0.34102630615234375, -0.3170166015625, -0.29300689697265625, -0.2689971923828125, -0.24498748779296875, -0.220977783203125, -0.19696807861328125, -0.1729583740234375, -0.14894866943359375, -0.12493896484375, -0.10092926025390625, -0.0769195556640625, -0.05290985107421875, -0.028900146484375, -0.00489044189453125, 0.0191192626953125, 0.04312896728515625, 0.067138671875, 0.09114837646484375, 0.1151580810546875, 0.13916778564453125, 0.163177490234375, 0.18718719482421875, 0.2111968994140625, 0.23520660400390625, 0.25921630859375, 0.28322601318359375, 0.3072357177734375, 0.33124542236328125, 0.355255126953125, 0.37926483154296875, 0.4032745361328125, 0.42728424072265625, 0.4512939453125, 0.47530364990234375, 0.4993133544921875, 0.5233230590820312, 0.547332763671875, 0.5713424682617188, 0.5953521728515625, 0.6193618774414062, 0.64337158203125, 0.6673812866210938, 0.6913909912109375, 0.7154006958007812, 0.739410400390625, 0.7634201049804688, 0.7874298095703125, 0.8114395141601562, 0.83544921875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 9.0, 5.0, 17.0, 14.0, 19.0, 14.0, 26.0, 21.0, 37.0, 35.0, 52.0, 44.0, 60.0, 84.0, 138.0, 217.0, 1374.0, 258.0, 140.0, 108.0, 70.0, 39.0, 51.0, 42.0, 35.0, 17.0, 24.0, 27.0, 10.0, 12.0, 9.0, 8.0, 8.0, 8.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.072265625, -2.972320556640625, -2.87237548828125, -2.772430419921875, -2.6724853515625, -2.572540283203125, -2.47259521484375, -2.372650146484375, -2.272705078125, -2.172760009765625, -2.07281494140625, -1.972869873046875, -1.8729248046875, -1.772979736328125, -1.67303466796875, -1.573089599609375, -1.47314453125, -1.373199462890625, -1.27325439453125, -1.173309326171875, -1.0733642578125, -0.973419189453125, -0.87347412109375, -0.773529052734375, -0.673583984375, -0.573638916015625, -0.47369384765625, -0.373748779296875, -0.2738037109375, -0.173858642578125, -0.07391357421875, 0.026031494140625, 0.1259765625, 0.225921630859375, 0.32586669921875, 0.425811767578125, 0.5257568359375, 0.625701904296875, 0.72564697265625, 0.825592041015625, 0.925537109375, 1.025482177734375, 1.12542724609375, 1.225372314453125, 1.3253173828125, 1.425262451171875, 1.52520751953125, 1.625152587890625, 1.72509765625, 1.825042724609375, 1.92498779296875, 2.024932861328125, 2.1248779296875, 2.224822998046875, 2.32476806640625, 2.424713134765625, 2.524658203125, 2.624603271484375, 2.72454833984375, 2.824493408203125, 2.9244384765625, 3.024383544921875, 3.12432861328125, 3.224273681640625, 3.32421875]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 3.0, 4.0, 3.0, 7.0, 9.0, 11.0, 19.0, 31.0, 41.0, 53.0, 76.0, 140.0, 242.0, 539.0, 1377.0, 5544.0, 40972.0, 2499683.0, 570995.0, 20356.0, 3541.0, 1031.0, 449.0, 226.0, 118.0, 63.0, 46.0, 40.0, 22.0, 15.0, 17.0, 7.0, 6.0, 3.0, 6.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0], "bins": [-7.56640625, -7.3553466796875, -7.144287109375, -6.9332275390625, -6.72216796875, -6.5111083984375, -6.300048828125, -6.0889892578125, -5.8779296875, -5.6668701171875, -5.455810546875, -5.2447509765625, -5.03369140625, -4.8226318359375, -4.611572265625, -4.4005126953125, -4.189453125, -3.9783935546875, -3.767333984375, -3.5562744140625, -3.34521484375, -3.1341552734375, -2.923095703125, -2.7120361328125, -2.5009765625, -2.2899169921875, -2.078857421875, -1.8677978515625, -1.65673828125, -1.4456787109375, -1.234619140625, -1.0235595703125, -0.8125, -0.6014404296875, -0.390380859375, -0.1793212890625, 0.03173828125, 0.2427978515625, 0.453857421875, 0.6649169921875, 0.8759765625, 1.0870361328125, 1.298095703125, 1.5091552734375, 1.72021484375, 1.9312744140625, 2.142333984375, 2.3533935546875, 2.564453125, 2.7755126953125, 2.986572265625, 3.1976318359375, 3.40869140625, 3.6197509765625, 3.830810546875, 4.0418701171875, 4.2529296875, 4.4639892578125, 4.675048828125, 4.8861083984375, 5.09716796875, 5.3082275390625, 5.519287109375, 5.7303466796875, 5.94140625]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [380.0, 638.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.847543716430664, -0.36647677421569824, 3.1145901679992676, 6.5956573486328125, 10.0767240524292, 13.557790756225586, 17.03885841369629, 20.51992416381836, 24.000991821289062, 27.482059478759766, 30.963125228881836, 34.444190979003906, 37.92525863647461, 41.40632629394531, 44.887393951416016, 48.36846160888672, 51.849525451660156, 55.33059310913086, 58.81166076660156, 62.292724609375, 65.77379608154297, 69.2548599243164, 72.73593139648438, 76.21699523925781, 79.69805908203125, 83.17912292480469, 86.66019439697266, 90.1412582397461, 93.62232971191406, 97.1033935546875, 100.58445739746094, 104.0655288696289, 107.54659271240234, 111.02765655517578, 114.50872802734375, 117.98979187011719, 121.47086334228516, 124.9519271850586, 128.43299865722656, 131.9140625, 135.39512634277344, 138.87619018554688, 142.3572540283203, 145.8383331298828, 149.31939697265625, 152.8004608154297, 156.28152465820312, 159.76258850097656, 163.24366760253906, 166.7247314453125, 170.20579528808594, 173.68687438964844, 177.16793823242188, 180.6490020751953, 184.13006591796875, 187.6111297607422, 191.09219360351562, 194.57325744628906, 198.0543212890625, 201.535400390625, 205.01646423339844, 208.49752807617188, 211.9785919189453, 215.45965576171875, 218.94073486328125]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 10.0, 9.0, 7.0, 7.0, 10.0, 15.0, 10.0, 23.0, 9.0, 14.0, 17.0, 25.0, 22.0, 28.0, 33.0, 37.0, 24.0, 39.0, 40.0, 41.0, 36.0, 26.0, 44.0, 36.0, 38.0, 48.0, 35.0, 32.0, 29.0, 35.0, 31.0, 26.0, 19.0, 15.0, 30.0, 10.0, 17.0, 13.0, 8.0, 12.0, 8.0, 6.0, 2.0, 9.0, 3.0, 5.0, 1.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.879245758056641, -7.6337690353393555, -7.38829231262207, -7.142815589904785, -6.8973388671875, -6.651862144470215, -6.40638542175293, -6.1609086990356445, -5.915431976318359, -5.669955253601074, -5.424478530883789, -5.179001808166504, -4.933525085449219, -4.688048362731934, -4.442571640014648, -4.197094917297363, -3.95161771774292, -3.7061409950256348, -3.4606642723083496, -3.2151875495910645, -2.9697108268737793, -2.724234104156494, -2.47875714302063, -2.2332804203033447, -1.9878036975860596, -1.7423269748687744, -1.4968502521514893, -1.2513734102249146, -1.0058966875076294, -0.7604199647903442, -0.5149431228637695, -0.2694664001464844, -0.023990154266357422, 0.22148659825325012, 0.46696335077285767, 0.7124401330947876, 0.9579168558120728, 1.203393578529358, 1.4488704204559326, 1.6943471431732178, 1.939823865890503, 2.185300588607788, 2.4307773113250732, 2.6762542724609375, 2.9217309951782227, 3.167207717895508, 3.412684440612793, 3.658161163330078, 3.9036378860473633, 4.149114608764648, 4.394591331481934, 4.640068054199219, 4.885544776916504, 5.131021499633789, 5.376498222351074, 5.621974945068359, 5.8674516677856445, 6.11292839050293, 6.358405113220215, 6.6038818359375, 6.849358558654785, 7.09483528137207, 7.3403120040893555, 7.585788726806641, 7.831265926361084]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 10.0, 6.0, 7.0, 6.0, 11.0, 10.0, 16.0, 11.0, 14.0, 21.0, 24.0, 25.0, 28.0, 33.0, 29.0, 39.0, 33.0, 34.0, 29.0, 34.0, 37.0, 42.0, 37.0, 50.0, 25.0, 39.0, 46.0, 40.0, 24.0, 31.0, 31.0, 18.0, 16.0, 24.0, 22.0, 20.0, 15.0, 14.0, 4.0, 8.0, 7.0, 4.0, 6.0, 8.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.83349609375, -0.8096084594726562, -0.7857208251953125, -0.7618331909179688, -0.737945556640625, -0.7140579223632812, -0.6901702880859375, -0.6662826538085938, -0.64239501953125, -0.6185073852539062, -0.5946197509765625, -0.5707321166992188, -0.546844482421875, -0.5229568481445312, -0.4990692138671875, -0.47518157958984375, -0.4512939453125, -0.42740631103515625, -0.4035186767578125, -0.37963104248046875, -0.355743408203125, -0.33185577392578125, -0.3079681396484375, -0.28408050537109375, -0.26019287109375, -0.23630523681640625, -0.2124176025390625, -0.18852996826171875, -0.164642333984375, -0.14075469970703125, -0.1168670654296875, -0.09297943115234375, -0.069091796875, -0.04520416259765625, -0.0213165283203125, 0.00257110595703125, 0.026458740234375, 0.05034637451171875, 0.0742340087890625, 0.09812164306640625, 0.12200927734375, 0.14589691162109375, 0.1697845458984375, 0.19367218017578125, 0.217559814453125, 0.24144744873046875, 0.2653350830078125, 0.28922271728515625, 0.3131103515625, 0.33699798583984375, 0.3608856201171875, 0.38477325439453125, 0.408660888671875, 0.43254852294921875, 0.4564361572265625, 0.48032379150390625, 0.50421142578125, 0.5280990600585938, 0.5519866943359375, 0.5758743286132812, 0.599761962890625, 0.6236495971679688, 0.6475372314453125, 0.6714248657226562, 0.6953125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 13.0, 25.0, 32.0, 64.0, 126.0, 224.0, 407.0, 710.0, 1247.0, 2469.0, 4852.0, 9796.0, 22715.0, 59851.0, 230549.0, 1623705.0, 1861949.0, 265772.0, 65795.0, 23360.0, 10009.0, 4867.0, 2619.0, 1317.0, 747.0, 452.0, 255.0, 173.0, 75.0, 43.0, 33.0, 15.0, 11.0, 8.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7333984375, -1.6715850830078125, -1.609771728515625, -1.5479583740234375, -1.48614501953125, -1.4243316650390625, -1.362518310546875, -1.3007049560546875, -1.2388916015625, -1.1770782470703125, -1.115264892578125, -1.0534515380859375, -0.99163818359375, -0.9298248291015625, -0.868011474609375, -0.8061981201171875, -0.744384765625, -0.6825714111328125, -0.620758056640625, -0.5589447021484375, -0.49713134765625, -0.4353179931640625, -0.373504638671875, -0.3116912841796875, -0.2498779296875, -0.1880645751953125, -0.126251220703125, -0.0644378662109375, -0.00262451171875, 0.0591888427734375, 0.121002197265625, 0.1828155517578125, 0.24462890625, 0.3064422607421875, 0.368255615234375, 0.4300689697265625, 0.49188232421875, 0.5536956787109375, 0.615509033203125, 0.6773223876953125, 0.7391357421875, 0.8009490966796875, 0.862762451171875, 0.9245758056640625, 0.98638916015625, 1.0482025146484375, 1.110015869140625, 1.1718292236328125, 1.233642578125, 1.2954559326171875, 1.357269287109375, 1.4190826416015625, 1.48089599609375, 1.5427093505859375, 1.604522705078125, 1.6663360595703125, 1.7281494140625, 1.7899627685546875, 1.851776123046875, 1.9135894775390625, 1.97540283203125, 2.0372161865234375, 2.099029541015625, 2.1608428955078125, 2.22265625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 13.0, 9.0, 17.0, 12.0, 10.0, 22.0, 28.0, 40.0, 43.0, 64.0, 74.0, 106.0, 141.0, 198.0, 250.0, 351.0, 411.0, 488.0, 439.0, 340.0, 226.0, 177.0, 154.0, 100.0, 82.0, 56.0, 46.0, 39.0, 26.0, 30.0, 17.0, 16.0, 15.0, 6.0, 11.0, 3.0, 3.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.5419921875, -1.4877166748046875, -1.433441162109375, -1.3791656494140625, -1.32489013671875, -1.2706146240234375, -1.216339111328125, -1.1620635986328125, -1.1077880859375, -1.0535125732421875, -0.999237060546875, -0.9449615478515625, -0.89068603515625, -0.8364105224609375, -0.782135009765625, -0.7278594970703125, -0.673583984375, -0.6193084716796875, -0.565032958984375, -0.5107574462890625, -0.45648193359375, -0.4022064208984375, -0.347930908203125, -0.2936553955078125, -0.2393798828125, -0.1851043701171875, -0.130828857421875, -0.0765533447265625, -0.02227783203125, 0.0319976806640625, 0.086273193359375, 0.1405487060546875, 0.19482421875, 0.2490997314453125, 0.303375244140625, 0.3576507568359375, 0.41192626953125, 0.4662017822265625, 0.520477294921875, 0.5747528076171875, 0.6290283203125, 0.6833038330078125, 0.737579345703125, 0.7918548583984375, 0.84613037109375, 0.9004058837890625, 0.954681396484375, 1.0089569091796875, 1.063232421875, 1.1175079345703125, 1.171783447265625, 1.2260589599609375, 1.28033447265625, 1.3346099853515625, 1.388885498046875, 1.4431610107421875, 1.4974365234375, 1.5517120361328125, 1.605987548828125, 1.6602630615234375, 1.71453857421875, 1.7688140869140625, 1.823089599609375, 1.8773651123046875, 1.931640625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 8.0, 13.0, 16.0, 26.0, 32.0, 57.0, 87.0, 140.0, 204.0, 335.0, 529.0, 1004.0, 1884.0, 3938.0, 9106.0, 22690.0, 67482.0, 260255.0, 1651726.0, 1781708.0, 280083.0, 70758.0, 23876.0, 9535.0, 4200.0, 2051.0, 1043.0, 588.0, 346.0, 192.0, 114.0, 83.0, 61.0, 29.0, 31.0, 20.0, 5.0, 2.0, 9.0, 4.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.06640625, -2.978851318359375, -2.89129638671875, -2.803741455078125, -2.7161865234375, -2.628631591796875, -2.54107666015625, -2.453521728515625, -2.365966796875, -2.278411865234375, -2.19085693359375, -2.103302001953125, -2.0157470703125, -1.928192138671875, -1.84063720703125, -1.753082275390625, -1.66552734375, -1.577972412109375, -1.49041748046875, -1.402862548828125, -1.3153076171875, -1.227752685546875, -1.14019775390625, -1.052642822265625, -0.965087890625, -0.877532958984375, -0.78997802734375, -0.702423095703125, -0.6148681640625, -0.527313232421875, -0.43975830078125, -0.352203369140625, -0.2646484375, -0.177093505859375, -0.08953857421875, -0.001983642578125, 0.0855712890625, 0.173126220703125, 0.26068115234375, 0.348236083984375, 0.435791015625, 0.523345947265625, 0.61090087890625, 0.698455810546875, 0.7860107421875, 0.873565673828125, 0.96112060546875, 1.048675537109375, 1.13623046875, 1.223785400390625, 1.31134033203125, 1.398895263671875, 1.4864501953125, 1.574005126953125, 1.66156005859375, 1.749114990234375, 1.836669921875, 1.924224853515625, 2.01177978515625, 2.099334716796875, 2.1868896484375, 2.274444580078125, 2.36199951171875, 2.449554443359375, 2.537109375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 10.0, 9.0, 17.0, 31.0, 64.0, 102.0, 146.0, 159.0, 151.0, 130.0, 80.0, 59.0, 29.0, 16.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.3687801361084, -25.79098892211914, -25.213199615478516, -24.635408401489258, -24.057619094848633, -23.479827880859375, -22.90203857421875, -22.324247360229492, -21.746456146240234, -21.168664932250977, -20.59087562561035, -20.013084411621094, -19.43529510498047, -18.85750389099121, -18.279714584350586, -17.701923370361328, -17.124134063720703, -16.546342849731445, -15.96855354309082, -15.390763282775879, -14.812973022460938, -14.23518180847168, -13.657391548156738, -13.079601287841797, -12.501811027526855, -11.924020767211914, -11.346230506896973, -10.768440246582031, -10.190649032592773, -9.612859725952148, -9.03506851196289, -8.45727825164795, -7.879486083984375, -7.301695823669434, -6.723905563354492, -6.146114826202393, -5.568324565887451, -4.99053430557251, -4.41274356842041, -3.8349533081054688, -3.2571630477905273, -2.679372787475586, -2.1015822887420654, -1.5237919092178345, -0.9460015296936035, -0.3682112693786621, 0.2095792293548584, 0.7873697280883789, 1.3651599884033203, 1.9429503679275513, 2.5207407474517822, 3.0985312461853027, 3.676321506500244, 4.2541117668151855, 4.831902503967285, 5.409692764282227, 5.987483024597168, 6.565273284912109, 7.143063545227051, 7.72085428237915, 8.29864501953125, 8.876434326171875, 9.454225540161133, 10.032015800476074, 10.609806060791016]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 5.0, 1.0, 4.0, 6.0, 8.0, 9.0, 6.0, 7.0, 7.0, 19.0, 17.0, 19.0, 21.0, 30.0, 17.0, 31.0, 32.0, 26.0, 36.0, 27.0, 27.0, 43.0, 50.0, 37.0, 43.0, 32.0, 34.0, 38.0, 25.0, 40.0, 25.0, 29.0, 42.0, 21.0, 19.0, 30.0, 19.0, 16.0, 18.0, 14.0, 8.0, 15.0, 13.0, 6.0, 5.0, 12.0, 5.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.817947864532471, -5.6342549324035645, -5.450562477111816, -5.26686954498291, -5.083177089691162, -4.899484157562256, -4.715791702270508, -4.532098770141602, -4.348405838012695, -4.164712905883789, -3.981020450592041, -3.7973275184631348, -3.6136350631713867, -3.4299421310424805, -3.2462494373321533, -3.062556743621826, -2.878864288330078, -2.695171594619751, -2.511478900909424, -2.3277859687805176, -2.1440935134887695, -1.9604007005691528, -1.7767078876495361, -1.593015193939209, -1.4093225002288818, -1.2256298065185547, -1.0419371128082275, -0.8582442998886108, -0.6745516061782837, -0.49085891246795654, -0.30716609954833984, -0.1234734058380127, 0.06021881103515625, 0.2439115345478058, 0.4276042580604553, 0.6112970113754272, 0.7949897050857544, 0.9786823987960815, 1.1623752117156982, 1.3460679054260254, 1.5297605991363525, 1.7134532928466797, 1.8971459865570068, 2.080838680267334, 2.2645316123962402, 2.4482240676879883, 2.6319169998168945, 2.8156096935272217, 2.999302387237549, 3.182995080947876, 3.366687774658203, 3.5503807067871094, 3.7340731620788574, 3.9177660942077637, 4.101458549499512, 4.285151481628418, 4.468844413757324, 4.6525373458862305, 4.8362298011779785, 5.019922733306885, 5.203615188598633, 5.387308120727539, 5.571001052856445, 5.754693508148193, 5.938385963439941]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 1.0, 7.0, 5.0, 11.0, 8.0, 11.0, 19.0, 15.0, 13.0, 12.0, 15.0, 20.0, 20.0, 21.0, 28.0, 29.0, 24.0, 19.0, 33.0, 42.0, 42.0, 35.0, 33.0, 36.0, 39.0, 37.0, 35.0, 44.0, 25.0, 33.0, 26.0, 37.0, 30.0, 23.0, 25.0, 28.0, 19.0, 16.0, 13.0, 10.0, 10.0, 10.0, 11.0, 6.0, 4.0, 4.0, 5.0, 5.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.70166015625, -0.6795196533203125, -0.657379150390625, -0.6352386474609375, -0.61309814453125, -0.5909576416015625, -0.568817138671875, -0.5466766357421875, -0.5245361328125, -0.5023956298828125, -0.480255126953125, -0.4581146240234375, -0.43597412109375, -0.4138336181640625, -0.391693115234375, -0.3695526123046875, -0.347412109375, -0.3252716064453125, -0.303131103515625, -0.2809906005859375, -0.25885009765625, -0.2367095947265625, -0.214569091796875, -0.1924285888671875, -0.1702880859375, -0.1481475830078125, -0.126007080078125, -0.1038665771484375, -0.08172607421875, -0.0595855712890625, -0.037445068359375, -0.0153045654296875, 0.0068359375, 0.0289764404296875, 0.051116943359375, 0.0732574462890625, 0.09539794921875, 0.1175384521484375, 0.139678955078125, 0.1618194580078125, 0.1839599609375, 0.2061004638671875, 0.228240966796875, 0.2503814697265625, 0.27252197265625, 0.2946624755859375, 0.316802978515625, 0.3389434814453125, 0.361083984375, 0.3832244873046875, 0.405364990234375, 0.4275054931640625, 0.44964599609375, 0.4717864990234375, 0.493927001953125, 0.5160675048828125, 0.5382080078125, 0.5603485107421875, 0.582489013671875, 0.6046295166015625, 0.62677001953125, 0.6489105224609375, 0.671051025390625, 0.6931915283203125, 0.71533203125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 6.0, 4.0, 6.0, 6.0, 15.0, 30.0, 41.0, 73.0, 103.0, 134.0, 201.0, 265.0, 380.0, 588.0, 847.0, 1226.0, 1761.0, 2857.0, 4668.0, 8478.0, 16295.0, 33975.0, 89270.0, 430803.0, 320399.0, 72639.0, 29515.0, 14090.0, 7611.0, 4402.0, 2639.0, 1642.0, 1135.0, 749.0, 559.0, 356.0, 238.0, 168.0, 115.0, 84.0, 54.0, 43.0, 33.0, 32.0, 6.0, 6.0, 7.0, 7.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.1845703125, -1.151580810546875, -1.11859130859375, -1.085601806640625, -1.0526123046875, -1.019622802734375, -0.98663330078125, -0.953643798828125, -0.920654296875, -0.887664794921875, -0.85467529296875, -0.821685791015625, -0.7886962890625, -0.755706787109375, -0.72271728515625, -0.689727783203125, -0.65673828125, -0.623748779296875, -0.59075927734375, -0.557769775390625, -0.5247802734375, -0.491790771484375, -0.45880126953125, -0.425811767578125, -0.392822265625, -0.359832763671875, -0.32684326171875, -0.293853759765625, -0.2608642578125, -0.227874755859375, -0.19488525390625, -0.161895751953125, -0.12890625, -0.095916748046875, -0.06292724609375, -0.029937744140625, 0.0030517578125, 0.036041259765625, 0.06903076171875, 0.102020263671875, 0.135009765625, 0.167999267578125, 0.20098876953125, 0.233978271484375, 0.2669677734375, 0.299957275390625, 0.33294677734375, 0.365936279296875, 0.39892578125, 0.431915283203125, 0.46490478515625, 0.497894287109375, 0.5308837890625, 0.563873291015625, 0.59686279296875, 0.629852294921875, 0.662841796875, 0.695831298828125, 0.72882080078125, 0.761810302734375, 0.7947998046875, 0.827789306640625, 0.86077880859375, 0.893768310546875, 0.9267578125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 7.0, 4.0, 4.0, 12.0, 4.0, 7.0, 11.0, 13.0, 14.0, 10.0, 25.0, 17.0, 22.0, 20.0, 25.0, 28.0, 40.0, 39.0, 30.0, 31.0, 36.0, 39.0, 1061.0, 34.0, 50.0, 52.0, 42.0, 43.0, 37.0, 44.0, 37.0, 24.0, 23.0, 20.0, 26.0, 23.0, 16.0, 15.0, 6.0, 8.0, 7.0, 4.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.56298828125, -0.5446548461914062, -0.5263214111328125, -0.5079879760742188, -0.489654541015625, -0.47132110595703125, -0.4529876708984375, -0.43465423583984375, -0.41632080078125, -0.39798736572265625, -0.3796539306640625, -0.36132049560546875, -0.342987060546875, -0.32465362548828125, -0.3063201904296875, -0.28798675537109375, -0.2696533203125, -0.25131988525390625, -0.2329864501953125, -0.21465301513671875, -0.196319580078125, -0.17798614501953125, -0.1596527099609375, -0.14131927490234375, -0.12298583984375, -0.10465240478515625, -0.0863189697265625, -0.06798553466796875, -0.049652099609375, -0.03131866455078125, -0.0129852294921875, 0.00534820556640625, 0.023681640625, 0.04201507568359375, 0.0603485107421875, 0.07868194580078125, 0.097015380859375, 0.11534881591796875, 0.1336822509765625, 0.15201568603515625, 0.17034912109375, 0.18868255615234375, 0.2070159912109375, 0.22534942626953125, 0.243682861328125, 0.26201629638671875, 0.2803497314453125, 0.29868316650390625, 0.3170166015625, 0.33535003662109375, 0.3536834716796875, 0.37201690673828125, 0.390350341796875, 0.40868377685546875, 0.4270172119140625, 0.44535064697265625, 0.46368408203125, 0.48201751708984375, 0.5003509521484375, 0.5186843872070312, 0.537017822265625, 0.5553512573242188, 0.5736846923828125, 0.5920181274414062, 0.6103515625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 0.0, 5.0, 6.0, 8.0, 9.0, 11.0, 25.0, 18.0, 29.0, 45.0, 56.0, 87.0, 107.0, 148.0, 197.0, 252.0, 376.0, 505.0, 721.0, 1082.0, 1590.0, 2587.0, 4257.0, 7896.0, 17147.0, 44130.0, 173727.0, 1474702.0, 266843.0, 57270.0, 20547.0, 9300.0, 4886.0, 2834.0, 1733.0, 1239.0, 775.0, 586.0, 364.0, 244.0, 187.0, 160.0, 120.0, 92.0, 72.0, 43.0, 39.0, 23.0, 21.0, 10.0, 10.0, 7.0, 8.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7138671875, -0.6912841796875, -0.668701171875, -0.6461181640625, -0.62353515625, -0.6009521484375, -0.578369140625, -0.5557861328125, -0.533203125, -0.5106201171875, -0.488037109375, -0.4654541015625, -0.44287109375, -0.4202880859375, -0.397705078125, -0.3751220703125, -0.3525390625, -0.3299560546875, -0.307373046875, -0.2847900390625, -0.26220703125, -0.2396240234375, -0.217041015625, -0.1944580078125, -0.171875, -0.1492919921875, -0.126708984375, -0.1041259765625, -0.08154296875, -0.0589599609375, -0.036376953125, -0.0137939453125, 0.0087890625, 0.0313720703125, 0.053955078125, 0.0765380859375, 0.09912109375, 0.1217041015625, 0.144287109375, 0.1668701171875, 0.189453125, 0.2120361328125, 0.234619140625, 0.2572021484375, 0.27978515625, 0.3023681640625, 0.324951171875, 0.3475341796875, 0.3701171875, 0.3927001953125, 0.415283203125, 0.4378662109375, 0.46044921875, 0.4830322265625, 0.505615234375, 0.5281982421875, 0.55078125, 0.5733642578125, 0.595947265625, 0.6185302734375, 0.64111328125, 0.6636962890625, 0.686279296875, 0.7088623046875, 0.7314453125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 9.0, 4.0, 8.0, 12.0, 8.0, 16.0, 18.0, 22.0, 36.0, 35.0, 60.0, 153.0, 319.0, 93.0, 54.0, 35.0, 36.0, 21.0, 12.0, 12.0, 10.0, 7.0, 7.0, 2.0, 5.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1378173828125, -0.13190078735351562, -0.12598419189453125, -0.12006759643554688, -0.1141510009765625, -0.10823440551757812, -0.10231781005859375, -0.09640121459960938, -0.090484619140625, -0.08456802368164062, -0.07865142822265625, -0.07273483276367188, -0.0668182373046875, -0.060901641845703125, -0.05498504638671875, -0.049068450927734375, -0.04315185546875, -0.037235260009765625, -0.03131866455078125, -0.025402069091796875, -0.0194854736328125, -0.013568878173828125, -0.00765228271484375, -0.001735687255859375, 0.004180908203125, 0.010097503662109375, 0.01601409912109375, 0.021930694580078125, 0.0278472900390625, 0.033763885498046875, 0.03968048095703125, 0.045597076416015625, 0.051513671875, 0.057430267333984375, 0.06334686279296875, 0.06926345825195312, 0.0751800537109375, 0.08109664916992188, 0.08701324462890625, 0.09292984008789062, 0.098846435546875, 0.10476303100585938, 0.11067962646484375, 0.11659622192382812, 0.1225128173828125, 0.12842941284179688, 0.13434600830078125, 0.14026260375976562, 0.14617919921875, 0.15209579467773438, 0.15801239013671875, 0.16392898559570312, 0.1698455810546875, 0.17576217651367188, 0.18167877197265625, 0.18759536743164062, 0.193511962890625, 0.19942855834960938, 0.20534515380859375, 0.21126174926757812, 0.2171783447265625, 0.22309494018554688, 0.22901153564453125, 0.23492813110351562, 0.2408447265625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 4.0, 4.0, 9.0, 10.0, 11.0, 12.0, 23.0, 49.0, 44.0, 111.0, 295.0, 1526.0, 31951.0, 997336.0, 15615.0, 1082.0, 216.0, 96.0, 48.0, 24.0, 19.0, 13.0, 18.0, 13.0, 8.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.884765625, -3.78619384765625, -3.6876220703125, -3.58905029296875, -3.490478515625, -3.39190673828125, -3.2933349609375, -3.19476318359375, -3.09619140625, -2.99761962890625, -2.8990478515625, -2.80047607421875, -2.701904296875, -2.60333251953125, -2.5047607421875, -2.40618896484375, -2.3076171875, -2.20904541015625, -2.1104736328125, -2.01190185546875, -1.913330078125, -1.81475830078125, -1.7161865234375, -1.61761474609375, -1.51904296875, -1.42047119140625, -1.3218994140625, -1.22332763671875, -1.124755859375, -1.02618408203125, -0.9276123046875, -0.82904052734375, -0.73046875, -0.63189697265625, -0.5333251953125, -0.43475341796875, -0.336181640625, -0.23760986328125, -0.1390380859375, -0.04046630859375, 0.05810546875, 0.15667724609375, 0.2552490234375, 0.35382080078125, 0.452392578125, 0.55096435546875, 0.6495361328125, 0.74810791015625, 0.8466796875, 0.94525146484375, 1.0438232421875, 1.14239501953125, 1.240966796875, 1.33953857421875, 1.4381103515625, 1.53668212890625, 1.63525390625, 1.73382568359375, 1.8323974609375, 1.93096923828125, 2.029541015625, 2.12811279296875, 2.2266845703125, 2.32525634765625, 2.423828125]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 7.0, 8.0, 11.0, 20.0, 23.0, 37.0, 52.0, 71.0, 119.0, 108.0, 144.0, 115.0, 109.0, 53.0, 49.0, 33.0, 20.0, 13.0, 5.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3126414716243744, -0.30294299125671387, -0.29324454069137573, -0.2835460603237152, -0.2738476097583771, -0.26414912939071655, -0.2544506788253784, -0.2447521984577179, -0.23505373299121857, -0.22535526752471924, -0.2156568020582199, -0.20595833659172058, -0.19625985622406006, -0.18656140565872192, -0.1768629252910614, -0.16716445982456207, -0.15746599435806274, -0.14776752889156342, -0.1380690634250641, -0.12837059795856476, -0.11867212504148483, -0.1089736595749855, -0.09927518665790558, -0.08957672119140625, -0.07987825572490692, -0.07017979025840759, -0.060481321066617966, -0.05078285187482834, -0.04108438640832901, -0.03138592094182968, -0.021687451750040054, -0.011988982558250427, -0.0022905468940734863, 0.0074079204350709915, 0.01710638776421547, 0.026804855093359947, 0.036503322422504425, 0.046201787889003754, 0.05590025708079338, 0.06559872627258301, 0.07529719173908234, 0.08499565720558167, 0.094694122672081, 0.10439259558916092, 0.11409106105566025, 0.12378952652215958, 0.1334879994392395, 0.14318646490573883, 0.15288493037223816, 0.1625833958387375, 0.17228186130523682, 0.18198032677173615, 0.19167879223823547, 0.201377272605896, 0.21107573807239532, 0.22077420353889465, 0.23047266900539398, 0.2401711344718933, 0.24986959993839264, 0.25956806540489197, 0.2692665457725525, 0.2789649963378906, 0.28866347670555115, 0.29836195707321167, 0.3080604076385498]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 7.0, 8.0, 9.0, 9.0, 15.0, 15.0, 19.0, 28.0, 26.0, 29.0, 42.0, 36.0, 48.0, 43.0, 44.0, 44.0, 47.0, 47.0, 46.0, 48.0, 52.0, 31.0, 35.0, 45.0, 37.0, 33.0, 31.0, 29.0, 18.0, 16.0, 11.0, 14.0, 8.0, 10.0, 4.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1592746376991272, -0.15363898873329163, -0.14800332486629486, -0.1423676609992981, -0.13673201203346252, -0.13109636306762695, -0.1254606992006302, -0.11982504278421402, -0.11418938636779785, -0.10855372995138168, -0.10291807353496552, -0.09728241711854935, -0.09164676070213318, -0.08601110428571701, -0.08037544786930084, -0.07473979145288467, -0.0691041350364685, -0.06346847862005234, -0.05783282220363617, -0.05219716578722, -0.04656150937080383, -0.040925852954387665, -0.0352901965379715, -0.02965454012155533, -0.02401888370513916, -0.018383227288722992, -0.012747570872306824, -0.0071119144558906555, -0.0014762580394744873, 0.004159398376941681, 0.009795054793357849, 0.015430711209774017, 0.021066367626190186, 0.026702024042606354, 0.03233768045902252, 0.03797333687543869, 0.04360899329185486, 0.04924464970827103, 0.054880306124687195, 0.06051596254110336, 0.06615161895751953, 0.0717872753739357, 0.07742293179035187, 0.08305858820676804, 0.0886942446231842, 0.09432990103960037, 0.09996555745601654, 0.10560121387243271, 0.11123687028884888, 0.11687252670526505, 0.12250818312168121, 0.12814384698867798, 0.13377949595451355, 0.13941514492034912, 0.1450508087873459, 0.15068647265434265, 0.15632212162017822, 0.1619577705860138, 0.16759343445301056, 0.17322909832000732, 0.1788647472858429, 0.18450039625167847, 0.19013606011867523, 0.195771723985672, 0.20140737295150757]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 1.0, 5.0, 7.0, 8.0, 11.0, 9.0, 15.0, 17.0, 14.0, 12.0, 15.0, 21.0, 17.0, 20.0, 28.0, 26.0, 27.0, 22.0, 26.0, 46.0, 39.0, 39.0, 32.0, 35.0, 38.0, 39.0, 33.0, 38.0, 31.0, 28.0, 32.0, 33.0, 35.0, 22.0, 24.0, 31.0, 17.0, 19.0, 14.0, 10.0, 11.0, 9.0, 9.0, 8.0, 6.0, 3.0, 5.0, 5.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.70361328125, -0.6815872192382812, -0.6595611572265625, -0.6375350952148438, -0.615509033203125, -0.5934829711914062, -0.5714569091796875, -0.5494308471679688, -0.52740478515625, -0.5053787231445312, -0.4833526611328125, -0.46132659912109375, -0.439300537109375, -0.41727447509765625, -0.3952484130859375, -0.37322235107421875, -0.3511962890625, -0.32917022705078125, -0.3071441650390625, -0.28511810302734375, -0.263092041015625, -0.24106597900390625, -0.2190399169921875, -0.19701385498046875, -0.17498779296875, -0.15296173095703125, -0.1309356689453125, -0.10890960693359375, -0.086883544921875, -0.06485748291015625, -0.0428314208984375, -0.02080535888671875, 0.001220703125, 0.02324676513671875, 0.0452728271484375, 0.06729888916015625, 0.089324951171875, 0.11135101318359375, 0.1333770751953125, 0.15540313720703125, 0.17742919921875, 0.19945526123046875, 0.2214813232421875, 0.24350738525390625, 0.265533447265625, 0.28755950927734375, 0.3095855712890625, 0.33161163330078125, 0.3536376953125, 0.37566375732421875, 0.3976898193359375, 0.41971588134765625, 0.441741943359375, 0.46376800537109375, 0.4857940673828125, 0.5078201293945312, 0.52984619140625, 0.5518722534179688, 0.5738983154296875, 0.5959243774414062, 0.617950439453125, 0.6399765014648438, 0.6620025634765625, 0.6840286254882812, 0.7060546875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 5.0, 5.0, 9.0, 12.0, 21.0, 35.0, 39.0, 74.0, 105.0, 133.0, 231.0, 423.0, 567.0, 914.0, 1381.0, 2041.0, 3175.0, 4911.0, 7644.0, 12556.0, 21127.0, 37045.0, 68506.0, 129900.0, 217223.0, 225797.0, 140536.0, 74856.0, 40372.0, 22410.0, 13362.0, 8281.0, 5347.0, 3290.0, 2133.0, 1361.0, 932.0, 685.0, 363.0, 278.0, 158.0, 114.0, 78.0, 59.0, 26.0, 19.0, 11.0, 2.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.865234375, -0.8332672119140625, -0.801300048828125, -0.7693328857421875, -0.73736572265625, -0.7053985595703125, -0.673431396484375, -0.6414642333984375, -0.6094970703125, -0.5775299072265625, -0.545562744140625, -0.5135955810546875, -0.48162841796875, -0.4496612548828125, -0.417694091796875, -0.3857269287109375, -0.353759765625, -0.3217926025390625, -0.289825439453125, -0.2578582763671875, -0.22589111328125, -0.1939239501953125, -0.161956787109375, -0.1299896240234375, -0.0980224609375, -0.0660552978515625, -0.034088134765625, -0.0021209716796875, 0.02984619140625, 0.0618133544921875, 0.093780517578125, 0.1257476806640625, 0.15771484375, 0.1896820068359375, 0.221649169921875, 0.2536163330078125, 0.28558349609375, 0.3175506591796875, 0.349517822265625, 0.3814849853515625, 0.4134521484375, 0.4454193115234375, 0.477386474609375, 0.5093536376953125, 0.54132080078125, 0.5732879638671875, 0.605255126953125, 0.6372222900390625, 0.669189453125, 0.7011566162109375, 0.733123779296875, 0.7650909423828125, 0.79705810546875, 0.8290252685546875, 0.860992431640625, 0.8929595947265625, 0.9249267578125, 0.9568939208984375, 0.988861083984375, 1.0208282470703125, 1.05279541015625, 1.0847625732421875, 1.116729736328125, 1.1486968994140625, 1.1806640625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 4.0, 2.0, 5.0, 4.0, 8.0, 6.0, 5.0, 10.0, 9.0, 15.0, 10.0, 23.0, 19.0, 30.0, 35.0, 34.0, 38.0, 31.0, 32.0, 64.0, 94.0, 125.0, 190.0, 1314.0, 217.0, 174.0, 90.0, 76.0, 54.0, 48.0, 49.0, 40.0, 34.0, 31.0, 25.0, 12.0, 25.0, 12.0, 10.0, 17.0, 10.0, 9.0, 5.0, 1.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-2.8671875, -2.784393310546875, -2.70159912109375, -2.618804931640625, -2.5360107421875, -2.453216552734375, -2.37042236328125, -2.287628173828125, -2.204833984375, -2.122039794921875, -2.03924560546875, -1.956451416015625, -1.8736572265625, -1.790863037109375, -1.70806884765625, -1.625274658203125, -1.54248046875, -1.459686279296875, -1.37689208984375, -1.294097900390625, -1.2113037109375, -1.128509521484375, -1.04571533203125, -0.962921142578125, -0.880126953125, -0.797332763671875, -0.71453857421875, -0.631744384765625, -0.5489501953125, -0.466156005859375, -0.38336181640625, -0.300567626953125, -0.2177734375, -0.134979248046875, -0.05218505859375, 0.030609130859375, 0.1134033203125, 0.196197509765625, 0.27899169921875, 0.361785888671875, 0.444580078125, 0.527374267578125, 0.61016845703125, 0.692962646484375, 0.7757568359375, 0.858551025390625, 0.94134521484375, 1.024139404296875, 1.10693359375, 1.189727783203125, 1.27252197265625, 1.355316162109375, 1.4381103515625, 1.520904541015625, 1.60369873046875, 1.686492919921875, 1.769287109375, 1.852081298828125, 1.93487548828125, 2.017669677734375, 2.1004638671875, 2.183258056640625, 2.26605224609375, 2.348846435546875, 2.431640625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 4.0, 13.0, 8.0, 8.0, 15.0, 23.0, 29.0, 26.0, 51.0, 83.0, 112.0, 167.0, 301.0, 516.0, 1306.0, 5923.0, 52833.0, 1765786.0, 1268761.0, 42202.0, 5165.0, 1151.0, 483.0, 224.0, 175.0, 97.0, 72.0, 49.0, 38.0, 27.0, 17.0, 18.0, 9.0, 5.0, 6.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.62109375, -4.44305419921875, -4.2650146484375, -4.08697509765625, -3.908935546875, -3.73089599609375, -3.5528564453125, -3.37481689453125, -3.19677734375, -3.01873779296875, -2.8406982421875, -2.66265869140625, -2.484619140625, -2.30657958984375, -2.1285400390625, -1.95050048828125, -1.7724609375, -1.59442138671875, -1.4163818359375, -1.23834228515625, -1.060302734375, -0.88226318359375, -0.7042236328125, -0.52618408203125, -0.34814453125, -0.17010498046875, 0.0079345703125, 0.18597412109375, 0.364013671875, 0.54205322265625, 0.7200927734375, 0.89813232421875, 1.076171875, 1.25421142578125, 1.4322509765625, 1.61029052734375, 1.788330078125, 1.96636962890625, 2.1444091796875, 2.32244873046875, 2.50048828125, 2.67852783203125, 2.8565673828125, 3.03460693359375, 3.212646484375, 3.39068603515625, 3.5687255859375, 3.74676513671875, 3.9248046875, 4.10284423828125, 4.2808837890625, 4.45892333984375, 4.636962890625, 4.81500244140625, 4.9930419921875, 5.17108154296875, 5.34912109375, 5.52716064453125, 5.7052001953125, 5.88323974609375, 6.061279296875, 6.23931884765625, 6.4173583984375, 6.59539794921875, 6.7734375]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 10.0, 115.0, 412.0, 386.0, 85.0, 10.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.879435539245605, -9.662537574768066, -8.445638656616211, -7.228740692138672, -6.011842250823975, -4.794943809509277, -3.5780458450317383, -2.361146926879883, -1.1442489624023438, 0.07264935970306396, 1.2895476818084717, 2.50644588470459, 3.723344326019287, 4.940242767333984, 6.157140731811523, 7.374039649963379, 8.590937614440918, 9.807835578918457, 11.024734497070312, 12.241632461547852, 13.45853042602539, 14.675429344177246, 15.892327308654785, 17.10922622680664, 18.32612419128418, 19.54302215576172, 20.759920120239258, 21.976818084716797, 23.19371795654297, 24.410615921020508, 25.627513885498047, 26.84441375732422, 28.06131362915039, 29.27821159362793, 30.49510955810547, 31.71200942993164, 32.92890548706055, 34.14580535888672, 35.362701416015625, 36.5796012878418, 37.79650115966797, 39.01340103149414, 40.23029708862305, 41.44719696044922, 42.664093017578125, 43.8809928894043, 45.09789276123047, 46.314788818359375, 47.53168487548828, 48.74858474731445, 49.96548080444336, 51.18238067626953, 52.39927673339844, 53.61617660522461, 54.83307647705078, 56.04997253417969, 57.26687240600586, 58.48377227783203, 59.70066833496094, 60.91756820678711, 62.134464263916016, 63.35136413574219, 64.5682601928711, 65.78516387939453, 67.00205993652344]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 4.0, 6.0, 10.0, 4.0, 8.0, 22.0, 11.0, 14.0, 22.0, 33.0, 27.0, 33.0, 33.0, 37.0, 39.0, 46.0, 40.0, 40.0, 42.0, 43.0, 44.0, 44.0, 44.0, 39.0, 38.0, 40.0, 26.0, 32.0, 33.0, 29.0, 24.0, 16.0, 15.0, 14.0, 10.0, 7.0, 8.0, 2.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.827873229980469, -7.594815254211426, -7.361757755279541, -7.128699779510498, -6.895642280578613, -6.66258430480957, -6.429526329040527, -6.196468830108643, -5.963411331176758, -5.730353355407715, -5.49729585647583, -5.264237880706787, -5.031180381774902, -4.798122406005859, -4.565064430236816, -4.332006931304932, -4.098948955535889, -3.865891218185425, -3.632833480834961, -3.399775505065918, -3.166718006134033, -2.9336600303649902, -2.7006022930145264, -2.4675445556640625, -2.2344868183135986, -2.0014290809631348, -1.768371343612671, -1.5353134870529175, -1.3022557497024536, -1.0691980123519897, -0.8361401557922363, -0.6030824184417725, -0.3700251579284668, -0.13696739077568054, 0.09609037637710571, 0.32914817333221436, 0.5622059106826782, 0.7952636480331421, 1.0283215045928955, 1.2613792419433594, 1.4944369792938232, 1.727494716644287, 1.960552453994751, 2.193610191345215, 2.426668167114258, 2.6597256660461426, 2.8927836418151855, 3.1258413791656494, 3.3588991165161133, 3.591956853866577, 3.825014591217041, 4.058072566986084, 4.291130065917969, 4.524188041687012, 4.757246017456055, 4.9903035163879395, 5.223361015319824, 5.456418991088867, 5.689476490020752, 5.922534465789795, 6.15559196472168, 6.388649940490723, 6.621707916259766, 6.85476541519165, 7.087823390960693]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 8.0, 3.0, 6.0, 9.0, 13.0, 8.0, 10.0, 16.0, 13.0, 18.0, 21.0, 21.0, 25.0, 18.0, 29.0, 28.0, 31.0, 42.0, 34.0, 38.0, 40.0, 43.0, 35.0, 34.0, 43.0, 37.0, 36.0, 42.0, 27.0, 31.0, 32.0, 24.0, 27.0, 23.0, 22.0, 19.0, 18.0, 9.0, 8.0, 13.0, 7.0, 13.0, 4.0, 8.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0], "bins": [-0.84716796875, -0.822662353515625, -0.79815673828125, -0.773651123046875, -0.7491455078125, -0.724639892578125, -0.70013427734375, -0.675628662109375, -0.651123046875, -0.626617431640625, -0.60211181640625, -0.577606201171875, -0.5531005859375, -0.528594970703125, -0.50408935546875, -0.479583740234375, -0.455078125, -0.430572509765625, -0.40606689453125, -0.381561279296875, -0.3570556640625, -0.332550048828125, -0.30804443359375, -0.283538818359375, -0.259033203125, -0.234527587890625, -0.21002197265625, -0.185516357421875, -0.1610107421875, -0.136505126953125, -0.11199951171875, -0.087493896484375, -0.06298828125, -0.038482666015625, -0.01397705078125, 0.010528564453125, 0.0350341796875, 0.059539794921875, 0.08404541015625, 0.108551025390625, 0.133056640625, 0.157562255859375, 0.18206787109375, 0.206573486328125, 0.2310791015625, 0.255584716796875, 0.28009033203125, 0.304595947265625, 0.3291015625, 0.353607177734375, 0.37811279296875, 0.402618408203125, 0.4271240234375, 0.451629638671875, 0.47613525390625, 0.500640869140625, 0.525146484375, 0.549652099609375, 0.57415771484375, 0.598663330078125, 0.6231689453125, 0.647674560546875, 0.67218017578125, 0.696685791015625, 0.72119140625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 8.0, 3.0, 2.0, 8.0, 14.0, 17.0, 12.0, 26.0, 33.0, 40.0, 60.0, 92.0, 153.0, 274.0, 483.0, 817.0, 1476.0, 2617.0, 5038.0, 9755.0, 20834.0, 51835.0, 165209.0, 903218.0, 2248468.0, 589126.0, 120046.0, 39998.0, 16832.0, 7928.0, 4170.0, 2301.0, 1323.0, 795.0, 430.0, 338.0, 159.0, 124.0, 69.0, 42.0, 27.0, 22.0, 18.0, 7.0, 13.0, 7.0, 6.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.8076171875, -1.7500152587890625, -1.692413330078125, -1.6348114013671875, -1.57720947265625, -1.5196075439453125, -1.462005615234375, -1.4044036865234375, -1.3468017578125, -1.2891998291015625, -1.231597900390625, -1.1739959716796875, -1.11639404296875, -1.0587921142578125, -1.001190185546875, -0.9435882568359375, -0.885986328125, -0.8283843994140625, -0.770782470703125, -0.7131805419921875, -0.65557861328125, -0.5979766845703125, -0.540374755859375, -0.4827728271484375, -0.4251708984375, -0.3675689697265625, -0.309967041015625, -0.2523651123046875, -0.19476318359375, -0.1371612548828125, -0.079559326171875, -0.0219573974609375, 0.03564453125, 0.0932464599609375, 0.150848388671875, 0.2084503173828125, 0.26605224609375, 0.3236541748046875, 0.381256103515625, 0.4388580322265625, 0.4964599609375, 0.5540618896484375, 0.611663818359375, 0.6692657470703125, 0.72686767578125, 0.7844696044921875, 0.842071533203125, 0.8996734619140625, 0.957275390625, 1.0148773193359375, 1.072479248046875, 1.1300811767578125, 1.18768310546875, 1.2452850341796875, 1.302886962890625, 1.3604888916015625, 1.4180908203125, 1.4756927490234375, 1.533294677734375, 1.5908966064453125, 1.64849853515625, 1.7061004638671875, 1.763702392578125, 1.8213043212890625, 1.87890625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 9.0, 8.0, 14.0, 12.0, 20.0, 20.0, 27.0, 56.0, 58.0, 56.0, 89.0, 114.0, 154.0, 205.0, 232.0, 369.0, 455.0, 458.0, 426.0, 298.0, 245.0, 168.0, 154.0, 103.0, 65.0, 60.0, 47.0, 41.0, 22.0, 24.0, 16.0, 13.0, 9.0, 12.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.587890625, -1.5354156494140625, -1.482940673828125, -1.4304656982421875, -1.37799072265625, -1.3255157470703125, -1.273040771484375, -1.2205657958984375, -1.1680908203125, -1.1156158447265625, -1.063140869140625, -1.0106658935546875, -0.95819091796875, -0.9057159423828125, -0.853240966796875, -0.8007659912109375, -0.748291015625, -0.6958160400390625, -0.643341064453125, -0.5908660888671875, -0.53839111328125, -0.4859161376953125, -0.433441162109375, -0.3809661865234375, -0.3284912109375, -0.2760162353515625, -0.223541259765625, -0.1710662841796875, -0.11859130859375, -0.0661163330078125, -0.013641357421875, 0.0388336181640625, 0.09130859375, 0.1437835693359375, 0.196258544921875, 0.2487335205078125, 0.30120849609375, 0.3536834716796875, 0.406158447265625, 0.4586334228515625, 0.5111083984375, 0.5635833740234375, 0.616058349609375, 0.6685333251953125, 0.72100830078125, 0.7734832763671875, 0.825958251953125, 0.8784332275390625, 0.930908203125, 0.9833831787109375, 1.035858154296875, 1.0883331298828125, 1.14080810546875, 1.1932830810546875, 1.245758056640625, 1.2982330322265625, 1.3507080078125, 1.4031829833984375, 1.455657958984375, 1.5081329345703125, 1.56060791015625, 1.6130828857421875, 1.665557861328125, 1.7180328369140625, 1.7705078125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 7.0, 8.0, 14.0, 18.0, 33.0, 45.0, 76.0, 147.0, 272.0, 527.0, 1099.0, 2588.0, 6382.0, 18199.0, 62954.0, 293341.0, 2162449.0, 1386108.0, 191874.0, 45213.0, 13924.0, 5078.0, 2098.0, 885.0, 422.0, 209.0, 123.0, 85.0, 29.0, 30.0, 12.0, 10.0, 10.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.224609375, -3.12652587890625, -3.0284423828125, -2.93035888671875, -2.832275390625, -2.73419189453125, -2.6361083984375, -2.53802490234375, -2.43994140625, -2.34185791015625, -2.2437744140625, -2.14569091796875, -2.047607421875, -1.94952392578125, -1.8514404296875, -1.75335693359375, -1.6552734375, -1.55718994140625, -1.4591064453125, -1.36102294921875, -1.262939453125, -1.16485595703125, -1.0667724609375, -0.96868896484375, -0.87060546875, -0.77252197265625, -0.6744384765625, -0.57635498046875, -0.478271484375, -0.38018798828125, -0.2821044921875, -0.18402099609375, -0.0859375, 0.01214599609375, 0.1102294921875, 0.20831298828125, 0.306396484375, 0.40447998046875, 0.5025634765625, 0.60064697265625, 0.69873046875, 0.79681396484375, 0.8948974609375, 0.99298095703125, 1.091064453125, 1.18914794921875, 1.2872314453125, 1.38531494140625, 1.4833984375, 1.58148193359375, 1.6795654296875, 1.77764892578125, 1.875732421875, 1.97381591796875, 2.0718994140625, 2.16998291015625, 2.26806640625, 2.36614990234375, 2.4642333984375, 2.56231689453125, 2.660400390625, 2.75848388671875, 2.8565673828125, 2.95465087890625, 3.052734375]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 18.0, 66.0, 157.0, 281.0, 258.0, 152.0, 56.0, 15.0, 8.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.553844451904297, -20.61452293395996, -19.675201416015625, -18.73587989807129, -17.796558380126953, -16.857236862182617, -15.917916297912598, -14.978594779968262, -14.039273262023926, -13.09995174407959, -12.160630226135254, -11.221309661865234, -10.281988143920898, -9.342666625976562, -8.403345108032227, -7.464023590087891, -6.524702072143555, -5.585380554199219, -4.646059036254883, -3.706737995147705, -2.767416477203369, -1.8280949592590332, -0.8887739181518555, 0.05054759979248047, 0.9898691177368164, 1.9291905164718628, 2.868511915206909, 3.807833194732666, 4.747154712677002, 5.686476230621338, 6.625797271728516, 7.565118789672852, 8.504440307617188, 9.443761825561523, 10.38308334350586, 11.322404861450195, 12.261726379394531, 13.201047897338867, 14.140368461608887, 15.079689979553223, 16.019012451171875, 16.95833396911621, 17.897655487060547, 18.836977005004883, 19.77629852294922, 20.715620040893555, 21.65494155883789, 22.594261169433594, 23.53358268737793, 24.472904205322266, 25.4122257232666, 26.351547241210938, 27.290868759155273, 28.23019027709961, 29.169509887695312, 30.10883331298828, 31.048152923583984, 31.98747444152832, 32.926795959472656, 33.86611557006836, 34.80543899536133, 35.74475860595703, 36.68408203125, 37.6234016418457, 38.56272506713867]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 3.0, 4.0, 3.0, 10.0, 12.0, 14.0, 15.0, 17.0, 20.0, 21.0, 30.0, 26.0, 31.0, 28.0, 29.0, 29.0, 31.0, 34.0, 44.0, 40.0, 37.0, 46.0, 40.0, 41.0, 35.0, 41.0, 41.0, 29.0, 37.0, 35.0, 24.0, 27.0, 16.0, 26.0, 16.0, 14.0, 6.0, 10.0, 7.0, 10.0, 9.0, 2.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.360253810882568, -6.184417247772217, -6.008580684661865, -5.832744121551514, -5.656907558441162, -5.4810709953308105, -5.305234432220459, -5.129397869110107, -4.953561305999756, -4.777724742889404, -4.601888179779053, -4.426051616668701, -4.25021505355835, -4.074378490447998, -3.8985419273376465, -3.722705364227295, -3.5468688011169434, -3.371032238006592, -3.1951956748962402, -3.0193591117858887, -2.843522548675537, -2.6676859855651855, -2.491849422454834, -2.3160128593444824, -2.140176296234131, -1.9643397331237793, -1.7885031700134277, -1.6126666069030762, -1.4368300437927246, -1.260993480682373, -1.0851569175720215, -0.9093203544616699, -0.7334833145141602, -0.5576467514038086, -0.38181018829345703, -0.20597362518310547, -0.030137062072753906, 0.14569950103759766, 0.3215360641479492, 0.4973726272583008, 0.6732091903686523, 0.8490457534790039, 1.0248823165893555, 1.200718879699707, 1.3765554428100586, 1.5523920059204102, 1.7282285690307617, 1.9040651321411133, 2.079901695251465, 2.2557382583618164, 2.431574821472168, 2.6074113845825195, 2.783247947692871, 2.9590845108032227, 3.134921073913574, 3.310757637023926, 3.4865942001342773, 3.662430763244629, 3.8382673263549805, 4.014103889465332, 4.189940452575684, 4.365777015686035, 4.541613578796387, 4.717450141906738, 4.89328670501709]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 2.0, 7.0, 9.0, 4.0, 10.0, 7.0, 12.0, 11.0, 21.0, 19.0, 23.0, 23.0, 20.0, 27.0, 35.0, 30.0, 31.0, 37.0, 40.0, 32.0, 42.0, 34.0, 33.0, 44.0, 45.0, 40.0, 36.0, 34.0, 28.0, 35.0, 35.0, 25.0, 18.0, 17.0, 20.0, 20.0, 13.0, 17.0, 7.0, 6.0, 13.0, 8.0, 7.0, 6.0, 8.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.85546875, -0.8312301635742188, -0.8069915771484375, -0.7827529907226562, -0.758514404296875, -0.7342758178710938, -0.7100372314453125, -0.6857986450195312, -0.66156005859375, -0.6373214721679688, -0.6130828857421875, -0.5888442993164062, -0.564605712890625, -0.5403671264648438, -0.5161285400390625, -0.49188995361328125, -0.4676513671875, -0.44341278076171875, -0.4191741943359375, -0.39493560791015625, -0.370697021484375, -0.34645843505859375, -0.3222198486328125, -0.29798126220703125, -0.27374267578125, -0.24950408935546875, -0.2252655029296875, -0.20102691650390625, -0.176788330078125, -0.15254974365234375, -0.1283111572265625, -0.10407257080078125, -0.079833984375, -0.05559539794921875, -0.0313568115234375, -0.00711822509765625, 0.017120361328125, 0.04135894775390625, 0.0655975341796875, 0.08983612060546875, 0.11407470703125, 0.13831329345703125, 0.1625518798828125, 0.18679046630859375, 0.211029052734375, 0.23526763916015625, 0.2595062255859375, 0.28374481201171875, 0.3079833984375, 0.33222198486328125, 0.3564605712890625, 0.38069915771484375, 0.404937744140625, 0.42917633056640625, 0.4534149169921875, 0.47765350341796875, 0.50189208984375, 0.5261306762695312, 0.5503692626953125, 0.5746078491210938, 0.598846435546875, 0.6230850219726562, 0.6473236083984375, 0.6715621948242188, 0.69580078125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 5.0, 4.0, 6.0, 14.0, 18.0, 30.0, 50.0, 85.0, 171.0, 296.0, 562.0, 1159.0, 2075.0, 3746.0, 7502.0, 15059.0, 33318.0, 85552.0, 265035.0, 397570.0, 143082.0, 50546.0, 21316.0, 10227.0, 5252.0, 2703.0, 1455.0, 823.0, 458.0, 200.0, 111.0, 53.0, 24.0, 20.0, 14.0, 4.0, 8.0, 4.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5595703125, -0.5432243347167969, -0.5268783569335938, -0.5105323791503906, -0.4941864013671875, -0.4778404235839844, -0.46149444580078125, -0.4451484680175781, -0.428802490234375, -0.4124565124511719, -0.39611053466796875, -0.3797645568847656, -0.3634185791015625, -0.3470726013183594, -0.33072662353515625, -0.3143806457519531, -0.29803466796875, -0.2816886901855469, -0.26534271240234375, -0.24899673461914062, -0.2326507568359375, -0.21630477905273438, -0.19995880126953125, -0.18361282348632812, -0.167266845703125, -0.15092086791992188, -0.13457489013671875, -0.11822891235351562, -0.1018829345703125, -0.08553695678710938, -0.06919097900390625, -0.052845001220703125, -0.0364990234375, -0.020153045654296875, -0.00380706787109375, 0.012538909912109375, 0.0288848876953125, 0.045230865478515625, 0.06157684326171875, 0.07792282104492188, 0.094268798828125, 0.11061477661132812, 0.12696075439453125, 0.14330673217773438, 0.1596527099609375, 0.17599868774414062, 0.19234466552734375, 0.20869064331054688, 0.22503662109375, 0.24138259887695312, 0.25772857666015625, 0.2740745544433594, 0.2904205322265625, 0.3067665100097656, 0.32311248779296875, 0.3394584655761719, 0.355804443359375, 0.3721504211425781, 0.38849639892578125, 0.4048423767089844, 0.4211883544921875, 0.4375343322753906, 0.45388031005859375, 0.4702262878417969, 0.486572265625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 6.0, 5.0, 7.0, 8.0, 8.0, 11.0, 8.0, 8.0, 17.0, 23.0, 24.0, 21.0, 24.0, 33.0, 34.0, 38.0, 35.0, 36.0, 34.0, 46.0, 44.0, 1068.0, 38.0, 42.0, 37.0, 38.0, 43.0, 29.0, 31.0, 27.0, 25.0, 21.0, 20.0, 17.0, 23.0, 23.0, 18.0, 12.0, 5.0, 7.0, 6.0, 6.0, 4.0, 1.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.59716796875, -0.5784988403320312, -0.5598297119140625, -0.5411605834960938, -0.522491455078125, -0.5038223266601562, -0.4851531982421875, -0.46648406982421875, -0.44781494140625, -0.42914581298828125, -0.4104766845703125, -0.39180755615234375, -0.373138427734375, -0.35446929931640625, -0.3358001708984375, -0.31713104248046875, -0.2984619140625, -0.27979278564453125, -0.2611236572265625, -0.24245452880859375, -0.223785400390625, -0.20511627197265625, -0.1864471435546875, -0.16777801513671875, -0.14910888671875, -0.13043975830078125, -0.1117706298828125, -0.09310150146484375, -0.074432373046875, -0.05576324462890625, -0.0370941162109375, -0.01842498779296875, 0.000244140625, 0.01891326904296875, 0.0375823974609375, 0.05625152587890625, 0.074920654296875, 0.09358978271484375, 0.1122589111328125, 0.13092803955078125, 0.14959716796875, 0.16826629638671875, 0.1869354248046875, 0.20560455322265625, 0.224273681640625, 0.24294281005859375, 0.2616119384765625, 0.28028106689453125, 0.2989501953125, 0.31761932373046875, 0.3362884521484375, 0.35495758056640625, 0.373626708984375, 0.39229583740234375, 0.4109649658203125, 0.42963409423828125, 0.44830322265625, 0.46697235107421875, 0.4856414794921875, 0.5043106079101562, 0.522979736328125, 0.5416488647460938, 0.5603179931640625, 0.5789871215820312, 0.59765625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 11.0, 8.0, 11.0, 17.0, 27.0, 37.0, 48.0, 79.0, 98.0, 167.0, 287.0, 449.0, 700.0, 1254.0, 2276.0, 4405.0, 9453.0, 23015.0, 70302.0, 360133.0, 1373869.0, 174923.0, 44627.0, 16063.0, 7057.0, 3370.0, 1878.0, 1006.0, 563.0, 350.0, 212.0, 144.0, 92.0, 62.0, 35.0, 31.0, 24.0, 16.0, 7.0, 7.0, 4.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.35302734375, -0.3413810729980469, -0.32973480224609375, -0.3180885314941406, -0.3064422607421875, -0.2947959899902344, -0.28314971923828125, -0.2715034484863281, -0.259857177734375, -0.24821090698242188, -0.23656463623046875, -0.22491836547851562, -0.2132720947265625, -0.20162582397460938, -0.18997955322265625, -0.17833328247070312, -0.16668701171875, -0.15504074096679688, -0.14339447021484375, -0.13174819946289062, -0.1201019287109375, -0.10845565795898438, -0.09680938720703125, -0.08516311645507812, -0.073516845703125, -0.061870574951171875, -0.05022430419921875, -0.038578033447265625, -0.0269317626953125, -0.015285491943359375, -0.00363922119140625, 0.008007049560546875, 0.0196533203125, 0.031299591064453125, 0.04294586181640625, 0.054592132568359375, 0.0662384033203125, 0.07788467407226562, 0.08953094482421875, 0.10117721557617188, 0.112823486328125, 0.12446975708007812, 0.13611602783203125, 0.14776229858398438, 0.1594085693359375, 0.17105484008789062, 0.18270111083984375, 0.19434738159179688, 0.20599365234375, 0.21763992309570312, 0.22928619384765625, 0.24093246459960938, 0.2525787353515625, 0.2642250061035156, 0.27587127685546875, 0.2875175476074219, 0.299163818359375, 0.3108100891113281, 0.32245635986328125, 0.3341026306152344, 0.3457489013671875, 0.3573951721191406, 0.36904144287109375, 0.3806877136230469, 0.392333984375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 7.0, 8.0, 9.0, 10.0, 11.0, 22.0, 29.0, 37.0, 49.0, 90.0, 178.0, 194.0, 136.0, 58.0, 44.0, 33.0, 23.0, 17.0, 10.0, 7.0, 8.0, 6.0, 8.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08416748046875, -0.08146190643310547, -0.07875633239746094, -0.0760507583618164, -0.07334518432617188, -0.07063961029052734, -0.06793403625488281, -0.06522846221923828, -0.06252288818359375, -0.05981731414794922, -0.05711174011230469, -0.054406166076660156, -0.051700592041015625, -0.048995018005371094, -0.04628944396972656, -0.04358386993408203, -0.0408782958984375, -0.03817272186279297, -0.03546714782714844, -0.032761573791503906, -0.030055999755859375, -0.027350425720214844, -0.024644851684570312, -0.02193927764892578, -0.01923370361328125, -0.01652812957763672, -0.013822555541992188, -0.011116981506347656, -0.008411407470703125, -0.005705833435058594, -0.0030002593994140625, -0.00029468536376953125, 0.002410888671875, 0.005116462707519531, 0.007822036743164062, 0.010527610778808594, 0.013233184814453125, 0.015938758850097656, 0.018644332885742188, 0.02134990692138672, 0.02405548095703125, 0.02676105499267578, 0.029466629028320312, 0.032172203063964844, 0.034877777099609375, 0.037583351135253906, 0.04028892517089844, 0.04299449920654297, 0.0457000732421875, 0.04840564727783203, 0.05111122131347656, 0.053816795349121094, 0.056522369384765625, 0.059227943420410156, 0.06193351745605469, 0.06463909149169922, 0.06734466552734375, 0.07005023956298828, 0.07275581359863281, 0.07546138763427734, 0.07816696166992188, 0.0808725357055664, 0.08357810974121094, 0.08628368377685547, 0.0889892578125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 5.0, 7.0, 6.0, 15.0, 7.0, 17.0, 23.0, 24.0, 31.0, 65.0, 115.0, 294.0, 1623.0, 46031.0, 983024.0, 15828.0, 934.0, 226.0, 88.0, 59.0, 31.0, 26.0, 24.0, 15.0, 11.0, 11.0, 4.0, 6.0, 2.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1103515625, -1.07379150390625, -1.0372314453125, -1.00067138671875, -0.964111328125, -0.92755126953125, -0.8909912109375, -0.85443115234375, -0.81787109375, -0.78131103515625, -0.7447509765625, -0.70819091796875, -0.671630859375, -0.63507080078125, -0.5985107421875, -0.56195068359375, -0.525390625, -0.48883056640625, -0.4522705078125, -0.41571044921875, -0.379150390625, -0.34259033203125, -0.3060302734375, -0.26947021484375, -0.23291015625, -0.19635009765625, -0.1597900390625, -0.12322998046875, -0.086669921875, -0.05010986328125, -0.0135498046875, 0.02301025390625, 0.0595703125, 0.09613037109375, 0.1326904296875, 0.16925048828125, 0.205810546875, 0.24237060546875, 0.2789306640625, 0.31549072265625, 0.35205078125, 0.38861083984375, 0.4251708984375, 0.46173095703125, 0.498291015625, 0.53485107421875, 0.5714111328125, 0.60797119140625, 0.64453125, 0.68109130859375, 0.7176513671875, 0.75421142578125, 0.790771484375, 0.82733154296875, 0.8638916015625, 0.90045166015625, 0.93701171875, 0.97357177734375, 1.0101318359375, 1.04669189453125, 1.083251953125, 1.11981201171875, 1.1563720703125, 1.19293212890625, 1.2294921875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 11.0, 33.0, 49.0, 107.0, 131.0, 195.0, 174.0, 135.0, 76.0, 45.0, 33.0, 9.0, 5.0, 3.0], "bins": [-0.3163999319076538, -0.310723215341568, -0.3050464987754822, -0.29936978220939636, -0.29369306564331055, -0.28801634907722473, -0.2823396325111389, -0.2766629159450531, -0.2709861993789673, -0.26530948281288147, -0.25963276624679565, -0.25395604968070984, -0.24827933311462402, -0.2426026165485382, -0.2369258999824524, -0.23124918341636658, -0.22557246685028076, -0.21989575028419495, -0.21421903371810913, -0.20854231715202332, -0.2028656005859375, -0.19718888401985168, -0.19151216745376587, -0.18583545088768005, -0.18015874922275543, -0.17448203265666962, -0.1688053160905838, -0.16312859952449799, -0.15745188295841217, -0.15177516639232635, -0.14609844982624054, -0.14042173326015472, -0.1347450166940689, -0.1290683001279831, -0.12339158356189728, -0.11771486699581146, -0.11203815042972565, -0.10636143386363983, -0.10068471729755402, -0.0950080007314682, -0.08933128416538239, -0.08365456759929657, -0.07797785103321075, -0.07230113446712494, -0.06662441790103912, -0.06094770133495331, -0.05527098849415779, -0.049594271928071976, -0.04391755908727646, -0.03824084252119064, -0.03256412595510483, -0.02688741125166416, -0.021210694685578346, -0.01553397811949253, -0.009857263416051865, -0.004180546849966049, 0.0014961697161197662, 0.007172885816544294, 0.012849601916968822, 0.018526317551732063, 0.02420303411781788, 0.029879750683903694, 0.03555646538734436, 0.041233181953430176, 0.04690989851951599]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 11.0, 6.0, 5.0, 17.0, 11.0, 21.0, 17.0, 10.0, 21.0, 19.0, 26.0, 29.0, 32.0, 27.0, 31.0, 32.0, 34.0, 38.0, 40.0, 39.0, 41.0, 33.0, 31.0, 28.0, 44.0, 30.0, 27.0, 31.0, 27.0, 25.0, 30.0, 28.0, 13.0, 17.0, 21.0, 17.0, 15.0, 17.0, 7.0, 13.0, 9.0, 5.0, 6.0, 5.0, 8.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.06515049934387207, -0.06326282024383545, -0.06137513741850853, -0.05948745459318161, -0.05759977549314499, -0.05571209639310837, -0.05382441356778145, -0.05193673074245453, -0.05004905164241791, -0.04816137254238129, -0.04627368971705437, -0.04438600689172745, -0.042498327791690826, -0.040610648691654205, -0.038722965866327286, -0.036835283041000366, -0.034947603940963745, -0.033059924840927124, -0.031172242015600204, -0.029284561052918434, -0.027396880090236664, -0.025509199127554893, -0.023621518164873123, -0.021733837202191353, -0.019846156239509583, -0.017958475276827812, -0.016070794314146042, -0.014183113351464272, -0.012295432388782501, -0.010407751426100731, -0.00852007046341896, -0.00663238950073719, -0.00474470853805542, -0.0028570275753736496, -0.0009693466126918793, 0.000918334349989891, 0.0028060153126716614, 0.004693696275353432, 0.006581377238035202, 0.008469058200716972, 0.010356739163398743, 0.012244420126080513, 0.014132101088762283, 0.016019782051444054, 0.017907463014125824, 0.019795143976807594, 0.021682824939489365, 0.023570505902171135, 0.025458186864852905, 0.027345867827534676, 0.029233548790216446, 0.031121229752898216, 0.03300891071557999, 0.03489658981561661, 0.03678427264094353, 0.03867195546627045, 0.04055963456630707, 0.04244731366634369, 0.04433499649167061, 0.04622267931699753, 0.04811035841703415, 0.04999803751707077, 0.05188572034239769, 0.05377340316772461, 0.05566108226776123]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 2.0, 7.0, 8.0, 5.0, 10.0, 7.0, 12.0, 12.0, 21.0, 17.0, 23.0, 21.0, 24.0, 26.0, 35.0, 28.0, 31.0, 35.0, 43.0, 31.0, 47.0, 30.0, 34.0, 43.0, 44.0, 39.0, 37.0, 36.0, 25.0, 35.0, 38.0, 21.0, 22.0, 12.0, 24.0, 19.0, 13.0, 17.0, 9.0, 6.0, 14.0, 7.0, 8.0, 5.0, 6.0, 7.0, 1.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.85498046875, -0.830780029296875, -0.80657958984375, -0.782379150390625, -0.7581787109375, -0.733978271484375, -0.70977783203125, -0.685577392578125, -0.661376953125, -0.637176513671875, -0.61297607421875, -0.588775634765625, -0.5645751953125, -0.540374755859375, -0.51617431640625, -0.491973876953125, -0.4677734375, -0.443572998046875, -0.41937255859375, -0.395172119140625, -0.3709716796875, -0.346771240234375, -0.32257080078125, -0.298370361328125, -0.274169921875, -0.249969482421875, -0.22576904296875, -0.201568603515625, -0.1773681640625, -0.153167724609375, -0.12896728515625, -0.104766845703125, -0.08056640625, -0.056365966796875, -0.03216552734375, -0.007965087890625, 0.0162353515625, 0.040435791015625, 0.06463623046875, 0.088836669921875, 0.113037109375, 0.137237548828125, 0.16143798828125, 0.185638427734375, 0.2098388671875, 0.234039306640625, 0.25823974609375, 0.282440185546875, 0.306640625, 0.330841064453125, 0.35504150390625, 0.379241943359375, 0.4034423828125, 0.427642822265625, 0.45184326171875, 0.476043701171875, 0.500244140625, 0.524444580078125, 0.54864501953125, 0.572845458984375, 0.5970458984375, 0.621246337890625, 0.64544677734375, 0.669647216796875, 0.69384765625]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 8.0, 13.0, 27.0, 33.0, 33.0, 46.0, 72.0, 112.0, 159.0, 260.0, 350.0, 580.0, 933.0, 1729.0, 2862.0, 5030.0, 9108.0, 17293.0, 32907.0, 63762.0, 130709.0, 317474.0, 247661.0, 105204.0, 52173.0, 27343.0, 14395.0, 7854.0, 4214.0, 2500.0, 1381.0, 811.0, 541.0, 319.0, 218.0, 137.0, 103.0, 66.0, 36.0, 29.0, 20.0, 11.0, 7.0, 12.0, 7.0, 3.0, 2.0, 4.0, 4.0, 0.0, 1.0, 2.0], "bins": [-1.353515625, -1.31353759765625, -1.2735595703125, -1.23358154296875, -1.193603515625, -1.15362548828125, -1.1136474609375, -1.07366943359375, -1.03369140625, -0.99371337890625, -0.9537353515625, -0.91375732421875, -0.873779296875, -0.83380126953125, -0.7938232421875, -0.75384521484375, -0.7138671875, -0.67388916015625, -0.6339111328125, -0.59393310546875, -0.553955078125, -0.51397705078125, -0.4739990234375, -0.43402099609375, -0.39404296875, -0.35406494140625, -0.3140869140625, -0.27410888671875, -0.234130859375, -0.19415283203125, -0.1541748046875, -0.11419677734375, -0.07421875, -0.03424072265625, 0.0057373046875, 0.04571533203125, 0.085693359375, 0.12567138671875, 0.1656494140625, 0.20562744140625, 0.24560546875, 0.28558349609375, 0.3255615234375, 0.36553955078125, 0.405517578125, 0.44549560546875, 0.4854736328125, 0.52545166015625, 0.5654296875, 0.60540771484375, 0.6453857421875, 0.68536376953125, 0.725341796875, 0.76531982421875, 0.8052978515625, 0.84527587890625, 0.88525390625, 0.92523193359375, 0.9652099609375, 1.00518798828125, 1.045166015625, 1.08514404296875, 1.1251220703125, 1.16510009765625, 1.205078125]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 6.0, 7.0, 6.0, 6.0, 11.0, 5.0, 23.0, 18.0, 17.0, 29.0, 23.0, 35.0, 34.0, 38.0, 45.0, 68.0, 81.0, 104.0, 201.0, 1336.0, 301.0, 149.0, 101.0, 68.0, 51.0, 35.0, 29.0, 36.0, 41.0, 18.0, 26.0, 22.0, 14.0, 11.0, 13.0, 10.0, 8.0, 1.0, 10.0, 7.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0], "bins": [-3.1328125, -3.04754638671875, -2.9622802734375, -2.87701416015625, -2.791748046875, -2.70648193359375, -2.6212158203125, -2.53594970703125, -2.45068359375, -2.36541748046875, -2.2801513671875, -2.19488525390625, -2.109619140625, -2.02435302734375, -1.9390869140625, -1.85382080078125, -1.7685546875, -1.68328857421875, -1.5980224609375, -1.51275634765625, -1.427490234375, -1.34222412109375, -1.2569580078125, -1.17169189453125, -1.08642578125, -1.00115966796875, -0.9158935546875, -0.83062744140625, -0.745361328125, -0.66009521484375, -0.5748291015625, -0.48956298828125, -0.404296875, -0.31903076171875, -0.2337646484375, -0.14849853515625, -0.063232421875, 0.02203369140625, 0.1072998046875, 0.19256591796875, 0.27783203125, 0.36309814453125, 0.4483642578125, 0.53363037109375, 0.618896484375, 0.70416259765625, 0.7894287109375, 0.87469482421875, 0.9599609375, 1.04522705078125, 1.1304931640625, 1.21575927734375, 1.301025390625, 1.38629150390625, 1.4715576171875, 1.55682373046875, 1.64208984375, 1.72735595703125, 1.8126220703125, 1.89788818359375, 1.983154296875, 2.06842041015625, 2.1536865234375, 2.23895263671875, 2.32421875]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 1.0, 4.0, 6.0, 9.0, 11.0, 15.0, 14.0, 20.0, 15.0, 25.0, 39.0, 41.0, 60.0, 90.0, 105.0, 150.0, 210.0, 292.0, 640.0, 1997.0, 12817.0, 158211.0, 2527447.0, 412028.0, 26016.0, 3346.0, 846.0, 375.0, 229.0, 153.0, 111.0, 91.0, 69.0, 48.0, 29.0, 32.0, 28.0, 25.0, 12.0, 12.0, 11.0, 5.0, 7.0, 1.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0], "bins": [-4.578125, -4.42877197265625, -4.2794189453125, -4.13006591796875, -3.980712890625, -3.83135986328125, -3.6820068359375, -3.53265380859375, -3.38330078125, -3.23394775390625, -3.0845947265625, -2.93524169921875, -2.785888671875, -2.63653564453125, -2.4871826171875, -2.33782958984375, -2.1884765625, -2.03912353515625, -1.8897705078125, -1.74041748046875, -1.591064453125, -1.44171142578125, -1.2923583984375, -1.14300537109375, -0.99365234375, -0.84429931640625, -0.6949462890625, -0.54559326171875, -0.396240234375, -0.24688720703125, -0.0975341796875, 0.05181884765625, 0.201171875, 0.35052490234375, 0.4998779296875, 0.64923095703125, 0.798583984375, 0.94793701171875, 1.0972900390625, 1.24664306640625, 1.39599609375, 1.54534912109375, 1.6947021484375, 1.84405517578125, 1.993408203125, 2.14276123046875, 2.2921142578125, 2.44146728515625, 2.5908203125, 2.74017333984375, 2.8895263671875, 3.03887939453125, 3.188232421875, 3.33758544921875, 3.4869384765625, 3.63629150390625, 3.78564453125, 3.93499755859375, 4.0843505859375, 4.23370361328125, 4.383056640625, 4.53240966796875, 4.6817626953125, 4.83111572265625, 4.98046875]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 19.0, 161.0, 583.0, 241.0, 13.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.482610702514648, -7.204277515411377, -5.9259443283081055, -4.647611618041992, -3.3692784309387207, -2.090945243835449, -0.8126125335693359, 0.46572113037109375, 1.744053840637207, 3.0223870277404785, 4.30072021484375, 5.579052925109863, 6.857386112213135, 8.135719299316406, 9.41405200958252, 10.69238567352295, 11.970718383789062, 13.249051094055176, 14.527384757995605, 15.805717468261719, 17.08405113220215, 18.362384796142578, 19.640716552734375, 20.919050216674805, 22.197383880615234, 23.475717544555664, 24.75404930114746, 26.03238296508789, 27.31071662902832, 28.58905029296875, 29.867382049560547, 31.145715713500977, 32.42404556274414, 33.70237731933594, 34.980712890625, 36.2590446472168, 37.537376403808594, 38.815711975097656, 40.09404373168945, 41.37237548828125, 42.65071105957031, 43.92904281616211, 45.20737838745117, 46.48571014404297, 47.764041900634766, 49.04237747192383, 50.320709228515625, 51.59904479980469, 52.87737274169922, 54.155704498291016, 55.43404006958008, 56.712371826171875, 57.99070358276367, 59.269039154052734, 60.54737091064453, 61.825706481933594, 63.10403823852539, 64.38236999511719, 65.66070556640625, 66.93904113769531, 68.21736907958984, 69.4957046508789, 70.77403259277344, 72.0523681640625, 73.33070373535156]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 3.0, 4.0, 3.0, 6.0, 14.0, 11.0, 14.0, 11.0, 17.0, 24.0, 23.0, 22.0, 27.0, 24.0, 27.0, 34.0, 34.0, 44.0, 31.0, 42.0, 32.0, 42.0, 30.0, 33.0, 34.0, 47.0, 35.0, 41.0, 41.0, 26.0, 26.0, 24.0, 26.0, 20.0, 25.0, 15.0, 12.0, 13.0, 16.0, 9.0, 8.0, 3.0, 4.0, 6.0, 6.0, 6.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.860989570617676, -6.628107070922852, -6.395224571228027, -6.162342071533203, -5.929459571838379, -5.696577072143555, -5.463694095611572, -5.230811595916748, -4.997929096221924, -4.7650465965271, -4.532164096832275, -4.299281597137451, -4.066398620605469, -3.8335163593292236, -3.6006336212158203, -3.367751121520996, -3.134868621826172, -2.9019861221313477, -2.6691036224365234, -2.43622088432312, -2.203338384628296, -1.9704558849334717, -1.737573266029358, -1.5046906471252441, -1.27180814743042, -1.0389256477355957, -0.8060430288314819, -0.5731604695320129, -0.34027791023254395, -0.10739541053771973, 0.12548720836639404, 0.3583698272705078, 0.591252326965332, 0.824134886264801, 1.05701744556427, 1.2899000644683838, 1.522782564163208, 1.7556650638580322, 1.988547682762146, 2.2214303016662598, 2.454312801361084, 2.687195301055908, 2.9200778007507324, 3.1529605388641357, 3.38584303855896, 3.618725538253784, 3.8516082763671875, 4.084490776062012, 4.317373275756836, 4.55025577545166, 4.783138275146484, 5.016020774841309, 5.248903274536133, 5.481785774230957, 5.7146687507629395, 5.947551250457764, 6.180433750152588, 6.413316249847412, 6.646198749542236, 6.8790812492370605, 7.111964225769043, 7.344846725463867, 7.577729225158691, 7.810611724853516, 8.04349422454834]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 5.0, 6.0, 5.0, 6.0, 8.0, 12.0, 11.0, 16.0, 24.0, 24.0, 28.0, 34.0, 33.0, 38.0, 31.0, 34.0, 29.0, 42.0, 36.0, 54.0, 48.0, 38.0, 52.0, 44.0, 41.0, 27.0, 37.0, 42.0, 31.0, 24.0, 22.0, 25.0, 18.0, 15.0, 9.0, 9.0, 9.0, 6.0, 8.0, 5.0, 6.0, 7.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0390625, -1.00958251953125, -0.9801025390625, -0.95062255859375, -0.921142578125, -0.89166259765625, -0.8621826171875, -0.83270263671875, -0.80322265625, -0.77374267578125, -0.7442626953125, -0.71478271484375, -0.685302734375, -0.65582275390625, -0.6263427734375, -0.59686279296875, -0.5673828125, -0.53790283203125, -0.5084228515625, -0.47894287109375, -0.449462890625, -0.41998291015625, -0.3905029296875, -0.36102294921875, -0.33154296875, -0.30206298828125, -0.2725830078125, -0.24310302734375, -0.213623046875, -0.18414306640625, -0.1546630859375, -0.12518310546875, -0.095703125, -0.06622314453125, -0.0367431640625, -0.00726318359375, 0.022216796875, 0.05169677734375, 0.0811767578125, 0.11065673828125, 0.14013671875, 0.16961669921875, 0.1990966796875, 0.22857666015625, 0.258056640625, 0.28753662109375, 0.3170166015625, 0.34649658203125, 0.3759765625, 0.40545654296875, 0.4349365234375, 0.46441650390625, 0.493896484375, 0.52337646484375, 0.5528564453125, 0.58233642578125, 0.61181640625, 0.64129638671875, 0.6707763671875, 0.70025634765625, 0.729736328125, 0.75921630859375, 0.7886962890625, 0.81817626953125, 0.84765625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 6.0, 6.0, 4.0, 7.0, 10.0, 17.0, 21.0, 22.0, 43.0, 52.0, 84.0, 133.0, 209.0, 297.0, 429.0, 581.0, 855.0, 1282.0, 2043.0, 3235.0, 5269.0, 8943.0, 16423.0, 32333.0, 71371.0, 199111.0, 726645.0, 1759801.0, 942516.0, 255544.0, 86143.0, 37204.0, 18084.0, 9914.0, 5671.0, 3487.0, 2078.0, 1409.0, 920.0, 646.0, 440.0, 295.0, 205.0, 147.0, 115.0, 73.0, 51.0, 49.0, 24.0, 20.0, 13.0, 11.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.376953125, -1.3319549560546875, -1.286956787109375, -1.2419586181640625, -1.19696044921875, -1.1519622802734375, -1.106964111328125, -1.0619659423828125, -1.0169677734375, -0.9719696044921875, -0.926971435546875, -0.8819732666015625, -0.83697509765625, -0.7919769287109375, -0.746978759765625, -0.7019805908203125, -0.656982421875, -0.6119842529296875, -0.566986083984375, -0.5219879150390625, -0.47698974609375, -0.4319915771484375, -0.386993408203125, -0.3419952392578125, -0.2969970703125, -0.2519989013671875, -0.207000732421875, -0.1620025634765625, -0.11700439453125, -0.0720062255859375, -0.027008056640625, 0.0179901123046875, 0.06298828125, 0.1079864501953125, 0.152984619140625, 0.1979827880859375, 0.24298095703125, 0.2879791259765625, 0.332977294921875, 0.3779754638671875, 0.4229736328125, 0.4679718017578125, 0.512969970703125, 0.5579681396484375, 0.60296630859375, 0.6479644775390625, 0.692962646484375, 0.7379608154296875, 0.782958984375, 0.8279571533203125, 0.872955322265625, 0.9179534912109375, 0.96295166015625, 1.0079498291015625, 1.052947998046875, 1.0979461669921875, 1.1429443359375, 1.1879425048828125, 1.232940673828125, 1.2779388427734375, 1.32293701171875, 1.3679351806640625, 1.412933349609375, 1.4579315185546875, 1.5029296875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 7.0, 7.0, 10.0, 12.0, 16.0, 20.0, 29.0, 46.0, 64.0, 75.0, 102.0, 159.0, 209.0, 363.0, 452.0, 553.0, 527.0, 429.0, 274.0, 186.0, 142.0, 118.0, 69.0, 36.0, 50.0, 26.0, 24.0, 14.0, 16.0, 13.0, 5.0, 5.0, 4.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6748046875, -1.6074371337890625, -1.540069580078125, -1.4727020263671875, -1.40533447265625, -1.3379669189453125, -1.270599365234375, -1.2032318115234375, -1.1358642578125, -1.0684967041015625, -1.001129150390625, -0.9337615966796875, -0.86639404296875, -0.7990264892578125, -0.731658935546875, -0.6642913818359375, -0.596923828125, -0.5295562744140625, -0.462188720703125, -0.3948211669921875, -0.32745361328125, -0.2600860595703125, -0.192718505859375, -0.1253509521484375, -0.0579833984375, 0.0093841552734375, 0.076751708984375, 0.1441192626953125, 0.21148681640625, 0.2788543701171875, 0.346221923828125, 0.4135894775390625, 0.48095703125, 0.5483245849609375, 0.615692138671875, 0.6830596923828125, 0.75042724609375, 0.8177947998046875, 0.885162353515625, 0.9525299072265625, 1.0198974609375, 1.0872650146484375, 1.154632568359375, 1.2220001220703125, 1.28936767578125, 1.3567352294921875, 1.424102783203125, 1.4914703369140625, 1.558837890625, 1.6262054443359375, 1.693572998046875, 1.7609405517578125, 1.82830810546875, 1.8956756591796875, 1.963043212890625, 2.0304107666015625, 2.0977783203125, 2.1651458740234375, 2.232513427734375, 2.2998809814453125, 2.36724853515625, 2.4346160888671875, 2.501983642578125, 2.5693511962890625, 2.63671875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 8.0, 3.0, 1.0, 13.0, 14.0, 11.0, 10.0, 22.0, 19.0, 41.0, 50.0, 62.0, 147.0, 229.0, 479.0, 1227.0, 3539.0, 13596.0, 80456.0, 972912.0, 2861363.0, 221359.0, 29026.0, 6315.0, 1911.0, 731.0, 311.0, 148.0, 101.0, 49.0, 43.0, 27.0, 24.0, 9.0, 7.0, 13.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.28515625, -5.1351318359375, -4.985107421875, -4.8350830078125, -4.68505859375, -4.5350341796875, -4.385009765625, -4.2349853515625, -4.0849609375, -3.9349365234375, -3.784912109375, -3.6348876953125, -3.48486328125, -3.3348388671875, -3.184814453125, -3.0347900390625, -2.884765625, -2.7347412109375, -2.584716796875, -2.4346923828125, -2.28466796875, -2.1346435546875, -1.984619140625, -1.8345947265625, -1.6845703125, -1.5345458984375, -1.384521484375, -1.2344970703125, -1.08447265625, -0.9344482421875, -0.784423828125, -0.6343994140625, -0.484375, -0.3343505859375, -0.184326171875, -0.0343017578125, 0.11572265625, 0.2657470703125, 0.415771484375, 0.5657958984375, 0.7158203125, 0.8658447265625, 1.015869140625, 1.1658935546875, 1.31591796875, 1.4659423828125, 1.615966796875, 1.7659912109375, 1.916015625, 2.0660400390625, 2.216064453125, 2.3660888671875, 2.51611328125, 2.6661376953125, 2.816162109375, 2.9661865234375, 3.1162109375, 3.2662353515625, 3.416259765625, 3.5662841796875, 3.71630859375, 3.8663330078125, 4.016357421875, 4.1663818359375, 4.31640625]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 3.0, 12.0, 29.0, 65.0, 141.0, 173.0, 213.0, 178.0, 106.0, 44.0, 26.0, 14.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.5664119720459, -26.829805374145508, -26.093198776245117, -25.356592178344727, -24.619985580444336, -23.883378982543945, -23.146770477294922, -22.41016387939453, -21.67355728149414, -20.93695068359375, -20.20034408569336, -19.46373748779297, -18.727130889892578, -17.990524291992188, -17.253917694091797, -16.517311096191406, -15.780704498291016, -15.044097900390625, -14.307491302490234, -13.570884704589844, -12.834278106689453, -12.097671508789062, -11.361063957214355, -10.624457359313965, -9.887850761413574, -9.151244163513184, -8.414637565612793, -7.678030490875244, -6.9414238929748535, -6.204817295074463, -5.468210220336914, -4.731603622436523, -3.994997024536133, -3.258390426635742, -2.5217835903167725, -1.7851767539978027, -1.048570156097412, -0.3119635581970215, 0.42464351654052734, 1.161250114440918, 1.8978567123413086, 2.634463310241699, 3.371070146560669, 4.107676982879639, 4.844283580780029, 5.58089017868042, 6.317497253417969, 7.054103851318359, 7.79071044921875, 8.52731704711914, 9.263923645019531, 10.000530242919922, 10.737136840820312, 11.473743438720703, 12.21035099029541, 12.9469575881958, 13.683564186096191, 14.420170783996582, 15.156777381896973, 15.89338493347168, 16.62999153137207, 17.36659812927246, 18.10320472717285, 18.839811325073242, 19.576417922973633]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 5.0, 9.0, 6.0, 8.0, 9.0, 9.0, 3.0, 15.0, 19.0, 29.0, 20.0, 24.0, 33.0, 27.0, 37.0, 37.0, 49.0, 44.0, 45.0, 47.0, 48.0, 36.0, 36.0, 39.0, 34.0, 27.0, 49.0, 31.0, 28.0, 34.0, 35.0, 21.0, 22.0, 14.0, 14.0, 9.0, 16.0, 7.0, 6.0, 5.0, 10.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.294687271118164, -5.095819473266602, -4.896952152252197, -4.698084354400635, -4.4992170333862305, -4.300349235534668, -4.101481914520264, -3.902614116668701, -3.703746795654297, -3.5048792362213135, -3.30601167678833, -3.1071441173553467, -2.9082765579223633, -2.70940899848938, -2.5105414390563965, -2.311673641204834, -2.1128060817718506, -1.9139385223388672, -1.7150709629058838, -1.5162034034729004, -1.317335844039917, -1.1184682846069336, -0.9196006059646606, -0.7207330465316772, -0.5218654870986938, -0.32299792766571045, -0.12413033843040466, 0.07473725080490112, 0.2736048102378845, 0.4724723696708679, 0.6713399887084961, 0.8702075481414795, 1.069075107574463, 1.2679426670074463, 1.4668102264404297, 1.665677785873413, 1.8645453453063965, 2.06341290473938, 2.2622804641723633, 2.461148262023926, 2.66001558303833, 2.8588831424713135, 3.057750701904297, 3.2566182613372803, 3.4554858207702637, 3.654353380203247, 3.8532209396362305, 4.052088737487793, 4.2509565353393555, 4.449824333190918, 4.648691654205322, 4.847559452056885, 5.046426773071289, 5.245294570922852, 5.444161891937256, 5.643029689788818, 5.841897010803223, 6.040764808654785, 6.2396321296691895, 6.438499927520752, 6.637367248535156, 6.836235046386719, 7.035102367401123, 7.2339701652526855, 7.43283748626709]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 3.0, 3.0, 5.0, 6.0, 9.0, 9.0, 15.0, 12.0, 19.0, 28.0, 27.0, 23.0, 31.0, 32.0, 29.0, 29.0, 47.0, 31.0, 30.0, 37.0, 40.0, 38.0, 35.0, 38.0, 37.0, 33.0, 39.0, 36.0, 42.0, 31.0, 32.0, 15.0, 23.0, 23.0, 28.0, 19.0, 11.0, 12.0, 5.0, 10.0, 4.0, 5.0, 4.0, 5.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.8701171875, -0.8435592651367188, -0.8170013427734375, -0.7904434204101562, -0.763885498046875, -0.7373275756835938, -0.7107696533203125, -0.6842117309570312, -0.65765380859375, -0.6310958862304688, -0.6045379638671875, -0.5779800415039062, -0.551422119140625, -0.5248641967773438, -0.4983062744140625, -0.47174835205078125, -0.4451904296875, -0.41863250732421875, -0.3920745849609375, -0.36551666259765625, -0.338958740234375, -0.31240081787109375, -0.2858428955078125, -0.25928497314453125, -0.23272705078125, -0.20616912841796875, -0.1796112060546875, -0.15305328369140625, -0.126495361328125, -0.09993743896484375, -0.0733795166015625, -0.04682159423828125, -0.020263671875, 0.00629425048828125, 0.0328521728515625, 0.05941009521484375, 0.085968017578125, 0.11252593994140625, 0.1390838623046875, 0.16564178466796875, 0.19219970703125, 0.21875762939453125, 0.2453155517578125, 0.27187347412109375, 0.298431396484375, 0.32498931884765625, 0.3515472412109375, 0.37810516357421875, 0.4046630859375, 0.43122100830078125, 0.4577789306640625, 0.48433685302734375, 0.510894775390625, 0.5374526977539062, 0.5640106201171875, 0.5905685424804688, 0.61712646484375, 0.6436843872070312, 0.6702423095703125, 0.6968002319335938, 0.723358154296875, 0.7499160766601562, 0.7764739990234375, 0.8030319213867188, 0.82958984375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 7.0, 0.0, 1.0, 5.0, 6.0, 7.0, 13.0, 24.0, 30.0, 37.0, 71.0, 86.0, 116.0, 153.0, 283.0, 365.0, 511.0, 856.0, 1177.0, 1736.0, 2598.0, 4061.0, 6313.0, 10471.0, 18725.0, 48648.0, 212681.0, 513245.0, 146816.0, 37518.0, 16150.0, 9070.0, 5614.0, 3762.0, 2413.0, 1555.0, 1070.0, 762.0, 509.0, 362.0, 254.0, 146.0, 107.0, 73.0, 52.0, 22.0, 23.0, 17.0, 13.0, 7.0, 8.0, 5.0, 7.0, 2.0, 3.0, 6.0], "bins": [-0.83935546875, -0.8156356811523438, -0.7919158935546875, -0.7681961059570312, -0.744476318359375, -0.7207565307617188, -0.6970367431640625, -0.6733169555664062, -0.64959716796875, -0.6258773803710938, -0.6021575927734375, -0.5784378051757812, -0.554718017578125, -0.5309982299804688, -0.5072784423828125, -0.48355865478515625, -0.4598388671875, -0.43611907958984375, -0.4123992919921875, -0.38867950439453125, -0.364959716796875, -0.34123992919921875, -0.3175201416015625, -0.29380035400390625, -0.27008056640625, -0.24636077880859375, -0.2226409912109375, -0.19892120361328125, -0.175201416015625, -0.15148162841796875, -0.1277618408203125, -0.10404205322265625, -0.080322265625, -0.05660247802734375, -0.0328826904296875, -0.00916290283203125, 0.014556884765625, 0.03827667236328125, 0.0619964599609375, 0.08571624755859375, 0.10943603515625, 0.13315582275390625, 0.1568756103515625, 0.18059539794921875, 0.204315185546875, 0.22803497314453125, 0.2517547607421875, 0.27547454833984375, 0.2991943359375, 0.32291412353515625, 0.3466339111328125, 0.37035369873046875, 0.394073486328125, 0.41779327392578125, 0.4415130615234375, 0.46523284912109375, 0.48895263671875, 0.5126724243164062, 0.5363922119140625, 0.5601119995117188, 0.583831787109375, 0.6075515747070312, 0.6312713623046875, 0.6549911499023438, 0.6787109375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 10.0, 7.0, 14.0, 15.0, 18.0, 11.0, 21.0, 27.0, 32.0, 28.0, 23.0, 31.0, 34.0, 26.0, 44.0, 43.0, 47.0, 41.0, 1056.0, 46.0, 46.0, 36.0, 38.0, 46.0, 47.0, 32.0, 27.0, 19.0, 16.0, 19.0, 21.0, 21.0, 12.0, 7.0, 10.0, 9.0, 9.0, 7.0, 7.0, 6.0, 0.0, 5.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57275390625, -0.5518264770507812, -0.5308990478515625, -0.5099716186523438, -0.489044189453125, -0.46811676025390625, -0.4471893310546875, -0.42626190185546875, -0.40533447265625, -0.38440704345703125, -0.3634796142578125, -0.34255218505859375, -0.321624755859375, -0.30069732666015625, -0.2797698974609375, -0.25884246826171875, -0.2379150390625, -0.21698760986328125, -0.1960601806640625, -0.17513275146484375, -0.154205322265625, -0.13327789306640625, -0.1123504638671875, -0.09142303466796875, -0.07049560546875, -0.04956817626953125, -0.0286407470703125, -0.00771331787109375, 0.013214111328125, 0.03414154052734375, 0.0550689697265625, 0.07599639892578125, 0.096923828125, 0.11785125732421875, 0.1387786865234375, 0.15970611572265625, 0.180633544921875, 0.20156097412109375, 0.2224884033203125, 0.24341583251953125, 0.26434326171875, 0.28527069091796875, 0.3061981201171875, 0.32712554931640625, 0.348052978515625, 0.36898040771484375, 0.3899078369140625, 0.41083526611328125, 0.4317626953125, 0.45269012451171875, 0.4736175537109375, 0.49454498291015625, 0.515472412109375, 0.5363998413085938, 0.5573272705078125, 0.5782546997070312, 0.59918212890625, 0.6201095581054688, 0.6410369873046875, 0.6619644165039062, 0.682891845703125, 0.7038192749023438, 0.7247467041015625, 0.7456741333007812, 0.7666015625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 5.0, 8.0, 4.0, 8.0, 21.0, 24.0, 31.0, 47.0, 66.0, 82.0, 112.0, 161.0, 260.0, 386.0, 628.0, 939.0, 1545.0, 2431.0, 4477.0, 8662.0, 20409.0, 68723.0, 559775.0, 1276902.0, 102054.0, 26219.0, 10481.0, 5073.0, 2876.0, 1608.0, 1026.0, 667.0, 450.0, 308.0, 186.0, 128.0, 84.0, 73.0, 56.0, 36.0, 27.0, 21.0, 20.0, 10.0, 5.0, 9.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.485595703125, -0.4689216613769531, -0.45224761962890625, -0.4355735778808594, -0.4188995361328125, -0.4022254943847656, -0.38555145263671875, -0.3688774108886719, -0.352203369140625, -0.3355293273925781, -0.31885528564453125, -0.3021812438964844, -0.2855072021484375, -0.2688331604003906, -0.25215911865234375, -0.23548507690429688, -0.21881103515625, -0.20213699340820312, -0.18546295166015625, -0.16878890991210938, -0.1521148681640625, -0.13544082641601562, -0.11876678466796875, -0.10209274291992188, -0.085418701171875, -0.06874465942382812, -0.05207061767578125, -0.035396575927734375, -0.0187225341796875, -0.002048492431640625, 0.01462554931640625, 0.031299591064453125, 0.0479736328125, 0.06464767456054688, 0.08132171630859375, 0.09799575805664062, 0.1146697998046875, 0.13134384155273438, 0.14801788330078125, 0.16469192504882812, 0.181365966796875, 0.19804000854492188, 0.21471405029296875, 0.23138809204101562, 0.2480621337890625, 0.2647361755371094, 0.28141021728515625, 0.2980842590332031, 0.31475830078125, 0.3314323425292969, 0.34810638427734375, 0.3647804260253906, 0.3814544677734375, 0.3981285095214844, 0.41480255126953125, 0.4314765930175781, 0.448150634765625, 0.4648246765136719, 0.48149871826171875, 0.4981727600097656, 0.5148468017578125, 0.5315208435058594, 0.5481948852539062, 0.5648689270019531, 0.58154296875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 10.0, 4.0, 6.0, 4.0, 6.0, 3.0, 9.0, 10.0, 7.0, 15.0, 25.0, 46.0, 65.0, 107.0, 197.0, 206.0, 86.0, 36.0, 29.0, 22.0, 20.0, 15.0, 7.0, 12.0, 8.0, 8.0, 4.0, 3.0, 5.0, 3.0, 7.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1282958984375, -0.1245107650756836, -0.12072563171386719, -0.11694049835205078, -0.11315536499023438, -0.10937023162841797, -0.10558509826660156, -0.10179996490478516, -0.09801483154296875, -0.09422969818115234, -0.09044456481933594, -0.08665943145751953, -0.08287429809570312, -0.07908916473388672, -0.07530403137207031, -0.0715188980102539, -0.0677337646484375, -0.0639486312866211, -0.06016349792480469, -0.05637836456298828, -0.052593231201171875, -0.04880809783935547, -0.04502296447753906, -0.041237831115722656, -0.03745269775390625, -0.033667564392089844, -0.029882431030273438, -0.02609729766845703, -0.022312164306640625, -0.01852703094482422, -0.014741897583007812, -0.010956764221191406, -0.007171630859375, -0.0033864974975585938, 0.0003986358642578125, 0.004183769226074219, 0.007968902587890625, 0.011754035949707031, 0.015539169311523438, 0.019324302673339844, 0.02310943603515625, 0.026894569396972656, 0.030679702758789062, 0.03446483612060547, 0.038249969482421875, 0.04203510284423828, 0.04582023620605469, 0.049605369567871094, 0.0533905029296875, 0.057175636291503906, 0.06096076965332031, 0.06474590301513672, 0.06853103637695312, 0.07231616973876953, 0.07610130310058594, 0.07988643646240234, 0.08367156982421875, 0.08745670318603516, 0.09124183654785156, 0.09502696990966797, 0.09881210327148438, 0.10259723663330078, 0.10638236999511719, 0.1101675033569336, 0.11395263671875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 3.0, 7.0, 3.0, 11.0, 8.0, 14.0, 16.0, 17.0, 31.0, 32.0, 62.0, 71.0, 191.0, 490.0, 1744.0, 7829.0, 86129.0, 926911.0, 19982.0, 3425.0, 910.0, 312.0, 143.0, 57.0, 41.0, 20.0, 17.0, 13.0, 14.0, 10.0, 10.0, 6.0, 5.0, 2.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.5283203125, -1.479400634765625, -1.43048095703125, -1.381561279296875, -1.3326416015625, -1.283721923828125, -1.23480224609375, -1.185882568359375, -1.136962890625, -1.088043212890625, -1.03912353515625, -0.990203857421875, -0.9412841796875, -0.892364501953125, -0.84344482421875, -0.794525146484375, -0.74560546875, -0.696685791015625, -0.64776611328125, -0.598846435546875, -0.5499267578125, -0.501007080078125, -0.45208740234375, -0.403167724609375, -0.354248046875, -0.305328369140625, -0.25640869140625, -0.207489013671875, -0.1585693359375, -0.109649658203125, -0.06072998046875, -0.011810302734375, 0.037109375, 0.086029052734375, 0.13494873046875, 0.183868408203125, 0.2327880859375, 0.281707763671875, 0.33062744140625, 0.379547119140625, 0.428466796875, 0.477386474609375, 0.52630615234375, 0.575225830078125, 0.6241455078125, 0.673065185546875, 0.72198486328125, 0.770904541015625, 0.81982421875, 0.868743896484375, 0.91766357421875, 0.966583251953125, 1.0155029296875, 1.064422607421875, 1.11334228515625, 1.162261962890625, 1.211181640625, 1.260101318359375, 1.30902099609375, 1.357940673828125, 1.4068603515625, 1.455780029296875, 1.50469970703125, 1.553619384765625, 1.6025390625]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 11.0, 19.0, 35.0, 64.0, 168.0, 232.0, 258.0, 126.0, 54.0, 23.0, 8.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7675529718399048, -0.7524091005325317, -0.7372652292251587, -0.7221213579177856, -0.7069775462150574, -0.6918336749076843, -0.6766898036003113, -0.6615459322929382, -0.6464020609855652, -0.6312581896781921, -0.6161143183708191, -0.600970447063446, -0.5858266353607178, -0.5706827640533447, -0.5555388927459717, -0.5403950214385986, -0.5252511501312256, -0.5101072788238525, -0.4949634373188019, -0.47981956601142883, -0.4646756947040558, -0.4495318531990051, -0.4343879818916321, -0.41924411058425903, -0.4041002690792084, -0.3889563977718353, -0.37381255626678467, -0.3586686849594116, -0.3435248136520386, -0.3283809423446655, -0.31323710083961487, -0.2980932295322418, -0.2829493284225464, -0.26780545711517334, -0.2526616156101227, -0.23751774430274963, -0.2223738729953766, -0.20723001658916473, -0.19208616018295288, -0.17694228887557983, -0.16179844737052917, -0.14665459096431732, -0.13151071965694427, -0.11636686325073242, -0.10122299194335938, -0.08607913553714752, -0.07093527168035507, -0.05579140782356262, -0.040647536516189575, -0.025503672659397125, -0.010359810665249825, 0.004784051328897476, 0.019927915185689926, 0.03507177531719208, 0.05021563917398453, 0.06535950303077698, 0.08050336688756943, 0.09564723074436188, 0.11079109460115433, 0.12593495845794678, 0.14107881486415863, 0.15622267127037048, 0.17136654257774353, 0.18651041388511658, 0.20165427029132843]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 9.0, 11.0, 11.0, 11.0, 18.0, 12.0, 23.0, 21.0, 33.0, 30.0, 28.0, 32.0, 40.0, 40.0, 48.0, 40.0, 45.0, 47.0, 49.0, 39.0, 51.0, 49.0, 40.0, 29.0, 39.0, 26.0, 26.0, 24.0, 22.0, 30.0, 16.0, 11.0, 14.0, 5.0, 7.0, 5.0, 2.0, 3.0, 4.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.1331791877746582, -0.12952204048633575, -0.1258648931980133, -0.12220773100852966, -0.11855058372020721, -0.11489343643188477, -0.11123628169298172, -0.10757912695407867, -0.10392197966575623, -0.10026483237743378, -0.09660767763853073, -0.09295052289962769, -0.08929337561130524, -0.08563622832298279, -0.08197907358407974, -0.0783219188451767, -0.07466477155685425, -0.0710076242685318, -0.06735046952962875, -0.06369331479072571, -0.06003616750240326, -0.05637901648879051, -0.052721865475177765, -0.04906471446156502, -0.04540756344795227, -0.04175041243433952, -0.038093261420726776, -0.03443611040711403, -0.030778959393501282, -0.027121808379888535, -0.023464657366275787, -0.01980750635266304, -0.016150355339050293, -0.012493204325437546, -0.008836053311824799, -0.005178902298212051, -0.0015217512845993042, 0.002135399729013443, 0.00579255074262619, 0.009449701756238937, 0.013106852769851685, 0.016764003783464432, 0.02042115479707718, 0.024078305810689926, 0.027735456824302673, 0.03139260783791542, 0.03504975885152817, 0.038706909865140915, 0.04236406087875366, 0.04602121189236641, 0.049678362905979156, 0.053335513919591904, 0.05699266493320465, 0.0606498159468174, 0.06430696696043015, 0.06796412169933319, 0.07162126898765564, 0.07527841627597809, 0.07893557101488113, 0.08259272575378418, 0.08624987304210663, 0.08990702033042908, 0.09356417506933212, 0.09722132980823517, 0.10087847709655762]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 1.0, 4.0, 5.0, 5.0, 11.0, 6.0, 16.0, 12.0, 19.0, 29.0, 20.0, 28.0, 32.0, 31.0, 30.0, 25.0, 45.0, 30.0, 39.0, 40.0, 36.0, 39.0, 37.0, 33.0, 37.0, 35.0, 40.0, 34.0, 43.0, 33.0, 28.0, 19.0, 21.0, 23.0, 29.0, 18.0, 13.0, 10.0, 7.0, 9.0, 4.0, 4.0, 7.0, 3.0, 2.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.876953125, -0.8502349853515625, -0.823516845703125, -0.7967987060546875, -0.77008056640625, -0.7433624267578125, -0.716644287109375, -0.6899261474609375, -0.6632080078125, -0.6364898681640625, -0.609771728515625, -0.5830535888671875, -0.55633544921875, -0.5296173095703125, -0.502899169921875, -0.4761810302734375, -0.449462890625, -0.4227447509765625, -0.396026611328125, -0.3693084716796875, -0.34259033203125, -0.3158721923828125, -0.289154052734375, -0.2624359130859375, -0.2357177734375, -0.2089996337890625, -0.182281494140625, -0.1555633544921875, -0.12884521484375, -0.1021270751953125, -0.075408935546875, -0.0486907958984375, -0.02197265625, 0.0047454833984375, 0.031463623046875, 0.0581817626953125, 0.08489990234375, 0.1116180419921875, 0.138336181640625, 0.1650543212890625, 0.1917724609375, 0.2184906005859375, 0.245208740234375, 0.2719268798828125, 0.29864501953125, 0.3253631591796875, 0.352081298828125, 0.3787994384765625, 0.405517578125, 0.4322357177734375, 0.458953857421875, 0.4856719970703125, 0.51239013671875, 0.5391082763671875, 0.565826416015625, 0.5925445556640625, 0.6192626953125, 0.6459808349609375, 0.672698974609375, 0.6994171142578125, 0.72613525390625, 0.7528533935546875, 0.779571533203125, 0.8062896728515625, 0.8330078125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 8.0, 11.0, 18.0, 27.0, 39.0, 61.0, 103.0, 172.0, 283.0, 514.0, 787.0, 1345.0, 2344.0, 4066.0, 7990.0, 15617.0, 34269.0, 83771.0, 225836.0, 382524.0, 169298.0, 64287.0, 27347.0, 12805.0, 6669.0, 3554.0, 1973.0, 1167.0, 640.0, 416.0, 230.0, 135.0, 97.0, 74.0, 34.0, 32.0, 9.0, 8.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.197265625, -1.15350341796875, -1.1097412109375, -1.06597900390625, -1.022216796875, -0.97845458984375, -0.9346923828125, -0.89093017578125, -0.84716796875, -0.80340576171875, -0.7596435546875, -0.71588134765625, -0.672119140625, -0.62835693359375, -0.5845947265625, -0.54083251953125, -0.4970703125, -0.45330810546875, -0.4095458984375, -0.36578369140625, -0.322021484375, -0.27825927734375, -0.2344970703125, -0.19073486328125, -0.14697265625, -0.10321044921875, -0.0594482421875, -0.01568603515625, 0.028076171875, 0.07183837890625, 0.1156005859375, 0.15936279296875, 0.203125, 0.24688720703125, 0.2906494140625, 0.33441162109375, 0.378173828125, 0.42193603515625, 0.4656982421875, 0.50946044921875, 0.55322265625, 0.59698486328125, 0.6407470703125, 0.68450927734375, 0.728271484375, 0.77203369140625, 0.8157958984375, 0.85955810546875, 0.9033203125, 0.94708251953125, 0.9908447265625, 1.03460693359375, 1.078369140625, 1.12213134765625, 1.1658935546875, 1.20965576171875, 1.25341796875, 1.29718017578125, 1.3409423828125, 1.38470458984375, 1.428466796875, 1.47222900390625, 1.5159912109375, 1.55975341796875, 1.603515625]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 3.0, 2.0, 3.0, 5.0, 9.0, 20.0, 9.0, 21.0, 23.0, 27.0, 22.0, 28.0, 41.0, 63.0, 68.0, 84.0, 119.0, 223.0, 1439.0, 262.0, 155.0, 78.0, 77.0, 56.0, 40.0, 36.0, 35.0, 26.0, 22.0, 14.0, 14.0, 5.0, 6.0, 9.0, 6.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.669921875, -3.56072998046875, -3.4515380859375, -3.34234619140625, -3.233154296875, -3.12396240234375, -3.0147705078125, -2.90557861328125, -2.79638671875, -2.68719482421875, -2.5780029296875, -2.46881103515625, -2.359619140625, -2.25042724609375, -2.1412353515625, -2.03204345703125, -1.9228515625, -1.81365966796875, -1.7044677734375, -1.59527587890625, -1.486083984375, -1.37689208984375, -1.2677001953125, -1.15850830078125, -1.04931640625, -0.94012451171875, -0.8309326171875, -0.72174072265625, -0.612548828125, -0.50335693359375, -0.3941650390625, -0.28497314453125, -0.17578125, -0.06658935546875, 0.0426025390625, 0.15179443359375, 0.260986328125, 0.37017822265625, 0.4793701171875, 0.58856201171875, 0.69775390625, 0.80694580078125, 0.9161376953125, 1.02532958984375, 1.134521484375, 1.24371337890625, 1.3529052734375, 1.46209716796875, 1.5712890625, 1.68048095703125, 1.7896728515625, 1.89886474609375, 2.008056640625, 2.11724853515625, 2.2264404296875, 2.33563232421875, 2.44482421875, 2.55401611328125, 2.6632080078125, 2.77239990234375, 2.881591796875, 2.99078369140625, 3.0999755859375, 3.20916748046875, 3.318359375]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 7.0, 13.0, 8.0, 16.0, 25.0, 37.0, 53.0, 78.0, 115.0, 206.0, 358.0, 746.0, 5051.0, 220749.0, 2888064.0, 27183.0, 1792.0, 473.0, 240.0, 155.0, 124.0, 58.0, 57.0, 28.0, 17.0, 12.0, 13.0, 9.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.25, -7.9681396484375, -7.686279296875, -7.4044189453125, -7.12255859375, -6.8406982421875, -6.558837890625, -6.2769775390625, -5.9951171875, -5.7132568359375, -5.431396484375, -5.1495361328125, -4.86767578125, -4.5858154296875, -4.303955078125, -4.0220947265625, -3.740234375, -3.4583740234375, -3.176513671875, -2.8946533203125, -2.61279296875, -2.3309326171875, -2.049072265625, -1.7672119140625, -1.4853515625, -1.2034912109375, -0.921630859375, -0.6397705078125, -0.35791015625, -0.0760498046875, 0.205810546875, 0.4876708984375, 0.76953125, 1.0513916015625, 1.333251953125, 1.6151123046875, 1.89697265625, 2.1788330078125, 2.460693359375, 2.7425537109375, 3.0244140625, 3.3062744140625, 3.588134765625, 3.8699951171875, 4.15185546875, 4.4337158203125, 4.715576171875, 4.9974365234375, 5.279296875, 5.5611572265625, 5.843017578125, 6.1248779296875, 6.40673828125, 6.6885986328125, 6.970458984375, 7.2523193359375, 7.5341796875, 7.8160400390625, 8.097900390625, 8.3797607421875, 8.66162109375, 8.9434814453125, 9.225341796875, 9.5072021484375, 9.7890625]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [564.0, 452.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9485621452331543, 0.06333446502685547, 3.0752310752868652, 6.087128162384033, 9.099023818969727, 12.110919952392578, 15.122817993164062, 18.134714126586914, 21.146610260009766, 24.158506393432617, 27.17040252685547, 30.182300567626953, 33.19419860839844, 36.206092834472656, 39.21799087524414, 42.229888916015625, 45.241783142089844, 48.25368118286133, 51.26557540893555, 54.27747344970703, 57.28936767578125, 60.301265716552734, 63.31316375732422, 66.32505798339844, 69.33695983886719, 72.3488540649414, 75.36075592041016, 78.37265014648438, 81.3845443725586, 84.39643859863281, 87.40834045410156, 90.42023468017578, 93.43212890625, 96.44402313232422, 99.45592498779297, 102.46781921386719, 105.4797134399414, 108.49160766601562, 111.50350952148438, 114.5154037475586, 117.52729797363281, 120.53919219970703, 123.55109405517578, 126.56298828125, 129.57489013671875, 132.58677673339844, 135.5986785888672, 138.61058044433594, 141.62246704101562, 144.63436889648438, 147.64625549316406, 150.6581573486328, 153.67005920410156, 156.68194580078125, 159.69384765625, 162.70574951171875, 165.7176513671875, 168.72955322265625, 171.74143981933594, 174.7533416748047, 177.76524353027344, 180.77713012695312, 183.78903198242188, 186.80093383789062, 189.8128204345703]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 9.0, 5.0, 1.0, 2.0, 3.0, 9.0, 8.0, 10.0, 11.0, 16.0, 13.0, 22.0, 22.0, 27.0, 30.0, 30.0, 38.0, 33.0, 36.0, 46.0, 50.0, 40.0, 43.0, 43.0, 38.0, 35.0, 49.0, 33.0, 33.0, 36.0, 30.0, 26.0, 24.0, 25.0, 26.0, 19.0, 23.0, 13.0, 14.0, 8.0, 6.0, 7.0, 9.0, 2.0, 6.0, 4.0, 1.0, 1.0, 3.0, 1.0], "bins": [-8.967571258544922, -8.729320526123047, -8.491068840026855, -8.25281810760498, -8.014566421508789, -7.776315689086914, -7.538064479827881, -7.299813270568848, -7.0615620613098145, -6.823310852050781, -6.585059642791748, -6.346808433532715, -6.10855770111084, -5.870306015014648, -5.632055282592773, -5.39380407333374, -5.155552864074707, -4.917301654815674, -4.679050445556641, -4.440799236297607, -4.202548027038574, -3.96429705619812, -3.726046085357666, -3.487794876098633, -3.2495436668395996, -3.0112924575805664, -2.773041248321533, -2.534790277481079, -2.296539068222046, -2.0582878589630127, -1.820036768913269, -1.5817856788635254, -1.3435344696044922, -1.105283260345459, -0.8670321702957153, -0.6287810206413269, -0.3905298709869385, -0.15227866172790527, 0.08597242832183838, 0.32422351837158203, 0.5624747276306152, 0.8007258772850037, 1.038977026939392, 1.2772281169891357, 1.515479326248169, 1.7537305355072021, 1.9919816255569458, 2.2302327156066895, 2.4684839248657227, 2.706735134124756, 2.944986343383789, 3.183237314224243, 3.4214885234832764, 3.6597397327423096, 3.8979907035827637, 4.136241912841797, 4.37449312210083, 4.612744331359863, 4.8509955406188965, 5.08924674987793, 5.327497482299805, 5.565749168395996, 5.803999900817871, 6.042251110076904, 6.2805023193359375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 8.0, 8.0, 7.0, 11.0, 9.0, 8.0, 20.0, 24.0, 25.0, 32.0, 24.0, 23.0, 33.0, 34.0, 30.0, 36.0, 35.0, 48.0, 25.0, 41.0, 31.0, 42.0, 37.0, 31.0, 39.0, 47.0, 26.0, 26.0, 31.0, 31.0, 30.0, 23.0, 22.0, 20.0, 13.0, 7.0, 17.0, 6.0, 10.0, 2.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.892578125, -0.8648300170898438, -0.8370819091796875, -0.8093338012695312, -0.781585693359375, -0.7538375854492188, -0.7260894775390625, -0.6983413696289062, -0.67059326171875, -0.6428451538085938, -0.6150970458984375, -0.5873489379882812, -0.559600830078125, -0.5318527221679688, -0.5041046142578125, -0.47635650634765625, -0.4486083984375, -0.42086029052734375, -0.3931121826171875, -0.36536407470703125, -0.337615966796875, -0.30986785888671875, -0.2821197509765625, -0.25437164306640625, -0.22662353515625, -0.19887542724609375, -0.1711273193359375, -0.14337921142578125, -0.115631103515625, -0.08788299560546875, -0.0601348876953125, -0.03238677978515625, -0.004638671875, 0.02310943603515625, 0.0508575439453125, 0.07860565185546875, 0.106353759765625, 0.13410186767578125, 0.1618499755859375, 0.18959808349609375, 0.21734619140625, 0.24509429931640625, 0.2728424072265625, 0.30059051513671875, 0.328338623046875, 0.35608673095703125, 0.3838348388671875, 0.41158294677734375, 0.4393310546875, 0.46707916259765625, 0.4948272705078125, 0.5225753784179688, 0.550323486328125, 0.5780715942382812, 0.6058197021484375, 0.6335678100585938, 0.66131591796875, 0.6890640258789062, 0.7168121337890625, 0.7445602416992188, 0.772308349609375, 0.8000564575195312, 0.8278045654296875, 0.8555526733398438, 0.88330078125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 9.0, 7.0, 7.0, 15.0, 23.0, 41.0, 52.0, 98.0, 119.0, 148.0, 252.0, 373.0, 563.0, 837.0, 1340.0, 2186.0, 3766.0, 6603.0, 12539.0, 25926.0, 60161.0, 168672.0, 631324.0, 1775443.0, 1068449.0, 277267.0, 87935.0, 35009.0, 15907.0, 8040.0, 4397.0, 2514.0, 1457.0, 927.0, 595.0, 404.0, 283.0, 194.0, 122.0, 99.0, 50.0, 52.0, 32.0, 19.0, 10.0, 16.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.453125, -1.4041900634765625, -1.355255126953125, -1.3063201904296875, -1.25738525390625, -1.2084503173828125, -1.159515380859375, -1.1105804443359375, -1.0616455078125, -1.0127105712890625, -0.963775634765625, -0.9148406982421875, -0.86590576171875, -0.8169708251953125, -0.768035888671875, -0.7191009521484375, -0.670166015625, -0.6212310791015625, -0.572296142578125, -0.5233612060546875, -0.47442626953125, -0.4254913330078125, -0.376556396484375, -0.3276214599609375, -0.2786865234375, -0.2297515869140625, -0.180816650390625, -0.1318817138671875, -0.08294677734375, -0.0340118408203125, 0.014923095703125, 0.0638580322265625, 0.11279296875, 0.1617279052734375, 0.210662841796875, 0.2595977783203125, 0.30853271484375, 0.3574676513671875, 0.406402587890625, 0.4553375244140625, 0.5042724609375, 0.5532073974609375, 0.602142333984375, 0.6510772705078125, 0.70001220703125, 0.7489471435546875, 0.797882080078125, 0.8468170166015625, 0.895751953125, 0.9446868896484375, 0.993621826171875, 1.0425567626953125, 1.09149169921875, 1.1404266357421875, 1.189361572265625, 1.2382965087890625, 1.2872314453125, 1.3361663818359375, 1.385101318359375, 1.4340362548828125, 1.48297119140625, 1.5319061279296875, 1.580841064453125, 1.6297760009765625, 1.6787109375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 6.0, 4.0, 12.0, 8.0, 12.0, 15.0, 18.0, 23.0, 30.0, 27.0, 47.0, 50.0, 69.0, 90.0, 102.0, 160.0, 206.0, 233.0, 302.0, 403.0, 379.0, 379.0, 319.0, 239.0, 192.0, 137.0, 131.0, 95.0, 62.0, 63.0, 47.0, 44.0, 34.0, 36.0, 22.0, 13.0, 15.0, 10.0, 5.0, 6.0, 11.0, 5.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.4326171875, -1.3839569091796875, -1.335296630859375, -1.2866363525390625, -1.23797607421875, -1.1893157958984375, -1.140655517578125, -1.0919952392578125, -1.0433349609375, -0.9946746826171875, -0.946014404296875, -0.8973541259765625, -0.84869384765625, -0.8000335693359375, -0.751373291015625, -0.7027130126953125, -0.654052734375, -0.6053924560546875, -0.556732177734375, -0.5080718994140625, -0.45941162109375, -0.4107513427734375, -0.362091064453125, -0.3134307861328125, -0.2647705078125, -0.2161102294921875, -0.167449951171875, -0.1187896728515625, -0.07012939453125, -0.0214691162109375, 0.027191162109375, 0.0758514404296875, 0.12451171875, 0.1731719970703125, 0.221832275390625, 0.2704925537109375, 0.31915283203125, 0.3678131103515625, 0.416473388671875, 0.4651336669921875, 0.5137939453125, 0.5624542236328125, 0.611114501953125, 0.6597747802734375, 0.70843505859375, 0.7570953369140625, 0.805755615234375, 0.8544158935546875, 0.903076171875, 0.9517364501953125, 1.000396728515625, 1.0490570068359375, 1.09771728515625, 1.1463775634765625, 1.195037841796875, 1.2436981201171875, 1.2923583984375, 1.3410186767578125, 1.389678955078125, 1.4383392333984375, 1.48699951171875, 1.5356597900390625, 1.584320068359375, 1.6329803466796875, 1.681640625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 1.0, 4.0, 5.0, 4.0, 8.0, 11.0, 20.0, 29.0, 39.0, 44.0, 60.0, 78.0, 116.0, 164.0, 326.0, 645.0, 1512.0, 4101.0, 14433.0, 67561.0, 508535.0, 2941727.0, 559406.0, 72520.0, 15389.0, 4420.0, 1549.0, 642.0, 350.0, 199.0, 124.0, 65.0, 49.0, 36.0, 22.0, 24.0, 11.0, 18.0, 10.0, 7.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.58203125, -4.453033447265625, -4.32403564453125, -4.195037841796875, -4.0660400390625, -3.937042236328125, -3.80804443359375, -3.679046630859375, -3.550048828125, -3.421051025390625, -3.29205322265625, -3.163055419921875, -3.0340576171875, -2.905059814453125, -2.77606201171875, -2.647064208984375, -2.51806640625, -2.389068603515625, -2.26007080078125, -2.131072998046875, -2.0020751953125, -1.873077392578125, -1.74407958984375, -1.615081787109375, -1.486083984375, -1.357086181640625, -1.22808837890625, -1.099090576171875, -0.9700927734375, -0.841094970703125, -0.71209716796875, -0.583099365234375, -0.4541015625, -0.325103759765625, -0.19610595703125, -0.067108154296875, 0.0618896484375, 0.190887451171875, 0.31988525390625, 0.448883056640625, 0.577880859375, 0.706878662109375, 0.83587646484375, 0.964874267578125, 1.0938720703125, 1.222869873046875, 1.35186767578125, 1.480865478515625, 1.60986328125, 1.738861083984375, 1.86785888671875, 1.996856689453125, 2.1258544921875, 2.254852294921875, 2.38385009765625, 2.512847900390625, 2.641845703125, 2.770843505859375, 2.89984130859375, 3.028839111328125, 3.1578369140625, 3.286834716796875, 3.41583251953125, 3.544830322265625, 3.673828125]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 14.0, 34.0, 73.0, 146.0, 225.0, 212.0, 153.0, 90.0, 38.0, 14.0, 9.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-39.67644500732422, -38.89781188964844, -38.119178771972656, -37.340545654296875, -36.561912536621094, -35.78327560424805, -35.004642486572266, -34.226009368896484, -33.4473762512207, -32.66874313354492, -31.89011001586914, -31.111474990844727, -30.332841873168945, -29.554208755493164, -28.77557373046875, -27.99694061279297, -27.218307495117188, -26.439674377441406, -25.661041259765625, -24.88240623474121, -24.10377311706543, -23.32513999938965, -22.546504974365234, -21.767871856689453, -20.989238739013672, -20.21060562133789, -19.43197250366211, -18.653337478637695, -17.874704360961914, -17.096071243286133, -16.31743621826172, -15.538803100585938, -14.760171890258789, -13.981538772583008, -13.20290470123291, -12.424270629882812, -11.645637512207031, -10.86700439453125, -10.088370323181152, -9.309736251831055, -8.531103134155273, -7.752469539642334, -6.9738359451293945, -6.195202350616455, -5.416568756103516, -4.637935161590576, -3.8593015670776367, -3.0806679725646973, -2.302034378051758, -1.5234007835388184, -0.7447671890258789, 0.03386640548706055, 0.8125, 1.5911335945129395, 2.369767189025879, 3.1484007835388184, 3.927034378051758, 4.705667972564697, 5.484301567077637, 6.262935161590576, 7.041568756103516, 7.820202350616455, 8.598835945129395, 9.377470016479492, 10.156103134155273]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 6.0, 9.0, 6.0, 7.0, 12.0, 11.0, 23.0, 11.0, 18.0, 27.0, 30.0, 36.0, 24.0, 29.0, 39.0, 35.0, 31.0, 41.0, 50.0, 27.0, 36.0, 37.0, 42.0, 28.0, 33.0, 47.0, 35.0, 33.0, 29.0, 24.0, 35.0, 27.0, 30.0, 17.0, 17.0, 10.0, 8.0, 11.0, 4.0, 6.0, 9.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.547563552856445, -6.342548847198486, -6.1375346183776855, -5.932519912719727, -5.727505683898926, -5.522490978240967, -5.317476272583008, -5.112462043762207, -4.907447814941406, -4.702433109283447, -4.4974188804626465, -4.2924041748046875, -4.087389945983887, -3.8823752403259277, -3.677360773086548, -3.472346305847168, -3.267331600189209, -3.062317132949829, -2.857302665710449, -2.6522879600524902, -2.4472737312316895, -2.2422590255737305, -2.0372445583343506, -1.8322300910949707, -1.6272156238555908, -1.422201156616211, -1.217186689376831, -1.0121721029281616, -0.8071576356887817, -0.6021431684494019, -0.3971285820007324, -0.19211411476135254, 0.01289987564086914, 0.2179143726825714, 0.4229288697242737, 0.6279433965682983, 0.8329578638076782, 1.037972331047058, 1.2429869174957275, 1.4480013847351074, 1.6530158519744873, 1.8580303192138672, 2.063044786453247, 2.268059253692627, 2.473073959350586, 2.6780881881713867, 2.8831028938293457, 3.0881173610687256, 3.2931318283081055, 3.4981462955474854, 3.7031607627868652, 3.908175468444824, 4.113189697265625, 4.318204402923584, 4.523219108581543, 4.728233337402344, 4.9332475662231445, 5.1382622718811035, 5.343276500701904, 5.548291206359863, 5.753305435180664, 5.958320140838623, 6.163334846496582, 6.368349075317383, 6.573363780975342]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 7.0, 5.0, 6.0, 12.0, 6.0, 13.0, 20.0, 15.0, 21.0, 13.0, 21.0, 25.0, 27.0, 27.0, 35.0, 26.0, 36.0, 30.0, 32.0, 35.0, 36.0, 42.0, 31.0, 42.0, 41.0, 34.0, 33.0, 29.0, 31.0, 39.0, 31.0, 28.0, 31.0, 16.0, 18.0, 13.0, 13.0, 16.0, 21.0, 15.0, 11.0, 3.0, 9.0, 3.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.83984375, -0.8139419555664062, -0.7880401611328125, -0.7621383666992188, -0.736236572265625, -0.7103347778320312, -0.6844329833984375, -0.6585311889648438, -0.63262939453125, -0.6067276000976562, -0.5808258056640625, -0.5549240112304688, -0.529022216796875, -0.5031204223632812, -0.4772186279296875, -0.45131683349609375, -0.4254150390625, -0.39951324462890625, -0.3736114501953125, -0.34770965576171875, -0.321807861328125, -0.29590606689453125, -0.2700042724609375, -0.24410247802734375, -0.21820068359375, -0.19229888916015625, -0.1663970947265625, -0.14049530029296875, -0.114593505859375, -0.08869171142578125, -0.0627899169921875, -0.03688812255859375, -0.010986328125, 0.01491546630859375, 0.0408172607421875, 0.06671905517578125, 0.092620849609375, 0.11852264404296875, 0.1444244384765625, 0.17032623291015625, 0.19622802734375, 0.22212982177734375, 0.2480316162109375, 0.27393341064453125, 0.299835205078125, 0.32573699951171875, 0.3516387939453125, 0.37754058837890625, 0.4034423828125, 0.42934417724609375, 0.4552459716796875, 0.48114776611328125, 0.507049560546875, 0.5329513549804688, 0.5588531494140625, 0.5847549438476562, 0.61065673828125, 0.6365585327148438, 0.6624603271484375, 0.6883621215820312, 0.714263916015625, 0.7401657104492188, 0.7660675048828125, 0.7919692993164062, 0.81787109375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 5.0, 9.0, 18.0, 28.0, 46.0, 68.0, 100.0, 195.0, 331.0, 682.0, 1364.0, 2953.0, 6608.0, 15617.0, 43853.0, 158082.0, 507985.0, 220371.0, 56115.0, 19242.0, 8013.0, 3544.0, 1597.0, 805.0, 388.0, 217.0, 138.0, 74.0, 33.0, 21.0, 19.0, 10.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.7109375, -0.6925239562988281, -0.6741104125976562, -0.6556968688964844, -0.6372833251953125, -0.6188697814941406, -0.6004562377929688, -0.5820426940917969, -0.563629150390625, -0.5452156066894531, -0.5268020629882812, -0.5083885192871094, -0.4899749755859375, -0.4715614318847656, -0.45314788818359375, -0.4347343444824219, -0.41632080078125, -0.3979072570800781, -0.37949371337890625, -0.3610801696777344, -0.3426666259765625, -0.3242530822753906, -0.30583953857421875, -0.2874259948730469, -0.269012451171875, -0.2505989074707031, -0.23218536376953125, -0.21377182006835938, -0.1953582763671875, -0.17694473266601562, -0.15853118896484375, -0.14011764526367188, -0.1217041015625, -0.10329055786132812, -0.08487701416015625, -0.06646347045898438, -0.0480499267578125, -0.029636383056640625, -0.01122283935546875, 0.007190704345703125, 0.025604248046875, 0.044017791748046875, 0.06243133544921875, 0.08084487915039062, 0.0992584228515625, 0.11767196655273438, 0.13608551025390625, 0.15449905395507812, 0.17291259765625, 0.19132614135742188, 0.20973968505859375, 0.22815322875976562, 0.2465667724609375, 0.2649803161621094, 0.28339385986328125, 0.3018074035644531, 0.320220947265625, 0.3386344909667969, 0.35704803466796875, 0.3754615783691406, 0.3938751220703125, 0.4122886657714844, 0.43070220947265625, 0.4491157531738281, 0.467529296875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 8.0, 7.0, 11.0, 13.0, 18.0, 19.0, 16.0, 15.0, 16.0, 31.0, 30.0, 29.0, 39.0, 32.0, 27.0, 40.0, 24.0, 39.0, 48.0, 1068.0, 38.0, 44.0, 45.0, 38.0, 38.0, 37.0, 39.0, 33.0, 26.0, 15.0, 21.0, 23.0, 19.0, 21.0, 14.0, 9.0, 9.0, 6.0, 5.0, 8.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.73974609375, -0.7193756103515625, -0.699005126953125, -0.6786346435546875, -0.65826416015625, -0.6378936767578125, -0.617523193359375, -0.5971527099609375, -0.5767822265625, -0.5564117431640625, -0.536041259765625, -0.5156707763671875, -0.49530029296875, -0.4749298095703125, -0.454559326171875, -0.4341888427734375, -0.413818359375, -0.3934478759765625, -0.373077392578125, -0.3527069091796875, -0.33233642578125, -0.3119659423828125, -0.291595458984375, -0.2712249755859375, -0.2508544921875, -0.2304840087890625, -0.210113525390625, -0.1897430419921875, -0.16937255859375, -0.1490020751953125, -0.128631591796875, -0.1082611083984375, -0.087890625, -0.0675201416015625, -0.047149658203125, -0.0267791748046875, -0.00640869140625, 0.0139617919921875, 0.034332275390625, 0.0547027587890625, 0.0750732421875, 0.0954437255859375, 0.115814208984375, 0.1361846923828125, 0.15655517578125, 0.1769256591796875, 0.197296142578125, 0.2176666259765625, 0.238037109375, 0.2584075927734375, 0.278778076171875, 0.2991485595703125, 0.31951904296875, 0.3398895263671875, 0.360260009765625, 0.3806304931640625, 0.4010009765625, 0.4213714599609375, 0.441741943359375, 0.4621124267578125, 0.48248291015625, 0.5028533935546875, 0.523223876953125, 0.5435943603515625, 0.56396484375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 6.0, 3.0, 11.0, 14.0, 17.0, 33.0, 66.0, 83.0, 135.0, 292.0, 553.0, 1106.0, 2510.0, 6509.0, 20476.0, 103322.0, 1533703.0, 363899.0, 45081.0, 11788.0, 4107.0, 1655.0, 813.0, 392.0, 236.0, 108.0, 65.0, 53.0, 27.0, 21.0, 13.0, 16.0, 8.0, 2.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5771484375, -0.5614509582519531, -0.5457534790039062, -0.5300559997558594, -0.5143585205078125, -0.4986610412597656, -0.48296356201171875, -0.4672660827636719, -0.451568603515625, -0.4358711242675781, -0.42017364501953125, -0.4044761657714844, -0.3887786865234375, -0.3730812072753906, -0.35738372802734375, -0.3416862487792969, -0.32598876953125, -0.3102912902832031, -0.29459381103515625, -0.2788963317871094, -0.2631988525390625, -0.24750137329101562, -0.23180389404296875, -0.21610641479492188, -0.200408935546875, -0.18471145629882812, -0.16901397705078125, -0.15331649780273438, -0.1376190185546875, -0.12192153930664062, -0.10622406005859375, -0.09052658081054688, -0.0748291015625, -0.059131622314453125, -0.04343414306640625, -0.027736663818359375, -0.0120391845703125, 0.003658294677734375, 0.01935577392578125, 0.035053253173828125, 0.050750732421875, 0.06644821166992188, 0.08214569091796875, 0.09784317016601562, 0.1135406494140625, 0.12923812866210938, 0.14493560791015625, 0.16063308715820312, 0.17633056640625, 0.19202804565429688, 0.20772552490234375, 0.22342300415039062, 0.2391204833984375, 0.2548179626464844, 0.27051544189453125, 0.2862129211425781, 0.301910400390625, 0.3176078796386719, 0.33330535888671875, 0.3490028381347656, 0.3647003173828125, 0.3803977966308594, 0.39609527587890625, 0.4117927551269531, 0.427490234375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 5.0, 2.0, 7.0, 9.0, 15.0, 19.0, 18.0, 26.0, 39.0, 60.0, 110.0, 189.0, 159.0, 108.0, 48.0, 36.0, 35.0, 18.0, 15.0, 16.0, 9.0, 12.0, 7.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08135986328125, -0.07881832122802734, -0.07627677917480469, -0.07373523712158203, -0.07119369506835938, -0.06865215301513672, -0.06611061096191406, -0.0635690689086914, -0.06102752685546875, -0.058485984802246094, -0.05594444274902344, -0.05340290069580078, -0.050861358642578125, -0.04831981658935547, -0.04577827453613281, -0.043236732482910156, -0.0406951904296875, -0.038153648376464844, -0.03561210632324219, -0.03307056427001953, -0.030529022216796875, -0.02798748016357422, -0.025445938110351562, -0.022904396057128906, -0.02036285400390625, -0.017821311950683594, -0.015279769897460938, -0.012738227844238281, -0.010196685791015625, -0.007655143737792969, -0.0051136016845703125, -0.0025720596313476562, -3.0517578125e-05, 0.0025110244750976562, 0.0050525665283203125, 0.007594108581542969, 0.010135650634765625, 0.012677192687988281, 0.015218734741210938, 0.017760276794433594, 0.02030181884765625, 0.022843360900878906, 0.025384902954101562, 0.02792644500732422, 0.030467987060546875, 0.03300952911376953, 0.03555107116699219, 0.038092613220214844, 0.0406341552734375, 0.043175697326660156, 0.04571723937988281, 0.04825878143310547, 0.050800323486328125, 0.05334186553955078, 0.05588340759277344, 0.058424949645996094, 0.06096649169921875, 0.0635080337524414, 0.06604957580566406, 0.06859111785888672, 0.07113265991210938, 0.07367420196533203, 0.07621574401855469, 0.07875728607177734, 0.081298828125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 5.0, 1.0, 6.0, 4.0, 3.0, 5.0, 9.0, 6.0, 13.0, 12.0, 14.0, 34.0, 25.0, 30.0, 51.0, 44.0, 99.0, 283.0, 1674.0, 10236.0, 982219.0, 49067.0, 3649.0, 614.0, 152.0, 82.0, 46.0, 30.0, 32.0, 29.0, 14.0, 11.0, 11.0, 5.0, 5.0, 6.0, 10.0, 5.0, 3.0, 1.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.228515625, -1.19097900390625, -1.1534423828125, -1.11590576171875, -1.078369140625, -1.04083251953125, -1.0032958984375, -0.96575927734375, -0.92822265625, -0.89068603515625, -0.8531494140625, -0.81561279296875, -0.778076171875, -0.74053955078125, -0.7030029296875, -0.66546630859375, -0.6279296875, -0.59039306640625, -0.5528564453125, -0.51531982421875, -0.477783203125, -0.44024658203125, -0.4027099609375, -0.36517333984375, -0.32763671875, -0.29010009765625, -0.2525634765625, -0.21502685546875, -0.177490234375, -0.13995361328125, -0.1024169921875, -0.06488037109375, -0.02734375, 0.01019287109375, 0.0477294921875, 0.08526611328125, 0.122802734375, 0.16033935546875, 0.1978759765625, 0.23541259765625, 0.27294921875, 0.31048583984375, 0.3480224609375, 0.38555908203125, 0.423095703125, 0.46063232421875, 0.4981689453125, 0.53570556640625, 0.5732421875, 0.61077880859375, 0.6483154296875, 0.68585205078125, 0.723388671875, 0.76092529296875, 0.7984619140625, 0.83599853515625, 0.87353515625, 0.91107177734375, 0.9486083984375, 0.98614501953125, 1.023681640625, 1.06121826171875, 1.0987548828125, 1.13629150390625, 1.173828125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 11.0, 59.0, 192.0, 401.0, 246.0, 75.0, 17.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30899348855018616, -0.2969755232334137, -0.2849575877189636, -0.27293962240219116, -0.2609216868877411, -0.24890372157096863, -0.23688577115535736, -0.2248678207397461, -0.21284985542297363, -0.20083190500736237, -0.1888139545917511, -0.17679598927497864, -0.16477803885936737, -0.1527600884437561, -0.14074213802814484, -0.12872418761253357, -0.1167062371969223, -0.10468828678131104, -0.09267032891511917, -0.0806523784995079, -0.06863442063331604, -0.05661647021770477, -0.044598519802093506, -0.03258056193590164, -0.020562611520290375, -0.008544658310711384, 0.003473294898867607, 0.015491247177124023, 0.02750920131802559, 0.039527155458927155, 0.05154510587453842, 0.06356306374073029, 0.07558101415634155, 0.08759896457195282, 0.09961692243814468, 0.11163487285375595, 0.12365283071994781, 0.13567078113555908, 0.14768873155117035, 0.15970668196678162, 0.17172464728355408, 0.18374259769916534, 0.1957605481147766, 0.20777851343154907, 0.21979646384716034, 0.2318144142627716, 0.24383236467838287, 0.25585031509399414, 0.2678682804107666, 0.27988624572753906, 0.29190418124198914, 0.3039221465587616, 0.31594008207321167, 0.32795804738998413, 0.3399760127067566, 0.35199394822120667, 0.36401188373565674, 0.3760298490524292, 0.3880477845668793, 0.40006574988365173, 0.4120836853981018, 0.42410165071487427, 0.43611961603164673, 0.4481375515460968, 0.46015551686286926]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 0.0, 4.0, 6.0, 6.0, 1.0, 3.0, 12.0, 11.0, 8.0, 21.0, 10.0, 22.0, 21.0, 20.0, 33.0, 35.0, 35.0, 48.0, 29.0, 49.0, 54.0, 49.0, 36.0, 48.0, 48.0, 38.0, 39.0, 36.0, 27.0, 34.0, 45.0, 24.0, 19.0, 18.0, 17.0, 22.0, 14.0, 17.0, 12.0, 7.0, 16.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.102711021900177, -0.10005365312099457, -0.09739627689123154, -0.0947389006614685, -0.09208153188228607, -0.08942416310310364, -0.0867667868733406, -0.08410941064357758, -0.08145204186439514, -0.07879467308521271, -0.07613729685544968, -0.07347992062568665, -0.07082255184650421, -0.06816518306732178, -0.06550780683755875, -0.06285043060779572, -0.06019306182861328, -0.05753568932414055, -0.054878316819667816, -0.052220944315195084, -0.04956357181072235, -0.04690619930624962, -0.044248826801776886, -0.04159145429730415, -0.03893408179283142, -0.03627670928835869, -0.033619336783885956, -0.030961964279413223, -0.02830459177494049, -0.025647219270467758, -0.022989846765995026, -0.020332474261522293, -0.01767510175704956, -0.015017729252576828, -0.012360356748104095, -0.009702984243631363, -0.00704561173915863, -0.004388239234685898, -0.0017308667302131653, 0.0009265057742595673, 0.0035838782787323, 0.006241250783205032, 0.008898623287677765, 0.011555995792150497, 0.01421336829662323, 0.016870740801095963, 0.019528113305568695, 0.022185485810041428, 0.02484285831451416, 0.027500230818986893, 0.030157603323459625, 0.03281497582793236, 0.03547234833240509, 0.03812972083687782, 0.040787093341350555, 0.04344446584582329, 0.04610183835029602, 0.04875921085476875, 0.051416583359241486, 0.05407395586371422, 0.05673132836818695, 0.05938870087265968, 0.062046073377132416, 0.06470344960689545, 0.06736081838607788]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 7.0, 4.0, 7.0, 11.0, 6.0, 15.0, 20.0, 17.0, 18.0, 12.0, 22.0, 27.0, 26.0, 26.0, 34.0, 29.0, 32.0, 36.0, 34.0, 29.0, 37.0, 40.0, 35.0, 38.0, 43.0, 34.0, 30.0, 34.0, 30.0, 34.0, 34.0, 29.0, 29.0, 15.0, 18.0, 16.0, 14.0, 16.0, 21.0, 13.0, 9.0, 6.0, 7.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.837890625, -0.8119964599609375, -0.786102294921875, -0.7602081298828125, -0.73431396484375, -0.7084197998046875, -0.682525634765625, -0.6566314697265625, -0.6307373046875, -0.6048431396484375, -0.578948974609375, -0.5530548095703125, -0.52716064453125, -0.5012664794921875, -0.475372314453125, -0.4494781494140625, -0.423583984375, -0.3976898193359375, -0.371795654296875, -0.3459014892578125, -0.32000732421875, -0.2941131591796875, -0.268218994140625, -0.2423248291015625, -0.2164306640625, -0.1905364990234375, -0.164642333984375, -0.1387481689453125, -0.11285400390625, -0.0869598388671875, -0.061065673828125, -0.0351715087890625, -0.00927734375, 0.0166168212890625, 0.042510986328125, 0.0684051513671875, 0.09429931640625, 0.1201934814453125, 0.146087646484375, 0.1719818115234375, 0.1978759765625, 0.2237701416015625, 0.249664306640625, 0.2755584716796875, 0.30145263671875, 0.3273468017578125, 0.353240966796875, 0.3791351318359375, 0.405029296875, 0.4309234619140625, 0.456817626953125, 0.4827117919921875, 0.50860595703125, 0.5345001220703125, 0.560394287109375, 0.5862884521484375, 0.6121826171875, 0.6380767822265625, 0.663970947265625, 0.6898651123046875, 0.71575927734375, 0.7416534423828125, 0.767547607421875, 0.7934417724609375, 0.8193359375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 5.0, 5.0, 6.0, 8.0, 14.0, 28.0, 38.0, 63.0, 117.0, 207.0, 373.0, 660.0, 1354.0, 2605.0, 5334.0, 11922.0, 28842.0, 75799.0, 210918.0, 438137.0, 168397.0, 60952.0, 23580.0, 9817.0, 4468.0, 2297.0, 1167.0, 635.0, 374.0, 171.0, 104.0, 65.0, 27.0, 18.0, 15.0, 6.0, 3.0, 5.0, 5.0, 2.0, 6.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.67578125, -1.6255950927734375, -1.575408935546875, -1.5252227783203125, -1.47503662109375, -1.4248504638671875, -1.374664306640625, -1.3244781494140625, -1.2742919921875, -1.2241058349609375, -1.173919677734375, -1.1237335205078125, -1.07354736328125, -1.0233612060546875, -0.973175048828125, -0.9229888916015625, -0.872802734375, -0.8226165771484375, -0.772430419921875, -0.7222442626953125, -0.67205810546875, -0.6218719482421875, -0.571685791015625, -0.5214996337890625, -0.4713134765625, -0.4211273193359375, -0.370941162109375, -0.3207550048828125, -0.27056884765625, -0.2203826904296875, -0.170196533203125, -0.1200103759765625, -0.06982421875, -0.0196380615234375, 0.030548095703125, 0.0807342529296875, 0.13092041015625, 0.1811065673828125, 0.231292724609375, 0.2814788818359375, 0.3316650390625, 0.3818511962890625, 0.432037353515625, 0.4822235107421875, 0.53240966796875, 0.5825958251953125, 0.632781982421875, 0.6829681396484375, 0.733154296875, 0.7833404541015625, 0.833526611328125, 0.8837127685546875, 0.93389892578125, 0.9840850830078125, 1.034271240234375, 1.0844573974609375, 1.1346435546875, 1.1848297119140625, 1.235015869140625, 1.2852020263671875, 1.33538818359375, 1.3855743408203125, 1.435760498046875, 1.4859466552734375, 1.5361328125]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 3.0, 10.0, 10.0, 9.0, 12.0, 11.0, 7.0, 15.0, 20.0, 19.0, 35.0, 27.0, 23.0, 28.0, 48.0, 41.0, 45.0, 79.0, 120.0, 194.0, 1406.0, 229.0, 160.0, 104.0, 61.0, 47.0, 32.0, 36.0, 37.0, 29.0, 18.0, 25.0, 23.0, 15.0, 12.0, 14.0, 8.0, 6.0, 6.0, 3.0, 7.0, 4.0, 4.0, 6.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.560546875, -2.471282958984375, -2.38201904296875, -2.292755126953125, -2.2034912109375, -2.114227294921875, -2.02496337890625, -1.935699462890625, -1.846435546875, -1.757171630859375, -1.66790771484375, -1.578643798828125, -1.4893798828125, -1.400115966796875, -1.31085205078125, -1.221588134765625, -1.13232421875, -1.043060302734375, -0.95379638671875, -0.864532470703125, -0.7752685546875, -0.686004638671875, -0.59674072265625, -0.507476806640625, -0.418212890625, -0.328948974609375, -0.23968505859375, -0.150421142578125, -0.0611572265625, 0.028106689453125, 0.11737060546875, 0.206634521484375, 0.2958984375, 0.385162353515625, 0.47442626953125, 0.563690185546875, 0.6529541015625, 0.742218017578125, 0.83148193359375, 0.920745849609375, 1.010009765625, 1.099273681640625, 1.18853759765625, 1.277801513671875, 1.3670654296875, 1.456329345703125, 1.54559326171875, 1.634857177734375, 1.72412109375, 1.813385009765625, 1.90264892578125, 1.991912841796875, 2.0811767578125, 2.170440673828125, 2.25970458984375, 2.348968505859375, 2.438232421875, 2.527496337890625, 2.61676025390625, 2.706024169921875, 2.7952880859375, 2.884552001953125, 2.97381591796875, 3.063079833984375, 3.15234375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 5.0, 6.0, 9.0, 12.0, 21.0, 23.0, 45.0, 86.0, 182.0, 291.0, 642.0, 1644.0, 10162.0, 2485886.0, 638350.0, 5890.0, 1306.0, 519.0, 300.0, 141.0, 68.0, 44.0, 35.0, 14.0, 14.0, 10.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.46875, -10.1405029296875, -9.812255859375, -9.4840087890625, -9.15576171875, -8.8275146484375, -8.499267578125, -8.1710205078125, -7.8427734375, -7.5145263671875, -7.186279296875, -6.8580322265625, -6.52978515625, -6.2015380859375, -5.873291015625, -5.5450439453125, -5.216796875, -4.8885498046875, -4.560302734375, -4.2320556640625, -3.90380859375, -3.5755615234375, -3.247314453125, -2.9190673828125, -2.5908203125, -2.2625732421875, -1.934326171875, -1.6060791015625, -1.27783203125, -0.9495849609375, -0.621337890625, -0.2930908203125, 0.03515625, 0.3634033203125, 0.691650390625, 1.0198974609375, 1.34814453125, 1.6763916015625, 2.004638671875, 2.3328857421875, 2.6611328125, 2.9893798828125, 3.317626953125, 3.6458740234375, 3.97412109375, 4.3023681640625, 4.630615234375, 4.9588623046875, 5.287109375, 5.6153564453125, 5.943603515625, 6.2718505859375, 6.60009765625, 6.9283447265625, 7.256591796875, 7.5848388671875, 7.9130859375, 8.2413330078125, 8.569580078125, 8.8978271484375, 9.22607421875, 9.5543212890625, 9.882568359375, 10.2108154296875, 10.5390625]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [3.0, 22.0, 232.0, 538.0, 207.0, 16.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5429890155792236, -2.524026870727539, -1.5050649642944336, -0.486102819442749, 0.5328590869903564, 1.551820993423462, 2.5707833766937256, 3.589745283126831, 4.608707427978516, 5.627669334411621, 6.646631240844727, 7.66559362411499, 8.684555053710938, 9.70351791381836, 10.722479820251465, 11.74144172668457, 12.760403633117676, 13.779365539550781, 14.798327445983887, 15.817289352416992, 16.836252212524414, 17.855213165283203, 18.874176025390625, 19.893138885498047, 20.912099838256836, 21.931062698364258, 22.950023651123047, 23.96898651123047, 24.987947463989258, 26.00691032409668, 27.02587127685547, 28.04483413696289, 29.063796997070312, 30.082759857177734, 31.101720809936523, 32.12068176269531, 33.139644622802734, 34.158607482910156, 35.17757034301758, 36.196533203125, 37.215492248535156, 38.23445510864258, 39.25341796875, 40.272377014160156, 41.29133987426758, 42.310302734375, 43.32926559448242, 44.348228454589844, 45.3671875, 46.38615036010742, 47.405113220214844, 48.424072265625, 49.44303512573242, 50.461997985839844, 51.480960845947266, 52.49992370605469, 53.51888656616211, 54.53784942626953, 55.55681228637695, 56.57577133178711, 57.59473419189453, 58.61369705200195, 59.632659912109375, 60.65161895751953, 61.67058181762695]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 5.0, 0.0, 5.0, 9.0, 6.0, 9.0, 11.0, 8.0, 10.0, 6.0, 18.0, 11.0, 19.0, 23.0, 25.0, 21.0, 38.0, 40.0, 32.0, 31.0, 33.0, 39.0, 32.0, 41.0, 45.0, 33.0, 39.0, 53.0, 31.0, 43.0, 30.0, 24.0, 24.0, 28.0, 26.0, 21.0, 18.0, 24.0, 16.0, 15.0, 16.0, 18.0, 5.0, 8.0, 6.0, 3.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-8.231964111328125, -8.001847267150879, -7.771731376647949, -7.541615009307861, -7.311498641967773, -7.0813822746276855, -6.851265907287598, -6.621149063110352, -6.391033172607422, -6.160916805267334, -5.930800437927246, -5.700684070587158, -5.47056770324707, -5.240451335906982, -5.0103349685668945, -4.780218124389648, -4.5501017570495605, -4.319985389709473, -4.089869022369385, -3.859752655029297, -3.629636287689209, -3.399519920349121, -3.169403314590454, -2.939286947250366, -2.7091705799102783, -2.4790542125701904, -2.2489378452301025, -2.0188212394714355, -1.7887049913406372, -1.5585886240005493, -1.3284721374511719, -1.098355770111084, -0.8682398796081543, -0.6381235122680664, -0.40800708532333374, -0.17789065837860107, 0.052225708961486816, 0.2823420763015747, 0.5124585628509521, 0.74257493019104, 0.9726912975311279, 1.2028076648712158, 1.4329240322113037, 1.6630405187606812, 1.893156886100769, 2.1232733726501465, 2.3533897399902344, 2.5835061073303223, 2.81362247467041, 3.043738842010498, 3.273855209350586, 3.503971576690674, 3.7340879440307617, 3.9642043113708496, 4.1943206787109375, 4.424437522888184, 4.654553413391113, 4.884669780731201, 5.114786148071289, 5.344902515411377, 5.575018882751465, 5.805135250091553, 6.035251617431641, 6.265368461608887, 6.495484828948975]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 4.0, 7.0, 7.0, 10.0, 6.0, 11.0, 13.0, 18.0, 14.0, 13.0, 28.0, 23.0, 21.0, 31.0, 30.0, 34.0, 28.0, 36.0, 38.0, 33.0, 30.0, 37.0, 51.0, 36.0, 47.0, 40.0, 31.0, 28.0, 37.0, 29.0, 24.0, 32.0, 30.0, 22.0, 18.0, 17.0, 19.0, 17.0, 5.0, 13.0, 8.0, 9.0, 7.0, 3.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.931640625, -0.9038619995117188, -0.8760833740234375, -0.8483047485351562, -0.820526123046875, -0.7927474975585938, -0.7649688720703125, -0.7371902465820312, -0.70941162109375, -0.6816329956054688, -0.6538543701171875, -0.6260757446289062, -0.598297119140625, -0.5705184936523438, -0.5427398681640625, -0.5149612426757812, -0.4871826171875, -0.45940399169921875, -0.4316253662109375, -0.40384674072265625, -0.376068115234375, -0.34828948974609375, -0.3205108642578125, -0.29273223876953125, -0.26495361328125, -0.23717498779296875, -0.2093963623046875, -0.18161773681640625, -0.153839111328125, -0.12606048583984375, -0.0982818603515625, -0.07050323486328125, -0.042724609375, -0.01494598388671875, 0.0128326416015625, 0.04061126708984375, 0.068389892578125, 0.09616851806640625, 0.1239471435546875, 0.15172576904296875, 0.17950439453125, 0.20728302001953125, 0.2350616455078125, 0.26284027099609375, 0.290618896484375, 0.31839752197265625, 0.3461761474609375, 0.37395477294921875, 0.4017333984375, 0.42951202392578125, 0.4572906494140625, 0.48506927490234375, 0.512847900390625, 0.5406265258789062, 0.5684051513671875, 0.5961837768554688, 0.62396240234375, 0.6517410278320312, 0.6795196533203125, 0.7072982788085938, 0.735076904296875, 0.7628555297851562, 0.7906341552734375, 0.8184127807617188, 0.84619140625]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 8.0, 7.0, 12.0, 16.0, 12.0, 25.0, 41.0, 50.0, 71.0, 127.0, 228.0, 370.0, 675.0, 1271.0, 2435.0, 5005.0, 11512.0, 29682.0, 91912.0, 393846.0, 1872065.0, 1408832.0, 266408.0, 68400.0, 22789.0, 9294.0, 4258.0, 2211.0, 1130.0, 603.0, 374.0, 207.0, 122.0, 92.0, 54.0, 37.0, 25.0, 16.0, 17.0, 12.0, 5.0, 7.0, 5.0, 4.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.09375, -2.031951904296875, -1.97015380859375, -1.908355712890625, -1.8465576171875, -1.784759521484375, -1.72296142578125, -1.661163330078125, -1.599365234375, -1.537567138671875, -1.47576904296875, -1.413970947265625, -1.3521728515625, -1.290374755859375, -1.22857666015625, -1.166778564453125, -1.10498046875, -1.043182373046875, -0.98138427734375, -0.919586181640625, -0.8577880859375, -0.795989990234375, -0.73419189453125, -0.672393798828125, -0.610595703125, -0.548797607421875, -0.48699951171875, -0.425201416015625, -0.3634033203125, -0.301605224609375, -0.23980712890625, -0.178009033203125, -0.1162109375, -0.054412841796875, 0.00738525390625, 0.069183349609375, 0.1309814453125, 0.192779541015625, 0.25457763671875, 0.316375732421875, 0.378173828125, 0.439971923828125, 0.50177001953125, 0.563568115234375, 0.6253662109375, 0.687164306640625, 0.74896240234375, 0.810760498046875, 0.87255859375, 0.934356689453125, 0.99615478515625, 1.057952880859375, 1.1197509765625, 1.181549072265625, 1.24334716796875, 1.305145263671875, 1.366943359375, 1.428741455078125, 1.49053955078125, 1.552337646484375, 1.6141357421875, 1.675933837890625, 1.73773193359375, 1.799530029296875, 1.861328125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 9.0, 11.0, 1.0, 15.0, 18.0, 19.0, 32.0, 42.0, 59.0, 52.0, 79.0, 112.0, 133.0, 142.0, 241.0, 292.0, 412.0, 461.0, 443.0, 342.0, 298.0, 192.0, 155.0, 111.0, 85.0, 79.0, 54.0, 36.0, 30.0, 30.0, 17.0, 14.0, 12.0, 7.0, 8.0, 9.0, 5.0, 6.0, 3.0, 1.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.712890625, -1.65887451171875, -1.6048583984375, -1.55084228515625, -1.496826171875, -1.44281005859375, -1.3887939453125, -1.33477783203125, -1.28076171875, -1.22674560546875, -1.1727294921875, -1.11871337890625, -1.064697265625, -1.01068115234375, -0.9566650390625, -0.90264892578125, -0.8486328125, -0.79461669921875, -0.7406005859375, -0.68658447265625, -0.632568359375, -0.57855224609375, -0.5245361328125, -0.47052001953125, -0.41650390625, -0.36248779296875, -0.3084716796875, -0.25445556640625, -0.200439453125, -0.14642333984375, -0.0924072265625, -0.03839111328125, 0.015625, 0.06964111328125, 0.1236572265625, 0.17767333984375, 0.231689453125, 0.28570556640625, 0.3397216796875, 0.39373779296875, 0.44775390625, 0.50177001953125, 0.5557861328125, 0.60980224609375, 0.663818359375, 0.71783447265625, 0.7718505859375, 0.82586669921875, 0.8798828125, 0.93389892578125, 0.9879150390625, 1.04193115234375, 1.095947265625, 1.14996337890625, 1.2039794921875, 1.25799560546875, 1.31201171875, 1.36602783203125, 1.4200439453125, 1.47406005859375, 1.528076171875, 1.58209228515625, 1.6361083984375, 1.69012451171875, 1.744140625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 4.0, 6.0, 3.0, 9.0, 20.0, 5.0, 20.0, 24.0, 34.0, 39.0, 65.0, 73.0, 121.0, 205.0, 397.0, 1410.0, 8030.0, 95549.0, 3080092.0, 965657.0, 36846.0, 4034.0, 845.0, 291.0, 140.0, 107.0, 70.0, 56.0, 32.0, 30.0, 21.0, 14.0, 11.0, 8.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.34375, -7.12664794921875, -6.9095458984375, -6.69244384765625, -6.475341796875, -6.25823974609375, -6.0411376953125, -5.82403564453125, -5.60693359375, -5.38983154296875, -5.1727294921875, -4.95562744140625, -4.738525390625, -4.52142333984375, -4.3043212890625, -4.08721923828125, -3.8701171875, -3.65301513671875, -3.4359130859375, -3.21881103515625, -3.001708984375, -2.78460693359375, -2.5675048828125, -2.35040283203125, -2.13330078125, -1.91619873046875, -1.6990966796875, -1.48199462890625, -1.264892578125, -1.04779052734375, -0.8306884765625, -0.61358642578125, -0.396484375, -0.17938232421875, 0.0377197265625, 0.25482177734375, 0.471923828125, 0.68902587890625, 0.9061279296875, 1.12322998046875, 1.34033203125, 1.55743408203125, 1.7745361328125, 1.99163818359375, 2.208740234375, 2.42584228515625, 2.6429443359375, 2.86004638671875, 3.0771484375, 3.29425048828125, 3.5113525390625, 3.72845458984375, 3.945556640625, 4.16265869140625, 4.3797607421875, 4.59686279296875, 4.81396484375, 5.03106689453125, 5.2481689453125, 5.46527099609375, 5.682373046875, 5.89947509765625, 6.1165771484375, 6.33367919921875, 6.55078125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 24.0, 69.0, 184.0, 295.0, 257.0, 117.0, 42.0, 15.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.029930114746094, -28.05422592163086, -27.078521728515625, -26.102819442749023, -25.12711524963379, -24.151411056518555, -23.175708770751953, -22.20000457763672, -21.224300384521484, -20.24859619140625, -19.272891998291016, -18.297189712524414, -17.32148551940918, -16.345781326293945, -15.370078086853027, -14.39437484741211, -13.418670654296875, -12.44296646118164, -11.467263221740723, -10.491559982299805, -9.51585578918457, -8.540151596069336, -7.564448356628418, -6.588744640350342, -5.613040924072266, -4.6373372077941895, -3.6616334915161133, -2.685929775238037, -1.710226058959961, -0.7345223426818848, 0.2411813735961914, 1.2168850898742676, 2.1925888061523438, 3.16829252243042, 4.143996238708496, 5.119699954986572, 6.095403671264648, 7.071107387542725, 8.0468111038208, 9.022514343261719, 9.998218536376953, 10.973922729492188, 11.949625968933105, 12.925329208374023, 13.901033401489258, 14.876737594604492, 15.85244083404541, 16.828144073486328, 17.803848266601562, 18.779552459716797, 19.75525665283203, 20.730958938598633, 21.706663131713867, 22.6823673248291, 23.658069610595703, 24.633773803710938, 25.609477996826172, 26.585182189941406, 27.56088638305664, 28.536588668823242, 29.512292861938477, 30.48799705505371, 31.463699340820312, 32.43940353393555, 33.41510772705078]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 6.0, 7.0, 7.0, 10.0, 4.0, 12.0, 20.0, 17.0, 22.0, 30.0, 26.0, 26.0, 26.0, 32.0, 44.0, 32.0, 44.0, 37.0, 48.0, 40.0, 62.0, 40.0, 28.0, 32.0, 38.0, 41.0, 40.0, 23.0, 38.0, 25.0, 23.0, 18.0, 27.0, 8.0, 15.0, 14.0, 11.0, 13.0, 4.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.204721450805664, -6.984983921051025, -6.765246391296387, -6.545508861541748, -6.325771331787109, -6.1060333251953125, -5.886295795440674, -5.666558265686035, -5.4468207359313965, -5.227083206176758, -5.007345676422119, -4.7876081466674805, -4.567870140075684, -4.348133087158203, -4.128395080566406, -3.9086575508117676, -3.688920021057129, -3.4691824913024902, -3.2494449615478516, -3.029707193374634, -2.809969663619995, -2.5902321338653564, -2.3704943656921387, -2.1507568359375, -1.9310193061828613, -1.7112817764282227, -1.4915441274642944, -1.2718064785003662, -1.0520689487457275, -0.8323314189910889, -0.6125937700271606, -0.3928561210632324, -0.17311906814575195, 0.046618521213531494, 0.26635611057281494, 0.4860936999320984, 0.7058312892913818, 0.9255688190460205, 1.1453064680099487, 1.365044116973877, 1.5847816467285156, 1.8045191764831543, 2.024256706237793, 2.2439944744110107, 2.4637320041656494, 2.683469533920288, 2.903207302093506, 3.1229448318481445, 3.342682361602783, 3.562419891357422, 3.7821574211120605, 4.001894950866699, 4.221632957458496, 4.441370010375977, 4.661108016967773, 4.880845546722412, 5.100583076477051, 5.3203206062316895, 5.540058135986328, 5.759795665740967, 5.9795331954956055, 6.199271202087402, 6.419008731842041, 6.63874626159668, 6.858483791351318]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 7.0, 4.0, 1.0, 1.0, 4.0, 3.0, 8.0, 2.0, 8.0, 10.0, 15.0, 16.0, 18.0, 24.0, 29.0, 25.0, 29.0, 24.0, 28.0, 41.0, 25.0, 39.0, 25.0, 29.0, 35.0, 38.0, 45.0, 37.0, 42.0, 45.0, 34.0, 28.0, 38.0, 29.0, 24.0, 32.0, 29.0, 27.0, 15.0, 7.0, 12.0, 10.0, 9.0, 11.0, 8.0, 19.0, 3.0, 7.0, 4.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83251953125, -0.80657958984375, -0.7806396484375, -0.75469970703125, -0.728759765625, -0.70281982421875, -0.6768798828125, -0.65093994140625, -0.625, -0.59906005859375, -0.5731201171875, -0.54718017578125, -0.521240234375, -0.49530029296875, -0.4693603515625, -0.44342041015625, -0.41748046875, -0.39154052734375, -0.3656005859375, -0.33966064453125, -0.313720703125, -0.28778076171875, -0.2618408203125, -0.23590087890625, -0.2099609375, -0.18402099609375, -0.1580810546875, -0.13214111328125, -0.106201171875, -0.08026123046875, -0.0543212890625, -0.02838134765625, -0.00244140625, 0.02349853515625, 0.0494384765625, 0.07537841796875, 0.101318359375, 0.12725830078125, 0.1531982421875, 0.17913818359375, 0.205078125, 0.23101806640625, 0.2569580078125, 0.28289794921875, 0.308837890625, 0.33477783203125, 0.3607177734375, 0.38665771484375, 0.41259765625, 0.43853759765625, 0.4644775390625, 0.49041748046875, 0.516357421875, 0.54229736328125, 0.5682373046875, 0.59417724609375, 0.6201171875, 0.64605712890625, 0.6719970703125, 0.69793701171875, 0.723876953125, 0.74981689453125, 0.7757568359375, 0.80169677734375, 0.82763671875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 11.0, 11.0, 13.0, 23.0, 35.0, 42.0, 83.0, 111.0, 177.0, 210.0, 328.0, 466.0, 636.0, 1023.0, 1547.0, 2247.0, 3599.0, 5636.0, 9383.0, 16818.0, 32727.0, 71604.0, 166637.0, 306595.0, 229201.0, 101006.0, 44792.0, 22083.0, 12070.0, 6993.0, 4225.0, 2693.0, 1774.0, 1202.0, 830.0, 508.0, 375.0, 256.0, 163.0, 105.0, 87.0, 68.0, 54.0, 39.0, 29.0, 13.0, 7.0, 7.0, 4.0, 5.0, 4.0, 1.0, 1.0], "bins": [-0.2347412109375, -0.22797775268554688, -0.22121429443359375, -0.21445083618164062, -0.2076873779296875, -0.20092391967773438, -0.19416046142578125, -0.18739700317382812, -0.180633544921875, -0.17387008666992188, -0.16710662841796875, -0.16034317016601562, -0.1535797119140625, -0.14681625366210938, -0.14005279541015625, -0.13328933715820312, -0.12652587890625, -0.11976242065429688, -0.11299896240234375, -0.10623550415039062, -0.0994720458984375, -0.09270858764648438, -0.08594512939453125, -0.07918167114257812, -0.072418212890625, -0.06565475463867188, -0.05889129638671875, -0.052127838134765625, -0.0453643798828125, -0.038600921630859375, -0.03183746337890625, -0.025074005126953125, -0.018310546875, -0.011547088623046875, -0.00478363037109375, 0.001979827880859375, 0.0087432861328125, 0.015506744384765625, 0.02227020263671875, 0.029033660888671875, 0.035797119140625, 0.042560577392578125, 0.04932403564453125, 0.056087493896484375, 0.0628509521484375, 0.06961441040039062, 0.07637786865234375, 0.08314132690429688, 0.08990478515625, 0.09666824340820312, 0.10343170166015625, 0.11019515991210938, 0.1169586181640625, 0.12372207641601562, 0.13048553466796875, 0.13724899291992188, 0.144012451171875, 0.15077590942382812, 0.15753936767578125, 0.16430282592773438, 0.1710662841796875, 0.17782974243164062, 0.18459320068359375, 0.19135665893554688, 0.1981201171875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 4.0, 5.0, 6.0, 11.0, 9.0, 8.0, 8.0, 14.0, 13.0, 19.0, 27.0, 23.0, 32.0, 28.0, 39.0, 32.0, 42.0, 36.0, 32.0, 35.0, 36.0, 1058.0, 39.0, 54.0, 27.0, 41.0, 39.0, 35.0, 28.0, 28.0, 32.0, 27.0, 30.0, 20.0, 16.0, 8.0, 15.0, 15.0, 12.0, 8.0, 6.0, 10.0, 4.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.5625, -0.5438461303710938, -0.5251922607421875, -0.5065383911132812, -0.487884521484375, -0.46923065185546875, -0.4505767822265625, -0.43192291259765625, -0.41326904296875, -0.39461517333984375, -0.3759613037109375, -0.35730743408203125, -0.338653564453125, -0.31999969482421875, -0.3013458251953125, -0.28269195556640625, -0.2640380859375, -0.24538421630859375, -0.2267303466796875, -0.20807647705078125, -0.189422607421875, -0.17076873779296875, -0.1521148681640625, -0.13346099853515625, -0.11480712890625, -0.09615325927734375, -0.0774993896484375, -0.05884552001953125, -0.040191650390625, -0.02153778076171875, -0.0028839111328125, 0.01576995849609375, 0.034423828125, 0.05307769775390625, 0.0717315673828125, 0.09038543701171875, 0.109039306640625, 0.12769317626953125, 0.1463470458984375, 0.16500091552734375, 0.18365478515625, 0.20230865478515625, 0.2209625244140625, 0.23961639404296875, 0.258270263671875, 0.27692413330078125, 0.2955780029296875, 0.31423187255859375, 0.3328857421875, 0.35153961181640625, 0.3701934814453125, 0.38884735107421875, 0.407501220703125, 0.42615509033203125, 0.4448089599609375, 0.46346282958984375, 0.48211669921875, 0.5007705688476562, 0.5194244384765625, 0.5380783081054688, 0.556732177734375, 0.5753860473632812, 0.5940399169921875, 0.6126937866210938, 0.63134765625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 4.0, 8.0, 8.0, 10.0, 14.0, 23.0, 43.0, 43.0, 84.0, 117.0, 211.0, 294.0, 548.0, 763.0, 1315.0, 2284.0, 3964.0, 7684.0, 16187.0, 39017.0, 116921.0, 553368.0, 1112956.0, 152317.0, 49161.0, 19689.0, 9001.0, 4598.0, 2594.0, 1496.0, 902.0, 545.0, 357.0, 223.0, 112.0, 79.0, 66.0, 41.0, 22.0, 17.0, 12.0, 11.0, 6.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.170654296875, -0.16516876220703125, -0.1596832275390625, -0.15419769287109375, -0.148712158203125, -0.14322662353515625, -0.1377410888671875, -0.13225555419921875, -0.12677001953125, -0.12128448486328125, -0.1157989501953125, -0.11031341552734375, -0.104827880859375, -0.09934234619140625, -0.0938568115234375, -0.08837127685546875, -0.0828857421875, -0.07740020751953125, -0.0719146728515625, -0.06642913818359375, -0.060943603515625, -0.05545806884765625, -0.0499725341796875, -0.04448699951171875, -0.03900146484375, -0.03351593017578125, -0.0280303955078125, -0.02254486083984375, -0.017059326171875, -0.01157379150390625, -0.0060882568359375, -0.00060272216796875, 0.0048828125, 0.01036834716796875, 0.0158538818359375, 0.02133941650390625, 0.026824951171875, 0.03231048583984375, 0.0377960205078125, 0.04328155517578125, 0.04876708984375, 0.05425262451171875, 0.0597381591796875, 0.06522369384765625, 0.070709228515625, 0.07619476318359375, 0.0816802978515625, 0.08716583251953125, 0.0926513671875, 0.09813690185546875, 0.1036224365234375, 0.10910797119140625, 0.114593505859375, 0.12007904052734375, 0.1255645751953125, 0.13105010986328125, 0.13653564453125, 0.14202117919921875, 0.1475067138671875, 0.15299224853515625, 0.158477783203125, 0.16396331787109375, 0.1694488525390625, 0.17493438720703125, 0.180419921875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 8.0, 6.0, 8.0, 14.0, 8.0, 17.0, 12.0, 19.0, 24.0, 35.0, 80.0, 166.0, 231.0, 161.0, 66.0, 32.0, 20.0, 12.0, 14.0, 13.0, 11.0, 6.0, 8.0, 4.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0389404296875, -0.03761720657348633, -0.036293983459472656, -0.034970760345458984, -0.03364753723144531, -0.03232431411743164, -0.03100109100341797, -0.029677867889404297, -0.028354644775390625, -0.027031421661376953, -0.02570819854736328, -0.02438497543334961, -0.023061752319335938, -0.021738529205322266, -0.020415306091308594, -0.019092082977294922, -0.01776885986328125, -0.016445636749267578, -0.015122413635253906, -0.013799190521240234, -0.012475967407226562, -0.01115274429321289, -0.009829521179199219, -0.008506298065185547, -0.007183074951171875, -0.005859851837158203, -0.004536628723144531, -0.0032134056091308594, -0.0018901824951171875, -0.0005669593811035156, 0.0007562637329101562, 0.002079486846923828, 0.0034027099609375, 0.004725933074951172, 0.006049156188964844, 0.007372379302978516, 0.008695602416992188, 0.01001882553100586, 0.011342048645019531, 0.012665271759033203, 0.013988494873046875, 0.015311717987060547, 0.01663494110107422, 0.01795816421508789, 0.019281387329101562, 0.020604610443115234, 0.021927833557128906, 0.023251056671142578, 0.02457427978515625, 0.025897502899169922, 0.027220726013183594, 0.028543949127197266, 0.029867172241210938, 0.03119039535522461, 0.03251361846923828, 0.03383684158325195, 0.035160064697265625, 0.0364832878112793, 0.03780651092529297, 0.03912973403930664, 0.04045295715332031, 0.041776180267333984, 0.043099403381347656, 0.04442262649536133, 0.045745849609375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 6.0, 9.0, 18.0, 26.0, 27.0, 82.0, 122.0, 406.0, 13930.0, 1020114.0, 13032.0, 450.0, 139.0, 67.0, 34.0, 24.0, 9.0, 3.0, 14.0, 6.0, 8.0, 5.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.95361328125, -0.92596435546875, -0.8983154296875, -0.87066650390625, -0.843017578125, -0.81536865234375, -0.7877197265625, -0.76007080078125, -0.732421875, -0.70477294921875, -0.6771240234375, -0.64947509765625, -0.621826171875, -0.59417724609375, -0.5665283203125, -0.53887939453125, -0.51123046875, -0.48358154296875, -0.4559326171875, -0.42828369140625, -0.400634765625, -0.37298583984375, -0.3453369140625, -0.31768798828125, -0.2900390625, -0.26239013671875, -0.2347412109375, -0.20709228515625, -0.179443359375, -0.15179443359375, -0.1241455078125, -0.09649658203125, -0.06884765625, -0.04119873046875, -0.0135498046875, 0.01409912109375, 0.041748046875, 0.06939697265625, 0.0970458984375, 0.12469482421875, 0.15234375, 0.17999267578125, 0.2076416015625, 0.23529052734375, 0.262939453125, 0.29058837890625, 0.3182373046875, 0.34588623046875, 0.37353515625, 0.40118408203125, 0.4288330078125, 0.45648193359375, 0.484130859375, 0.51177978515625, 0.5394287109375, 0.56707763671875, 0.5947265625, 0.62237548828125, 0.6500244140625, 0.67767333984375, 0.705322265625, 0.73297119140625, 0.7606201171875, 0.78826904296875, 0.81591796875]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 30.0, 129.0, 356.0, 339.0, 120.0, 23.0, 10.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07033619284629822, -0.06333759427070618, -0.05633899196982384, -0.049340393394231796, -0.04234179109334946, -0.035343192517757416, -0.028344593942165375, -0.021345991641283035, -0.014347393065690994, -0.007348793093115091, -0.0003501931205391884, 0.006648406386375427, 0.013647006824612617, 0.020645607262849808, 0.02764420583844185, 0.03464280813932419, 0.04164140671491623, 0.04864000529050827, 0.05563860759139061, 0.06263720989227295, 0.06963580846786499, 0.07663440704345703, 0.08363300561904907, 0.09063160419464111, 0.09763020277023315, 0.1046288013458252, 0.11162739992141724, 0.11862599849700928, 0.12562459707260132, 0.13262319564819336, 0.1396217942237854, 0.14662040770053864, 0.15361900627613068, 0.16061760485172272, 0.16761620342731476, 0.1746148020029068, 0.18161340057849884, 0.18861201405525208, 0.19561061263084412, 0.20260921120643616, 0.2096078097820282, 0.21660640835762024, 0.22360500693321228, 0.23060360550880432, 0.23760220408439636, 0.2446008026599884, 0.25159940123558044, 0.2585979998111725, 0.2655965983867645, 0.27259519696235657, 0.2795937955379486, 0.28659239411354065, 0.2935909926891327, 0.30058959126472473, 0.3075881898403168, 0.3145867884159088, 0.32158541679382324, 0.3285840153694153, 0.3355826139450073, 0.34258121252059937, 0.3495798110961914, 0.35657840967178345, 0.3635770082473755, 0.37057560682296753, 0.37757420539855957]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 4.0, 5.0, 8.0, 12.0, 9.0, 22.0, 20.0, 12.0, 17.0, 12.0, 21.0, 27.0, 25.0, 36.0, 37.0, 27.0, 31.0, 40.0, 38.0, 37.0, 30.0, 44.0, 36.0, 38.0, 47.0, 44.0, 39.0, 27.0, 38.0, 31.0, 23.0, 21.0, 19.0, 17.0, 23.0, 16.0, 9.0, 9.0, 10.0, 8.0, 6.0, 5.0, 7.0, 5.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.04153925180435181, -0.04017271101474762, -0.038806166499853134, -0.03743962198495865, -0.03607308119535446, -0.034706540405750275, -0.03333999589085579, -0.031973451375961304, -0.030606910586357117, -0.02924036793410778, -0.027873825281858444, -0.026507282629609108, -0.02514073997735977, -0.023774197325110435, -0.0224076546728611, -0.021041112020611763, -0.019674569368362427, -0.01830802671611309, -0.016941484063863754, -0.015574941411614418, -0.014208398759365082, -0.012841856107115746, -0.01147531345486641, -0.010108770802617073, -0.008742228150367737, -0.007375685498118401, -0.006009142845869064, -0.004642600193619728, -0.003276057541370392, -0.0019095148891210556, -0.0005429722368717194, 0.0008235704153776169, 0.002190113067626953, 0.0035566557198762894, 0.004923198372125626, 0.006289741024374962, 0.007656283676624298, 0.009022826328873634, 0.01038936898112297, 0.011755911633372307, 0.013122454285621643, 0.01448899693787098, 0.015855539590120316, 0.017222082242369652, 0.018588624894618988, 0.019955167546868324, 0.02132171019911766, 0.022688252851366997, 0.024054795503616333, 0.02542133815586567, 0.026787880808115005, 0.028154423460364342, 0.029520966112613678, 0.030887508764863014, 0.03225405141711235, 0.033620595932006836, 0.03498713672161102, 0.03635367751121521, 0.037720222026109695, 0.03908676654100418, 0.04045330733060837, 0.041819848120212555, 0.04318639263510704, 0.044552937150001526, 0.04591947793960571]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 7.0, 3.0, 2.0, 1.0, 4.0, 3.0, 8.0, 2.0, 8.0, 11.0, 13.0, 17.0, 20.0, 21.0, 31.0, 24.0, 31.0, 23.0, 30.0, 41.0, 26.0, 37.0, 23.0, 31.0, 33.0, 43.0, 45.0, 39.0, 39.0, 43.0, 34.0, 28.0, 37.0, 32.0, 23.0, 30.0, 28.0, 28.0, 14.0, 8.0, 13.0, 8.0, 11.0, 9.0, 10.0, 17.0, 3.0, 9.0, 2.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83251953125, -0.8065185546875, -0.780517578125, -0.7545166015625, -0.728515625, -0.7025146484375, -0.676513671875, -0.6505126953125, -0.62451171875, -0.5985107421875, -0.572509765625, -0.5465087890625, -0.5205078125, -0.4945068359375, -0.468505859375, -0.4425048828125, -0.41650390625, -0.3905029296875, -0.364501953125, -0.3385009765625, -0.3125, -0.2864990234375, -0.260498046875, -0.2344970703125, -0.20849609375, -0.1824951171875, -0.156494140625, -0.1304931640625, -0.1044921875, -0.0784912109375, -0.052490234375, -0.0264892578125, -0.00048828125, 0.0255126953125, 0.051513671875, 0.0775146484375, 0.103515625, 0.1295166015625, 0.155517578125, 0.1815185546875, 0.20751953125, 0.2335205078125, 0.259521484375, 0.2855224609375, 0.3115234375, 0.3375244140625, 0.363525390625, 0.3895263671875, 0.41552734375, 0.4415283203125, 0.467529296875, 0.4935302734375, 0.51953125, 0.5455322265625, 0.571533203125, 0.5975341796875, 0.62353515625, 0.6495361328125, 0.675537109375, 0.7015380859375, 0.7275390625, 0.7535400390625, 0.779541015625, 0.8055419921875, 0.83154296875]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 3.0, 4.0, 9.0, 7.0, 13.0, 32.0, 24.0, 46.0, 42.0, 79.0, 146.0, 240.0, 386.0, 675.0, 1262.0, 2449.0, 4765.0, 10215.0, 23580.0, 64709.0, 215035.0, 440645.0, 186911.0, 56861.0, 21617.0, 9349.0, 4429.0, 2298.0, 1158.0, 601.0, 392.0, 182.0, 128.0, 72.0, 55.0, 39.0, 27.0, 20.0, 15.0, 8.0, 4.0, 7.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.634765625, -1.5751953125, -1.515625, -1.4560546875, -1.396484375, -1.3369140625, -1.27734375, -1.2177734375, -1.158203125, -1.0986328125, -1.0390625, -0.9794921875, -0.919921875, -0.8603515625, -0.80078125, -0.7412109375, -0.681640625, -0.6220703125, -0.5625, -0.5029296875, -0.443359375, -0.3837890625, -0.32421875, -0.2646484375, -0.205078125, -0.1455078125, -0.0859375, -0.0263671875, 0.033203125, 0.0927734375, 0.15234375, 0.2119140625, 0.271484375, 0.3310546875, 0.390625, 0.4501953125, 0.509765625, 0.5693359375, 0.62890625, 0.6884765625, 0.748046875, 0.8076171875, 0.8671875, 0.9267578125, 0.986328125, 1.0458984375, 1.10546875, 1.1650390625, 1.224609375, 1.2841796875, 1.34375, 1.4033203125, 1.462890625, 1.5224609375, 1.58203125, 1.6416015625, 1.701171875, 1.7607421875, 1.8203125, 1.8798828125, 1.939453125, 1.9990234375, 2.05859375, 2.1181640625, 2.177734375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 7.0, 15.0, 17.0, 26.0, 25.0, 21.0, 30.0, 32.0, 41.0, 46.0, 48.0, 60.0, 69.0, 135.0, 213.0, 1396.0, 275.0, 141.0, 114.0, 46.0, 32.0, 44.0, 41.0, 27.0, 30.0, 22.0, 16.0, 19.0, 13.0, 10.0, 10.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.931640625, -2.829559326171875, -2.72747802734375, -2.625396728515625, -2.5233154296875, -2.421234130859375, -2.31915283203125, -2.217071533203125, -2.114990234375, -2.012908935546875, -1.91082763671875, -1.808746337890625, -1.7066650390625, -1.604583740234375, -1.50250244140625, -1.400421142578125, -1.29833984375, -1.196258544921875, -1.09417724609375, -0.992095947265625, -0.8900146484375, -0.787933349609375, -0.68585205078125, -0.583770751953125, -0.481689453125, -0.379608154296875, -0.27752685546875, -0.175445556640625, -0.0733642578125, 0.028717041015625, 0.13079833984375, 0.232879638671875, 0.3349609375, 0.437042236328125, 0.53912353515625, 0.641204833984375, 0.7432861328125, 0.845367431640625, 0.94744873046875, 1.049530029296875, 1.151611328125, 1.253692626953125, 1.35577392578125, 1.457855224609375, 1.5599365234375, 1.662017822265625, 1.76409912109375, 1.866180419921875, 1.96826171875, 2.070343017578125, 2.17242431640625, 2.274505615234375, 2.3765869140625, 2.478668212890625, 2.58074951171875, 2.682830810546875, 2.784912109375, 2.886993408203125, 2.98907470703125, 3.091156005859375, 3.1932373046875, 3.295318603515625, 3.39739990234375, 3.499481201171875, 3.6015625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 10.0, 3.0, 14.0, 14.0, 24.0, 24.0, 36.0, 32.0, 77.0, 63.0, 105.0, 143.0, 215.0, 425.0, 1580.0, 11585.0, 307982.0, 2741585.0, 74196.0, 5515.0, 939.0, 386.0, 208.0, 133.0, 94.0, 79.0, 61.0, 42.0, 36.0, 31.0, 21.0, 15.0, 10.0, 10.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.11328125, -6.91192626953125, -6.7105712890625, -6.50921630859375, -6.307861328125, -6.10650634765625, -5.9051513671875, -5.70379638671875, -5.50244140625, -5.30108642578125, -5.0997314453125, -4.89837646484375, -4.697021484375, -4.49566650390625, -4.2943115234375, -4.09295654296875, -3.8916015625, -3.69024658203125, -3.4888916015625, -3.28753662109375, -3.086181640625, -2.88482666015625, -2.6834716796875, -2.48211669921875, -2.28076171875, -2.07940673828125, -1.8780517578125, -1.67669677734375, -1.475341796875, -1.27398681640625, -1.0726318359375, -0.87127685546875, -0.669921875, -0.46856689453125, -0.2672119140625, -0.06585693359375, 0.135498046875, 0.33685302734375, 0.5382080078125, 0.73956298828125, 0.94091796875, 1.14227294921875, 1.3436279296875, 1.54498291015625, 1.746337890625, 1.94769287109375, 2.1490478515625, 2.35040283203125, 2.5517578125, 2.75311279296875, 2.9544677734375, 3.15582275390625, 3.357177734375, 3.55853271484375, 3.7598876953125, 3.96124267578125, 4.16259765625, 4.36395263671875, 4.5653076171875, 4.76666259765625, 4.968017578125, 5.16937255859375, 5.3707275390625, 5.57208251953125, 5.7734375]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 5.0, 79.0, 263.0, 428.0, 200.0, 35.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5068366527557373, -2.7066187858581543, -1.9064010381698608, -1.1061832904815674, -0.3059654235839844, 0.49425244331359863, 1.2944700717926025, 2.0946881771087646, 2.8949058055877686, 3.6951236724853516, 4.4953413009643555, 5.295558929443359, 6.0957770347595215, 6.895995140075684, 7.6962127685546875, 8.496430397033691, 9.296648025512695, 10.0968656539917, 10.897083282470703, 11.697301864624023, 12.497519493103027, 13.297737121582031, 14.097954750061035, 14.898172378540039, 15.69839096069336, 16.49860954284668, 17.298826217651367, 18.099044799804688, 18.899261474609375, 19.699480056762695, 20.499698638916016, 21.299915313720703, 22.100133895874023, 22.900352478027344, 23.70056915283203, 24.50078773498535, 25.30100440979004, 26.10122299194336, 26.901439666748047, 27.701658248901367, 28.501876831054688, 29.302095413208008, 30.102312088012695, 30.902530670166016, 31.702747344970703, 32.502967834472656, 33.303184509277344, 34.10340118408203, 34.90361785888672, 35.703834533691406, 36.50405502319336, 37.30427169799805, 38.104488372802734, 38.90470886230469, 39.704925537109375, 40.50514221191406, 41.305362701416016, 42.1055793762207, 42.905799865722656, 43.706016540527344, 44.50623321533203, 45.30644989013672, 46.10667037963867, 46.90688705444336, 47.70710372924805]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 6.0, 9.0, 4.0, 3.0, 14.0, 11.0, 12.0, 17.0, 16.0, 19.0, 30.0, 29.0, 25.0, 40.0, 32.0, 35.0, 45.0, 37.0, 45.0, 39.0, 44.0, 50.0, 35.0, 47.0, 38.0, 44.0, 27.0, 28.0, 27.0, 29.0, 27.0, 25.0, 19.0, 9.0, 23.0, 10.0, 7.0, 4.0, 11.0, 10.0, 2.0, 7.0, 4.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0], "bins": [-8.103711128234863, -7.875274181365967, -7.64683723449707, -7.418400287628174, -7.189963340759277, -6.961526870727539, -6.733089447021484, -6.504652976989746, -6.27621603012085, -6.047779083251953, -5.819342136383057, -5.59090518951416, -5.362468242645264, -5.134031295776367, -4.905594825744629, -4.677157878875732, -4.448720932006836, -4.2202839851379395, -3.991847038269043, -3.7634100914001465, -3.534973382949829, -3.3065364360809326, -3.078099489212036, -2.8496627807617188, -2.621225357055664, -2.3927884101867676, -2.164351463317871, -1.9359146356582642, -1.7074778079986572, -1.4790408611297607, -1.2506039142608643, -1.0221670866012573, -0.7937302589416504, -0.5652933716773987, -0.3368564546108246, -0.10841953754425049, 0.12001734972000122, 0.34845423698425293, 0.5768911838531494, 0.8053280115127563, 1.0337649583816528, 1.2622019052505493, 1.4906387329101562, 1.7190756797790527, 1.9475126266479492, 2.1759495735168457, 2.404386520385742, 2.6328232288360596, 2.861260175704956, 3.0896971225738525, 3.318134069442749, 3.5465707778930664, 3.775007724761963, 4.003444671630859, 4.231881618499756, 4.460318565368652, 4.688755512237549, 4.917192459106445, 5.145629405975342, 5.374066352844238, 5.602503299713135, 5.830940246582031, 6.0593767166137695, 6.287813663482666, 6.5162506103515625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 4.0, 4.0, 4.0, 5.0, 2.0, 8.0, 5.0, 11.0, 10.0, 15.0, 13.0, 25.0, 20.0, 27.0, 30.0, 28.0, 31.0, 34.0, 32.0, 30.0, 24.0, 32.0, 28.0, 40.0, 46.0, 39.0, 47.0, 33.0, 36.0, 46.0, 31.0, 33.0, 20.0, 29.0, 32.0, 19.0, 11.0, 26.0, 14.0, 21.0, 8.0, 7.0, 6.0, 8.0, 6.0, 5.0, 4.0, 4.0, 3.0, 5.0, 5.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.93212890625, -0.9042816162109375, -0.876434326171875, -0.8485870361328125, -0.82073974609375, -0.7928924560546875, -0.765045166015625, -0.7371978759765625, -0.7093505859375, -0.6815032958984375, -0.653656005859375, -0.6258087158203125, -0.59796142578125, -0.5701141357421875, -0.542266845703125, -0.5144195556640625, -0.486572265625, -0.4587249755859375, -0.430877685546875, -0.4030303955078125, -0.37518310546875, -0.3473358154296875, -0.319488525390625, -0.2916412353515625, -0.2637939453125, -0.2359466552734375, -0.208099365234375, -0.1802520751953125, -0.15240478515625, -0.1245574951171875, -0.096710205078125, -0.0688629150390625, -0.041015625, -0.0131683349609375, 0.014678955078125, 0.0425262451171875, 0.07037353515625, 0.0982208251953125, 0.126068115234375, 0.1539154052734375, 0.1817626953125, 0.2096099853515625, 0.237457275390625, 0.2653045654296875, 0.29315185546875, 0.3209991455078125, 0.348846435546875, 0.3766937255859375, 0.404541015625, 0.4323883056640625, 0.460235595703125, 0.4880828857421875, 0.51593017578125, 0.5437774658203125, 0.571624755859375, 0.5994720458984375, 0.6273193359375, 0.6551666259765625, 0.683013916015625, 0.7108612060546875, 0.73870849609375, 0.7665557861328125, 0.794403076171875, 0.8222503662109375, 0.85009765625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 4.0, 1.0, 7.0, 6.0, 9.0, 17.0, 15.0, 16.0, 29.0, 38.0, 49.0, 94.0, 108.0, 186.0, 263.0, 430.0, 715.0, 1239.0, 2149.0, 3907.0, 7983.0, 17358.0, 42931.0, 122248.0, 434231.0, 1556376.0, 1431597.0, 388279.0, 112275.0, 39764.0, 16208.0, 7261.0, 3665.0, 1916.0, 1132.0, 635.0, 359.0, 249.0, 165.0, 116.0, 76.0, 54.0, 30.0, 31.0, 14.0, 17.0, 11.0, 8.0, 6.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.4775390625, -1.426513671875, -1.37548828125, -1.324462890625, -1.2734375, -1.222412109375, -1.17138671875, -1.120361328125, -1.0693359375, -1.018310546875, -0.96728515625, -0.916259765625, -0.865234375, -0.814208984375, -0.76318359375, -0.712158203125, -0.6611328125, -0.610107421875, -0.55908203125, -0.508056640625, -0.45703125, -0.406005859375, -0.35498046875, -0.303955078125, -0.2529296875, -0.201904296875, -0.15087890625, -0.099853515625, -0.048828125, 0.002197265625, 0.05322265625, 0.104248046875, 0.1552734375, 0.206298828125, 0.25732421875, 0.308349609375, 0.359375, 0.410400390625, 0.46142578125, 0.512451171875, 0.5634765625, 0.614501953125, 0.66552734375, 0.716552734375, 0.767578125, 0.818603515625, 0.86962890625, 0.920654296875, 0.9716796875, 1.022705078125, 1.07373046875, 1.124755859375, 1.17578125, 1.226806640625, 1.27783203125, 1.328857421875, 1.3798828125, 1.430908203125, 1.48193359375, 1.532958984375, 1.583984375, 1.635009765625, 1.68603515625, 1.737060546875, 1.7880859375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 5.0, 6.0, 6.0, 18.0, 13.0, 18.0, 17.0, 29.0, 43.0, 65.0, 65.0, 85.0, 130.0, 181.0, 216.0, 285.0, 365.0, 483.0, 475.0, 385.0, 290.0, 210.0, 156.0, 121.0, 100.0, 77.0, 42.0, 41.0, 32.0, 28.0, 17.0, 21.0, 15.0, 11.0, 6.0, 2.0, 6.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6083984375, -1.5530242919921875, -1.497650146484375, -1.4422760009765625, -1.38690185546875, -1.3315277099609375, -1.276153564453125, -1.2207794189453125, -1.1654052734375, -1.1100311279296875, -1.054656982421875, -0.9992828369140625, -0.94390869140625, -0.8885345458984375, -0.833160400390625, -0.7777862548828125, -0.722412109375, -0.6670379638671875, -0.611663818359375, -0.5562896728515625, -0.50091552734375, -0.4455413818359375, -0.390167236328125, -0.3347930908203125, -0.2794189453125, -0.2240447998046875, -0.168670654296875, -0.1132965087890625, -0.05792236328125, -0.0025482177734375, 0.052825927734375, 0.1082000732421875, 0.16357421875, 0.2189483642578125, 0.274322509765625, 0.3296966552734375, 0.38507080078125, 0.4404449462890625, 0.495819091796875, 0.5511932373046875, 0.6065673828125, 0.6619415283203125, 0.717315673828125, 0.7726898193359375, 0.82806396484375, 0.8834381103515625, 0.938812255859375, 0.9941864013671875, 1.049560546875, 1.1049346923828125, 1.160308837890625, 1.2156829833984375, 1.27105712890625, 1.3264312744140625, 1.381805419921875, 1.4371795654296875, 1.4925537109375, 1.5479278564453125, 1.603302001953125, 1.6586761474609375, 1.71405029296875, 1.7694244384765625, 1.824798583984375, 1.8801727294921875, 1.935546875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 13.0, 14.0, 18.0, 14.0, 12.0, 31.0, 24.0, 51.0, 58.0, 80.0, 128.0, 170.0, 319.0, 659.0, 2191.0, 11124.0, 127242.0, 3096252.0, 906273.0, 41700.0, 5170.0, 1435.0, 498.0, 246.0, 150.0, 97.0, 73.0, 47.0, 45.0, 34.0, 24.0, 17.0, 18.0, 14.0, 8.0, 6.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.91015625, -6.71710205078125, -6.5240478515625, -6.33099365234375, -6.137939453125, -5.94488525390625, -5.7518310546875, -5.55877685546875, -5.36572265625, -5.17266845703125, -4.9796142578125, -4.78656005859375, -4.593505859375, -4.40045166015625, -4.2073974609375, -4.01434326171875, -3.8212890625, -3.62823486328125, -3.4351806640625, -3.24212646484375, -3.049072265625, -2.85601806640625, -2.6629638671875, -2.46990966796875, -2.27685546875, -2.08380126953125, -1.8907470703125, -1.69769287109375, -1.504638671875, -1.31158447265625, -1.1185302734375, -0.92547607421875, -0.732421875, -0.53936767578125, -0.3463134765625, -0.15325927734375, 0.039794921875, 0.23284912109375, 0.4259033203125, 0.61895751953125, 0.81201171875, 1.00506591796875, 1.1981201171875, 1.39117431640625, 1.584228515625, 1.77728271484375, 1.9703369140625, 2.16339111328125, 2.3564453125, 2.54949951171875, 2.7425537109375, 2.93560791015625, 3.128662109375, 3.32171630859375, 3.5147705078125, 3.70782470703125, 3.90087890625, 4.09393310546875, 4.2869873046875, 4.48004150390625, 4.673095703125, 4.86614990234375, 5.0592041015625, 5.25225830078125, 5.4453125]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 9.0, 16.0, 22.0, 35.0, 56.0, 85.0, 93.0, 116.0, 124.0, 133.0, 85.0, 85.0, 47.0, 42.0, 26.0, 15.0, 8.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.73993968963623, -12.360600471496582, -11.98126220703125, -11.601922988891602, -11.22258472442627, -10.843245506286621, -10.463907241821289, -10.08456802368164, -9.705228805541992, -9.325889587402344, -8.946551322937012, -8.567212104797363, -8.187873840332031, -7.808534622192383, -7.429195880889893, -7.049857139587402, -6.670518398284912, -6.291179656982422, -5.911840915679932, -5.532502174377441, -5.153162956237793, -4.773824214935303, -4.3944854736328125, -4.015146255493164, -3.635807752609253, -3.2564690113067627, -2.8771300315856934, -2.497791290283203, -2.118452548980713, -1.7391135692596436, -1.3597748279571533, -0.980435848236084, -0.6010971069335938, -0.22175827622413635, 0.15758055448532104, 0.536919355392456, 0.9162582159042358, 1.2955970764160156, 1.6749358177185059, 2.054274797439575, 2.4336135387420654, 2.8129522800445557, 3.192291259765625, 3.5716300010681152, 3.9509687423706055, 4.330307960510254, 4.709646224975586, 5.088985443115234, 5.468324184417725, 5.847662925720215, 6.227001667022705, 6.606340408325195, 6.985679626464844, 7.365018367767334, 7.744357109069824, 8.123696327209473, 8.503034591674805, 8.882373809814453, 9.261712074279785, 9.641051292419434, 10.020389556884766, 10.399728775024414, 10.779067993164062, 11.158406257629395, 11.537745475769043]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 2.0, 9.0, 6.0, 8.0, 9.0, 14.0, 12.0, 11.0, 21.0, 23.0, 24.0, 25.0, 26.0, 29.0, 25.0, 39.0, 45.0, 44.0, 35.0, 33.0, 35.0, 31.0, 40.0, 28.0, 30.0, 33.0, 25.0, 34.0, 43.0, 32.0, 24.0, 32.0, 25.0, 18.0, 16.0, 21.0, 16.0, 12.0, 11.0, 9.0, 7.0, 13.0, 8.0, 5.0, 6.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.274033546447754, -5.0995073318481445, -4.924981117248535, -4.750454902648926, -4.575928688049316, -4.401402473449707, -4.226876258850098, -4.052350044250488, -3.877824068069458, -3.7032978534698486, -3.5287716388702393, -3.354245662689209, -3.1797194480895996, -3.0051932334899902, -2.830667018890381, -2.6561408042907715, -2.481614589691162, -2.3070883750915527, -2.1325621604919434, -1.9580360651016235, -1.7835098505020142, -1.6089836359024048, -1.434457540512085, -1.2599313259124756, -1.0854051113128662, -0.9108788967132568, -0.7363527417182922, -0.5618265867233276, -0.38730037212371826, -0.2127741575241089, -0.03824806213378906, 0.1362781524658203, 0.3108038902282715, 0.48533007502555847, 0.6598562598228455, 0.8343824148178101, 1.0089086294174194, 1.1834348440170288, 1.3579609394073486, 1.532487154006958, 1.7070133686065674, 1.8815395832061768, 2.056065797805786, 2.2305917739868164, 2.405117988586426, 2.579644203186035, 2.7541704177856445, 2.928696632385254, 3.1032228469848633, 3.2777490615844727, 3.452275276184082, 3.6268014907836914, 3.801327705383301, 3.97585391998291, 4.1503801345825195, 4.324906349182129, 4.499432563781738, 4.673958778381348, 4.848484992980957, 5.023011207580566, 5.197537422180176, 5.372063636779785, 5.5465898513793945, 5.721116065979004, 5.895641803741455]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 6.0, 7.0, 7.0, 13.0, 5.0, 9.0, 11.0, 19.0, 19.0, 14.0, 24.0, 21.0, 23.0, 30.0, 36.0, 40.0, 40.0, 37.0, 42.0, 43.0, 30.0, 52.0, 40.0, 51.0, 42.0, 44.0, 29.0, 38.0, 26.0, 36.0, 19.0, 27.0, 17.0, 16.0, 12.0, 15.0, 8.0, 10.0, 12.0, 7.0, 7.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.9443359375, -0.9150619506835938, -0.8857879638671875, -0.8565139770507812, -0.827239990234375, -0.7979660034179688, -0.7686920166015625, -0.7394180297851562, -0.71014404296875, -0.6808700561523438, -0.6515960693359375, -0.6223220825195312, -0.593048095703125, -0.5637741088867188, -0.5345001220703125, -0.5052261352539062, -0.4759521484375, -0.44667816162109375, -0.4174041748046875, -0.38813018798828125, -0.358856201171875, -0.32958221435546875, -0.3003082275390625, -0.27103424072265625, -0.24176025390625, -0.21248626708984375, -0.1832122802734375, -0.15393829345703125, -0.124664306640625, -0.09539031982421875, -0.0661163330078125, -0.03684234619140625, -0.007568359375, 0.02170562744140625, 0.0509796142578125, 0.08025360107421875, 0.109527587890625, 0.13880157470703125, 0.1680755615234375, 0.19734954833984375, 0.22662353515625, 0.25589752197265625, 0.2851715087890625, 0.31444549560546875, 0.343719482421875, 0.37299346923828125, 0.4022674560546875, 0.43154144287109375, 0.4608154296875, 0.49008941650390625, 0.5193634033203125, 0.5486373901367188, 0.577911376953125, 0.6071853637695312, 0.6364593505859375, 0.6657333374023438, 0.69500732421875, 0.7242813110351562, 0.7535552978515625, 0.7828292846679688, 0.812103271484375, 0.8413772583007812, 0.8706512451171875, 0.8999252319335938, 0.92919921875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 4.0, 2.0, 3.0, 9.0, 5.0, 13.0, 12.0, 13.0, 23.0, 33.0, 54.0, 60.0, 87.0, 91.0, 127.0, 188.0, 239.0, 335.0, 509.0, 692.0, 1027.0, 1697.0, 2910.0, 6269.0, 17475.0, 64515.0, 304985.0, 480903.0, 118617.0, 28285.0, 9283.0, 3918.0, 2069.0, 1248.0, 791.0, 543.0, 405.0, 310.0, 191.0, 164.0, 124.0, 93.0, 56.0, 53.0, 28.0, 31.0, 20.0, 17.0, 16.0, 7.0, 8.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.385009765625, -0.3734130859375, -0.36181640625, -0.3502197265625, -0.338623046875, -0.3270263671875, -0.3154296875, -0.3038330078125, -0.292236328125, -0.2806396484375, -0.26904296875, -0.2574462890625, -0.245849609375, -0.2342529296875, -0.22265625, -0.2110595703125, -0.199462890625, -0.1878662109375, -0.17626953125, -0.1646728515625, -0.153076171875, -0.1414794921875, -0.1298828125, -0.1182861328125, -0.106689453125, -0.0950927734375, -0.08349609375, -0.0718994140625, -0.060302734375, -0.0487060546875, -0.037109375, -0.0255126953125, -0.013916015625, -0.0023193359375, 0.00927734375, 0.0208740234375, 0.032470703125, 0.0440673828125, 0.0556640625, 0.0672607421875, 0.078857421875, 0.0904541015625, 0.10205078125, 0.1136474609375, 0.125244140625, 0.1368408203125, 0.1484375, 0.1600341796875, 0.171630859375, 0.1832275390625, 0.19482421875, 0.2064208984375, 0.218017578125, 0.2296142578125, 0.2412109375, 0.2528076171875, 0.264404296875, 0.2760009765625, 0.28759765625, 0.2991943359375, 0.310791015625, 0.3223876953125, 0.333984375, 0.3455810546875, 0.357177734375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 1.0, 3.0, 2.0, 5.0, 8.0, 5.0, 13.0, 12.0, 9.0, 11.0, 11.0, 21.0, 19.0, 23.0, 27.0, 33.0, 24.0, 40.0, 33.0, 43.0, 32.0, 35.0, 43.0, 1060.0, 46.0, 42.0, 40.0, 40.0, 44.0, 39.0, 34.0, 37.0, 32.0, 26.0, 16.0, 28.0, 17.0, 12.0, 18.0, 9.0, 10.0, 8.0, 3.0, 9.0, 2.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.533203125, -0.513397216796875, -0.49359130859375, -0.473785400390625, -0.4539794921875, -0.434173583984375, -0.41436767578125, -0.394561767578125, -0.374755859375, -0.354949951171875, -0.33514404296875, -0.315338134765625, -0.2955322265625, -0.275726318359375, -0.25592041015625, -0.236114501953125, -0.21630859375, -0.196502685546875, -0.17669677734375, -0.156890869140625, -0.1370849609375, -0.117279052734375, -0.09747314453125, -0.077667236328125, -0.057861328125, -0.038055419921875, -0.01824951171875, 0.001556396484375, 0.0213623046875, 0.041168212890625, 0.06097412109375, 0.080780029296875, 0.1005859375, 0.120391845703125, 0.14019775390625, 0.160003662109375, 0.1798095703125, 0.199615478515625, 0.21942138671875, 0.239227294921875, 0.259033203125, 0.278839111328125, 0.29864501953125, 0.318450927734375, 0.3382568359375, 0.358062744140625, 0.37786865234375, 0.397674560546875, 0.41748046875, 0.437286376953125, 0.45709228515625, 0.476898193359375, 0.4967041015625, 0.516510009765625, 0.53631591796875, 0.556121826171875, 0.575927734375, 0.595733642578125, 0.61553955078125, 0.635345458984375, 0.6551513671875, 0.674957275390625, 0.69476318359375, 0.714569091796875, 0.734375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 3.0, 6.0, 10.0, 23.0, 22.0, 27.0, 31.0, 53.0, 56.0, 89.0, 107.0, 152.0, 262.0, 357.0, 560.0, 893.0, 1764.0, 4072.0, 13414.0, 69559.0, 1137590.0, 785859.0, 61596.0, 12389.0, 3968.0, 1719.0, 861.0, 553.0, 326.0, 231.0, 149.0, 114.0, 86.0, 53.0, 56.0, 32.0, 20.0, 22.0, 10.0, 10.0, 6.0, 8.0, 1.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25, -0.24106216430664062, -0.23212432861328125, -0.22318649291992188, -0.2142486572265625, -0.20531082153320312, -0.19637298583984375, -0.18743515014648438, -0.178497314453125, -0.16955947875976562, -0.16062164306640625, -0.15168380737304688, -0.1427459716796875, -0.13380813598632812, -0.12487030029296875, -0.11593246459960938, -0.10699462890625, -0.09805679321289062, -0.08911895751953125, -0.08018112182617188, -0.0712432861328125, -0.062305450439453125, -0.05336761474609375, -0.044429779052734375, -0.035491943359375, -0.026554107666015625, -0.01761627197265625, -0.008678436279296875, 0.0002593994140625, 0.009197235107421875, 0.01813507080078125, 0.027072906494140625, 0.0360107421875, 0.044948577880859375, 0.05388641357421875, 0.06282424926757812, 0.0717620849609375, 0.08069992065429688, 0.08963775634765625, 0.09857559204101562, 0.107513427734375, 0.11645126342773438, 0.12538909912109375, 0.13432693481445312, 0.1432647705078125, 0.15220260620117188, 0.16114044189453125, 0.17007827758789062, 0.17901611328125, 0.18795394897460938, 0.19689178466796875, 0.20582962036132812, 0.2147674560546875, 0.22370529174804688, 0.23264312744140625, 0.24158096313476562, 0.250518798828125, 0.2594566345214844, 0.26839447021484375, 0.2773323059082031, 0.2862701416015625, 0.2952079772949219, 0.30414581298828125, 0.3130836486816406, 0.322021484375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 2.0, 10.0, 11.0, 15.0, 15.0, 31.0, 40.0, 79.0, 103.0, 163.0, 168.0, 147.0, 70.0, 40.0, 31.0, 25.0, 9.0, 12.0, 3.0, 7.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029296875, -0.028487682342529297, -0.027678489685058594, -0.02686929702758789, -0.026060104370117188, -0.025250911712646484, -0.02444171905517578, -0.023632526397705078, -0.022823333740234375, -0.022014141082763672, -0.02120494842529297, -0.020395755767822266, -0.019586563110351562, -0.01877737045288086, -0.017968177795410156, -0.017158985137939453, -0.01634979248046875, -0.015540599822998047, -0.014731407165527344, -0.01392221450805664, -0.013113021850585938, -0.012303829193115234, -0.011494636535644531, -0.010685443878173828, -0.009876251220703125, -0.009067058563232422, -0.008257865905761719, -0.007448673248291016, -0.0066394805908203125, -0.005830287933349609, -0.005021095275878906, -0.004211902618408203, -0.0034027099609375, -0.002593517303466797, -0.0017843246459960938, -0.0009751319885253906, -0.0001659393310546875, 0.0006432533264160156, 0.0014524459838867188, 0.002261638641357422, 0.003070831298828125, 0.003880023956298828, 0.004689216613769531, 0.005498409271240234, 0.0063076019287109375, 0.007116794586181641, 0.007925987243652344, 0.008735179901123047, 0.00954437255859375, 0.010353565216064453, 0.011162757873535156, 0.01197195053100586, 0.012781143188476562, 0.013590335845947266, 0.014399528503417969, 0.015208721160888672, 0.016017913818359375, 0.016827106475830078, 0.01763629913330078, 0.018445491790771484, 0.019254684448242188, 0.02006387710571289, 0.020873069763183594, 0.021682262420654297, 0.022491455078125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 5.0, 5.0, 11.0, 23.0, 25.0, 51.0, 98.0, 257.0, 2466.0, 354991.0, 687205.0, 2830.0, 338.0, 88.0, 49.0, 38.0, 19.0, 20.0, 9.0, 0.0, 4.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.469482421875, -0.4527320861816406, -0.43598175048828125, -0.4192314147949219, -0.4024810791015625, -0.3857307434082031, -0.36898040771484375, -0.3522300720214844, -0.335479736328125, -0.3187294006347656, -0.30197906494140625, -0.2852287292480469, -0.2684783935546875, -0.2517280578613281, -0.23497772216796875, -0.21822738647460938, -0.20147705078125, -0.18472671508789062, -0.16797637939453125, -0.15122604370117188, -0.1344757080078125, -0.11772537231445312, -0.10097503662109375, -0.08422470092773438, -0.067474365234375, -0.050724029541015625, -0.03397369384765625, -0.017223358154296875, -0.0004730224609375, 0.016277313232421875, 0.03302764892578125, 0.049777984619140625, 0.0665283203125, 0.08327865600585938, 0.10002899169921875, 0.11677932739257812, 0.1335296630859375, 0.15027999877929688, 0.16703033447265625, 0.18378067016601562, 0.200531005859375, 0.21728134155273438, 0.23403167724609375, 0.2507820129394531, 0.2675323486328125, 0.2842826843261719, 0.30103302001953125, 0.3177833557128906, 0.33453369140625, 0.3512840270996094, 0.36803436279296875, 0.3847846984863281, 0.4015350341796875, 0.4182853698730469, 0.43503570556640625, 0.4517860412597656, 0.468536376953125, 0.4852867126464844, 0.5020370483398438, 0.5187873840332031, 0.5355377197265625, 0.5522880554199219, 0.5690383911132812, 0.5857887268066406, 0.6025390625]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 9.0, 32.0, 123.0, 426.0, 323.0, 77.0, 24.0, 3.0], "bins": [-0.2804708182811737, -0.2757810056209564, -0.27109119296073914, -0.26640138030052185, -0.26171156764030457, -0.25702178478240967, -0.2523319721221924, -0.2476421445608139, -0.2429523468017578, -0.23826253414154053, -0.23357272148132324, -0.22888292372226715, -0.22419311106204987, -0.21950329840183258, -0.2148134857416153, -0.210123673081398, -0.20543386042118073, -0.20074404776096344, -0.19605423510074615, -0.19136443734169006, -0.18667462468147278, -0.1819848120212555, -0.1772949993610382, -0.17260518670082092, -0.16791537404060364, -0.16322556138038635, -0.15853574872016907, -0.15384595096111298, -0.1491561383008957, -0.1444663256406784, -0.13977651298046112, -0.13508670032024384, -0.13039690256118774, -0.12570708990097046, -0.12101728469133377, -0.11632747203111649, -0.1116376668214798, -0.10694785416126251, -0.10225804150104523, -0.09756822884082794, -0.09287841618061066, -0.08818860352039337, -0.08349879831075668, -0.0788089856505394, -0.07411918044090271, -0.06942936778068542, -0.06473955512046814, -0.06004974618554115, -0.055359937250614166, -0.05067012831568718, -0.04598031938076019, -0.04129050672054291, -0.03660069778561592, -0.031910888850688934, -0.0272210780531168, -0.022531267255544662, -0.017841458320617676, -0.013151648454368114, -0.008461838588118553, -0.003772028721868992, 0.0009177811443805695, 0.005607590079307556, 0.010297400876879692, 0.014987211674451828, 0.019677020609378815]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 5.0, 5.0, 10.0, 7.0, 11.0, 15.0, 18.0, 26.0, 22.0, 31.0, 43.0, 31.0, 34.0, 36.0, 31.0, 35.0, 33.0, 37.0, 42.0, 43.0, 41.0, 40.0, 37.0, 40.0, 31.0, 38.0, 31.0, 26.0, 30.0, 26.0, 29.0, 20.0, 14.0, 14.0, 14.0, 8.0, 11.0, 10.0, 8.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023535728454589844, -0.02282014489173889, -0.02210456132888794, -0.021388977766036987, -0.020673394203186035, -0.019957810640335083, -0.01924222707748413, -0.01852664351463318, -0.017811059951782227, -0.017095476388931274, -0.016379892826080322, -0.01566430926322937, -0.014948725700378418, -0.014233142137527466, -0.013517558574676514, -0.012801975011825562, -0.01208639144897461, -0.011370807886123657, -0.010655224323272705, -0.009939640760421753, -0.0092240571975708, -0.008508473634719849, -0.0077928900718688965, -0.007077306509017944, -0.006361722946166992, -0.00564613938331604, -0.004930555820465088, -0.004214972257614136, -0.0034993886947631836, -0.0027838051319122314, -0.0020682215690612793, -0.0013526380062103271, -0.000637054443359375, 7.852911949157715e-05, 0.0007941126823425293, 0.0015096962451934814, 0.0022252798080444336, 0.0029408633708953857, 0.003656446933746338, 0.00437203049659729, 0.005087614059448242, 0.005803197622299194, 0.0065187811851501465, 0.007234364748001099, 0.00794994831085205, 0.008665531873703003, 0.009381115436553955, 0.010096698999404907, 0.01081228256225586, 0.011527866125106812, 0.012243449687957764, 0.012959033250808716, 0.013674616813659668, 0.01439020037651062, 0.015105783939361572, 0.015821367502212524, 0.016536951065063477, 0.01725253462791443, 0.01796811819076538, 0.018683701753616333, 0.019399285316467285, 0.020114868879318237, 0.02083045244216919, 0.02154603600502014, 0.022261619567871094]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 7.0, 7.0, 7.0, 13.0, 5.0, 10.0, 10.0, 22.0, 16.0, 14.0, 24.0, 21.0, 23.0, 30.0, 36.0, 41.0, 39.0, 37.0, 43.0, 43.0, 31.0, 50.0, 44.0, 47.0, 41.0, 45.0, 29.0, 37.0, 27.0, 36.0, 20.0, 27.0, 16.0, 17.0, 11.0, 15.0, 8.0, 10.0, 13.0, 6.0, 7.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.9443359375, -0.9150466918945312, -0.8857574462890625, -0.8564682006835938, -0.827178955078125, -0.7978897094726562, -0.7686004638671875, -0.7393112182617188, -0.71002197265625, -0.6807327270507812, -0.6514434814453125, -0.6221542358398438, -0.592864990234375, -0.5635757446289062, -0.5342864990234375, -0.5049972534179688, -0.4757080078125, -0.44641876220703125, -0.4171295166015625, -0.38784027099609375, -0.358551025390625, -0.32926177978515625, -0.2999725341796875, -0.27068328857421875, -0.24139404296875, -0.21210479736328125, -0.1828155517578125, -0.15352630615234375, -0.124237060546875, -0.09494781494140625, -0.0656585693359375, -0.03636932373046875, -0.007080078125, 0.02220916748046875, 0.0514984130859375, 0.08078765869140625, 0.110076904296875, 0.13936614990234375, 0.1686553955078125, 0.19794464111328125, 0.22723388671875, 0.25652313232421875, 0.2858123779296875, 0.31510162353515625, 0.344390869140625, 0.37368011474609375, 0.4029693603515625, 0.43225860595703125, 0.4615478515625, 0.49083709716796875, 0.5201263427734375, 0.5494155883789062, 0.578704833984375, 0.6079940795898438, 0.6372833251953125, 0.6665725708007812, 0.69586181640625, 0.7251510620117188, 0.7544403076171875, 0.7837295532226562, 0.813018798828125, 0.8423080444335938, 0.8715972900390625, 0.9008865356445312, 0.93017578125]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 5.0, 11.0, 7.0, 10.0, 16.0, 23.0, 40.0, 54.0, 69.0, 109.0, 130.0, 204.0, 312.0, 448.0, 641.0, 1077.0, 1597.0, 2368.0, 3853.0, 6345.0, 10195.0, 16304.0, 25855.0, 42291.0, 69604.0, 115133.0, 194751.0, 221403.0, 130772.0, 79029.0, 47813.0, 29420.0, 17684.0, 11430.0, 7109.0, 4401.0, 2776.0, 1779.0, 1197.0, 713.0, 509.0, 331.0, 238.0, 149.0, 117.0, 70.0, 52.0, 39.0, 20.0, 20.0, 10.0, 10.0, 7.0, 6.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.91845703125, -0.888946533203125, -0.85943603515625, -0.829925537109375, -0.8004150390625, -0.770904541015625, -0.74139404296875, -0.711883544921875, -0.682373046875, -0.652862548828125, -0.62335205078125, -0.593841552734375, -0.5643310546875, -0.534820556640625, -0.50531005859375, -0.475799560546875, -0.4462890625, -0.416778564453125, -0.38726806640625, -0.357757568359375, -0.3282470703125, -0.298736572265625, -0.26922607421875, -0.239715576171875, -0.210205078125, -0.180694580078125, -0.15118408203125, -0.121673583984375, -0.0921630859375, -0.062652587890625, -0.03314208984375, -0.003631591796875, 0.02587890625, 0.055389404296875, 0.08489990234375, 0.114410400390625, 0.1439208984375, 0.173431396484375, 0.20294189453125, 0.232452392578125, 0.261962890625, 0.291473388671875, 0.32098388671875, 0.350494384765625, 0.3800048828125, 0.409515380859375, 0.43902587890625, 0.468536376953125, 0.498046875, 0.527557373046875, 0.55706787109375, 0.586578369140625, 0.6160888671875, 0.645599365234375, 0.67510986328125, 0.704620361328125, 0.734130859375, 0.763641357421875, 0.79315185546875, 0.822662353515625, 0.8521728515625, 0.881683349609375, 0.91119384765625, 0.940704345703125, 0.97021484375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 8.0, 3.0, 3.0, 7.0, 15.0, 9.0, 13.0, 19.0, 21.0, 27.0, 20.0, 25.0, 34.0, 41.0, 40.0, 52.0, 61.0, 102.0, 171.0, 264.0, 1309.0, 201.0, 122.0, 68.0, 43.0, 62.0, 29.0, 46.0, 30.0, 28.0, 32.0, 18.0, 20.0, 19.0, 18.0, 16.0, 12.0, 10.0, 8.0, 10.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.91796875, -2.83251953125, -2.7470703125, -2.66162109375, -2.576171875, -2.49072265625, -2.4052734375, -2.31982421875, -2.234375, -2.14892578125, -2.0634765625, -1.97802734375, -1.892578125, -1.80712890625, -1.7216796875, -1.63623046875, -1.55078125, -1.46533203125, -1.3798828125, -1.29443359375, -1.208984375, -1.12353515625, -1.0380859375, -0.95263671875, -0.8671875, -0.78173828125, -0.6962890625, -0.61083984375, -0.525390625, -0.43994140625, -0.3544921875, -0.26904296875, -0.18359375, -0.09814453125, -0.0126953125, 0.07275390625, 0.158203125, 0.24365234375, 0.3291015625, 0.41455078125, 0.5, 0.58544921875, 0.6708984375, 0.75634765625, 0.841796875, 0.92724609375, 1.0126953125, 1.09814453125, 1.18359375, 1.26904296875, 1.3544921875, 1.43994140625, 1.525390625, 1.61083984375, 1.6962890625, 1.78173828125, 1.8671875, 1.95263671875, 2.0380859375, 2.12353515625, 2.208984375, 2.29443359375, 2.3798828125, 2.46533203125, 2.55078125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 8.0, 6.0, 6.0, 12.0, 16.0, 26.0, 41.0, 47.0, 72.0, 97.0, 152.0, 226.0, 434.0, 771.0, 2361.0, 28310.0, 2422492.0, 677040.0, 10587.0, 1506.0, 587.0, 331.0, 183.0, 137.0, 75.0, 62.0, 36.0, 20.0, 19.0, 13.0, 13.0, 6.0, 4.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.046875, -6.7938232421875, -6.540771484375, -6.2877197265625, -6.03466796875, -5.7816162109375, -5.528564453125, -5.2755126953125, -5.0224609375, -4.7694091796875, -4.516357421875, -4.2633056640625, -4.01025390625, -3.7572021484375, -3.504150390625, -3.2510986328125, -2.998046875, -2.7449951171875, -2.491943359375, -2.2388916015625, -1.98583984375, -1.7327880859375, -1.479736328125, -1.2266845703125, -0.9736328125, -0.7205810546875, -0.467529296875, -0.2144775390625, 0.03857421875, 0.2916259765625, 0.544677734375, 0.7977294921875, 1.05078125, 1.3038330078125, 1.556884765625, 1.8099365234375, 2.06298828125, 2.3160400390625, 2.569091796875, 2.8221435546875, 3.0751953125, 3.3282470703125, 3.581298828125, 3.8343505859375, 4.08740234375, 4.3404541015625, 4.593505859375, 4.8465576171875, 5.099609375, 5.3526611328125, 5.605712890625, 5.8587646484375, 6.11181640625, 6.3648681640625, 6.617919921875, 6.8709716796875, 7.1240234375, 7.3770751953125, 7.630126953125, 7.8831787109375, 8.13623046875, 8.3892822265625, 8.642333984375, 8.8953857421875, 9.1484375]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 9.0, 38.0, 177.0, 418.0, 264.0, 97.0, 12.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.396899223327637, -4.594367027282715, -3.791834592819214, -2.989302158355713, -2.186769962310791, -1.3842377662658691, -0.5817050933837891, 0.2208271026611328, 1.0233592987060547, 1.8258916139602661, 2.6284239292144775, 3.4309563636779785, 4.2334885597229, 5.036020755767822, 5.838553428649902, 6.641085624694824, 7.443617820739746, 8.246150016784668, 9.04868221282959, 9.851215362548828, 10.65374755859375, 11.456279754638672, 12.258811950683594, 13.061344146728516, 13.863876342773438, 14.66640853881836, 15.468940734863281, 16.271472930908203, 17.074005126953125, 17.876537322998047, 18.67906951904297, 19.48160171508789, 20.284133911132812, 21.086666107177734, 21.889198303222656, 22.691730499267578, 23.4942626953125, 24.296794891357422, 25.099327087402344, 25.901859283447266, 26.704391479492188, 27.50692367553711, 28.30945587158203, 29.111988067626953, 29.914520263671875, 30.717052459716797, 31.51958465576172, 32.32211685180664, 33.12464904785156, 33.927181243896484, 34.729713439941406, 35.53224563598633, 36.33477783203125, 37.13731002807617, 37.939842224121094, 38.742374420166016, 39.5449104309082, 40.347442626953125, 41.14997482299805, 41.95250701904297, 42.75503921508789, 43.55757141113281, 44.360103607177734, 45.162635803222656, 45.96516799926758]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 4.0, 5.0, 4.0, 8.0, 5.0, 8.0, 15.0, 21.0, 18.0, 21.0, 29.0, 32.0, 26.0, 36.0, 25.0, 38.0, 35.0, 52.0, 36.0, 31.0, 42.0, 34.0, 46.0, 44.0, 37.0, 44.0, 37.0, 33.0, 39.0, 25.0, 26.0, 27.0, 22.0, 18.0, 14.0, 18.0, 13.0, 9.0, 9.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.773736953735352, -6.5481743812561035, -6.322611331939697, -6.097048759460449, -5.871485710144043, -5.645923137664795, -5.420360565185547, -5.194797515869141, -4.969234943389893, -4.7436723709106445, -4.518109321594238, -4.29254674911499, -4.066984176635742, -3.841421127319336, -3.615858554840088, -3.3902957439422607, -3.1647329330444336, -2.9391701221466064, -2.7136073112487793, -2.4880447387695312, -2.262481927871704, -2.036919116973877, -1.8113564252853394, -1.5857937335968018, -1.3602309226989746, -1.1346681118011475, -0.9091054201126099, -0.6835426688194275, -0.4579799175262451, -0.23241710662841797, -0.006854414939880371, 0.21870827674865723, 0.4442715644836426, 0.669834315776825, 0.8953970670700073, 1.120959758758545, 1.346522569656372, 1.5720853805541992, 1.7976480722427368, 2.0232107639312744, 2.2487735748291016, 2.4743363857269287, 2.699899196624756, 2.925461769104004, 3.151024580001831, 3.376587390899658, 3.6021499633789062, 3.8277127742767334, 4.0532755851745605, 4.278838157653809, 4.504401206970215, 4.729963779449463, 4.955526351928711, 5.181089401245117, 5.406651973724365, 5.632214546203613, 5.8577775955200195, 6.083340167999268, 6.308903217315674, 6.534465789794922, 6.760028839111328, 6.985591411590576, 7.211153984069824, 7.4367170333862305, 7.6622796058654785]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 8.0, 7.0, 12.0, 4.0, 13.0, 8.0, 11.0, 11.0, 15.0, 26.0, 28.0, 26.0, 27.0, 32.0, 45.0, 43.0, 42.0, 46.0, 37.0, 29.0, 37.0, 52.0, 46.0, 38.0, 46.0, 34.0, 40.0, 17.0, 28.0, 37.0, 21.0, 27.0, 15.0, 15.0, 12.0, 13.0, 12.0, 8.0, 5.0, 6.0, 7.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9873046875, -0.9558868408203125, -0.924468994140625, -0.8930511474609375, -0.86163330078125, -0.8302154541015625, -0.798797607421875, -0.7673797607421875, -0.7359619140625, -0.7045440673828125, -0.673126220703125, -0.6417083740234375, -0.61029052734375, -0.5788726806640625, -0.547454833984375, -0.5160369873046875, -0.484619140625, -0.4532012939453125, -0.421783447265625, -0.3903656005859375, -0.35894775390625, -0.3275299072265625, -0.296112060546875, -0.2646942138671875, -0.2332763671875, -0.2018585205078125, -0.170440673828125, -0.1390228271484375, -0.10760498046875, -0.0761871337890625, -0.044769287109375, -0.0133514404296875, 0.01806640625, 0.0494842529296875, 0.080902099609375, 0.1123199462890625, 0.14373779296875, 0.1751556396484375, 0.206573486328125, 0.2379913330078125, 0.2694091796875, 0.3008270263671875, 0.332244873046875, 0.3636627197265625, 0.39508056640625, 0.4264984130859375, 0.457916259765625, 0.4893341064453125, 0.520751953125, 0.5521697998046875, 0.583587646484375, 0.6150054931640625, 0.64642333984375, 0.6778411865234375, 0.709259033203125, 0.7406768798828125, 0.7720947265625, 0.8035125732421875, 0.834930419921875, 0.8663482666015625, 0.89776611328125, 0.9291839599609375, 0.960601806640625, 0.9920196533203125, 1.0234375]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 6.0, 11.0, 11.0, 15.0, 16.0, 28.0, 38.0, 51.0, 86.0, 124.0, 158.0, 257.0, 393.0, 680.0, 1042.0, 1887.0, 3486.0, 7023.0, 15259.0, 41202.0, 144330.0, 745077.0, 2271457.0, 744884.0, 145596.0, 41189.0, 15300.0, 6755.0, 3308.0, 1795.0, 1073.0, 622.0, 356.0, 252.0, 130.0, 111.0, 79.0, 54.0, 42.0, 22.0, 23.0, 14.0, 11.0, 2.0, 7.0, 3.0, 5.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8486328125, -1.7837677001953125, -1.718902587890625, -1.6540374755859375, -1.58917236328125, -1.5243072509765625, -1.459442138671875, -1.3945770263671875, -1.3297119140625, -1.2648468017578125, -1.199981689453125, -1.1351165771484375, -1.07025146484375, -1.0053863525390625, -0.940521240234375, -0.8756561279296875, -0.810791015625, -0.7459259033203125, -0.681060791015625, -0.6161956787109375, -0.55133056640625, -0.4864654541015625, -0.421600341796875, -0.3567352294921875, -0.2918701171875, -0.2270050048828125, -0.162139892578125, -0.0972747802734375, -0.03240966796875, 0.0324554443359375, 0.097320556640625, 0.1621856689453125, 0.22705078125, 0.2919158935546875, 0.356781005859375, 0.4216461181640625, 0.48651123046875, 0.5513763427734375, 0.616241455078125, 0.6811065673828125, 0.7459716796875, 0.8108367919921875, 0.875701904296875, 0.9405670166015625, 1.00543212890625, 1.0702972412109375, 1.135162353515625, 1.2000274658203125, 1.264892578125, 1.3297576904296875, 1.394622802734375, 1.4594879150390625, 1.52435302734375, 1.5892181396484375, 1.654083251953125, 1.7189483642578125, 1.7838134765625, 1.8486785888671875, 1.913543701171875, 1.9784088134765625, 2.04327392578125, 2.1081390380859375, 2.173004150390625, 2.2378692626953125, 2.302734375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 3.0, 10.0, 8.0, 8.0, 15.0, 24.0, 39.0, 35.0, 50.0, 53.0, 70.0, 100.0, 143.0, 180.0, 214.0, 287.0, 400.0, 460.0, 461.0, 351.0, 274.0, 203.0, 157.0, 136.0, 90.0, 68.0, 50.0, 40.0, 35.0, 26.0, 19.0, 14.0, 7.0, 4.0, 7.0, 6.0, 11.0, 2.0, 4.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.513671875, -1.4626617431640625, -1.411651611328125, -1.3606414794921875, -1.30963134765625, -1.2586212158203125, -1.207611083984375, -1.1566009521484375, -1.1055908203125, -1.0545806884765625, -1.003570556640625, -0.9525604248046875, -0.90155029296875, -0.8505401611328125, -0.799530029296875, -0.7485198974609375, -0.697509765625, -0.6464996337890625, -0.595489501953125, -0.5444793701171875, -0.49346923828125, -0.4424591064453125, -0.391448974609375, -0.3404388427734375, -0.2894287109375, -0.2384185791015625, -0.187408447265625, -0.1363983154296875, -0.08538818359375, -0.0343780517578125, 0.016632080078125, 0.0676422119140625, 0.11865234375, 0.1696624755859375, 0.220672607421875, 0.2716827392578125, 0.32269287109375, 0.3737030029296875, 0.424713134765625, 0.4757232666015625, 0.5267333984375, 0.5777435302734375, 0.628753662109375, 0.6797637939453125, 0.73077392578125, 0.7817840576171875, 0.832794189453125, 0.8838043212890625, 0.934814453125, 0.9858245849609375, 1.036834716796875, 1.0878448486328125, 1.13885498046875, 1.1898651123046875, 1.240875244140625, 1.2918853759765625, 1.3428955078125, 1.3939056396484375, 1.444915771484375, 1.4959259033203125, 1.54693603515625, 1.5979461669921875, 1.648956298828125, 1.6999664306640625, 1.7509765625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 5.0, 3.0, 5.0, 6.0, 10.0, 20.0, 33.0, 27.0, 34.0, 49.0, 55.0, 68.0, 139.0, 187.0, 334.0, 1020.0, 4668.0, 56044.0, 3039947.0, 1061946.0, 25224.0, 2911.0, 702.0, 292.0, 152.0, 105.0, 63.0, 54.0, 48.0, 40.0, 32.0, 13.0, 18.0, 5.0, 7.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.0859375, -7.83990478515625, -7.5938720703125, -7.34783935546875, -7.101806640625, -6.85577392578125, -6.6097412109375, -6.36370849609375, -6.11767578125, -5.87164306640625, -5.6256103515625, -5.37957763671875, -5.133544921875, -4.88751220703125, -4.6414794921875, -4.39544677734375, -4.1494140625, -3.90338134765625, -3.6573486328125, -3.41131591796875, -3.165283203125, -2.91925048828125, -2.6732177734375, -2.42718505859375, -2.18115234375, -1.93511962890625, -1.6890869140625, -1.44305419921875, -1.197021484375, -0.95098876953125, -0.7049560546875, -0.45892333984375, -0.212890625, 0.03314208984375, 0.2791748046875, 0.52520751953125, 0.771240234375, 1.01727294921875, 1.2633056640625, 1.50933837890625, 1.75537109375, 2.00140380859375, 2.2474365234375, 2.49346923828125, 2.739501953125, 2.98553466796875, 3.2315673828125, 3.47760009765625, 3.7236328125, 3.96966552734375, 4.2156982421875, 4.46173095703125, 4.707763671875, 4.95379638671875, 5.1998291015625, 5.44586181640625, 5.69189453125, 5.93792724609375, 6.1839599609375, 6.42999267578125, 6.676025390625, 6.92205810546875, 7.1680908203125, 7.41412353515625, 7.66015625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 17.0, 65.0, 141.0, 239.0, 271.0, 158.0, 75.0, 29.0, 11.0, 6.0, 1.0, 2.0], "bins": [-44.41216278076172, -43.619407653808594, -42.82665252685547, -42.03389358520508, -41.24113845825195, -40.44838333129883, -39.6556282043457, -38.86286926269531, -38.07011413574219, -37.27735900878906, -36.48460388183594, -35.69184494018555, -34.89908981323242, -34.1063346862793, -33.31357955932617, -32.52082061767578, -31.72806739807129, -30.935312271118164, -30.142555236816406, -29.34980010986328, -28.557043075561523, -27.7642879486084, -26.97153091430664, -26.178775787353516, -25.38602066040039, -24.593265533447266, -23.800508499145508, -23.007753372192383, -22.214996337890625, -21.4222412109375, -20.629486083984375, -19.836729049682617, -19.04397201538086, -18.251216888427734, -17.458459854125977, -16.66570472717285, -15.872947692871094, -15.080192565917969, -14.287436485290527, -13.494680404663086, -12.701925277709961, -11.90916919708252, -11.116413116455078, -10.323657989501953, -9.530900955200195, -8.73814582824707, -7.945389747619629, -7.1526336669921875, -6.359877586364746, -5.567121505737305, -4.774365425109863, -3.98160982131958, -3.1888537406921387, -2.3960976600646973, -1.603342056274414, -0.8105859756469727, -0.01782989501953125, 0.7749260663986206, 1.5676820278167725, 2.3604378700256348, 3.153193950653076, 3.9459500312805176, 4.738705635070801, 5.531461715698242, 6.324217796325684]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 3.0, 4.0, 11.0, 9.0, 9.0, 14.0, 11.0, 16.0, 18.0, 28.0, 17.0, 25.0, 32.0, 27.0, 29.0, 34.0, 34.0, 39.0, 38.0, 29.0, 31.0, 42.0, 45.0, 30.0, 29.0, 38.0, 47.0, 31.0, 38.0, 27.0, 27.0, 22.0, 23.0, 26.0, 23.0, 14.0, 12.0, 10.0, 10.0, 6.0, 12.0, 6.0, 8.0, 3.0, 3.0, 4.0, 3.0, 0.0, 5.0, 0.0, 0.0, 2.0], "bins": [-6.043004512786865, -5.864861488342285, -5.686717987060547, -5.508574962615967, -5.330431938171387, -5.152288913726807, -4.974145889282227, -4.796002388000488, -4.617859363555908, -4.439716339111328, -4.26157283782959, -4.08342981338501, -3.9052867889404297, -3.7271437644958496, -3.5490005016326904, -3.3708572387695312, -3.192714214324951, -3.014571189880371, -2.836427927017212, -2.6582846641540527, -2.4801416397094727, -2.3019986152648926, -2.1238553524017334, -1.9457122087478638, -1.7675690650939941, -1.5894259214401245, -1.4112827777862549, -1.2331396341323853, -1.0549964904785156, -0.876853346824646, -0.6987102031707764, -0.5205670595169067, -0.3424234390258789, -0.16428029537200928, 0.013862848281860352, 0.19200599193572998, 0.3701491355895996, 0.5482922792434692, 0.7264354228973389, 0.9045785665512085, 1.0827217102050781, 1.2608648538589478, 1.4390079975128174, 1.617151141166687, 1.7952942848205566, 1.9734374284744263, 2.151580572128296, 2.329723834991455, 2.507866859436035, 2.6860098838806152, 2.8641531467437744, 3.0422964096069336, 3.2204394340515137, 3.3985824584960938, 3.576725721359253, 3.754868984222412, 3.933012008666992, 4.111155033111572, 4.289298057556152, 4.467441558837891, 4.645584583282471, 4.823727607727051, 5.001871109008789, 5.180014133453369, 5.358157157897949]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 5.0, 6.0, 5.0, 8.0, 8.0, 14.0, 14.0, 15.0, 23.0, 25.0, 21.0, 25.0, 24.0, 31.0, 42.0, 35.0, 32.0, 55.0, 42.0, 59.0, 38.0, 51.0, 54.0, 41.0, 37.0, 37.0, 33.0, 35.0, 31.0, 27.0, 34.0, 24.0, 14.0, 10.0, 13.0, 9.0, 8.0, 7.0, 3.0, 2.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1630859375, -1.129150390625, -1.09521484375, -1.061279296875, -1.02734375, -0.993408203125, -0.95947265625, -0.925537109375, -0.8916015625, -0.857666015625, -0.82373046875, -0.789794921875, -0.755859375, -0.721923828125, -0.68798828125, -0.654052734375, -0.6201171875, -0.586181640625, -0.55224609375, -0.518310546875, -0.484375, -0.450439453125, -0.41650390625, -0.382568359375, -0.3486328125, -0.314697265625, -0.28076171875, -0.246826171875, -0.212890625, -0.178955078125, -0.14501953125, -0.111083984375, -0.0771484375, -0.043212890625, -0.00927734375, 0.024658203125, 0.05859375, 0.092529296875, 0.12646484375, 0.160400390625, 0.1943359375, 0.228271484375, 0.26220703125, 0.296142578125, 0.330078125, 0.364013671875, 0.39794921875, 0.431884765625, 0.4658203125, 0.499755859375, 0.53369140625, 0.567626953125, 0.6015625, 0.635498046875, 0.66943359375, 0.703369140625, 0.7373046875, 0.771240234375, 0.80517578125, 0.839111328125, 0.873046875, 0.906982421875, 0.94091796875, 0.974853515625, 1.0087890625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 2.0, 7.0, 7.0, 12.0, 19.0, 30.0, 43.0, 57.0, 93.0, 150.0, 237.0, 371.0, 593.0, 970.0, 1545.0, 2687.0, 4504.0, 7970.0, 14400.0, 27321.0, 52805.0, 106882.0, 206834.0, 271227.0, 170934.0, 85639.0, 42737.0, 22324.0, 12164.0, 6648.0, 3764.0, 2120.0, 1318.0, 793.0, 450.0, 301.0, 196.0, 147.0, 75.0, 59.0, 47.0, 25.0, 26.0, 16.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1719970703125, -0.16570663452148438, -0.15941619873046875, -0.15312576293945312, -0.1468353271484375, -0.14054489135742188, -0.13425445556640625, -0.12796401977539062, -0.121673583984375, -0.11538314819335938, -0.10909271240234375, -0.10280227661132812, -0.0965118408203125, -0.09022140502929688, -0.08393096923828125, -0.07764053344726562, -0.07135009765625, -0.06505966186523438, -0.05876922607421875, -0.052478790283203125, -0.0461883544921875, -0.039897918701171875, -0.03360748291015625, -0.027317047119140625, -0.021026611328125, -0.014736175537109375, -0.00844573974609375, -0.002155303955078125, 0.0041351318359375, 0.010425567626953125, 0.01671600341796875, 0.023006439208984375, 0.029296875, 0.035587310791015625, 0.04187774658203125, 0.048168182373046875, 0.0544586181640625, 0.060749053955078125, 0.06703948974609375, 0.07332992553710938, 0.079620361328125, 0.08591079711914062, 0.09220123291015625, 0.09849166870117188, 0.1047821044921875, 0.11107254028320312, 0.11736297607421875, 0.12365341186523438, 0.12994384765625, 0.13623428344726562, 0.14252471923828125, 0.14881515502929688, 0.1551055908203125, 0.16139602661132812, 0.16768646240234375, 0.17397689819335938, 0.180267333984375, 0.18655776977539062, 0.19284820556640625, 0.19913864135742188, 0.2054290771484375, 0.21171951293945312, 0.21800994873046875, 0.22430038452148438, 0.2305908203125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 8.0, 10.0, 13.0, 11.0, 11.0, 21.0, 19.0, 19.0, 13.0, 26.0, 29.0, 34.0, 42.0, 42.0, 45.0, 41.0, 49.0, 46.0, 1066.0, 41.0, 53.0, 33.0, 45.0, 43.0, 32.0, 34.0, 28.0, 25.0, 21.0, 19.0, 23.0, 18.0, 10.0, 16.0, 9.0, 5.0, 4.0, 8.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.80517578125, -0.78204345703125, -0.7589111328125, -0.73577880859375, -0.712646484375, -0.68951416015625, -0.6663818359375, -0.64324951171875, -0.6201171875, -0.59698486328125, -0.5738525390625, -0.55072021484375, -0.527587890625, -0.50445556640625, -0.4813232421875, -0.45819091796875, -0.43505859375, -0.41192626953125, -0.3887939453125, -0.36566162109375, -0.342529296875, -0.31939697265625, -0.2962646484375, -0.27313232421875, -0.25, -0.22686767578125, -0.2037353515625, -0.18060302734375, -0.157470703125, -0.13433837890625, -0.1112060546875, -0.08807373046875, -0.06494140625, -0.04180908203125, -0.0186767578125, 0.00445556640625, 0.027587890625, 0.05072021484375, 0.0738525390625, 0.09698486328125, 0.1201171875, 0.14324951171875, 0.1663818359375, 0.18951416015625, 0.212646484375, 0.23577880859375, 0.2589111328125, 0.28204345703125, 0.30517578125, 0.32830810546875, 0.3514404296875, 0.37457275390625, 0.397705078125, 0.42083740234375, 0.4439697265625, 0.46710205078125, 0.490234375, 0.51336669921875, 0.5364990234375, 0.55963134765625, 0.582763671875, 0.60589599609375, 0.6290283203125, 0.65216064453125, 0.67529296875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 8.0, 5.0, 9.0, 12.0, 22.0, 19.0, 37.0, 41.0, 51.0, 85.0, 121.0, 187.0, 245.0, 374.0, 584.0, 949.0, 1624.0, 2838.0, 5034.0, 9800.0, 20734.0, 49628.0, 138658.0, 886289.0, 759568.0, 131395.0, 47222.0, 20245.0, 9420.0, 4858.0, 2712.0, 1522.0, 939.0, 616.0, 417.0, 252.0, 180.0, 119.0, 94.0, 57.0, 35.0, 36.0, 23.0, 16.0, 12.0, 15.0, 8.0, 7.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0], "bins": [-0.185791015625, -0.18032264709472656, -0.17485427856445312, -0.1693859100341797, -0.16391754150390625, -0.1584491729736328, -0.15298080444335938, -0.14751243591308594, -0.1420440673828125, -0.13657569885253906, -0.13110733032226562, -0.1256389617919922, -0.12017059326171875, -0.11470222473144531, -0.10923385620117188, -0.10376548767089844, -0.098297119140625, -0.09282875061035156, -0.08736038208007812, -0.08189201354980469, -0.07642364501953125, -0.07095527648925781, -0.06548690795898438, -0.06001853942871094, -0.0545501708984375, -0.04908180236816406, -0.043613433837890625, -0.03814506530761719, -0.03267669677734375, -0.027208328247070312, -0.021739959716796875, -0.016271591186523438, -0.01080322265625, -0.0053348541259765625, 0.000133514404296875, 0.0056018829345703125, 0.01107025146484375, 0.016538619995117188, 0.022006988525390625, 0.027475357055664062, 0.0329437255859375, 0.03841209411621094, 0.043880462646484375, 0.04934883117675781, 0.05481719970703125, 0.06028556823730469, 0.06575393676757812, 0.07122230529785156, 0.076690673828125, 0.08215904235839844, 0.08762741088867188, 0.09309577941894531, 0.09856414794921875, 0.10403251647949219, 0.10950088500976562, 0.11496925354003906, 0.1204376220703125, 0.12590599060058594, 0.13137435913085938, 0.1368427276611328, 0.14231109619140625, 0.1477794647216797, 0.15324783325195312, 0.15871620178222656, 0.1641845703125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 7.0, 13.0, 13.0, 28.0, 24.0, 50.0, 72.0, 100.0, 145.0, 140.0, 111.0, 104.0, 52.0, 43.0, 31.0, 25.0, 14.0, 8.0, 6.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040802001953125, -0.0394902229309082, -0.038178443908691406, -0.03686666488647461, -0.03555488586425781, -0.034243106842041016, -0.03293132781982422, -0.03161954879760742, -0.030307769775390625, -0.028995990753173828, -0.02768421173095703, -0.026372432708740234, -0.025060653686523438, -0.02374887466430664, -0.022437095642089844, -0.021125316619873047, -0.01981353759765625, -0.018501758575439453, -0.017189979553222656, -0.01587820053100586, -0.014566421508789062, -0.013254642486572266, -0.011942863464355469, -0.010631084442138672, -0.009319305419921875, -0.008007526397705078, -0.006695747375488281, -0.005383968353271484, -0.0040721893310546875, -0.0027604103088378906, -0.0014486312866210938, -0.00013685226440429688, 0.0011749267578125, 0.002486705780029297, 0.0037984848022460938, 0.005110263824462891, 0.0064220428466796875, 0.007733821868896484, 0.009045600891113281, 0.010357379913330078, 0.011669158935546875, 0.012980937957763672, 0.014292716979980469, 0.015604496002197266, 0.016916275024414062, 0.01822805404663086, 0.019539833068847656, 0.020851612091064453, 0.02216339111328125, 0.023475170135498047, 0.024786949157714844, 0.02609872817993164, 0.027410507202148438, 0.028722286224365234, 0.03003406524658203, 0.03134584426879883, 0.032657623291015625, 0.03396940231323242, 0.03528118133544922, 0.036592960357666016, 0.03790473937988281, 0.03921651840209961, 0.040528297424316406, 0.0418400764465332, 0.04315185546875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 10.0, 6.0, 9.0, 12.0, 24.0, 28.0, 49.0, 83.0, 207.0, 830.0, 42743.0, 1001988.0, 2040.0, 284.0, 86.0, 52.0, 29.0, 25.0, 17.0, 8.0, 5.0, 9.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9111328125, -0.8828201293945312, -0.8545074462890625, -0.8261947631835938, -0.797882080078125, -0.7695693969726562, -0.7412567138671875, -0.7129440307617188, -0.68463134765625, -0.6563186645507812, -0.6280059814453125, -0.5996932983398438, -0.571380615234375, -0.5430679321289062, -0.5147552490234375, -0.48644256591796875, -0.4581298828125, -0.42981719970703125, -0.4015045166015625, -0.37319183349609375, -0.344879150390625, -0.31656646728515625, -0.2882537841796875, -0.25994110107421875, -0.23162841796875, -0.20331573486328125, -0.1750030517578125, -0.14669036865234375, -0.118377685546875, -0.09006500244140625, -0.0617523193359375, -0.03343963623046875, -0.005126953125, 0.02318572998046875, 0.0514984130859375, 0.07981109619140625, 0.108123779296875, 0.13643646240234375, 0.1647491455078125, 0.19306182861328125, 0.22137451171875, 0.24968719482421875, 0.2779998779296875, 0.30631256103515625, 0.334625244140625, 0.36293792724609375, 0.3912506103515625, 0.41956329345703125, 0.4478759765625, 0.47618865966796875, 0.5045013427734375, 0.5328140258789062, 0.561126708984375, 0.5894393920898438, 0.6177520751953125, 0.6460647583007812, 0.67437744140625, 0.7026901245117188, 0.7310028076171875, 0.7593154907226562, 0.787628173828125, 0.8159408569335938, 0.8442535400390625, 0.8725662231445312, 0.90087890625]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 9.0, 11.0, 6.0, 13.0, 22.0, 30.0, 33.0, 58.0, 70.0, 92.0, 99.0, 126.0, 112.0, 103.0, 81.0, 51.0, 25.0, 21.0, 11.0, 12.0, 13.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03421332314610481, -0.03276054188609123, -0.03130776062607765, -0.029854977503418922, -0.028402196243405342, -0.026949413120746613, -0.025496631860733032, -0.024043850600719452, -0.02259106934070587, -0.02113828808069229, -0.01968550495803356, -0.01823272369801998, -0.0167799424380064, -0.015327160246670246, -0.013874378055334091, -0.01242159679532051, -0.010968813672661781, -0.009516031481325626, -0.008063250221312046, -0.006610468029975891, -0.0051576863043010235, -0.003704904578626156, -0.002252122387290001, -0.0007993411272764206, 0.0006534410640597343, 0.002106222789734602, 0.0035590047482401133, 0.0050117867067456245, 0.006464568432420492, 0.00791735015809536, 0.009370132349431515, 0.010822913609445095, 0.01227569580078125, 0.013728477992117405, 0.015181259252130985, 0.01663404144346714, 0.01808682270348072, 0.01953960582613945, 0.02099238708615303, 0.02244516834616661, 0.02389794960618019, 0.02535073086619377, 0.0268035139888525, 0.02825629524886608, 0.02970907650887966, 0.03116185963153839, 0.03261464089155197, 0.03406742215156555, 0.03552020341157913, 0.03697298467159271, 0.03842576593160629, 0.03987854719161987, 0.04133133217692375, 0.04278411343693733, 0.04423689469695091, 0.04568967595696449, 0.04714246094226837, 0.04859524220228195, 0.05004802346229553, 0.05150080472230911, 0.05295358970761299, 0.05440637096762657, 0.05585915222764015, 0.05731193348765373, 0.05876471474766731]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 7.0, 3.0, 6.0, 8.0, 8.0, 13.0, 15.0, 20.0, 8.0, 28.0, 27.0, 27.0, 14.0, 30.0, 26.0, 31.0, 28.0, 32.0, 31.0, 35.0, 45.0, 40.0, 35.0, 45.0, 39.0, 38.0, 31.0, 32.0, 26.0, 35.0, 25.0, 37.0, 17.0, 22.0, 18.0, 21.0, 23.0, 14.0, 13.0, 10.0, 5.0, 10.0, 9.0, 5.0, 2.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.028901875019073486, -0.027948113158345222, -0.02699435129761696, -0.026040589436888695, -0.02508682757616043, -0.024133065715432167, -0.023179303854703903, -0.02222554199397564, -0.021271780133247375, -0.02031801827251911, -0.019364256411790848, -0.018410494551062584, -0.01745673269033432, -0.016502970829606056, -0.015549208968877792, -0.014595447108149529, -0.013641685247421265, -0.012687923386693, -0.011734161525964737, -0.010780399665236473, -0.00982663780450821, -0.008872875943779945, -0.007919114083051682, -0.006965352222323418, -0.006011590361595154, -0.00505782850086689, -0.004104066640138626, -0.0031503047794103622, -0.0021965429186820984, -0.0012427810579538345, -0.0002890191972255707, 0.0006647426635026932, 0.001618504524230957, 0.002572266384959221, 0.0035260282456874847, 0.004479790106415749, 0.0054335519671440125, 0.006387313827872276, 0.00734107568860054, 0.008294837549328804, 0.009248599410057068, 0.010202361270785332, 0.011156123131513596, 0.01210988499224186, 0.013063646852970123, 0.014017408713698387, 0.014971170574426651, 0.015924932435154915, 0.01687869429588318, 0.017832456156611443, 0.018786218017339706, 0.01973997987806797, 0.020693741738796234, 0.021647503599524498, 0.022601265460252762, 0.023555027320981026, 0.02450878918170929, 0.025462551042437553, 0.026416312903165817, 0.02737007476389408, 0.028323836624622345, 0.02927759848535061, 0.030231360346078873, 0.031185122206807137, 0.0321388840675354]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 5.0, 6.0, 5.0, 8.0, 8.0, 14.0, 13.0, 15.0, 25.0, 23.0, 22.0, 26.0, 23.0, 31.0, 40.0, 39.0, 30.0, 55.0, 43.0, 57.0, 40.0, 52.0, 53.0, 41.0, 36.0, 38.0, 31.0, 36.0, 33.0, 26.0, 34.0, 23.0, 12.0, 12.0, 14.0, 8.0, 8.0, 7.0, 3.0, 2.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1640625, -1.130096435546875, -1.09613037109375, -1.062164306640625, -1.0281982421875, -0.994232177734375, -0.96026611328125, -0.926300048828125, -0.892333984375, -0.858367919921875, -0.82440185546875, -0.790435791015625, -0.7564697265625, -0.722503662109375, -0.68853759765625, -0.654571533203125, -0.62060546875, -0.586639404296875, -0.55267333984375, -0.518707275390625, -0.4847412109375, -0.450775146484375, -0.41680908203125, -0.382843017578125, -0.348876953125, -0.314910888671875, -0.28094482421875, -0.246978759765625, -0.2130126953125, -0.179046630859375, -0.14508056640625, -0.111114501953125, -0.0771484375, -0.043182373046875, -0.00921630859375, 0.024749755859375, 0.0587158203125, 0.092681884765625, 0.12664794921875, 0.160614013671875, 0.194580078125, 0.228546142578125, 0.26251220703125, 0.296478271484375, 0.3304443359375, 0.364410400390625, 0.39837646484375, 0.432342529296875, 0.46630859375, 0.500274658203125, 0.53424072265625, 0.568206787109375, 0.6021728515625, 0.636138916015625, 0.67010498046875, 0.704071044921875, 0.738037109375, 0.772003173828125, 0.80596923828125, 0.839935302734375, 0.8739013671875, 0.907867431640625, 0.94183349609375, 0.975799560546875, 1.009765625]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 1.0, 2.0, 2.0, 5.0, 4.0, 12.0, 12.0, 20.0, 22.0, 51.0, 71.0, 139.0, 176.0, 259.0, 448.0, 836.0, 1613.0, 3105.0, 6410.0, 13584.0, 30650.0, 79536.0, 254819.0, 414909.0, 149640.0, 51478.0, 21291.0, 9691.0, 4535.0, 2384.0, 1229.0, 650.0, 349.0, 210.0, 150.0, 92.0, 55.0, 38.0, 27.0, 17.0, 11.0, 8.0, 11.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5703125, -1.52166748046875, -1.4730224609375, -1.42437744140625, -1.375732421875, -1.32708740234375, -1.2784423828125, -1.22979736328125, -1.18115234375, -1.13250732421875, -1.0838623046875, -1.03521728515625, -0.986572265625, -0.93792724609375, -0.8892822265625, -0.84063720703125, -0.7919921875, -0.74334716796875, -0.6947021484375, -0.64605712890625, -0.597412109375, -0.54876708984375, -0.5001220703125, -0.45147705078125, -0.40283203125, -0.35418701171875, -0.3055419921875, -0.25689697265625, -0.208251953125, -0.15960693359375, -0.1109619140625, -0.06231689453125, -0.013671875, 0.03497314453125, 0.0836181640625, 0.13226318359375, 0.180908203125, 0.22955322265625, 0.2781982421875, 0.32684326171875, 0.37548828125, 0.42413330078125, 0.4727783203125, 0.52142333984375, 0.570068359375, 0.61871337890625, 0.6673583984375, 0.71600341796875, 0.7646484375, 0.81329345703125, 0.8619384765625, 0.91058349609375, 0.959228515625, 1.00787353515625, 1.0565185546875, 1.10516357421875, 1.15380859375, 1.20245361328125, 1.2510986328125, 1.29974365234375, 1.348388671875, 1.39703369140625, 1.4456787109375, 1.49432373046875, 1.54296875]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 8.0, 7.0, 8.0, 10.0, 14.0, 22.0, 17.0, 18.0, 36.0, 32.0, 38.0, 34.0, 42.0, 50.0, 80.0, 76.0, 179.0, 361.0, 1374.0, 181.0, 88.0, 59.0, 49.0, 32.0, 41.0, 26.0, 31.0, 15.0, 15.0, 18.0, 26.0, 12.0, 10.0, 10.0, 8.0, 4.0, 7.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.150390625, -3.048828125, -2.947265625, -2.845703125, -2.744140625, -2.642578125, -2.541015625, -2.439453125, -2.337890625, -2.236328125, -2.134765625, -2.033203125, -1.931640625, -1.830078125, -1.728515625, -1.626953125, -1.525390625, -1.423828125, -1.322265625, -1.220703125, -1.119140625, -1.017578125, -0.916015625, -0.814453125, -0.712890625, -0.611328125, -0.509765625, -0.408203125, -0.306640625, -0.205078125, -0.103515625, -0.001953125, 0.099609375, 0.201171875, 0.302734375, 0.404296875, 0.505859375, 0.607421875, 0.708984375, 0.810546875, 0.912109375, 1.013671875, 1.115234375, 1.216796875, 1.318359375, 1.419921875, 1.521484375, 1.623046875, 1.724609375, 1.826171875, 1.927734375, 2.029296875, 2.130859375, 2.232421875, 2.333984375, 2.435546875, 2.537109375, 2.638671875, 2.740234375, 2.841796875, 2.943359375, 3.044921875, 3.146484375, 3.248046875, 3.349609375]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 5.0, 10.0, 7.0, 8.0, 6.0, 11.0, 19.0, 18.0, 26.0, 17.0, 37.0, 42.0, 72.0, 105.0, 133.0, 273.0, 562.0, 3013.0, 68656.0, 2891920.0, 173946.0, 5133.0, 782.0, 312.0, 170.0, 102.0, 73.0, 47.0, 43.0, 35.0, 23.0, 23.0, 12.0, 17.0, 15.0, 7.0, 6.0, 7.0, 6.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.4453125, -7.2237548828125, -7.002197265625, -6.7806396484375, -6.55908203125, -6.3375244140625, -6.115966796875, -5.8944091796875, -5.6728515625, -5.4512939453125, -5.229736328125, -5.0081787109375, -4.78662109375, -4.5650634765625, -4.343505859375, -4.1219482421875, -3.900390625, -3.6788330078125, -3.457275390625, -3.2357177734375, -3.01416015625, -2.7926025390625, -2.571044921875, -2.3494873046875, -2.1279296875, -1.9063720703125, -1.684814453125, -1.4632568359375, -1.24169921875, -1.0201416015625, -0.798583984375, -0.5770263671875, -0.35546875, -0.1339111328125, 0.087646484375, 0.3092041015625, 0.53076171875, 0.7523193359375, 0.973876953125, 1.1954345703125, 1.4169921875, 1.6385498046875, 1.860107421875, 2.0816650390625, 2.30322265625, 2.5247802734375, 2.746337890625, 2.9678955078125, 3.189453125, 3.4110107421875, 3.632568359375, 3.8541259765625, 4.07568359375, 4.2972412109375, 4.518798828125, 4.7403564453125, 4.9619140625, 5.1834716796875, 5.405029296875, 5.6265869140625, 5.84814453125, 6.0697021484375, 6.291259765625, 6.5128173828125, 6.734375]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [5.0, 42.0, 267.0, 508.0, 180.0, 16.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.573046922683716, -1.811286449432373, -1.0495260953903198, -0.2877657413482666, 0.47399473190307617, 1.235755205154419, 1.9975154399871826, 2.7592761516571045, 3.521036386489868, 4.282796859741211, 5.044557094573975, 5.806317329406738, 6.56807804107666, 7.329838752746582, 8.091598510742188, 8.85335922241211, 9.615119934082031, 10.376880645751953, 11.138640403747559, 11.90040111541748, 12.662161827087402, 13.423921585083008, 14.18568229675293, 14.947443008422852, 15.709202766418457, 16.470962524414062, 17.232723236083984, 17.994483947753906, 18.756244659423828, 19.51800537109375, 20.279766082763672, 21.041526794433594, 21.803285598754883, 22.565046310424805, 23.326807022094727, 24.088565826416016, 24.850326538085938, 25.61208724975586, 26.37384796142578, 27.135608673095703, 27.897369384765625, 28.659130096435547, 29.42089080810547, 30.18265151977539, 30.94441032409668, 31.7061710357666, 32.467933654785156, 33.22969055175781, 33.991451263427734, 34.753211975097656, 35.51497268676758, 36.2767333984375, 37.03849411010742, 37.800254821777344, 38.56201171875, 39.32377624511719, 40.08553695678711, 40.84729766845703, 41.60905838012695, 42.370819091796875, 43.1325798034668, 43.89434051513672, 44.656097412109375, 45.41786193847656, 46.17961883544922]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 7.0, 5.0, 7.0, 8.0, 3.0, 10.0, 8.0, 13.0, 11.0, 13.0, 25.0, 25.0, 33.0, 28.0, 24.0, 36.0, 31.0, 31.0, 37.0, 37.0, 44.0, 50.0, 41.0, 41.0, 37.0, 44.0, 37.0, 30.0, 26.0, 27.0, 26.0, 31.0, 18.0, 28.0, 26.0, 21.0, 17.0, 15.0, 15.0, 12.0, 6.0, 8.0, 0.0, 6.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.520465850830078, -8.25983715057373, -7.999208450317383, -7.738579750061035, -7.4779510498046875, -7.21732234954834, -6.95669412612915, -6.696065425872803, -6.435436725616455, -6.174808025360107, -5.91417932510376, -5.653550624847412, -5.392922401428223, -5.132293701171875, -4.871665000915527, -4.61103630065918, -4.350407600402832, -4.089778900146484, -3.8291501998901367, -3.568521738052368, -3.3078930377960205, -3.047264337539673, -2.7866358757019043, -2.5260071754455566, -2.265378475189209, -2.0047497749328613, -1.7441211938858032, -1.4834926128387451, -1.2228639125823975, -0.9622352123260498, -0.7016066312789917, -0.4409780502319336, -0.18034839630126953, 0.08028024435043335, 0.34090888500213623, 0.6015375256538391, 0.862166166305542, 1.1227948665618896, 1.3834234476089478, 1.6440520286560059, 1.9046807289123535, 2.165309429168701, 2.425938129425049, 2.6865665912628174, 2.947195291519165, 3.2078239917755127, 3.4684524536132812, 3.729081153869629, 3.9897098541259766, 4.250338554382324, 4.510967254638672, 4.7715959548950195, 5.032224655151367, 5.292853355407715, 5.553481578826904, 5.814110279083252, 6.0747389793396, 6.335367679595947, 6.595996379852295, 6.856625080108643, 7.117253303527832, 7.37788200378418, 7.638510704040527, 7.899139404296875, 8.159768104553223]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 2.0, 7.0, 15.0, 9.0, 13.0, 10.0, 14.0, 15.0, 20.0, 41.0, 26.0, 42.0, 36.0, 33.0, 37.0, 47.0, 43.0, 47.0, 47.0, 60.0, 46.0, 54.0, 38.0, 41.0, 39.0, 34.0, 36.0, 28.0, 31.0, 20.0, 16.0, 11.0, 8.0, 11.0, 10.0, 5.0, 6.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.380859375, -1.342071533203125, -1.30328369140625, -1.264495849609375, -1.2257080078125, -1.186920166015625, -1.14813232421875, -1.109344482421875, -1.070556640625, -1.031768798828125, -0.99298095703125, -0.954193115234375, -0.9154052734375, -0.876617431640625, -0.83782958984375, -0.799041748046875, -0.76025390625, -0.721466064453125, -0.68267822265625, -0.643890380859375, -0.6051025390625, -0.566314697265625, -0.52752685546875, -0.488739013671875, -0.449951171875, -0.411163330078125, -0.37237548828125, -0.333587646484375, -0.2947998046875, -0.256011962890625, -0.21722412109375, -0.178436279296875, -0.1396484375, -0.100860595703125, -0.06207275390625, -0.023284912109375, 0.0155029296875, 0.054290771484375, 0.09307861328125, 0.131866455078125, 0.170654296875, 0.209442138671875, 0.24822998046875, 0.287017822265625, 0.3258056640625, 0.364593505859375, 0.40338134765625, 0.442169189453125, 0.48095703125, 0.519744873046875, 0.55853271484375, 0.597320556640625, 0.6361083984375, 0.674896240234375, 0.71368408203125, 0.752471923828125, 0.791259765625, 0.830047607421875, 0.86883544921875, 0.907623291015625, 0.9464111328125, 0.985198974609375, 1.02398681640625, 1.062774658203125, 1.1015625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 7.0, 8.0, 19.0, 22.0, 37.0, 69.0, 107.0, 199.0, 351.0, 636.0, 1299.0, 2800.0, 6868.0, 19580.0, 73725.0, 423301.0, 2295339.0, 1147471.0, 166604.0, 36252.0, 11417.0, 4265.0, 1888.0, 937.0, 442.0, 243.0, 134.0, 91.0, 55.0, 48.0, 19.0, 15.0, 14.0, 7.0, 7.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.080078125, -1.99603271484375, -1.9119873046875, -1.82794189453125, -1.743896484375, -1.65985107421875, -1.5758056640625, -1.49176025390625, -1.40771484375, -1.32366943359375, -1.2396240234375, -1.15557861328125, -1.071533203125, -0.98748779296875, -0.9034423828125, -0.81939697265625, -0.7353515625, -0.65130615234375, -0.5672607421875, -0.48321533203125, -0.399169921875, -0.31512451171875, -0.2310791015625, -0.14703369140625, -0.06298828125, 0.02105712890625, 0.1051025390625, 0.18914794921875, 0.273193359375, 0.35723876953125, 0.4412841796875, 0.52532958984375, 0.609375, 0.69342041015625, 0.7774658203125, 0.86151123046875, 0.945556640625, 1.02960205078125, 1.1136474609375, 1.19769287109375, 1.28173828125, 1.36578369140625, 1.4498291015625, 1.53387451171875, 1.617919921875, 1.70196533203125, 1.7860107421875, 1.87005615234375, 1.9541015625, 2.03814697265625, 2.1221923828125, 2.20623779296875, 2.290283203125, 2.37432861328125, 2.4583740234375, 2.54241943359375, 2.62646484375, 2.71051025390625, 2.7945556640625, 2.87860107421875, 2.962646484375, 3.04669189453125, 3.1307373046875, 3.21478271484375, 3.298828125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 4.0, 5.0, 12.0, 16.0, 18.0, 9.0, 25.0, 25.0, 23.0, 51.0, 62.0, 75.0, 99.0, 131.0, 170.0, 191.0, 269.0, 327.0, 400.0, 441.0, 405.0, 298.0, 238.0, 157.0, 133.0, 97.0, 74.0, 65.0, 41.0, 53.0, 31.0, 21.0, 19.0, 23.0, 17.0, 11.0, 10.0, 8.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.8212890625, -1.7663421630859375, -1.711395263671875, -1.6564483642578125, -1.60150146484375, -1.5465545654296875, -1.491607666015625, -1.4366607666015625, -1.3817138671875, -1.3267669677734375, -1.271820068359375, -1.2168731689453125, -1.16192626953125, -1.1069793701171875, -1.052032470703125, -0.9970855712890625, -0.942138671875, -0.8871917724609375, -0.832244873046875, -0.7772979736328125, -0.72235107421875, -0.6674041748046875, -0.612457275390625, -0.5575103759765625, -0.5025634765625, -0.4476165771484375, -0.392669677734375, -0.3377227783203125, -0.28277587890625, -0.2278289794921875, -0.172882080078125, -0.1179351806640625, -0.06298828125, -0.0080413818359375, 0.046905517578125, 0.1018524169921875, 0.15679931640625, 0.2117462158203125, 0.266693115234375, 0.3216400146484375, 0.3765869140625, 0.4315338134765625, 0.486480712890625, 0.5414276123046875, 0.59637451171875, 0.6513214111328125, 0.706268310546875, 0.7612152099609375, 0.816162109375, 0.8711090087890625, 0.926055908203125, 0.9810028076171875, 1.03594970703125, 1.0908966064453125, 1.145843505859375, 1.2007904052734375, 1.2557373046875, 1.3106842041015625, 1.365631103515625, 1.4205780029296875, 1.47552490234375, 1.5304718017578125, 1.585418701171875, 1.6403656005859375, 1.6953125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 5.0, 7.0, 9.0, 13.0, 10.0, 18.0, 17.0, 32.0, 40.0, 41.0, 54.0, 84.0, 94.0, 182.0, 280.0, 609.0, 1774.0, 6068.0, 34073.0, 465988.0, 3388017.0, 265075.0, 24190.0, 4803.0, 1388.0, 574.0, 288.0, 167.0, 103.0, 68.0, 56.0, 36.0, 25.0, 27.0, 15.0, 18.0, 10.0, 5.0, 4.0, 6.0, 2.0, 0.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.29296875, -6.1046142578125, -5.916259765625, -5.7279052734375, -5.53955078125, -5.3511962890625, -5.162841796875, -4.9744873046875, -4.7861328125, -4.5977783203125, -4.409423828125, -4.2210693359375, -4.03271484375, -3.8443603515625, -3.656005859375, -3.4676513671875, -3.279296875, -3.0909423828125, -2.902587890625, -2.7142333984375, -2.52587890625, -2.3375244140625, -2.149169921875, -1.9608154296875, -1.7724609375, -1.5841064453125, -1.395751953125, -1.2073974609375, -1.01904296875, -0.8306884765625, -0.642333984375, -0.4539794921875, -0.265625, -0.0772705078125, 0.111083984375, 0.2994384765625, 0.48779296875, 0.6761474609375, 0.864501953125, 1.0528564453125, 1.2412109375, 1.4295654296875, 1.617919921875, 1.8062744140625, 1.99462890625, 2.1829833984375, 2.371337890625, 2.5596923828125, 2.748046875, 2.9364013671875, 3.124755859375, 3.3131103515625, 3.50146484375, 3.6898193359375, 3.878173828125, 4.0665283203125, 4.2548828125, 4.4432373046875, 4.631591796875, 4.8199462890625, 5.00830078125, 5.1966552734375, 5.385009765625, 5.5733642578125, 5.76171875]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 18.0, 30.0, 51.0, 75.0, 97.0, 135.0, 144.0, 128.0, 108.0, 97.0, 56.0, 28.0, 19.0, 14.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.383947372436523, -18.938648223876953, -18.49334716796875, -18.04804801940918, -17.60274887084961, -17.15744972229004, -16.71215057373047, -16.266849517822266, -15.821550369262695, -15.376251220703125, -14.930951118469238, -14.485651016235352, -14.040351867675781, -13.595052719116211, -13.149752616882324, -12.704452514648438, -12.259153366088867, -11.813854217529297, -11.36855411529541, -10.923254013061523, -10.477954864501953, -10.032655715942383, -9.587355613708496, -9.14205551147461, -8.696756362915039, -8.251457214355469, -7.806157112121582, -7.3608574867248535, -6.915557861328125, -6.4702582359313965, -6.024958610534668, -5.5796589851379395, -5.134359359741211, -4.689059734344482, -4.243760108947754, -3.7984604835510254, -3.353160858154297, -2.9078612327575684, -2.46256160736084, -2.0172619819641113, -1.5719623565673828, -1.1266627311706543, -0.6813631057739258, -0.23606348037719727, 0.20923614501953125, 0.6545357704162598, 1.0998353958129883, 1.5451350212097168, 1.9904346466064453, 2.435734272003174, 2.8810338973999023, 3.326333522796631, 3.7716331481933594, 4.216932773590088, 4.662232398986816, 5.107532024383545, 5.552831649780273, 5.998131275177002, 6.4434309005737305, 6.888730525970459, 7.3340301513671875, 7.779329776763916, 8.224629402160645, 8.669929504394531, 9.115228652954102]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 4.0, 2.0, 8.0, 7.0, 4.0, 7.0, 13.0, 18.0, 16.0, 18.0, 19.0, 21.0, 28.0, 33.0, 37.0, 32.0, 35.0, 32.0, 32.0, 35.0, 47.0, 39.0, 38.0, 42.0, 41.0, 27.0, 38.0, 37.0, 30.0, 26.0, 26.0, 32.0, 26.0, 18.0, 20.0, 18.0, 21.0, 9.0, 18.0, 6.0, 7.0, 8.0, 13.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.155001640319824, -6.949474334716797, -6.7439470291137695, -6.538419723510742, -6.332891941070557, -6.127364635467529, -5.921837329864502, -5.716310024261475, -5.510782241821289, -5.305254936218262, -5.099727630615234, -4.894200325012207, -4.6886725425720215, -4.483145236968994, -4.277617931365967, -4.0720906257629395, -3.866563320159912, -3.6610360145568848, -3.4555084705352783, -3.249981164932251, -3.0444536209106445, -2.838926315307617, -2.63339900970459, -2.4278717041015625, -2.222344160079956, -2.0168168544769287, -1.8112893104553223, -1.605762004852295, -1.400234580039978, -1.1947071552276611, -0.9891798496246338, -0.7836524248123169, -0.578125, -0.3725976049900055, -0.167070209980011, 0.03845715522766113, 0.24398458003997803, 0.4495120048522949, 0.6550393104553223, 0.8605667352676392, 1.066094160079956, 1.271621584892273, 1.4771490097045898, 1.6826763153076172, 1.888203740119934, 2.093731164932251, 2.2992584705352783, 2.5047860145568848, 2.710313320159912, 2.9158406257629395, 3.121368169784546, 3.3268954753875732, 3.5324230194091797, 3.737950325012207, 3.9434776306152344, 4.149004936218262, 4.354532241821289, 4.560059547424316, 4.765586853027344, 4.971114158630371, 5.176641941070557, 5.382169246673584, 5.587696552276611, 5.793223857879639, 5.998751640319824]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 4.0, 6.0, 12.0, 10.0, 11.0, 10.0, 18.0, 24.0, 24.0, 27.0, 25.0, 43.0, 37.0, 30.0, 45.0, 50.0, 39.0, 51.0, 48.0, 49.0, 57.0, 40.0, 50.0, 39.0, 36.0, 34.0, 35.0, 29.0, 33.0, 26.0, 17.0, 15.0, 7.0, 6.0, 3.0, 9.0, 0.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2763671875, -1.238372802734375, -1.20037841796875, -1.162384033203125, -1.1243896484375, -1.086395263671875, -1.04840087890625, -1.010406494140625, -0.972412109375, -0.934417724609375, -0.89642333984375, -0.858428955078125, -0.8204345703125, -0.782440185546875, -0.74444580078125, -0.706451416015625, -0.66845703125, -0.630462646484375, -0.59246826171875, -0.554473876953125, -0.5164794921875, -0.478485107421875, -0.44049072265625, -0.402496337890625, -0.364501953125, -0.326507568359375, -0.28851318359375, -0.250518798828125, -0.2125244140625, -0.174530029296875, -0.13653564453125, -0.098541259765625, -0.060546875, -0.022552490234375, 0.01544189453125, 0.053436279296875, 0.0914306640625, 0.129425048828125, 0.16741943359375, 0.205413818359375, 0.243408203125, 0.281402587890625, 0.31939697265625, 0.357391357421875, 0.3953857421875, 0.433380126953125, 0.47137451171875, 0.509368896484375, 0.54736328125, 0.585357666015625, 0.62335205078125, 0.661346435546875, 0.6993408203125, 0.737335205078125, 0.77532958984375, 0.813323974609375, 0.851318359375, 0.889312744140625, 0.92730712890625, 0.965301513671875, 1.0032958984375, 1.041290283203125, 1.07928466796875, 1.117279052734375, 1.1552734375]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 8.0, 15.0, 22.0, 46.0, 49.0, 79.0, 96.0, 135.0, 226.0, 331.0, 510.0, 817.0, 1317.0, 2224.0, 4057.0, 7845.0, 16134.0, 35567.0, 86595.0, 207334.0, 330428.0, 202359.0, 84155.0, 34725.0, 15891.0, 7672.0, 4059.0, 2254.0, 1331.0, 794.0, 498.0, 343.0, 218.0, 142.0, 87.0, 66.0, 44.0, 25.0, 17.0, 14.0, 7.0, 5.0, 6.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19287109375, -0.18654441833496094, -0.18021774291992188, -0.1738910675048828, -0.16756439208984375, -0.1612377166748047, -0.15491104125976562, -0.14858436584472656, -0.1422576904296875, -0.13593101501464844, -0.12960433959960938, -0.12327766418457031, -0.11695098876953125, -0.11062431335449219, -0.10429763793945312, -0.09797096252441406, -0.091644287109375, -0.08531761169433594, -0.07899093627929688, -0.07266426086425781, -0.06633758544921875, -0.06001091003417969, -0.053684234619140625, -0.04735755920410156, -0.0410308837890625, -0.03470420837402344, -0.028377532958984375, -0.022050857543945312, -0.01572418212890625, -0.009397506713867188, -0.003070831298828125, 0.0032558441162109375, 0.00958251953125, 0.015909194946289062, 0.022235870361328125, 0.028562545776367188, 0.03488922119140625, 0.04121589660644531, 0.047542572021484375, 0.05386924743652344, 0.0601959228515625, 0.06652259826660156, 0.07284927368164062, 0.07917594909667969, 0.08550262451171875, 0.09182929992675781, 0.09815597534179688, 0.10448265075683594, 0.110809326171875, 0.11713600158691406, 0.12346267700195312, 0.1297893524169922, 0.13611602783203125, 0.1424427032470703, 0.14876937866210938, 0.15509605407714844, 0.1614227294921875, 0.16774940490722656, 0.17407608032226562, 0.1804027557373047, 0.18672943115234375, 0.1930561065673828, 0.19938278198242188, 0.20570945739746094, 0.2120361328125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 3.0, 7.0, 3.0, 5.0, 3.0, 8.0, 9.0, 4.0, 9.0, 15.0, 22.0, 12.0, 27.0, 14.0, 21.0, 23.0, 18.0, 29.0, 26.0, 29.0, 38.0, 41.0, 38.0, 36.0, 45.0, 1054.0, 35.0, 28.0, 31.0, 30.0, 40.0, 25.0, 37.0, 30.0, 23.0, 20.0, 16.0, 25.0, 22.0, 29.0, 14.0, 16.0, 8.0, 16.0, 11.0, 7.0, 5.0, 7.0, 6.0, 4.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.63720703125, -0.6180877685546875, -0.598968505859375, -0.5798492431640625, -0.56072998046875, -0.5416107177734375, -0.522491455078125, -0.5033721923828125, -0.4842529296875, -0.4651336669921875, -0.446014404296875, -0.4268951416015625, -0.40777587890625, -0.3886566162109375, -0.369537353515625, -0.3504180908203125, -0.331298828125, -0.3121795654296875, -0.293060302734375, -0.2739410400390625, -0.25482177734375, -0.2357025146484375, -0.216583251953125, -0.1974639892578125, -0.1783447265625, -0.1592254638671875, -0.140106201171875, -0.1209869384765625, -0.10186767578125, -0.0827484130859375, -0.063629150390625, -0.0445098876953125, -0.025390625, -0.0062713623046875, 0.012847900390625, 0.0319671630859375, 0.05108642578125, 0.0702056884765625, 0.089324951171875, 0.1084442138671875, 0.1275634765625, 0.1466827392578125, 0.165802001953125, 0.1849212646484375, 0.20404052734375, 0.2231597900390625, 0.242279052734375, 0.2613983154296875, 0.280517578125, 0.2996368408203125, 0.318756103515625, 0.3378753662109375, 0.35699462890625, 0.3761138916015625, 0.395233154296875, 0.4143524169921875, 0.4334716796875, 0.4525909423828125, 0.471710205078125, 0.4908294677734375, 0.50994873046875, 0.5290679931640625, 0.548187255859375, 0.5673065185546875, 0.58642578125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 7.0, 14.0, 20.0, 39.0, 56.0, 77.0, 126.0, 267.0, 416.0, 724.0, 1360.0, 2739.0, 5898.0, 13706.0, 35245.0, 100914.0, 336756.0, 1285361.0, 203071.0, 66919.0, 24559.0, 9847.0, 4371.0, 2177.0, 1050.0, 573.0, 328.0, 208.0, 106.0, 60.0, 50.0, 31.0, 13.0, 13.0, 6.0, 11.0, 1.0, 1.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1634521484375, -0.1589508056640625, -0.154449462890625, -0.1499481201171875, -0.14544677734375, -0.1409454345703125, -0.136444091796875, -0.1319427490234375, -0.12744140625, -0.1229400634765625, -0.118438720703125, -0.1139373779296875, -0.10943603515625, -0.1049346923828125, -0.100433349609375, -0.0959320068359375, -0.0914306640625, -0.0869293212890625, -0.082427978515625, -0.0779266357421875, -0.07342529296875, -0.0689239501953125, -0.064422607421875, -0.0599212646484375, -0.055419921875, -0.0509185791015625, -0.046417236328125, -0.0419158935546875, -0.03741455078125, -0.0329132080078125, -0.028411865234375, -0.0239105224609375, -0.0194091796875, -0.0149078369140625, -0.010406494140625, -0.0059051513671875, -0.00140380859375, 0.0030975341796875, 0.007598876953125, 0.0121002197265625, 0.0166015625, 0.0211029052734375, 0.025604248046875, 0.0301055908203125, 0.03460693359375, 0.0391082763671875, 0.043609619140625, 0.0481109619140625, 0.0526123046875, 0.0571136474609375, 0.061614990234375, 0.0661163330078125, 0.07061767578125, 0.0751190185546875, 0.079620361328125, 0.0841217041015625, 0.088623046875, 0.0931243896484375, 0.097625732421875, 0.1021270751953125, 0.10662841796875, 0.1111297607421875, 0.115631103515625, 0.1201324462890625, 0.1246337890625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 5.0, 5.0, 4.0, 10.0, 9.0, 16.0, 32.0, 38.0, 62.0, 79.0, 86.0, 104.0, 102.0, 105.0, 96.0, 49.0, 48.0, 24.0, 20.0, 13.0, 10.0, 6.0, 6.0, 4.0, 6.0, 5.0, 6.0, 0.0, 4.0, 3.0, 5.0, 3.0, 2.0, 4.0, 3.0, 4.0, 0.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0159149169921875, -0.015365839004516602, -0.014816761016845703, -0.014267683029174805, -0.013718605041503906, -0.013169527053833008, -0.01262044906616211, -0.012071371078491211, -0.011522293090820312, -0.010973215103149414, -0.010424137115478516, -0.009875059127807617, -0.009325981140136719, -0.00877690315246582, -0.008227825164794922, -0.0076787471771240234, -0.007129669189453125, -0.0065805912017822266, -0.006031513214111328, -0.00548243522644043, -0.004933357238769531, -0.004384279251098633, -0.0038352012634277344, -0.003286123275756836, -0.0027370452880859375, -0.002187967300415039, -0.0016388893127441406, -0.0010898113250732422, -0.0005407333374023438, 8.344650268554688e-06, 0.0005574226379394531, 0.0011065006256103516, 0.00165557861328125, 0.0022046566009521484, 0.002753734588623047, 0.0033028125762939453, 0.0038518905639648438, 0.004400968551635742, 0.004950046539306641, 0.005499124526977539, 0.0060482025146484375, 0.006597280502319336, 0.007146358489990234, 0.007695436477661133, 0.008244514465332031, 0.00879359245300293, 0.009342670440673828, 0.009891748428344727, 0.010440826416015625, 0.010989904403686523, 0.011538982391357422, 0.01208806037902832, 0.012637138366699219, 0.013186216354370117, 0.013735294342041016, 0.014284372329711914, 0.014833450317382812, 0.015382528305053711, 0.01593160629272461, 0.016480684280395508, 0.017029762268066406, 0.017578840255737305, 0.018127918243408203, 0.0186769962310791, 0.01922607421875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 6.0, 9.0, 7.0, 5.0, 7.0, 19.0, 18.0, 22.0, 30.0, 35.0, 36.0, 47.0, 95.0, 163.0, 472.0, 4625.0, 782011.0, 256594.0, 3498.0, 383.0, 151.0, 87.0, 51.0, 35.0, 26.0, 30.0, 20.0, 19.0, 15.0, 5.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.385986328125, -0.3746147155761719, -0.36324310302734375, -0.3518714904785156, -0.3404998779296875, -0.3291282653808594, -0.31775665283203125, -0.3063850402832031, -0.295013427734375, -0.2836418151855469, -0.27227020263671875, -0.2608985900878906, -0.2495269775390625, -0.23815536499023438, -0.22678375244140625, -0.21541213989257812, -0.20404052734375, -0.19266891479492188, -0.18129730224609375, -0.16992568969726562, -0.1585540771484375, -0.14718246459960938, -0.13581085205078125, -0.12443923950195312, -0.113067626953125, -0.10169601440429688, -0.09032440185546875, -0.07895278930664062, -0.0675811767578125, -0.056209564208984375, -0.04483795166015625, -0.033466339111328125, -0.0220947265625, -0.010723114013671875, 0.00064849853515625, 0.012020111083984375, 0.0233917236328125, 0.034763336181640625, 0.04613494873046875, 0.057506561279296875, 0.068878173828125, 0.08024978637695312, 0.09162139892578125, 0.10299301147460938, 0.1143646240234375, 0.12573623657226562, 0.13710784912109375, 0.14847946166992188, 0.15985107421875, 0.17122268676757812, 0.18259429931640625, 0.19396591186523438, 0.2053375244140625, 0.21670913696289062, 0.22808074951171875, 0.23945236206054688, 0.250823974609375, 0.2621955871582031, 0.27356719970703125, 0.2849388122558594, 0.2963104248046875, 0.3076820373535156, 0.31905364990234375, 0.3304252624511719, 0.341796875]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 10.0, 28.0, 67.0, 144.0, 244.0, 237.0, 145.0, 65.0, 38.0, 15.0, 7.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04146581515669823, -0.03948677331209183, -0.03750772774219513, -0.03552868589758873, -0.03354964032769203, -0.03157059848308563, -0.029591554775834084, -0.027612511068582535, -0.025633467361330986, -0.023654423654079437, -0.02167537994682789, -0.01969633623957634, -0.01771729439496994, -0.015738248825073242, -0.013759206980466843, -0.011780163273215294, -0.009801119565963745, -0.007822075858712196, -0.005843032617121935, -0.0038639893755316734, -0.0018849456682801247, 9.40980389714241e-05, 0.0020731408149003983, 0.004052184522151947, 0.006031228229403496, 0.008010271936655045, 0.009989315643906593, 0.011968358419835567, 0.013947402127087116, 0.01592644676566124, 0.01790548861026764, 0.019884532317519188, 0.021863572299480438, 0.023842616006731987, 0.025821659713983536, 0.027800701558589935, 0.029779747128486633, 0.03175878897309303, 0.03373783081769943, 0.03571687638759613, 0.03769592195749283, 0.03967496380209923, 0.041654009371995926, 0.043633051216602325, 0.04561209678649902, 0.04759113863110542, 0.04957018047571182, 0.05154922604560852, 0.05352826789021492, 0.05550730973482132, 0.05748635530471802, 0.05946539714932442, 0.061444442719221115, 0.06342348456382751, 0.06540253013372421, 0.06738157570362091, 0.06936061382293701, 0.07133965939283371, 0.07331869751214981, 0.07529774308204651, 0.0772767886519432, 0.0792558342218399, 0.081234872341156, 0.0832139179110527, 0.0851929634809494]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 3.0, 8.0, 7.0, 11.0, 8.0, 7.0, 13.0, 21.0, 14.0, 25.0, 24.0, 22.0, 26.0, 31.0, 32.0, 33.0, 33.0, 48.0, 45.0, 33.0, 44.0, 35.0, 33.0, 42.0, 35.0, 44.0, 43.0, 35.0, 32.0, 17.0, 25.0, 22.0, 24.0, 23.0, 16.0, 15.0, 11.0, 10.0, 17.0, 7.0, 6.0, 6.0, 6.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.019136369228363037, -0.018570439890027046, -0.018004510551691055, -0.017438581213355064, -0.016872651875019073, -0.016306722536683083, -0.01574079319834709, -0.0151748638600111, -0.01460893452167511, -0.014043005183339119, -0.013477075845003128, -0.012911146506667137, -0.012345217168331146, -0.011779287829995155, -0.011213358491659164, -0.010647429153323174, -0.010081499814987183, -0.009515570476651192, -0.0089496411383152, -0.00838371179997921, -0.007817782461643219, -0.007251853123307228, -0.006685923784971237, -0.006119994446635246, -0.005554065108299255, -0.0049881357699632645, -0.0044222064316272736, -0.0038562770932912827, -0.0032903477549552917, -0.002724418416619301, -0.00215848907828331, -0.001592559739947319, -0.0010266304016113281, -0.0004607010632753372, 0.00010522827506065369, 0.0006711576133966446, 0.0012370869517326355, 0.0018030162900686264, 0.0023689456284046173, 0.002934874966740608, 0.003500804305076599, 0.00406673364341259, 0.004632662981748581, 0.005198592320084572, 0.005764521658420563, 0.006330450996756554, 0.0068963803350925446, 0.0074623096734285355, 0.008028239011764526, 0.008594168350100517, 0.009160097688436508, 0.009726027026772499, 0.01029195636510849, 0.010857885703444481, 0.011423815041780472, 0.011989744380116463, 0.012555673718452454, 0.013121603056788445, 0.013687532395124435, 0.014253461733460426, 0.014819391071796417, 0.015385320410132408, 0.0159512497484684, 0.01651717908680439, 0.01708310842514038]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 4.0, 6.0, 12.0, 10.0, 11.0, 11.0, 16.0, 27.0, 21.0, 28.0, 27.0, 41.0, 37.0, 30.0, 43.0, 52.0, 40.0, 49.0, 50.0, 48.0, 57.0, 45.0, 46.0, 37.0, 37.0, 35.0, 35.0, 29.0, 32.0, 27.0, 16.0, 15.0, 7.0, 6.0, 3.0, 9.0, 0.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2763671875, -1.238372802734375, -1.20037841796875, -1.162384033203125, -1.1243896484375, -1.086395263671875, -1.04840087890625, -1.010406494140625, -0.972412109375, -0.934417724609375, -0.89642333984375, -0.858428955078125, -0.8204345703125, -0.782440185546875, -0.74444580078125, -0.706451416015625, -0.66845703125, -0.630462646484375, -0.59246826171875, -0.554473876953125, -0.5164794921875, -0.478485107421875, -0.44049072265625, -0.402496337890625, -0.364501953125, -0.326507568359375, -0.28851318359375, -0.250518798828125, -0.2125244140625, -0.174530029296875, -0.13653564453125, -0.098541259765625, -0.060546875, -0.022552490234375, 0.01544189453125, 0.053436279296875, 0.0914306640625, 0.129425048828125, 0.16741943359375, 0.205413818359375, 0.243408203125, 0.281402587890625, 0.31939697265625, 0.357391357421875, 0.3953857421875, 0.433380126953125, 0.47137451171875, 0.509368896484375, 0.54736328125, 0.585357666015625, 0.62335205078125, 0.661346435546875, 0.6993408203125, 0.737335205078125, 0.77532958984375, 0.813323974609375, 0.851318359375, 0.889312744140625, 0.92730712890625, 0.965301513671875, 1.0032958984375, 1.041290283203125, 1.07928466796875, 1.117279052734375, 1.1552734375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 6.0, 8.0, 12.0, 17.0, 43.0, 59.0, 91.0, 141.0, 199.0, 286.0, 484.0, 752.0, 1161.0, 1969.0, 3153.0, 5237.0, 8745.0, 14878.0, 24842.0, 43912.0, 82052.0, 156029.0, 240775.0, 206371.0, 115001.0, 60732.0, 33326.0, 19092.0, 11322.0, 6828.0, 4178.0, 2596.0, 1532.0, 997.0, 665.0, 415.0, 233.0, 142.0, 90.0, 58.0, 43.0, 31.0, 23.0, 14.0, 10.0, 5.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.1142578125, -1.0812530517578125, -1.048248291015625, -1.0152435302734375, -0.98223876953125, -0.9492340087890625, -0.916229248046875, -0.8832244873046875, -0.8502197265625, -0.8172149658203125, -0.784210205078125, -0.7512054443359375, -0.71820068359375, -0.6851959228515625, -0.652191162109375, -0.6191864013671875, -0.586181640625, -0.5531768798828125, -0.520172119140625, -0.4871673583984375, -0.45416259765625, -0.4211578369140625, -0.388153076171875, -0.3551483154296875, -0.3221435546875, -0.2891387939453125, -0.256134033203125, -0.2231292724609375, -0.19012451171875, -0.1571197509765625, -0.124114990234375, -0.0911102294921875, -0.05810546875, -0.0251007080078125, 0.007904052734375, 0.0409088134765625, 0.07391357421875, 0.1069183349609375, 0.139923095703125, 0.1729278564453125, 0.2059326171875, 0.2389373779296875, 0.271942138671875, 0.3049468994140625, 0.33795166015625, 0.3709564208984375, 0.403961181640625, 0.4369659423828125, 0.469970703125, 0.5029754638671875, 0.535980224609375, 0.5689849853515625, 0.60198974609375, 0.6349945068359375, 0.667999267578125, 0.7010040283203125, 0.7340087890625, 0.7670135498046875, 0.800018310546875, 0.8330230712890625, 0.86602783203125, 0.8990325927734375, 0.932037353515625, 0.9650421142578125, 0.998046875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 7.0, 1.0, 1.0, 6.0, 16.0, 11.0, 8.0, 12.0, 15.0, 17.0, 21.0, 16.0, 32.0, 31.0, 29.0, 28.0, 33.0, 45.0, 60.0, 90.0, 133.0, 240.0, 1345.0, 257.0, 130.0, 83.0, 65.0, 58.0, 38.0, 22.0, 32.0, 23.0, 28.0, 30.0, 11.0, 16.0, 11.0, 8.0, 6.0, 9.0, 7.0, 12.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.31640625, -3.22021484375, -3.1240234375, -3.02783203125, -2.931640625, -2.83544921875, -2.7392578125, -2.64306640625, -2.546875, -2.45068359375, -2.3544921875, -2.25830078125, -2.162109375, -2.06591796875, -1.9697265625, -1.87353515625, -1.77734375, -1.68115234375, -1.5849609375, -1.48876953125, -1.392578125, -1.29638671875, -1.2001953125, -1.10400390625, -1.0078125, -0.91162109375, -0.8154296875, -0.71923828125, -0.623046875, -0.52685546875, -0.4306640625, -0.33447265625, -0.23828125, -0.14208984375, -0.0458984375, 0.05029296875, 0.146484375, 0.24267578125, 0.3388671875, 0.43505859375, 0.53125, 0.62744140625, 0.7236328125, 0.81982421875, 0.916015625, 1.01220703125, 1.1083984375, 1.20458984375, 1.30078125, 1.39697265625, 1.4931640625, 1.58935546875, 1.685546875, 1.78173828125, 1.8779296875, 1.97412109375, 2.0703125, 2.16650390625, 2.2626953125, 2.35888671875, 2.455078125, 2.55126953125, 2.6474609375, 2.74365234375, 2.83984375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 2.0, 2.0, 15.0, 7.0, 9.0, 12.0, 12.0, 16.0, 27.0, 31.0, 50.0, 44.0, 70.0, 106.0, 157.0, 279.0, 559.0, 1730.0, 8328.0, 62598.0, 1304742.0, 1676719.0, 77039.0, 9699.0, 1925.0, 630.0, 274.0, 171.0, 103.0, 71.0, 64.0, 48.0, 40.0, 37.0, 15.0, 17.0, 12.0, 13.0, 10.0, 6.0, 1.0, 5.0, 3.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.14453125, -4.0018310546875, -3.859130859375, -3.7164306640625, -3.57373046875, -3.4310302734375, -3.288330078125, -3.1456298828125, -3.0029296875, -2.8602294921875, -2.717529296875, -2.5748291015625, -2.43212890625, -2.2894287109375, -2.146728515625, -2.0040283203125, -1.861328125, -1.7186279296875, -1.575927734375, -1.4332275390625, -1.29052734375, -1.1478271484375, -1.005126953125, -0.8624267578125, -0.7197265625, -0.5770263671875, -0.434326171875, -0.2916259765625, -0.14892578125, -0.0062255859375, 0.136474609375, 0.2791748046875, 0.421875, 0.5645751953125, 0.707275390625, 0.8499755859375, 0.99267578125, 1.1353759765625, 1.278076171875, 1.4207763671875, 1.5634765625, 1.7061767578125, 1.848876953125, 1.9915771484375, 2.13427734375, 2.2769775390625, 2.419677734375, 2.5623779296875, 2.705078125, 2.8477783203125, 2.990478515625, 3.1331787109375, 3.27587890625, 3.4185791015625, 3.561279296875, 3.7039794921875, 3.8466796875, 3.9893798828125, 4.132080078125, 4.2747802734375, 4.41748046875, 4.5601806640625, 4.702880859375, 4.8455810546875, 4.98828125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 17.0, 100.0, 319.0, 397.0, 142.0, 39.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.270973205566406, -9.485382080078125, -8.699790954589844, -7.914199352264404, -7.128607749938965, -6.343016624450684, -5.557425498962402, -4.771833896636963, -3.9862427711486816, -3.2006514072418213, -2.415060043334961, -1.6294689178466797, -0.8438775539398193, -0.058286190032958984, 0.7273049354553223, 1.5128965377807617, 2.298487663269043, 3.0840790271759033, 3.8696703910827637, 4.655261516571045, 5.440853118896484, 6.226444244384766, 7.012035369873047, 7.797626972198486, 8.58321762084961, 9.36880874633789, 10.154399871826172, 10.939990997314453, 11.72558307647705, 12.511174201965332, 13.296765327453613, 14.082357406616211, 14.867948532104492, 15.653539657592773, 16.439130783081055, 17.224721908569336, 18.010313034057617, 18.79590606689453, 19.581497192382812, 20.367088317871094, 21.152679443359375, 21.938270568847656, 22.723861694335938, 23.50945281982422, 24.2950439453125, 25.08063507080078, 25.866226196289062, 26.651819229125977, 27.437408447265625, 28.222999572753906, 29.008590698242188, 29.79418182373047, 30.57977294921875, 31.36536407470703, 32.15095520019531, 32.936546325683594, 33.72214126586914, 34.50773239135742, 35.2933235168457, 36.078914642333984, 36.864505767822266, 37.65009689331055, 38.43568801879883, 39.22127914428711, 40.00687026977539]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 1.0, 4.0, 4.0, 5.0, 12.0, 9.0, 10.0, 14.0, 13.0, 13.0, 14.0, 23.0, 20.0, 31.0, 27.0, 34.0, 29.0, 36.0, 34.0, 45.0, 45.0, 48.0, 48.0, 39.0, 44.0, 48.0, 30.0, 38.0, 39.0, 36.0, 30.0, 29.0, 27.0, 21.0, 21.0, 13.0, 12.0, 13.0, 8.0, 5.0, 8.0, 11.0, 5.0, 6.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-9.300514221191406, -9.03976058959961, -8.779006958007812, -8.518253326416016, -8.257498741149902, -7.9967451095581055, -7.735991477966309, -7.475237846374512, -7.214484214782715, -6.953730583190918, -6.692976474761963, -6.432222843170166, -6.171469211578369, -5.910715103149414, -5.649961471557617, -5.38920783996582, -5.128453731536865, -4.867700099945068, -4.606945991516113, -4.346192359924316, -4.0854387283325195, -3.8246848583221436, -3.5639309883117676, -3.3031773567199707, -3.0424234867095947, -2.7816696166992188, -2.520915985107422, -2.260162115097046, -1.9994083642959595, -1.738654613494873, -1.477900743484497, -1.2171469926834106, -0.9563937187194824, -0.695639967918396, -0.4348861575126648, -0.1741323471069336, 0.08662140369415283, 0.34737515449523926, 0.6081290245056152, 0.8688827753067017, 1.129636526107788, 1.3903902769088745, 1.651144027709961, 1.911897897720337, 2.172651767730713, 2.4334053993225098, 2.6941592693328857, 2.9549131393432617, 3.2156667709350586, 3.4764206409454346, 3.7371742725372314, 3.9979281425476074, 4.258681774139404, 4.519435882568359, 4.780189514160156, 5.040943145751953, 5.30169677734375, 5.562450408935547, 5.823204517364502, 6.083958148956299, 6.344711780548096, 6.605465888977051, 6.866219520568848, 7.1269731521606445, 7.3877272605896]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 9.0, 7.0, 5.0, 10.0, 13.0, 17.0, 19.0, 22.0, 22.0, 30.0, 22.0, 51.0, 36.0, 38.0, 40.0, 44.0, 50.0, 39.0, 49.0, 58.0, 55.0, 44.0, 35.0, 34.0, 34.0, 42.0, 34.0, 30.0, 22.0, 17.0, 14.0, 18.0, 11.0, 11.0, 5.0, 2.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.236328125, -1.1980438232421875, -1.159759521484375, -1.1214752197265625, -1.08319091796875, -1.0449066162109375, -1.006622314453125, -0.9683380126953125, -0.9300537109375, -0.8917694091796875, -0.853485107421875, -0.8152008056640625, -0.77691650390625, -0.7386322021484375, -0.700347900390625, -0.6620635986328125, -0.623779296875, -0.5854949951171875, -0.547210693359375, -0.5089263916015625, -0.47064208984375, -0.4323577880859375, -0.394073486328125, -0.3557891845703125, -0.3175048828125, -0.2792205810546875, -0.240936279296875, -0.2026519775390625, -0.16436767578125, -0.1260833740234375, -0.087799072265625, -0.0495147705078125, -0.01123046875, 0.0270538330078125, 0.065338134765625, 0.1036224365234375, 0.14190673828125, 0.1801910400390625, 0.218475341796875, 0.2567596435546875, 0.2950439453125, 0.3333282470703125, 0.371612548828125, 0.4098968505859375, 0.44818115234375, 0.4864654541015625, 0.524749755859375, 0.5630340576171875, 0.601318359375, 0.6396026611328125, 0.677886962890625, 0.7161712646484375, 0.75445556640625, 0.7927398681640625, 0.831024169921875, 0.8693084716796875, 0.9075927734375, 0.9458770751953125, 0.984161376953125, 1.0224456787109375, 1.06072998046875, 1.0990142822265625, 1.137298583984375, 1.1755828857421875, 1.2138671875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 7.0, 10.0, 6.0, 22.0, 23.0, 41.0, 60.0, 67.0, 98.0, 126.0, 229.0, 295.0, 430.0, 645.0, 986.0, 1496.0, 2562.0, 4576.0, 8860.0, 19577.0, 48174.0, 155011.0, 743283.0, 2259692.0, 712210.0, 149126.0, 47443.0, 18856.0, 8858.0, 4492.0, 2557.0, 1486.0, 937.0, 636.0, 416.0, 307.0, 201.0, 126.0, 118.0, 70.0, 51.0, 29.0, 24.0, 24.0, 16.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-2.0390625, -1.97430419921875, -1.9095458984375, -1.84478759765625, -1.780029296875, -1.71527099609375, -1.6505126953125, -1.58575439453125, -1.52099609375, -1.45623779296875, -1.3914794921875, -1.32672119140625, -1.261962890625, -1.19720458984375, -1.1324462890625, -1.06768798828125, -1.0029296875, -0.93817138671875, -0.8734130859375, -0.80865478515625, -0.743896484375, -0.67913818359375, -0.6143798828125, -0.54962158203125, -0.48486328125, -0.42010498046875, -0.3553466796875, -0.29058837890625, -0.225830078125, -0.16107177734375, -0.0963134765625, -0.03155517578125, 0.033203125, 0.09796142578125, 0.1627197265625, 0.22747802734375, 0.292236328125, 0.35699462890625, 0.4217529296875, 0.48651123046875, 0.55126953125, 0.61602783203125, 0.6807861328125, 0.74554443359375, 0.810302734375, 0.87506103515625, 0.9398193359375, 1.00457763671875, 1.0693359375, 1.13409423828125, 1.1988525390625, 1.26361083984375, 1.328369140625, 1.39312744140625, 1.4578857421875, 1.52264404296875, 1.58740234375, 1.65216064453125, 1.7169189453125, 1.78167724609375, 1.846435546875, 1.91119384765625, 1.9759521484375, 2.04071044921875, 2.10546875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 1.0, 6.0, 4.0, 10.0, 16.0, 16.0, 25.0, 35.0, 30.0, 38.0, 63.0, 84.0, 103.0, 154.0, 208.0, 292.0, 443.0, 470.0, 512.0, 409.0, 295.0, 218.0, 155.0, 127.0, 85.0, 63.0, 37.0, 36.0, 31.0, 26.0, 17.0, 16.0, 11.0, 7.0, 11.0, 5.0, 5.0, 2.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5751953125, -1.5168609619140625, -1.458526611328125, -1.4001922607421875, -1.34185791015625, -1.2835235595703125, -1.225189208984375, -1.1668548583984375, -1.1085205078125, -1.0501861572265625, -0.991851806640625, -0.9335174560546875, -0.87518310546875, -0.8168487548828125, -0.758514404296875, -0.7001800537109375, -0.641845703125, -0.5835113525390625, -0.525177001953125, -0.4668426513671875, -0.40850830078125, -0.3501739501953125, -0.291839599609375, -0.2335052490234375, -0.1751708984375, -0.1168365478515625, -0.058502197265625, -0.0001678466796875, 0.05816650390625, 0.1165008544921875, 0.174835205078125, 0.2331695556640625, 0.29150390625, 0.3498382568359375, 0.408172607421875, 0.4665069580078125, 0.52484130859375, 0.5831756591796875, 0.641510009765625, 0.6998443603515625, 0.7581787109375, 0.8165130615234375, 0.874847412109375, 0.9331817626953125, 0.99151611328125, 1.0498504638671875, 1.108184814453125, 1.1665191650390625, 1.224853515625, 1.2831878662109375, 1.341522216796875, 1.3998565673828125, 1.45819091796875, 1.5165252685546875, 1.574859619140625, 1.6331939697265625, 1.6915283203125, 1.7498626708984375, 1.808197021484375, 1.8665313720703125, 1.92486572265625, 1.9832000732421875, 2.041534423828125, 2.0998687744140625, 2.158203125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 0.0, 1.0, 4.0, 7.0, 6.0, 8.0, 13.0, 14.0, 24.0, 32.0, 33.0, 40.0, 75.0, 128.0, 206.0, 495.0, 1273.0, 4290.0, 22936.0, 241816.0, 3451003.0, 430514.0, 32913.0, 5722.0, 1540.0, 542.0, 257.0, 128.0, 87.0, 46.0, 42.0, 25.0, 29.0, 14.0, 10.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.55859375, -7.36273193359375, -7.1668701171875, -6.97100830078125, -6.775146484375, -6.57928466796875, -6.3834228515625, -6.18756103515625, -5.99169921875, -5.79583740234375, -5.5999755859375, -5.40411376953125, -5.208251953125, -5.01239013671875, -4.8165283203125, -4.62066650390625, -4.4248046875, -4.22894287109375, -4.0330810546875, -3.83721923828125, -3.641357421875, -3.44549560546875, -3.2496337890625, -3.05377197265625, -2.85791015625, -2.66204833984375, -2.4661865234375, -2.27032470703125, -2.074462890625, -1.87860107421875, -1.6827392578125, -1.48687744140625, -1.291015625, -1.09515380859375, -0.8992919921875, -0.70343017578125, -0.507568359375, -0.31170654296875, -0.1158447265625, 0.08001708984375, 0.27587890625, 0.47174072265625, 0.6676025390625, 0.86346435546875, 1.059326171875, 1.25518798828125, 1.4510498046875, 1.64691162109375, 1.8427734375, 2.03863525390625, 2.2344970703125, 2.43035888671875, 2.626220703125, 2.82208251953125, 3.0179443359375, 3.21380615234375, 3.40966796875, 3.60552978515625, 3.8013916015625, 3.99725341796875, 4.193115234375, 4.38897705078125, 4.5848388671875, 4.78070068359375, 4.9765625]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 8.0, 80.0, 336.0, 426.0, 146.0, 21.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.90938377380371, -26.5213680267334, -25.13335418701172, -23.745338439941406, -22.357324600219727, -20.969308853149414, -19.581295013427734, -18.193279266357422, -16.80526351928711, -15.417248725891113, -14.029233932495117, -12.641218185424805, -11.253204345703125, -9.865188598632812, -8.477173805236816, -7.08915901184082, -5.701145172119141, -4.3131303787231445, -2.9251153469085693, -1.5371003150939941, -0.14908552169799805, 1.238929271697998, 2.6269445419311523, 4.014959335327148, 5.4029741287231445, 6.790988922119141, 8.179003715515137, 9.567018508911133, 10.955034255981445, 12.343048095703125, 13.731063842773438, 15.119078636169434, 16.507095336914062, 17.895111083984375, 19.283124923706055, 20.671140670776367, 22.059154510498047, 23.44717025756836, 24.835186004638672, 26.22319984436035, 27.61121368408203, 28.999229431152344, 30.387243270874023, 31.775259017944336, 33.163272857666016, 34.55128860473633, 35.93930435180664, 37.32731628417969, 38.71533203125, 40.10334777832031, 41.491363525390625, 42.87937545776367, 44.267391204833984, 45.6554069519043, 47.04342269897461, 48.431434631347656, 49.819454193115234, 51.20746994018555, 52.59548568725586, 53.983497619628906, 55.37151336669922, 56.75952911376953, 58.147544860839844, 59.535560607910156, 60.9235725402832]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 6.0, 2.0, 4.0, 4.0, 11.0, 14.0, 12.0, 21.0, 16.0, 29.0, 29.0, 29.0, 38.0, 37.0, 29.0, 44.0, 38.0, 37.0, 50.0, 44.0, 50.0, 43.0, 47.0, 35.0, 34.0, 29.0, 26.0, 43.0, 32.0, 25.0, 21.0, 17.0, 21.0, 26.0, 12.0, 10.0, 9.0, 7.0, 7.0, 7.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.264359951019287, -7.041323184967041, -6.818285942077637, -6.595249176025391, -6.372211933135986, -6.14917516708374, -5.926137924194336, -5.70310115814209, -5.480064392089844, -5.257027626037598, -5.033990383148193, -4.810953617095947, -4.587916374206543, -4.364879608154297, -4.141842842102051, -3.9188055992126465, -3.6957685947418213, -3.472731590270996, -3.249694585800171, -3.0266575813293457, -2.8036208152770996, -2.5805838108062744, -2.357546806335449, -2.134510040283203, -1.9114729166030884, -1.6884359121322632, -1.4653990268707275, -1.2423620223999023, -1.0193250179290771, -0.7962881326675415, -0.5732511281967163, -0.35021424293518066, -0.12717723846435547, 0.09585972130298615, 0.31889668107032776, 0.5419336557388306, 0.764970600605011, 0.9880075454711914, 1.2110445499420166, 1.4340814352035522, 1.6571184396743774, 1.8801554441452026, 2.1031923294067383, 2.3262293338775635, 2.5492663383483887, 2.7723031044006348, 2.995340347290039, 3.218377113342285, 3.4414141178131104, 3.6644511222839355, 3.8874881267547607, 4.110525131225586, 4.333561897277832, 4.556598663330078, 4.779635906219482, 5.0026726722717285, 5.225709915161133, 5.448746681213379, 5.671783924102783, 5.894820690155029, 6.117857933044434, 6.34089469909668, 6.563931465148926, 6.78696870803833, 7.010005474090576]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 9.0, 3.0, 9.0, 10.0, 9.0, 16.0, 8.0, 12.0, 21.0, 21.0, 19.0, 25.0, 31.0, 30.0, 33.0, 36.0, 32.0, 31.0, 26.0, 39.0, 27.0, 46.0, 43.0, 47.0, 37.0, 34.0, 31.0, 33.0, 39.0, 25.0, 39.0, 29.0, 22.0, 19.0, 17.0, 18.0, 21.0, 8.0, 8.0, 13.0, 7.0, 9.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.0498046875, -1.01873779296875, -0.9876708984375, -0.95660400390625, -0.925537109375, -0.89447021484375, -0.8634033203125, -0.83233642578125, -0.80126953125, -0.77020263671875, -0.7391357421875, -0.70806884765625, -0.677001953125, -0.64593505859375, -0.6148681640625, -0.58380126953125, -0.552734375, -0.52166748046875, -0.4906005859375, -0.45953369140625, -0.428466796875, -0.39739990234375, -0.3663330078125, -0.33526611328125, -0.30419921875, -0.27313232421875, -0.2420654296875, -0.21099853515625, -0.179931640625, -0.14886474609375, -0.1177978515625, -0.08673095703125, -0.0556640625, -0.02459716796875, 0.0064697265625, 0.03753662109375, 0.068603515625, 0.09967041015625, 0.1307373046875, 0.16180419921875, 0.19287109375, 0.22393798828125, 0.2550048828125, 0.28607177734375, 0.317138671875, 0.34820556640625, 0.3792724609375, 0.41033935546875, 0.44140625, 0.47247314453125, 0.5035400390625, 0.53460693359375, 0.565673828125, 0.59674072265625, 0.6278076171875, 0.65887451171875, 0.68994140625, 0.72100830078125, 0.7520751953125, 0.78314208984375, 0.814208984375, 0.84527587890625, 0.8763427734375, 0.90740966796875, 0.9384765625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 7.0, 5.0, 11.0, 8.0, 13.0, 25.0, 28.0, 54.0, 51.0, 111.0, 178.0, 255.0, 435.0, 767.0, 1385.0, 2430.0, 4803.0, 9479.0, 20680.0, 47659.0, 121504.0, 293549.0, 313504.0, 134930.0, 52433.0, 22643.0, 10233.0, 5298.0, 2554.0, 1519.0, 757.0, 422.0, 287.0, 172.0, 128.0, 75.0, 49.0, 37.0, 29.0, 18.0, 8.0, 9.0, 9.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.21044921875, -0.20408248901367188, -0.19771575927734375, -0.19134902954101562, -0.1849822998046875, -0.17861557006835938, -0.17224884033203125, -0.16588211059570312, -0.159515380859375, -0.15314865112304688, -0.14678192138671875, -0.14041519165039062, -0.1340484619140625, -0.12768173217773438, -0.12131500244140625, -0.11494827270507812, -0.10858154296875, -0.10221481323242188, -0.09584808349609375, -0.08948135375976562, -0.0831146240234375, -0.07674789428710938, -0.07038116455078125, -0.06401443481445312, -0.057647705078125, -0.051280975341796875, -0.04491424560546875, -0.038547515869140625, -0.0321807861328125, -0.025814056396484375, -0.01944732666015625, -0.013080596923828125, -0.0067138671875, -0.000347137451171875, 0.00601959228515625, 0.012386322021484375, 0.0187530517578125, 0.025119781494140625, 0.03148651123046875, 0.037853240966796875, 0.044219970703125, 0.050586700439453125, 0.05695343017578125, 0.06332015991210938, 0.0696868896484375, 0.07605361938476562, 0.08242034912109375, 0.08878707885742188, 0.09515380859375, 0.10152053833007812, 0.10788726806640625, 0.11425399780273438, 0.1206207275390625, 0.12698745727539062, 0.13335418701171875, 0.13972091674804688, 0.146087646484375, 0.15245437622070312, 0.15882110595703125, 0.16518783569335938, 0.1715545654296875, 0.17792129516601562, 0.18428802490234375, 0.19065475463867188, 0.197021484375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 4.0, 7.0, 9.0, 9.0, 8.0, 16.0, 10.0, 25.0, 31.0, 26.0, 31.0, 36.0, 38.0, 40.0, 43.0, 32.0, 39.0, 53.0, 1060.0, 49.0, 41.0, 41.0, 47.0, 39.0, 41.0, 34.0, 26.0, 25.0, 24.0, 23.0, 16.0, 17.0, 13.0, 12.0, 14.0, 11.0, 3.0, 8.0, 7.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7275390625, -0.7052764892578125, -0.683013916015625, -0.6607513427734375, -0.63848876953125, -0.6162261962890625, -0.593963623046875, -0.5717010498046875, -0.5494384765625, -0.5271759033203125, -0.504913330078125, -0.4826507568359375, -0.46038818359375, -0.4381256103515625, -0.415863037109375, -0.3936004638671875, -0.371337890625, -0.3490753173828125, -0.326812744140625, -0.3045501708984375, -0.28228759765625, -0.2600250244140625, -0.237762451171875, -0.2154998779296875, -0.1932373046875, -0.1709747314453125, -0.148712158203125, -0.1264495849609375, -0.10418701171875, -0.0819244384765625, -0.059661865234375, -0.0373992919921875, -0.01513671875, 0.0071258544921875, 0.029388427734375, 0.0516510009765625, 0.07391357421875, 0.0961761474609375, 0.118438720703125, 0.1407012939453125, 0.1629638671875, 0.1852264404296875, 0.207489013671875, 0.2297515869140625, 0.25201416015625, 0.2742767333984375, 0.296539306640625, 0.3188018798828125, 0.341064453125, 0.3633270263671875, 0.385589599609375, 0.4078521728515625, 0.43011474609375, 0.4523773193359375, 0.474639892578125, 0.4969024658203125, 0.5191650390625, 0.5414276123046875, 0.563690185546875, 0.5859527587890625, 0.60821533203125, 0.6304779052734375, 0.652740478515625, 0.6750030517578125, 0.697265625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 8.0, 6.0, 7.0, 16.0, 18.0, 26.0, 39.0, 39.0, 64.0, 96.0, 144.0, 225.0, 274.0, 418.0, 671.0, 1076.0, 1658.0, 2867.0, 4779.0, 8697.0, 16628.0, 33485.0, 74321.0, 177397.0, 1002537.0, 507606.0, 142422.0, 61076.0, 27885.0, 14045.0, 7627.0, 4215.0, 2444.0, 1427.0, 960.0, 668.0, 419.0, 261.0, 158.0, 128.0, 82.0, 73.0, 38.0, 21.0, 32.0, 21.0, 12.0, 9.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.09765625, -0.09438800811767578, -0.09111976623535156, -0.08785152435302734, -0.08458328247070312, -0.0813150405883789, -0.07804679870605469, -0.07477855682373047, -0.07151031494140625, -0.06824207305908203, -0.06497383117675781, -0.061705589294433594, -0.058437347412109375, -0.055169105529785156, -0.05190086364746094, -0.04863262176513672, -0.0453643798828125, -0.04209613800048828, -0.03882789611816406, -0.035559654235839844, -0.032291412353515625, -0.029023170471191406, -0.025754928588867188, -0.02248668670654297, -0.01921844482421875, -0.01595020294189453, -0.012681961059570312, -0.009413719177246094, -0.006145477294921875, -0.0028772354125976562, 0.0003910064697265625, 0.0036592483520507812, 0.006927490234375, 0.010195732116699219, 0.013463973999023438, 0.016732215881347656, 0.020000457763671875, 0.023268699645996094, 0.026536941528320312, 0.02980518341064453, 0.03307342529296875, 0.03634166717529297, 0.03960990905761719, 0.042878150939941406, 0.046146392822265625, 0.049414634704589844, 0.05268287658691406, 0.05595111846923828, 0.0592193603515625, 0.06248760223388672, 0.06575584411621094, 0.06902408599853516, 0.07229232788085938, 0.0755605697631836, 0.07882881164550781, 0.08209705352783203, 0.08536529541015625, 0.08863353729248047, 0.09190177917480469, 0.0951700210571289, 0.09843826293945312, 0.10170650482177734, 0.10497474670410156, 0.10824298858642578, 0.11151123046875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 6.0, 14.0, 10.0, 13.0, 12.0, 13.0, 21.0, 22.0, 28.0, 38.0, 70.0, 92.0, 157.0, 140.0, 91.0, 67.0, 50.0, 27.0, 21.0, 21.0, 16.0, 11.0, 7.0, 9.0, 3.0, 7.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0205230712890625, -0.019840717315673828, -0.019158363342285156, -0.018476009368896484, -0.017793655395507812, -0.01711130142211914, -0.01642894744873047, -0.015746593475341797, -0.015064239501953125, -0.014381885528564453, -0.013699531555175781, -0.01301717758178711, -0.012334823608398438, -0.011652469635009766, -0.010970115661621094, -0.010287761688232422, -0.00960540771484375, -0.008923053741455078, -0.008240699768066406, -0.007558345794677734, -0.0068759918212890625, -0.006193637847900391, -0.005511283874511719, -0.004828929901123047, -0.004146575927734375, -0.003464221954345703, -0.0027818679809570312, -0.0020995140075683594, -0.0014171600341796875, -0.0007348060607910156, -5.245208740234375e-05, 0.0006299018859863281, 0.001312255859375, 0.001994609832763672, 0.0026769638061523438, 0.0033593177795410156, 0.0040416717529296875, 0.004724025726318359, 0.005406379699707031, 0.006088733673095703, 0.006771087646484375, 0.007453441619873047, 0.008135795593261719, 0.00881814956665039, 0.009500503540039062, 0.010182857513427734, 0.010865211486816406, 0.011547565460205078, 0.01222991943359375, 0.012912273406982422, 0.013594627380371094, 0.014276981353759766, 0.014959335327148438, 0.01564168930053711, 0.01632404327392578, 0.017006397247314453, 0.017688751220703125, 0.018371105194091797, 0.01905345916748047, 0.01973581314086914, 0.020418167114257812, 0.021100521087646484, 0.021782875061035156, 0.022465229034423828, 0.0231475830078125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 2.0, 2.0, 2.0, 8.0, 11.0, 4.0, 12.0, 14.0, 21.0, 14.0, 23.0, 45.0, 44.0, 84.0, 189.0, 651.0, 31723.0, 1009731.0, 5207.0, 339.0, 129.0, 71.0, 52.0, 32.0, 17.0, 29.0, 17.0, 17.0, 11.0, 11.0, 12.0, 10.0, 6.0, 2.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.464599609375, -0.4502143859863281, -0.43582916259765625, -0.4214439392089844, -0.4070587158203125, -0.3926734924316406, -0.37828826904296875, -0.3639030456542969, -0.349517822265625, -0.3351325988769531, -0.32074737548828125, -0.3063621520996094, -0.2919769287109375, -0.2775917053222656, -0.26320648193359375, -0.24882125854492188, -0.23443603515625, -0.22005081176757812, -0.20566558837890625, -0.19128036499023438, -0.1768951416015625, -0.16250991821289062, -0.14812469482421875, -0.13373947143554688, -0.119354248046875, -0.10496902465820312, -0.09058380126953125, -0.07619857788085938, -0.0618133544921875, -0.047428131103515625, -0.03304290771484375, -0.018657684326171875, -0.0042724609375, 0.010112762451171875, 0.02449798583984375, 0.038883209228515625, 0.0532684326171875, 0.06765365600585938, 0.08203887939453125, 0.09642410278320312, 0.110809326171875, 0.12519454956054688, 0.13957977294921875, 0.15396499633789062, 0.1683502197265625, 0.18273544311523438, 0.19712066650390625, 0.21150588989257812, 0.22589111328125, 0.24027633666992188, 0.25466156005859375, 0.2690467834472656, 0.2834320068359375, 0.2978172302246094, 0.31220245361328125, 0.3265876770019531, 0.340972900390625, 0.3553581237792969, 0.36974334716796875, 0.3841285705566406, 0.3985137939453125, 0.4128990173339844, 0.42728424072265625, 0.4416694641113281, 0.4560546875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 18.0, 80.0, 217.0, 362.0, 227.0, 71.0, 26.0, 6.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06614507734775543, -0.06354967504739761, -0.0609542652964592, -0.05835885927081108, -0.055763453245162964, -0.053168050944805145, -0.05057264491915703, -0.04797723889350891, -0.045381832867860794, -0.04278642684221268, -0.04019102081656456, -0.03759561479091644, -0.035000212490558624, -0.03240480273962021, -0.02980940043926239, -0.027213994413614273, -0.024618588387966156, -0.02202318236231804, -0.019427776336669922, -0.016832372173666954, -0.014236966148018837, -0.01164156012237072, -0.009046155028045177, -0.006450749933719635, -0.003855343908071518, -0.0012599383480846882, 0.0013354672119021416, 0.003930872771888971, 0.006526278331875801, 0.009121684357523918, 0.01171708945184946, 0.014312494546175003, 0.016907908022403717, 0.019503314048051834, 0.02209872007369995, 0.02469412423670292, 0.027289530262351036, 0.029884936287999153, 0.03248034045100212, 0.03507574647665024, 0.037671152502298355, 0.04026655852794647, 0.04286196455359459, 0.045457370579242706, 0.048052772879600525, 0.05064818263053894, 0.05324358493089676, 0.055838990956544876, 0.05843439698219299, 0.06102980300784111, 0.06362520903348923, 0.06622061133384705, 0.06881602108478546, 0.07141142338514328, 0.0740068331360817, 0.07660223543643951, 0.07919764518737793, 0.08179304748773575, 0.08438845723867416, 0.08698385953903198, 0.0895792692899704, 0.09217467159032822, 0.09477008134126663, 0.09736548364162445, 0.09996088594198227]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 5.0, 6.0, 3.0, 4.0, 10.0, 11.0, 10.0, 18.0, 13.0, 12.0, 21.0, 16.0, 18.0, 29.0, 27.0, 23.0, 34.0, 50.0, 31.0, 37.0, 48.0, 42.0, 41.0, 49.0, 45.0, 38.0, 41.0, 35.0, 36.0, 37.0, 25.0, 23.0, 25.0, 20.0, 14.0, 13.0, 11.0, 16.0, 11.0, 12.0, 8.0, 10.0, 10.0, 3.0, 6.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.015985071659088135, -0.015387794934213161, -0.014790518209338188, -0.014193241484463215, -0.013595964759588242, -0.012998688034713268, -0.012401411309838295, -0.011804134584963322, -0.011206857860088348, -0.010609581135213375, -0.010012304410338402, -0.009415027685463428, -0.008817750960588455, -0.008220474235713482, -0.007623197510838509, -0.007025920785963535, -0.006428644061088562, -0.005831367336213589, -0.005234090611338615, -0.004636813886463642, -0.004039537161588669, -0.0034422604367136955, -0.0028449837118387222, -0.002247706986963749, -0.0016504302620887756, -0.0010531535372138023, -0.00045587681233882904, 0.00014139991253614426, 0.0007386766374111176, 0.0013359533622860909, 0.0019332300871610641, 0.0025305068120360374, 0.0031277835369110107, 0.003725060261785984, 0.004322336986660957, 0.004919613711535931, 0.005516890436410904, 0.006114167161285877, 0.0067114438861608505, 0.007308720611035824, 0.007905997335910797, 0.00850327406078577, 0.009100550785660744, 0.009697827510535717, 0.01029510423541069, 0.010892380960285664, 0.011489657685160637, 0.01208693441003561, 0.012684211134910583, 0.013281487859785557, 0.01387876458466053, 0.014476041309535503, 0.015073318034410477, 0.015670593827962875, 0.016267871484160423, 0.01686514914035797, 0.01746242493391037, 0.01805970072746277, 0.018656978383660316, 0.019254256039857864, 0.019851531833410263, 0.020448807626962662, 0.02104608528316021, 0.021643362939357758, 0.022240638732910156]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 9.0, 3.0, 9.0, 9.0, 10.0, 16.0, 8.0, 12.0, 21.0, 20.0, 20.0, 26.0, 30.0, 30.0, 32.0, 37.0, 32.0, 31.0, 25.0, 39.0, 29.0, 45.0, 43.0, 46.0, 39.0, 34.0, 30.0, 31.0, 39.0, 28.0, 38.0, 29.0, 22.0, 19.0, 17.0, 19.0, 20.0, 8.0, 8.0, 13.0, 7.0, 9.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.05078125, -1.0196914672851562, -0.9886016845703125, -0.9575119018554688, -0.926422119140625, -0.8953323364257812, -0.8642425537109375, -0.8331527709960938, -0.80206298828125, -0.7709732055664062, -0.7398834228515625, -0.7087936401367188, -0.677703857421875, -0.6466140747070312, -0.6155242919921875, -0.5844345092773438, -0.5533447265625, -0.5222549438476562, -0.4911651611328125, -0.46007537841796875, -0.428985595703125, -0.39789581298828125, -0.3668060302734375, -0.33571624755859375, -0.30462646484375, -0.27353668212890625, -0.2424468994140625, -0.21135711669921875, -0.180267333984375, -0.14917755126953125, -0.1180877685546875, -0.08699798583984375, -0.055908203125, -0.02481842041015625, 0.0062713623046875, 0.03736114501953125, 0.068450927734375, 0.09954071044921875, 0.1306304931640625, 0.16172027587890625, 0.19281005859375, 0.22389984130859375, 0.2549896240234375, 0.28607940673828125, 0.317169189453125, 0.34825897216796875, 0.3793487548828125, 0.41043853759765625, 0.4415283203125, 0.47261810302734375, 0.5037078857421875, 0.5347976684570312, 0.565887451171875, 0.5969772338867188, 0.6280670166015625, 0.6591567993164062, 0.69024658203125, 0.7213363647460938, 0.7524261474609375, 0.7835159301757812, 0.814605712890625, 0.8456954956054688, 0.8767852783203125, 0.9078750610351562, 0.93896484375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 7.0, 7.0, 14.0, 18.0, 26.0, 16.0, 31.0, 43.0, 85.0, 136.0, 206.0, 346.0, 647.0, 1108.0, 2051.0, 4000.0, 8145.0, 17543.0, 42553.0, 105096.0, 247471.0, 339748.0, 162642.0, 65952.0, 27000.0, 11752.0, 5584.0, 2829.0, 1489.0, 823.0, 464.0, 284.0, 136.0, 95.0, 74.0, 49.0, 25.0, 15.0, 12.0, 9.0, 7.0, 7.0, 2.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.65625, -1.603240966796875, -1.55023193359375, -1.497222900390625, -1.4442138671875, -1.391204833984375, -1.33819580078125, -1.285186767578125, -1.232177734375, -1.179168701171875, -1.12615966796875, -1.073150634765625, -1.0201416015625, -0.967132568359375, -0.91412353515625, -0.861114501953125, -0.80810546875, -0.755096435546875, -0.70208740234375, -0.649078369140625, -0.5960693359375, -0.543060302734375, -0.49005126953125, -0.437042236328125, -0.384033203125, -0.331024169921875, -0.27801513671875, -0.225006103515625, -0.1719970703125, -0.118988037109375, -0.06597900390625, -0.012969970703125, 0.0400390625, 0.093048095703125, 0.14605712890625, 0.199066162109375, 0.2520751953125, 0.305084228515625, 0.35809326171875, 0.411102294921875, 0.464111328125, 0.517120361328125, 0.57012939453125, 0.623138427734375, 0.6761474609375, 0.729156494140625, 0.78216552734375, 0.835174560546875, 0.88818359375, 0.941192626953125, 0.99420166015625, 1.047210693359375, 1.1002197265625, 1.153228759765625, 1.20623779296875, 1.259246826171875, 1.312255859375, 1.365264892578125, 1.41827392578125, 1.471282958984375, 1.5242919921875, 1.577301025390625, 1.63031005859375, 1.683319091796875, 1.736328125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 7.0, 6.0, 3.0, 8.0, 11.0, 8.0, 15.0, 16.0, 22.0, 21.0, 19.0, 37.0, 34.0, 37.0, 33.0, 50.0, 67.0, 114.0, 215.0, 1355.0, 318.0, 159.0, 95.0, 56.0, 52.0, 42.0, 43.0, 26.0, 36.0, 26.0, 28.0, 24.0, 15.0, 12.0, 10.0, 10.0, 8.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.873046875, -3.761688232421875, -3.65032958984375, -3.538970947265625, -3.4276123046875, -3.316253662109375, -3.20489501953125, -3.093536376953125, -2.982177734375, -2.870819091796875, -2.75946044921875, -2.648101806640625, -2.5367431640625, -2.425384521484375, -2.31402587890625, -2.202667236328125, -2.09130859375, -1.979949951171875, -1.86859130859375, -1.757232666015625, -1.6458740234375, -1.534515380859375, -1.42315673828125, -1.311798095703125, -1.200439453125, -1.089080810546875, -0.97772216796875, -0.866363525390625, -0.7550048828125, -0.643646240234375, -0.53228759765625, -0.420928955078125, -0.3095703125, -0.198211669921875, -0.08685302734375, 0.024505615234375, 0.1358642578125, 0.247222900390625, 0.35858154296875, 0.469940185546875, 0.581298828125, 0.692657470703125, 0.80401611328125, 0.915374755859375, 1.0267333984375, 1.138092041015625, 1.24945068359375, 1.360809326171875, 1.47216796875, 1.583526611328125, 1.69488525390625, 1.806243896484375, 1.9176025390625, 2.028961181640625, 2.14031982421875, 2.251678466796875, 2.363037109375, 2.474395751953125, 2.58575439453125, 2.697113037109375, 2.8084716796875, 2.919830322265625, 3.03118896484375, 3.142547607421875, 3.25390625]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 12.0, 6.0, 15.0, 17.0, 23.0, 29.0, 26.0, 42.0, 56.0, 71.0, 107.0, 187.0, 303.0, 695.0, 2183.0, 11348.0, 160355.0, 2678989.0, 271149.0, 15673.0, 2680.0, 828.0, 300.0, 169.0, 121.0, 74.0, 50.0, 44.0, 41.0, 24.0, 18.0, 15.0, 9.0, 14.0, 7.0, 8.0, 8.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6171875, -5.42724609375, -5.2373046875, -5.04736328125, -4.857421875, -4.66748046875, -4.4775390625, -4.28759765625, -4.09765625, -3.90771484375, -3.7177734375, -3.52783203125, -3.337890625, -3.14794921875, -2.9580078125, -2.76806640625, -2.578125, -2.38818359375, -2.1982421875, -2.00830078125, -1.818359375, -1.62841796875, -1.4384765625, -1.24853515625, -1.05859375, -0.86865234375, -0.6787109375, -0.48876953125, -0.298828125, -0.10888671875, 0.0810546875, 0.27099609375, 0.4609375, 0.65087890625, 0.8408203125, 1.03076171875, 1.220703125, 1.41064453125, 1.6005859375, 1.79052734375, 1.98046875, 2.17041015625, 2.3603515625, 2.55029296875, 2.740234375, 2.93017578125, 3.1201171875, 3.31005859375, 3.5, 3.68994140625, 3.8798828125, 4.06982421875, 4.259765625, 4.44970703125, 4.6396484375, 4.82958984375, 5.01953125, 5.20947265625, 5.3994140625, 5.58935546875, 5.779296875, 5.96923828125, 6.1591796875, 6.34912109375, 6.5390625]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 18.0, 249.0, 601.0, 144.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.164565086364746, -6.881267547607422, -5.5979695320129395, -4.314671516418457, -3.031373977661133, -1.7480764389038086, -0.46477842330932617, 0.8185195922851562, 2.1018171310424805, 3.385114908218384, 4.668412685394287, 5.9517107009887695, 7.235008239746094, 8.518305778503418, 9.801603317260742, 11.084901809692383, 12.368199348449707, 13.651496887207031, 14.934795379638672, 16.21809196472168, 17.50139045715332, 18.784687042236328, 20.06798553466797, 21.35128402709961, 22.63458251953125, 23.91788101196289, 25.2011775970459, 26.48447608947754, 27.767772674560547, 29.051071166992188, 30.334369659423828, 31.61766815185547, 32.900962829589844, 34.184261322021484, 35.467559814453125, 36.7508544921875, 38.03415298461914, 39.31745147705078, 40.60074996948242, 41.88404846191406, 43.16734313964844, 44.45064163208008, 45.73394012451172, 47.017234802246094, 48.300533294677734, 49.583831787109375, 50.867130279541016, 52.150428771972656, 53.4337272644043, 54.71702575683594, 56.00032424926758, 57.28361892700195, 58.566917419433594, 59.850215911865234, 61.133514404296875, 62.416812896728516, 63.700111389160156, 64.98340606689453, 66.26670837402344, 67.55000305175781, 68.83330535888672, 70.1166000366211, 71.39989471435547, 72.68319702148438, 73.96649169921875]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 9.0, 3.0, 10.0, 5.0, 12.0, 13.0, 11.0, 12.0, 10.0, 5.0, 17.0, 22.0, 24.0, 28.0, 31.0, 20.0, 25.0, 28.0, 40.0, 32.0, 32.0, 35.0, 30.0, 32.0, 34.0, 42.0, 41.0, 49.0, 37.0, 27.0, 32.0, 29.0, 30.0, 29.0, 26.0, 13.0, 24.0, 19.0, 19.0, 12.0, 13.0, 8.0, 8.0, 8.0, 2.0, 6.0, 4.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.77738094329834, -7.528471946716309, -7.279562473297119, -7.030653476715088, -6.781744003295898, -6.532835006713867, -6.283925533294678, -6.0350165367126465, -5.786107063293457, -5.537198066711426, -5.288288593292236, -5.039379596710205, -4.790470123291016, -4.541561126708984, -4.292651653289795, -4.043742656707764, -3.7948334217071533, -3.545924186706543, -3.2970149517059326, -3.0481057167053223, -2.799196481704712, -2.5502872467041016, -2.3013782501220703, -2.052468776702881, -1.80355966091156, -1.5546504259109497, -1.3057411909103394, -1.0568320751190186, -0.8079227805137634, -0.5590136051177979, -0.3101043701171875, -0.06119513511657715, 0.1877140998840332, 0.43662333488464355, 0.6855325698852539, 0.9344417452812195, 1.1833510398864746, 1.4322601556777954, 1.6811693906784058, 1.9300786256790161, 2.178987979888916, 2.4278972148895264, 2.6768064498901367, 2.925715684890747, 3.1746249198913574, 3.4235339164733887, 3.672443389892578, 3.9213523864746094, 4.170261383056641, 4.419170379638672, 4.668079853057861, 4.916988849639893, 5.165898323059082, 5.414807319641113, 5.663716793060303, 5.912625789642334, 6.161535263061523, 6.410444259643555, 6.659353733062744, 6.908262729644775, 7.157172203063965, 7.406081199645996, 7.6549906730651855, 7.903899669647217, 8.152809143066406]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 7.0, 6.0, 5.0, 5.0, 3.0, 7.0, 12.0, 16.0, 16.0, 12.0, 20.0, 24.0, 27.0, 33.0, 28.0, 28.0, 36.0, 41.0, 38.0, 42.0, 40.0, 38.0, 38.0, 46.0, 34.0, 33.0, 43.0, 37.0, 40.0, 31.0, 29.0, 21.0, 24.0, 23.0, 22.0, 15.0, 15.0, 12.0, 15.0, 7.0, 14.0, 4.0, 8.0, 5.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.052734375, -1.0191192626953125, -0.985504150390625, -0.9518890380859375, -0.91827392578125, -0.8846588134765625, -0.851043701171875, -0.8174285888671875, -0.7838134765625, -0.7501983642578125, -0.716583251953125, -0.6829681396484375, -0.64935302734375, -0.6157379150390625, -0.582122802734375, -0.5485076904296875, -0.514892578125, -0.4812774658203125, -0.447662353515625, -0.4140472412109375, -0.38043212890625, -0.3468170166015625, -0.313201904296875, -0.2795867919921875, -0.2459716796875, -0.2123565673828125, -0.178741455078125, -0.1451263427734375, -0.11151123046875, -0.0778961181640625, -0.044281005859375, -0.0106658935546875, 0.02294921875, 0.0565643310546875, 0.090179443359375, 0.1237945556640625, 0.15740966796875, 0.1910247802734375, 0.224639892578125, 0.2582550048828125, 0.2918701171875, 0.3254852294921875, 0.359100341796875, 0.3927154541015625, 0.42633056640625, 0.4599456787109375, 0.493560791015625, 0.5271759033203125, 0.560791015625, 0.5944061279296875, 0.628021240234375, 0.6616363525390625, 0.69525146484375, 0.7288665771484375, 0.762481689453125, 0.7960968017578125, 0.8297119140625, 0.8633270263671875, 0.896942138671875, 0.9305572509765625, 0.96417236328125, 0.9977874755859375, 1.031402587890625, 1.0650177001953125, 1.0986328125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 4.0, 8.0, 15.0, 17.0, 31.0, 32.0, 37.0, 88.0, 112.0, 155.0, 214.0, 310.0, 451.0, 699.0, 1005.0, 1555.0, 2465.0, 4182.0, 7441.0, 14460.0, 32447.0, 88081.0, 320626.0, 1457203.0, 1689774.0, 394416.0, 104632.0, 37762.0, 16279.0, 8183.0, 4437.0, 2499.0, 1603.0, 1031.0, 634.0, 405.0, 295.0, 194.0, 158.0, 109.0, 65.0, 47.0, 30.0, 23.0, 26.0, 9.0, 14.0, 7.0, 1.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-2.025390625, -1.964141845703125, -1.90289306640625, -1.841644287109375, -1.7803955078125, -1.719146728515625, -1.65789794921875, -1.596649169921875, -1.535400390625, -1.474151611328125, -1.41290283203125, -1.351654052734375, -1.2904052734375, -1.229156494140625, -1.16790771484375, -1.106658935546875, -1.04541015625, -0.984161376953125, -0.92291259765625, -0.861663818359375, -0.8004150390625, -0.739166259765625, -0.67791748046875, -0.616668701171875, -0.555419921875, -0.494171142578125, -0.43292236328125, -0.371673583984375, -0.3104248046875, -0.249176025390625, -0.18792724609375, -0.126678466796875, -0.0654296875, -0.004180908203125, 0.05706787109375, 0.118316650390625, 0.1795654296875, 0.240814208984375, 0.30206298828125, 0.363311767578125, 0.424560546875, 0.485809326171875, 0.54705810546875, 0.608306884765625, 0.6695556640625, 0.730804443359375, 0.79205322265625, 0.853302001953125, 0.91455078125, 0.975799560546875, 1.03704833984375, 1.098297119140625, 1.1595458984375, 1.220794677734375, 1.28204345703125, 1.343292236328125, 1.404541015625, 1.465789794921875, 1.52703857421875, 1.588287353515625, 1.6495361328125, 1.710784912109375, 1.77203369140625, 1.833282470703125, 1.89453125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 5.0, 7.0, 17.0, 12.0, 13.0, 20.0, 33.0, 37.0, 43.0, 53.0, 95.0, 126.0, 165.0, 234.0, 331.0, 452.0, 536.0, 523.0, 405.0, 268.0, 194.0, 140.0, 92.0, 76.0, 44.0, 43.0, 26.0, 14.0, 14.0, 15.0, 6.0, 6.0, 8.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.212890625, -2.1492767333984375, -2.085662841796875, -2.0220489501953125, -1.95843505859375, -1.8948211669921875, -1.831207275390625, -1.7675933837890625, -1.7039794921875, -1.6403656005859375, -1.576751708984375, -1.5131378173828125, -1.44952392578125, -1.3859100341796875, -1.322296142578125, -1.2586822509765625, -1.195068359375, -1.1314544677734375, -1.067840576171875, -1.0042266845703125, -0.94061279296875, -0.8769989013671875, -0.813385009765625, -0.7497711181640625, -0.6861572265625, -0.6225433349609375, -0.558929443359375, -0.4953155517578125, -0.43170166015625, -0.3680877685546875, -0.304473876953125, -0.2408599853515625, -0.17724609375, -0.1136322021484375, -0.050018310546875, 0.0135955810546875, 0.07720947265625, 0.1408233642578125, 0.204437255859375, 0.2680511474609375, 0.3316650390625, 0.3952789306640625, 0.458892822265625, 0.5225067138671875, 0.58612060546875, 0.6497344970703125, 0.713348388671875, 0.7769622802734375, 0.840576171875, 0.9041900634765625, 0.967803955078125, 1.0314178466796875, 1.09503173828125, 1.1586456298828125, 1.222259521484375, 1.2858734130859375, 1.3494873046875, 1.4131011962890625, 1.476715087890625, 1.5403289794921875, 1.60394287109375, 1.6675567626953125, 1.731170654296875, 1.7947845458984375, 1.8583984375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 7.0, 9.0, 12.0, 7.0, 16.0, 25.0, 29.0, 46.0, 54.0, 103.0, 193.0, 343.0, 720.0, 1757.0, 5187.0, 17627.0, 86546.0, 997738.0, 2823934.0, 213566.0, 32989.0, 8326.0, 2728.0, 1109.0, 536.0, 257.0, 140.0, 69.0, 69.0, 38.0, 24.0, 22.0, 15.0, 5.0, 10.0, 9.0, 6.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.28125, -4.1295166015625, -3.977783203125, -3.8260498046875, -3.67431640625, -3.5225830078125, -3.370849609375, -3.2191162109375, -3.0673828125, -2.9156494140625, -2.763916015625, -2.6121826171875, -2.46044921875, -2.3087158203125, -2.156982421875, -2.0052490234375, -1.853515625, -1.7017822265625, -1.550048828125, -1.3983154296875, -1.24658203125, -1.0948486328125, -0.943115234375, -0.7913818359375, -0.6396484375, -0.4879150390625, -0.336181640625, -0.1844482421875, -0.03271484375, 0.1190185546875, 0.270751953125, 0.4224853515625, 0.57421875, 0.7259521484375, 0.877685546875, 1.0294189453125, 1.18115234375, 1.3328857421875, 1.484619140625, 1.6363525390625, 1.7880859375, 1.9398193359375, 2.091552734375, 2.2432861328125, 2.39501953125, 2.5467529296875, 2.698486328125, 2.8502197265625, 3.001953125, 3.1536865234375, 3.305419921875, 3.4571533203125, 3.60888671875, 3.7606201171875, 3.912353515625, 4.0640869140625, 4.2158203125, 4.3675537109375, 4.519287109375, 4.6710205078125, 4.82275390625, 4.9744873046875, 5.126220703125, 5.2779541015625, 5.4296875]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 31.0, 241.0, 579.0, 156.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.012923240661621, -12.126651763916016, -10.24038028717041, -8.354108810424805, -6.467837333679199, -4.581565856933594, -2.6952943801879883, -0.8090229034423828, 1.0772485733032227, 2.963520050048828, 4.849791526794434, 6.736063003540039, 8.622334480285645, 10.50860595703125, 12.394877433776855, 14.281148910522461, 16.16741943359375, 18.053691864013672, 19.93996238708496, 21.82623291015625, 23.712505340576172, 25.598777770996094, 27.485048294067383, 29.371318817138672, 31.257591247558594, 33.143863677978516, 35.03013610839844, 36.916404724121094, 38.802677154541016, 40.68894958496094, 42.575218200683594, 44.461490631103516, 46.34776306152344, 48.23403549194336, 50.12030792236328, 52.00657653808594, 53.89284896850586, 55.77912139892578, 57.66539001464844, 59.55166244506836, 61.43793487548828, 63.3242073059082, 65.21047973632812, 67.09674835205078, 68.98301696777344, 70.86929321289062, 72.75556182861328, 74.64183807373047, 76.52810668945312, 78.41437530517578, 80.30065155029297, 82.18692016601562, 84.07319641113281, 85.95946502685547, 87.84573364257812, 89.73200988769531, 91.61827850341797, 93.50454711914062, 95.39082336425781, 97.27709197998047, 99.16336059570312, 101.04963684082031, 102.93590545654297, 104.82218170166016, 106.70845031738281]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 6.0, 6.0, 6.0, 5.0, 9.0, 13.0, 7.0, 8.0, 16.0, 14.0, 20.0, 16.0, 28.0, 20.0, 23.0, 27.0, 32.0, 22.0, 44.0, 34.0, 43.0, 32.0, 45.0, 38.0, 35.0, 32.0, 30.0, 44.0, 39.0, 33.0, 34.0, 31.0, 19.0, 24.0, 21.0, 13.0, 24.0, 16.0, 22.0, 14.0, 14.0, 10.0, 9.0, 11.0, 3.0, 1.0, 6.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.533347129821777, -5.341763019561768, -5.150179386138916, -4.958595275878906, -4.767011642456055, -4.575427532196045, -4.383843421936035, -4.192259788513184, -4.000675678253174, -3.809091806411743, -3.6175079345703125, -3.4259238243103027, -3.234339952468872, -3.0427560806274414, -2.8511719703674316, -2.659588098526001, -2.4680042266845703, -2.2764203548431396, -2.084836483001709, -1.8932523727416992, -1.7016685009002686, -1.510084629058838, -1.3185006380081177, -1.1269166469573975, -0.9353327751159668, -0.7437488436698914, -0.5521649122238159, -0.3605809807777405, -0.16899704933166504, 0.0225868821144104, 0.21417081356048584, 0.40575480461120605, 0.5973386764526367, 0.7889226078987122, 0.9805065393447876, 1.1720905303955078, 1.3636744022369385, 1.5552582740783691, 1.7468422651290894, 1.9384262561798096, 2.1300101280212402, 2.321593999862671, 2.5131778717041016, 2.7047619819641113, 2.896345853805542, 3.0879297256469727, 3.2795138359069824, 3.471097707748413, 3.6626815795898438, 3.8542654514312744, 4.045849323272705, 4.237433433532715, 4.429017066955566, 4.620601177215576, 4.812185287475586, 5.0037689208984375, 5.195353031158447, 5.386937141418457, 5.578520774841309, 5.770104885101318, 5.961688995361328, 6.15327262878418, 6.3448567390441895, 6.536440849304199, 6.728024482727051]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 1.0, 5.0, 3.0, 2.0, 6.0, 5.0, 8.0, 10.0, 12.0, 16.0, 19.0, 21.0, 22.0, 23.0, 28.0, 27.0, 40.0, 34.0, 31.0, 44.0, 39.0, 40.0, 39.0, 41.0, 49.0, 41.0, 41.0, 38.0, 38.0, 42.0, 18.0, 25.0, 16.0, 27.0, 24.0, 24.0, 20.0, 17.0, 13.0, 10.0, 14.0, 8.0, 6.0, 6.0, 6.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0625, -1.0278167724609375, -0.993133544921875, -0.9584503173828125, -0.92376708984375, -0.8890838623046875, -0.854400634765625, -0.8197174072265625, -0.7850341796875, -0.7503509521484375, -0.715667724609375, -0.6809844970703125, -0.64630126953125, -0.6116180419921875, -0.576934814453125, -0.5422515869140625, -0.507568359375, -0.4728851318359375, -0.438201904296875, -0.4035186767578125, -0.36883544921875, -0.3341522216796875, -0.299468994140625, -0.2647857666015625, -0.2301025390625, -0.1954193115234375, -0.160736083984375, -0.1260528564453125, -0.09136962890625, -0.0566864013671875, -0.022003173828125, 0.0126800537109375, 0.04736328125, 0.0820465087890625, 0.116729736328125, 0.1514129638671875, 0.18609619140625, 0.2207794189453125, 0.255462646484375, 0.2901458740234375, 0.3248291015625, 0.3595123291015625, 0.394195556640625, 0.4288787841796875, 0.46356201171875, 0.4982452392578125, 0.532928466796875, 0.5676116943359375, 0.602294921875, 0.6369781494140625, 0.671661376953125, 0.7063446044921875, 0.74102783203125, 0.7757110595703125, 0.810394287109375, 0.8450775146484375, 0.8797607421875, 0.9144439697265625, 0.949127197265625, 0.9838104248046875, 1.01849365234375, 1.0531768798828125, 1.087860107421875, 1.1225433349609375, 1.1572265625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 5.0, 8.0, 5.0, 18.0, 16.0, 25.0, 24.0, 40.0, 70.0, 101.0, 142.0, 199.0, 304.0, 449.0, 682.0, 1074.0, 1734.0, 2904.0, 4738.0, 7918.0, 14229.0, 25542.0, 46663.0, 85966.0, 149733.0, 221796.0, 202411.0, 125118.0, 69188.0, 38079.0, 20425.0, 11824.0, 6600.0, 3943.0, 2289.0, 1479.0, 960.0, 638.0, 392.0, 273.0, 159.0, 116.0, 76.0, 57.0, 53.0, 30.0, 23.0, 21.0, 11.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.1187744140625, -0.11515617370605469, -0.11153793334960938, -0.10791969299316406, -0.10430145263671875, -0.10068321228027344, -0.09706497192382812, -0.09344673156738281, -0.0898284912109375, -0.08621025085449219, -0.08259201049804688, -0.07897377014160156, -0.07535552978515625, -0.07173728942871094, -0.06811904907226562, -0.06450080871582031, -0.060882568359375, -0.05726432800292969, -0.053646087646484375, -0.05002784729003906, -0.04640960693359375, -0.04279136657714844, -0.039173126220703125, -0.03555488586425781, -0.0319366455078125, -0.028318405151367188, -0.024700164794921875, -0.021081924438476562, -0.01746368408203125, -0.013845443725585938, -0.010227203369140625, -0.0066089630126953125, -0.00299072265625, 0.0006275177001953125, 0.004245758056640625, 0.007863998413085938, 0.01148223876953125, 0.015100479125976562, 0.018718719482421875, 0.022336959838867188, 0.0259552001953125, 0.029573440551757812, 0.033191680908203125, 0.03680992126464844, 0.04042816162109375, 0.04404640197753906, 0.047664642333984375, 0.05128288269042969, 0.054901123046875, 0.05851936340332031, 0.062137603759765625, 0.06575584411621094, 0.06937408447265625, 0.07299232482910156, 0.07661056518554688, 0.08022880554199219, 0.0838470458984375, 0.08746528625488281, 0.09108352661132812, 0.09470176696777344, 0.09832000732421875, 0.10193824768066406, 0.10555648803710938, 0.10917472839355469, 0.11279296875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 0.0, 4.0, 6.0, 4.0, 4.0, 11.0, 12.0, 9.0, 15.0, 13.0, 19.0, 20.0, 25.0, 17.0, 16.0, 30.0, 33.0, 26.0, 27.0, 27.0, 42.0, 39.0, 35.0, 40.0, 1066.0, 51.0, 40.0, 38.0, 42.0, 37.0, 43.0, 23.0, 20.0, 26.0, 24.0, 20.0, 25.0, 15.0, 18.0, 14.0, 8.0, 7.0, 10.0, 7.0, 4.0, 4.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.72412109375, -0.70184326171875, -0.6795654296875, -0.65728759765625, -0.635009765625, -0.61273193359375, -0.5904541015625, -0.56817626953125, -0.5458984375, -0.52362060546875, -0.5013427734375, -0.47906494140625, -0.456787109375, -0.43450927734375, -0.4122314453125, -0.38995361328125, -0.36767578125, -0.34539794921875, -0.3231201171875, -0.30084228515625, -0.278564453125, -0.25628662109375, -0.2340087890625, -0.21173095703125, -0.189453125, -0.16717529296875, -0.1448974609375, -0.12261962890625, -0.100341796875, -0.07806396484375, -0.0557861328125, -0.03350830078125, -0.01123046875, 0.01104736328125, 0.0333251953125, 0.05560302734375, 0.077880859375, 0.10015869140625, 0.1224365234375, 0.14471435546875, 0.1669921875, 0.18927001953125, 0.2115478515625, 0.23382568359375, 0.256103515625, 0.27838134765625, 0.3006591796875, 0.32293701171875, 0.34521484375, 0.36749267578125, 0.3897705078125, 0.41204833984375, 0.434326171875, 0.45660400390625, 0.4788818359375, 0.50115966796875, 0.5234375, 0.54571533203125, 0.5679931640625, 0.59027099609375, 0.612548828125, 0.63482666015625, 0.6571044921875, 0.67938232421875, 0.70166015625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 0.0, 9.0, 6.0, 12.0, 18.0, 36.0, 39.0, 65.0, 109.0, 176.0, 271.0, 485.0, 797.0, 1428.0, 2526.0, 4739.0, 8868.0, 17196.0, 34878.0, 74096.0, 163826.0, 1041261.0, 488381.0, 135030.0, 62027.0, 29565.0, 14587.0, 7467.0, 4028.0, 2150.0, 1236.0, 708.0, 414.0, 254.0, 157.0, 91.0, 74.0, 38.0, 28.0, 20.0, 7.0, 11.0, 5.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09857177734375, -0.09547996520996094, -0.09238815307617188, -0.08929634094238281, -0.08620452880859375, -0.08311271667480469, -0.08002090454101562, -0.07692909240722656, -0.0738372802734375, -0.07074546813964844, -0.06765365600585938, -0.06456184387207031, -0.06147003173828125, -0.05837821960449219, -0.055286407470703125, -0.05219459533691406, -0.049102783203125, -0.04601097106933594, -0.042919158935546875, -0.03982734680175781, -0.03673553466796875, -0.03364372253417969, -0.030551910400390625, -0.027460098266601562, -0.0243682861328125, -0.021276473999023438, -0.018184661865234375, -0.015092849731445312, -0.01200103759765625, -0.008909225463867188, -0.005817413330078125, -0.0027256011962890625, 0.0003662109375, 0.0034580230712890625, 0.006549835205078125, 0.009641647338867188, 0.01273345947265625, 0.015825271606445312, 0.018917083740234375, 0.022008895874023438, 0.0251007080078125, 0.028192520141601562, 0.031284332275390625, 0.03437614440917969, 0.03746795654296875, 0.04055976867675781, 0.043651580810546875, 0.04674339294433594, 0.049835205078125, 0.05292701721191406, 0.056018829345703125, 0.05911064147949219, 0.06220245361328125, 0.06529426574707031, 0.06838607788085938, 0.07147789001464844, 0.0745697021484375, 0.07766151428222656, 0.08075332641601562, 0.08384513854980469, 0.08693695068359375, 0.09002876281738281, 0.09312057495117188, 0.09621238708496094, 0.09930419921875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 3.0, 10.0, 2.0, 9.0, 16.0, 7.0, 7.0, 9.0, 13.0, 19.0, 13.0, 19.0, 31.0, 26.0, 38.0, 33.0, 56.0, 51.0, 60.0, 72.0, 64.0, 57.0, 62.0, 54.0, 44.0, 28.0, 27.0, 25.0, 22.0, 21.0, 10.0, 14.0, 9.0, 7.0, 16.0, 8.0, 9.0, 6.0, 4.0, 4.0, 2.0, 5.0, 4.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00672149658203125, -0.006525516510009766, -0.006329536437988281, -0.006133556365966797, -0.0059375762939453125, -0.005741596221923828, -0.005545616149902344, -0.005349636077880859, -0.005153656005859375, -0.004957675933837891, -0.004761695861816406, -0.004565715789794922, -0.0043697357177734375, -0.004173755645751953, -0.003977775573730469, -0.0037817955017089844, -0.0035858154296875, -0.0033898353576660156, -0.0031938552856445312, -0.002997875213623047, -0.0028018951416015625, -0.002605915069580078, -0.0024099349975585938, -0.0022139549255371094, -0.002017974853515625, -0.0018219947814941406, -0.0016260147094726562, -0.0014300346374511719, -0.0012340545654296875, -0.0010380744934082031, -0.0008420944213867188, -0.0006461143493652344, -0.00045013427734375, -0.0002541542053222656, -5.817413330078125e-05, 0.00013780593872070312, 0.0003337860107421875, 0.0005297660827636719, 0.0007257461547851562, 0.0009217262268066406, 0.001117706298828125, 0.0013136863708496094, 0.0015096664428710938, 0.0017056465148925781, 0.0019016265869140625, 0.002097606658935547, 0.0022935867309570312, 0.0024895668029785156, 0.002685546875, 0.0028815269470214844, 0.0030775070190429688, 0.003273487091064453, 0.0034694671630859375, 0.003665447235107422, 0.0038614273071289062, 0.004057407379150391, 0.004253387451171875, 0.004449367523193359, 0.004645347595214844, 0.004841327667236328, 0.0050373077392578125, 0.005233287811279297, 0.005429267883300781, 0.005625247955322266, 0.00582122802734375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 9.0, 5.0, 1.0, 6.0, 6.0, 7.0, 11.0, 8.0, 13.0, 14.0, 12.0, 19.0, 24.0, 36.0, 50.0, 66.0, 91.0, 127.0, 185.0, 514.0, 3626.0, 149785.0, 880046.0, 11945.0, 1005.0, 302.0, 172.0, 120.0, 73.0, 60.0, 40.0, 34.0, 27.0, 16.0, 10.0, 13.0, 9.0, 10.0, 13.0, 10.0, 5.0, 1.0, 8.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.11566162109375, -0.1118326187133789, -0.10800361633300781, -0.10417461395263672, -0.10034561157226562, -0.09651660919189453, -0.09268760681152344, -0.08885860443115234, -0.08502960205078125, -0.08120059967041016, -0.07737159729003906, -0.07354259490966797, -0.06971359252929688, -0.06588459014892578, -0.06205558776855469, -0.058226585388183594, -0.0543975830078125, -0.050568580627441406, -0.04673957824707031, -0.04291057586669922, -0.039081573486328125, -0.03525257110595703, -0.03142356872558594, -0.027594566345214844, -0.02376556396484375, -0.019936561584472656, -0.016107559204101562, -0.012278556823730469, -0.008449554443359375, -0.004620552062988281, -0.0007915496826171875, 0.0030374526977539062, 0.006866455078125, 0.010695457458496094, 0.014524459838867188, 0.01835346221923828, 0.022182464599609375, 0.02601146697998047, 0.029840469360351562, 0.033669471740722656, 0.03749847412109375, 0.041327476501464844, 0.04515647888183594, 0.04898548126220703, 0.052814483642578125, 0.05664348602294922, 0.06047248840332031, 0.0643014907836914, 0.0681304931640625, 0.0719594955444336, 0.07578849792480469, 0.07961750030517578, 0.08344650268554688, 0.08727550506591797, 0.09110450744628906, 0.09493350982666016, 0.09876251220703125, 0.10259151458740234, 0.10642051696777344, 0.11024951934814453, 0.11407852172851562, 0.11790752410888672, 0.12173652648925781, 0.1255655288696289, 0.12939453125]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 10.0, 67.0, 270.0, 443.0, 170.0, 44.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007522056810557842, -0.005726903676986694, -0.003931750543415546, -0.0021365974098443985, -0.0003414442762732506, 0.0014537088572978973, 0.0032488619908690453, 0.005044015124440193, 0.006839168258011341, 0.008634321391582489, 0.010429474525153637, 0.012224627658724785, 0.014019780792295933, 0.01581493392586708, 0.017610087990760803, 0.019405240193009377, 0.02120039239525795, 0.022995546460151672, 0.024790698662400246, 0.02658585086464882, 0.02838100492954254, 0.030176158994436264, 0.03197131305932999, 0.03376646339893341, 0.03556161746382713, 0.037356771528720856, 0.03915192186832428, 0.040947075933218, 0.042742229998111725, 0.04453738406300545, 0.04633253812789917, 0.048127688467502594, 0.049922846257686615, 0.05171800032258034, 0.05351315438747406, 0.055308304727077484, 0.05710345879197121, 0.05889861285686493, 0.06069376319646835, 0.062488917261362076, 0.0642840713262558, 0.06607922166585922, 0.06787437945604324, 0.06966952979564667, 0.07146468758583069, 0.07325983792543411, 0.07505498826503754, 0.07685014605522156, 0.07864529639482498, 0.0804404467344284, 0.08223560452461243, 0.08403075486421585, 0.08582590520381927, 0.0876210629940033, 0.08941621333360672, 0.09121137112379074, 0.09300652146339417, 0.09480167180299759, 0.09659682959318161, 0.09839197993278503, 0.10018713772296906, 0.10198228806257248, 0.1037774384021759, 0.10557259619235992, 0.10736774653196335]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 3.0, 8.0, 5.0, 11.0, 15.0, 14.0, 10.0, 21.0, 27.0, 25.0, 20.0, 34.0, 30.0, 31.0, 35.0, 55.0, 40.0, 35.0, 41.0, 31.0, 39.0, 46.0, 44.0, 34.0, 30.0, 46.0, 42.0, 27.0, 29.0, 18.0, 30.0, 18.0, 14.0, 23.0, 14.0, 11.0, 11.0, 10.0, 9.0, 1.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.010213494300842285, -0.009885085746645927, -0.00955667719244957, -0.009228268638253212, -0.008899860084056854, -0.008571451529860497, -0.008243042975664139, -0.007914634421467781, -0.007586225867271423, -0.007257817313075066, -0.006929408758878708, -0.00660100020468235, -0.006272591650485992, -0.005944183096289635, -0.005615774542093277, -0.005287365987896919, -0.0049589574337005615, -0.004630548879504204, -0.004302140325307846, -0.003973731771111488, -0.0036453232169151306, -0.003316914662718773, -0.002988506108522415, -0.0026600975543260574, -0.0023316890001296997, -0.002003280445933342, -0.0016748718917369843, -0.0013464633375406265, -0.0010180547833442688, -0.0006896462291479111, -0.00036123767495155334, -3.282912075519562e-05, 0.0002955794334411621, 0.0006239879876375198, 0.0009523965418338776, 0.0012808050960302353, 0.001609213650226593, 0.0019376222044229507, 0.0022660307586193085, 0.002594439312815666, 0.002922847867012024, 0.0032512564212083817, 0.0035796649754047394, 0.003908073529601097, 0.004236482083797455, 0.0045648906379938126, 0.00489329919219017, 0.005221707746386528, 0.005550116300582886, 0.0058785248547792435, 0.006206933408975601, 0.006535341963171959, 0.006863750517368317, 0.007192159071564674, 0.007520567625761032, 0.00784897617995739, 0.008177384734153748, 0.008505793288350105, 0.008834201842546463, 0.00916261039674282, 0.009491018950939178, 0.009819427505135536, 0.010147836059331894, 0.010476244613528252, 0.01080465316772461]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 4.0, 1.0, 5.0, 1.0, 4.0, 6.0, 4.0, 9.0, 10.0, 11.0, 17.0, 19.0, 20.0, 23.0, 22.0, 28.0, 28.0, 38.0, 36.0, 29.0, 44.0, 41.0, 40.0, 39.0, 41.0, 49.0, 41.0, 41.0, 38.0, 36.0, 43.0, 19.0, 25.0, 16.0, 27.0, 24.0, 24.0, 20.0, 17.0, 13.0, 10.0, 14.0, 8.0, 6.0, 6.0, 6.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0634765625, -1.028778076171875, -0.99407958984375, -0.959381103515625, -0.9246826171875, -0.889984130859375, -0.85528564453125, -0.820587158203125, -0.785888671875, -0.751190185546875, -0.71649169921875, -0.681793212890625, -0.6470947265625, -0.612396240234375, -0.57769775390625, -0.542999267578125, -0.50830078125, -0.473602294921875, -0.43890380859375, -0.404205322265625, -0.3695068359375, -0.334808349609375, -0.30010986328125, -0.265411376953125, -0.230712890625, -0.196014404296875, -0.16131591796875, -0.126617431640625, -0.0919189453125, -0.057220458984375, -0.02252197265625, 0.012176513671875, 0.046875, 0.081573486328125, 0.11627197265625, 0.150970458984375, 0.1856689453125, 0.220367431640625, 0.25506591796875, 0.289764404296875, 0.324462890625, 0.359161376953125, 0.39385986328125, 0.428558349609375, 0.4632568359375, 0.497955322265625, 0.53265380859375, 0.567352294921875, 0.60205078125, 0.636749267578125, 0.67144775390625, 0.706146240234375, 0.7408447265625, 0.775543212890625, 0.81024169921875, 0.844940185546875, 0.879638671875, 0.914337158203125, 0.94903564453125, 0.983734130859375, 1.0184326171875, 1.053131103515625, 1.08782958984375, 1.122528076171875, 1.1572265625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 9.0, 8.0, 6.0, 12.0, 17.0, 28.0, 34.0, 36.0, 56.0, 93.0, 103.0, 156.0, 234.0, 411.0, 739.0, 1311.0, 2574.0, 4928.0, 9838.0, 20116.0, 45173.0, 139869.0, 552221.0, 174788.0, 50743.0, 22450.0, 10824.0, 5500.0, 2787.0, 1445.0, 791.0, 401.0, 273.0, 166.0, 106.0, 81.0, 49.0, 43.0, 38.0, 34.0, 19.0, 11.0, 9.0, 10.0, 4.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.302734375, -2.224853515625, -2.14697265625, -2.069091796875, -1.9912109375, -1.913330078125, -1.83544921875, -1.757568359375, -1.6796875, -1.601806640625, -1.52392578125, -1.446044921875, -1.3681640625, -1.290283203125, -1.21240234375, -1.134521484375, -1.056640625, -0.978759765625, -0.90087890625, -0.822998046875, -0.7451171875, -0.667236328125, -0.58935546875, -0.511474609375, -0.43359375, -0.355712890625, -0.27783203125, -0.199951171875, -0.1220703125, -0.044189453125, 0.03369140625, 0.111572265625, 0.189453125, 0.267333984375, 0.34521484375, 0.423095703125, 0.5009765625, 0.578857421875, 0.65673828125, 0.734619140625, 0.8125, 0.890380859375, 0.96826171875, 1.046142578125, 1.1240234375, 1.201904296875, 1.27978515625, 1.357666015625, 1.435546875, 1.513427734375, 1.59130859375, 1.669189453125, 1.7470703125, 1.824951171875, 1.90283203125, 1.980712890625, 2.05859375, 2.136474609375, 2.21435546875, 2.292236328125, 2.3701171875, 2.447998046875, 2.52587890625, 2.603759765625, 2.681640625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 5.0, 3.0, 3.0, 2.0, 5.0, 3.0, 12.0, 13.0, 12.0, 15.0, 15.0, 18.0, 30.0, 22.0, 25.0, 26.0, 32.0, 27.0, 35.0, 53.0, 58.0, 78.0, 143.0, 250.0, 1371.0, 233.0, 118.0, 66.0, 53.0, 41.0, 39.0, 40.0, 33.0, 32.0, 20.0, 16.0, 29.0, 15.0, 12.0, 12.0, 7.0, 6.0, 2.0, 4.0, 10.0, 5.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 4.0], "bins": [-3.482421875, -3.384033203125, -3.28564453125, -3.187255859375, -3.0888671875, -2.990478515625, -2.89208984375, -2.793701171875, -2.6953125, -2.596923828125, -2.49853515625, -2.400146484375, -2.3017578125, -2.203369140625, -2.10498046875, -2.006591796875, -1.908203125, -1.809814453125, -1.71142578125, -1.613037109375, -1.5146484375, -1.416259765625, -1.31787109375, -1.219482421875, -1.12109375, -1.022705078125, -0.92431640625, -0.825927734375, -0.7275390625, -0.629150390625, -0.53076171875, -0.432373046875, -0.333984375, -0.235595703125, -0.13720703125, -0.038818359375, 0.0595703125, 0.157958984375, 0.25634765625, 0.354736328125, 0.453125, 0.551513671875, 0.64990234375, 0.748291015625, 0.8466796875, 0.945068359375, 1.04345703125, 1.141845703125, 1.240234375, 1.338623046875, 1.43701171875, 1.535400390625, 1.6337890625, 1.732177734375, 1.83056640625, 1.928955078125, 2.02734375, 2.125732421875, 2.22412109375, 2.322509765625, 2.4208984375, 2.519287109375, 2.61767578125, 2.716064453125, 2.814453125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 0.0, 2.0, 7.0, 10.0, 6.0, 11.0, 11.0, 18.0, 23.0, 20.0, 34.0, 47.0, 54.0, 62.0, 109.0, 147.0, 291.0, 594.0, 1522.0, 5640.0, 28574.0, 331828.0, 2651647.0, 104649.0, 14787.0, 3344.0, 1078.0, 414.0, 213.0, 150.0, 92.0, 60.0, 44.0, 43.0, 29.0, 29.0, 26.0, 22.0, 18.0, 14.0, 11.0, 3.0, 6.0, 2.0, 6.0, 3.0, 1.0, 0.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.6015625, -5.4036865234375, -5.205810546875, -5.0079345703125, -4.81005859375, -4.6121826171875, -4.414306640625, -4.2164306640625, -4.0185546875, -3.8206787109375, -3.622802734375, -3.4249267578125, -3.22705078125, -3.0291748046875, -2.831298828125, -2.6334228515625, -2.435546875, -2.2376708984375, -2.039794921875, -1.8419189453125, -1.64404296875, -1.4461669921875, -1.248291015625, -1.0504150390625, -0.8525390625, -0.6546630859375, -0.456787109375, -0.2589111328125, -0.06103515625, 0.1368408203125, 0.334716796875, 0.5325927734375, 0.73046875, 0.9283447265625, 1.126220703125, 1.3240966796875, 1.52197265625, 1.7198486328125, 1.917724609375, 2.1156005859375, 2.3134765625, 2.5113525390625, 2.709228515625, 2.9071044921875, 3.10498046875, 3.3028564453125, 3.500732421875, 3.6986083984375, 3.896484375, 4.0943603515625, 4.292236328125, 4.4901123046875, 4.68798828125, 4.8858642578125, 5.083740234375, 5.2816162109375, 5.4794921875, 5.6773681640625, 5.875244140625, 6.0731201171875, 6.27099609375, 6.4688720703125, 6.666748046875, 6.8646240234375, 7.0625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 10.0, 34.0, 96.0, 202.0, 294.0, 213.0, 106.0, 34.0, 16.0, 7.0, 1.0], "bins": [-37.37522888183594, -36.724788665771484, -36.07434844970703, -35.42390823364258, -34.773468017578125, -34.12302780151367, -33.47258758544922, -32.822147369384766, -32.17170715332031, -31.52126693725586, -30.870826721191406, -30.220386505126953, -29.5699462890625, -28.919506072998047, -28.269065856933594, -27.61862564086914, -26.968183517456055, -26.3177433013916, -25.66730308532715, -25.016862869262695, -24.366422653198242, -23.71598243713379, -23.065542221069336, -22.41510009765625, -21.764659881591797, -21.114219665527344, -20.46377944946289, -19.813339233398438, -19.162899017333984, -18.51245880126953, -17.862018585205078, -17.211578369140625, -16.561138153076172, -15.910697937011719, -15.260257720947266, -14.609817504882812, -13.95937728881836, -13.308937072753906, -12.658495903015137, -12.008055686950684, -11.357616424560547, -10.707176208496094, -10.05673599243164, -9.406295776367188, -8.755855560302734, -8.105415344238281, -7.454974174499512, -6.804533958435059, -6.154093265533447, -5.503653049468994, -4.853212356567383, -4.20277214050293, -3.5523319244384766, -2.9018917083740234, -2.251451253890991, -1.601010799407959, -0.9505705833435059, -0.3001302480697632, 0.3503100872039795, 1.0007504224777222, 1.6511907577514648, 2.301630973815918, 2.95207142829895, 3.6025118827819824, 4.2529520988464355]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 4.0, 6.0, 11.0, 6.0, 5.0, 8.0, 12.0, 14.0, 13.0, 18.0, 23.0, 20.0, 28.0, 25.0, 22.0, 33.0, 27.0, 34.0, 38.0, 38.0, 33.0, 48.0, 48.0, 32.0, 41.0, 38.0, 42.0, 39.0, 34.0, 29.0, 31.0, 28.0, 27.0, 18.0, 20.0, 18.0, 20.0, 17.0, 9.0, 9.0, 7.0, 4.0, 6.0, 4.0, 4.0, 2.0, 2.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-8.84592056274414, -8.57669448852539, -8.307469367980957, -8.038243293762207, -7.769018173217773, -7.499792098999023, -7.230566501617432, -6.96134090423584, -6.692115306854248, -6.422889709472656, -6.1536641120910645, -5.884438514709473, -5.615212440490723, -5.345987319946289, -5.076761245727539, -4.807535648345947, -4.5383100509643555, -4.269084453582764, -3.999858856201172, -3.730633020401001, -3.461407423019409, -3.1921818256378174, -2.9229559898376465, -2.6537303924560547, -2.384504795074463, -2.115279197692871, -1.8460534811019897, -1.5768277645111084, -1.3076021671295166, -1.0383765697479248, -0.7691508531570435, -0.4999251365661621, -0.23070049285888672, 0.038525164127349854, 0.3077508211135864, 0.576976478099823, 0.8462021350860596, 1.1154277324676514, 1.3846534490585327, 1.653879165649414, 1.9231047630310059, 2.1923303604125977, 2.4615559577941895, 2.7307817935943604, 3.000007390975952, 3.269232988357544, 3.538458824157715, 3.8076844215393066, 4.076910018920898, 4.34613561630249, 4.615361213684082, 4.884586811065674, 5.153812408447266, 5.423038482666016, 5.692264080047607, 5.961489677429199, 6.230715274810791, 6.499940872192383, 6.769166469573975, 7.038392066955566, 7.307618141174316, 7.57684326171875, 7.8460693359375, 8.11529541015625, 8.384520530700684]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 2.0, 8.0, 7.0, 6.0, 17.0, 8.0, 11.0, 20.0, 28.0, 23.0, 19.0, 38.0, 33.0, 32.0, 29.0, 38.0, 37.0, 43.0, 40.0, 41.0, 47.0, 51.0, 33.0, 38.0, 37.0, 35.0, 34.0, 31.0, 28.0, 31.0, 19.0, 15.0, 14.0, 18.0, 17.0, 18.0, 16.0, 11.0, 6.0, 4.0, 14.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1533203125, -1.1154937744140625, -1.077667236328125, -1.0398406982421875, -1.00201416015625, -0.9641876220703125, -0.926361083984375, -0.8885345458984375, -0.8507080078125, -0.8128814697265625, -0.775054931640625, -0.7372283935546875, -0.69940185546875, -0.6615753173828125, -0.623748779296875, -0.5859222412109375, -0.548095703125, -0.5102691650390625, -0.472442626953125, -0.4346160888671875, -0.39678955078125, -0.3589630126953125, -0.321136474609375, -0.2833099365234375, -0.2454833984375, -0.2076568603515625, -0.169830322265625, -0.1320037841796875, -0.09417724609375, -0.0563507080078125, -0.018524169921875, 0.0193023681640625, 0.05712890625, 0.0949554443359375, 0.132781982421875, 0.1706085205078125, 0.20843505859375, 0.2462615966796875, 0.284088134765625, 0.3219146728515625, 0.3597412109375, 0.3975677490234375, 0.435394287109375, 0.4732208251953125, 0.51104736328125, 0.5488739013671875, 0.586700439453125, 0.6245269775390625, 0.662353515625, 0.7001800537109375, 0.738006591796875, 0.7758331298828125, 0.81365966796875, 0.8514862060546875, 0.889312744140625, 0.9271392822265625, 0.9649658203125, 1.0027923583984375, 1.040618896484375, 1.0784454345703125, 1.11627197265625, 1.1540985107421875, 1.191925048828125, 1.2297515869140625, 1.267578125]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 7.0, 6.0, 5.0, 14.0, 13.0, 25.0, 29.0, 51.0, 75.0, 92.0, 174.0, 198.0, 275.0, 418.0, 625.0, 872.0, 1259.0, 2111.0, 3428.0, 5686.0, 9899.0, 19826.0, 45426.0, 140967.0, 652653.0, 2137175.0, 885417.0, 181980.0, 55544.0, 22593.0, 11381.0, 6131.0, 3574.0, 2156.0, 1356.0, 866.0, 595.0, 427.0, 292.0, 182.0, 133.0, 100.0, 76.0, 52.0, 34.0, 31.0, 21.0, 13.0, 6.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0], "bins": [-2.1171875, -2.0501708984375, -1.983154296875, -1.9161376953125, -1.84912109375, -1.7821044921875, -1.715087890625, -1.6480712890625, -1.5810546875, -1.5140380859375, -1.447021484375, -1.3800048828125, -1.31298828125, -1.2459716796875, -1.178955078125, -1.1119384765625, -1.044921875, -0.9779052734375, -0.910888671875, -0.8438720703125, -0.77685546875, -0.7098388671875, -0.642822265625, -0.5758056640625, -0.5087890625, -0.4417724609375, -0.374755859375, -0.3077392578125, -0.24072265625, -0.1737060546875, -0.106689453125, -0.0396728515625, 0.02734375, 0.0943603515625, 0.161376953125, 0.2283935546875, 0.29541015625, 0.3624267578125, 0.429443359375, 0.4964599609375, 0.5634765625, 0.6304931640625, 0.697509765625, 0.7645263671875, 0.83154296875, 0.8985595703125, 0.965576171875, 1.0325927734375, 1.099609375, 1.1666259765625, 1.233642578125, 1.3006591796875, 1.36767578125, 1.4346923828125, 1.501708984375, 1.5687255859375, 1.6357421875, 1.7027587890625, 1.769775390625, 1.8367919921875, 1.90380859375, 1.9708251953125, 2.037841796875, 2.1048583984375, 2.171875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 4.0, 2.0, 8.0, 8.0, 14.0, 11.0, 18.0, 28.0, 20.0, 34.0, 54.0, 45.0, 79.0, 111.0, 144.0, 236.0, 321.0, 434.0, 510.0, 555.0, 379.0, 256.0, 239.0, 154.0, 97.0, 92.0, 46.0, 47.0, 31.0, 23.0, 26.0, 15.0, 6.0, 9.0, 7.0, 2.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.40625, -2.337432861328125, -2.26861572265625, -2.199798583984375, -2.1309814453125, -2.062164306640625, -1.99334716796875, -1.924530029296875, -1.855712890625, -1.786895751953125, -1.71807861328125, -1.649261474609375, -1.5804443359375, -1.511627197265625, -1.44281005859375, -1.373992919921875, -1.30517578125, -1.236358642578125, -1.16754150390625, -1.098724365234375, -1.0299072265625, -0.961090087890625, -0.89227294921875, -0.823455810546875, -0.754638671875, -0.685821533203125, -0.61700439453125, -0.548187255859375, -0.4793701171875, -0.410552978515625, -0.34173583984375, -0.272918701171875, -0.2041015625, -0.135284423828125, -0.06646728515625, 0.002349853515625, 0.0711669921875, 0.139984130859375, 0.20880126953125, 0.277618408203125, 0.346435546875, 0.415252685546875, 0.48406982421875, 0.552886962890625, 0.6217041015625, 0.690521240234375, 0.75933837890625, 0.828155517578125, 0.89697265625, 0.965789794921875, 1.03460693359375, 1.103424072265625, 1.1722412109375, 1.241058349609375, 1.30987548828125, 1.378692626953125, 1.447509765625, 1.516326904296875, 1.58514404296875, 1.653961181640625, 1.7227783203125, 1.791595458984375, 1.86041259765625, 1.929229736328125, 1.998046875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 8.0, 13.0, 7.0, 9.0, 17.0, 34.0, 39.0, 53.0, 100.0, 117.0, 235.0, 460.0, 1283.0, 3878.0, 15642.0, 95362.0, 1973545.0, 1985275.0, 96520.0, 15449.0, 3842.0, 1227.0, 506.0, 269.0, 128.0, 105.0, 43.0, 29.0, 23.0, 18.0, 12.0, 10.0, 7.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.62890625, -6.43951416015625, -6.2501220703125, -6.06072998046875, -5.871337890625, -5.68194580078125, -5.4925537109375, -5.30316162109375, -5.11376953125, -4.92437744140625, -4.7349853515625, -4.54559326171875, -4.356201171875, -4.16680908203125, -3.9774169921875, -3.78802490234375, -3.5986328125, -3.40924072265625, -3.2198486328125, -3.03045654296875, -2.841064453125, -2.65167236328125, -2.4622802734375, -2.27288818359375, -2.08349609375, -1.89410400390625, -1.7047119140625, -1.51531982421875, -1.325927734375, -1.13653564453125, -0.9471435546875, -0.75775146484375, -0.568359375, -0.37896728515625, -0.1895751953125, -0.00018310546875, 0.189208984375, 0.37860107421875, 0.5679931640625, 0.75738525390625, 0.94677734375, 1.13616943359375, 1.3255615234375, 1.51495361328125, 1.704345703125, 1.89373779296875, 2.0831298828125, 2.27252197265625, 2.4619140625, 2.65130615234375, 2.8406982421875, 3.03009033203125, 3.219482421875, 3.40887451171875, 3.5982666015625, 3.78765869140625, 3.97705078125, 4.16644287109375, 4.3558349609375, 4.54522705078125, 4.734619140625, 4.92401123046875, 5.1134033203125, 5.30279541015625, 5.4921875]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 32.0, 296.0, 567.0, 111.0, 10.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.48743438720703, -62.606571197509766, -60.725711822509766, -58.8448486328125, -56.9639892578125, -55.083126068115234, -53.20226287841797, -51.32140350341797, -49.44054412841797, -47.5596809387207, -45.6788215637207, -43.79795837402344, -41.91709899902344, -40.03623580932617, -38.155372619628906, -36.274513244628906, -34.39365005493164, -32.512786865234375, -30.631927490234375, -28.75106430053711, -26.87020492553711, -24.989341735839844, -23.10848045349121, -21.227619171142578, -19.346757888793945, -17.465896606445312, -15.58503532409668, -13.70417308807373, -11.823311805725098, -9.942450523376465, -8.061588287353516, -6.180727005004883, -4.29986572265625, -2.419004201889038, -0.5381426811218262, 1.3427190780639648, 3.2235803604125977, 5.1044416427612305, 6.98530387878418, 8.866165161132812, 10.747026443481445, 12.627887725830078, 14.508749008178711, 16.389610290527344, 18.27047348022461, 20.15133285522461, 22.032196044921875, 23.913057327270508, 25.79391860961914, 27.674779891967773, 29.555641174316406, 31.436504364013672, 33.31736373901367, 35.19822692871094, 37.07908630371094, 38.9599494934082, 40.84081268310547, 42.721675872802734, 44.602535247802734, 46.4833984375, 48.3642578125, 50.245121002197266, 52.12598419189453, 54.00684356689453, 55.88770294189453]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 1.0, 6.0, 9.0, 13.0, 6.0, 12.0, 10.0, 20.0, 16.0, 17.0, 18.0, 30.0, 33.0, 25.0, 27.0, 35.0, 35.0, 37.0, 44.0, 31.0, 36.0, 29.0, 40.0, 49.0, 25.0, 36.0, 42.0, 34.0, 32.0, 24.0, 16.0, 28.0, 30.0, 19.0, 27.0, 17.0, 23.0, 14.0, 13.0, 9.0, 11.0, 5.0, 6.0, 10.0, 0.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.118191719055176, -5.902606964111328, -5.6870222091674805, -5.471437454223633, -5.255852699279785, -5.0402679443359375, -4.824683666229248, -4.6090989112854, -4.393514156341553, -4.177929401397705, -3.9623446464538574, -3.746760129928589, -3.531175374984741, -3.3155906200408936, -3.100006103515625, -2.8844213485717773, -2.6688365936279297, -2.453251838684082, -2.2376670837402344, -2.022082567214966, -1.8064978122711182, -1.5909130573272705, -1.3753284215927124, -1.1597437858581543, -0.9441590309143066, -0.7285743355751038, -0.5129896402359009, -0.297404944896698, -0.08182024955749512, 0.13376450538635254, 0.34934914112091064, 0.5649337768554688, 0.7805180549621582, 0.9961027503013611, 1.211687445640564, 1.427272081375122, 1.6428568363189697, 1.8584415912628174, 2.074026107788086, 2.2896108627319336, 2.5051956176757812, 2.720780372619629, 2.9363651275634766, 3.151949644088745, 3.3675343990325928, 3.5831191539764404, 3.798703670501709, 4.014288425445557, 4.229873180389404, 4.445457935333252, 4.6610426902771, 4.876627445220947, 5.092211723327637, 5.307796478271484, 5.523381233215332, 5.73896598815918, 5.954550743103027, 6.170135498046875, 6.385720252990723, 6.60130500793457, 6.816889762878418, 7.032474517822266, 7.248058795928955, 7.463643550872803, 7.67922830581665]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 6.0, 5.0, 5.0, 6.0, 8.0, 11.0, 11.0, 13.0, 16.0, 17.0, 23.0, 26.0, 19.0, 29.0, 25.0, 44.0, 38.0, 36.0, 33.0, 45.0, 40.0, 52.0, 38.0, 43.0, 37.0, 38.0, 29.0, 35.0, 26.0, 32.0, 31.0, 26.0, 21.0, 24.0, 21.0, 18.0, 8.0, 12.0, 16.0, 14.0, 9.0, 7.0, 4.0, 2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1484375, -1.1114349365234375, -1.074432373046875, -1.0374298095703125, -1.00042724609375, -0.9634246826171875, -0.926422119140625, -0.8894195556640625, -0.8524169921875, -0.8154144287109375, -0.778411865234375, -0.7414093017578125, -0.70440673828125, -0.6674041748046875, -0.630401611328125, -0.5933990478515625, -0.556396484375, -0.5193939208984375, -0.482391357421875, -0.4453887939453125, -0.40838623046875, -0.3713836669921875, -0.334381103515625, -0.2973785400390625, -0.2603759765625, -0.2233734130859375, -0.186370849609375, -0.1493682861328125, -0.11236572265625, -0.0753631591796875, -0.038360595703125, -0.0013580322265625, 0.03564453125, 0.0726470947265625, 0.109649658203125, 0.1466522216796875, 0.18365478515625, 0.2206573486328125, 0.257659912109375, 0.2946624755859375, 0.3316650390625, 0.3686676025390625, 0.405670166015625, 0.4426727294921875, 0.47967529296875, 0.5166778564453125, 0.553680419921875, 0.5906829833984375, 0.627685546875, 0.6646881103515625, 0.701690673828125, 0.7386932373046875, 0.77569580078125, 0.8126983642578125, 0.849700927734375, 0.8867034912109375, 0.9237060546875, 0.9607086181640625, 0.997711181640625, 1.0347137451171875, 1.07171630859375, 1.1087188720703125, 1.145721435546875, 1.1827239990234375, 1.2197265625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 8.0, 7.0, 10.0, 26.0, 29.0, 57.0, 98.0, 153.0, 301.0, 502.0, 865.0, 1458.0, 2668.0, 4758.0, 9056.0, 17624.0, 34891.0, 71525.0, 145884.0, 255951.0, 241609.0, 131279.0, 64323.0, 31340.0, 15701.0, 8220.0, 4408.0, 2484.0, 1401.0, 805.0, 465.0, 264.0, 165.0, 108.0, 51.0, 36.0, 12.0, 11.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1724853515625, -0.1679372787475586, -0.1633892059326172, -0.15884113311767578, -0.15429306030273438, -0.14974498748779297, -0.14519691467285156, -0.14064884185791016, -0.13610076904296875, -0.13155269622802734, -0.12700462341308594, -0.12245655059814453, -0.11790847778320312, -0.11336040496826172, -0.10881233215332031, -0.1042642593383789, -0.0997161865234375, -0.0951681137084961, -0.09062004089355469, -0.08607196807861328, -0.08152389526367188, -0.07697582244873047, -0.07242774963378906, -0.06787967681884766, -0.06333160400390625, -0.058783531188964844, -0.05423545837402344, -0.04968738555908203, -0.045139312744140625, -0.04059123992919922, -0.03604316711425781, -0.031495094299316406, -0.026947021484375, -0.022398948669433594, -0.017850875854492188, -0.013302803039550781, -0.008754730224609375, -0.004206657409667969, 0.0003414154052734375, 0.004889488220214844, 0.00943756103515625, 0.013985633850097656, 0.018533706665039062, 0.02308177947998047, 0.027629852294921875, 0.03217792510986328, 0.03672599792480469, 0.041274070739746094, 0.0458221435546875, 0.050370216369628906, 0.05491828918457031, 0.05946636199951172, 0.06401443481445312, 0.06856250762939453, 0.07311058044433594, 0.07765865325927734, 0.08220672607421875, 0.08675479888916016, 0.09130287170410156, 0.09585094451904297, 0.10039901733398438, 0.10494709014892578, 0.10949516296386719, 0.1140432357788086, 0.11859130859375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 7.0, 4.0, 11.0, 6.0, 15.0, 11.0, 14.0, 25.0, 20.0, 28.0, 27.0, 32.0, 34.0, 43.0, 52.0, 35.0, 42.0, 43.0, 1068.0, 49.0, 49.0, 47.0, 42.0, 34.0, 41.0, 37.0, 26.0, 23.0, 28.0, 16.0, 25.0, 14.0, 14.0, 11.0, 10.0, 6.0, 6.0, 6.0, 5.0, 5.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77880859375, -0.7507095336914062, -0.7226104736328125, -0.6945114135742188, -0.666412353515625, -0.6383132934570312, -0.6102142333984375, -0.5821151733398438, -0.55401611328125, -0.5259170532226562, -0.4978179931640625, -0.46971893310546875, -0.441619873046875, -0.41352081298828125, -0.3854217529296875, -0.35732269287109375, -0.3292236328125, -0.30112457275390625, -0.2730255126953125, -0.24492645263671875, -0.216827392578125, -0.18872833251953125, -0.1606292724609375, -0.13253021240234375, -0.10443115234375, -0.07633209228515625, -0.0482330322265625, -0.02013397216796875, 0.007965087890625, 0.03606414794921875, 0.0641632080078125, 0.09226226806640625, 0.120361328125, 0.14846038818359375, 0.1765594482421875, 0.20465850830078125, 0.232757568359375, 0.26085662841796875, 0.2889556884765625, 0.31705474853515625, 0.34515380859375, 0.37325286865234375, 0.4013519287109375, 0.42945098876953125, 0.457550048828125, 0.48564910888671875, 0.5137481689453125, 0.5418472290039062, 0.5699462890625, 0.5980453491210938, 0.6261444091796875, 0.6542434692382812, 0.682342529296875, 0.7104415893554688, 0.7385406494140625, 0.7666397094726562, 0.79473876953125, 0.8228378295898438, 0.8509368896484375, 0.8790359497070312, 0.907135009765625, 0.9352340698242188, 0.9633331298828125, 0.9914321899414062, 1.01953125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 5.0, 9.0, 11.0, 23.0, 34.0, 42.0, 80.0, 121.0, 168.0, 269.0, 410.0, 692.0, 1123.0, 1823.0, 2939.0, 4894.0, 8518.0, 15201.0, 27609.0, 52831.0, 104704.0, 237645.0, 1214864.0, 214115.0, 97943.0, 50111.0, 26001.0, 14416.0, 8370.0, 4849.0, 2786.0, 1697.0, 1053.0, 666.0, 412.0, 241.0, 157.0, 116.0, 60.0, 41.0, 24.0, 19.0, 15.0, 13.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.087890625, -0.08500480651855469, -0.08211898803710938, -0.07923316955566406, -0.07634735107421875, -0.07346153259277344, -0.07057571411132812, -0.06768989562988281, -0.0648040771484375, -0.06191825866699219, -0.059032440185546875, -0.05614662170410156, -0.05326080322265625, -0.05037498474121094, -0.047489166259765625, -0.04460334777832031, -0.041717529296875, -0.03883171081542969, -0.035945892333984375, -0.03306007385253906, -0.03017425537109375, -0.027288436889648438, -0.024402618408203125, -0.021516799926757812, -0.0186309814453125, -0.015745162963867188, -0.012859344482421875, -0.009973526000976562, -0.00708770751953125, -0.0042018890380859375, -0.001316070556640625, 0.0015697479248046875, 0.00445556640625, 0.0073413848876953125, 0.010227203369140625, 0.013113021850585938, 0.01599884033203125, 0.018884658813476562, 0.021770477294921875, 0.024656295776367188, 0.0275421142578125, 0.030427932739257812, 0.033313751220703125, 0.03619956970214844, 0.03908538818359375, 0.04197120666503906, 0.044857025146484375, 0.04774284362792969, 0.050628662109375, 0.05351448059082031, 0.056400299072265625, 0.05928611755371094, 0.06217193603515625, 0.06505775451660156, 0.06794357299804688, 0.07082939147949219, 0.0737152099609375, 0.07660102844238281, 0.07948684692382812, 0.08237266540527344, 0.08525848388671875, 0.08814430236816406, 0.09103012084960938, 0.09391593933105469, 0.0968017578125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 5.0, 0.0, 5.0, 6.0, 1.0, 3.0, 11.0, 8.0, 9.0, 14.0, 13.0, 17.0, 13.0, 22.0, 24.0, 19.0, 23.0, 48.0, 49.0, 56.0, 46.0, 61.0, 78.0, 64.0, 59.0, 57.0, 52.0, 38.0, 32.0, 25.0, 25.0, 21.0, 18.0, 11.0, 13.0, 16.0, 11.0, 2.0, 7.0, 8.0, 8.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00656890869140625, -0.006353020668029785, -0.00613713264465332, -0.0059212446212768555, -0.005705356597900391, -0.005489468574523926, -0.005273580551147461, -0.005057692527770996, -0.004841804504394531, -0.004625916481018066, -0.0044100284576416016, -0.004194140434265137, -0.003978252410888672, -0.003762364387512207, -0.003546476364135742, -0.0033305883407592773, -0.0031147003173828125, -0.0028988122940063477, -0.002682924270629883, -0.002467036247253418, -0.002251148223876953, -0.0020352602005004883, -0.0018193721771240234, -0.0016034841537475586, -0.0013875961303710938, -0.001171708106994629, -0.0009558200836181641, -0.0007399320602416992, -0.0005240440368652344, -0.00030815601348876953, -9.226799011230469e-05, 0.00012362003326416016, 0.000339508056640625, 0.0005553960800170898, 0.0007712841033935547, 0.0009871721267700195, 0.0012030601501464844, 0.0014189481735229492, 0.001634836196899414, 0.001850724220275879, 0.0020666122436523438, 0.0022825002670288086, 0.0024983882904052734, 0.0027142763137817383, 0.002930164337158203, 0.003146052360534668, 0.003361940383911133, 0.0035778284072875977, 0.0037937164306640625, 0.004009604454040527, 0.004225492477416992, 0.004441380500793457, 0.004657268524169922, 0.004873156547546387, 0.0050890445709228516, 0.005304932594299316, 0.005520820617675781, 0.005736708641052246, 0.005952596664428711, 0.006168484687805176, 0.006384372711181641, 0.0066002607345581055, 0.00681614875793457, 0.007032036781311035, 0.0072479248046875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 9.0, 7.0, 8.0, 7.0, 10.0, 17.0, 17.0, 22.0, 28.0, 45.0, 73.0, 110.0, 163.0, 285.0, 690.0, 23232.0, 1018942.0, 3676.0, 487.0, 232.0, 166.0, 91.0, 54.0, 36.0, 25.0, 19.0, 18.0, 18.0, 12.0, 8.0, 10.0, 6.0, 7.0, 2.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.181884765625, -0.17643165588378906, -0.17097854614257812, -0.1655254364013672, -0.16007232666015625, -0.1546192169189453, -0.14916610717773438, -0.14371299743652344, -0.1382598876953125, -0.13280677795410156, -0.12735366821289062, -0.12190055847167969, -0.11644744873046875, -0.11099433898925781, -0.10554122924804688, -0.10008811950683594, -0.094635009765625, -0.08918190002441406, -0.08372879028320312, -0.07827568054199219, -0.07282257080078125, -0.06736946105957031, -0.061916351318359375, -0.05646324157714844, -0.0510101318359375, -0.04555702209472656, -0.040103912353515625, -0.03465080261230469, -0.02919769287109375, -0.023744583129882812, -0.018291473388671875, -0.012838363647460938, -0.00738525390625, -0.0019321441650390625, 0.003520965576171875, 0.008974075317382812, 0.01442718505859375, 0.019880294799804688, 0.025333404541015625, 0.030786514282226562, 0.0362396240234375, 0.04169273376464844, 0.047145843505859375, 0.05259895324707031, 0.05805206298828125, 0.06350517272949219, 0.06895828247070312, 0.07441139221191406, 0.079864501953125, 0.08531761169433594, 0.09077072143554688, 0.09622383117675781, 0.10167694091796875, 0.10713005065917969, 0.11258316040039062, 0.11803627014160156, 0.1234893798828125, 0.12894248962402344, 0.13439559936523438, 0.1398487091064453, 0.14530181884765625, 0.1507549285888672, 0.15620803833007812, 0.16166114807128906, 0.1671142578125]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 19.0, 66.0, 310.0, 431.0, 122.0, 47.0, 13.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0063706873916089535, -0.004826504737138748, -0.003282322082668543, -0.0017381394281983376, -0.00019395677372813225, 0.001350225880742073, 0.0028944085352122784, 0.004438590724021196, 0.005982773844152689, 0.007526956498622894, 0.009071139618754387, 0.010615321807563305, 0.012159503996372223, 0.013703687116503716, 0.015247870236635208, 0.01679205149412155, 0.018336234614253044, 0.019880417734384537, 0.02142459899187088, 0.022968782112002373, 0.024512965232133865, 0.026057148352265358, 0.02760133147239685, 0.029145512729883194, 0.030689695850014687, 0.03223387897014618, 0.03377806022763252, 0.035322245210409164, 0.03686642646789551, 0.03841060772538185, 0.03995479270815849, 0.041498973965644836, 0.04304315894842148, 0.04458734020590782, 0.046131525188684464, 0.04767570644617081, 0.04921989142894745, 0.05076407268643379, 0.052308253943920135, 0.05385243892669678, 0.05539662018418312, 0.056940801441669464, 0.058484986424446106, 0.06002916768193245, 0.06157334893941879, 0.06311753392219543, 0.06466171890497208, 0.06620589643716812, 0.06775008141994476, 0.0692942664027214, 0.07083844393491745, 0.07238262891769409, 0.07392681390047073, 0.07547099143266678, 0.07701517641544342, 0.07855936139822006, 0.0801035463809967, 0.08164773136377335, 0.08319190889596939, 0.08473609387874603, 0.08628027886152267, 0.08782445639371872, 0.08936864137649536, 0.090912826359272, 0.09245700389146805]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 4.0, 2.0, 4.0, 11.0, 7.0, 11.0, 13.0, 16.0, 10.0, 15.0, 21.0, 18.0, 23.0, 29.0, 24.0, 30.0, 27.0, 30.0, 34.0, 33.0, 38.0, 44.0, 39.0, 38.0, 38.0, 36.0, 47.0, 25.0, 29.0, 38.0, 38.0, 29.0, 31.0, 26.0, 13.0, 14.0, 15.0, 20.0, 16.0, 10.0, 13.0, 5.0, 10.0, 11.0, 6.0, 2.0, 5.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.006985187530517578, -0.006765741854906082, -0.006546296179294586, -0.00632685050368309, -0.006107404828071594, -0.005887959152460098, -0.005668513476848602, -0.005449067801237106, -0.00522962212562561, -0.005010176450014114, -0.004790730774402618, -0.0045712850987911224, -0.0043518394231796265, -0.0041323937475681305, -0.0039129480719566345, -0.0036935023963451385, -0.0034740567207336426, -0.0032546110451221466, -0.0030351653695106506, -0.0028157196938991547, -0.0025962740182876587, -0.0023768283426761627, -0.0021573826670646667, -0.0019379369914531708, -0.0017184913158416748, -0.0014990456402301788, -0.0012795999646186829, -0.0010601542890071869, -0.0008407086133956909, -0.000621262937784195, -0.000401817262172699, -0.000182371586561203, 3.707408905029297e-05, 0.00025651976466178894, 0.0004759654402732849, 0.0006954111158847809, 0.0009148567914962769, 0.0011343024671077728, 0.0013537481427192688, 0.0015731938183307648, 0.0017926394939422607, 0.0020120851695537567, 0.0022315308451652527, 0.0024509765207767487, 0.0026704221963882446, 0.0028898678719997406, 0.0031093135476112366, 0.0033287592232227325, 0.0035482048988342285, 0.0037676505744457245, 0.0039870962500572205, 0.004206541925668716, 0.004425987601280212, 0.004645433276891708, 0.004864878952503204, 0.0050843246281147, 0.005303770303726196, 0.005523215979337692, 0.005742661654949188, 0.005962107330560684, 0.00618155300617218, 0.006400998681783676, 0.006620444357395172, 0.006839890033006668, 0.007059335708618164]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 6.0, 5.0, 5.0, 6.0, 8.0, 11.0, 11.0, 14.0, 15.0, 16.0, 23.0, 27.0, 20.0, 28.0, 25.0, 43.0, 39.0, 36.0, 33.0, 46.0, 39.0, 52.0, 38.0, 44.0, 36.0, 38.0, 29.0, 35.0, 25.0, 33.0, 28.0, 29.0, 21.0, 24.0, 21.0, 18.0, 8.0, 12.0, 16.0, 13.0, 10.0, 7.0, 4.0, 2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1474609375, -1.1104888916015625, -1.073516845703125, -1.0365447998046875, -0.99957275390625, -0.9626007080078125, -0.925628662109375, -0.8886566162109375, -0.8516845703125, -0.8147125244140625, -0.777740478515625, -0.7407684326171875, -0.70379638671875, -0.6668243408203125, -0.629852294921875, -0.5928802490234375, -0.555908203125, -0.5189361572265625, -0.481964111328125, -0.4449920654296875, -0.40802001953125, -0.3710479736328125, -0.334075927734375, -0.2971038818359375, -0.2601318359375, -0.2231597900390625, -0.186187744140625, -0.1492156982421875, -0.11224365234375, -0.0752716064453125, -0.038299560546875, -0.0013275146484375, 0.03564453125, 0.0726165771484375, 0.109588623046875, 0.1465606689453125, 0.18353271484375, 0.2205047607421875, 0.257476806640625, 0.2944488525390625, 0.3314208984375, 0.3683929443359375, 0.405364990234375, 0.4423370361328125, 0.47930908203125, 0.5162811279296875, 0.553253173828125, 0.5902252197265625, 0.627197265625, 0.6641693115234375, 0.701141357421875, 0.7381134033203125, 0.77508544921875, 0.8120574951171875, 0.849029541015625, 0.8860015869140625, 0.9229736328125, 0.9599456787109375, 0.996917724609375, 1.0338897705078125, 1.07086181640625, 1.1078338623046875, 1.144805908203125, 1.1817779541015625, 1.21875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 8.0, 10.0, 15.0, 24.0, 29.0, 40.0, 66.0, 102.0, 141.0, 183.0, 281.0, 387.0, 629.0, 891.0, 1284.0, 1890.0, 2741.0, 4051.0, 6291.0, 10142.0, 16819.0, 28764.0, 50314.0, 92121.0, 170454.0, 251625.0, 179849.0, 97630.0, 53610.0, 29771.0, 17532.0, 10652.0, 6762.0, 4397.0, 2916.0, 1972.0, 1379.0, 837.0, 578.0, 409.0, 292.0, 202.0, 156.0, 96.0, 67.0, 42.0, 36.0, 21.0, 13.0, 17.0, 3.0, 9.0, 4.0, 1.0], "bins": [-1.4921875, -1.4502105712890625, -1.408233642578125, -1.3662567138671875, -1.32427978515625, -1.2823028564453125, -1.240325927734375, -1.1983489990234375, -1.1563720703125, -1.1143951416015625, -1.072418212890625, -1.0304412841796875, -0.98846435546875, -0.9464874267578125, -0.904510498046875, -0.8625335693359375, -0.820556640625, -0.7785797119140625, -0.736602783203125, -0.6946258544921875, -0.65264892578125, -0.6106719970703125, -0.568695068359375, -0.5267181396484375, -0.4847412109375, -0.4427642822265625, -0.400787353515625, -0.3588104248046875, -0.31683349609375, -0.2748565673828125, -0.232879638671875, -0.1909027099609375, -0.14892578125, -0.1069488525390625, -0.064971923828125, -0.0229949951171875, 0.01898193359375, 0.0609588623046875, 0.102935791015625, 0.1449127197265625, 0.1868896484375, 0.2288665771484375, 0.270843505859375, 0.3128204345703125, 0.35479736328125, 0.3967742919921875, 0.438751220703125, 0.4807281494140625, 0.522705078125, 0.5646820068359375, 0.606658935546875, 0.6486358642578125, 0.69061279296875, 0.7325897216796875, 0.774566650390625, 0.8165435791015625, 0.8585205078125, 0.9004974365234375, 0.942474365234375, 0.9844512939453125, 1.02642822265625, 1.0684051513671875, 1.110382080078125, 1.1523590087890625, 1.1943359375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 4.0, 10.0, 7.0, 10.0, 18.0, 13.0, 15.0, 16.0, 21.0, 26.0, 31.0, 27.0, 43.0, 38.0, 57.0, 50.0, 85.0, 124.0, 250.0, 1352.0, 226.0, 147.0, 91.0, 59.0, 53.0, 37.0, 29.0, 34.0, 27.0, 19.0, 16.0, 20.0, 16.0, 16.0, 8.0, 10.0, 11.0, 9.0, 9.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.33203125, -3.226318359375, -3.12060546875, -3.014892578125, -2.9091796875, -2.803466796875, -2.69775390625, -2.592041015625, -2.486328125, -2.380615234375, -2.27490234375, -2.169189453125, -2.0634765625, -1.957763671875, -1.85205078125, -1.746337890625, -1.640625, -1.534912109375, -1.42919921875, -1.323486328125, -1.2177734375, -1.112060546875, -1.00634765625, -0.900634765625, -0.794921875, -0.689208984375, -0.58349609375, -0.477783203125, -0.3720703125, -0.266357421875, -0.16064453125, -0.054931640625, 0.05078125, 0.156494140625, 0.26220703125, 0.367919921875, 0.4736328125, 0.579345703125, 0.68505859375, 0.790771484375, 0.896484375, 1.002197265625, 1.10791015625, 1.213623046875, 1.3193359375, 1.425048828125, 1.53076171875, 1.636474609375, 1.7421875, 1.847900390625, 1.95361328125, 2.059326171875, 2.1650390625, 2.270751953125, 2.37646484375, 2.482177734375, 2.587890625, 2.693603515625, 2.79931640625, 2.905029296875, 3.0107421875, 3.116455078125, 3.22216796875, 3.327880859375, 3.43359375]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 9.0, 7.0, 9.0, 13.0, 18.0, 25.0, 23.0, 25.0, 47.0, 54.0, 65.0, 121.0, 181.0, 301.0, 600.0, 1234.0, 2983.0, 8276.0, 25383.0, 112119.0, 1337428.0, 1495058.0, 120448.0, 26664.0, 8618.0, 3136.0, 1295.0, 582.0, 325.0, 195.0, 126.0, 92.0, 54.0, 48.0, 28.0, 26.0, 16.0, 16.0, 12.0, 9.0, 6.0, 6.0, 6.0, 5.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.7421875, -3.621551513671875, -3.50091552734375, -3.380279541015625, -3.2596435546875, -3.139007568359375, -3.01837158203125, -2.897735595703125, -2.777099609375, -2.656463623046875, -2.53582763671875, -2.415191650390625, -2.2945556640625, -2.173919677734375, -2.05328369140625, -1.932647705078125, -1.81201171875, -1.691375732421875, -1.57073974609375, -1.450103759765625, -1.3294677734375, -1.208831787109375, -1.08819580078125, -0.967559814453125, -0.846923828125, -0.726287841796875, -0.60565185546875, -0.485015869140625, -0.3643798828125, -0.243743896484375, -0.12310791015625, -0.002471923828125, 0.1181640625, 0.238800048828125, 0.35943603515625, 0.480072021484375, 0.6007080078125, 0.721343994140625, 0.84197998046875, 0.962615966796875, 1.083251953125, 1.203887939453125, 1.32452392578125, 1.445159912109375, 1.5657958984375, 1.686431884765625, 1.80706787109375, 1.927703857421875, 2.04833984375, 2.168975830078125, 2.28961181640625, 2.410247802734375, 2.5308837890625, 2.651519775390625, 2.77215576171875, 2.892791748046875, 3.013427734375, 3.134063720703125, 3.25469970703125, 3.375335693359375, 3.4959716796875, 3.616607666015625, 3.73724365234375, 3.857879638671875, 3.978515625]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 36.0, 190.0, 453.0, 274.0, 55.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.474459648132324, -12.481573104858398, -11.488686561584473, -10.495800018310547, -9.502912521362305, -8.510026931762695, -7.517139434814453, -6.524252891540527, -5.531366348266602, -4.538479804992676, -3.545593023300171, -2.552706241607666, -1.5598196983337402, -0.5669331550598145, 0.42595386505126953, 1.4188404083251953, 2.411726951599121, 3.404613494873047, 4.397500038146973, 5.390387058258057, 6.383273601531982, 7.376160144805908, 8.369047164916992, 9.361933708190918, 10.354820251464844, 11.34770679473877, 12.340593338012695, 13.333480834960938, 14.326366424560547, 15.319253921508789, 16.31214141845703, 17.30502700805664, 18.29791259765625, 19.290800094604492, 20.2836856842041, 21.276573181152344, 22.269458770751953, 23.262346267700195, 24.255233764648438, 25.248119354248047, 26.241004943847656, 27.2338924407959, 28.226778030395508, 29.21966552734375, 30.21255111694336, 31.2054386138916, 32.198326110839844, 33.19121170043945, 34.18409729003906, 35.17698287963867, 36.16987228393555, 37.162757873535156, 38.155643463134766, 39.148529052734375, 40.14141845703125, 41.13430404663086, 42.127193450927734, 43.120079040527344, 44.11296844482422, 45.10585403442383, 46.09873962402344, 47.09162521362305, 48.08451461791992, 49.07740020751953, 50.07028579711914]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 7.0, 7.0, 11.0, 13.0, 24.0, 15.0, 12.0, 22.0, 30.0, 14.0, 29.0, 33.0, 40.0, 48.0, 43.0, 47.0, 46.0, 45.0, 47.0, 57.0, 56.0, 41.0, 42.0, 42.0, 36.0, 28.0, 30.0, 29.0, 24.0, 18.0, 19.0, 10.0, 14.0, 13.0, 3.0, 4.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.521005630493164, -10.230130195617676, -9.939253807067871, -9.648378372192383, -9.357501983642578, -9.06662654876709, -8.775750160217285, -8.484874725341797, -8.193998336791992, -7.903122425079346, -7.612246513366699, -7.321370601654053, -7.030494689941406, -6.73961877822876, -6.448742866516113, -6.157867431640625, -5.8669915199279785, -5.576115608215332, -5.2852396965026855, -4.994363784790039, -4.703487873077393, -4.412611961364746, -4.121736526489258, -3.8308603763580322, -3.5399844646453857, -3.2491085529327393, -2.9582326412200928, -2.6673569679260254, -2.376481056213379, -2.0856051445007324, -1.794729232788086, -1.5038533210754395, -1.212977409362793, -0.9221014976501465, -0.6312256455421448, -0.34034979343414307, -0.04947388172149658, 0.2414020299911499, 0.5322778224945068, 0.8231537342071533, 1.1140296459197998, 1.4049055576324463, 1.6957814693450928, 1.9866572618484497, 2.2775330543518066, 2.568408966064453, 2.8592848777770996, 3.150160789489746, 3.4410367012023926, 3.731912612915039, 4.0227885246276855, 4.313664436340332, 4.6045403480529785, 4.895416259765625, 5.186291694641113, 5.477168083190918, 5.768043518066406, 6.058919429779053, 6.349795341491699, 6.640671253204346, 6.931547164916992, 7.222423076629639, 7.513298988342285, 7.804174423217773, 8.095050811767578]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 3.0, 3.0, 10.0, 2.0, 3.0, 8.0, 9.0, 13.0, 17.0, 13.0, 15.0, 12.0, 21.0, 29.0, 28.0, 25.0, 31.0, 37.0, 29.0, 31.0, 35.0, 33.0, 41.0, 49.0, 42.0, 32.0, 36.0, 39.0, 38.0, 35.0, 34.0, 21.0, 22.0, 17.0, 23.0, 25.0, 26.0, 19.0, 13.0, 19.0, 9.0, 9.0, 13.0, 5.0, 7.0, 4.0, 10.0, 8.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0849609375, -1.0500946044921875, -1.015228271484375, -0.9803619384765625, -0.94549560546875, -0.9106292724609375, -0.875762939453125, -0.8408966064453125, -0.8060302734375, -0.7711639404296875, -0.736297607421875, -0.7014312744140625, -0.66656494140625, -0.6316986083984375, -0.596832275390625, -0.5619659423828125, -0.527099609375, -0.4922332763671875, -0.457366943359375, -0.4225006103515625, -0.38763427734375, -0.3527679443359375, -0.317901611328125, -0.2830352783203125, -0.2481689453125, -0.2133026123046875, -0.178436279296875, -0.1435699462890625, -0.10870361328125, -0.0738372802734375, -0.038970947265625, -0.0041046142578125, 0.03076171875, 0.0656280517578125, 0.100494384765625, 0.1353607177734375, 0.17022705078125, 0.2050933837890625, 0.239959716796875, 0.2748260498046875, 0.3096923828125, 0.3445587158203125, 0.379425048828125, 0.4142913818359375, 0.44915771484375, 0.4840240478515625, 0.518890380859375, 0.5537567138671875, 0.588623046875, 0.6234893798828125, 0.658355712890625, 0.6932220458984375, 0.72808837890625, 0.7629547119140625, 0.797821044921875, 0.8326873779296875, 0.8675537109375, 0.9024200439453125, 0.937286376953125, 0.9721527099609375, 1.00701904296875, 1.0418853759765625, 1.076751708984375, 1.1116180419921875, 1.146484375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 9.0, 8.0, 18.0, 36.0, 57.0, 74.0, 88.0, 161.0, 204.0, 283.0, 427.0, 561.0, 812.0, 1197.0, 1738.0, 2542.0, 4288.0, 7032.0, 12629.0, 25268.0, 60187.0, 189629.0, 796525.0, 2002511.0, 783359.0, 187763.0, 60343.0, 25249.0, 12379.0, 6940.0, 4091.0, 2547.0, 1686.0, 1120.0, 744.0, 542.0, 373.0, 256.0, 189.0, 132.0, 101.0, 67.0, 50.0, 21.0, 20.0, 12.0, 8.0, 1.0, 8.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8193359375, -1.759674072265625, -1.70001220703125, -1.640350341796875, -1.5806884765625, -1.521026611328125, -1.46136474609375, -1.401702880859375, -1.342041015625, -1.282379150390625, -1.22271728515625, -1.163055419921875, -1.1033935546875, -1.043731689453125, -0.98406982421875, -0.924407958984375, -0.86474609375, -0.805084228515625, -0.74542236328125, -0.685760498046875, -0.6260986328125, -0.566436767578125, -0.50677490234375, -0.447113037109375, -0.387451171875, -0.327789306640625, -0.26812744140625, -0.208465576171875, -0.1488037109375, -0.089141845703125, -0.02947998046875, 0.030181884765625, 0.08984375, 0.149505615234375, 0.20916748046875, 0.268829345703125, 0.3284912109375, 0.388153076171875, 0.44781494140625, 0.507476806640625, 0.567138671875, 0.626800537109375, 0.68646240234375, 0.746124267578125, 0.8057861328125, 0.865447998046875, 0.92510986328125, 0.984771728515625, 1.04443359375, 1.104095458984375, 1.16375732421875, 1.223419189453125, 1.2830810546875, 1.342742919921875, 1.40240478515625, 1.462066650390625, 1.521728515625, 1.581390380859375, 1.64105224609375, 1.700714111328125, 1.7603759765625, 1.820037841796875, 1.87969970703125, 1.939361572265625, 1.9990234375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 5.0, 1.0, 5.0, 10.0, 3.0, 15.0, 9.0, 12.0, 17.0, 17.0, 22.0, 38.0, 34.0, 63.0, 71.0, 87.0, 128.0, 196.0, 199.0, 299.0, 425.0, 459.0, 472.0, 374.0, 290.0, 198.0, 137.0, 106.0, 88.0, 53.0, 50.0, 42.0, 26.0, 17.0, 17.0, 19.0, 15.0, 5.0, 8.0, 10.0, 6.0, 6.0, 8.0, 3.0, 5.0, 3.0, 5.0, 0.0, 2.0, 1.0], "bins": [-1.943359375, -1.889190673828125, -1.83502197265625, -1.780853271484375, -1.7266845703125, -1.672515869140625, -1.61834716796875, -1.564178466796875, -1.510009765625, -1.455841064453125, -1.40167236328125, -1.347503662109375, -1.2933349609375, -1.239166259765625, -1.18499755859375, -1.130828857421875, -1.07666015625, -1.022491455078125, -0.96832275390625, -0.914154052734375, -0.8599853515625, -0.805816650390625, -0.75164794921875, -0.697479248046875, -0.643310546875, -0.589141845703125, -0.53497314453125, -0.480804443359375, -0.4266357421875, -0.372467041015625, -0.31829833984375, -0.264129638671875, -0.2099609375, -0.155792236328125, -0.10162353515625, -0.047454833984375, 0.0067138671875, 0.060882568359375, 0.11505126953125, 0.169219970703125, 0.223388671875, 0.277557373046875, 0.33172607421875, 0.385894775390625, 0.4400634765625, 0.494232177734375, 0.54840087890625, 0.602569580078125, 0.65673828125, 0.710906982421875, 0.76507568359375, 0.819244384765625, 0.8734130859375, 0.927581787109375, 0.98175048828125, 1.035919189453125, 1.090087890625, 1.144256591796875, 1.19842529296875, 1.252593994140625, 1.3067626953125, 1.360931396484375, 1.41510009765625, 1.469268798828125, 1.5234375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 1.0, 2.0, 0.0, 5.0, 3.0, 3.0, 5.0, 12.0, 13.0, 24.0, 28.0, 42.0, 56.0, 96.0, 171.0, 291.0, 483.0, 975.0, 1934.0, 4268.0, 10461.0, 29304.0, 102755.0, 589215.0, 2759122.0, 550922.0, 97740.0, 28236.0, 9994.0, 4136.0, 1831.0, 925.0, 467.0, 285.0, 169.0, 115.0, 61.0, 44.0, 15.0, 11.0, 14.0, 11.0, 9.0, 5.0, 9.0, 4.0, 5.0, 4.0, 4.0, 6.0, 2.0, 1.0], "bins": [-3.869140625, -3.763092041015625, -3.65704345703125, -3.550994873046875, -3.4449462890625, -3.338897705078125, -3.23284912109375, -3.126800537109375, -3.020751953125, -2.914703369140625, -2.80865478515625, -2.702606201171875, -2.5965576171875, -2.490509033203125, -2.38446044921875, -2.278411865234375, -2.17236328125, -2.066314697265625, -1.96026611328125, -1.854217529296875, -1.7481689453125, -1.642120361328125, -1.53607177734375, -1.430023193359375, -1.323974609375, -1.217926025390625, -1.11187744140625, -1.005828857421875, -0.8997802734375, -0.793731689453125, -0.68768310546875, -0.581634521484375, -0.4755859375, -0.369537353515625, -0.26348876953125, -0.157440185546875, -0.0513916015625, 0.054656982421875, 0.16070556640625, 0.266754150390625, 0.372802734375, 0.478851318359375, 0.58489990234375, 0.690948486328125, 0.7969970703125, 0.903045654296875, 1.00909423828125, 1.115142822265625, 1.22119140625, 1.327239990234375, 1.43328857421875, 1.539337158203125, 1.6453857421875, 1.751434326171875, 1.85748291015625, 1.963531494140625, 2.069580078125, 2.175628662109375, 2.28167724609375, 2.387725830078125, 2.4937744140625, 2.599822998046875, 2.70587158203125, 2.811920166015625, 2.91796875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 8.0, 27.0, 66.0, 139.0, 178.0, 240.0, 168.0, 106.0, 51.0, 18.0, 11.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.947937488555908, -6.34044075012207, -5.732944011688232, -5.1254472732543945, -4.517951011657715, -3.910454034805298, -3.302957534790039, -2.695460796356201, -2.0879640579223633, -1.4804673194885254, -0.872970700263977, -0.2654740810394287, 0.3420226573944092, 0.9495193958282471, 1.5570158958435059, 2.1645126342773438, 2.7720093727111816, 3.3795061111450195, 3.9870028495788574, 4.594499588012695, 5.201995849609375, 5.809493064880371, 6.416989326477051, 7.024486064910889, 7.631982803344727, 8.239479064941406, 8.846976280212402, 9.454472541809082, 10.061969757080078, 10.669466018676758, 11.276962280273438, 11.884459495544434, 12.49195671081543, 13.09945297241211, 13.706950187683105, 14.314446449279785, 14.921943664550781, 15.529439926147461, 16.13693618774414, 16.744434356689453, 17.351930618286133, 17.959426879882812, 18.566923141479492, 19.174421310424805, 19.781917572021484, 20.389413833618164, 20.996910095214844, 21.604408264160156, 22.211902618408203, 22.819398880004883, 23.426895141601562, 24.034393310546875, 24.641889572143555, 25.249385833740234, 25.856882095336914, 26.464378356933594, 27.071876525878906, 27.679372787475586, 28.286869049072266, 28.894367218017578, 29.501863479614258, 30.109359741210938, 30.716856002807617, 31.324352264404297, 31.93185043334961]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 7.0, 4.0, 7.0, 9.0, 13.0, 14.0, 18.0, 15.0, 31.0, 29.0, 27.0, 28.0, 25.0, 48.0, 36.0, 42.0, 50.0, 38.0, 35.0, 37.0, 41.0, 45.0, 36.0, 38.0, 37.0, 32.0, 39.0, 43.0, 26.0, 27.0, 19.0, 20.0, 16.0, 12.0, 10.0, 13.0, 11.0, 5.0, 9.0, 2.0, 7.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.741573333740234, -6.520761013031006, -6.299948692321777, -6.079135894775391, -5.858323574066162, -5.637511253356934, -5.416698455810547, -5.195886135101318, -4.97507381439209, -4.754261493682861, -4.533449172973633, -4.312636375427246, -4.091824054718018, -3.871011734008789, -3.6501991748809814, -3.429386615753174, -3.2085742950439453, -2.987761974334717, -2.766949415206909, -2.5461368560791016, -2.325324535369873, -2.1045122146606445, -1.883699655532837, -1.6628872156143188, -1.4420747756958008, -1.2212623357772827, -1.0004498958587646, -0.7796374559402466, -0.5588250160217285, -0.33801257610321045, -0.11720013618469238, 0.10361230373382568, 0.32442522048950195, 0.54523766040802, 0.7660501003265381, 0.9868625402450562, 1.2076749801635742, 1.4284874200820923, 1.6492998600006104, 1.8701122999191284, 2.0909247398376465, 2.311737060546875, 2.5325496196746826, 2.7533621788024902, 2.9741744995117188, 3.1949868202209473, 3.415799379348755, 3.6366119384765625, 3.857424259185791, 4.0782365798950195, 4.299049377441406, 4.519861698150635, 4.740674018859863, 4.961486339569092, 5.18229866027832, 5.403111457824707, 5.6239237785339355, 5.844736099243164, 6.065548896789551, 6.286361217498779, 6.507173538208008, 6.727985858917236, 6.948798179626465, 7.169610977172852, 7.39042329788208]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 7.0, 2.0, 5.0, 7.0, 5.0, 11.0, 8.0, 6.0, 9.0, 11.0, 12.0, 23.0, 19.0, 20.0, 21.0, 21.0, 23.0, 22.0, 27.0, 26.0, 28.0, 30.0, 35.0, 34.0, 31.0, 29.0, 26.0, 40.0, 35.0, 42.0, 43.0, 26.0, 27.0, 31.0, 37.0, 24.0, 17.0, 22.0, 24.0, 21.0, 19.0, 20.0, 9.0, 15.0, 14.0, 10.0, 3.0, 5.0, 7.0, 8.0, 3.0, 3.0, 4.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.97119140625, -0.9383316040039062, -0.9054718017578125, -0.8726119995117188, -0.839752197265625, -0.8068923950195312, -0.7740325927734375, -0.7411727905273438, -0.70831298828125, -0.6754531860351562, -0.6425933837890625, -0.6097335815429688, -0.576873779296875, -0.5440139770507812, -0.5111541748046875, -0.47829437255859375, -0.4454345703125, -0.41257476806640625, -0.3797149658203125, -0.34685516357421875, -0.313995361328125, -0.28113555908203125, -0.2482757568359375, -0.21541595458984375, -0.18255615234375, -0.14969635009765625, -0.1168365478515625, -0.08397674560546875, -0.051116943359375, -0.01825714111328125, 0.0146026611328125, 0.04746246337890625, 0.080322265625, 0.11318206787109375, 0.1460418701171875, 0.17890167236328125, 0.211761474609375, 0.24462127685546875, 0.2774810791015625, 0.31034088134765625, 0.34320068359375, 0.37606048583984375, 0.4089202880859375, 0.44178009033203125, 0.474639892578125, 0.5074996948242188, 0.5403594970703125, 0.5732192993164062, 0.6060791015625, 0.6389389038085938, 0.6717987060546875, 0.7046585083007812, 0.737518310546875, 0.7703781127929688, 0.8032379150390625, 0.8360977172851562, 0.86895751953125, 0.9018173217773438, 0.9346771240234375, 0.9675369262695312, 1.000396728515625, 1.0332565307617188, 1.0661163330078125, 1.0989761352539062, 1.1318359375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 14.0, 19.0, 26.0, 36.0, 58.0, 69.0, 98.0, 172.0, 279.0, 481.0, 847.0, 1511.0, 2705.0, 5141.0, 9976.0, 19771.0, 41343.0, 90078.0, 191034.0, 292739.0, 205419.0, 97384.0, 44720.0, 21626.0, 10441.0, 5704.0, 2998.0, 1640.0, 830.0, 497.0, 326.0, 189.0, 137.0, 86.0, 44.0, 37.0, 22.0, 17.0, 8.0, 6.0, 4.0, 7.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1585693359375, -0.1533794403076172, -0.14818954467773438, -0.14299964904785156, -0.13780975341796875, -0.13261985778808594, -0.12742996215820312, -0.12224006652832031, -0.1170501708984375, -0.11186027526855469, -0.10667037963867188, -0.10148048400878906, -0.09629058837890625, -0.09110069274902344, -0.08591079711914062, -0.08072090148925781, -0.075531005859375, -0.07034111022949219, -0.06515121459960938, -0.05996131896972656, -0.05477142333984375, -0.04958152770996094, -0.044391632080078125, -0.03920173645019531, -0.0340118408203125, -0.028821945190429688, -0.023632049560546875, -0.018442153930664062, -0.01325225830078125, -0.008062362670898438, -0.002872467041015625, 0.0023174285888671875, 0.00750732421875, 0.012697219848632812, 0.017887115478515625, 0.023077011108398438, 0.02826690673828125, 0.03345680236816406, 0.038646697998046875, 0.04383659362792969, 0.0490264892578125, 0.05421638488769531, 0.059406280517578125, 0.06459617614746094, 0.06978607177734375, 0.07497596740722656, 0.08016586303710938, 0.08535575866699219, 0.090545654296875, 0.09573554992675781, 0.10092544555664062, 0.10611534118652344, 0.11130523681640625, 0.11649513244628906, 0.12168502807617188, 0.1268749237060547, 0.1320648193359375, 0.1372547149658203, 0.14244461059570312, 0.14763450622558594, 0.15282440185546875, 0.15801429748535156, 0.16320419311523438, 0.1683940887451172, 0.173583984375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 6.0, 4.0, 8.0, 8.0, 11.0, 14.0, 15.0, 12.0, 24.0, 22.0, 20.0, 24.0, 19.0, 29.0, 38.0, 44.0, 46.0, 37.0, 34.0, 46.0, 1069.0, 37.0, 52.0, 44.0, 37.0, 41.0, 31.0, 36.0, 24.0, 27.0, 22.0, 18.0, 26.0, 19.0, 10.0, 22.0, 11.0, 9.0, 8.0, 8.0, 6.0, 4.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78955078125, -0.7633819580078125, -0.737213134765625, -0.7110443115234375, -0.68487548828125, -0.6587066650390625, -0.632537841796875, -0.6063690185546875, -0.5802001953125, -0.5540313720703125, -0.527862548828125, -0.5016937255859375, -0.47552490234375, -0.4493560791015625, -0.423187255859375, -0.3970184326171875, -0.370849609375, -0.3446807861328125, -0.318511962890625, -0.2923431396484375, -0.26617431640625, -0.2400054931640625, -0.213836669921875, -0.1876678466796875, -0.1614990234375, -0.1353302001953125, -0.109161376953125, -0.0829925537109375, -0.05682373046875, -0.0306549072265625, -0.004486083984375, 0.0216827392578125, 0.0478515625, 0.0740203857421875, 0.100189208984375, 0.1263580322265625, 0.15252685546875, 0.1786956787109375, 0.204864501953125, 0.2310333251953125, 0.2572021484375, 0.2833709716796875, 0.309539794921875, 0.3357086181640625, 0.36187744140625, 0.3880462646484375, 0.414215087890625, 0.4403839111328125, 0.466552734375, 0.4927215576171875, 0.518890380859375, 0.5450592041015625, 0.57122802734375, 0.5973968505859375, 0.623565673828125, 0.6497344970703125, 0.6759033203125, 0.7020721435546875, 0.728240966796875, 0.7544097900390625, 0.78057861328125, 0.8067474365234375, 0.832916259765625, 0.8590850830078125, 0.88525390625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 1.0, 7.0, 7.0, 10.0, 10.0, 7.0, 9.0, 20.0, 21.0, 29.0, 45.0, 67.0, 53.0, 122.0, 150.0, 215.0, 400.0, 625.0, 1095.0, 2141.0, 4439.0, 9509.0, 23673.0, 63625.0, 188747.0, 1366745.0, 288090.0, 89890.0, 32007.0, 12914.0, 5887.0, 2764.0, 1431.0, 875.0, 482.0, 310.0, 226.0, 146.0, 107.0, 63.0, 50.0, 37.0, 25.0, 21.0, 7.0, 8.0, 7.0, 10.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.156494140625, -0.15184593200683594, -0.14719772338867188, -0.1425495147705078, -0.13790130615234375, -0.1332530975341797, -0.12860488891601562, -0.12395668029785156, -0.1193084716796875, -0.11466026306152344, -0.11001205444335938, -0.10536384582519531, -0.10071563720703125, -0.09606742858886719, -0.09141921997070312, -0.08677101135253906, -0.082122802734375, -0.07747459411621094, -0.07282638549804688, -0.06817817687988281, -0.06352996826171875, -0.05888175964355469, -0.054233551025390625, -0.04958534240722656, -0.0449371337890625, -0.04028892517089844, -0.035640716552734375, -0.030992507934570312, -0.02634429931640625, -0.021696090698242188, -0.017047882080078125, -0.012399673461914062, -0.00775146484375, -0.0031032562255859375, 0.001544952392578125, 0.0061931610107421875, 0.01084136962890625, 0.015489578247070312, 0.020137786865234375, 0.024785995483398438, 0.0294342041015625, 0.03408241271972656, 0.038730621337890625, 0.04337882995605469, 0.04802703857421875, 0.05267524719238281, 0.057323455810546875, 0.06197166442871094, 0.066619873046875, 0.07126808166503906, 0.07591629028320312, 0.08056449890136719, 0.08521270751953125, 0.08986091613769531, 0.09450912475585938, 0.09915733337402344, 0.1038055419921875, 0.10845375061035156, 0.11310195922851562, 0.11775016784667969, 0.12239837646484375, 0.1270465850830078, 0.13169479370117188, 0.13634300231933594, 0.1409912109375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 7.0, 4.0, 6.0, 19.0, 27.0, 50.0, 95.0, 269.0, 252.0, 121.0, 70.0, 35.0, 21.0, 8.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031585693359375, -0.03073287010192871, -0.029880046844482422, -0.029027223587036133, -0.028174400329589844, -0.027321577072143555, -0.026468753814697266, -0.025615930557250977, -0.024763107299804688, -0.0239102840423584, -0.02305746078491211, -0.02220463752746582, -0.02135181427001953, -0.020498991012573242, -0.019646167755126953, -0.018793344497680664, -0.017940521240234375, -0.017087697982788086, -0.016234874725341797, -0.015382051467895508, -0.014529228210449219, -0.01367640495300293, -0.01282358169555664, -0.011970758438110352, -0.011117935180664062, -0.010265111923217773, -0.009412288665771484, -0.008559465408325195, -0.007706642150878906, -0.006853818893432617, -0.006000995635986328, -0.005148172378540039, -0.00429534912109375, -0.003442525863647461, -0.002589702606201172, -0.0017368793487548828, -0.0008840560913085938, -3.123283386230469e-05, 0.0008215904235839844, 0.0016744136810302734, 0.0025272369384765625, 0.0033800601959228516, 0.004232883453369141, 0.00508570671081543, 0.005938529968261719, 0.006791353225708008, 0.007644176483154297, 0.008496999740600586, 0.009349822998046875, 0.010202646255493164, 0.011055469512939453, 0.011908292770385742, 0.012761116027832031, 0.01361393928527832, 0.01446676254272461, 0.015319585800170898, 0.016172409057617188, 0.017025232315063477, 0.017878055572509766, 0.018730878829956055, 0.019583702087402344, 0.020436525344848633, 0.021289348602294922, 0.02214217185974121, 0.0229949951171875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 1.0, 7.0, 11.0, 19.0, 38.0, 65.0, 128.0, 536.0, 34301.0, 1012089.0, 1023.0, 159.0, 65.0, 35.0, 14.0, 16.0, 15.0, 5.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46484375, -0.44771575927734375, -0.4305877685546875, -0.41345977783203125, -0.396331787109375, -0.37920379638671875, -0.3620758056640625, -0.34494781494140625, -0.32781982421875, -0.31069183349609375, -0.2935638427734375, -0.27643585205078125, -0.259307861328125, -0.24217987060546875, -0.2250518798828125, -0.20792388916015625, -0.1907958984375, -0.17366790771484375, -0.1565399169921875, -0.13941192626953125, -0.122283935546875, -0.10515594482421875, -0.0880279541015625, -0.07089996337890625, -0.05377197265625, -0.03664398193359375, -0.0195159912109375, -0.00238800048828125, 0.014739990234375, 0.03186798095703125, 0.0489959716796875, 0.06612396240234375, 0.083251953125, 0.10037994384765625, 0.1175079345703125, 0.13463592529296875, 0.151763916015625, 0.16889190673828125, 0.1860198974609375, 0.20314788818359375, 0.22027587890625, 0.23740386962890625, 0.2545318603515625, 0.27165985107421875, 0.288787841796875, 0.30591583251953125, 0.3230438232421875, 0.34017181396484375, 0.3572998046875, 0.37442779541015625, 0.3915557861328125, 0.40868377685546875, 0.425811767578125, 0.44293975830078125, 0.4600677490234375, 0.47719573974609375, 0.49432373046875, 0.5114517211914062, 0.5285797119140625, 0.5457077026367188, 0.562835693359375, 0.5799636840820312, 0.5970916748046875, 0.6142196655273438, 0.63134765625]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 37.0, 180.0, 507.0, 232.0, 48.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11935458332300186, -0.11712586879730225, -0.11489715427160263, -0.11266843974590302, -0.1104397252202034, -0.10821101069450378, -0.10598229616880417, -0.10375358164310455, -0.10152486711740494, -0.09929615259170532, -0.0970674380660057, -0.09483872354030609, -0.09261000901460648, -0.09038129448890686, -0.08815257996320724, -0.08592386543750763, -0.08369515091180801, -0.0814664363861084, -0.07923772186040878, -0.07700900733470917, -0.07478029280900955, -0.07255157828330994, -0.07032286375761032, -0.0680941492319107, -0.06586543470621109, -0.06363672018051147, -0.06140800565481186, -0.059179291129112244, -0.05695057660341263, -0.05472186207771301, -0.0524931475520134, -0.05026443302631378, -0.048035722225904465, -0.04580700770020485, -0.043578293174505234, -0.04134957864880562, -0.039120864123106, -0.03689214959740639, -0.03466343507170677, -0.032434720546007156, -0.03020600602030754, -0.027977291494607925, -0.02574857696890831, -0.023519862443208694, -0.02129114791750908, -0.019062433391809464, -0.016833718866109848, -0.014605004340410233, -0.012376289814710617, -0.010147575289011002, -0.007918860763311386, -0.005690146237611771, -0.003461431711912155, -0.0012327171862125397, 0.0009959973394870758, 0.0032247118651866913, 0.005453426390886307, 0.007682140916585922, 0.009910855442285538, 0.012139569967985153, 0.014368284493684769, 0.016596999019384384, 0.018825713545084, 0.021054428070783615, 0.02328314259648323]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 6.0, 7.0, 12.0, 13.0, 10.0, 14.0, 14.0, 9.0, 17.0, 23.0, 14.0, 29.0, 36.0, 36.0, 41.0, 36.0, 30.0, 43.0, 31.0, 40.0, 39.0, 47.0, 39.0, 42.0, 34.0, 42.0, 29.0, 35.0, 23.0, 25.0, 22.0, 27.0, 24.0, 18.0, 7.0, 13.0, 27.0, 11.0, 5.0, 8.0, 4.0, 2.0, 5.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.009152233600616455, -0.008870133198797703, -0.00858803279697895, -0.008305932395160198, -0.008023831993341446, -0.007741731591522694, -0.007459631189703941, -0.007177530787885189, -0.006895430386066437, -0.0066133299842476845, -0.006331229582428932, -0.00604912918061018, -0.005767028778791428, -0.005484928376972675, -0.005202827975153923, -0.004920727573335171, -0.0046386271715164185, -0.004356526769697666, -0.004074426367878914, -0.0037923259660601616, -0.0035102255642414093, -0.003228125162422657, -0.0029460247606039047, -0.0026639243587851524, -0.0023818239569664, -0.002099723555147648, -0.0018176231533288956, -0.0015355227515101433, -0.001253422349691391, -0.0009713219478726387, -0.0006892215460538864, -0.0004071211442351341, -0.00012502074241638184, 0.00015707965940237045, 0.00043918006122112274, 0.000721280463039875, 0.0010033808648586273, 0.0012854812666773796, 0.001567581668496132, 0.0018496820703148842, 0.0021317824721336365, 0.0024138828739523888, 0.002695983275771141, 0.0029780836775898933, 0.0032601840794086456, 0.003542284481227398, 0.00382438488304615, 0.0041064852848649025, 0.004388585686683655, 0.004670686088502407, 0.004952786490321159, 0.005234886892139912, 0.005516987293958664, 0.005799087695777416, 0.0060811880975961685, 0.006363288499414921, 0.006645388901233673, 0.006927489303052425, 0.007209589704871178, 0.00749169010668993, 0.007773790508508682, 0.008055890910327435, 0.008337991312146187, 0.008620091713964939, 0.008902192115783691]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 7.0, 2.0, 5.0, 6.0, 6.0, 11.0, 8.0, 5.0, 10.0, 11.0, 10.0, 25.0, 19.0, 19.0, 22.0, 21.0, 24.0, 21.0, 27.0, 26.0, 28.0, 30.0, 34.0, 34.0, 32.0, 29.0, 26.0, 42.0, 33.0, 40.0, 44.0, 27.0, 27.0, 31.0, 35.0, 26.0, 16.0, 23.0, 24.0, 21.0, 18.0, 21.0, 9.0, 15.0, 14.0, 10.0, 3.0, 5.0, 7.0, 8.0, 3.0, 3.0, 3.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.9716796875, -0.938812255859375, -0.90594482421875, -0.873077392578125, -0.8402099609375, -0.807342529296875, -0.77447509765625, -0.741607666015625, -0.708740234375, -0.675872802734375, -0.64300537109375, -0.610137939453125, -0.5772705078125, -0.544403076171875, -0.51153564453125, -0.478668212890625, -0.44580078125, -0.412933349609375, -0.38006591796875, -0.347198486328125, -0.3143310546875, -0.281463623046875, -0.24859619140625, -0.215728759765625, -0.182861328125, -0.149993896484375, -0.11712646484375, -0.084259033203125, -0.0513916015625, -0.018524169921875, 0.01434326171875, 0.047210693359375, 0.080078125, 0.112945556640625, 0.14581298828125, 0.178680419921875, 0.2115478515625, 0.244415283203125, 0.27728271484375, 0.310150146484375, 0.343017578125, 0.375885009765625, 0.40875244140625, 0.441619873046875, 0.4744873046875, 0.507354736328125, 0.54022216796875, 0.573089599609375, 0.60595703125, 0.638824462890625, 0.67169189453125, 0.704559326171875, 0.7374267578125, 0.770294189453125, 0.80316162109375, 0.836029052734375, 0.868896484375, 0.901763916015625, 0.93463134765625, 0.967498779296875, 1.0003662109375, 1.033233642578125, 1.06610107421875, 1.098968505859375, 1.1318359375]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 5.0, 1.0, 7.0, 4.0, 12.0, 14.0, 13.0, 26.0, 26.0, 31.0, 55.0, 95.0, 141.0, 199.0, 305.0, 468.0, 663.0, 979.0, 1492.0, 2363.0, 3703.0, 6074.0, 10434.0, 18774.0, 35659.0, 71828.0, 145995.0, 243884.0, 232777.0, 132464.0, 64778.0, 32625.0, 17285.0, 9718.0, 5612.0, 3491.0, 2234.0, 1485.0, 948.0, 637.0, 396.0, 297.0, 166.0, 111.0, 78.0, 57.0, 47.0, 23.0, 20.0, 19.0, 19.0, 3.0, 12.0, 2.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-1.5244140625, -1.475128173828125, -1.42584228515625, -1.376556396484375, -1.3272705078125, -1.277984619140625, -1.22869873046875, -1.179412841796875, -1.130126953125, -1.080841064453125, -1.03155517578125, -0.982269287109375, -0.9329833984375, -0.883697509765625, -0.83441162109375, -0.785125732421875, -0.73583984375, -0.686553955078125, -0.63726806640625, -0.587982177734375, -0.5386962890625, -0.489410400390625, -0.44012451171875, -0.390838623046875, -0.341552734375, -0.292266845703125, -0.24298095703125, -0.193695068359375, -0.1444091796875, -0.095123291015625, -0.04583740234375, 0.003448486328125, 0.052734375, 0.102020263671875, 0.15130615234375, 0.200592041015625, 0.2498779296875, 0.299163818359375, 0.34844970703125, 0.397735595703125, 0.447021484375, 0.496307373046875, 0.54559326171875, 0.594879150390625, 0.6441650390625, 0.693450927734375, 0.74273681640625, 0.792022705078125, 0.84130859375, 0.890594482421875, 0.93988037109375, 0.989166259765625, 1.0384521484375, 1.087738037109375, 1.13702392578125, 1.186309814453125, 1.235595703125, 1.284881591796875, 1.33416748046875, 1.383453369140625, 1.4327392578125, 1.482025146484375, 1.53131103515625, 1.580596923828125, 1.6298828125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 10.0, 10.0, 10.0, 11.0, 8.0, 9.0, 18.0, 19.0, 24.0, 25.0, 27.0, 29.0, 43.0, 50.0, 48.0, 84.0, 97.0, 116.0, 198.0, 1276.0, 177.0, 146.0, 99.0, 83.0, 56.0, 59.0, 45.0, 38.0, 43.0, 40.0, 20.0, 20.0, 19.0, 17.0, 10.0, 15.0, 7.0, 9.0, 7.0, 5.0, 3.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.04296875, -2.957733154296875, -2.87249755859375, -2.787261962890625, -2.7020263671875, -2.616790771484375, -2.53155517578125, -2.446319580078125, -2.361083984375, -2.275848388671875, -2.19061279296875, -2.105377197265625, -2.0201416015625, -1.934906005859375, -1.84967041015625, -1.764434814453125, -1.67919921875, -1.593963623046875, -1.50872802734375, -1.423492431640625, -1.3382568359375, -1.253021240234375, -1.16778564453125, -1.082550048828125, -0.997314453125, -0.912078857421875, -0.82684326171875, -0.741607666015625, -0.6563720703125, -0.571136474609375, -0.48590087890625, -0.400665283203125, -0.3154296875, -0.230194091796875, -0.14495849609375, -0.059722900390625, 0.0255126953125, 0.110748291015625, 0.19598388671875, 0.281219482421875, 0.366455078125, 0.451690673828125, 0.53692626953125, 0.622161865234375, 0.7073974609375, 0.792633056640625, 0.87786865234375, 0.963104248046875, 1.04833984375, 1.133575439453125, 1.21881103515625, 1.304046630859375, 1.3892822265625, 1.474517822265625, 1.55975341796875, 1.644989013671875, 1.730224609375, 1.815460205078125, 1.90069580078125, 1.985931396484375, 2.0711669921875, 2.156402587890625, 2.24163818359375, 2.326873779296875, 2.412109375]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 5.0, 3.0, 8.0, 9.0, 10.0, 9.0, 18.0, 20.0, 37.0, 46.0, 65.0, 90.0, 127.0, 201.0, 239.0, 503.0, 1225.0, 3109.0, 10920.0, 58240.0, 801279.0, 2115214.0, 127333.0, 18920.0, 4744.0, 1571.0, 676.0, 364.0, 204.0, 131.0, 109.0, 64.0, 58.0, 50.0, 30.0, 13.0, 12.0, 8.0, 9.0, 10.0, 5.0, 5.0, 2.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.51953125, -4.37908935546875, -4.2386474609375, -4.09820556640625, -3.957763671875, -3.81732177734375, -3.6768798828125, -3.53643798828125, -3.39599609375, -3.25555419921875, -3.1151123046875, -2.97467041015625, -2.834228515625, -2.69378662109375, -2.5533447265625, -2.41290283203125, -2.2724609375, -2.13201904296875, -1.9915771484375, -1.85113525390625, -1.710693359375, -1.57025146484375, -1.4298095703125, -1.28936767578125, -1.14892578125, -1.00848388671875, -0.8680419921875, -0.72760009765625, -0.587158203125, -0.44671630859375, -0.3062744140625, -0.16583251953125, -0.025390625, 0.11505126953125, 0.2554931640625, 0.39593505859375, 0.536376953125, 0.67681884765625, 0.8172607421875, 0.95770263671875, 1.09814453125, 1.23858642578125, 1.3790283203125, 1.51947021484375, 1.659912109375, 1.80035400390625, 1.9407958984375, 2.08123779296875, 2.2216796875, 2.36212158203125, 2.5025634765625, 2.64300537109375, 2.783447265625, 2.92388916015625, 3.0643310546875, 3.20477294921875, 3.34521484375, 3.48565673828125, 3.6260986328125, 3.76654052734375, 3.906982421875, 4.04742431640625, 4.1878662109375, 4.32830810546875, 4.46875]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 353.0, 657.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-152.70758056640625, -149.8297882080078, -146.9519805908203, -144.07418823242188, -141.19638061523438, -138.31858825683594, -135.4407958984375, -132.56298828125, -129.68519592285156, -126.8073959350586, -123.92959594726562, -121.05180358886719, -118.17400360107422, -115.29620361328125, -112.41840362548828, -109.54060363769531, -106.66279602050781, -103.78499603271484, -100.90719604492188, -98.02940368652344, -95.15160369873047, -92.2738037109375, -89.39600372314453, -86.51820373535156, -83.64041137695312, -80.76261138916016, -77.88481140136719, -75.00701904296875, -72.12921905517578, -69.25141906738281, -66.37361907958984, -63.495819091796875, -60.618019104003906, -57.74021911621094, -54.862422943115234, -51.984622955322266, -49.1068229675293, -46.229026794433594, -43.351226806640625, -40.473426818847656, -37.59562683105469, -34.71782684326172, -31.840028762817383, -28.962230682373047, -26.084430694580078, -23.206632614135742, -20.328834533691406, -17.451034545898438, -14.573238372802734, -11.695439338684082, -8.81764030456543, -5.939842224121094, -3.0620431900024414, -0.18424415588378906, 2.693553924560547, 5.571353912353516, 8.449151992797852, 11.326951026916504, 14.204750061035156, 17.082548141479492, 19.960346221923828, 22.838146209716797, 25.715944290161133, 28.5937442779541, 31.471542358398438]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 1.0, 8.0, 4.0, 6.0, 9.0, 13.0, 21.0, 18.0, 19.0, 16.0, 29.0, 29.0, 35.0, 25.0, 44.0, 23.0, 44.0, 40.0, 43.0, 43.0, 56.0, 45.0, 35.0, 36.0, 40.0, 37.0, 31.0, 38.0, 33.0, 39.0, 27.0, 14.0, 17.0, 15.0, 14.0, 12.0, 7.0, 7.0, 7.0, 6.0, 5.0, 1.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-7.8365583419799805, -7.591069221496582, -7.345579624176025, -7.100090026855469, -6.85460090637207, -6.609111785888672, -6.363622188568115, -6.118132591247559, -5.87264347076416, -5.627154350280762, -5.381664752960205, -5.136175155639648, -4.89068603515625, -4.645196914672852, -4.399707317352295, -4.154217720031738, -3.90872859954834, -3.6632392406463623, -3.4177498817443848, -3.1722605228424072, -2.9267711639404297, -2.681281805038452, -2.4357924461364746, -2.190303087234497, -1.9448137283325195, -1.699324369430542, -1.4538350105285645, -1.208345651626587, -0.9628562927246094, -0.7173669338226318, -0.4718775749206543, -0.22638821601867676, 0.019100666046142578, 0.2645900249481201, 0.5100793838500977, 0.7555687427520752, 1.0010581016540527, 1.2465474605560303, 1.4920368194580078, 1.7375261783599854, 1.983015537261963, 2.2285048961639404, 2.473994255065918, 2.7194836139678955, 2.964972972869873, 3.2104623317718506, 3.455951690673828, 3.7014410495758057, 3.946930408477783, 4.19242000579834, 4.437909126281738, 4.683398246765137, 4.928887844085693, 5.17437744140625, 5.419866561889648, 5.665355682373047, 5.9108452796936035, 6.15633487701416, 6.401823997497559, 6.647313117980957, 6.892802715301514, 7.13829231262207, 7.383781433105469, 7.629270553588867, 7.874760150909424]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 7.0, 3.0, 6.0, 5.0, 10.0, 15.0, 10.0, 9.0, 10.0, 17.0, 17.0, 20.0, 25.0, 21.0, 29.0, 35.0, 28.0, 32.0, 37.0, 35.0, 45.0, 37.0, 32.0, 31.0, 37.0, 40.0, 49.0, 37.0, 42.0, 32.0, 20.0, 29.0, 31.0, 31.0, 23.0, 15.0, 23.0, 16.0, 10.0, 14.0, 8.0, 9.0, 4.0, 8.0, 5.0, 4.0, 5.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.162109375, -1.1237945556640625, -1.085479736328125, -1.0471649169921875, -1.00885009765625, -0.9705352783203125, -0.932220458984375, -0.8939056396484375, -0.8555908203125, -0.8172760009765625, -0.778961181640625, -0.7406463623046875, -0.70233154296875, -0.6640167236328125, -0.625701904296875, -0.5873870849609375, -0.549072265625, -0.5107574462890625, -0.472442626953125, -0.4341278076171875, -0.39581298828125, -0.3574981689453125, -0.319183349609375, -0.2808685302734375, -0.2425537109375, -0.2042388916015625, -0.165924072265625, -0.1276092529296875, -0.08929443359375, -0.0509796142578125, -0.012664794921875, 0.0256500244140625, 0.06396484375, 0.1022796630859375, 0.140594482421875, 0.1789093017578125, 0.21722412109375, 0.2555389404296875, 0.293853759765625, 0.3321685791015625, 0.3704833984375, 0.4087982177734375, 0.447113037109375, 0.4854278564453125, 0.52374267578125, 0.5620574951171875, 0.600372314453125, 0.6386871337890625, 0.677001953125, 0.7153167724609375, 0.753631591796875, 0.7919464111328125, 0.83026123046875, 0.8685760498046875, 0.906890869140625, 0.9452056884765625, 0.9835205078125, 1.0218353271484375, 1.060150146484375, 1.0984649658203125, 1.13677978515625, 1.1750946044921875, 1.213409423828125, 1.2517242431640625, 1.2900390625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 5.0, 10.0, 1.0, 14.0, 15.0, 14.0, 15.0, 16.0, 28.0, 35.0, 54.0, 63.0, 64.0, 109.0, 161.0, 269.0, 559.0, 2142.0, 31497.0, 3990648.0, 162391.0, 4403.0, 772.0, 314.0, 176.0, 120.0, 101.0, 63.0, 50.0, 38.0, 26.0, 29.0, 20.0, 13.0, 12.0, 11.0, 3.0, 6.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.625, -9.26416015625, -8.9033203125, -8.54248046875, -8.181640625, -7.82080078125, -7.4599609375, -7.09912109375, -6.73828125, -6.37744140625, -6.0166015625, -5.65576171875, -5.294921875, -4.93408203125, -4.5732421875, -4.21240234375, -3.8515625, -3.49072265625, -3.1298828125, -2.76904296875, -2.408203125, -2.04736328125, -1.6865234375, -1.32568359375, -0.96484375, -0.60400390625, -0.2431640625, 0.11767578125, 0.478515625, 0.83935546875, 1.2001953125, 1.56103515625, 1.921875, 2.28271484375, 2.6435546875, 3.00439453125, 3.365234375, 3.72607421875, 4.0869140625, 4.44775390625, 4.80859375, 5.16943359375, 5.5302734375, 5.89111328125, 6.251953125, 6.61279296875, 6.9736328125, 7.33447265625, 7.6953125, 8.05615234375, 8.4169921875, 8.77783203125, 9.138671875, 9.49951171875, 9.8603515625, 10.22119140625, 10.58203125, 10.94287109375, 11.3037109375, 11.66455078125, 12.025390625, 12.38623046875, 12.7470703125, 13.10791015625, 13.46875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 5.0, 8.0, 9.0, 10.0, 19.0, 16.0, 23.0, 29.0, 42.0, 40.0, 56.0, 70.0, 66.0, 106.0, 150.0, 204.0, 293.0, 412.0, 554.0, 553.0, 405.0, 263.0, 177.0, 131.0, 92.0, 65.0, 64.0, 41.0, 27.0, 31.0, 19.0, 17.0, 16.0, 14.0, 9.0, 4.0, 7.0, 1.0, 2.0, 5.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0], "bins": [-1.873046875, -1.81597900390625, -1.7589111328125, -1.70184326171875, -1.644775390625, -1.58770751953125, -1.5306396484375, -1.47357177734375, -1.41650390625, -1.35943603515625, -1.3023681640625, -1.24530029296875, -1.188232421875, -1.13116455078125, -1.0740966796875, -1.01702880859375, -0.9599609375, -0.90289306640625, -0.8458251953125, -0.78875732421875, -0.731689453125, -0.67462158203125, -0.6175537109375, -0.56048583984375, -0.50341796875, -0.44635009765625, -0.3892822265625, -0.33221435546875, -0.275146484375, -0.21807861328125, -0.1610107421875, -0.10394287109375, -0.046875, 0.01019287109375, 0.0672607421875, 0.12432861328125, 0.181396484375, 0.23846435546875, 0.2955322265625, 0.35260009765625, 0.40966796875, 0.46673583984375, 0.5238037109375, 0.58087158203125, 0.637939453125, 0.69500732421875, 0.7520751953125, 0.80914306640625, 0.8662109375, 0.92327880859375, 0.9803466796875, 1.03741455078125, 1.094482421875, 1.15155029296875, 1.2086181640625, 1.26568603515625, 1.32275390625, 1.37982177734375, 1.4368896484375, 1.49395751953125, 1.551025390625, 1.60809326171875, 1.6651611328125, 1.72222900390625, 1.779296875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 7.0, 6.0, 10.0, 17.0, 28.0, 30.0, 33.0, 63.0, 98.0, 135.0, 326.0, 682.0, 1894.0, 6594.0, 33680.0, 320925.0, 3493903.0, 294372.0, 32028.0, 6196.0, 1795.0, 688.0, 313.0, 146.0, 95.0, 63.0, 48.0, 29.0, 23.0, 13.0, 11.0, 6.0, 7.0, 3.0, 1.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.18359375, -6.00933837890625, -5.8350830078125, -5.66082763671875, -5.486572265625, -5.31231689453125, -5.1380615234375, -4.96380615234375, -4.78955078125, -4.61529541015625, -4.4410400390625, -4.26678466796875, -4.092529296875, -3.91827392578125, -3.7440185546875, -3.56976318359375, -3.3955078125, -3.22125244140625, -3.0469970703125, -2.87274169921875, -2.698486328125, -2.52423095703125, -2.3499755859375, -2.17572021484375, -2.00146484375, -1.82720947265625, -1.6529541015625, -1.47869873046875, -1.304443359375, -1.13018798828125, -0.9559326171875, -0.78167724609375, -0.607421875, -0.43316650390625, -0.2589111328125, -0.08465576171875, 0.089599609375, 0.26385498046875, 0.4381103515625, 0.61236572265625, 0.78662109375, 0.96087646484375, 1.1351318359375, 1.30938720703125, 1.483642578125, 1.65789794921875, 1.8321533203125, 2.00640869140625, 2.1806640625, 2.35491943359375, 2.5291748046875, 2.70343017578125, 2.877685546875, 3.05194091796875, 3.2261962890625, 3.40045166015625, 3.57470703125, 3.74896240234375, 3.9232177734375, 4.09747314453125, 4.271728515625, 4.44598388671875, 4.6202392578125, 4.79449462890625, 4.96875]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 33.0, 198.0, 441.0, 274.0, 59.0, 10.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.707467555999756, -5.524057388305664, -4.3406476974487305, -3.1572375297546387, -1.9738273620605469, -0.7904171943664551, 0.3929924964904785, 1.5764031410217285, 2.759812831878662, 3.943222999572754, 5.1266326904296875, 6.310042858123779, 7.493453025817871, 8.676862716674805, 9.860273361206055, 11.043684005737305, 12.227092742919922, 13.410502433776855, 14.593913078308105, 15.777322769165039, 16.96073341369629, 18.144142150878906, 19.327552795410156, 20.510963439941406, 21.694374084472656, 22.877784729003906, 24.061193466186523, 25.244604110717773, 26.428014755249023, 27.61142349243164, 28.79483413696289, 29.97824478149414, 31.16165542602539, 32.34506607055664, 33.52847671508789, 34.711883544921875, 35.895294189453125, 37.078704833984375, 38.262115478515625, 39.445526123046875, 40.628936767578125, 41.812347412109375, 42.995758056640625, 44.179168701171875, 45.36257553100586, 46.54598617553711, 47.72939682006836, 48.91280746459961, 50.096214294433594, 51.279624938964844, 52.463035583496094, 53.646446228027344, 54.82985305786133, 56.01326370239258, 57.19667434692383, 58.38008499145508, 59.56349563598633, 60.74690628051758, 61.93031692504883, 63.11372375488281, 64.29713439941406, 65.48054504394531, 66.66395568847656, 67.84736633300781, 69.03077697753906]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 1.0, 7.0, 6.0, 12.0, 8.0, 8.0, 8.0, 16.0, 15.0, 19.0, 21.0, 17.0, 27.0, 35.0, 26.0, 34.0, 32.0, 32.0, 38.0, 35.0, 41.0, 47.0, 40.0, 42.0, 51.0, 42.0, 35.0, 27.0, 35.0, 37.0, 37.0, 23.0, 25.0, 23.0, 15.0, 11.0, 7.0, 14.0, 5.0, 11.0, 6.0, 5.0, 5.0, 5.0, 4.0, 3.0, 2.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.843233108520508, -5.649523735046387, -5.455814361572266, -5.2621049880981445, -5.068395614624023, -4.874686241149902, -4.680976867675781, -4.48726749420166, -4.293558120727539, -4.099848747253418, -3.906139373779297, -3.712430000305176, -3.5187206268310547, -3.3250112533569336, -3.1313018798828125, -2.9375925064086914, -2.7438831329345703, -2.550173759460449, -2.356464385986328, -2.162755012512207, -1.969045639038086, -1.7753362655639648, -1.5816268920898438, -1.3879175186157227, -1.1942081451416016, -1.0004987716674805, -0.8067893981933594, -0.6130800247192383, -0.4193706512451172, -0.2256612777709961, -0.031951904296875, 0.1617574691772461, 0.3554668426513672, 0.5491762161254883, 0.7428855895996094, 0.9365949630737305, 1.1303043365478516, 1.3240137100219727, 1.5177230834960938, 1.7114324569702148, 1.905141830444336, 2.098851203918457, 2.292560577392578, 2.486269950866699, 2.6799793243408203, 2.8736886978149414, 3.0673980712890625, 3.2611074447631836, 3.4548168182373047, 3.648526191711426, 3.842235565185547, 4.035944938659668, 4.229654312133789, 4.42336368560791, 4.617073059082031, 4.810782432556152, 5.004491806030273, 5.1982011795043945, 5.391910552978516, 5.585619926452637, 5.779329299926758, 5.973038673400879, 6.166748046875, 6.360457420349121, 6.554166793823242]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 6.0, 5.0, 3.0, 4.0, 9.0, 6.0, 16.0, 7.0, 15.0, 13.0, 11.0, 25.0, 24.0, 20.0, 24.0, 14.0, 33.0, 36.0, 31.0, 39.0, 28.0, 40.0, 37.0, 43.0, 40.0, 43.0, 46.0, 35.0, 35.0, 29.0, 32.0, 34.0, 29.0, 23.0, 23.0, 26.0, 18.0, 19.0, 16.0, 12.0, 6.0, 11.0, 8.0, 10.0, 3.0, 5.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.2412109375, -1.203765869140625, -1.16632080078125, -1.128875732421875, -1.0914306640625, -1.053985595703125, -1.01654052734375, -0.979095458984375, -0.941650390625, -0.904205322265625, -0.86676025390625, -0.829315185546875, -0.7918701171875, -0.754425048828125, -0.71697998046875, -0.679534912109375, -0.64208984375, -0.604644775390625, -0.56719970703125, -0.529754638671875, -0.4923095703125, -0.454864501953125, -0.41741943359375, -0.379974365234375, -0.342529296875, -0.305084228515625, -0.26763916015625, -0.230194091796875, -0.1927490234375, -0.155303955078125, -0.11785888671875, -0.080413818359375, -0.04296875, -0.005523681640625, 0.03192138671875, 0.069366455078125, 0.1068115234375, 0.144256591796875, 0.18170166015625, 0.219146728515625, 0.256591796875, 0.294036865234375, 0.33148193359375, 0.368927001953125, 0.4063720703125, 0.443817138671875, 0.48126220703125, 0.518707275390625, 0.55615234375, 0.593597412109375, 0.63104248046875, 0.668487548828125, 0.7059326171875, 0.743377685546875, 0.78082275390625, 0.818267822265625, 0.855712890625, 0.893157958984375, 0.93060302734375, 0.968048095703125, 1.0054931640625, 1.042938232421875, 1.08038330078125, 1.117828369140625, 1.1552734375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 3.0, 7.0, 5.0, 11.0, 20.0, 21.0, 30.0, 21.0, 39.0, 44.0, 53.0, 79.0, 74.0, 130.0, 154.0, 229.0, 278.0, 417.0, 607.0, 1018.0, 1800.0, 3045.0, 5513.0, 10729.0, 21880.0, 48060.0, 110931.0, 250005.0, 309884.0, 156020.0, 66634.0, 29646.0, 14285.0, 7117.0, 3825.0, 2046.0, 1267.0, 754.0, 486.0, 353.0, 250.0, 172.0, 146.0, 111.0, 85.0, 68.0, 50.0, 44.0, 30.0, 20.0, 16.0, 16.0, 14.0, 6.0, 10.0, 5.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.237548828125, -0.2299346923828125, -0.222320556640625, -0.2147064208984375, -0.20709228515625, -0.1994781494140625, -0.191864013671875, -0.1842498779296875, -0.1766357421875, -0.1690216064453125, -0.161407470703125, -0.1537933349609375, -0.14617919921875, -0.1385650634765625, -0.130950927734375, -0.1233367919921875, -0.11572265625, -0.1081085205078125, -0.100494384765625, -0.0928802490234375, -0.08526611328125, -0.0776519775390625, -0.070037841796875, -0.0624237060546875, -0.0548095703125, -0.0471954345703125, -0.039581298828125, -0.0319671630859375, -0.02435302734375, -0.0167388916015625, -0.009124755859375, -0.0015106201171875, 0.006103515625, 0.0137176513671875, 0.021331787109375, 0.0289459228515625, 0.03656005859375, 0.0441741943359375, 0.051788330078125, 0.0594024658203125, 0.0670166015625, 0.0746307373046875, 0.082244873046875, 0.0898590087890625, 0.09747314453125, 0.1050872802734375, 0.112701416015625, 0.1203155517578125, 0.1279296875, 0.1355438232421875, 0.143157958984375, 0.1507720947265625, 0.15838623046875, 0.1660003662109375, 0.173614501953125, 0.1812286376953125, 0.1888427734375, 0.1964569091796875, 0.204071044921875, 0.2116851806640625, 0.21929931640625, 0.2269134521484375, 0.234527587890625, 0.2421417236328125, 0.249755859375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 6.0, 8.0, 4.0, 9.0, 10.0, 13.0, 16.0, 21.0, 18.0, 25.0, 16.0, 27.0, 33.0, 25.0, 29.0, 26.0, 42.0, 44.0, 32.0, 44.0, 1071.0, 41.0, 44.0, 38.0, 39.0, 41.0, 26.0, 37.0, 35.0, 28.0, 19.0, 32.0, 23.0, 23.0, 19.0, 12.0, 11.0, 13.0, 5.0, 5.0, 8.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8642578125, -0.8361358642578125, -0.808013916015625, -0.7798919677734375, -0.75177001953125, -0.7236480712890625, -0.695526123046875, -0.6674041748046875, -0.6392822265625, -0.6111602783203125, -0.583038330078125, -0.5549163818359375, -0.52679443359375, -0.4986724853515625, -0.470550537109375, -0.4424285888671875, -0.414306640625, -0.3861846923828125, -0.358062744140625, -0.3299407958984375, -0.30181884765625, -0.2736968994140625, -0.245574951171875, -0.2174530029296875, -0.1893310546875, -0.1612091064453125, -0.133087158203125, -0.1049652099609375, -0.07684326171875, -0.0487213134765625, -0.020599365234375, 0.0075225830078125, 0.03564453125, 0.0637664794921875, 0.091888427734375, 0.1200103759765625, 0.14813232421875, 0.1762542724609375, 0.204376220703125, 0.2324981689453125, 0.2606201171875, 0.2887420654296875, 0.316864013671875, 0.3449859619140625, 0.37310791015625, 0.4012298583984375, 0.429351806640625, 0.4574737548828125, 0.485595703125, 0.5137176513671875, 0.541839599609375, 0.5699615478515625, 0.59808349609375, 0.6262054443359375, 0.654327392578125, 0.6824493408203125, 0.7105712890625, 0.7386932373046875, 0.766815185546875, 0.7949371337890625, 0.82305908203125, 0.8511810302734375, 0.879302978515625, 0.9074249267578125, 0.935546875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 5.0, 9.0, 13.0, 20.0, 29.0, 37.0, 65.0, 105.0, 176.0, 268.0, 429.0, 721.0, 1144.0, 1914.0, 3312.0, 5790.0, 10469.0, 19697.0, 38464.0, 77361.0, 165261.0, 906550.0, 576076.0, 144803.0, 69381.0, 34555.0, 17736.0, 9699.0, 5399.0, 3069.0, 1876.0, 1039.0, 678.0, 365.0, 202.0, 142.0, 102.0, 54.0, 40.0, 21.0, 21.0, 15.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0], "bins": [-0.1375732421875, -0.13384723663330078, -0.13012123107910156, -0.12639522552490234, -0.12266921997070312, -0.1189432144165039, -0.11521720886230469, -0.11149120330810547, -0.10776519775390625, -0.10403919219970703, -0.10031318664550781, -0.0965871810913086, -0.09286117553710938, -0.08913516998291016, -0.08540916442871094, -0.08168315887451172, -0.0779571533203125, -0.07423114776611328, -0.07050514221191406, -0.06677913665771484, -0.06305313110351562, -0.059327125549316406, -0.05560111999511719, -0.05187511444091797, -0.04814910888671875, -0.04442310333251953, -0.04069709777832031, -0.036971092224121094, -0.033245086669921875, -0.029519081115722656, -0.025793075561523438, -0.02206707000732422, -0.018341064453125, -0.014615058898925781, -0.010889053344726562, -0.007163047790527344, -0.003437042236328125, 0.00028896331787109375, 0.0040149688720703125, 0.007740974426269531, 0.01146697998046875, 0.015192985534667969, 0.018918991088867188, 0.022644996643066406, 0.026371002197265625, 0.030097007751464844, 0.03382301330566406, 0.03754901885986328, 0.0412750244140625, 0.04500102996826172, 0.04872703552246094, 0.052453041076660156, 0.056179046630859375, 0.059905052185058594, 0.06363105773925781, 0.06735706329345703, 0.07108306884765625, 0.07480907440185547, 0.07853507995605469, 0.0822610855102539, 0.08598709106445312, 0.08971309661865234, 0.09343910217285156, 0.09716510772705078, 0.10089111328125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 0.0, 3.0, 2.0, 3.0, 6.0, 6.0, 6.0, 11.0, 5.0, 12.0, 17.0, 14.0, 39.0, 47.0, 69.0, 128.0, 147.0, 141.0, 94.0, 67.0, 43.0, 28.0, 10.0, 12.0, 11.0, 12.0, 10.0, 4.0, 5.0, 6.0, 6.0, 3.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0209808349609375, -0.020343542098999023, -0.019706249237060547, -0.01906895637512207, -0.018431663513183594, -0.017794370651245117, -0.01715707778930664, -0.016519784927368164, -0.015882492065429688, -0.015245199203491211, -0.014607906341552734, -0.013970613479614258, -0.013333320617675781, -0.012696027755737305, -0.012058734893798828, -0.011421442031860352, -0.010784149169921875, -0.010146856307983398, -0.009509563446044922, -0.008872270584106445, -0.008234977722167969, -0.007597684860229492, -0.006960391998291016, -0.006323099136352539, -0.0056858062744140625, -0.005048513412475586, -0.004411220550537109, -0.003773927688598633, -0.0031366348266601562, -0.0024993419647216797, -0.0018620491027832031, -0.0012247562408447266, -0.00058746337890625, 4.982948303222656e-05, 0.0006871223449707031, 0.0013244152069091797, 0.0019617080688476562, 0.002599000930786133, 0.0032362937927246094, 0.003873586654663086, 0.0045108795166015625, 0.005148172378540039, 0.005785465240478516, 0.006422758102416992, 0.007060050964355469, 0.007697343826293945, 0.008334636688232422, 0.008971929550170898, 0.009609222412109375, 0.010246515274047852, 0.010883808135986328, 0.011521100997924805, 0.012158393859863281, 0.012795686721801758, 0.013432979583740234, 0.014070272445678711, 0.014707565307617188, 0.015344858169555664, 0.01598215103149414, 0.016619443893432617, 0.017256736755371094, 0.01789402961730957, 0.018531322479248047, 0.019168615341186523, 0.019805908203125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 9.0, 5.0, 9.0, 7.0, 14.0, 13.0, 14.0, 6.0, 16.0, 21.0, 28.0, 37.0, 46.0, 101.0, 186.0, 556.0, 2241.0, 21445.0, 1005162.0, 15733.0, 1864.0, 480.0, 184.0, 113.0, 57.0, 39.0, 31.0, 18.0, 14.0, 11.0, 19.0, 10.0, 13.0, 3.0, 6.0, 0.0, 6.0, 4.0, 1.0, 7.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0], "bins": [-0.376220703125, -0.3642578125, -0.352294921875, -0.34033203125, -0.328369140625, -0.31640625, -0.304443359375, -0.29248046875, -0.280517578125, -0.2685546875, -0.256591796875, -0.24462890625, -0.232666015625, -0.220703125, -0.208740234375, -0.19677734375, -0.184814453125, -0.1728515625, -0.160888671875, -0.14892578125, -0.136962890625, -0.125, -0.113037109375, -0.10107421875, -0.089111328125, -0.0771484375, -0.065185546875, -0.05322265625, -0.041259765625, -0.029296875, -0.017333984375, -0.00537109375, 0.006591796875, 0.0185546875, 0.030517578125, 0.04248046875, 0.054443359375, 0.06640625, 0.078369140625, 0.09033203125, 0.102294921875, 0.1142578125, 0.126220703125, 0.13818359375, 0.150146484375, 0.162109375, 0.174072265625, 0.18603515625, 0.197998046875, 0.2099609375, 0.221923828125, 0.23388671875, 0.245849609375, 0.2578125, 0.269775390625, 0.28173828125, 0.293701171875, 0.3056640625, 0.317626953125, 0.32958984375, 0.341552734375, 0.353515625, 0.365478515625, 0.37744140625, 0.389404296875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 9.0, 11.0, 15.0, 35.0, 32.0, 49.0, 77.0, 105.0, 125.0, 153.0, 129.0, 66.0, 69.0, 43.0, 26.0, 21.0, 13.0, 9.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03974579647183418, -0.03867802023887634, -0.0376102440059185, -0.03654246777296066, -0.03547469154000282, -0.03440691530704498, -0.03333913907408714, -0.0322713628411293, -0.031203586608171463, -0.030135810375213623, -0.029068034142255783, -0.028000257909297943, -0.026932481676340103, -0.025864705443382263, -0.024796929210424423, -0.023729152977466583, -0.022661376744508743, -0.021593600511550903, -0.020525824278593063, -0.019458048045635223, -0.018390271812677383, -0.017322495579719543, -0.016254719346761703, -0.015186943113803864, -0.014119166880846024, -0.013051390647888184, -0.011983614414930344, -0.010915838181972504, -0.009848061949014664, -0.008780285716056824, -0.007712509483098984, -0.006644733250141144, -0.005576957017183304, -0.004509180784225464, -0.003441404551267624, -0.002373628318309784, -0.001305852085351944, -0.000238075852394104, 0.000829700380563736, 0.001897476613521576, 0.002965252846479416, 0.004033029079437256, 0.005100805312395096, 0.006168581545352936, 0.007236357778310776, 0.008304134011268616, 0.009371910244226456, 0.010439686477184296, 0.011507462710142136, 0.012575238943099976, 0.013643015176057816, 0.014710791409015656, 0.015778567641973495, 0.016846343874931335, 0.017914120107889175, 0.018981896340847015, 0.020049672573804855, 0.021117448806762695, 0.022185225039720535, 0.023253001272678375, 0.024320777505636215, 0.025388553738594055, 0.026456329971551895, 0.027524106204509735, 0.028591882437467575]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 8.0, 8.0, 8.0, 7.0, 11.0, 7.0, 19.0, 12.0, 16.0, 16.0, 26.0, 31.0, 32.0, 34.0, 37.0, 36.0, 35.0, 37.0, 45.0, 48.0, 52.0, 45.0, 49.0, 42.0, 41.0, 42.0, 38.0, 34.0, 25.0, 34.0, 19.0, 25.0, 20.0, 13.0, 6.0, 7.0, 6.0, 3.0, 8.0, 9.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.02067023515701294, -0.02008119970560074, -0.019492164254188538, -0.018903128802776337, -0.018314093351364136, -0.017725057899951935, -0.017136022448539734, -0.016546986997127533, -0.015957951545715332, -0.015368916094303131, -0.01477988064289093, -0.01419084519147873, -0.013601809740066528, -0.013012774288654327, -0.012423738837242126, -0.011834703385829926, -0.011245667934417725, -0.010656632483005524, -0.010067597031593323, -0.009478561580181122, -0.008889526128768921, -0.00830049067735672, -0.007711455225944519, -0.007122419774532318, -0.006533384323120117, -0.005944348871707916, -0.005355313420295715, -0.004766277968883514, -0.0041772425174713135, -0.0035882070660591125, -0.0029991716146469116, -0.0024101361632347107, -0.0018211007118225098, -0.0012320652604103088, -0.0006430298089981079, -5.399435758590698e-05, 0.0005350410938262939, 0.0011240765452384949, 0.0017131119966506958, 0.0023021474480628967, 0.0028911828994750977, 0.0034802183508872986, 0.0040692538022994995, 0.0046582892537117004, 0.005247324705123901, 0.005836360156536102, 0.006425395607948303, 0.007014431059360504, 0.007603466510772705, 0.008192501962184906, 0.008781537413597107, 0.009370572865009308, 0.009959608316421509, 0.01054864376783371, 0.01113767921924591, 0.011726714670658112, 0.012315750122070312, 0.012904785573482513, 0.013493821024894714, 0.014082856476306915, 0.014671891927719116, 0.015260927379131317, 0.015849962830543518, 0.01643899828195572, 0.01702803373336792]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 6.0, 5.0, 3.0, 4.0, 9.0, 6.0, 16.0, 7.0, 15.0, 13.0, 11.0, 25.0, 24.0, 19.0, 25.0, 14.0, 33.0, 36.0, 30.0, 40.0, 29.0, 39.0, 37.0, 41.0, 42.0, 40.0, 49.0, 34.0, 33.0, 30.0, 32.0, 35.0, 30.0, 23.0, 23.0, 26.0, 15.0, 22.0, 15.0, 13.0, 6.0, 11.0, 8.0, 10.0, 3.0, 5.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.2412109375, -1.20379638671875, -1.1663818359375, -1.12896728515625, -1.091552734375, -1.05413818359375, -1.0167236328125, -0.97930908203125, -0.94189453125, -0.90447998046875, -0.8670654296875, -0.82965087890625, -0.792236328125, -0.75482177734375, -0.7174072265625, -0.67999267578125, -0.642578125, -0.60516357421875, -0.5677490234375, -0.53033447265625, -0.492919921875, -0.45550537109375, -0.4180908203125, -0.38067626953125, -0.34326171875, -0.30584716796875, -0.2684326171875, -0.23101806640625, -0.193603515625, -0.15618896484375, -0.1187744140625, -0.08135986328125, -0.0439453125, -0.00653076171875, 0.0308837890625, 0.06829833984375, 0.105712890625, 0.14312744140625, 0.1805419921875, 0.21795654296875, 0.25537109375, 0.29278564453125, 0.3302001953125, 0.36761474609375, 0.405029296875, 0.44244384765625, 0.4798583984375, 0.51727294921875, 0.5546875, 0.59210205078125, 0.6295166015625, 0.66693115234375, 0.704345703125, 0.74176025390625, 0.7791748046875, 0.81658935546875, 0.85400390625, 0.89141845703125, 0.9288330078125, 0.96624755859375, 1.003662109375, 1.04107666015625, 1.0784912109375, 1.11590576171875, 1.1533203125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 9.0, 8.0, 14.0, 22.0, 34.0, 38.0, 67.0, 103.0, 146.0, 198.0, 328.0, 486.0, 822.0, 1312.0, 2148.0, 3839.0, 7200.0, 14231.0, 29810.0, 67748.0, 163987.0, 345416.0, 234488.0, 94986.0, 40915.0, 18892.0, 9557.0, 4823.0, 2698.0, 1573.0, 941.0, 571.0, 383.0, 266.0, 145.0, 120.0, 85.0, 58.0, 30.0, 28.0, 17.0, 11.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.09375, -2.025543212890625, -1.95733642578125, -1.889129638671875, -1.8209228515625, -1.752716064453125, -1.68450927734375, -1.616302490234375, -1.548095703125, -1.479888916015625, -1.41168212890625, -1.343475341796875, -1.2752685546875, -1.207061767578125, -1.13885498046875, -1.070648193359375, -1.00244140625, -0.934234619140625, -0.86602783203125, -0.797821044921875, -0.7296142578125, -0.661407470703125, -0.59320068359375, -0.524993896484375, -0.456787109375, -0.388580322265625, -0.32037353515625, -0.252166748046875, -0.1839599609375, -0.115753173828125, -0.04754638671875, 0.020660400390625, 0.0888671875, 0.157073974609375, 0.22528076171875, 0.293487548828125, 0.3616943359375, 0.429901123046875, 0.49810791015625, 0.566314697265625, 0.634521484375, 0.702728271484375, 0.77093505859375, 0.839141845703125, 0.9073486328125, 0.975555419921875, 1.04376220703125, 1.111968994140625, 1.18017578125, 1.248382568359375, 1.31658935546875, 1.384796142578125, 1.4530029296875, 1.521209716796875, 1.58941650390625, 1.657623291015625, 1.725830078125, 1.794036865234375, 1.86224365234375, 1.930450439453125, 1.9986572265625, 2.066864013671875, 2.13507080078125, 2.203277587890625, 2.271484375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 8.0, 11.0, 10.0, 10.0, 14.0, 27.0, 24.0, 26.0, 25.0, 36.0, 41.0, 51.0, 63.0, 77.0, 148.0, 268.0, 1414.0, 229.0, 120.0, 67.0, 60.0, 44.0, 44.0, 40.0, 42.0, 28.0, 24.0, 18.0, 13.0, 11.0, 9.0, 10.0, 11.0, 5.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6953125, -3.590789794921875, -3.48626708984375, -3.381744384765625, -3.2772216796875, -3.172698974609375, -3.06817626953125, -2.963653564453125, -2.859130859375, -2.754608154296875, -2.65008544921875, -2.545562744140625, -2.4410400390625, -2.336517333984375, -2.23199462890625, -2.127471923828125, -2.02294921875, -1.918426513671875, -1.81390380859375, -1.709381103515625, -1.6048583984375, -1.500335693359375, -1.39581298828125, -1.291290283203125, -1.186767578125, -1.082244873046875, -0.97772216796875, -0.873199462890625, -0.7686767578125, -0.664154052734375, -0.55963134765625, -0.455108642578125, -0.3505859375, -0.246063232421875, -0.14154052734375, -0.037017822265625, 0.0675048828125, 0.172027587890625, 0.27655029296875, 0.381072998046875, 0.485595703125, 0.590118408203125, 0.69464111328125, 0.799163818359375, 0.9036865234375, 1.008209228515625, 1.11273193359375, 1.217254638671875, 1.32177734375, 1.426300048828125, 1.53082275390625, 1.635345458984375, 1.7398681640625, 1.844390869140625, 1.94891357421875, 2.053436279296875, 2.157958984375, 2.262481689453125, 2.36700439453125, 2.471527099609375, 2.5760498046875, 2.680572509765625, 2.78509521484375, 2.889617919921875, 2.994140625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 8.0, 5.0, 5.0, 13.0, 17.0, 18.0, 18.0, 20.0, 35.0, 55.0, 66.0, 95.0, 115.0, 180.0, 264.0, 419.0, 769.0, 2604.0, 84564.0, 3032704.0, 20330.0, 1584.0, 618.0, 373.0, 234.0, 162.0, 115.0, 73.0, 57.0, 61.0, 39.0, 26.0, 10.0, 12.0, 12.0, 7.0, 8.0, 4.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5859375, -9.2354736328125, -8.885009765625, -8.5345458984375, -8.18408203125, -7.8336181640625, -7.483154296875, -7.1326904296875, -6.7822265625, -6.4317626953125, -6.081298828125, -5.7308349609375, -5.38037109375, -5.0299072265625, -4.679443359375, -4.3289794921875, -3.978515625, -3.6280517578125, -3.277587890625, -2.9271240234375, -2.57666015625, -2.2261962890625, -1.875732421875, -1.5252685546875, -1.1748046875, -0.8243408203125, -0.473876953125, -0.1234130859375, 0.22705078125, 0.5775146484375, 0.927978515625, 1.2784423828125, 1.62890625, 1.9793701171875, 2.329833984375, 2.6802978515625, 3.03076171875, 3.3812255859375, 3.731689453125, 4.0821533203125, 4.4326171875, 4.7830810546875, 5.133544921875, 5.4840087890625, 5.83447265625, 6.1849365234375, 6.535400390625, 6.8858642578125, 7.236328125, 7.5867919921875, 7.937255859375, 8.2877197265625, 8.63818359375, 8.9886474609375, 9.339111328125, 9.6895751953125, 10.0400390625, 10.3905029296875, 10.740966796875, 11.0914306640625, 11.44189453125, 11.7923583984375, 12.142822265625, 12.4932861328125, 12.84375]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 10.0, 10.0, 28.0, 74.0, 143.0, 215.0, 222.0, 172.0, 82.0, 31.0, 18.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.501022338867188, -21.96599769592285, -21.430971145629883, -20.895946502685547, -20.360919952392578, -19.825895309448242, -19.290870666503906, -18.755844116210938, -18.2208194732666, -17.685794830322266, -17.150768280029297, -16.61574363708496, -16.080718994140625, -15.545692443847656, -15.01066780090332, -14.475642204284668, -13.940616607666016, -13.405591011047363, -12.870565414428711, -12.335540771484375, -11.800515174865723, -11.26548957824707, -10.730464935302734, -10.195439338684082, -9.66041374206543, -9.125388145446777, -8.590362548828125, -8.055337905883789, -7.520312309265137, -6.985286712646484, -6.45026159286499, -5.915236473083496, -5.38021183013916, -4.845186233520508, -4.310161113739014, -3.7751357555389404, -3.240110397338867, -2.705085039138794, -2.1700596809387207, -1.6350343227386475, -1.1000089645385742, -0.564983606338501, -0.029958248138427734, 0.5050671100616455, 1.0400924682617188, 1.575117826461792, 2.1101431846618652, 2.6451685428619385, 3.1801939010620117, 3.715219259262085, 4.250244617462158, 4.785269737243652, 5.320295333862305, 5.855320930480957, 6.390346050262451, 6.925371170043945, 7.460396766662598, 7.99542236328125, 8.530447006225586, 9.065472602844238, 9.60049819946289, 10.135523796081543, 10.670549392700195, 11.205574035644531, 11.740599632263184]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 14.0, 10.0, 10.0, 12.0, 13.0, 20.0, 15.0, 22.0, 32.0, 39.0, 29.0, 30.0, 36.0, 43.0, 39.0, 36.0, 47.0, 36.0, 43.0, 43.0, 29.0, 28.0, 53.0, 49.0, 30.0, 34.0, 31.0, 21.0, 18.0, 20.0, 23.0, 12.0, 16.0, 20.0, 4.0, 8.0, 9.0, 10.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.69442081451416, -8.430889129638672, -8.1673583984375, -7.903826713562012, -7.640295028686523, -7.376763820648193, -7.113232612609863, -6.849700927734375, -6.586169719696045, -6.322638511657715, -6.059106826782227, -5.7955756187438965, -5.532044410705566, -5.268512725830078, -5.004981517791748, -4.741450309753418, -4.47791862487793, -4.2143874168396, -3.9508557319641113, -3.6873245239257812, -3.423793077468872, -3.160261631011963, -2.896730422973633, -2.6331989765167236, -2.3696675300598145, -2.1061360836029053, -1.8426047563552856, -1.579073429107666, -1.3155419826507568, -1.0520105361938477, -0.788479208946228, -0.5249478816986084, -0.2614173889160156, 0.0021139979362487793, 0.2656453847885132, 0.5291767716407776, 0.792708158493042, 1.0562396049499512, 1.3197709321975708, 1.5833022594451904, 1.8468337059020996, 2.110365152359009, 2.373896598815918, 2.637427806854248, 2.9009592533111572, 3.1644906997680664, 3.4280219078063965, 3.6915533542633057, 3.955084800720215, 4.218616008758545, 4.482147693634033, 4.745678901672363, 5.009210586547852, 5.272741794586182, 5.536273002624512, 5.7998046875, 6.06333589553833, 6.32686710357666, 6.590398788452148, 6.8539299964904785, 7.117461204528809, 7.380992889404297, 7.644524097442627, 7.908055305480957, 8.171586990356445]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 3.0, 7.0, 3.0, 5.0, 12.0, 7.0, 9.0, 10.0, 19.0, 17.0, 17.0, 15.0, 19.0, 19.0, 21.0, 20.0, 31.0, 31.0, 24.0, 32.0, 34.0, 33.0, 42.0, 40.0, 39.0, 41.0, 43.0, 32.0, 42.0, 32.0, 32.0, 20.0, 25.0, 33.0, 24.0, 28.0, 18.0, 14.0, 17.0, 13.0, 12.0, 15.0, 8.0, 7.0, 7.0, 4.0, 3.0, 4.0, 4.0, 2.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-1.1318359375, -1.096832275390625, -1.06182861328125, -1.026824951171875, -0.9918212890625, -0.956817626953125, -0.92181396484375, -0.886810302734375, -0.851806640625, -0.816802978515625, -0.78179931640625, -0.746795654296875, -0.7117919921875, -0.676788330078125, -0.64178466796875, -0.606781005859375, -0.57177734375, -0.536773681640625, -0.50177001953125, -0.466766357421875, -0.4317626953125, -0.396759033203125, -0.36175537109375, -0.326751708984375, -0.291748046875, -0.256744384765625, -0.22174072265625, -0.186737060546875, -0.1517333984375, -0.116729736328125, -0.08172607421875, -0.046722412109375, -0.01171875, 0.023284912109375, 0.05828857421875, 0.093292236328125, 0.1282958984375, 0.163299560546875, 0.19830322265625, 0.233306884765625, 0.268310546875, 0.303314208984375, 0.33831787109375, 0.373321533203125, 0.4083251953125, 0.443328857421875, 0.47833251953125, 0.513336181640625, 0.54833984375, 0.583343505859375, 0.61834716796875, 0.653350830078125, 0.6883544921875, 0.723358154296875, 0.75836181640625, 0.793365478515625, 0.828369140625, 0.863372802734375, 0.89837646484375, 0.933380126953125, 0.9683837890625, 1.003387451171875, 1.03839111328125, 1.073394775390625, 1.1083984375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 9.0, 17.0, 33.0, 54.0, 129.0, 187.0, 385.0, 780.0, 1707.0, 4968.0, 20201.0, 221359.0, 3163085.0, 729576.0, 39982.0, 7395.0, 2374.0, 1030.0, 478.0, 241.0, 141.0, 72.0, 39.0, 16.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.859375, -4.715087890625, -4.57080078125, -4.426513671875, -4.2822265625, -4.137939453125, -3.99365234375, -3.849365234375, -3.705078125, -3.560791015625, -3.41650390625, -3.272216796875, -3.1279296875, -2.983642578125, -2.83935546875, -2.695068359375, -2.55078125, -2.406494140625, -2.26220703125, -2.117919921875, -1.9736328125, -1.829345703125, -1.68505859375, -1.540771484375, -1.396484375, -1.252197265625, -1.10791015625, -0.963623046875, -0.8193359375, -0.675048828125, -0.53076171875, -0.386474609375, -0.2421875, -0.097900390625, 0.04638671875, 0.190673828125, 0.3349609375, 0.479248046875, 0.62353515625, 0.767822265625, 0.912109375, 1.056396484375, 1.20068359375, 1.344970703125, 1.4892578125, 1.633544921875, 1.77783203125, 1.922119140625, 2.06640625, 2.210693359375, 2.35498046875, 2.499267578125, 2.6435546875, 2.787841796875, 2.93212890625, 3.076416015625, 3.220703125, 3.364990234375, 3.50927734375, 3.653564453125, 3.7978515625, 3.942138671875, 4.08642578125, 4.230712890625, 4.375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 3.0, 11.0, 20.0, 15.0, 34.0, 44.0, 44.0, 85.0, 100.0, 98.0, 157.0, 218.0, 329.0, 506.0, 655.0, 534.0, 354.0, 249.0, 168.0, 105.0, 95.0, 66.0, 58.0, 35.0, 24.0, 28.0, 9.0, 4.0, 7.0, 10.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.552734375, -2.476776123046875, -2.40081787109375, -2.324859619140625, -2.2489013671875, -2.172943115234375, -2.09698486328125, -2.021026611328125, -1.945068359375, -1.869110107421875, -1.79315185546875, -1.717193603515625, -1.6412353515625, -1.565277099609375, -1.48931884765625, -1.413360595703125, -1.33740234375, -1.261444091796875, -1.18548583984375, -1.109527587890625, -1.0335693359375, -0.957611083984375, -0.88165283203125, -0.805694580078125, -0.729736328125, -0.653778076171875, -0.57781982421875, -0.501861572265625, -0.4259033203125, -0.349945068359375, -0.27398681640625, -0.198028564453125, -0.1220703125, -0.046112060546875, 0.02984619140625, 0.105804443359375, 0.1817626953125, 0.257720947265625, 0.33367919921875, 0.409637451171875, 0.485595703125, 0.561553955078125, 0.63751220703125, 0.713470458984375, 0.7894287109375, 0.865386962890625, 0.94134521484375, 1.017303466796875, 1.09326171875, 1.169219970703125, 1.24517822265625, 1.321136474609375, 1.3970947265625, 1.473052978515625, 1.54901123046875, 1.624969482421875, 1.700927734375, 1.776885986328125, 1.85284423828125, 1.928802490234375, 2.0047607421875, 2.080718994140625, 2.15667724609375, 2.232635498046875, 2.30859375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 7.0, 14.0, 14.0, 28.0, 45.0, 86.0, 143.0, 227.0, 499.0, 1502.0, 7006.0, 64962.0, 1970980.0, 2071613.0, 67352.0, 7189.0, 1525.0, 496.0, 253.0, 141.0, 63.0, 47.0, 42.0, 15.0, 15.0, 8.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.4375, -6.25360107421875, -6.0697021484375, -5.88580322265625, -5.701904296875, -5.51800537109375, -5.3341064453125, -5.15020751953125, -4.96630859375, -4.78240966796875, -4.5985107421875, -4.41461181640625, -4.230712890625, -4.04681396484375, -3.8629150390625, -3.67901611328125, -3.4951171875, -3.31121826171875, -3.1273193359375, -2.94342041015625, -2.759521484375, -2.57562255859375, -2.3917236328125, -2.20782470703125, -2.02392578125, -1.84002685546875, -1.6561279296875, -1.47222900390625, -1.288330078125, -1.10443115234375, -0.9205322265625, -0.73663330078125, -0.552734375, -0.36883544921875, -0.1849365234375, -0.00103759765625, 0.182861328125, 0.36676025390625, 0.5506591796875, 0.73455810546875, 0.91845703125, 1.10235595703125, 1.2862548828125, 1.47015380859375, 1.654052734375, 1.83795166015625, 2.0218505859375, 2.20574951171875, 2.3896484375, 2.57354736328125, 2.7574462890625, 2.94134521484375, 3.125244140625, 3.30914306640625, 3.4930419921875, 3.67694091796875, 3.86083984375, 4.04473876953125, 4.2286376953125, 4.41253662109375, 4.596435546875, 4.78033447265625, 4.9642333984375, 5.14813232421875, 5.33203125]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 20.0, 155.0, 624.0, 201.0, 13.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.53470230102539, -54.68478775024414, -52.834877014160156, -50.984962463378906, -49.135047912597656, -47.285133361816406, -45.435218811035156, -43.58530807495117, -41.73539352416992, -39.88547897338867, -38.03556823730469, -36.18565368652344, -34.33573913574219, -32.48582458496094, -30.63591194152832, -28.785999298095703, -26.936084747314453, -25.086170196533203, -23.236257553100586, -21.38634490966797, -19.53643035888672, -17.68651580810547, -15.836603164672852, -13.986689567565918, -12.136775970458984, -10.28686237335205, -8.436948776245117, -6.587035179138184, -4.73712158203125, -2.8872079849243164, -1.0372943878173828, 0.8126192092895508, 2.6625289916992188, 4.512442588806152, 6.362356185913086, 8.21226978302002, 10.062183380126953, 11.912096977233887, 13.76201057434082, 15.611924171447754, 17.461837768554688, 19.311752319335938, 21.161664962768555, 23.011577606201172, 24.861492156982422, 26.711406707763672, 28.56131935119629, 30.411231994628906, 32.261146545410156, 34.111061096191406, 35.960975646972656, 37.81088638305664, 39.66080093383789, 41.51071548461914, 43.360626220703125, 45.210540771484375, 47.060455322265625, 48.910369873046875, 50.760284423828125, 52.61019515991211, 54.46010971069336, 56.31002426147461, 58.159934997558594, 60.009849548339844, 61.859764099121094]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 6.0, 10.0, 8.0, 19.0, 11.0, 24.0, 19.0, 24.0, 26.0, 26.0, 34.0, 22.0, 42.0, 30.0, 50.0, 39.0, 42.0, 38.0, 37.0, 33.0, 30.0, 39.0, 34.0, 37.0, 38.0, 39.0, 28.0, 36.0, 17.0, 12.0, 22.0, 21.0, 26.0, 12.0, 15.0, 9.0, 12.0, 7.0, 6.0, 7.0, 7.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.762332916259766, -6.537089824676514, -6.3118462562561035, -6.086603164672852, -5.8613600730896, -5.6361165046691895, -5.4108734130859375, -5.185629844665527, -4.960386753082275, -4.735143661499023, -4.509900093078613, -4.284657001495361, -4.059413909912109, -3.834170341491699, -3.6089272499084473, -3.383683919906616, -3.1584408283233643, -2.933197498321533, -2.7079544067382812, -2.48271107673645, -2.257467746734619, -2.032224655151367, -1.8069813251495361, -1.581737995147705, -1.3564947843551636, -1.131251573562622, -0.906008243560791, -0.6807650327682495, -0.45552176237106323, -0.23027849197387695, -0.005035281181335449, 0.2202080488204956, 0.4454512596130371, 0.6706945300102234, 0.8959378004074097, 1.1211810111999512, 1.3464243412017822, 1.5716675519943237, 1.7969107627868652, 2.0221540927886963, 2.2473974227905273, 2.4726407527923584, 2.6978838443756104, 2.9231271743774414, 3.1483705043792725, 3.3736138343811035, 3.5988569259643555, 3.8241002559661865, 4.049343109130859, 4.274586200714111, 4.4998297691345215, 4.725072860717773, 4.950315952301025, 5.1755595207214355, 5.4008026123046875, 5.626046180725098, 5.85128927230835, 6.076532363891602, 6.301775932312012, 6.527019023895264, 6.752262115478516, 6.977505683898926, 7.202748775482178, 7.42799186706543, 7.65323543548584]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 9.0, 9.0, 13.0, 4.0, 11.0, 10.0, 16.0, 17.0, 24.0, 30.0, 27.0, 32.0, 30.0, 42.0, 32.0, 47.0, 35.0, 47.0, 33.0, 39.0, 27.0, 54.0, 48.0, 31.0, 39.0, 33.0, 33.0, 33.0, 30.0, 23.0, 18.0, 22.0, 19.0, 17.0, 14.0, 10.0, 10.0, 5.0, 6.0, 6.0, 3.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9423828125, -0.9073028564453125, -0.872222900390625, -0.8371429443359375, -0.80206298828125, -0.7669830322265625, -0.731903076171875, -0.6968231201171875, -0.6617431640625, -0.6266632080078125, -0.591583251953125, -0.5565032958984375, -0.52142333984375, -0.4863433837890625, -0.451263427734375, -0.4161834716796875, -0.381103515625, -0.3460235595703125, -0.310943603515625, -0.2758636474609375, -0.24078369140625, -0.2057037353515625, -0.170623779296875, -0.1355438232421875, -0.1004638671875, -0.0653839111328125, -0.030303955078125, 0.0047760009765625, 0.03985595703125, 0.0749359130859375, 0.110015869140625, 0.1450958251953125, 0.18017578125, 0.2152557373046875, 0.250335693359375, 0.2854156494140625, 0.32049560546875, 0.3555755615234375, 0.390655517578125, 0.4257354736328125, 0.4608154296875, 0.4958953857421875, 0.530975341796875, 0.5660552978515625, 0.60113525390625, 0.6362152099609375, 0.671295166015625, 0.7063751220703125, 0.741455078125, 0.7765350341796875, 0.811614990234375, 0.8466949462890625, 0.88177490234375, 0.9168548583984375, 0.951934814453125, 0.9870147705078125, 1.0220947265625, 1.0571746826171875, 1.092254638671875, 1.1273345947265625, 1.16241455078125, 1.1974945068359375, 1.232574462890625, 1.2676544189453125, 1.302734375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 7.0, 8.0, 8.0, 10.0, 17.0, 38.0, 41.0, 64.0, 116.0, 168.0, 274.0, 418.0, 879.0, 1804.0, 4107.0, 12653.0, 47216.0, 210319.0, 518216.0, 189857.0, 43001.0, 11759.0, 4021.0, 1604.0, 812.0, 466.0, 247.0, 164.0, 90.0, 66.0, 39.0, 27.0, 16.0, 10.0, 8.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.279052734375, -0.2685089111328125, -0.257965087890625, -0.2474212646484375, -0.23687744140625, -0.2263336181640625, -0.215789794921875, -0.2052459716796875, -0.1947021484375, -0.1841583251953125, -0.173614501953125, -0.1630706787109375, -0.15252685546875, -0.1419830322265625, -0.131439208984375, -0.1208953857421875, -0.1103515625, -0.0998077392578125, -0.089263916015625, -0.0787200927734375, -0.06817626953125, -0.0576324462890625, -0.047088623046875, -0.0365447998046875, -0.0260009765625, -0.0154571533203125, -0.004913330078125, 0.0056304931640625, 0.01617431640625, 0.0267181396484375, 0.037261962890625, 0.0478057861328125, 0.058349609375, 0.0688934326171875, 0.079437255859375, 0.0899810791015625, 0.10052490234375, 0.1110687255859375, 0.121612548828125, 0.1321563720703125, 0.1427001953125, 0.1532440185546875, 0.163787841796875, 0.1743316650390625, 0.18487548828125, 0.1954193115234375, 0.205963134765625, 0.2165069580078125, 0.22705078125, 0.2375946044921875, 0.248138427734375, 0.2586822509765625, 0.26922607421875, 0.2797698974609375, 0.290313720703125, 0.3008575439453125, 0.3114013671875, 0.3219451904296875, 0.332489013671875, 0.3430328369140625, 0.35357666015625, 0.3641204833984375, 0.374664306640625, 0.3852081298828125, 0.395751953125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 8.0, 5.0, 8.0, 6.0, 7.0, 4.0, 11.0, 8.0, 14.0, 9.0, 25.0, 21.0, 23.0, 35.0, 22.0, 22.0, 24.0, 30.0, 35.0, 35.0, 40.0, 39.0, 37.0, 1069.0, 45.0, 44.0, 44.0, 43.0, 28.0, 34.0, 22.0, 29.0, 28.0, 20.0, 23.0, 15.0, 20.0, 14.0, 14.0, 13.0, 13.0, 6.0, 8.0, 7.0, 10.0, 6.0, 0.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.74853515625, -0.7261505126953125, -0.703765869140625, -0.6813812255859375, -0.65899658203125, -0.6366119384765625, -0.614227294921875, -0.5918426513671875, -0.5694580078125, -0.5470733642578125, -0.524688720703125, -0.5023040771484375, -0.47991943359375, -0.4575347900390625, -0.435150146484375, -0.4127655029296875, -0.390380859375, -0.3679962158203125, -0.345611572265625, -0.3232269287109375, -0.30084228515625, -0.2784576416015625, -0.256072998046875, -0.2336883544921875, -0.2113037109375, -0.1889190673828125, -0.166534423828125, -0.1441497802734375, -0.12176513671875, -0.0993804931640625, -0.076995849609375, -0.0546112060546875, -0.0322265625, -0.0098419189453125, 0.012542724609375, 0.0349273681640625, 0.05731201171875, 0.0796966552734375, 0.102081298828125, 0.1244659423828125, 0.1468505859375, 0.1692352294921875, 0.191619873046875, 0.2140045166015625, 0.23638916015625, 0.2587738037109375, 0.281158447265625, 0.3035430908203125, 0.325927734375, 0.3483123779296875, 0.370697021484375, 0.3930816650390625, 0.41546630859375, 0.4378509521484375, 0.460235595703125, 0.4826202392578125, 0.5050048828125, 0.5273895263671875, 0.549774169921875, 0.5721588134765625, 0.59454345703125, 0.6169281005859375, 0.639312744140625, 0.6616973876953125, 0.68408203125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 10.0, 7.0, 5.0, 20.0, 28.0, 27.0, 31.0, 52.0, 60.0, 80.0, 109.0, 103.0, 183.0, 245.0, 302.0, 412.0, 627.0, 923.0, 1439.0, 2368.0, 4370.0, 8352.0, 17386.0, 39052.0, 98474.0, 311036.0, 1319566.0, 172391.0, 64949.0, 27134.0, 12374.0, 6185.0, 3200.0, 1889.0, 1150.0, 701.0, 486.0, 360.0, 258.0, 184.0, 149.0, 100.0, 77.0, 62.0, 61.0, 41.0, 37.0, 22.0, 20.0, 13.0, 11.0, 5.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0], "bins": [-0.1170654296875, -0.11319923400878906, -0.10933303833007812, -0.10546684265136719, -0.10160064697265625, -0.09773445129394531, -0.09386825561523438, -0.09000205993652344, -0.0861358642578125, -0.08226966857910156, -0.07840347290039062, -0.07453727722167969, -0.07067108154296875, -0.06680488586425781, -0.06293869018554688, -0.05907249450683594, -0.055206298828125, -0.05134010314941406, -0.047473907470703125, -0.04360771179199219, -0.03974151611328125, -0.03587532043457031, -0.032009124755859375, -0.028142929077148438, -0.0242767333984375, -0.020410537719726562, -0.016544342041015625, -0.012678146362304688, -0.00881195068359375, -0.0049457550048828125, -0.001079559326171875, 0.0027866363525390625, 0.00665283203125, 0.010519027709960938, 0.014385223388671875, 0.018251419067382812, 0.02211761474609375, 0.025983810424804688, 0.029850006103515625, 0.03371620178222656, 0.0375823974609375, 0.04144859313964844, 0.045314788818359375, 0.04918098449707031, 0.05304718017578125, 0.05691337585449219, 0.060779571533203125, 0.06464576721191406, 0.068511962890625, 0.07237815856933594, 0.07624435424804688, 0.08011054992675781, 0.08397674560546875, 0.08784294128417969, 0.09170913696289062, 0.09557533264160156, 0.0994415283203125, 0.10330772399902344, 0.10717391967773438, 0.11104011535644531, 0.11490631103515625, 0.11877250671386719, 0.12263870239257812, 0.12650489807128906, 0.13037109375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 5.0, 1.0, 4.0, 4.0, 4.0, 6.0, 10.0, 11.0, 19.0, 20.0, 31.0, 53.0, 67.0, 90.0, 84.0, 113.0, 90.0, 89.0, 71.0, 56.0, 48.0, 30.0, 25.0, 15.0, 8.0, 2.0, 7.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 6.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.009063720703125, -0.008787989616394043, -0.008512258529663086, -0.008236527442932129, -0.007960796356201172, -0.007685065269470215, -0.007409334182739258, -0.007133603096008301, -0.006857872009277344, -0.006582140922546387, -0.00630640983581543, -0.006030678749084473, -0.005754947662353516, -0.005479216575622559, -0.0052034854888916016, -0.0049277544021606445, -0.0046520233154296875, -0.0043762922286987305, -0.0041005611419677734, -0.0038248300552368164, -0.0035490989685058594, -0.0032733678817749023, -0.0029976367950439453, -0.0027219057083129883, -0.0024461746215820312, -0.0021704435348510742, -0.0018947124481201172, -0.0016189813613891602, -0.0013432502746582031, -0.001067519187927246, -0.0007917881011962891, -0.000516057014465332, -0.000240325927734375, 3.540515899658203e-05, 0.00031113624572753906, 0.0005868673324584961, 0.0008625984191894531, 0.0011383295059204102, 0.0014140605926513672, 0.0016897916793823242, 0.0019655227661132812, 0.0022412538528442383, 0.0025169849395751953, 0.0027927160263061523, 0.0030684471130371094, 0.0033441781997680664, 0.0036199092864990234, 0.0038956403732299805, 0.0041713714599609375, 0.0044471025466918945, 0.0047228336334228516, 0.004998564720153809, 0.005274295806884766, 0.005550026893615723, 0.00582575798034668, 0.006101489067077637, 0.006377220153808594, 0.006652951240539551, 0.006928682327270508, 0.007204413414001465, 0.007480144500732422, 0.007755875587463379, 0.008031606674194336, 0.008307337760925293, 0.00858306884765625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 3.0, 4.0, 4.0, 4.0, 13.0, 7.0, 9.0, 8.0, 20.0, 35.0, 55.0, 82.0, 163.0, 259.0, 690.0, 13078.0, 1024244.0, 8625.0, 574.0, 278.0, 133.0, 73.0, 52.0, 34.0, 28.0, 10.0, 12.0, 10.0, 11.0, 1.0, 2.0, 8.0, 2.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1968994140625, -0.19101333618164062, -0.18512725830078125, -0.17924118041992188, -0.1733551025390625, -0.16746902465820312, -0.16158294677734375, -0.15569686889648438, -0.149810791015625, -0.14392471313476562, -0.13803863525390625, -0.13215255737304688, -0.1262664794921875, -0.12038040161132812, -0.11449432373046875, -0.10860824584960938, -0.10272216796875, -0.09683609008789062, -0.09095001220703125, -0.08506393432617188, -0.0791778564453125, -0.07329177856445312, -0.06740570068359375, -0.061519622802734375, -0.055633544921875, -0.049747467041015625, -0.04386138916015625, -0.037975311279296875, -0.0320892333984375, -0.026203155517578125, -0.02031707763671875, -0.014430999755859375, -0.008544921875, -0.002658843994140625, 0.00322723388671875, 0.009113311767578125, 0.0149993896484375, 0.020885467529296875, 0.02677154541015625, 0.032657623291015625, 0.038543701171875, 0.044429779052734375, 0.05031585693359375, 0.056201934814453125, 0.0620880126953125, 0.06797409057617188, 0.07386016845703125, 0.07974624633789062, 0.08563232421875, 0.09151840209960938, 0.09740447998046875, 0.10329055786132812, 0.1091766357421875, 0.11506271362304688, 0.12094879150390625, 0.12683486938476562, 0.132720947265625, 0.13860702514648438, 0.14449310302734375, 0.15037918090820312, 0.1562652587890625, 0.16215133666992188, 0.16803741455078125, 0.17392349243164062, 0.1798095703125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 10.0, 25.0, 54.0, 106.0, 180.0, 241.0, 201.0, 99.0, 63.0, 25.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.026927482336759567, -0.02624380774796009, -0.025560135021805763, -0.024876460433006287, -0.02419278770685196, -0.023509113118052483, -0.022825438529253006, -0.02214176580309868, -0.02145809307694435, -0.020774418488144875, -0.020090745761990547, -0.01940707117319107, -0.018723398447036743, -0.018039723858237267, -0.01735604926943779, -0.016672376543283463, -0.015988701954483986, -0.015305028297007084, -0.014621354639530182, -0.013937680050730705, -0.013254007324576378, -0.012570332735776901, -0.0118866590783, -0.011202985420823097, -0.010519311763346195, -0.009835638105869293, -0.009151964448392391, -0.00846829079091549, -0.0077846166677773, -0.007100943010300398, -0.0064172688871622086, -0.0057335952296853065, -0.0050499215722084045, -0.0043662479147315025, -0.003682574024423957, -0.002998900134116411, -0.002315226476639509, -0.0016315528191626072, -0.0009478786960244179, -0.00026420503854751587, 0.00041946861892938614, 0.00110314239282161, 0.0017868161667138338, 0.0024704900570213795, 0.0031541637144982815, 0.0038378373719751835, 0.004521511495113373, 0.005205185152590275, 0.005888858810067177, 0.006572532467544079, 0.007256206125020981, 0.007939880713820457, 0.008623553439974785, 0.009307228028774261, 0.009990901686251163, 0.010674575343728065, 0.011358249001204967, 0.01204192265868187, 0.012725596316158772, 0.013409269973635674, 0.01409294456243515, 0.014776617288589478, 0.015460291877388954, 0.01614396646618843, 0.016827639192342758]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 3.0, 6.0, 11.0, 9.0, 17.0, 18.0, 11.0, 24.0, 21.0, 26.0, 28.0, 32.0, 45.0, 32.0, 39.0, 30.0, 45.0, 50.0, 45.0, 42.0, 38.0, 41.0, 51.0, 48.0, 38.0, 23.0, 28.0, 34.0, 19.0, 23.0, 17.0, 20.0, 13.0, 8.0, 11.0, 13.0, 9.0, 4.0, 3.0, 6.0, 2.0, 5.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.007984161376953125, -0.007743661291897297, -0.007503161206841469, -0.007262661121785641, -0.007022161036729813, -0.0067816609516739845, -0.006541160866618156, -0.006300660781562328, -0.0060601606965065, -0.005819660611450672, -0.005579160526394844, -0.005338660441339016, -0.005098160356283188, -0.00485766027122736, -0.004617160186171532, -0.004376660101115704, -0.0041361600160598755, -0.0038956599310040474, -0.0036551598459482193, -0.003414659760892391, -0.003174159675836563, -0.002933659590780735, -0.002693159505724907, -0.002452659420669079, -0.0022121593356132507, -0.0019716592505574226, -0.0017311591655015945, -0.0014906590804457664, -0.0012501589953899384, -0.0010096589103341103, -0.0007691588252782822, -0.0005286587402224541, -0.000288158655166626, -4.765857011079788e-05, 0.0001928415149450302, 0.0004333416000008583, 0.0006738416850566864, 0.0009143417701125145, 0.0011548418551683426, 0.0013953419402241707, 0.0016358420252799988, 0.0018763421103358269, 0.002116842195391655, 0.002357342280447483, 0.002597842365503311, 0.0028383424505591393, 0.0030788425356149673, 0.0033193426206707954, 0.0035598427057266235, 0.0038003427907824516, 0.00404084287583828, 0.004281342960894108, 0.004521843045949936, 0.004762343131005764, 0.005002843216061592, 0.00524334330111742, 0.005483843386173248, 0.005724343471229076, 0.0059648435562849045, 0.006205343641340733, 0.006445843726396561, 0.006686343811452389, 0.006926843896508217, 0.007167343981564045, 0.007407844066619873]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 9.0, 9.0, 13.0, 4.0, 11.0, 10.0, 16.0, 17.0, 24.0, 29.0, 28.0, 32.0, 30.0, 41.0, 34.0, 46.0, 35.0, 48.0, 32.0, 39.0, 28.0, 53.0, 47.0, 32.0, 38.0, 34.0, 33.0, 33.0, 30.0, 23.0, 18.0, 22.0, 19.0, 17.0, 14.0, 10.0, 10.0, 5.0, 6.0, 6.0, 3.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94287109375, -0.9077835083007812, -0.8726959228515625, -0.8376083374023438, -0.802520751953125, -0.7674331665039062, -0.7323455810546875, -0.6972579956054688, -0.66217041015625, -0.6270828247070312, -0.5919952392578125, -0.5569076538085938, -0.521820068359375, -0.48673248291015625, -0.4516448974609375, -0.41655731201171875, -0.3814697265625, -0.34638214111328125, -0.3112945556640625, -0.27620697021484375, -0.241119384765625, -0.20603179931640625, -0.1709442138671875, -0.13585662841796875, -0.10076904296875, -0.06568145751953125, -0.0305938720703125, 0.00449371337890625, 0.039581298828125, 0.07466888427734375, 0.1097564697265625, 0.14484405517578125, 0.179931640625, 0.21501922607421875, 0.2501068115234375, 0.28519439697265625, 0.320281982421875, 0.35536956787109375, 0.3904571533203125, 0.42554473876953125, 0.46063232421875, 0.49571990966796875, 0.5308074951171875, 0.5658950805664062, 0.600982666015625, 0.6360702514648438, 0.6711578369140625, 0.7062454223632812, 0.7413330078125, 0.7764205932617188, 0.8115081787109375, 0.8465957641601562, 0.881683349609375, 0.9167709350585938, 0.9518585205078125, 0.9869461059570312, 1.02203369140625, 1.0571212768554688, 1.0922088623046875, 1.1272964477539062, 1.162384033203125, 1.1974716186523438, 1.2325592041015625, 1.2676467895507812, 1.302734375]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 3.0, 3.0, 13.0, 19.0, 16.0, 23.0, 44.0, 49.0, 57.0, 84.0, 129.0, 201.0, 248.0, 396.0, 606.0, 1046.0, 1822.0, 3359.0, 7254.0, 15815.0, 37992.0, 102585.0, 340880.0, 357877.0, 106453.0, 39493.0, 16272.0, 7308.0, 3602.0, 1856.0, 1062.0, 636.0, 414.0, 258.0, 191.0, 132.0, 100.0, 74.0, 55.0, 30.0, 31.0, 22.0, 17.0, 11.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.171875, -2.1080322265625, -2.044189453125, -1.9803466796875, -1.91650390625, -1.8526611328125, -1.788818359375, -1.7249755859375, -1.6611328125, -1.5972900390625, -1.533447265625, -1.4696044921875, -1.40576171875, -1.3419189453125, -1.278076171875, -1.2142333984375, -1.150390625, -1.0865478515625, -1.022705078125, -0.9588623046875, -0.89501953125, -0.8311767578125, -0.767333984375, -0.7034912109375, -0.6396484375, -0.5758056640625, -0.511962890625, -0.4481201171875, -0.38427734375, -0.3204345703125, -0.256591796875, -0.1927490234375, -0.12890625, -0.0650634765625, -0.001220703125, 0.0626220703125, 0.12646484375, 0.1903076171875, 0.254150390625, 0.3179931640625, 0.3818359375, 0.4456787109375, 0.509521484375, 0.5733642578125, 0.63720703125, 0.7010498046875, 0.764892578125, 0.8287353515625, 0.892578125, 0.9564208984375, 1.020263671875, 1.0841064453125, 1.14794921875, 1.2117919921875, 1.275634765625, 1.3394775390625, 1.4033203125, 1.4671630859375, 1.531005859375, 1.5948486328125, 1.65869140625, 1.7225341796875, 1.786376953125, 1.8502197265625, 1.9140625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 6.0, 10.0, 15.0, 16.0, 15.0, 19.0, 36.0, 32.0, 33.0, 49.0, 48.0, 78.0, 96.0, 161.0, 262.0, 1411.0, 213.0, 161.0, 81.0, 47.0, 57.0, 36.0, 25.0, 28.0, 20.0, 24.0, 21.0, 19.0, 14.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.017578125, -2.907257080078125, -2.79693603515625, -2.686614990234375, -2.5762939453125, -2.465972900390625, -2.35565185546875, -2.245330810546875, -2.135009765625, -2.024688720703125, -1.91436767578125, -1.804046630859375, -1.6937255859375, -1.583404541015625, -1.47308349609375, -1.362762451171875, -1.25244140625, -1.142120361328125, -1.03179931640625, -0.921478271484375, -0.8111572265625, -0.700836181640625, -0.59051513671875, -0.480194091796875, -0.369873046875, -0.259552001953125, -0.14923095703125, -0.038909912109375, 0.0714111328125, 0.181732177734375, 0.29205322265625, 0.402374267578125, 0.5126953125, 0.623016357421875, 0.73333740234375, 0.843658447265625, 0.9539794921875, 1.064300537109375, 1.17462158203125, 1.284942626953125, 1.395263671875, 1.505584716796875, 1.61590576171875, 1.726226806640625, 1.8365478515625, 1.946868896484375, 2.05718994140625, 2.167510986328125, 2.27783203125, 2.388153076171875, 2.49847412109375, 2.608795166015625, 2.7191162109375, 2.829437255859375, 2.93975830078125, 3.050079345703125, 3.160400390625, 3.270721435546875, 3.38104248046875, 3.491363525390625, 3.6016845703125, 3.712005615234375, 3.82232666015625, 3.932647705078125, 4.04296875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 3.0, 7.0, 8.0, 12.0, 18.0, 32.0, 48.0, 92.0, 118.0, 227.0, 416.0, 835.0, 2423.0, 29822.0, 3094248.0, 13823.0, 1902.0, 782.0, 371.0, 191.0, 113.0, 77.0, 39.0, 35.0, 15.0, 18.0, 8.0, 5.0, 3.0, 6.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.8359375, -14.40478515625, -13.9736328125, -13.54248046875, -13.111328125, -12.68017578125, -12.2490234375, -11.81787109375, -11.38671875, -10.95556640625, -10.5244140625, -10.09326171875, -9.662109375, -9.23095703125, -8.7998046875, -8.36865234375, -7.9375, -7.50634765625, -7.0751953125, -6.64404296875, -6.212890625, -5.78173828125, -5.3505859375, -4.91943359375, -4.48828125, -4.05712890625, -3.6259765625, -3.19482421875, -2.763671875, -2.33251953125, -1.9013671875, -1.47021484375, -1.0390625, -0.60791015625, -0.1767578125, 0.25439453125, 0.685546875, 1.11669921875, 1.5478515625, 1.97900390625, 2.41015625, 2.84130859375, 3.2724609375, 3.70361328125, 4.134765625, 4.56591796875, 4.9970703125, 5.42822265625, 5.859375, 6.29052734375, 6.7216796875, 7.15283203125, 7.583984375, 8.01513671875, 8.4462890625, 8.87744140625, 9.30859375, 9.73974609375, 10.1708984375, 10.60205078125, 11.033203125, 11.46435546875, 11.8955078125, 12.32666015625, 12.7578125]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 6.0, 0.0, 10.0, 32.0, 47.0, 79.0, 103.0, 178.0, 154.0, 141.0, 109.0, 70.0, 34.0, 18.0, 19.0, 9.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.101462364196777, -5.560796737670898, -5.0201311111450195, -4.479465007781982, -3.9387993812561035, -3.3981337547302246, -2.8574678897857666, -2.3168020248413086, -1.7761363983154297, -1.2354706525802612, -0.6948049068450928, -0.15413916110992432, 0.38652658462524414, 0.927192211151123, 1.467858076095581, 2.008523941040039, 2.549189567565918, 3.089855194091797, 3.630521059036255, 4.171186923980713, 4.711852550506592, 5.252518177032471, 5.793184280395508, 6.333849906921387, 6.874515533447266, 7.4151811599731445, 7.955846786499023, 8.496512413024902, 9.037178039550781, 9.577844619750977, 10.118510246276855, 10.659175872802734, 11.199840545654297, 11.740506172180176, 12.281171798706055, 12.821837425231934, 13.362503051757812, 13.903169631958008, 14.443835258483887, 14.984500885009766, 15.525166511535645, 16.065832138061523, 16.60649871826172, 17.14716339111328, 17.687829971313477, 18.22849464416504, 18.769161224365234, 19.309825897216797, 19.850492477416992, 20.391159057617188, 20.93182373046875, 21.472490310668945, 22.013154983520508, 22.553821563720703, 23.094486236572266, 23.63515281677246, 24.175819396972656, 24.71648597717285, 25.257150650024414, 25.79781723022461, 26.338481903076172, 26.879148483276367, 27.41981315612793, 27.960479736328125, 28.501144409179688]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 5.0, 2.0, 7.0, 6.0, 13.0, 12.0, 10.0, 20.0, 13.0, 15.0, 28.0, 22.0, 21.0, 21.0, 23.0, 33.0, 45.0, 29.0, 38.0, 51.0, 38.0, 54.0, 39.0, 44.0, 45.0, 39.0, 43.0, 38.0, 30.0, 44.0, 31.0, 26.0, 22.0, 18.0, 16.0, 14.0, 10.0, 9.0, 8.0, 5.0, 9.0, 2.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.275643348693848, -8.975184440612793, -8.674725532531738, -8.374267578125, -8.073808670043945, -7.773349761962891, -7.472890853881836, -7.172431945800781, -6.871973514556885, -6.57151460647583, -6.271056175231934, -5.970597267150879, -5.670138359069824, -5.369679927825928, -5.069221019744873, -4.768762588500977, -4.468303680419922, -4.167844772338867, -3.8673863410949707, -3.566927433013916, -3.2664687633514404, -2.966010093688965, -2.66555118560791, -2.3650925159454346, -2.064633846282959, -1.7641751766204834, -1.4637163877487183, -1.1632575988769531, -0.8627989292144775, -0.562340259552002, -0.2618814706802368, 0.03857731819152832, 0.3390350341796875, 0.6394937634468079, 0.9399524927139282, 1.2404112815856934, 1.540869951248169, 1.8413286209106445, 2.141787528991699, 2.442246198654175, 2.7427048683166504, 3.043163537979126, 3.3436222076416016, 3.6440811157226562, 3.944539785385132, 4.244998455047607, 4.545457363128662, 4.845915794372559, 5.146374702453613, 5.446833610534668, 5.7472920417785645, 6.047750949859619, 6.348209381103516, 6.64866828918457, 6.949127197265625, 7.24958610534668, 7.550044536590576, 7.850503444671631, 8.150961875915527, 8.451420783996582, 8.751879692077637, 9.052337646484375, 9.35279655456543, 9.653255462646484, 9.953714370727539]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 8.0, 5.0, 7.0, 10.0, 8.0, 8.0, 12.0, 24.0, 15.0, 21.0, 25.0, 36.0, 25.0, 30.0, 40.0, 41.0, 43.0, 54.0, 53.0, 42.0, 46.0, 49.0, 42.0, 37.0, 45.0, 39.0, 40.0, 33.0, 30.0, 23.0, 17.0, 19.0, 16.0, 15.0, 13.0, 8.0, 8.0, 6.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2470703125, -1.2054443359375, -1.163818359375, -1.1221923828125, -1.08056640625, -1.0389404296875, -0.997314453125, -0.9556884765625, -0.9140625, -0.8724365234375, -0.830810546875, -0.7891845703125, -0.74755859375, -0.7059326171875, -0.664306640625, -0.6226806640625, -0.5810546875, -0.5394287109375, -0.497802734375, -0.4561767578125, -0.41455078125, -0.3729248046875, -0.331298828125, -0.2896728515625, -0.248046875, -0.2064208984375, -0.164794921875, -0.1231689453125, -0.08154296875, -0.0399169921875, 0.001708984375, 0.0433349609375, 0.0849609375, 0.1265869140625, 0.168212890625, 0.2098388671875, 0.25146484375, 0.2930908203125, 0.334716796875, 0.3763427734375, 0.41796875, 0.4595947265625, 0.501220703125, 0.5428466796875, 0.58447265625, 0.6260986328125, 0.667724609375, 0.7093505859375, 0.7509765625, 0.7926025390625, 0.834228515625, 0.8758544921875, 0.91748046875, 0.9591064453125, 1.000732421875, 1.0423583984375, 1.083984375, 1.1256103515625, 1.167236328125, 1.2088623046875, 1.25048828125, 1.2921142578125, 1.333740234375, 1.3753662109375, 1.4169921875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 3.0, 4.0, 8.0, 10.0, 8.0, 22.0, 20.0, 34.0, 30.0, 43.0, 71.0, 109.0, 150.0, 233.0, 408.0, 688.0, 1325.0, 2517.0, 5620.0, 18802.0, 175578.0, 2851325.0, 1066991.0, 51583.0, 10498.0, 3826.0, 1777.0, 985.0, 586.0, 333.0, 214.0, 143.0, 89.0, 64.0, 41.0, 34.0, 23.0, 18.0, 9.0, 10.0, 13.0, 9.0, 7.0, 5.0, 3.0, 0.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.0625, -3.938568115234375, -3.81463623046875, -3.690704345703125, -3.5667724609375, -3.442840576171875, -3.31890869140625, -3.194976806640625, -3.071044921875, -2.947113037109375, -2.82318115234375, -2.699249267578125, -2.5753173828125, -2.451385498046875, -2.32745361328125, -2.203521728515625, -2.07958984375, -1.955657958984375, -1.83172607421875, -1.707794189453125, -1.5838623046875, -1.459930419921875, -1.33599853515625, -1.212066650390625, -1.088134765625, -0.964202880859375, -0.84027099609375, -0.716339111328125, -0.5924072265625, -0.468475341796875, -0.34454345703125, -0.220611572265625, -0.0966796875, 0.027252197265625, 0.15118408203125, 0.275115966796875, 0.3990478515625, 0.522979736328125, 0.64691162109375, 0.770843505859375, 0.894775390625, 1.018707275390625, 1.14263916015625, 1.266571044921875, 1.3905029296875, 1.514434814453125, 1.63836669921875, 1.762298583984375, 1.88623046875, 2.010162353515625, 2.13409423828125, 2.258026123046875, 2.3819580078125, 2.505889892578125, 2.62982177734375, 2.753753662109375, 2.877685546875, 3.001617431640625, 3.12554931640625, 3.249481201171875, 3.3734130859375, 3.497344970703125, 3.62127685546875, 3.745208740234375, 3.869140625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 11.0, 11.0, 18.0, 17.0, 21.0, 29.0, 51.0, 59.0, 77.0, 119.0, 154.0, 174.0, 248.0, 344.0, 436.0, 525.0, 465.0, 356.0, 248.0, 180.0, 139.0, 102.0, 71.0, 55.0, 51.0, 27.0, 20.0, 18.0, 11.0, 6.0, 6.0, 4.0, 5.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5146484375, -1.4529571533203125, -1.391265869140625, -1.3295745849609375, -1.26788330078125, -1.2061920166015625, -1.144500732421875, -1.0828094482421875, -1.0211181640625, -0.9594268798828125, -0.897735595703125, -0.8360443115234375, -0.77435302734375, -0.7126617431640625, -0.650970458984375, -0.5892791748046875, -0.527587890625, -0.4658966064453125, -0.404205322265625, -0.3425140380859375, -0.28082275390625, -0.2191314697265625, -0.157440185546875, -0.0957489013671875, -0.0340576171875, 0.0276336669921875, 0.089324951171875, 0.1510162353515625, 0.21270751953125, 0.2743988037109375, 0.336090087890625, 0.3977813720703125, 0.45947265625, 0.5211639404296875, 0.582855224609375, 0.6445465087890625, 0.70623779296875, 0.7679290771484375, 0.829620361328125, 0.8913116455078125, 0.9530029296875, 1.0146942138671875, 1.076385498046875, 1.1380767822265625, 1.19976806640625, 1.2614593505859375, 1.323150634765625, 1.3848419189453125, 1.446533203125, 1.5082244873046875, 1.569915771484375, 1.6316070556640625, 1.69329833984375, 1.7549896240234375, 1.816680908203125, 1.8783721923828125, 1.9400634765625, 2.0017547607421875, 2.063446044921875, 2.1251373291015625, 2.18682861328125, 2.2485198974609375, 2.310211181640625, 2.3719024658203125, 2.43359375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 11.0, 4.0, 12.0, 9.0, 19.0, 32.0, 39.0, 67.0, 76.0, 141.0, 243.0, 375.0, 687.0, 1338.0, 3015.0, 9260.0, 39918.0, 330744.0, 2942447.0, 769399.0, 74358.0, 14059.0, 4275.0, 1690.0, 822.0, 443.0, 258.0, 164.0, 110.0, 94.0, 37.0, 28.0, 36.0, 16.0, 15.0, 11.0, 9.0, 5.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.494140625, -3.393341064453125, -3.29254150390625, -3.191741943359375, -3.0909423828125, -2.990142822265625, -2.88934326171875, -2.788543701171875, -2.687744140625, -2.586944580078125, -2.48614501953125, -2.385345458984375, -2.2845458984375, -2.183746337890625, -2.08294677734375, -1.982147216796875, -1.88134765625, -1.780548095703125, -1.67974853515625, -1.578948974609375, -1.4781494140625, -1.377349853515625, -1.27655029296875, -1.175750732421875, -1.074951171875, -0.974151611328125, -0.87335205078125, -0.772552490234375, -0.6717529296875, -0.570953369140625, -0.47015380859375, -0.369354248046875, -0.2685546875, -0.167755126953125, -0.06695556640625, 0.033843994140625, 0.1346435546875, 0.235443115234375, 0.33624267578125, 0.437042236328125, 0.537841796875, 0.638641357421875, 0.73944091796875, 0.840240478515625, 0.9410400390625, 1.041839599609375, 1.14263916015625, 1.243438720703125, 1.34423828125, 1.445037841796875, 1.54583740234375, 1.646636962890625, 1.7474365234375, 1.848236083984375, 1.94903564453125, 2.049835205078125, 2.150634765625, 2.251434326171875, 2.35223388671875, 2.453033447265625, 2.5538330078125, 2.654632568359375, 2.75543212890625, 2.856231689453125, 2.95703125]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 68.0, 442.0, 435.0, 60.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.513240814208984, -16.822830200195312, -15.132420539855957, -13.442010879516602, -11.75160026550293, -10.061189651489258, -8.370779991149902, -6.680370330810547, -4.989959716796875, -3.2995495796203613, -1.6091394424438477, 0.08127069473266602, 1.7716808319091797, 3.4620914459228516, 5.152501106262207, 6.8429107666015625, 8.533321380615234, 10.223731994628906, 11.914141654968262, 13.604551315307617, 15.294961929321289, 16.98537254333496, 18.67578125, 20.366191864013672, 22.056602478027344, 23.747013092041016, 25.437423706054688, 27.127832412719727, 28.8182430267334, 30.50865364074707, 32.19906234741211, 33.88947296142578, 35.57988739013672, 37.27029800415039, 38.96070861816406, 40.651119232177734, 42.341529846191406, 44.03193664550781, 45.722347259521484, 47.412757873535156, 49.10316848754883, 50.7935791015625, 52.48398971557617, 54.174400329589844, 55.86480712890625, 57.55522155761719, 59.245628356933594, 60.936038970947266, 62.62644958496094, 64.31685638427734, 66.00727081298828, 67.69767761230469, 69.38809204101562, 71.07849884033203, 72.76891326904297, 74.45932006835938, 76.14973449707031, 77.84014129638672, 79.53055572509766, 81.22096252441406, 82.911376953125, 84.6017837524414, 86.29219818115234, 87.98260498046875, 89.67301177978516]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 3.0, 1.0, 10.0, 7.0, 8.0, 11.0, 17.0, 15.0, 21.0, 30.0, 32.0, 37.0, 42.0, 31.0, 42.0, 40.0, 61.0, 42.0, 54.0, 60.0, 54.0, 52.0, 54.0, 50.0, 32.0, 38.0, 30.0, 25.0, 22.0, 23.0, 17.0, 16.0, 9.0, 12.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.028031349182129, -9.739277839660645, -9.45052433013916, -9.161770820617676, -8.873017311096191, -8.584263801574707, -8.295510292053223, -8.006755828857422, -7.718002796173096, -7.429249286651611, -7.140495777130127, -6.851742267608643, -6.56298828125, -6.274234771728516, -5.985481262207031, -5.696727752685547, -5.4079742431640625, -5.119220733642578, -4.830467224121094, -4.541713714599609, -4.252960205078125, -3.9642064571380615, -3.675452709197998, -3.3866991996765137, -3.0979456901550293, -2.809192180633545, -2.5204386711120605, -2.231684923171997, -1.9429314136505127, -1.6541779041290283, -1.3654242753982544, -1.0766706466674805, -0.7879180908203125, -0.49916452169418335, -0.2104109525680542, 0.07834261655807495, 0.3670961856842041, 0.6558496952056885, 0.9446033239364624, 1.2333569526672363, 1.5221104621887207, 1.810863971710205, 2.0996174812316895, 2.388371229171753, 2.6771247386932373, 2.9658782482147217, 3.254631996154785, 3.5433855056762695, 3.832139015197754, 4.120892524719238, 4.409646034240723, 4.698399543762207, 4.987153053283691, 5.275906562805176, 5.564660549163818, 5.853414058685303, 6.142167568206787, 6.4309210777282715, 6.719674587249756, 7.00842809677124, 7.297182083129883, 7.585935592651367, 7.874689102172852, 8.163442611694336, 8.45219612121582]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 3.0, 4.0, 8.0, 7.0, 10.0, 14.0, 23.0, 14.0, 24.0, 24.0, 24.0, 26.0, 29.0, 41.0, 37.0, 46.0, 53.0, 41.0, 42.0, 59.0, 44.0, 53.0, 39.0, 41.0, 21.0, 31.0, 27.0, 30.0, 29.0, 23.0, 25.0, 17.0, 12.0, 19.0, 10.0, 7.0, 13.0, 9.0, 4.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1484375, -1.1151046752929688, -1.0817718505859375, -1.0484390258789062, -1.015106201171875, -0.9817733764648438, -0.9484405517578125, -0.9151077270507812, -0.88177490234375, -0.8484420776367188, -0.8151092529296875, -0.7817764282226562, -0.748443603515625, -0.7151107788085938, -0.6817779541015625, -0.6484451293945312, -0.6151123046875, -0.5817794799804688, -0.5484466552734375, -0.5151138305664062, -0.481781005859375, -0.44844818115234375, -0.4151153564453125, -0.38178253173828125, -0.34844970703125, -0.31511688232421875, -0.2817840576171875, -0.24845123291015625, -0.215118408203125, -0.18178558349609375, -0.1484527587890625, -0.11511993408203125, -0.081787109375, -0.04845428466796875, -0.0151214599609375, 0.01821136474609375, 0.051544189453125, 0.08487701416015625, 0.1182098388671875, 0.15154266357421875, 0.18487548828125, 0.21820831298828125, 0.2515411376953125, 0.28487396240234375, 0.318206787109375, 0.35153961181640625, 0.3848724365234375, 0.41820526123046875, 0.4515380859375, 0.48487091064453125, 0.5182037353515625, 0.5515365600585938, 0.584869384765625, 0.6182022094726562, 0.6515350341796875, 0.6848678588867188, 0.71820068359375, 0.7515335083007812, 0.7848663330078125, 0.8181991577148438, 0.851531982421875, 0.8848648071289062, 0.9181976318359375, 0.9515304565429688, 0.98486328125]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 7.0, 9.0, 22.0, 24.0, 30.0, 35.0, 53.0, 112.0, 129.0, 194.0, 335.0, 431.0, 601.0, 1075.0, 1673.0, 2598.0, 4263.0, 6971.0, 12242.0, 23453.0, 49675.0, 126397.0, 335506.0, 288119.0, 103335.0, 42821.0, 20683.0, 10930.0, 6358.0, 3827.0, 2375.0, 1427.0, 913.0, 598.0, 424.0, 255.0, 222.0, 139.0, 101.0, 68.0, 35.0, 29.0, 15.0, 12.0, 3.0, 11.0, 4.0, 7.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.202392578125, -0.1962413787841797, -0.19009017944335938, -0.18393898010253906, -0.17778778076171875, -0.17163658142089844, -0.16548538208007812, -0.1593341827392578, -0.1531829833984375, -0.1470317840576172, -0.14088058471679688, -0.13472938537597656, -0.12857818603515625, -0.12242698669433594, -0.11627578735351562, -0.11012458801269531, -0.103973388671875, -0.09782218933105469, -0.09167098999023438, -0.08551979064941406, -0.07936859130859375, -0.07321739196777344, -0.06706619262695312, -0.06091499328613281, -0.0547637939453125, -0.04861259460449219, -0.042461395263671875, -0.03631019592285156, -0.03015899658203125, -0.024007797241210938, -0.017856597900390625, -0.011705398559570312, -0.00555419921875, 0.0005970001220703125, 0.006748199462890625, 0.012899398803710938, 0.01905059814453125, 0.025201797485351562, 0.031352996826171875, 0.03750419616699219, 0.0436553955078125, 0.04980659484863281, 0.055957794189453125, 0.06210899353027344, 0.06826019287109375, 0.07441139221191406, 0.08056259155273438, 0.08671379089355469, 0.092864990234375, 0.09901618957519531, 0.10516738891601562, 0.11131858825683594, 0.11746978759765625, 0.12362098693847656, 0.12977218627929688, 0.1359233856201172, 0.1420745849609375, 0.1482257843017578, 0.15437698364257812, 0.16052818298339844, 0.16667938232421875, 0.17283058166503906, 0.17898178100585938, 0.1851329803466797, 0.1912841796875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 3.0, 6.0, 8.0, 8.0, 9.0, 11.0, 10.0, 22.0, 18.0, 25.0, 27.0, 32.0, 23.0, 28.0, 31.0, 30.0, 34.0, 45.0, 46.0, 39.0, 41.0, 1059.0, 45.0, 35.0, 39.0, 29.0, 33.0, 26.0, 29.0, 26.0, 24.0, 24.0, 24.0, 18.0, 12.0, 23.0, 15.0, 12.0, 10.0, 3.0, 11.0, 14.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.72119140625, -0.7006988525390625, -0.680206298828125, -0.6597137451171875, -0.63922119140625, -0.6187286376953125, -0.598236083984375, -0.5777435302734375, -0.5572509765625, -0.5367584228515625, -0.516265869140625, -0.4957733154296875, -0.47528076171875, -0.4547882080078125, -0.434295654296875, -0.4138031005859375, -0.393310546875, -0.3728179931640625, -0.352325439453125, -0.3318328857421875, -0.31134033203125, -0.2908477783203125, -0.270355224609375, -0.2498626708984375, -0.2293701171875, -0.2088775634765625, -0.188385009765625, -0.1678924560546875, -0.14739990234375, -0.1269073486328125, -0.106414794921875, -0.0859222412109375, -0.0654296875, -0.0449371337890625, -0.024444580078125, -0.0039520263671875, 0.01654052734375, 0.0370330810546875, 0.057525634765625, 0.0780181884765625, 0.0985107421875, 0.1190032958984375, 0.139495849609375, 0.1599884033203125, 0.18048095703125, 0.2009735107421875, 0.221466064453125, 0.2419586181640625, 0.262451171875, 0.2829437255859375, 0.303436279296875, 0.3239288330078125, 0.34442138671875, 0.3649139404296875, 0.385406494140625, 0.4058990478515625, 0.4263916015625, 0.4468841552734375, 0.467376708984375, 0.4878692626953125, 0.50836181640625, 0.5288543701171875, 0.549346923828125, 0.5698394775390625, 0.59033203125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 2.0, 8.0, 6.0, 20.0, 17.0, 34.0, 41.0, 58.0, 84.0, 88.0, 154.0, 197.0, 303.0, 420.0, 651.0, 956.0, 1481.0, 2398.0, 4205.0, 8413.0, 20141.0, 61517.0, 265380.0, 1451595.0, 195075.0, 49623.0, 16869.0, 7240.0, 3912.0, 2072.0, 1364.0, 881.0, 585.0, 407.0, 293.0, 196.0, 123.0, 102.0, 64.0, 49.0, 27.0, 30.0, 19.0, 14.0, 7.0, 6.0, 3.0, 0.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16259765625, -0.15644073486328125, -0.1502838134765625, -0.14412689208984375, -0.137969970703125, -0.13181304931640625, -0.1256561279296875, -0.11949920654296875, -0.11334228515625, -0.10718536376953125, -0.1010284423828125, -0.09487152099609375, -0.088714599609375, -0.08255767822265625, -0.0764007568359375, -0.07024383544921875, -0.0640869140625, -0.05792999267578125, -0.0517730712890625, -0.04561614990234375, -0.039459228515625, -0.03330230712890625, -0.0271453857421875, -0.02098846435546875, -0.01483154296875, -0.00867462158203125, -0.0025177001953125, 0.00363922119140625, 0.009796142578125, 0.01595306396484375, 0.0221099853515625, 0.02826690673828125, 0.034423828125, 0.04058074951171875, 0.0467376708984375, 0.05289459228515625, 0.059051513671875, 0.06520843505859375, 0.0713653564453125, 0.07752227783203125, 0.08367919921875, 0.08983612060546875, 0.0959930419921875, 0.10214996337890625, 0.108306884765625, 0.11446380615234375, 0.1206207275390625, 0.12677764892578125, 0.1329345703125, 0.13909149169921875, 0.1452484130859375, 0.15140533447265625, 0.157562255859375, 0.16371917724609375, 0.1698760986328125, 0.17603302001953125, 0.18218994140625, 0.18834686279296875, 0.1945037841796875, 0.20066070556640625, 0.206817626953125, 0.21297454833984375, 0.2191314697265625, 0.22528839111328125, 0.2314453125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 6.0, 1.0, 4.0, 5.0, 4.0, 5.0, 9.0, 5.0, 9.0, 9.0, 14.0, 26.0, 31.0, 41.0, 51.0, 128.0, 211.0, 158.0, 91.0, 48.0, 31.0, 21.0, 17.0, 9.0, 8.0, 4.0, 5.0, 6.0, 5.0, 4.0, 3.0, 3.0, 6.0, 0.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.0214691162109375, -0.020790815353393555, -0.02011251449584961, -0.019434213638305664, -0.01875591278076172, -0.018077611923217773, -0.017399311065673828, -0.016721010208129883, -0.016042709350585938, -0.015364408493041992, -0.014686107635498047, -0.014007806777954102, -0.013329505920410156, -0.012651205062866211, -0.011972904205322266, -0.01129460334777832, -0.010616302490234375, -0.00993800163269043, -0.009259700775146484, -0.008581399917602539, -0.007903099060058594, -0.0072247982025146484, -0.006546497344970703, -0.005868196487426758, -0.0051898956298828125, -0.004511594772338867, -0.003833293914794922, -0.0031549930572509766, -0.0024766921997070312, -0.001798391342163086, -0.0011200904846191406, -0.0004417896270751953, 0.00023651123046875, 0.0009148120880126953, 0.0015931129455566406, 0.002271413803100586, 0.0029497146606445312, 0.0036280155181884766, 0.004306316375732422, 0.004984617233276367, 0.0056629180908203125, 0.006341218948364258, 0.007019519805908203, 0.0076978206634521484, 0.008376121520996094, 0.009054422378540039, 0.009732723236083984, 0.01041102409362793, 0.011089324951171875, 0.01176762580871582, 0.012445926666259766, 0.013124227523803711, 0.013802528381347656, 0.014480829238891602, 0.015159130096435547, 0.015837430953979492, 0.016515731811523438, 0.017194032669067383, 0.017872333526611328, 0.018550634384155273, 0.01922893524169922, 0.019907236099243164, 0.02058553695678711, 0.021263837814331055, 0.021942138671875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 6.0, 1.0, 2.0, 8.0, 3.0, 3.0, 10.0, 10.0, 7.0, 7.0, 10.0, 7.0, 8.0, 2.0, 12.0, 13.0, 16.0, 20.0, 35.0, 43.0, 76.0, 89.0, 113.0, 207.0, 535.0, 6237.0, 961739.0, 76131.0, 2198.0, 382.0, 174.0, 114.0, 92.0, 51.0, 37.0, 26.0, 24.0, 19.0, 10.0, 9.0, 5.0, 8.0, 6.0, 8.0, 6.0, 10.0, 6.0, 6.0, 9.0, 3.0, 3.0, 2.0, 6.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.34375, -0.3322296142578125, -0.320709228515625, -0.3091888427734375, -0.29766845703125, -0.2861480712890625, -0.274627685546875, -0.2631072998046875, -0.2515869140625, -0.2400665283203125, -0.228546142578125, -0.2170257568359375, -0.20550537109375, -0.1939849853515625, -0.182464599609375, -0.1709442138671875, -0.159423828125, -0.1479034423828125, -0.136383056640625, -0.1248626708984375, -0.11334228515625, -0.1018218994140625, -0.090301513671875, -0.0787811279296875, -0.0672607421875, -0.0557403564453125, -0.044219970703125, -0.0326995849609375, -0.02117919921875, -0.0096588134765625, 0.001861572265625, 0.0133819580078125, 0.02490234375, 0.0364227294921875, 0.047943115234375, 0.0594635009765625, 0.07098388671875, 0.0825042724609375, 0.094024658203125, 0.1055450439453125, 0.1170654296875, 0.1285858154296875, 0.140106201171875, 0.1516265869140625, 0.16314697265625, 0.1746673583984375, 0.186187744140625, 0.1977081298828125, 0.209228515625, 0.2207489013671875, 0.232269287109375, 0.2437896728515625, 0.25531005859375, 0.2668304443359375, 0.278350830078125, 0.2898712158203125, 0.3013916015625, 0.3129119873046875, 0.324432373046875, 0.3359527587890625, 0.34747314453125, 0.3589935302734375, 0.370513916015625, 0.3820343017578125, 0.3935546875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 17.0, 81.0, 410.0, 383.0, 95.0, 18.0, 9.0], "bins": [-0.24258236587047577, -0.23853299021720886, -0.23448359966278076, -0.23043422400951385, -0.22638484835624695, -0.22233547270298004, -0.21828608214855194, -0.21423670649528503, -0.21018733084201813, -0.20613795518875122, -0.20208856463432312, -0.1980391889810562, -0.1939898133277893, -0.1899404376745224, -0.1858910471200943, -0.1818416714668274, -0.1777922809123993, -0.17374290525913239, -0.16969351470470428, -0.16564413905143738, -0.16159476339817047, -0.15754538774490356, -0.15349599719047546, -0.14944662153720856, -0.14539724588394165, -0.14134787023067474, -0.13729847967624664, -0.13324910402297974, -0.12919972836971283, -0.12515035271644592, -0.12110096216201782, -0.11705158650875092, -0.1130022183060646, -0.1089528352022171, -0.1049034595489502, -0.10085407644510269, -0.09680470079183578, -0.09275531768798828, -0.08870594203472137, -0.08465655893087387, -0.08060717582702637, -0.07655779272317886, -0.07250841706991196, -0.06845903396606445, -0.06440965831279755, -0.06036027520895004, -0.05631089583039284, -0.05226151645183563, -0.048212140798568726, -0.04416276142001152, -0.040113382041454315, -0.03606399893760681, -0.032014623284339905, -0.02796524204313755, -0.023915860801935196, -0.01986648142337799, -0.015817102044820786, -0.01176772266626358, -0.0077183423563838005, -0.0036689620465040207, 0.0003804173320531845, 0.00442979671061039, 0.008479177951812744, 0.01252855733036995, 0.016577936708927155]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 12.0, 8.0, 7.0, 16.0, 7.0, 13.0, 19.0, 24.0, 25.0, 24.0, 43.0, 35.0, 44.0, 37.0, 34.0, 41.0, 49.0, 46.0, 43.0, 57.0, 52.0, 42.0, 39.0, 39.0, 28.0, 29.0, 34.0, 24.0, 25.0, 23.0, 13.0, 17.0, 10.0, 11.0, 11.0, 7.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.03174370527267456, -0.030864480882883072, -0.029985256493091583, -0.029106032103300095, -0.028226807713508606, -0.027347583323717117, -0.02646835893392563, -0.02558913454413414, -0.02470991015434265, -0.023830685764551163, -0.022951461374759674, -0.022072236984968185, -0.021193012595176697, -0.020313788205385208, -0.01943456381559372, -0.01855533942580223, -0.017676115036010742, -0.016796890646219254, -0.015917666256427765, -0.015038441866636276, -0.014159217476844788, -0.013279993087053299, -0.01240076869726181, -0.011521544307470322, -0.010642319917678833, -0.009763095527887344, -0.008883871138095856, -0.008004646748304367, -0.007125422358512878, -0.00624619796872139, -0.005366973578929901, -0.0044877491891384125, -0.003608524799346924, -0.002729300409555435, -0.0018500760197639465, -0.0009708516299724579, -9.162724018096924e-05, 0.0007875971496105194, 0.001666821539402008, 0.0025460459291934967, 0.0034252703189849854, 0.004304494708776474, 0.005183719098567963, 0.006062943488359451, 0.00694216787815094, 0.007821392267942429, 0.008700616657733917, 0.009579841047525406, 0.010459065437316895, 0.011338289827108383, 0.012217514216899872, 0.01309673860669136, 0.013975962996482849, 0.014855187386274338, 0.015734411776065826, 0.016613636165857315, 0.017492860555648804, 0.018372084945440292, 0.01925130933523178, 0.02013053372502327, 0.02100975811481476, 0.021888982504606247, 0.022768206894397736, 0.023647431284189224, 0.024526655673980713]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 3.0, 4.0, 8.0, 7.0, 10.0, 15.0, 21.0, 15.0, 24.0, 25.0, 23.0, 24.0, 28.0, 43.0, 38.0, 47.0, 50.0, 42.0, 42.0, 60.0, 42.0, 53.0, 41.0, 41.0, 21.0, 30.0, 27.0, 29.0, 30.0, 22.0, 26.0, 18.0, 12.0, 19.0, 9.0, 8.0, 12.0, 10.0, 4.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.146484375, -1.11322021484375, -1.0799560546875, -1.04669189453125, -1.013427734375, -0.98016357421875, -0.9468994140625, -0.91363525390625, -0.88037109375, -0.84710693359375, -0.8138427734375, -0.78057861328125, -0.747314453125, -0.71405029296875, -0.6807861328125, -0.64752197265625, -0.6142578125, -0.58099365234375, -0.5477294921875, -0.51446533203125, -0.481201171875, -0.44793701171875, -0.4146728515625, -0.38140869140625, -0.34814453125, -0.31488037109375, -0.2816162109375, -0.24835205078125, -0.215087890625, -0.18182373046875, -0.1485595703125, -0.11529541015625, -0.08203125, -0.04876708984375, -0.0155029296875, 0.01776123046875, 0.051025390625, 0.08428955078125, 0.1175537109375, 0.15081787109375, 0.18408203125, 0.21734619140625, 0.2506103515625, 0.28387451171875, 0.317138671875, 0.35040283203125, 0.3836669921875, 0.41693115234375, 0.4501953125, 0.48345947265625, 0.5167236328125, 0.54998779296875, 0.583251953125, 0.61651611328125, 0.6497802734375, 0.68304443359375, 0.71630859375, 0.74957275390625, 0.7828369140625, 0.81610107421875, 0.849365234375, 0.88262939453125, 0.9158935546875, 0.94915771484375, 0.982421875]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 8.0, 10.0, 9.0, 8.0, 19.0, 22.0, 24.0, 32.0, 49.0, 64.0, 88.0, 120.0, 154.0, 188.0, 290.0, 391.0, 613.0, 926.0, 1568.0, 2652.0, 5229.0, 11140.0, 27791.0, 81656.0, 277349.0, 421909.0, 139622.0, 43941.0, 16480.0, 7126.0, 3471.0, 1991.0, 1163.0, 722.0, 470.0, 309.0, 256.0, 179.0, 140.0, 76.0, 68.0, 61.0, 43.0, 39.0, 20.0, 22.0, 7.0, 12.0, 9.0, 9.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0], "bins": [-1.2744140625, -1.236053466796875, -1.19769287109375, -1.159332275390625, -1.1209716796875, -1.082611083984375, -1.04425048828125, -1.005889892578125, -0.967529296875, -0.929168701171875, -0.89080810546875, -0.852447509765625, -0.8140869140625, -0.775726318359375, -0.73736572265625, -0.699005126953125, -0.66064453125, -0.622283935546875, -0.58392333984375, -0.545562744140625, -0.5072021484375, -0.468841552734375, -0.43048095703125, -0.392120361328125, -0.353759765625, -0.315399169921875, -0.27703857421875, -0.238677978515625, -0.2003173828125, -0.161956787109375, -0.12359619140625, -0.085235595703125, -0.046875, -0.008514404296875, 0.02984619140625, 0.068206787109375, 0.1065673828125, 0.144927978515625, 0.18328857421875, 0.221649169921875, 0.260009765625, 0.298370361328125, 0.33673095703125, 0.375091552734375, 0.4134521484375, 0.451812744140625, 0.49017333984375, 0.528533935546875, 0.56689453125, 0.605255126953125, 0.64361572265625, 0.681976318359375, 0.7203369140625, 0.758697509765625, 0.79705810546875, 0.835418701171875, 0.873779296875, 0.912139892578125, 0.95050048828125, 0.988861083984375, 1.0272216796875, 1.065582275390625, 1.10394287109375, 1.142303466796875, 1.1806640625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 1.0, 4.0, 5.0, 13.0, 9.0, 11.0, 20.0, 11.0, 13.0, 22.0, 29.0, 39.0, 34.0, 43.0, 39.0, 81.0, 113.0, 192.0, 1364.0, 334.0, 195.0, 84.0, 57.0, 54.0, 44.0, 32.0, 29.0, 38.0, 18.0, 23.0, 13.0, 15.0, 16.0, 10.0, 7.0, 8.0, 4.0, 6.0, 8.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-3.220703125, -3.133392333984375, -3.04608154296875, -2.958770751953125, -2.8714599609375, -2.784149169921875, -2.69683837890625, -2.609527587890625, -2.522216796875, -2.434906005859375, -2.34759521484375, -2.260284423828125, -2.1729736328125, -2.085662841796875, -1.99835205078125, -1.911041259765625, -1.82373046875, -1.736419677734375, -1.64910888671875, -1.561798095703125, -1.4744873046875, -1.387176513671875, -1.29986572265625, -1.212554931640625, -1.125244140625, -1.037933349609375, -0.95062255859375, -0.863311767578125, -0.7760009765625, -0.688690185546875, -0.60137939453125, -0.514068603515625, -0.4267578125, -0.339447021484375, -0.25213623046875, -0.164825439453125, -0.0775146484375, 0.009796142578125, 0.09710693359375, 0.184417724609375, 0.271728515625, 0.359039306640625, 0.44635009765625, 0.533660888671875, 0.6209716796875, 0.708282470703125, 0.79559326171875, 0.882904052734375, 0.97021484375, 1.057525634765625, 1.14483642578125, 1.232147216796875, 1.3194580078125, 1.406768798828125, 1.49407958984375, 1.581390380859375, 1.668701171875, 1.756011962890625, 1.84332275390625, 1.930633544921875, 2.0179443359375, 2.105255126953125, 2.19256591796875, 2.279876708984375, 2.3671875]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 3.0, 4.0, 7.0, 6.0, 5.0, 8.0, 8.0, 9.0, 18.0, 23.0, 23.0, 32.0, 37.0, 65.0, 89.0, 101.0, 150.0, 201.0, 386.0, 894.0, 2804.0, 23753.0, 2944760.0, 164095.0, 5631.0, 1314.0, 493.0, 230.0, 142.0, 91.0, 72.0, 70.0, 32.0, 36.0, 32.0, 19.0, 12.0, 11.0, 11.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.7734375, -4.61798095703125, -4.4625244140625, -4.30706787109375, -4.151611328125, -3.99615478515625, -3.8406982421875, -3.68524169921875, -3.52978515625, -3.37432861328125, -3.2188720703125, -3.06341552734375, -2.907958984375, -2.75250244140625, -2.5970458984375, -2.44158935546875, -2.2861328125, -2.13067626953125, -1.9752197265625, -1.81976318359375, -1.664306640625, -1.50885009765625, -1.3533935546875, -1.19793701171875, -1.04248046875, -0.88702392578125, -0.7315673828125, -0.57611083984375, -0.420654296875, -0.26519775390625, -0.1097412109375, 0.04571533203125, 0.201171875, 0.35662841796875, 0.5120849609375, 0.66754150390625, 0.822998046875, 0.97845458984375, 1.1339111328125, 1.28936767578125, 1.44482421875, 1.60028076171875, 1.7557373046875, 1.91119384765625, 2.066650390625, 2.22210693359375, 2.3775634765625, 2.53302001953125, 2.6884765625, 2.84393310546875, 2.9993896484375, 3.15484619140625, 3.310302734375, 3.46575927734375, 3.6212158203125, 3.77667236328125, 3.93212890625, 4.08758544921875, 4.2430419921875, 4.39849853515625, 4.553955078125, 4.70941162109375, 4.8648681640625, 5.02032470703125, 5.17578125]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 2.0, 34.0, 523.0, 432.0, 21.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.516396522521973, -8.985089302062988, -7.453781604766846, -5.922473907470703, -4.391166687011719, -2.8598594665527344, -1.3285512924194336, 0.20275592803955078, 1.7340631484985352, 3.2653706073760986, 4.796678066253662, 6.327985763549805, 7.859292984008789, 9.390600204467773, 10.921908378601074, 12.453215599060059, 13.984522819519043, 15.515830039978027, 17.047138214111328, 18.578445434570312, 20.109752655029297, 21.64105987548828, 23.172367095947266, 24.70367431640625, 26.234981536865234, 27.76628875732422, 29.297595977783203, 30.828903198242188, 32.36021041870117, 33.891517639160156, 35.422828674316406, 36.954132080078125, 38.485443115234375, 40.01675033569336, 41.548057556152344, 43.07936477661133, 44.61067199707031, 46.1419792175293, 47.67328643798828, 49.20459747314453, 50.73590087890625, 52.267208099365234, 53.79851531982422, 55.3298225402832, 56.86112976074219, 58.39243698120117, 59.923744201660156, 61.455055236816406, 62.98636245727539, 64.51766967773438, 66.04898071289062, 67.58028411865234, 69.1115951538086, 70.64289855957031, 72.17420959472656, 73.70551300048828, 75.23682403564453, 76.76813507080078, 78.2994384765625, 79.83074951171875, 81.36205291748047, 82.89336395263672, 84.42466735839844, 85.95597839355469, 87.4872817993164]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 8.0, 10.0, 10.0, 6.0, 13.0, 16.0, 18.0, 22.0, 22.0, 29.0, 26.0, 32.0, 35.0, 34.0, 47.0, 38.0, 48.0, 46.0, 31.0, 49.0, 41.0, 46.0, 51.0, 42.0, 33.0, 45.0, 34.0, 31.0, 17.0, 21.0, 18.0, 20.0, 9.0, 15.0, 8.0, 11.0, 6.0, 5.0, 6.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.179915428161621, -4.969279766082764, -4.758644104003906, -4.548008441925049, -4.337372779846191, -4.126737117767334, -3.9161014556884766, -3.705465793609619, -3.4948301315307617, -3.2841944694519043, -3.073558807373047, -2.8629231452941895, -2.652287483215332, -2.4416518211364746, -2.231016159057617, -2.0203804969787598, -1.8097450733184814, -1.599109411239624, -1.3884737491607666, -1.1778380870819092, -0.9672024846076965, -0.7565668821334839, -0.5459312200546265, -0.33529555797576904, -0.12465989589691162, 0.0859757512807846, 0.29661139845848083, 0.5072470307350159, 0.7178826928138733, 0.9285182952880859, 1.1391539573669434, 1.3497896194458008, 1.5604252815246582, 1.7710609436035156, 1.981696605682373, 2.1923322677612305, 2.402967929840088, 2.6136035919189453, 2.8242392539978027, 3.03487491607666, 3.2455105781555176, 3.456146240234375, 3.6667819023132324, 3.87741756439209, 4.088053226470947, 4.298688888549805, 4.509324550628662, 4.7199602127075195, 4.930595397949219, 5.141231060028076, 5.351866722106934, 5.562502384185791, 5.773138046264648, 5.983773708343506, 6.194409370422363, 6.405045032501221, 6.615680694580078, 6.8263163566589355, 7.036952018737793, 7.24758768081665, 7.458223342895508, 7.668859004974365, 7.879494667053223, 8.090129852294922, 8.300765991210938]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 10.0, 8.0, 8.0, 9.0, 16.0, 15.0, 18.0, 18.0, 16.0, 27.0, 23.0, 32.0, 31.0, 27.0, 32.0, 35.0, 38.0, 49.0, 57.0, 38.0, 38.0, 40.0, 34.0, 43.0, 34.0, 30.0, 32.0, 29.0, 30.0, 25.0, 26.0, 17.0, 18.0, 15.0, 13.0, 13.0, 10.0, 9.0, 4.0, 8.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0], "bins": [-1.146484375, -1.1115875244140625, -1.076690673828125, -1.0417938232421875, -1.00689697265625, -0.9720001220703125, -0.937103271484375, -0.9022064208984375, -0.8673095703125, -0.8324127197265625, -0.797515869140625, -0.7626190185546875, -0.72772216796875, -0.6928253173828125, -0.657928466796875, -0.6230316162109375, -0.588134765625, -0.5532379150390625, -0.518341064453125, -0.4834442138671875, -0.44854736328125, -0.4136505126953125, -0.378753662109375, -0.3438568115234375, -0.3089599609375, -0.2740631103515625, -0.239166259765625, -0.2042694091796875, -0.16937255859375, -0.1344757080078125, -0.099578857421875, -0.0646820068359375, -0.02978515625, 0.0051116943359375, 0.040008544921875, 0.0749053955078125, 0.10980224609375, 0.1446990966796875, 0.179595947265625, 0.2144927978515625, 0.2493896484375, 0.2842864990234375, 0.319183349609375, 0.3540802001953125, 0.38897705078125, 0.4238739013671875, 0.458770751953125, 0.4936676025390625, 0.528564453125, 0.5634613037109375, 0.598358154296875, 0.6332550048828125, 0.66815185546875, 0.7030487060546875, 0.737945556640625, 0.7728424072265625, 0.8077392578125, 0.8426361083984375, 0.877532958984375, 0.9124298095703125, 0.94732666015625, 0.9822235107421875, 1.017120361328125, 1.0520172119140625, 1.0869140625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 1.0, 7.0, 12.0, 6.0, 15.0, 16.0, 23.0, 19.0, 46.0, 56.0, 79.0, 114.0, 166.0, 257.0, 450.0, 784.0, 1556.0, 3188.0, 8128.0, 28528.0, 193338.0, 2527140.0, 1312832.0, 87913.0, 17907.0, 5923.0, 2554.0, 1308.0, 731.0, 425.0, 254.0, 151.0, 103.0, 67.0, 41.0, 32.0, 31.0, 15.0, 16.0, 18.0, 7.0, 6.0, 4.0, 6.0, 3.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-4.99609375, -4.84393310546875, -4.6917724609375, -4.53961181640625, -4.387451171875, -4.23529052734375, -4.0831298828125, -3.93096923828125, -3.77880859375, -3.62664794921875, -3.4744873046875, -3.32232666015625, -3.170166015625, -3.01800537109375, -2.8658447265625, -2.71368408203125, -2.5615234375, -2.40936279296875, -2.2572021484375, -2.10504150390625, -1.952880859375, -1.80072021484375, -1.6485595703125, -1.49639892578125, -1.34423828125, -1.19207763671875, -1.0399169921875, -0.88775634765625, -0.735595703125, -0.58343505859375, -0.4312744140625, -0.27911376953125, -0.126953125, 0.02520751953125, 0.1773681640625, 0.32952880859375, 0.481689453125, 0.63385009765625, 0.7860107421875, 0.93817138671875, 1.09033203125, 1.24249267578125, 1.3946533203125, 1.54681396484375, 1.698974609375, 1.85113525390625, 2.0032958984375, 2.15545654296875, 2.3076171875, 2.45977783203125, 2.6119384765625, 2.76409912109375, 2.916259765625, 3.06842041015625, 3.2205810546875, 3.37274169921875, 3.52490234375, 3.67706298828125, 3.8292236328125, 3.98138427734375, 4.133544921875, 4.28570556640625, 4.4378662109375, 4.59002685546875, 4.7421875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 4.0, 3.0, 6.0, 10.0, 13.0, 18.0, 25.0, 37.0, 42.0, 65.0, 100.0, 119.0, 201.0, 256.0, 325.0, 431.0, 542.0, 519.0, 385.0, 281.0, 201.0, 157.0, 111.0, 69.0, 46.0, 29.0, 22.0, 20.0, 12.0, 10.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.578125, -2.488250732421875, -2.39837646484375, -2.308502197265625, -2.2186279296875, -2.128753662109375, -2.03887939453125, -1.949005126953125, -1.859130859375, -1.769256591796875, -1.67938232421875, -1.589508056640625, -1.4996337890625, -1.409759521484375, -1.31988525390625, -1.230010986328125, -1.14013671875, -1.050262451171875, -0.96038818359375, -0.870513916015625, -0.7806396484375, -0.690765380859375, -0.60089111328125, -0.511016845703125, -0.421142578125, -0.331268310546875, -0.24139404296875, -0.151519775390625, -0.0616455078125, 0.028228759765625, 0.11810302734375, 0.207977294921875, 0.2978515625, 0.387725830078125, 0.47760009765625, 0.567474365234375, 0.6573486328125, 0.747222900390625, 0.83709716796875, 0.926971435546875, 1.016845703125, 1.106719970703125, 1.19659423828125, 1.286468505859375, 1.3763427734375, 1.466217041015625, 1.55609130859375, 1.645965576171875, 1.73583984375, 1.825714111328125, 1.91558837890625, 2.005462646484375, 2.0953369140625, 2.185211181640625, 2.27508544921875, 2.364959716796875, 2.454833984375, 2.544708251953125, 2.63458251953125, 2.724456787109375, 2.8143310546875, 2.904205322265625, 2.99407958984375, 3.083953857421875, 3.173828125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 7.0, 5.0, 11.0, 15.0, 20.0, 28.0, 34.0, 52.0, 102.0, 157.0, 250.0, 441.0, 776.0, 1480.0, 2880.0, 5889.0, 13611.0, 35614.0, 109751.0, 424600.0, 1753013.0, 1394143.0, 315727.0, 85031.0, 28999.0, 11100.0, 5094.0, 2537.0, 1192.0, 720.0, 370.0, 241.0, 135.0, 79.0, 59.0, 24.0, 27.0, 24.0, 12.0, 11.0, 6.0, 2.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.21875, -2.15130615234375, -2.0838623046875, -2.01641845703125, -1.948974609375, -1.88153076171875, -1.8140869140625, -1.74664306640625, -1.67919921875, -1.61175537109375, -1.5443115234375, -1.47686767578125, -1.409423828125, -1.34197998046875, -1.2745361328125, -1.20709228515625, -1.1396484375, -1.07220458984375, -1.0047607421875, -0.93731689453125, -0.869873046875, -0.80242919921875, -0.7349853515625, -0.66754150390625, -0.60009765625, -0.53265380859375, -0.4652099609375, -0.39776611328125, -0.330322265625, -0.26287841796875, -0.1954345703125, -0.12799072265625, -0.060546875, 0.00689697265625, 0.0743408203125, 0.14178466796875, 0.209228515625, 0.27667236328125, 0.3441162109375, 0.41156005859375, 0.47900390625, 0.54644775390625, 0.6138916015625, 0.68133544921875, 0.748779296875, 0.81622314453125, 0.8836669921875, 0.95111083984375, 1.0185546875, 1.08599853515625, 1.1534423828125, 1.22088623046875, 1.288330078125, 1.35577392578125, 1.4232177734375, 1.49066162109375, 1.55810546875, 1.62554931640625, 1.6929931640625, 1.76043701171875, 1.827880859375, 1.89532470703125, 1.9627685546875, 2.03021240234375, 2.09765625]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 7.0, 7.0, 9.0, 13.0, 13.0, 23.0, 31.0, 30.0, 21.0, 38.0, 48.0, 55.0, 75.0, 68.0, 60.0, 81.0, 61.0, 67.0, 49.0, 58.0, 34.0, 28.0, 33.0, 26.0, 10.0, 11.0, 11.0, 6.0, 5.0, 6.0, 1.0, 8.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-18.206491470336914, -17.735309600830078, -17.26412582397461, -16.792943954467773, -16.321760177612305, -15.850578308105469, -15.379395484924316, -14.908212661743164, -14.437030792236328, -13.965847969055176, -13.494665145874023, -13.023483276367188, -12.552300453186035, -12.081117630004883, -11.60993480682373, -11.138751983642578, -10.667569160461426, -10.196386337280273, -9.725203514099121, -9.254020690917969, -8.782838821411133, -8.31165599822998, -7.840473175048828, -7.369290351867676, -6.898108005523682, -6.426925182342529, -5.955742835998535, -5.484560012817383, -5.0133771896362305, -4.542194843292236, -4.071012020111084, -3.5998294353485107, -3.1286468505859375, -2.6574642658233643, -2.186281681060791, -1.7150988578796387, -1.2439162731170654, -0.7727336883544922, -0.30155086517333984, 0.1696317195892334, 0.6408143043518066, 1.1119968891143799, 1.5831795930862427, 2.0543622970581055, 2.5255448818206787, 2.996727466583252, 3.4679102897644043, 3.9390928745269775, 4.410275459289551, 4.881458282470703, 5.352640628814697, 5.82382345199585, 6.295005798339844, 6.766188621520996, 7.237371444702148, 7.708554267883301, 8.179737091064453, 8.650919914245605, 9.122102737426758, 9.593284606933594, 10.064467430114746, 10.535650253295898, 11.00683307647705, 11.478015899658203, 11.949197769165039]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 5.0, 7.0, 4.0, 9.0, 11.0, 10.0, 17.0, 11.0, 15.0, 22.0, 18.0, 24.0, 25.0, 26.0, 23.0, 38.0, 43.0, 42.0, 41.0, 39.0, 42.0, 31.0, 45.0, 38.0, 55.0, 35.0, 46.0, 39.0, 38.0, 27.0, 25.0, 24.0, 23.0, 18.0, 13.0, 12.0, 12.0, 12.0, 16.0, 10.0, 7.0, 3.0, 5.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.612322807312012, -10.259001731872559, -9.905680656433105, -9.552360534667969, -9.199039459228516, -8.845718383789062, -8.49239730834961, -8.139076232910156, -7.785755157470703, -7.43243408203125, -7.079113483428955, -6.725792407989502, -6.372471332550049, -6.019150733947754, -5.665829658508301, -5.312508583068848, -4.959187984466553, -4.6058669090271, -4.252546310424805, -3.8992252349853516, -3.5459041595458984, -3.1925833225250244, -2.8392624855041504, -2.4859414100646973, -2.1326205730438232, -1.7792996168136597, -1.425978660583496, -1.072657823562622, -0.7193368673324585, -0.3660159111022949, -0.012695074081420898, 0.3406260013580322, 0.6939468383789062, 1.0472677946090698, 1.4005887508392334, 1.7539095878601074, 2.1072306632995605, 2.4605515003204346, 2.8138723373413086, 3.1671934127807617, 3.5205142498016357, 3.8738350868225098, 4.227156162261963, 4.580476760864258, 4.933797836303711, 5.287118911743164, 5.640439987182617, 5.99376106262207, 6.347081661224365, 6.700402736663818, 7.053723335266113, 7.407044410705566, 7.7603654861450195, 8.113686561584473, 8.46700668334961, 8.820327758789062, 9.173648834228516, 9.526969909667969, 9.880290985107422, 10.233612060546875, 10.586932182312012, 10.940253257751465, 11.293574333190918, 11.646895408630371, 12.000216484069824]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 4.0, 9.0, 8.0, 9.0, 20.0, 15.0, 13.0, 22.0, 14.0, 20.0, 14.0, 44.0, 28.0, 31.0, 32.0, 53.0, 52.0, 42.0, 37.0, 39.0, 45.0, 47.0, 45.0, 39.0, 42.0, 39.0, 33.0, 25.0, 33.0, 24.0, 16.0, 15.0, 11.0, 16.0, 12.0, 12.0, 10.0, 4.0, 6.0, 4.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.234375, -19.549072265625, -18.86376953125, -18.178466796875, -17.4931640625, -16.807861328125, -16.12255859375, -15.437255859375, -14.751953125, -14.066650390625, -13.38134765625, -12.696044921875, -12.0107421875, -11.325439453125, -10.64013671875, -9.954833984375, -9.26953125, -8.584228515625, -7.89892578125, -7.213623046875, -6.5283203125, -5.843017578125, -5.15771484375, -4.472412109375, -3.787109375, -3.101806640625, -2.41650390625, -1.731201171875, -1.0458984375, -0.360595703125, 0.32470703125, 1.010009765625, 1.6953125, 2.380615234375, 3.06591796875, 3.751220703125, 4.4365234375, 5.121826171875, 5.80712890625, 6.492431640625, 7.177734375, 7.863037109375, 8.54833984375, 9.233642578125, 9.9189453125, 10.604248046875, 11.28955078125, 11.974853515625, 12.66015625, 13.345458984375, 14.03076171875, 14.716064453125, 15.4013671875, 16.086669921875, 16.77197265625, 17.457275390625, 18.142578125, 18.827880859375, 19.51318359375, 20.198486328125, 20.8837890625, 21.569091796875, 22.25439453125, 22.939697265625, 23.625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 9.0, 5.0, 12.0, 27.0, 53.0, 67.0, 103.0, 128.0, 200.0, 282.0, 398.0, 617.0, 813.0, 1236.0, 1927.0, 2918.0, 4492.0, 6786.0, 10815.0, 16967.0, 27432.0, 44778.0, 75612.0, 129236.0, 206409.0, 202641.0, 125162.0, 73406.0, 43279.0, 26304.0, 16432.0, 10301.0, 6758.0, 4447.0, 2797.0, 1903.0, 1272.0, 851.0, 583.0, 362.0, 246.0, 147.0, 109.0, 68.0, 40.0, 34.0, 28.0, 17.0, 22.0, 7.0, 10.0, 4.0, 4.0, 6.0, 3.0, 0.0, 1.0], "bins": [-0.94189453125, -0.9124298095703125, -0.882965087890625, -0.8535003662109375, -0.82403564453125, -0.7945709228515625, -0.765106201171875, -0.7356414794921875, -0.7061767578125, -0.6767120361328125, -0.647247314453125, -0.6177825927734375, -0.58831787109375, -0.5588531494140625, -0.529388427734375, -0.4999237060546875, -0.470458984375, -0.4409942626953125, -0.411529541015625, -0.3820648193359375, -0.35260009765625, -0.3231353759765625, -0.293670654296875, -0.2642059326171875, -0.2347412109375, -0.2052764892578125, -0.175811767578125, -0.1463470458984375, -0.11688232421875, -0.0874176025390625, -0.057952880859375, -0.0284881591796875, 0.0009765625, 0.0304412841796875, 0.059906005859375, 0.0893707275390625, 0.11883544921875, 0.1483001708984375, 0.177764892578125, 0.2072296142578125, 0.2366943359375, 0.2661590576171875, 0.295623779296875, 0.3250885009765625, 0.35455322265625, 0.3840179443359375, 0.413482666015625, 0.4429473876953125, 0.472412109375, 0.5018768310546875, 0.531341552734375, 0.5608062744140625, 0.59027099609375, 0.6197357177734375, 0.649200439453125, 0.6786651611328125, 0.7081298828125, 0.7375946044921875, 0.767059326171875, 0.7965240478515625, 0.82598876953125, 0.8554534912109375, 0.884918212890625, 0.9143829345703125, 0.94384765625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 3.0, 5.0, 3.0, 15.0, 10.0, 9.0, 12.0, 15.0, 14.0, 22.0, 33.0, 38.0, 26.0, 42.0, 36.0, 39.0, 38.0, 38.0, 41.0, 1070.0, 47.0, 50.0, 47.0, 41.0, 36.0, 42.0, 32.0, 43.0, 31.0, 18.0, 28.0, 19.0, 21.0, 11.0, 7.0, 9.0, 4.0, 7.0, 4.0, 7.0, 2.0, 2.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-15.0, -14.5780029296875, -14.156005859375, -13.7340087890625, -13.31201171875, -12.8900146484375, -12.468017578125, -12.0460205078125, -11.6240234375, -11.2020263671875, -10.780029296875, -10.3580322265625, -9.93603515625, -9.5140380859375, -9.092041015625, -8.6700439453125, -8.248046875, -7.8260498046875, -7.404052734375, -6.9820556640625, -6.56005859375, -6.1380615234375, -5.716064453125, -5.2940673828125, -4.8720703125, -4.4500732421875, -4.028076171875, -3.6060791015625, -3.18408203125, -2.7620849609375, -2.340087890625, -1.9180908203125, -1.49609375, -1.0740966796875, -0.652099609375, -0.2301025390625, 0.19189453125, 0.6138916015625, 1.035888671875, 1.4578857421875, 1.8798828125, 2.3018798828125, 2.723876953125, 3.1458740234375, 3.56787109375, 3.9898681640625, 4.411865234375, 4.8338623046875, 5.255859375, 5.6778564453125, 6.099853515625, 6.5218505859375, 6.94384765625, 7.3658447265625, 7.787841796875, 8.2098388671875, 8.6318359375, 9.0538330078125, 9.475830078125, 9.8978271484375, 10.31982421875, 10.7418212890625, 11.163818359375, 11.5858154296875, 12.0078125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 8.0, 10.0, 23.0, 30.0, 37.0, 59.0, 83.0, 134.0, 197.0, 313.0, 504.0, 736.0, 1124.0, 1677.0, 2704.0, 3992.0, 6182.0, 9345.0, 14396.0, 23125.0, 37566.0, 64987.0, 112650.0, 246332.0, 1200085.0, 153467.0, 85741.0, 49592.0, 29819.0, 18373.0, 11862.0, 7406.0, 4891.0, 3397.0, 2135.0, 1403.0, 908.0, 683.0, 385.0, 258.0, 181.0, 93.0, 90.0, 53.0, 35.0, 10.0, 18.0, 11.0, 8.0, 9.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.90234375, -0.875213623046875, -0.84808349609375, -0.820953369140625, -0.7938232421875, -0.766693115234375, -0.73956298828125, -0.712432861328125, -0.685302734375, -0.658172607421875, -0.63104248046875, -0.603912353515625, -0.5767822265625, -0.549652099609375, -0.52252197265625, -0.495391845703125, -0.46826171875, -0.441131591796875, -0.41400146484375, -0.386871337890625, -0.3597412109375, -0.332611083984375, -0.30548095703125, -0.278350830078125, -0.251220703125, -0.224090576171875, -0.19696044921875, -0.169830322265625, -0.1427001953125, -0.115570068359375, -0.08843994140625, -0.061309814453125, -0.0341796875, -0.007049560546875, 0.02008056640625, 0.047210693359375, 0.0743408203125, 0.101470947265625, 0.12860107421875, 0.155731201171875, 0.182861328125, 0.209991455078125, 0.23712158203125, 0.264251708984375, 0.2913818359375, 0.318511962890625, 0.34564208984375, 0.372772216796875, 0.39990234375, 0.427032470703125, 0.45416259765625, 0.481292724609375, 0.5084228515625, 0.535552978515625, 0.56268310546875, 0.589813232421875, 0.616943359375, 0.644073486328125, 0.67120361328125, 0.698333740234375, 0.7254638671875, 0.752593994140625, 0.77972412109375, 0.806854248046875, 0.833984375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 7.0, 8.0, 9.0, 17.0, 26.0, 33.0, 37.0, 45.0, 61.0, 60.0, 72.0, 85.0, 81.0, 87.0, 56.0, 46.0, 54.0, 38.0, 42.0, 24.0, 23.0, 21.0, 6.0, 9.0, 9.0, 2.0, 3.0, 5.0, 11.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03564453125, -0.034639596939086914, -0.03363466262817383, -0.03262972831726074, -0.031624794006347656, -0.03061985969543457, -0.029614925384521484, -0.0286099910736084, -0.027605056762695312, -0.026600122451782227, -0.02559518814086914, -0.024590253829956055, -0.02358531951904297, -0.022580385208129883, -0.021575450897216797, -0.02057051658630371, -0.019565582275390625, -0.01856064796447754, -0.017555713653564453, -0.016550779342651367, -0.015545845031738281, -0.014540910720825195, -0.01353597640991211, -0.012531042098999023, -0.011526107788085938, -0.010521173477172852, -0.009516239166259766, -0.00851130485534668, -0.007506370544433594, -0.006501436233520508, -0.005496501922607422, -0.004491567611694336, -0.00348663330078125, -0.002481698989868164, -0.0014767646789550781, -0.0004718303680419922, 0.0005331039428710938, 0.0015380382537841797, 0.0025429725646972656, 0.0035479068756103516, 0.0045528411865234375, 0.0055577754974365234, 0.006562709808349609, 0.007567644119262695, 0.008572578430175781, 0.009577512741088867, 0.010582447052001953, 0.011587381362915039, 0.012592315673828125, 0.013597249984741211, 0.014602184295654297, 0.015607118606567383, 0.01661205291748047, 0.017616987228393555, 0.01862192153930664, 0.019626855850219727, 0.020631790161132812, 0.0216367244720459, 0.022641658782958984, 0.02364659309387207, 0.024651527404785156, 0.025656461715698242, 0.026661396026611328, 0.027666330337524414, 0.0286712646484375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 6.0, 18.0, 12.0, 27.0, 31.0, 36.0, 55.0, 69.0, 75.0, 144.0, 249.0, 448.0, 808.0, 1679.0, 3467.0, 7738.0, 19040.0, 50212.0, 141199.0, 358898.0, 293405.0, 105765.0, 38097.0, 14855.0, 6306.0, 2796.0, 1317.0, 758.0, 393.0, 201.0, 143.0, 78.0, 62.0, 56.0, 27.0, 26.0, 17.0, 9.0, 10.0, 8.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.115966796875, -0.11220932006835938, -0.10845184326171875, -0.10469436645507812, -0.1009368896484375, -0.09717941284179688, -0.09342193603515625, -0.08966445922851562, -0.085906982421875, -0.08214950561523438, -0.07839202880859375, -0.07463455200195312, -0.0708770751953125, -0.06711959838867188, -0.06336212158203125, -0.059604644775390625, -0.05584716796875, -0.052089691162109375, -0.04833221435546875, -0.044574737548828125, -0.0408172607421875, -0.037059783935546875, -0.03330230712890625, -0.029544830322265625, -0.025787353515625, -0.022029876708984375, -0.01827239990234375, -0.014514923095703125, -0.0107574462890625, -0.006999969482421875, -0.00324249267578125, 0.000514984130859375, 0.0042724609375, 0.008029937744140625, 0.01178741455078125, 0.015544891357421875, 0.0193023681640625, 0.023059844970703125, 0.02681732177734375, 0.030574798583984375, 0.034332275390625, 0.038089752197265625, 0.04184722900390625, 0.045604705810546875, 0.0493621826171875, 0.053119659423828125, 0.05687713623046875, 0.060634613037109375, 0.06439208984375, 0.06814956665039062, 0.07190704345703125, 0.07566452026367188, 0.0794219970703125, 0.08317947387695312, 0.08693695068359375, 0.09069442749023438, 0.094451904296875, 0.09820938110351562, 0.10196685791015625, 0.10572433471679688, 0.1094818115234375, 0.11323928833007812, 0.11699676513671875, 0.12075424194335938, 0.12451171875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 8.0, 5.0, 8.0, 13.0, 10.0, 17.0, 19.0, 26.0, 44.0, 58.0, 57.0, 76.0, 92.0, 109.0, 98.0, 91.0, 70.0, 64.0, 45.0, 28.0, 22.0, 12.0, 9.0, 2.0, 6.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.07604219764471054, -0.07435810565948486, -0.07267400622367859, -0.07098991423845291, -0.06930582225322723, -0.06762173026800156, -0.06593763083219528, -0.0642535388469696, -0.06256944686174393, -0.06088535115122795, -0.059201259166002274, -0.0575171634554863, -0.05583307147026062, -0.054148975759744644, -0.05246488004922867, -0.05078078806400299, -0.049096692353487015, -0.04741259664297104, -0.04572850465774536, -0.044044408947229385, -0.04236031696200371, -0.04067622125148773, -0.038992129266262054, -0.03730803355574608, -0.0356239378452301, -0.03393984213471413, -0.03225575014948845, -0.030571654438972473, -0.028887562453746796, -0.02720346674323082, -0.025519372895359993, -0.023835279047489166, -0.02215118706226349, -0.020467093214392662, -0.018782999366521835, -0.01709890365600586, -0.015414810739457607, -0.01373071689158678, -0.01204662211239338, -0.010362528264522552, -0.008678434416651726, -0.006994340568780899, -0.005310246255248785, -0.003626151941716671, -0.0019420580938458443, -0.00025796424597501755, 0.0014261305332183838, 0.0031102243810892105, 0.004794318228960037, 0.006478412076830864, 0.00816250592470169, 0.009846600703895092, 0.011530694551765919, 0.013214788399636745, 0.014898883178830147, 0.016582977026700974, 0.0182670708745718, 0.019951164722442627, 0.021635258570313454, 0.02331935241818428, 0.025003448128700256, 0.026687540113925934, 0.02837163582444191, 0.030055729672312737, 0.03173982352018356]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 3.0, 2.0, 8.0, 6.0, 7.0, 6.0, 9.0, 12.0, 9.0, 15.0, 17.0, 20.0, 14.0, 20.0, 27.0, 32.0, 24.0, 32.0, 37.0, 35.0, 29.0, 37.0, 40.0, 32.0, 38.0, 29.0, 52.0, 35.0, 26.0, 41.0, 32.0, 20.0, 37.0, 31.0, 25.0, 22.0, 20.0, 18.0, 17.0, 11.0, 11.0, 12.0, 13.0, 10.0, 8.0, 7.0, 4.0, 5.0, 3.0, 5.0, 1.0, 0.0, 3.0], "bins": [-0.03223389387130737, -0.03132842481136322, -0.03042295202612877, -0.029517481103539467, -0.028612010180950165, -0.027706539258360863, -0.02680106833577156, -0.02589559741318226, -0.024990126490592957, -0.024084655568003654, -0.023179184645414352, -0.02227371372282505, -0.02136824280023575, -0.020462771877646446, -0.019557300955057144, -0.018651830032467842, -0.01774635910987854, -0.016840888187289238, -0.015935417264699936, -0.015029946342110634, -0.014124475419521332, -0.01321900449693203, -0.012313533574342728, -0.011408062651753426, -0.010502591729164124, -0.009597120806574821, -0.00869164988398552, -0.007786178961396217, -0.006880708038806915, -0.005975237116217613, -0.005069766193628311, -0.004164295271039009, -0.003258824348449707, -0.002353353425860405, -0.001447882503271103, -0.0005424115806818008, 0.0003630593419075012, 0.0012685302644968033, 0.0021740011870861053, 0.0030794721096754074, 0.0039849430322647095, 0.0048904139548540115, 0.005795884877443314, 0.006701355800032616, 0.007606826722621918, 0.00851229764521122, 0.009417768567800522, 0.010323239490389824, 0.011228710412979126, 0.012134181335568428, 0.01303965225815773, 0.013945123180747032, 0.014850594103336334, 0.015756065025925636, 0.01666153594851494, 0.01756700687110424, 0.018472477793693542, 0.019377948716282845, 0.020283419638872147, 0.02118889056146145, 0.02209436148405075, 0.022999832406640053, 0.023905303329229355, 0.024810774251818657, 0.02571624517440796]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 4.0, 8.0, 9.0, 9.0, 20.0, 15.0, 13.0, 22.0, 15.0, 17.0, 16.0, 44.0, 30.0, 27.0, 37.0, 51.0, 51.0, 40.0, 38.0, 40.0, 42.0, 49.0, 47.0, 42.0, 40.0, 38.0, 31.0, 26.0, 34.0, 23.0, 17.0, 14.0, 11.0, 16.0, 12.0, 10.0, 11.0, 5.0, 6.0, 5.0, 7.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.203125, -19.51904296875, -18.8349609375, -18.15087890625, -17.466796875, -16.78271484375, -16.0986328125, -15.41455078125, -14.73046875, -14.04638671875, -13.3623046875, -12.67822265625, -11.994140625, -11.31005859375, -10.6259765625, -9.94189453125, -9.2578125, -8.57373046875, -7.8896484375, -7.20556640625, -6.521484375, -5.83740234375, -5.1533203125, -4.46923828125, -3.78515625, -3.10107421875, -2.4169921875, -1.73291015625, -1.048828125, -0.36474609375, 0.3193359375, 1.00341796875, 1.6875, 2.37158203125, 3.0556640625, 3.73974609375, 4.423828125, 5.10791015625, 5.7919921875, 6.47607421875, 7.16015625, 7.84423828125, 8.5283203125, 9.21240234375, 9.896484375, 10.58056640625, 11.2646484375, 11.94873046875, 12.6328125, 13.31689453125, 14.0009765625, 14.68505859375, 15.369140625, 16.05322265625, 16.7373046875, 17.42138671875, 18.10546875, 18.78955078125, 19.4736328125, 20.15771484375, 20.841796875, 21.52587890625, 22.2099609375, 22.89404296875, 23.578125]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 5.0, 1.0, 4.0, 4.0, 7.0, 8.0, 7.0, 12.0, 20.0, 25.0, 23.0, 35.0, 37.0, 43.0, 71.0, 153.0, 218.0, 336.0, 569.0, 1183.0, 3798.0, 17829.0, 146528.0, 695392.0, 156446.0, 19190.0, 3804.0, 1238.0, 594.0, 329.0, 211.0, 138.0, 87.0, 63.0, 25.0, 30.0, 16.0, 17.0, 17.0, 10.0, 10.0, 8.0, 4.0, 9.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3359375, -4.18902587890625, -4.0421142578125, -3.89520263671875, -3.748291015625, -3.60137939453125, -3.4544677734375, -3.30755615234375, -3.16064453125, -3.01373291015625, -2.8668212890625, -2.71990966796875, -2.572998046875, -2.42608642578125, -2.2791748046875, -2.13226318359375, -1.9853515625, -1.83843994140625, -1.6915283203125, -1.54461669921875, -1.397705078125, -1.25079345703125, -1.1038818359375, -0.95697021484375, -0.81005859375, -0.66314697265625, -0.5162353515625, -0.36932373046875, -0.222412109375, -0.07550048828125, 0.0714111328125, 0.21832275390625, 0.365234375, 0.51214599609375, 0.6590576171875, 0.80596923828125, 0.952880859375, 1.09979248046875, 1.2467041015625, 1.39361572265625, 1.54052734375, 1.68743896484375, 1.8343505859375, 1.98126220703125, 2.128173828125, 2.27508544921875, 2.4219970703125, 2.56890869140625, 2.7158203125, 2.86273193359375, 3.0096435546875, 3.15655517578125, 3.303466796875, 3.45037841796875, 3.5972900390625, 3.74420166015625, 3.89111328125, 4.03802490234375, 4.1849365234375, 4.33184814453125, 4.478759765625, 4.62567138671875, 4.7725830078125, 4.91949462890625, 5.06640625]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 8.0, 8.0, 13.0, 13.0, 14.0, 23.0, 25.0, 35.0, 40.0, 47.0, 46.0, 52.0, 46.0, 56.0, 336.0, 1853.0, 46.0, 45.0, 56.0, 47.0, 41.0, 45.0, 34.0, 22.0, 29.0, 18.0, 7.0, 12.0, 6.0, 5.0, 8.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-42.59375, -41.47412109375, -40.3544921875, -39.23486328125, -38.115234375, -36.99560546875, -35.8759765625, -34.75634765625, -33.63671875, -32.51708984375, -31.3974609375, -30.27783203125, -29.158203125, -28.03857421875, -26.9189453125, -25.79931640625, -24.6796875, -23.56005859375, -22.4404296875, -21.32080078125, -20.201171875, -19.08154296875, -17.9619140625, -16.84228515625, -15.72265625, -14.60302734375, -13.4833984375, -12.36376953125, -11.244140625, -10.12451171875, -9.0048828125, -7.88525390625, -6.765625, -5.64599609375, -4.5263671875, -3.40673828125, -2.287109375, -1.16748046875, -0.0478515625, 1.07177734375, 2.19140625, 3.31103515625, 4.4306640625, 5.55029296875, 6.669921875, 7.78955078125, 8.9091796875, 10.02880859375, 11.1484375, 12.26806640625, 13.3876953125, 14.50732421875, 15.626953125, 16.74658203125, 17.8662109375, 18.98583984375, 20.10546875, 21.22509765625, 22.3447265625, 23.46435546875, 24.583984375, 25.70361328125, 26.8232421875, 27.94287109375, 29.0625]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 3.0, 5.0, 9.0, 5.0, 17.0, 29.0, 26.0, 32.0, 61.0, 100.0, 167.0, 349.0, 786.0, 2347.0, 10358.0, 110014.0, 2879362.0, 126466.0, 11429.0, 2484.0, 794.0, 361.0, 182.0, 112.0, 51.0, 42.0, 39.0, 21.0, 12.0, 11.0, 6.0, 5.0, 5.0, 0.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.859375, -3.7138671875, -3.568359375, -3.4228515625, -3.27734375, -3.1318359375, -2.986328125, -2.8408203125, -2.6953125, -2.5498046875, -2.404296875, -2.2587890625, -2.11328125, -1.9677734375, -1.822265625, -1.6767578125, -1.53125, -1.3857421875, -1.240234375, -1.0947265625, -0.94921875, -0.8037109375, -0.658203125, -0.5126953125, -0.3671875, -0.2216796875, -0.076171875, 0.0693359375, 0.21484375, 0.3603515625, 0.505859375, 0.6513671875, 0.796875, 0.9423828125, 1.087890625, 1.2333984375, 1.37890625, 1.5244140625, 1.669921875, 1.8154296875, 1.9609375, 2.1064453125, 2.251953125, 2.3974609375, 2.54296875, 2.6884765625, 2.833984375, 2.9794921875, 3.125, 3.2705078125, 3.416015625, 3.5615234375, 3.70703125, 3.8525390625, 3.998046875, 4.1435546875, 4.2890625, 4.4345703125, 4.580078125, 4.7255859375, 4.87109375, 5.0166015625, 5.162109375, 5.3076171875, 5.453125]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 12.0, 44.0, 65.0, 139.0, 240.0, 204.0, 119.0, 71.0, 32.0, 19.0, 19.0, 5.0, 5.0, 7.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-38.50821304321289, -36.230491638183594, -33.9527702331543, -31.675048828125, -29.397327423095703, -27.119606018066406, -24.841886520385742, -22.564165115356445, -20.28644371032715, -18.00872230529785, -15.731000900268555, -13.453280448913574, -11.175559043884277, -8.89783763885498, -6.6201171875, -4.342395782470703, -2.0646743774414062, 0.21304678916931152, 2.4907679557800293, 4.768488883972168, 7.046210289001465, 9.323931694030762, 11.601652145385742, 13.879373550415039, 16.157094955444336, 18.434816360473633, 20.71253776550293, 22.990257263183594, 25.26797866821289, 27.545700073242188, 29.823421478271484, 32.10114288330078, 34.378868103027344, 36.65658950805664, 38.93431091308594, 41.212032318115234, 43.48975372314453, 45.76747512817383, 48.045196533203125, 50.322914123535156, 52.60063934326172, 54.878360748291016, 57.15608215332031, 59.43380355834961, 61.711524963378906, 63.9892463684082, 66.2669677734375, 68.54468536376953, 70.82240295410156, 73.1001205444336, 75.37784576416016, 77.65556335449219, 79.93328857421875, 82.21100616455078, 84.48873138427734, 86.76644897460938, 89.04417419433594, 91.32189178466797, 93.59961700439453, 95.87733459472656, 98.15505981445312, 100.43277740478516, 102.71050262451172, 104.98822021484375, 107.26594543457031]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 3.0, 1.0, 6.0, 7.0, 8.0, 14.0, 14.0, 15.0, 19.0, 16.0, 23.0, 25.0, 30.0, 35.0, 36.0, 33.0, 45.0, 36.0, 24.0, 43.0, 35.0, 36.0, 41.0, 37.0, 36.0, 45.0, 29.0, 38.0, 37.0, 25.0, 18.0, 20.0, 21.0, 20.0, 17.0, 18.0, 13.0, 14.0, 13.0, 10.0, 14.0, 8.0, 6.0, 1.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-34.845970153808594, -33.69481658935547, -32.543663024902344, -31.392505645751953, -30.241352081298828, -29.090198516845703, -27.939043045043945, -26.787887573242188, -25.636734008789062, -24.485580444335938, -23.33442497253418, -22.183269500732422, -21.032115936279297, -19.880962371826172, -18.729806900024414, -17.578651428222656, -16.42749786376953, -15.27634334564209, -14.125188827514648, -12.974034309387207, -11.822879791259766, -10.671725273132324, -9.520570755004883, -8.369416236877441, -7.21826171875, -6.067107200622559, -4.915952682495117, -3.764798164367676, -2.6136436462402344, -1.462489128112793, -0.31133460998535156, 0.8398199081420898, 1.9909782409667969, 3.1421327590942383, 4.29328727722168, 5.444441795349121, 6.5955963134765625, 7.746750831604004, 8.897905349731445, 10.049059867858887, 11.200214385986328, 12.35136890411377, 13.502523422241211, 14.653677940368652, 15.804832458496094, 16.95598602294922, 18.107141494750977, 19.258296966552734, 20.40945053100586, 21.560604095458984, 22.711759567260742, 23.8629150390625, 25.014068603515625, 26.16522216796875, 27.316377639770508, 28.467533111572266, 29.61868667602539, 30.769840240478516, 31.920995712280273, 33.07215118408203, 34.223304748535156, 35.37445831298828, 36.525611877441406, 37.6767692565918, 38.82792282104492]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 6.0, 10.0, 13.0, 10.0, 15.0, 25.0, 31.0, 35.0, 55.0, 73.0, 100.0, 127.0, 171.0, 359.0, 663.0, 1627.0, 4053.0, 10969.0, 1021848.0, 4688.0, 1823.0, 734.0, 365.0, 226.0, 139.0, 103.0, 82.0, 57.0, 45.0, 28.0, 21.0, 19.0, 15.0, 8.0, 5.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.13714599609375, -10.6744384765625, -10.21173095703125, -9.749022483825684, -9.286314964294434, -8.823607444763184, -8.360898971557617, -7.898191452026367, -7.435483932495117, -6.972776412963867, -6.510068416595459, -6.047360420227051, -5.584652900695801, -5.121945381164551, -4.659237384796143, -4.196529388427734, -3.7338218688964844, -3.2711141109466553, -2.808406352996826, -2.345698595046997, -1.882990837097168, -1.4202830791473389, -0.9575753211975098, -0.49486756324768066, -0.03215980529785156, 0.43054795265197754, 0.8932557106018066, 1.3559634685516357, 1.8186712265014648, 2.281378984451294, 2.744086742401123, 3.206794500350952, 3.6695022583007812, 4.132209777832031, 4.5949177742004395, 5.057625770568848, 5.520333290100098, 5.983040809631348, 6.445748805999756, 6.908456802368164, 7.371164321899414, 7.833871841430664, 8.296579360961914, 8.75928783416748, 9.22199535369873, 9.68470287322998, 10.147411346435547, 10.610118865966797, 11.072826385498047, 11.535533905029297, 11.998241424560547, 12.460949897766113, 12.923657417297363, 13.386364936828613, 13.84907341003418, 14.31178092956543, 14.77448844909668, 15.23719596862793, 15.69990348815918, 16.16261100769043, 16.625320434570312, 17.088027954101562, 17.550735473632812, 18.013442993164062, 18.476150512695312]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 3.0, 13.0, 15.0, 75.0, 1076.0, 51457952.0, 3714.0, 234.0, 32.0, 10.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-390.0, -377.7001953125, -365.400390625, -353.1005859375, -340.8007507324219, -328.5009460449219, -316.2011413574219, -303.9013366699219, -291.60150146484375, -279.30169677734375, -267.00189208984375, -254.7020721435547, -242.40225219726562, -230.10244750976562, -217.80264282226562, -205.50283813476562, -193.20303344726562, -180.90322875976562, -168.60340881347656, -156.30360412597656, -144.0037841796875, -131.7039794921875, -119.4041748046875, -107.10436248779297, -94.80455017089844, -82.5047378540039, -70.20492553710938, -57.905120849609375, -45.605308532714844, -33.30549621582031, -21.005691528320312, -8.705879211425781, 3.59393310546875, 15.893743515014648, 28.193553924560547, 40.49336242675781, 52.793174743652344, 65.09298706054688, 77.39279174804688, 89.6926040649414, 101.99241638183594, 114.29222869873047, 126.592041015625, 138.891845703125, 151.191650390625, 163.49147033691406, 175.79127502441406, 188.09109497070312, 200.39089965820312, 212.69070434570312, 224.9905242919922, 237.2903289794922, 249.59014892578125, 261.88995361328125, 274.18975830078125, 286.48956298828125, 298.78936767578125, 311.08917236328125, 323.38897705078125, 335.68878173828125, 347.9886169433594, 360.2884216308594, 372.5882263183594, 384.8880310058594, 397.1878662109375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 3.0, 5.0, 10.0, 4.0, 19.0, 23.0, 34.0, 55.0, 84.0, 116.0, 182.0, 308.0, 466.0, 721.0, 1112.0, 1880.0, 2981.0, 5156.0, 8807.0, 15064.0, 26892.0, 48875.0, 92445.0, 182910.0, 384089.0, 1117099.0, 2875204.0, 857101.0, 327935.0, 159065.0, 81652.0, 43596.0, 23954.0, 13577.0, 7828.0, 4656.0, 2809.0, 1678.0, 1061.0, 677.0, 444.0, 295.0, 169.0, 109.0, 86.0, 52.0, 42.0, 34.0, 20.0, 15.0, 14.0, 11.0, 7.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-2.123046875, -2.057525634765625, -1.99200439453125, -1.926483154296875, -1.8609619140625, -1.795440673828125, -1.72991943359375, -1.664398193359375, -1.598876953125, -1.533355712890625, -1.46783447265625, -1.402313232421875, -1.3367919921875, -1.271270751953125, -1.20574951171875, -1.140228271484375, -1.07470703125, -1.009185791015625, -0.94366455078125, -0.878143310546875, -0.8126220703125, -0.747100830078125, -0.68157958984375, -0.616058349609375, -0.550537109375, -0.485015869140625, -0.41949462890625, -0.353973388671875, -0.2884521484375, -0.222930908203125, -0.15740966796875, -0.091888427734375, -0.0263671875, 0.039154052734375, 0.10467529296875, 0.170196533203125, 0.2357177734375, 0.301239013671875, 0.36676025390625, 0.432281494140625, 0.497802734375, 0.563323974609375, 0.62884521484375, 0.694366455078125, 0.7598876953125, 0.825408935546875, 0.89093017578125, 0.956451416015625, 1.02197265625, 1.087493896484375, 1.15301513671875, 1.218536376953125, 1.2840576171875, 1.349578857421875, 1.41510009765625, 1.480621337890625, 1.546142578125, 1.611663818359375, 1.67718505859375, 1.742706298828125, 1.8082275390625, 1.873748779296875, 1.93927001953125, 2.004791259765625, 2.0703125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 8.0, 4.0, 3.0, 4.0, 10.0, 8.0, 7.0, 15.0, 23.0, 21.0, 21.0, 16.0, 30.0, 28.0, 25.0, 29.0, 32.0, 37.0, 37.0, 58.0, 64.0, 280.0, 512.0, 261.0, 106.0, 42.0, 43.0, 29.0, 36.0, 28.0, 32.0, 25.0, 35.0, 29.0, 18.0, 20.0, 19.0, 13.0, 9.0, 9.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.84375, -6.65557861328125, -6.4674072265625, -6.27923583984375, -6.091064453125, -5.90289306640625, -5.7147216796875, -5.52655029296875, -5.33837890625, -5.15020751953125, -4.9620361328125, -4.77386474609375, -4.585693359375, -4.39752197265625, -4.2093505859375, -4.02117919921875, -3.8330078125, -3.64483642578125, -3.4566650390625, -3.26849365234375, -3.080322265625, -2.89215087890625, -2.7039794921875, -2.51580810546875, -2.32763671875, -2.13946533203125, -1.9512939453125, -1.76312255859375, -1.574951171875, -1.38677978515625, -1.1986083984375, -1.01043701171875, -0.822265625, -0.63409423828125, -0.4459228515625, -0.25775146484375, -0.069580078125, 0.11859130859375, 0.3067626953125, 0.49493408203125, 0.68310546875, 0.87127685546875, 1.0594482421875, 1.24761962890625, 1.435791015625, 1.62396240234375, 1.8121337890625, 2.00030517578125, 2.1884765625, 2.37664794921875, 2.5648193359375, 2.75299072265625, 2.941162109375, 3.12933349609375, 3.3175048828125, 3.50567626953125, 3.69384765625, 3.88201904296875, 4.0701904296875, 4.25836181640625, 4.446533203125, 4.63470458984375, 4.8228759765625, 5.01104736328125, 5.19921875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 3.0, 5.0, 7.0, 15.0, 30.0, 37.0, 69.0, 112.0, 146.0, 215.0, 356.0, 536.0, 786.0, 1347.0, 2068.0, 3220.0, 5088.0, 7596.0, 12065.0, 18540.0, 27977.0, 42564.0, 64338.0, 94231.0, 136698.0, 193540.0, 266740.0, 429184.0, 1414863.0, 2026510.0, 561114.0, 299138.0, 212462.0, 152140.0, 105993.0, 72061.0, 47946.0, 31735.0, 21040.0, 13715.0, 8953.0, 5793.0, 3722.0, 2455.0, 1546.0, 957.0, 630.0, 388.0, 281.0, 191.0, 103.0, 71.0, 41.0, 37.0, 17.0, 12.0, 12.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.880859375, -0.8534622192382812, -0.8260650634765625, -0.7986679077148438, -0.771270751953125, -0.7438735961914062, -0.7164764404296875, -0.6890792846679688, -0.66168212890625, -0.6342849731445312, -0.6068878173828125, -0.5794906616210938, -0.552093505859375, -0.5246963500976562, -0.4972991943359375, -0.46990203857421875, -0.4425048828125, -0.41510772705078125, -0.3877105712890625, -0.36031341552734375, -0.332916259765625, -0.30551910400390625, -0.2781219482421875, -0.25072479248046875, -0.22332763671875, -0.19593048095703125, -0.1685333251953125, -0.14113616943359375, -0.113739013671875, -0.08634185791015625, -0.0589447021484375, -0.03154754638671875, -0.004150390625, 0.02324676513671875, 0.0506439208984375, 0.07804107666015625, 0.105438232421875, 0.13283538818359375, 0.1602325439453125, 0.18762969970703125, 0.21502685546875, 0.24242401123046875, 0.2698211669921875, 0.29721832275390625, 0.324615478515625, 0.35201263427734375, 0.3794097900390625, 0.40680694580078125, 0.4342041015625, 0.46160125732421875, 0.4889984130859375, 0.5163955688476562, 0.543792724609375, 0.5711898803710938, 0.5985870361328125, 0.6259841918945312, 0.65338134765625, 0.6807785034179688, 0.7081756591796875, 0.7355728149414062, 0.762969970703125, 0.7903671264648438, 0.8177642822265625, 0.8451614379882812, 0.87255859375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 8.0, 8.0, 7.0, 8.0, 8.0, 7.0, 19.0, 25.0, 26.0, 21.0, 23.0, 31.0, 34.0, 24.0, 40.0, 36.0, 36.0, 52.0, 76.0, 303.0, 518.0, 217.0, 92.0, 47.0, 37.0, 38.0, 46.0, 30.0, 19.0, 23.0, 26.0, 22.0, 21.0, 12.0, 12.0, 11.0, 8.0, 14.0, 7.0, 11.0, 3.0, 7.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-8.09375, -7.85797119140625, -7.6221923828125, -7.38641357421875, -7.150634765625, -6.91485595703125, -6.6790771484375, -6.44329833984375, -6.20751953125, -5.97174072265625, -5.7359619140625, -5.50018310546875, -5.264404296875, -5.02862548828125, -4.7928466796875, -4.55706787109375, -4.3212890625, -4.08551025390625, -3.8497314453125, -3.61395263671875, -3.378173828125, -3.14239501953125, -2.9066162109375, -2.67083740234375, -2.43505859375, -2.19927978515625, -1.9635009765625, -1.72772216796875, -1.491943359375, -1.25616455078125, -1.0203857421875, -0.78460693359375, -0.548828125, -0.31304931640625, -0.0772705078125, 0.15850830078125, 0.394287109375, 0.63006591796875, 0.8658447265625, 1.10162353515625, 1.33740234375, 1.57318115234375, 1.8089599609375, 2.04473876953125, 2.280517578125, 2.51629638671875, 2.7520751953125, 2.98785400390625, 3.2236328125, 3.45941162109375, 3.6951904296875, 3.93096923828125, 4.166748046875, 4.40252685546875, 4.6383056640625, 4.87408447265625, 5.10986328125, 5.34564208984375, 5.5814208984375, 5.81719970703125, 6.052978515625, 6.28875732421875, 6.5245361328125, 6.76031494140625, 6.99609375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 0.0, 4.0, 13.0, 12.0, 11.0, 25.0, 27.0, 69.0, 72.0, 89.0, 105.0, 173.0, 218.0, 318.0, 526.0, 988.0, 1590.0, 2558.0, 4945.0, 11017.0, 34198.0, 122837.0, 5837984.0, 194404.0, 50385.0, 15028.0, 6099.0, 3059.0, 1724.0, 1023.0, 613.0, 404.0, 263.0, 170.0, 138.0, 107.0, 60.0, 45.0, 37.0, 17.0, 34.0, 26.0, 6.0, 7.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0], "bins": [-11.0390625, -10.7294921875, -10.419921875, -10.1103515625, -9.80078125, -9.4912109375, -9.181640625, -8.8720703125, -8.5625, -8.2529296875, -7.943359375, -7.6337890625, -7.32421875, -7.0146484375, -6.705078125, -6.3955078125, -6.0859375, -5.7763671875, -5.466796875, -5.1572265625, -4.84765625, -4.5380859375, -4.228515625, -3.9189453125, -3.609375, -3.2998046875, -2.990234375, -2.6806640625, -2.37109375, -2.0615234375, -1.751953125, -1.4423828125, -1.1328125, -0.8232421875, -0.513671875, -0.2041015625, 0.10546875, 0.4150390625, 0.724609375, 1.0341796875, 1.34375, 1.6533203125, 1.962890625, 2.2724609375, 2.58203125, 2.8916015625, 3.201171875, 3.5107421875, 3.8203125, 4.1298828125, 4.439453125, 4.7490234375, 5.05859375, 5.3681640625, 5.677734375, 5.9873046875, 6.296875, 6.6064453125, 6.916015625, 7.2255859375, 7.53515625, 7.8447265625, 8.154296875, 8.4638671875, 8.7734375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 7.0, 5.0, 8.0, 12.0, 19.0, 11.0, 18.0, 26.0, 25.0, 23.0, 28.0, 18.0, 27.0, 28.0, 33.0, 40.0, 29.0, 41.0, 55.0, 472.0, 591.0, 74.0, 43.0, 32.0, 36.0, 26.0, 40.0, 40.0, 32.0, 21.0, 24.0, 17.0, 20.0, 23.0, 15.0, 6.0, 12.0, 12.0, 11.0, 4.0, 3.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-15.3671875, -14.90234375, -14.4375, -13.97265625, -13.5078125, -13.04296875, -12.578125, -12.11328125, -11.6484375, -11.18359375, -10.71875, -10.25390625, -9.7890625, -9.32421875, -8.859375, -8.39453125, -7.9296875, -7.46484375, -7.0, -6.53515625, -6.0703125, -5.60546875, -5.140625, -4.67578125, -4.2109375, -3.74609375, -3.28125, -2.81640625, -2.3515625, -1.88671875, -1.421875, -0.95703125, -0.4921875, -0.02734375, 0.4375, 0.90234375, 1.3671875, 1.83203125, 2.296875, 2.76171875, 3.2265625, 3.69140625, 4.15625, 4.62109375, 5.0859375, 5.55078125, 6.015625, 6.48046875, 6.9453125, 7.41015625, 7.875, 8.33984375, 8.8046875, 9.26953125, 9.734375, 10.19921875, 10.6640625, 11.12890625, 11.59375, 12.05859375, 12.5234375, 12.98828125, 13.453125, 13.91796875, 14.3828125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 11.0, 16.0, 53.0, 568.0, 286.0, 31.0, 13.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.99908447265625, -96.27044677734375, -92.54180145263672, -88.81315612792969, -85.08451843261719, -81.35588073730469, -77.62723541259766, -73.89859008789062, -70.16995239257812, -66.44131469726562, -62.712669372558594, -58.98402786254883, -55.25538635253906, -51.5267448425293, -47.79810333251953, -44.069461822509766, -40.3408203125, -36.612178802490234, -32.88353729248047, -29.154895782470703, -25.426254272460938, -21.697612762451172, -17.968971252441406, -14.24032974243164, -10.511688232421875, -6.783046722412109, -3.0544052124023438, 0.6742362976074219, 4.4028778076171875, 8.131519317626953, 11.860160827636719, 15.588802337646484, 19.31744384765625, 23.046085357666016, 26.77472686767578, 30.503368377685547, 34.23200988769531, 37.96065139770508, 41.689292907714844, 45.41793441772461, 49.146575927734375, 52.87521743774414, 56.603858947753906, 60.33250045776367, 64.06114196777344, 67.78977966308594, 71.51842498779297, 75.2470703125, 78.9757080078125, 82.704345703125, 86.43299102783203, 90.16163635253906, 93.89027404785156, 97.61891174316406, 101.3475570678711, 105.07620239257812, 108.80484008789062, 112.53347778320312, 116.26212310791016, 119.99076843261719, 123.71940612792969, 127.44804382324219, 131.17669677734375, 134.90533447265625, 138.63397216796875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 6.0, 7.0, 5.0, 5.0, 8.0, 9.0, 17.0, 19.0, 22.0, 62.0, 237.0, 309.0, 140.0, 39.0, 24.0, 12.0, 12.0, 10.0, 11.0, 14.0, 5.0, 3.0, 10.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-119.98593139648438, -117.08096313476562, -114.17599487304688, -111.27102661132812, -108.36605834960938, -105.46109008789062, -102.55612182617188, -99.6511459350586, -96.74617767333984, -93.8412094116211, -90.93624114990234, -88.0312728881836, -85.12630462646484, -82.22132873535156, -79.31636047363281, -76.41139221191406, -73.50642395019531, -70.60145568847656, -67.69648742675781, -64.79151916503906, -61.88654708862305, -58.9815788269043, -56.07661056518555, -53.17163848876953, -50.26667785644531, -47.36170959472656, -44.45674133300781, -41.55177307128906, -38.64680099487305, -35.7418327331543, -32.83686447143555, -29.931894302368164, -27.02692413330078, -24.12195587158203, -21.21698570251465, -18.3120174407959, -15.407048225402832, -12.502079010009766, -9.597110748291016, -6.692140579223633, -3.787172317504883, -0.8822033405303955, 2.022765636444092, 4.927734375, 7.832703590393066, 10.737672805786133, 13.642641067504883, 16.547611236572266, 19.452579498291016, 22.357547760009766, 25.26251792907715, 28.1674861907959, 31.07245635986328, 33.97742462158203, 36.88239288330078, 39.78736114501953, 42.69232940673828, 45.59729766845703, 48.50226593017578, 51.40723419189453, 54.31220626831055, 57.2171745300293, 60.12214279174805, 63.02711486816406, 65.93208312988281]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 6.0, 3.0, 8.0, 16.0, 12.0, 21.0, 23.0, 36.0, 50.0, 71.0, 114.0, 171.0, 315.0, 423.0, 776.0, 1386.0, 2622.0, 5457.0, 14605.0, 87814.0, 4010926.0, 45924.0, 11828.0, 5116.0, 2603.0, 1435.0, 812.0, 540.0, 357.0, 262.0, 174.0, 132.0, 78.0, 45.0, 34.0, 26.0, 16.0, 17.0, 13.0, 6.0, 8.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.417724609375, -0.4044151306152344, -0.39110565185546875, -0.3777961730957031, -0.3644866943359375, -0.3511772155761719, -0.33786773681640625, -0.3245582580566406, -0.311248779296875, -0.2979393005371094, -0.28462982177734375, -0.2713203430175781, -0.2580108642578125, -0.24470138549804688, -0.23139190673828125, -0.21808242797851562, -0.20477294921875, -0.19146347045898438, -0.17815399169921875, -0.16484451293945312, -0.1515350341796875, -0.13822555541992188, -0.12491607666015625, -0.11160659790039062, -0.098297119140625, -0.08498764038085938, -0.07167816162109375, -0.058368682861328125, -0.0450592041015625, -0.031749725341796875, -0.01844024658203125, -0.005130767822265625, 0.0081787109375, 0.021488189697265625, 0.03479766845703125, 0.048107147216796875, 0.0614166259765625, 0.07472610473632812, 0.08803558349609375, 0.10134506225585938, 0.114654541015625, 0.12796401977539062, 0.14127349853515625, 0.15458297729492188, 0.1678924560546875, 0.18120193481445312, 0.19451141357421875, 0.20782089233398438, 0.22113037109375, 0.23443984985351562, 0.24774932861328125, 0.2610588073730469, 0.2743682861328125, 0.2876777648925781, 0.30098724365234375, 0.3142967224121094, 0.327606201171875, 0.3409156799316406, 0.35422515869140625, 0.3675346374511719, 0.3808441162109375, 0.3941535949707031, 0.40746307373046875, 0.4207725524902344, 0.43408203125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 2.0, 2.0, 6.0, 1.0, 3.0, 3.0, 5.0, 5.0, 4.0, 12.0, 6.0, 7.0, 8.0, 15.0, 61.0, 722.0, 14.0, 15.0, 11.0, 8.0, 2.0, 9.0, 8.0, 4.0, 7.0, 5.0, 3.0, 2.0, 11.0, 2.0, 4.0, 3.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.179931640625, -0.17404937744140625, -0.1681671142578125, -0.16228485107421875, -0.156402587890625, -0.15052032470703125, -0.1446380615234375, -0.13875579833984375, -0.13287353515625, -0.12699127197265625, -0.1211090087890625, -0.11522674560546875, -0.109344482421875, -0.10346221923828125, -0.0975799560546875, -0.09169769287109375, -0.0858154296875, -0.07993316650390625, -0.0740509033203125, -0.06816864013671875, -0.062286376953125, -0.05640411376953125, -0.0505218505859375, -0.04463958740234375, -0.03875732421875, -0.03287506103515625, -0.0269927978515625, -0.02111053466796875, -0.015228271484375, -0.00934600830078125, -0.0034637451171875, 0.00241851806640625, 0.00830078125, 0.01418304443359375, 0.0200653076171875, 0.02594757080078125, 0.031829833984375, 0.03771209716796875, 0.0435943603515625, 0.04947662353515625, 0.05535888671875, 0.06124114990234375, 0.0671234130859375, 0.07300567626953125, 0.078887939453125, 0.08477020263671875, 0.0906524658203125, 0.09653472900390625, 0.1024169921875, 0.10829925537109375, 0.1141815185546875, 0.12006378173828125, 0.125946044921875, 0.13182830810546875, 0.1377105712890625, 0.14359283447265625, 0.14947509765625, 0.15535736083984375, 0.1612396240234375, 0.16712188720703125, 0.173004150390625, 0.17888641357421875, 0.1847686767578125, 0.19065093994140625, 0.196533203125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 2.0, 3.0, 8.0, 7.0, 9.0, 18.0, 36.0, 35.0, 64.0, 132.0, 214.0, 417.0, 859.0, 2042.0, 5652.0, 19844.0, 107332.0, 3573920.0, 422886.0, 43727.0, 10600.0, 3551.0, 1418.0, 629.0, 353.0, 173.0, 122.0, 85.0, 59.0, 21.0, 23.0, 8.0, 7.0, 6.0, 5.0, 4.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48095703125, -0.46228790283203125, -0.4436187744140625, -0.42494964599609375, -0.406280517578125, -0.38761138916015625, -0.3689422607421875, -0.35027313232421875, -0.33160400390625, -0.31293487548828125, -0.2942657470703125, -0.27559661865234375, -0.256927490234375, -0.23825836181640625, -0.2195892333984375, -0.20092010498046875, -0.1822509765625, -0.16358184814453125, -0.1449127197265625, -0.12624359130859375, -0.107574462890625, -0.08890533447265625, -0.0702362060546875, -0.05156707763671875, -0.03289794921875, -0.01422882080078125, 0.0044403076171875, 0.02310943603515625, 0.041778564453125, 0.06044769287109375, 0.0791168212890625, 0.09778594970703125, 0.116455078125, 0.13512420654296875, 0.1537933349609375, 0.17246246337890625, 0.191131591796875, 0.20980072021484375, 0.2284698486328125, 0.24713897705078125, 0.26580810546875, 0.28447723388671875, 0.3031463623046875, 0.32181549072265625, 0.340484619140625, 0.35915374755859375, 0.3778228759765625, 0.39649200439453125, 0.4151611328125, 0.43383026123046875, 0.4524993896484375, 0.47116851806640625, 0.489837646484375, 0.5085067749023438, 0.5271759033203125, 0.5458450317382812, 0.56451416015625, 0.5831832885742188, 0.6018524169921875, 0.6205215454101562, 0.639190673828125, 0.6578598022460938, 0.6765289306640625, 0.6951980590820312, 0.7138671875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 3.0, 9.0, 8.0, 11.0, 18.0, 15.0, 28.0, 33.0, 47.0, 55.0, 99.0, 151.0, 264.0, 812.0, 1568.0, 403.0, 196.0, 92.0, 58.0, 60.0, 27.0, 17.0, 22.0, 20.0, 11.0, 10.0, 8.0, 3.0, 6.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.16162109375, -0.1560955047607422, -0.15056991577148438, -0.14504432678222656, -0.13951873779296875, -0.13399314880371094, -0.12846755981445312, -0.12294197082519531, -0.1174163818359375, -0.11189079284667969, -0.10636520385742188, -0.10083961486816406, -0.09531402587890625, -0.08978843688964844, -0.08426284790039062, -0.07873725891113281, -0.073211669921875, -0.06768608093261719, -0.062160491943359375, -0.05663490295410156, -0.05110931396484375, -0.04558372497558594, -0.040058135986328125, -0.03453254699707031, -0.0290069580078125, -0.023481369018554688, -0.017955780029296875, -0.012430191040039062, -0.00690460205078125, -0.0013790130615234375, 0.004146575927734375, 0.009672164916992188, 0.01519775390625, 0.020723342895507812, 0.026248931884765625, 0.03177452087402344, 0.03730010986328125, 0.04282569885253906, 0.048351287841796875, 0.05387687683105469, 0.0594024658203125, 0.06492805480957031, 0.07045364379882812, 0.07597923278808594, 0.08150482177734375, 0.08703041076660156, 0.09255599975585938, 0.09808158874511719, 0.103607177734375, 0.10913276672363281, 0.11465835571289062, 0.12018394470214844, 0.12570953369140625, 0.13123512268066406, 0.13676071166992188, 0.1422863006591797, 0.1478118896484375, 0.1533374786376953, 0.15886306762695312, 0.16438865661621094, 0.16991424560546875, 0.17543983459472656, 0.18096542358398438, 0.1864910125732422, 0.1920166015625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 8.0, 27.0, 65.0, 117.0, 222.0, 233.0, 181.0, 88.0, 28.0, 15.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.138641595840454, -1.0999451875686646, -1.061248779296875, -1.0225523710250854, -0.9838559627532959, -0.9451595544815063, -0.9064631462097168, -0.8677667379379272, -0.8290703296661377, -0.7903739213943481, -0.7516775131225586, -0.712981104850769, -0.6742846965789795, -0.6355882883071899, -0.5968918800354004, -0.5581954717636108, -0.5194990634918213, -0.48080265522003174, -0.4421062469482422, -0.40340983867645264, -0.3647134304046631, -0.32601702213287354, -0.287320613861084, -0.24862420558929443, -0.20992779731750488, -0.17123138904571533, -0.13253498077392578, -0.09383857250213623, -0.05514216423034668, -0.01644575595855713, 0.022250652313232422, 0.06094706058502197, 0.09964346885681152, 0.13833987712860107, 0.17703628540039062, 0.21573269367218018, 0.2544291019439697, 0.2931255102157593, 0.33182191848754883, 0.3705183267593384, 0.40921473503112793, 0.4479111433029175, 0.48660755157470703, 0.5253039598464966, 0.5640003681182861, 0.6026967763900757, 0.6413931846618652, 0.6800895929336548, 0.7187860012054443, 0.7574824094772339, 0.7961788177490234, 0.834875226020813, 0.8735716342926025, 0.9122680425643921, 0.9509644508361816, 0.9896608591079712, 1.0283572673797607, 1.0670536756515503, 1.1057500839233398, 1.1444464921951294, 1.183142900466919, 1.2218393087387085, 1.260535717010498, 1.2992321252822876, 1.3379285335540771]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 4.0, 6.0, 7.0, 18.0, 10.0, 13.0, 31.0, 29.0, 36.0, 47.0, 61.0, 59.0, 67.0, 67.0, 86.0, 90.0, 65.0, 61.0, 56.0, 34.0, 50.0, 30.0, 16.0, 16.0, 17.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.9934549927711487, -0.967807948589325, -0.9421609044075012, -0.9165139198303223, -0.8908668756484985, -0.8652198314666748, -0.8395727872848511, -0.8139257431030273, -0.7882786989212036, -0.7626316547393799, -0.7369846105575562, -0.7113375663757324, -0.6856905817985535, -0.6600435376167297, -0.634396493434906, -0.6087494492530823, -0.5831024646759033, -0.5574554204940796, -0.5318083763122559, -0.5061613321304321, -0.4805143475532532, -0.45486730337142944, -0.4292202591896057, -0.403573215007782, -0.37792620062828064, -0.3522791564464569, -0.32663214206695557, -0.30098509788513184, -0.2753380537033081, -0.24969103932380676, -0.22404399514198303, -0.1983969658613205, -0.17274999618530273, -0.1471029669046402, -0.12145593017339706, -0.09580889344215393, -0.0701618641614914, -0.04451483488082886, -0.018867790699005127, 0.00677923858165741, 0.032426267862319946, 0.05807330086827278, 0.08372033387422562, 0.10936737060546875, 0.1350143998861313, 0.16066142916679382, 0.18630847334861755, 0.2119555026292801, 0.23760253190994263, 0.26324957609176636, 0.2888965904712677, 0.31454363465309143, 0.3401906490325928, 0.3658376932144165, 0.39148473739624023, 0.41713178157806396, 0.4427787959575653, 0.46842584013938904, 0.4940728545188904, 0.5197198987007141, 0.5453669428825378, 0.5710139274597168, 0.5966609716415405, 0.6223080158233643, 0.647955060005188]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 16.0, 14.0, 26.0, 34.0, 34.0, 51.0, 73.0, 102.0, 142.0, 175.0, 231.0, 318.0, 398.0, 519.0, 800.0, 1172.0, 1475.0, 2138.0, 3047.0, 4226.0, 6093.0, 9057.0, 13545.0, 20675.0, 33053.0, 776359.0, 93637.0, 26701.0, 17188.0, 11469.0, 7551.0, 5304.0, 3724.0, 2578.0, 1782.0, 1303.0, 972.0, 660.0, 525.0, 378.0, 263.0, 182.0, 161.0, 112.0, 100.0, 62.0, 30.0, 31.0, 18.0, 21.0, 12.0, 6.0, 5.0, 6.0, 0.0, 4.0], "bins": [-0.39501953125, -0.3833274841308594, -0.37163543701171875, -0.3599433898925781, -0.3482513427734375, -0.3365592956542969, -0.32486724853515625, -0.3131752014160156, -0.301483154296875, -0.2897911071777344, -0.27809906005859375, -0.2664070129394531, -0.2547149658203125, -0.24302291870117188, -0.23133087158203125, -0.21963882446289062, -0.20794677734375, -0.19625473022460938, -0.18456268310546875, -0.17287063598632812, -0.1611785888671875, -0.14948654174804688, -0.13779449462890625, -0.12610244750976562, -0.114410400390625, -0.10271835327148438, -0.09102630615234375, -0.07933425903320312, -0.0676422119140625, -0.055950164794921875, -0.04425811767578125, -0.032566070556640625, -0.0208740234375, -0.009181976318359375, 0.00251007080078125, 0.014202117919921875, 0.0258941650390625, 0.037586212158203125, 0.04927825927734375, 0.060970306396484375, 0.072662353515625, 0.08435440063476562, 0.09604644775390625, 0.10773849487304688, 0.1194305419921875, 0.13112258911132812, 0.14281463623046875, 0.15450668334960938, 0.16619873046875, 0.17789077758789062, 0.18958282470703125, 0.20127487182617188, 0.2129669189453125, 0.22465896606445312, 0.23635101318359375, 0.24804306030273438, 0.259735107421875, 0.2714271545410156, 0.28311920166015625, 0.2948112487792969, 0.3065032958984375, 0.3181953430175781, 0.32988739013671875, 0.3415794372558594, 0.353271484375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 8.0, 1.0, 2.0, 5.0, 4.0, 1.0, 3.0, 2.0, 6.0, 7.0, 10.0, 5.0, 10.0, 6.0, 13.0, 66.0, 695.0, 37.0, 16.0, 11.0, 3.0, 7.0, 10.0, 5.0, 7.0, 6.0, 4.0, 5.0, 4.0, 7.0, 5.0, 3.0, 4.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.1796875, -0.1738433837890625, -0.167999267578125, -0.1621551513671875, -0.15631103515625, -0.1504669189453125, -0.144622802734375, -0.1387786865234375, -0.1329345703125, -0.1270904541015625, -0.121246337890625, -0.1154022216796875, -0.10955810546875, -0.1037139892578125, -0.097869873046875, -0.0920257568359375, -0.086181640625, -0.0803375244140625, -0.074493408203125, -0.0686492919921875, -0.06280517578125, -0.0569610595703125, -0.051116943359375, -0.0452728271484375, -0.0394287109375, -0.0335845947265625, -0.027740478515625, -0.0218963623046875, -0.01605224609375, -0.0102081298828125, -0.004364013671875, 0.0014801025390625, 0.00732421875, 0.0131683349609375, 0.019012451171875, 0.0248565673828125, 0.03070068359375, 0.0365447998046875, 0.042388916015625, 0.0482330322265625, 0.0540771484375, 0.0599212646484375, 0.065765380859375, 0.0716094970703125, 0.07745361328125, 0.0832977294921875, 0.089141845703125, 0.0949859619140625, 0.100830078125, 0.1066741943359375, 0.112518310546875, 0.1183624267578125, 0.12420654296875, 0.1300506591796875, 0.135894775390625, 0.1417388916015625, 0.1475830078125, 0.1534271240234375, 0.159271240234375, 0.1651153564453125, 0.17095947265625, 0.1768035888671875, 0.182647705078125, 0.1884918212890625, 0.1943359375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 6.0, 6.0, 5.0, 14.0, 10.0, 13.0, 16.0, 19.0, 22.0, 32.0, 38.0, 52.0, 73.0, 131.0, 142.0, 231.0, 390.0, 708.0, 1444.0, 3245.0, 8794.0, 28421.0, 111789.0, 432265.0, 343017.0, 83297.0, 21988.0, 6842.0, 2717.0, 1212.0, 601.0, 346.0, 189.0, 122.0, 92.0, 62.0, 39.0, 46.0, 26.0, 17.0, 21.0, 16.0, 18.0, 7.0, 5.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 5.0], "bins": [-0.61474609375, -0.5971298217773438, -0.5795135498046875, -0.5618972778320312, -0.544281005859375, -0.5266647338867188, -0.5090484619140625, -0.49143218994140625, -0.47381591796875, -0.45619964599609375, -0.4385833740234375, -0.42096710205078125, -0.403350830078125, -0.38573455810546875, -0.3681182861328125, -0.35050201416015625, -0.3328857421875, -0.31526947021484375, -0.2976531982421875, -0.28003692626953125, -0.262420654296875, -0.24480438232421875, -0.2271881103515625, -0.20957183837890625, -0.19195556640625, -0.17433929443359375, -0.1567230224609375, -0.13910675048828125, -0.121490478515625, -0.10387420654296875, -0.0862579345703125, -0.06864166259765625, -0.051025390625, -0.03340911865234375, -0.0157928466796875, 0.00182342529296875, 0.019439697265625, 0.03705596923828125, 0.0546722412109375, 0.07228851318359375, 0.08990478515625, 0.10752105712890625, 0.1251373291015625, 0.14275360107421875, 0.160369873046875, 0.17798614501953125, 0.1956024169921875, 0.21321868896484375, 0.2308349609375, 0.24845123291015625, 0.2660675048828125, 0.28368377685546875, 0.301300048828125, 0.31891632080078125, 0.3365325927734375, 0.35414886474609375, 0.37176513671875, 0.38938140869140625, 0.4069976806640625, 0.42461395263671875, 0.442230224609375, 0.45984649658203125, 0.4774627685546875, 0.49507904052734375, 0.5126953125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 3.0, 9.0, 4.0, 4.0, 15.0, 17.0, 17.0, 12.0, 29.0, 23.0, 26.0, 19.0, 28.0, 46.0, 34.0, 27.0, 34.0, 32.0, 43.0, 40.0, 35.0, 40.0, 41.0, 29.0, 33.0, 56.0, 31.0, 37.0, 32.0, 38.0, 31.0, 26.0, 17.0, 21.0, 14.0, 20.0, 8.0, 5.0, 7.0, 7.0, 8.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.734375, -0.7100906372070312, -0.6858062744140625, -0.6615219116210938, -0.637237548828125, -0.6129531860351562, -0.5886688232421875, -0.5643844604492188, -0.54010009765625, -0.5158157348632812, -0.4915313720703125, -0.46724700927734375, -0.442962646484375, -0.41867828369140625, -0.3943939208984375, -0.37010955810546875, -0.3458251953125, -0.32154083251953125, -0.2972564697265625, -0.27297210693359375, -0.248687744140625, -0.22440338134765625, -0.2001190185546875, -0.17583465576171875, -0.15155029296875, -0.12726593017578125, -0.1029815673828125, -0.07869720458984375, -0.054412841796875, -0.03012847900390625, -0.0058441162109375, 0.01844024658203125, 0.042724609375, 0.06700897216796875, 0.0912933349609375, 0.11557769775390625, 0.139862060546875, 0.16414642333984375, 0.1884307861328125, 0.21271514892578125, 0.23699951171875, 0.26128387451171875, 0.2855682373046875, 0.30985260009765625, 0.334136962890625, 0.35842132568359375, 0.3827056884765625, 0.40699005126953125, 0.4312744140625, 0.45555877685546875, 0.4798431396484375, 0.5041275024414062, 0.528411865234375, 0.5526962280273438, 0.5769805908203125, 0.6012649536132812, 0.62554931640625, 0.6498336791992188, 0.6741180419921875, 0.6984024047851562, 0.722686767578125, 0.7469711303710938, 0.7712554931640625, 0.7955398559570312, 0.81982421875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 10.0, 15.0, 18.0, 53.0, 109.0, 249.0, 758.0, 2904.0, 20470.0, 653387.0, 353585.0, 13728.0, 2269.0, 636.0, 168.0, 96.0, 51.0, 22.0, 13.0, 3.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0283203125, -1.0025558471679688, -0.9767913818359375, -0.9510269165039062, -0.925262451171875, -0.8994979858398438, -0.8737335205078125, -0.8479690551757812, -0.82220458984375, -0.7964401245117188, -0.7706756591796875, -0.7449111938476562, -0.719146728515625, -0.6933822631835938, -0.6676177978515625, -0.6418533325195312, -0.6160888671875, -0.5903244018554688, -0.5645599365234375, -0.5387954711914062, -0.513031005859375, -0.48726654052734375, -0.4615020751953125, -0.43573760986328125, -0.40997314453125, -0.38420867919921875, -0.3584442138671875, -0.33267974853515625, -0.306915283203125, -0.28115081787109375, -0.2553863525390625, -0.22962188720703125, -0.203857421875, -0.17809295654296875, -0.1523284912109375, -0.12656402587890625, -0.100799560546875, -0.07503509521484375, -0.0492706298828125, -0.02350616455078125, 0.00225830078125, 0.02802276611328125, 0.0537872314453125, 0.07955169677734375, 0.105316162109375, 0.13108062744140625, 0.1568450927734375, 0.18260955810546875, 0.2083740234375, 0.23413848876953125, 0.2599029541015625, 0.28566741943359375, 0.311431884765625, 0.33719635009765625, 0.3629608154296875, 0.38872528076171875, 0.41448974609375, 0.44025421142578125, 0.4660186767578125, 0.49178314208984375, 0.517547607421875, 0.5433120727539062, 0.5690765380859375, 0.5948410034179688, 0.62060546875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 13.0, 15.0, 12.0, 17.0, 22.0, 38.0, 51.0, 56.0, 76.0, 90.0, 75.0, 85.0, 80.0, 83.0, 64.0, 39.0, 34.0, 34.0, 20.0, 22.0, 16.0, 6.0, 13.0, 12.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.45246696472168e-05, -4.3147243559360504e-05, -4.176981747150421e-05, -4.039239138364792e-05, -3.9014965295791626e-05, -3.763753920793533e-05, -3.626011312007904e-05, -3.488268703222275e-05, -3.3505260944366455e-05, -3.212783485651016e-05, -3.075040876865387e-05, -2.9372982680797577e-05, -2.7995556592941284e-05, -2.661813050508499e-05, -2.52407044172287e-05, -2.3863278329372406e-05, -2.2485852241516113e-05, -2.110842615365982e-05, -1.9731000065803528e-05, -1.8353573977947235e-05, -1.6976147890090942e-05, -1.559872180223465e-05, -1.4221295714378357e-05, -1.2843869626522064e-05, -1.1466443538665771e-05, -1.0089017450809479e-05, -8.711591362953186e-06, -7.334165275096893e-06, -5.956739187240601e-06, -4.579313099384308e-06, -3.201887011528015e-06, -1.8244609236717224e-06, -4.470348358154297e-07, 9.30391252040863e-07, 2.3078173398971558e-06, 3.6852434277534485e-06, 5.062669515609741e-06, 6.440095603466034e-06, 7.817521691322327e-06, 9.19494777917862e-06, 1.0572373867034912e-05, 1.1949799954891205e-05, 1.3327226042747498e-05, 1.470465213060379e-05, 1.6082078218460083e-05, 1.7459504306316376e-05, 1.883693039417267e-05, 2.021435648202896e-05, 2.1591782569885254e-05, 2.2969208657741547e-05, 2.434663474559784e-05, 2.5724060833454132e-05, 2.7101486921310425e-05, 2.8478913009166718e-05, 2.985633909702301e-05, 3.12337651848793e-05, 3.2611191272735596e-05, 3.398861736059189e-05, 3.536604344844818e-05, 3.6743469536304474e-05, 3.8120895624160767e-05, 3.949832171201706e-05, 4.087574779987335e-05, 4.2253173887729645e-05, 4.363059997558594e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 2.0, 3.0, 5.0, 6.0, 4.0, 14.0, 9.0, 18.0, 13.0, 44.0, 36.0, 65.0, 97.0, 113.0, 176.0, 309.0, 490.0, 897.0, 1711.0, 3871.0, 10147.0, 32946.0, 160604.0, 569324.0, 206676.0, 40369.0, 11761.0, 4458.0, 2008.0, 913.0, 506.0, 314.0, 212.0, 124.0, 93.0, 64.0, 47.0, 25.0, 14.0, 14.0, 13.0, 9.0, 9.0, 8.0, 2.0, 0.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.3076171875, -0.2972145080566406, -0.28681182861328125, -0.2764091491699219, -0.2660064697265625, -0.2556037902832031, -0.24520111083984375, -0.23479843139648438, -0.224395751953125, -0.21399307250976562, -0.20359039306640625, -0.19318771362304688, -0.1827850341796875, -0.17238235473632812, -0.16197967529296875, -0.15157699584960938, -0.14117431640625, -0.13077163696289062, -0.12036895751953125, -0.10996627807617188, -0.0995635986328125, -0.08916091918945312, -0.07875823974609375, -0.06835556030273438, -0.057952880859375, -0.047550201416015625, -0.03714752197265625, -0.026744842529296875, -0.0163421630859375, -0.005939483642578125, 0.00446319580078125, 0.014865875244140625, 0.0252685546875, 0.035671234130859375, 0.04607391357421875, 0.056476593017578125, 0.0668792724609375, 0.07728195190429688, 0.08768463134765625, 0.09808731079101562, 0.108489990234375, 0.11889266967773438, 0.12929534912109375, 0.13969802856445312, 0.1501007080078125, 0.16050338745117188, 0.17090606689453125, 0.18130874633789062, 0.19171142578125, 0.20211410522460938, 0.21251678466796875, 0.22291946411132812, 0.2333221435546875, 0.24372482299804688, 0.25412750244140625, 0.2645301818847656, 0.274932861328125, 0.2853355407714844, 0.29573822021484375, 0.3061408996582031, 0.3165435791015625, 0.3269462585449219, 0.33734893798828125, 0.3477516174316406, 0.358154296875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 2.0, 7.0, 4.0, 10.0, 17.0, 15.0, 25.0, 31.0, 29.0, 40.0, 58.0, 72.0, 71.0, 63.0, 90.0, 66.0, 71.0, 72.0, 57.0, 49.0, 29.0, 17.0, 24.0, 18.0, 20.0, 4.0, 7.0, 8.0, 6.0, 5.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.350830078125, -0.34069061279296875, -0.3305511474609375, -0.32041168212890625, -0.310272216796875, -0.30013275146484375, -0.2899932861328125, -0.27985382080078125, -0.26971435546875, -0.25957489013671875, -0.2494354248046875, -0.23929595947265625, -0.229156494140625, -0.21901702880859375, -0.2088775634765625, -0.19873809814453125, -0.1885986328125, -0.17845916748046875, -0.1683197021484375, -0.15818023681640625, -0.148040771484375, -0.13790130615234375, -0.1277618408203125, -0.11762237548828125, -0.10748291015625, -0.09734344482421875, -0.0872039794921875, -0.07706451416015625, -0.066925048828125, -0.05678558349609375, -0.0466461181640625, -0.03650665283203125, -0.0263671875, -0.01622772216796875, -0.0060882568359375, 0.00405120849609375, 0.014190673828125, 0.02433013916015625, 0.0344696044921875, 0.04460906982421875, 0.05474853515625, 0.06488800048828125, 0.0750274658203125, 0.08516693115234375, 0.095306396484375, 0.10544586181640625, 0.1155853271484375, 0.12572479248046875, 0.1358642578125, 0.14600372314453125, 0.1561431884765625, 0.16628265380859375, 0.176422119140625, 0.18656158447265625, 0.1967010498046875, 0.20684051513671875, 0.21697998046875, 0.22711944580078125, 0.2372589111328125, 0.24739837646484375, 0.257537841796875, 0.26767730712890625, 0.2778167724609375, 0.28795623779296875, 0.298095703125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 7.0, 15.0, 21.0, 75.0, 266.0, 438.0, 126.0, 27.0, 15.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.840322494506836, -13.436375617980957, -13.032429695129395, -12.628482818603516, -12.224535942077637, -11.820589065551758, -11.416643142700195, -11.012696266174316, -10.608749389648438, -10.204802513122559, -9.800856590270996, -9.396909713745117, -8.992962837219238, -8.58901596069336, -8.185070037841797, -7.781123161315918, -7.3771772384643555, -6.973230838775635, -6.569283962249756, -6.165337562561035, -5.761390686035156, -5.3574442863464355, -4.953497886657715, -4.549551010131836, -4.145604610443115, -3.7416579723358154, -3.3377113342285156, -2.933764934539795, -2.529818296432495, -2.1258716583251953, -1.7219252586364746, -1.3179786205291748, -0.914031982421875, -0.51008540391922, -0.10613882541656494, 0.2978076934814453, 0.7017543315887451, 1.105700969696045, 1.5096473693847656, 1.9135940074920654, 2.3175406455993652, 2.721487283706665, 3.125433921813965, 3.5293803215026855, 3.9333269596099854, 4.337273597717285, 4.741219997406006, 5.145166397094727, 5.5491132736206055, 5.953059673309326, 6.357006549835205, 6.760952949523926, 7.164899826049805, 7.568846225738525, 7.972792625427246, 8.376739501953125, 8.780685424804688, 9.184632301330566, 9.588578224182129, 9.992525100708008, 10.396471977233887, 10.800418853759766, 11.204364776611328, 11.608311653137207, 12.012258529663086]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 6.0, 6.0, 4.0, 5.0, 6.0, 8.0, 7.0, 18.0, 28.0, 41.0, 71.0, 118.0, 148.0, 146.0, 149.0, 84.0, 53.0, 21.0, 17.0, 10.0, 10.0, 7.0, 6.0, 4.0, 2.0, 4.0, 2.0, 4.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.44284439086914, -12.981671333312988, -12.52049732208252, -12.059324264526367, -11.598150253295898, -11.136977195739746, -10.675803184509277, -10.214630126953125, -9.753456115722656, -9.292283058166504, -8.831109046936035, -8.369935989379883, -7.908761978149414, -7.447588920593262, -6.986414909362793, -6.525241851806641, -6.06406831741333, -5.6028947830200195, -5.141721248626709, -4.680547714233398, -4.219374179840088, -3.7582008838653564, -3.297027349472046, -2.8358538150787354, -2.374680280685425, -1.9135067462921143, -1.4523332118988037, -0.9911597967147827, -0.5299862623214722, -0.06881284713745117, 0.3923606872558594, 0.8535342216491699, 1.3147077560424805, 1.775881290435791, 2.2370548248291016, 2.698228359222412, 3.1594018936157227, 3.620575189590454, 4.081748962402344, 4.542922019958496, 5.004096031188965, 5.465269565582275, 5.926443099975586, 6.3876166343688965, 6.848790168762207, 7.309963226318359, 7.771137237548828, 8.23231029510498, 8.693483352661133, 9.154656410217285, 9.615830421447754, 10.077003479003906, 10.538177490234375, 10.999350547790527, 11.460524559020996, 11.921697616577148, 12.382871627807617, 12.84404468536377, 13.305218696594238, 13.76639175415039, 14.22756576538086, 14.688738822937012, 15.14991283416748, 15.611085891723633, 16.0722599029541]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 3.0, 8.0, 9.0, 13.0, 18.0, 21.0, 32.0, 38.0, 58.0, 95.0, 126.0, 144.0, 253.0, 354.0, 596.0, 931.0, 1563.0, 2755.0, 5269.0, 12040.0, 36951.0, 3846309.0, 237025.0, 27406.0, 10640.0, 5064.0, 2635.0, 1440.0, 893.0, 532.0, 346.0, 226.0, 141.0, 98.0, 78.0, 50.0, 38.0, 19.0, 18.0, 19.0, 6.0, 7.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5419921875, -1.4964752197265625, -1.450958251953125, -1.4054412841796875, -1.35992431640625, -1.3144073486328125, -1.268890380859375, -1.2233734130859375, -1.1778564453125, -1.1323394775390625, -1.086822509765625, -1.0413055419921875, -0.99578857421875, -0.9502716064453125, -0.904754638671875, -0.8592376708984375, -0.813720703125, -0.7682037353515625, -0.722686767578125, -0.6771697998046875, -0.63165283203125, -0.5861358642578125, -0.540618896484375, -0.4951019287109375, -0.4495849609375, -0.4040679931640625, -0.358551025390625, -0.3130340576171875, -0.26751708984375, -0.2220001220703125, -0.176483154296875, -0.1309661865234375, -0.08544921875, -0.0399322509765625, 0.005584716796875, 0.0511016845703125, 0.09661865234375, 0.1421356201171875, 0.187652587890625, 0.2331695556640625, 0.2786865234375, 0.3242034912109375, 0.369720458984375, 0.4152374267578125, 0.46075439453125, 0.5062713623046875, 0.551788330078125, 0.5973052978515625, 0.642822265625, 0.6883392333984375, 0.733856201171875, 0.7793731689453125, 0.82489013671875, 0.8704071044921875, 0.915924072265625, 0.9614410400390625, 1.0069580078125, 1.0524749755859375, 1.097991943359375, 1.1435089111328125, 1.18902587890625, 1.2345428466796875, 1.280059814453125, 1.3255767822265625, 1.37109375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 4.0, 2.0, 5.0, 3.0, 3.0, 3.0, 3.0, 5.0, 9.0, 12.0, 8.0, 11.0, 12.0, 63.0, 227.0, 371.0, 121.0, 34.0, 18.0, 10.0, 8.0, 9.0, 7.0, 7.0, 4.0, 12.0, 1.0, 10.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.168212890625, -0.1633129119873047, -0.15841293334960938, -0.15351295471191406, -0.14861297607421875, -0.14371299743652344, -0.13881301879882812, -0.1339130401611328, -0.1290130615234375, -0.12411308288574219, -0.11921310424804688, -0.11431312561035156, -0.10941314697265625, -0.10451316833496094, -0.09961318969726562, -0.09471321105957031, -0.089813232421875, -0.08491325378417969, -0.08001327514648438, -0.07511329650878906, -0.07021331787109375, -0.06531333923339844, -0.060413360595703125, -0.05551338195800781, -0.0506134033203125, -0.04571342468261719, -0.040813446044921875, -0.03591346740722656, -0.03101348876953125, -0.026113510131835938, -0.021213531494140625, -0.016313552856445312, -0.01141357421875, -0.0065135955810546875, -0.001613616943359375, 0.0032863616943359375, 0.00818634033203125, 0.013086318969726562, 0.017986297607421875, 0.022886276245117188, 0.0277862548828125, 0.03268623352050781, 0.037586212158203125, 0.04248619079589844, 0.04738616943359375, 0.05228614807128906, 0.057186126708984375, 0.06208610534667969, 0.066986083984375, 0.07188606262207031, 0.07678604125976562, 0.08168601989746094, 0.08658599853515625, 0.09148597717285156, 0.09638595581054688, 0.10128593444824219, 0.1061859130859375, 0.11108589172363281, 0.11598587036132812, 0.12088584899902344, 0.12578582763671875, 0.13068580627441406, 0.13558578491210938, 0.1404857635498047, 0.1453857421875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 4.0, 6.0, 9.0, 15.0, 12.0, 21.0, 23.0, 39.0, 68.0, 102.0, 164.0, 268.0, 556.0, 1168.0, 2461.0, 6221.0, 19372.0, 85812.0, 2659404.0, 1309580.0, 79688.0, 18514.0, 5968.0, 2359.0, 1090.0, 569.0, 310.0, 162.0, 104.0, 67.0, 50.0, 31.0, 13.0, 14.0, 13.0, 5.0, 7.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1708984375, -1.1374282836914062, -1.1039581298828125, -1.0704879760742188, -1.037017822265625, -1.0035476684570312, -0.9700775146484375, -0.9366073608398438, -0.90313720703125, -0.8696670532226562, -0.8361968994140625, -0.8027267456054688, -0.769256591796875, -0.7357864379882812, -0.7023162841796875, -0.6688461303710938, -0.6353759765625, -0.6019058227539062, -0.5684356689453125, -0.5349655151367188, -0.501495361328125, -0.46802520751953125, -0.4345550537109375, -0.40108489990234375, -0.36761474609375, -0.33414459228515625, -0.3006744384765625, -0.26720428466796875, -0.233734130859375, -0.20026397705078125, -0.1667938232421875, -0.13332366943359375, -0.099853515625, -0.06638336181640625, -0.0329132080078125, 0.00055694580078125, 0.034027099609375, 0.06749725341796875, 0.1009674072265625, 0.13443756103515625, 0.16790771484375, 0.20137786865234375, 0.2348480224609375, 0.26831817626953125, 0.301788330078125, 0.33525848388671875, 0.3687286376953125, 0.40219879150390625, 0.4356689453125, 0.46913909912109375, 0.5026092529296875, 0.5360794067382812, 0.569549560546875, 0.6030197143554688, 0.6364898681640625, 0.6699600219726562, 0.70343017578125, 0.7369003295898438, 0.7703704833984375, 0.8038406372070312, 0.837310791015625, 0.8707809448242188, 0.9042510986328125, 0.9377212524414062, 0.97119140625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 10.0, 4.0, 7.0, 12.0, 17.0, 18.0, 20.0, 27.0, 33.0, 51.0, 50.0, 84.0, 118.0, 165.0, 318.0, 1802.0, 624.0, 215.0, 123.0, 77.0, 70.0, 41.0, 35.0, 32.0, 25.0, 23.0, 8.0, 15.0, 5.0, 13.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.161865234375, -0.15746784210205078, -0.15307044982910156, -0.14867305755615234, -0.14427566528320312, -0.1398782730102539, -0.1354808807373047, -0.13108348846435547, -0.12668609619140625, -0.12228870391845703, -0.11789131164550781, -0.1134939193725586, -0.10909652709960938, -0.10469913482666016, -0.10030174255371094, -0.09590435028076172, -0.0915069580078125, -0.08710956573486328, -0.08271217346191406, -0.07831478118896484, -0.07391738891601562, -0.0695199966430664, -0.06512260437011719, -0.06072521209716797, -0.05632781982421875, -0.05193042755126953, -0.04753303527832031, -0.043135643005371094, -0.038738250732421875, -0.034340858459472656, -0.029943466186523438, -0.02554607391357422, -0.021148681640625, -0.01675128936767578, -0.012353897094726562, -0.007956504821777344, -0.003559112548828125, 0.0008382797241210938, 0.0052356719970703125, 0.009633064270019531, 0.01403045654296875, 0.01842784881591797, 0.022825241088867188, 0.027222633361816406, 0.031620025634765625, 0.036017417907714844, 0.04041481018066406, 0.04481220245361328, 0.0492095947265625, 0.05360698699951172, 0.05800437927246094, 0.062401771545410156, 0.06679916381835938, 0.0711965560913086, 0.07559394836425781, 0.07999134063720703, 0.08438873291015625, 0.08878612518310547, 0.09318351745605469, 0.0975809097290039, 0.10197830200195312, 0.10637569427490234, 0.11077308654785156, 0.11517047882080078, 0.11956787109375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 14.0, 60.0, 193.0, 339.0, 259.0, 76.0, 28.0, 12.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4995644092559814, -1.4386417865753174, -1.3777192831039429, -1.3167966604232788, -1.2558740377426147, -1.1949515342712402, -1.1340289115905762, -1.073106288909912, -1.012183666229248, -0.9512611031532288, -0.8903384804725647, -0.8294159173965454, -0.7684932947158813, -0.7075707316398621, -0.6466481685638428, -0.5857255458831787, -0.5248029828071594, -0.46388038992881775, -0.4029577970504761, -0.3420352339744568, -0.2811126112937927, -0.22019004821777344, -0.15926745533943176, -0.09834486246109009, -0.03742226958274841, 0.023500319570302963, 0.08442290872335434, 0.14534549415111542, 0.2062680870294571, 0.2671906650066376, 0.32811325788497925, 0.3890358507633209, 0.4499584436416626, 0.5108810067176819, 0.571803629398346, 0.6327261924743652, 0.6936488151550293, 0.7545713782310486, 0.8154939413070679, 0.8764165639877319, 0.937339186668396, 0.9982617497444153, 1.0591843128204346, 1.1201069355010986, 1.1810295581817627, 1.2419521808624268, 1.3028746843338013, 1.3637973070144653, 1.4247198104858398, 1.485642433166504, 1.5465649366378784, 1.6074875593185425, 1.6684101819992065, 1.729332685470581, 1.7902553081512451, 1.8511779308319092, 1.9121005535125732, 1.9730231761932373, 2.0339457988739014, 2.0948684215545654, 2.1557908058166504, 2.2167134284973145, 2.2776360511779785, 2.3385586738586426, 2.3994812965393066]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 12.0, 15.0, 10.0, 22.0, 22.0, 19.0, 36.0, 42.0, 34.0, 51.0, 57.0, 63.0, 55.0, 54.0, 54.0, 43.0, 53.0, 47.0, 55.0, 34.0, 36.0, 33.0, 27.0, 26.0, 16.0, 17.0, 16.0, 6.0, 8.0, 6.0, 6.0, 1.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.6652513146400452, -0.6455979347229004, -0.6259444952011108, -0.6062910556793213, -0.5866376757621765, -0.5669842958450317, -0.5473308563232422, -0.5276774168014526, -0.5080240368843079, -0.4883706271648407, -0.46871721744537354, -0.44906380772590637, -0.4294103980064392, -0.40975698828697205, -0.3901035785675049, -0.3704501688480377, -0.35079675912857056, -0.3311433494091034, -0.31148993968963623, -0.29183652997016907, -0.2721831202507019, -0.25252971053123474, -0.23287630081176758, -0.21322289109230042, -0.19356948137283325, -0.1739160716533661, -0.15426266193389893, -0.13460925221443176, -0.1149558424949646, -0.09530243277549744, -0.07564902305603027, -0.05599561333656311, -0.03634214401245117, -0.01668873429298401, 0.0029646754264831543, 0.022618085145950317, 0.04227149486541748, 0.061924904584884644, 0.0815783143043518, 0.10123172402381897, 0.12088513374328613, 0.1405385434627533, 0.16019195318222046, 0.17984536290168762, 0.19949877262115479, 0.21915218234062195, 0.2388055920600891, 0.2584590017795563, 0.27811241149902344, 0.2977658212184906, 0.31741923093795776, 0.3370726406574249, 0.3567260503768921, 0.37637946009635925, 0.3960328698158264, 0.4156862795352936, 0.43533968925476074, 0.4549930989742279, 0.47464650869369507, 0.49429991841316223, 0.5139533281326294, 0.533606767654419, 0.5532601475715637, 0.5729135274887085, 0.592566967010498]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 8.0, 21.0, 22.0, 28.0, 47.0, 76.0, 132.0, 251.0, 438.0, 944.0, 1839.0, 4215.0, 11377.0, 39124.0, 839642.0, 117042.0, 20893.0, 6780.0, 2831.0, 1354.0, 673.0, 338.0, 188.0, 110.0, 55.0, 44.0, 35.0, 17.0, 14.0, 4.0, 6.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4287109375, -1.38372802734375, -1.3387451171875, -1.29376220703125, -1.248779296875, -1.20379638671875, -1.1588134765625, -1.11383056640625, -1.06884765625, -1.02386474609375, -0.9788818359375, -0.93389892578125, -0.888916015625, -0.84393310546875, -0.7989501953125, -0.75396728515625, -0.708984375, -0.66400146484375, -0.6190185546875, -0.57403564453125, -0.529052734375, -0.48406982421875, -0.4390869140625, -0.39410400390625, -0.34912109375, -0.30413818359375, -0.2591552734375, -0.21417236328125, -0.169189453125, -0.12420654296875, -0.0792236328125, -0.03424072265625, 0.0107421875, 0.05572509765625, 0.1007080078125, 0.14569091796875, 0.190673828125, 0.23565673828125, 0.2806396484375, 0.32562255859375, 0.37060546875, 0.41558837890625, 0.4605712890625, 0.50555419921875, 0.550537109375, 0.59552001953125, 0.6405029296875, 0.68548583984375, 0.73046875, 0.77545166015625, 0.8204345703125, 0.86541748046875, 0.910400390625, 0.95538330078125, 1.0003662109375, 1.04534912109375, 1.09033203125, 1.13531494140625, 1.1802978515625, 1.22528076171875, 1.270263671875, 1.31524658203125, 1.3602294921875, 1.40521240234375, 1.4501953125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 5.0, 4.0, 2.0, 2.0, 7.0, 7.0, 6.0, 5.0, 13.0, 9.0, 20.0, 59.0, 207.0, 303.0, 189.0, 48.0, 30.0, 9.0, 12.0, 8.0, 10.0, 5.0, 5.0, 3.0, 7.0, 7.0, 4.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1712646484375, -0.1661548614501953, -0.16104507446289062, -0.15593528747558594, -0.15082550048828125, -0.14571571350097656, -0.14060592651367188, -0.1354961395263672, -0.1303863525390625, -0.1252765655517578, -0.12016677856445312, -0.11505699157714844, -0.10994720458984375, -0.10483741760253906, -0.09972763061523438, -0.09461784362792969, -0.089508056640625, -0.08439826965332031, -0.07928848266601562, -0.07417869567871094, -0.06906890869140625, -0.06395912170410156, -0.058849334716796875, -0.05373954772949219, -0.0486297607421875, -0.04351997375488281, -0.038410186767578125, -0.03330039978027344, -0.02819061279296875, -0.023080825805664062, -0.017971038818359375, -0.012861251831054688, -0.00775146484375, -0.0026416778564453125, 0.002468109130859375, 0.0075778961181640625, 0.01268768310546875, 0.017797470092773438, 0.022907257080078125, 0.028017044067382812, 0.0331268310546875, 0.03823661804199219, 0.043346405029296875, 0.04845619201660156, 0.05356597900390625, 0.05867576599121094, 0.06378555297851562, 0.06889533996582031, 0.074005126953125, 0.07911491394042969, 0.08422470092773438, 0.08933448791503906, 0.09444427490234375, 0.09955406188964844, 0.10466384887695312, 0.10977363586425781, 0.1148834228515625, 0.11999320983886719, 0.12510299682617188, 0.13021278381347656, 0.13532257080078125, 0.14043235778808594, 0.14554214477539062, 0.1506519317626953, 0.15576171875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 11.0, 14.0, 13.0, 16.0, 22.0, 48.0, 69.0, 96.0, 151.0, 263.0, 575.0, 1146.0, 2771.0, 7978.0, 31403.0, 245362.0, 644140.0, 91394.0, 15189.0, 4523.0, 1672.0, 782.0, 358.0, 193.0, 123.0, 76.0, 40.0, 37.0, 17.0, 17.0, 15.0, 10.0, 6.0, 8.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84912109375, -0.8219757080078125, -0.794830322265625, -0.7676849365234375, -0.74053955078125, -0.7133941650390625, -0.686248779296875, -0.6591033935546875, -0.6319580078125, -0.6048126220703125, -0.577667236328125, -0.5505218505859375, -0.52337646484375, -0.4962310791015625, -0.469085693359375, -0.4419403076171875, -0.414794921875, -0.3876495361328125, -0.360504150390625, -0.3333587646484375, -0.30621337890625, -0.2790679931640625, -0.251922607421875, -0.2247772216796875, -0.1976318359375, -0.1704864501953125, -0.143341064453125, -0.1161956787109375, -0.08905029296875, -0.0619049072265625, -0.034759521484375, -0.0076141357421875, 0.01953125, 0.0466766357421875, 0.073822021484375, 0.1009674072265625, 0.12811279296875, 0.1552581787109375, 0.182403564453125, 0.2095489501953125, 0.2366943359375, 0.2638397216796875, 0.290985107421875, 0.3181304931640625, 0.34527587890625, 0.3724212646484375, 0.399566650390625, 0.4267120361328125, 0.453857421875, 0.4810028076171875, 0.508148193359375, 0.5352935791015625, 0.56243896484375, 0.5895843505859375, 0.616729736328125, 0.6438751220703125, 0.6710205078125, 0.6981658935546875, 0.725311279296875, 0.7524566650390625, 0.77960205078125, 0.8067474365234375, 0.833892822265625, 0.8610382080078125, 0.88818359375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 9.0, 8.0, 9.0, 9.0, 16.0, 12.0, 13.0, 15.0, 34.0, 22.0, 43.0, 30.0, 39.0, 36.0, 39.0, 49.0, 60.0, 43.0, 59.0, 50.0, 40.0, 56.0, 52.0, 40.0, 35.0, 29.0, 30.0, 29.0, 17.0, 16.0, 15.0, 13.0, 7.0, 5.0, 3.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.59521484375, -0.579803466796875, -0.56439208984375, -0.548980712890625, -0.5335693359375, -0.518157958984375, -0.50274658203125, -0.487335205078125, -0.471923828125, -0.456512451171875, -0.44110107421875, -0.425689697265625, -0.4102783203125, -0.394866943359375, -0.37945556640625, -0.364044189453125, -0.3486328125, -0.333221435546875, -0.31781005859375, -0.302398681640625, -0.2869873046875, -0.271575927734375, -0.25616455078125, -0.240753173828125, -0.225341796875, -0.209930419921875, -0.19451904296875, -0.179107666015625, -0.1636962890625, -0.148284912109375, -0.13287353515625, -0.117462158203125, -0.10205078125, -0.086639404296875, -0.07122802734375, -0.055816650390625, -0.0404052734375, -0.024993896484375, -0.00958251953125, 0.005828857421875, 0.021240234375, 0.036651611328125, 0.05206298828125, 0.067474365234375, 0.0828857421875, 0.098297119140625, 0.11370849609375, 0.129119873046875, 0.14453125, 0.159942626953125, 0.17535400390625, 0.190765380859375, 0.2061767578125, 0.221588134765625, 0.23699951171875, 0.252410888671875, 0.267822265625, 0.283233642578125, 0.29864501953125, 0.314056396484375, 0.3294677734375, 0.344879150390625, 0.36029052734375, 0.375701904296875, 0.39111328125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 6.0, 3.0, 12.0, 10.0, 9.0, 18.0, 31.0, 45.0, 83.0, 161.0, 277.0, 511.0, 1106.0, 2760.0, 8743.0, 42152.0, 348148.0, 549835.0, 75026.0, 13104.0, 3682.0, 1397.0, 617.0, 328.0, 186.0, 99.0, 76.0, 37.0, 24.0, 20.0, 16.0, 7.0, 9.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67626953125, -0.656463623046875, -0.63665771484375, -0.616851806640625, -0.5970458984375, -0.577239990234375, -0.55743408203125, -0.537628173828125, -0.517822265625, -0.498016357421875, -0.47821044921875, -0.458404541015625, -0.4385986328125, -0.418792724609375, -0.39898681640625, -0.379180908203125, -0.359375, -0.339569091796875, -0.31976318359375, -0.299957275390625, -0.2801513671875, -0.260345458984375, -0.24053955078125, -0.220733642578125, -0.200927734375, -0.181121826171875, -0.16131591796875, -0.141510009765625, -0.1217041015625, -0.101898193359375, -0.08209228515625, -0.062286376953125, -0.04248046875, -0.022674560546875, -0.00286865234375, 0.016937255859375, 0.0367431640625, 0.056549072265625, 0.07635498046875, 0.096160888671875, 0.115966796875, 0.135772705078125, 0.15557861328125, 0.175384521484375, 0.1951904296875, 0.214996337890625, 0.23480224609375, 0.254608154296875, 0.2744140625, 0.294219970703125, 0.31402587890625, 0.333831787109375, 0.3536376953125, 0.373443603515625, 0.39324951171875, 0.413055419921875, 0.432861328125, 0.452667236328125, 0.47247314453125, 0.492279052734375, 0.5120849609375, 0.531890869140625, 0.55169677734375, 0.571502685546875, 0.59130859375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 6.0, 7.0, 11.0, 12.0, 9.0, 15.0, 19.0, 27.0, 46.0, 47.0, 55.0, 58.0, 82.0, 102.0, 87.0, 72.0, 69.0, 71.0, 49.0, 33.0, 20.0, 28.0, 19.0, 9.0, 9.0, 10.0, 7.0, 5.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.069110870361328e-05, -6.861146539449692e-05, -6.653182208538055e-05, -6.445217877626419e-05, -6.237253546714783e-05, -6.0292892158031464e-05, -5.82132488489151e-05, -5.6133605539798737e-05, -5.405396223068237e-05, -5.197431892156601e-05, -4.9894675612449646e-05, -4.781503230333328e-05, -4.573538899421692e-05, -4.3655745685100555e-05, -4.157610237598419e-05, -3.949645906686783e-05, -3.7416815757751465e-05, -3.53371724486351e-05, -3.325752913951874e-05, -3.1177885830402374e-05, -2.909824252128601e-05, -2.7018599212169647e-05, -2.4938955903053284e-05, -2.285931259393692e-05, -2.0779669284820557e-05, -1.8700025975704193e-05, -1.662038266658783e-05, -1.4540739357471466e-05, -1.2461096048355103e-05, -1.0381452739238739e-05, -8.301809430122375e-06, -6.222166121006012e-06, -4.1425228118896484e-06, -2.062879502773285e-06, 1.6763806343078613e-08, 2.096407115459442e-06, 4.176050424575806e-06, 6.255693733692169e-06, 8.335337042808533e-06, 1.0414980351924896e-05, 1.249462366104126e-05, 1.4574266970157623e-05, 1.6653910279273987e-05, 1.873355358839035e-05, 2.0813196897506714e-05, 2.2892840206623077e-05, 2.497248351573944e-05, 2.7052126824855804e-05, 2.9131770133972168e-05, 3.121141344308853e-05, 3.3291056752204895e-05, 3.537070006132126e-05, 3.745034337043762e-05, 3.9529986679553986e-05, 4.160962998867035e-05, 4.368927329778671e-05, 4.5768916606903076e-05, 4.784855991601944e-05, 4.99282032251358e-05, 5.200784653425217e-05, 5.408748984336853e-05, 5.6167133152484894e-05, 5.824677646160126e-05, 6.032641977071762e-05, 6.240606307983398e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 3.0, 5.0, 8.0, 8.0, 13.0, 18.0, 35.0, 52.0, 59.0, 105.0, 194.0, 323.0, 626.0, 1280.0, 3049.0, 8466.0, 29954.0, 145879.0, 517867.0, 267417.0, 52431.0, 12855.0, 4341.0, 1686.0, 820.0, 433.0, 245.0, 128.0, 76.0, 60.0, 31.0, 22.0, 21.0, 12.0, 10.0, 4.0, 8.0, 6.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5224609375, -0.5069503784179688, -0.4914398193359375, -0.47592926025390625, -0.460418701171875, -0.44490814208984375, -0.4293975830078125, -0.41388702392578125, -0.39837646484375, -0.38286590576171875, -0.3673553466796875, -0.35184478759765625, -0.336334228515625, -0.32082366943359375, -0.3053131103515625, -0.28980255126953125, -0.2742919921875, -0.25878143310546875, -0.2432708740234375, -0.22776031494140625, -0.212249755859375, -0.19673919677734375, -0.1812286376953125, -0.16571807861328125, -0.15020751953125, -0.13469696044921875, -0.1191864013671875, -0.10367584228515625, -0.088165283203125, -0.07265472412109375, -0.0571441650390625, -0.04163360595703125, -0.026123046875, -0.01061248779296875, 0.0048980712890625, 0.02040863037109375, 0.035919189453125, 0.05142974853515625, 0.0669403076171875, 0.08245086669921875, 0.09796142578125, 0.11347198486328125, 0.1289825439453125, 0.14449310302734375, 0.160003662109375, 0.17551422119140625, 0.1910247802734375, 0.20653533935546875, 0.2220458984375, 0.23755645751953125, 0.2530670166015625, 0.26857757568359375, 0.284088134765625, 0.29959869384765625, 0.3151092529296875, 0.33061981201171875, 0.34613037109375, 0.36164093017578125, 0.3771514892578125, 0.39266204833984375, 0.408172607421875, 0.42368316650390625, 0.4391937255859375, 0.45470428466796875, 0.47021484375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 3.0, 6.0, 4.0, 9.0, 8.0, 12.0, 15.0, 15.0, 15.0, 31.0, 35.0, 46.0, 34.0, 59.0, 63.0, 64.0, 62.0, 54.0, 56.0, 50.0, 53.0, 50.0, 38.0, 33.0, 32.0, 31.0, 27.0, 14.0, 21.0, 13.0, 15.0, 17.0, 6.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2021484375, -0.19418716430664062, -0.18622589111328125, -0.17826461791992188, -0.1703033447265625, -0.16234207153320312, -0.15438079833984375, -0.14641952514648438, -0.138458251953125, -0.13049697875976562, -0.12253570556640625, -0.11457443237304688, -0.1066131591796875, -0.09865188598632812, -0.09069061279296875, -0.08272933959960938, -0.07476806640625, -0.06680679321289062, -0.05884552001953125, -0.050884246826171875, -0.0429229736328125, -0.034961700439453125, -0.02700042724609375, -0.019039154052734375, -0.011077880859375, -0.003116607666015625, 0.00484466552734375, 0.012805938720703125, 0.0207672119140625, 0.028728485107421875, 0.03668975830078125, 0.044651031494140625, 0.0526123046875, 0.060573577880859375, 0.06853485107421875, 0.07649612426757812, 0.0844573974609375, 0.09241867065429688, 0.10037994384765625, 0.10834121704101562, 0.116302490234375, 0.12426376342773438, 0.13222503662109375, 0.14018630981445312, 0.1481475830078125, 0.15610885620117188, 0.16407012939453125, 0.17203140258789062, 0.17999267578125, 0.18795394897460938, 0.19591522216796875, 0.20387649536132812, 0.2118377685546875, 0.21979904174804688, 0.22776031494140625, 0.23572158813476562, 0.243682861328125, 0.2516441345214844, 0.25960540771484375, 0.2675666809082031, 0.2755279541015625, 0.2834892272949219, 0.29145050048828125, 0.2994117736816406, 0.307373046875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 7.0, 17.0, 19.0, 50.0, 92.0, 206.0, 244.0, 188.0, 91.0, 35.0, 20.0, 16.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.619997501373291, -5.465272903442383, -5.310548305511475, -5.155823707580566, -5.001099109649658, -4.84637451171875, -4.691649913787842, -4.536925315856934, -4.382201194763184, -4.227476596832275, -4.072751998901367, -3.918027400970459, -3.763302803039551, -3.6085782051086426, -3.4538538455963135, -3.2991292476654053, -3.144404411315918, -2.9896798133850098, -2.8349552154541016, -2.6802306175231934, -2.525506019592285, -2.370781421661377, -2.216057062149048, -2.0613324642181396, -1.9066078662872314, -1.7518832683563232, -1.597158670425415, -1.4424341917037964, -1.2877095937728882, -1.13298499584198, -0.9782604575157166, -0.8235359191894531, -0.6688108444213867, -0.5140862464904785, -0.3593617081642151, -0.20463714003562927, -0.04991257190704346, 0.10481202602386475, 0.2595365643501282, 0.4142611026763916, 0.5689857006072998, 0.723710298538208, 0.8784348368644714, 1.0331593751907349, 1.187883973121643, 1.3426085710525513, 1.49733304977417, 1.6520576477050781, 1.8067822456359863, 1.9615068435668945, 2.1162314414978027, 2.270956039428711, 2.425680637359619, 2.5804052352905273, 2.7351295948028564, 2.8898541927337646, 3.044578790664673, 3.199303388595581, 3.3540279865264893, 3.5087525844573975, 3.6634769439697266, 3.8182015419006348, 3.972926139831543, 4.127650737762451, 4.282375335693359]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 8.0, 4.0, 4.0, 3.0, 4.0, 11.0, 6.0, 14.0, 23.0, 24.0, 41.0, 52.0, 88.0, 74.0, 112.0, 91.0, 100.0, 75.0, 63.0, 51.0, 37.0, 34.0, 24.0, 15.0, 10.0, 14.0, 9.0, 6.0, 0.0, 1.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.259364604949951, -5.104634761810303, -4.949904918670654, -4.795175075531006, -4.640445232391357, -4.485715389251709, -4.3309855461120605, -4.17625617980957, -4.021526336669922, -3.8667964935302734, -3.712066650390625, -3.5573368072509766, -3.402606964111328, -3.2478771209716797, -3.0931475162506104, -2.938417673110962, -2.7836875915527344, -2.628957748413086, -2.4742279052734375, -2.319498062133789, -2.1647682189941406, -2.010038375854492, -1.8553087711334229, -1.7005789279937744, -1.545849084854126, -1.3911192417144775, -1.236389398574829, -1.0816596746444702, -0.9269298315048218, -0.7721999883651733, -0.6174702048301697, -0.462740421295166, -0.3080110549926758, -0.15328124165534973, 0.0014485716819763184, 0.15617838501930237, 0.3109081983566284, 0.46563804149627686, 0.6203678250312805, 0.7750976085662842, 0.9298274517059326, 1.084557294845581, 1.2392871379852295, 1.3940168619155884, 1.5487467050552368, 1.7034765481948853, 1.8582062721252441, 2.0129361152648926, 2.167665958404541, 2.3223958015441895, 2.477125644683838, 2.6318554878234863, 2.7865853309631348, 2.941315174102783, 3.0960447788238525, 3.250774621963501, 3.4055044651031494, 3.560234308242798, 3.7149641513824463, 3.8696939945220947, 4.024423599243164, 4.1791534423828125, 4.333883285522461, 4.488613128662109, 4.643342971801758]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 9.0, 9.0, 16.0, 9.0, 14.0, 17.0, 26.0, 42.0, 47.0, 32.0, 80.0, 67.0, 97.0, 141.0, 190.0, 288.0, 396.0, 466.0, 689.0, 1069.0, 1796.0, 3523.0, 9024.0, 47372.0, 4029121.0, 77397.0, 12199.0, 4174.0, 2056.0, 1258.0, 780.0, 527.0, 384.0, 253.0, 189.0, 128.0, 105.0, 68.0, 58.0, 48.0, 39.0, 18.0, 20.0, 13.0, 7.0, 8.0, 2.0, 4.0, 4.0, 2.0, 3.0], "bins": [-2.73828125, -2.665435791015625, -2.59259033203125, -2.519744873046875, -2.4468994140625, -2.374053955078125, -2.30120849609375, -2.228363037109375, -2.155517578125, -2.082672119140625, -2.00982666015625, -1.936981201171875, -1.8641357421875, -1.791290283203125, -1.71844482421875, -1.645599365234375, -1.57275390625, -1.499908447265625, -1.42706298828125, -1.354217529296875, -1.2813720703125, -1.208526611328125, -1.13568115234375, -1.062835693359375, -0.989990234375, -0.917144775390625, -0.84429931640625, -0.771453857421875, -0.6986083984375, -0.625762939453125, -0.55291748046875, -0.480072021484375, -0.4072265625, -0.334381103515625, -0.26153564453125, -0.188690185546875, -0.1158447265625, -0.042999267578125, 0.02984619140625, 0.102691650390625, 0.175537109375, 0.248382568359375, 0.32122802734375, 0.394073486328125, 0.4669189453125, 0.539764404296875, 0.61260986328125, 0.685455322265625, 0.75830078125, 0.831146240234375, 0.90399169921875, 0.976837158203125, 1.0496826171875, 1.122528076171875, 1.19537353515625, 1.268218994140625, 1.341064453125, 1.413909912109375, 1.48675537109375, 1.559600830078125, 1.6324462890625, 1.705291748046875, 1.77813720703125, 1.850982666015625, 1.923828125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 5.0, 2.0, 5.0, 2.0, 0.0, 11.0, 11.0, 14.0, 14.0, 46.0, 102.0, 238.0, 243.0, 151.0, 63.0, 15.0, 14.0, 13.0, 7.0, 4.0, 6.0, 6.0, 2.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.17431640625, -0.16935348510742188, -0.16439056396484375, -0.15942764282226562, -0.1544647216796875, -0.14950180053710938, -0.14453887939453125, -0.13957595825195312, -0.134613037109375, -0.12965011596679688, -0.12468719482421875, -0.11972427368164062, -0.1147613525390625, -0.10979843139648438, -0.10483551025390625, -0.09987258911132812, -0.09490966796875, -0.08994674682617188, -0.08498382568359375, -0.08002090454101562, -0.0750579833984375, -0.07009506225585938, -0.06513214111328125, -0.060169219970703125, -0.055206298828125, -0.050243377685546875, -0.04528045654296875, -0.040317535400390625, -0.0353546142578125, -0.030391693115234375, -0.02542877197265625, -0.020465850830078125, -0.0155029296875, -0.010540008544921875, -0.00557708740234375, -0.000614166259765625, 0.0043487548828125, 0.009311676025390625, 0.01427459716796875, 0.019237518310546875, 0.024200439453125, 0.029163360595703125, 0.03412628173828125, 0.039089202880859375, 0.0440521240234375, 0.049015045166015625, 0.05397796630859375, 0.058940887451171875, 0.06390380859375, 0.06886672973632812, 0.07382965087890625, 0.07879257202148438, 0.0837554931640625, 0.08871841430664062, 0.09368133544921875, 0.09864425659179688, 0.103607177734375, 0.10857009887695312, 0.11353302001953125, 0.11849594116210938, 0.1234588623046875, 0.12842178344726562, 0.13338470458984375, 0.13834762573242188, 0.143310546875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 6.0, 12.0, 7.0, 15.0, 15.0, 29.0, 37.0, 59.0, 116.0, 177.0, 430.0, 1140.0, 3551.0, 13926.0, 91950.0, 3872380.0, 182360.0, 20361.0, 5018.0, 1556.0, 552.0, 262.0, 112.0, 64.0, 36.0, 31.0, 16.0, 17.0, 9.0, 9.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.099609375, -2.0389556884765625, -1.978302001953125, -1.9176483154296875, -1.85699462890625, -1.7963409423828125, -1.735687255859375, -1.6750335693359375, -1.6143798828125, -1.5537261962890625, -1.493072509765625, -1.4324188232421875, -1.37176513671875, -1.3111114501953125, -1.250457763671875, -1.1898040771484375, -1.129150390625, -1.0684967041015625, -1.007843017578125, -0.9471893310546875, -0.88653564453125, -0.8258819580078125, -0.765228271484375, -0.7045745849609375, -0.6439208984375, -0.5832672119140625, -0.522613525390625, -0.4619598388671875, -0.40130615234375, -0.3406524658203125, -0.279998779296875, -0.2193450927734375, -0.15869140625, -0.0980377197265625, -0.037384033203125, 0.0232696533203125, 0.08392333984375, 0.1445770263671875, 0.205230712890625, 0.2658843994140625, 0.3265380859375, 0.3871917724609375, 0.447845458984375, 0.5084991455078125, 0.56915283203125, 0.6298065185546875, 0.690460205078125, 0.7511138916015625, 0.811767578125, 0.8724212646484375, 0.933074951171875, 0.9937286376953125, 1.05438232421875, 1.1150360107421875, 1.175689697265625, 1.2363433837890625, 1.2969970703125, 1.3576507568359375, 1.418304443359375, 1.4789581298828125, 1.53961181640625, 1.6002655029296875, 1.660919189453125, 1.7215728759765625, 1.7822265625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 5.0, 5.0, 6.0, 15.0, 15.0, 28.0, 31.0, 41.0, 104.0, 174.0, 526.0, 2158.0, 471.0, 210.0, 102.0, 56.0, 33.0, 26.0, 16.0, 8.0, 7.0, 9.0, 3.0, 5.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.251953125, -0.24393844604492188, -0.23592376708984375, -0.22790908813476562, -0.2198944091796875, -0.21187973022460938, -0.20386505126953125, -0.19585037231445312, -0.187835693359375, -0.17982101440429688, -0.17180633544921875, -0.16379165649414062, -0.1557769775390625, -0.14776229858398438, -0.13974761962890625, -0.13173294067382812, -0.12371826171875, -0.11570358276367188, -0.10768890380859375, -0.09967422485351562, -0.0916595458984375, -0.08364486694335938, -0.07563018798828125, -0.06761550903320312, -0.059600830078125, -0.051586151123046875, -0.04357147216796875, -0.035556793212890625, -0.0275421142578125, -0.019527435302734375, -0.01151275634765625, -0.003498077392578125, 0.0045166015625, 0.012531280517578125, 0.02054595947265625, 0.028560638427734375, 0.0365753173828125, 0.044589996337890625, 0.05260467529296875, 0.060619354248046875, 0.068634033203125, 0.07664871215820312, 0.08466339111328125, 0.09267807006835938, 0.1006927490234375, 0.10870742797851562, 0.11672210693359375, 0.12473678588867188, 0.13275146484375, 0.14076614379882812, 0.14878082275390625, 0.15679550170898438, 0.1648101806640625, 0.17282485961914062, 0.18083953857421875, 0.18885421752929688, 0.196868896484375, 0.20488357543945312, 0.21289825439453125, 0.22091293334960938, 0.2289276123046875, 0.23694229125976562, 0.24495697021484375, 0.2529716491699219, 0.260986328125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 19.0, 71.0, 219.0, 395.0, 198.0, 66.0, 25.0, 6.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5961108207702637, -3.507216215133667, -3.4183218479156494, -3.3294272422790527, -3.240532636642456, -3.1516380310058594, -3.062743663787842, -2.973849058151245, -2.8849544525146484, -2.7960598468780518, -2.707165479660034, -2.6182708740234375, -2.529376268386841, -2.440481662750244, -2.3515872955322266, -2.26269268989563, -2.1737983226776123, -2.0849037170410156, -1.9960092306137085, -1.9071147441864014, -1.8182201385498047, -1.7293256521224976, -1.6404311656951904, -1.5515365600585938, -1.4626420736312866, -1.3737475872039795, -1.2848529815673828, -1.1959584951400757, -1.1070640087127686, -1.0181694030761719, -0.9292749166488647, -0.8403803706169128, -0.7514858245849609, -0.662591278553009, -0.5736967325210571, -0.48480224609375, -0.3959077000617981, -0.3070131540298462, -0.21811866760253906, -0.12922412157058716, -0.040329575538635254, 0.04856495559215546, 0.13745948672294617, 0.22635400295257568, 0.3152485489845276, 0.4041430950164795, 0.4930375814437866, 0.5819321274757385, 0.6708266735076904, 0.7597212195396423, 0.8486157655715942, 0.9375102519989014, 1.026404857635498, 1.1152993440628052, 1.2041938304901123, 1.293088436126709, 1.3819829225540161, 1.4708774089813232, 1.55977201461792, 1.648666501045227, 1.7375609874725342, 1.8264555931091309, 1.915350079536438, 2.004244565963745, 2.093139171600342]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 9.0, 8.0, 11.0, 9.0, 11.0, 10.0, 15.0, 15.0, 25.0, 29.0, 32.0, 35.0, 52.0, 39.0, 40.0, 46.0, 58.0, 52.0, 51.0, 53.0, 52.0, 45.0, 48.0, 42.0, 32.0, 27.0, 29.0, 25.0, 18.0, 14.0, 15.0, 12.0, 6.0, 5.0, 3.0, 5.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.6629970669746399, -0.6418800950050354, -0.6207630634307861, -0.5996460914611816, -0.5785291194915771, -0.5574121475219727, -0.5362951159477234, -0.5151781439781189, -0.494061142206192, -0.47294414043426514, -0.45182716846466064, -0.43071016669273376, -0.4095931649208069, -0.3884761929512024, -0.3673591911792755, -0.34624218940734863, -0.32512521743774414, -0.30400821566581726, -0.28289124369621277, -0.2617742419242859, -0.2406572550535202, -0.21954026818275452, -0.19842326641082764, -0.17730627954006195, -0.15618929266929626, -0.13507230579853058, -0.1139553114771843, -0.09283831715583801, -0.07172133028507233, -0.05060434341430664, -0.02948734164237976, -0.008370354771614075, 0.012746691703796387, 0.03386368229985237, 0.054980672895908356, 0.07609766721725464, 0.09721465408802032, 0.11833164095878601, 0.1394486427307129, 0.16056562960147858, 0.18168261647224426, 0.20279960334300995, 0.22391659021377563, 0.24503359198570251, 0.2661505937576294, 0.2872675657272339, 0.30838456749916077, 0.32950156927108765, 0.35061854124069214, 0.371735543012619, 0.3928525149822235, 0.4139695167541504, 0.4350864887237549, 0.45620349049568176, 0.47732049226760864, 0.49843746423721313, 0.5195544958114624, 0.5406714677810669, 0.5617884993553162, 0.5829054713249207, 0.6040224432945251, 0.6251394748687744, 0.6462564468383789, 0.6673734188079834, 0.6884903907775879]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 6.0, 10.0, 2.0, 10.0, 23.0, 33.0, 43.0, 54.0, 87.0, 142.0, 242.0, 368.0, 658.0, 1284.0, 2441.0, 5667.0, 17056.0, 106994.0, 812544.0, 76568.0, 14401.0, 5087.0, 2142.0, 1137.0, 601.0, 345.0, 211.0, 140.0, 72.0, 70.0, 46.0, 30.0, 13.0, 15.0, 10.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7080078125, -1.6499786376953125, -1.591949462890625, -1.5339202880859375, -1.47589111328125, -1.4178619384765625, -1.359832763671875, -1.3018035888671875, -1.2437744140625, -1.1857452392578125, -1.127716064453125, -1.0696868896484375, -1.01165771484375, -0.9536285400390625, -0.895599365234375, -0.8375701904296875, -0.779541015625, -0.7215118408203125, -0.663482666015625, -0.6054534912109375, -0.54742431640625, -0.4893951416015625, -0.431365966796875, -0.3733367919921875, -0.3153076171875, -0.2572784423828125, -0.199249267578125, -0.1412200927734375, -0.08319091796875, -0.0251617431640625, 0.032867431640625, 0.0908966064453125, 0.14892578125, 0.2069549560546875, 0.264984130859375, 0.3230133056640625, 0.38104248046875, 0.4390716552734375, 0.497100830078125, 0.5551300048828125, 0.6131591796875, 0.6711883544921875, 0.729217529296875, 0.7872467041015625, 0.84527587890625, 0.9033050537109375, 0.961334228515625, 1.0193634033203125, 1.077392578125, 1.1354217529296875, 1.193450927734375, 1.2514801025390625, 1.30950927734375, 1.3675384521484375, 1.425567626953125, 1.4835968017578125, 1.5416259765625, 1.5996551513671875, 1.657684326171875, 1.7157135009765625, 1.77374267578125, 1.8317718505859375, 1.889801025390625, 1.9478302001953125, 2.005859375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 2.0, 12.0, 13.0, 15.0, 36.0, 70.0, 132.0, 208.0, 197.0, 133.0, 63.0, 38.0, 14.0, 8.0, 8.0, 8.0, 5.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1669921875, -0.16221046447753906, -0.15742874145507812, -0.1526470184326172, -0.14786529541015625, -0.1430835723876953, -0.13830184936523438, -0.13352012634277344, -0.1287384033203125, -0.12395668029785156, -0.11917495727539062, -0.11439323425292969, -0.10961151123046875, -0.10482978820800781, -0.10004806518554688, -0.09526634216308594, -0.090484619140625, -0.08570289611816406, -0.08092117309570312, -0.07613945007324219, -0.07135772705078125, -0.06657600402832031, -0.061794281005859375, -0.05701255798339844, -0.0522308349609375, -0.04744911193847656, -0.042667388916015625, -0.03788566589355469, -0.03310394287109375, -0.028322219848632812, -0.023540496826171875, -0.018758773803710938, -0.01397705078125, -0.009195327758789062, -0.004413604736328125, 0.0003681182861328125, 0.00514984130859375, 0.009931564331054688, 0.014713287353515625, 0.019495010375976562, 0.0242767333984375, 0.029058456420898438, 0.033840179443359375, 0.03862190246582031, 0.04340362548828125, 0.04818534851074219, 0.052967071533203125, 0.05774879455566406, 0.062530517578125, 0.06731224060058594, 0.07209396362304688, 0.07687568664550781, 0.08165740966796875, 0.08643913269042969, 0.09122085571289062, 0.09600257873535156, 0.1007843017578125, 0.10556602478027344, 0.11034774780273438, 0.11512947082519531, 0.11991119384765625, 0.12469291687011719, 0.12947463989257812, 0.13425636291503906, 0.1390380859375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 13.0, 10.0, 24.0, 31.0, 40.0, 42.0, 68.0, 110.0, 159.0, 253.0, 354.0, 660.0, 1182.0, 2399.0, 6905.0, 27838.0, 172528.0, 609849.0, 183964.0, 29510.0, 7051.0, 2530.0, 1245.0, 657.0, 369.0, 268.0, 148.0, 93.0, 80.0, 51.0, 44.0, 26.0, 15.0, 12.0, 6.0, 4.0, 6.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.48046875, -1.4362945556640625, -1.392120361328125, -1.3479461669921875, -1.30377197265625, -1.2595977783203125, -1.215423583984375, -1.1712493896484375, -1.1270751953125, -1.0829010009765625, -1.038726806640625, -0.9945526123046875, -0.95037841796875, -0.9062042236328125, -0.862030029296875, -0.8178558349609375, -0.773681640625, -0.7295074462890625, -0.685333251953125, -0.6411590576171875, -0.59698486328125, -0.5528106689453125, -0.508636474609375, -0.4644622802734375, -0.4202880859375, -0.3761138916015625, -0.331939697265625, -0.2877655029296875, -0.24359130859375, -0.1994171142578125, -0.155242919921875, -0.1110687255859375, -0.06689453125, -0.0227203369140625, 0.021453857421875, 0.0656280517578125, 0.10980224609375, 0.1539764404296875, 0.198150634765625, 0.2423248291015625, 0.2864990234375, 0.3306732177734375, 0.374847412109375, 0.4190216064453125, 0.46319580078125, 0.5073699951171875, 0.551544189453125, 0.5957183837890625, 0.639892578125, 0.6840667724609375, 0.728240966796875, 0.7724151611328125, 0.81658935546875, 0.8607635498046875, 0.904937744140625, 0.9491119384765625, 0.9932861328125, 1.0374603271484375, 1.081634521484375, 1.1258087158203125, 1.16998291015625, 1.2141571044921875, 1.258331298828125, 1.3025054931640625, 1.3466796875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 1.0, 4.0, 11.0, 15.0, 8.0, 16.0, 9.0, 26.0, 18.0, 20.0, 37.0, 33.0, 32.0, 29.0, 43.0, 49.0, 68.0, 55.0, 53.0, 53.0, 52.0, 46.0, 46.0, 45.0, 30.0, 26.0, 34.0, 28.0, 20.0, 16.0, 11.0, 12.0, 20.0, 10.0, 5.0, 7.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4892578125, -0.4735565185546875, -0.457855224609375, -0.4421539306640625, -0.42645263671875, -0.4107513427734375, -0.395050048828125, -0.3793487548828125, -0.3636474609375, -0.3479461669921875, -0.332244873046875, -0.3165435791015625, -0.30084228515625, -0.2851409912109375, -0.269439697265625, -0.2537384033203125, -0.238037109375, -0.2223358154296875, -0.206634521484375, -0.1909332275390625, -0.17523193359375, -0.1595306396484375, -0.143829345703125, -0.1281280517578125, -0.1124267578125, -0.0967254638671875, -0.081024169921875, -0.0653228759765625, -0.04962158203125, -0.0339202880859375, -0.018218994140625, -0.0025177001953125, 0.01318359375, 0.0288848876953125, 0.044586181640625, 0.0602874755859375, 0.07598876953125, 0.0916900634765625, 0.107391357421875, 0.1230926513671875, 0.1387939453125, 0.1544952392578125, 0.170196533203125, 0.1858978271484375, 0.20159912109375, 0.2173004150390625, 0.233001708984375, 0.2487030029296875, 0.264404296875, 0.2801055908203125, 0.295806884765625, 0.3115081787109375, 0.32720947265625, 0.3429107666015625, 0.358612060546875, 0.3743133544921875, 0.3900146484375, 0.4057159423828125, 0.421417236328125, 0.4371185302734375, 0.45281982421875, 0.4685211181640625, 0.484222412109375, 0.4999237060546875, 0.515625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 8.0, 8.0, 17.0, 20.0, 29.0, 41.0, 83.0, 132.0, 230.0, 366.0, 769.0, 1705.0, 4808.0, 15443.0, 66399.0, 362875.0, 469804.0, 95344.0, 20515.0, 5928.0, 2081.0, 896.0, 454.0, 246.0, 124.0, 61.0, 55.0, 44.0, 29.0, 11.0, 10.0, 9.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6591796875, -0.6372833251953125, -0.615386962890625, -0.5934906005859375, -0.57159423828125, -0.5496978759765625, -0.527801513671875, -0.5059051513671875, -0.4840087890625, -0.4621124267578125, -0.440216064453125, -0.4183197021484375, -0.39642333984375, -0.3745269775390625, -0.352630615234375, -0.3307342529296875, -0.308837890625, -0.2869415283203125, -0.265045166015625, -0.2431488037109375, -0.22125244140625, -0.1993560791015625, -0.177459716796875, -0.1555633544921875, -0.1336669921875, -0.1117706298828125, -0.089874267578125, -0.0679779052734375, -0.04608154296875, -0.0241851806640625, -0.002288818359375, 0.0196075439453125, 0.04150390625, 0.0634002685546875, 0.085296630859375, 0.1071929931640625, 0.12908935546875, 0.1509857177734375, 0.172882080078125, 0.1947784423828125, 0.2166748046875, 0.2385711669921875, 0.260467529296875, 0.2823638916015625, 0.30426025390625, 0.3261566162109375, 0.348052978515625, 0.3699493408203125, 0.391845703125, 0.4137420654296875, 0.435638427734375, 0.4575347900390625, 0.47943115234375, 0.5013275146484375, 0.523223876953125, 0.5451202392578125, 0.5670166015625, 0.5889129638671875, 0.610809326171875, 0.6327056884765625, 0.65460205078125, 0.6764984130859375, 0.698394775390625, 0.7202911376953125, 0.7421875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 8.0, 7.0, 13.0, 8.0, 16.0, 17.0, 24.0, 18.0, 34.0, 37.0, 56.0, 48.0, 63.0, 63.0, 84.0, 64.0, 60.0, 74.0, 57.0, 55.0, 38.0, 31.0, 31.0, 22.0, 16.0, 14.0, 13.0, 8.0, 3.0, 4.0, 4.0, 4.0, 8.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.238719940185547e-05, -8.969288319349289e-05, -8.699856698513031e-05, -8.430425077676773e-05, -8.160993456840515e-05, -7.891561836004257e-05, -7.622130215167999e-05, -7.352698594331741e-05, -7.083266973495483e-05, -6.813835352659225e-05, -6.544403731822968e-05, -6.27497211098671e-05, -6.0055404901504517e-05, -5.736108869314194e-05, -5.466677248477936e-05, -5.197245627641678e-05, -4.92781400680542e-05, -4.658382385969162e-05, -4.388950765132904e-05, -4.119519144296646e-05, -3.850087523460388e-05, -3.58065590262413e-05, -3.311224281787872e-05, -3.0417926609516144e-05, -2.7723610401153564e-05, -2.5029294192790985e-05, -2.2334977984428406e-05, -1.9640661776065826e-05, -1.6946345567703247e-05, -1.4252029359340668e-05, -1.1557713150978088e-05, -8.863396942615509e-06, -6.16908073425293e-06, -3.4747645258903503e-06, -7.80448317527771e-07, 1.9138678908348083e-06, 4.608184099197388e-06, 7.302500307559967e-06, 9.996816515922546e-06, 1.2691132724285126e-05, 1.5385448932647705e-05, 1.8079765141010284e-05, 2.0774081349372864e-05, 2.3468397557735443e-05, 2.6162713766098022e-05, 2.8857029974460602e-05, 3.155134618282318e-05, 3.424566239118576e-05, 3.693997859954834e-05, 3.963429480791092e-05, 4.23286110162735e-05, 4.502292722463608e-05, 4.771724343299866e-05, 5.0411559641361237e-05, 5.3105875849723816e-05, 5.5800192058086395e-05, 5.8494508266448975e-05, 6.118882447481155e-05, 6.388314068317413e-05, 6.657745689153671e-05, 6.927177309989929e-05, 7.196608930826187e-05, 7.466040551662445e-05, 7.735472172498703e-05, 8.004903793334961e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 5.0, 11.0, 8.0, 13.0, 17.0, 17.0, 20.0, 39.0, 53.0, 64.0, 102.0, 143.0, 219.0, 325.0, 526.0, 987.0, 2076.0, 4798.0, 13856.0, 53834.0, 298830.0, 524289.0, 110762.0, 24119.0, 7247.0, 2795.0, 1363.0, 761.0, 408.0, 265.0, 179.0, 120.0, 83.0, 46.0, 45.0, 39.0, 27.0, 16.0, 13.0, 7.0, 8.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.74755859375, -0.7263336181640625, -0.705108642578125, -0.6838836669921875, -0.66265869140625, -0.6414337158203125, -0.620208740234375, -0.5989837646484375, -0.5777587890625, -0.5565338134765625, -0.535308837890625, -0.5140838623046875, -0.49285888671875, -0.4716339111328125, -0.450408935546875, -0.4291839599609375, -0.407958984375, -0.3867340087890625, -0.365509033203125, -0.3442840576171875, -0.32305908203125, -0.3018341064453125, -0.280609130859375, -0.2593841552734375, -0.2381591796875, -0.2169342041015625, -0.195709228515625, -0.1744842529296875, -0.15325927734375, -0.1320343017578125, -0.110809326171875, -0.0895843505859375, -0.068359375, -0.0471343994140625, -0.025909423828125, -0.0046844482421875, 0.01654052734375, 0.0377655029296875, 0.058990478515625, 0.0802154541015625, 0.1014404296875, 0.1226654052734375, 0.143890380859375, 0.1651153564453125, 0.18634033203125, 0.2075653076171875, 0.228790283203125, 0.2500152587890625, 0.271240234375, 0.2924652099609375, 0.313690185546875, 0.3349151611328125, 0.35614013671875, 0.3773651123046875, 0.398590087890625, 0.4198150634765625, 0.4410400390625, 0.4622650146484375, 0.483489990234375, 0.5047149658203125, 0.52593994140625, 0.5471649169921875, 0.568389892578125, 0.5896148681640625, 0.61083984375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 2.0, 4.0, 3.0, 5.0, 13.0, 5.0, 13.0, 12.0, 11.0, 25.0, 22.0, 23.0, 29.0, 30.0, 44.0, 48.0, 48.0, 62.0, 68.0, 59.0, 64.0, 56.0, 53.0, 51.0, 47.0, 33.0, 28.0, 20.0, 23.0, 16.0, 18.0, 15.0, 10.0, 9.0, 8.0, 4.0, 4.0, 1.0, 2.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.252685546875, -0.2449016571044922, -0.23711776733398438, -0.22933387756347656, -0.22154998779296875, -0.21376609802246094, -0.20598220825195312, -0.1981983184814453, -0.1904144287109375, -0.1826305389404297, -0.17484664916992188, -0.16706275939941406, -0.15927886962890625, -0.15149497985839844, -0.14371109008789062, -0.1359272003173828, -0.128143310546875, -0.12035942077636719, -0.11257553100585938, -0.10479164123535156, -0.09700775146484375, -0.08922386169433594, -0.08143997192382812, -0.07365608215332031, -0.0658721923828125, -0.05808830261230469, -0.050304412841796875, -0.04252052307128906, -0.03473663330078125, -0.026952743530273438, -0.019168853759765625, -0.011384963989257812, -0.00360107421875, 0.0041828155517578125, 0.011966705322265625, 0.019750595092773438, 0.02753448486328125, 0.03531837463378906, 0.043102264404296875, 0.05088615417480469, 0.0586700439453125, 0.06645393371582031, 0.07423782348632812, 0.08202171325683594, 0.08980560302734375, 0.09758949279785156, 0.10537338256835938, 0.11315727233886719, 0.120941162109375, 0.1287250518798828, 0.13650894165039062, 0.14429283142089844, 0.15207672119140625, 0.15986061096191406, 0.16764450073242188, 0.1754283905029297, 0.1832122802734375, 0.1909961700439453, 0.19878005981445312, 0.20656394958496094, 0.21434783935546875, 0.22213172912597656, 0.22991561889648438, 0.2376995086669922, 0.2454833984375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 12.0, 43.0, 97.0, 186.0, 273.0, 204.0, 114.0, 46.0, 11.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.227106094360352, -9.868215560913086, -9.50932502746582, -9.150434494018555, -8.791543960571289, -8.43265438079834, -8.073763847351074, -7.714873313903809, -7.355982780456543, -6.997092247009277, -6.638201713562012, -6.279311656951904, -5.920421123504639, -5.561530590057373, -5.202640533447266, -4.84375, -4.484859466552734, -4.125968933105469, -3.7670786380767822, -3.4081883430480957, -3.04929780960083, -2.6904072761535645, -2.331516981124878, -1.9726266860961914, -1.6137361526489258, -1.2548457384109497, -0.8959553241729736, -0.5370649099349976, -0.17817449569702148, 0.1807159185409546, 0.5396063327789307, 0.8984966278076172, 1.2573871612548828, 1.6162775754928589, 1.975167989730835, 2.3340582847595215, 2.692948818206787, 3.0518393516540527, 3.4107296466827393, 3.769619941711426, 4.128510475158691, 4.487401008605957, 4.846291542053223, 5.20518159866333, 5.564072132110596, 5.922962665557861, 6.281852722167969, 6.640743255615234, 6.9996337890625, 7.358524322509766, 7.717414855957031, 8.076305389404297, 8.435195922851562, 8.794085502624512, 9.152976036071777, 9.511866569519043, 9.870757102966309, 10.229647636413574, 10.58853816986084, 10.947428703308105, 11.306318283081055, 11.66520881652832, 12.024099349975586, 12.382989883422852, 12.741880416870117]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 9.0, 10.0, 19.0, 24.0, 28.0, 28.0, 33.0, 40.0, 60.0, 52.0, 61.0, 53.0, 63.0, 67.0, 65.0, 66.0, 71.0, 46.0, 56.0, 34.0, 25.0, 22.0, 15.0, 11.0, 15.0, 7.0, 8.0, 4.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.010191917419434, -5.852184295654297, -5.694176197052002, -5.536168575286865, -5.37816047668457, -5.220152854919434, -5.062145233154297, -4.90413761138916, -4.746129512786865, -4.5881218910217285, -4.430113792419434, -4.272106170654297, -4.11409854888916, -3.9560904502868652, -3.7980828285217285, -3.6400749683380127, -3.482067108154297, -3.324059247970581, -3.1660513877868652, -3.0080437660217285, -2.8500359058380127, -2.692028045654297, -2.53402042388916, -2.3760125637054443, -2.2180047035217285, -2.0599968433380127, -1.9019891023635864, -1.7439813613891602, -1.5859735012054443, -1.4279656410217285, -1.2699579000473022, -1.111950159072876, -0.9539422988891602, -0.7959344983100891, -0.6379266977310181, -0.479918897151947, -0.321911096572876, -0.16390329599380493, -0.005895495414733887, 0.15211224555969238, 0.3101201057434082, 0.46812790632247925, 0.6261357069015503, 0.7841435074806213, 0.9421513080596924, 1.1001591682434082, 1.2581669092178345, 1.4161746501922607, 1.5741825103759766, 1.7321903705596924, 1.8901981115341187, 2.048205852508545, 2.2062137126922607, 2.3642215728759766, 2.5222291946411133, 2.680237054824829, 2.838244915008545, 2.9962527751922607, 3.1542606353759766, 3.3122682571411133, 3.470276117324829, 3.628283977508545, 3.7862915992736816, 3.9442994594573975, 4.102307319641113]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 5.0, 11.0, 17.0, 25.0, 66.0, 116.0, 291.0, 1083.0, 10415.0, 4154034.0, 25960.0, 1599.0, 384.0, 132.0, 53.0, 28.0, 16.0, 9.0, 8.0, 3.0, 2.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.83203125, -7.605712890625, -7.37939453125, -7.153076171875, -6.9267578125, -6.700439453125, -6.47412109375, -6.247802734375, -6.021484375, -5.795166015625, -5.56884765625, -5.342529296875, -5.1162109375, -4.889892578125, -4.66357421875, -4.437255859375, -4.2109375, -3.984619140625, -3.75830078125, -3.531982421875, -3.3056640625, -3.079345703125, -2.85302734375, -2.626708984375, -2.400390625, -2.174072265625, -1.94775390625, -1.721435546875, -1.4951171875, -1.268798828125, -1.04248046875, -0.816162109375, -0.58984375, -0.363525390625, -0.13720703125, 0.089111328125, 0.3154296875, 0.541748046875, 0.76806640625, 0.994384765625, 1.220703125, 1.447021484375, 1.67333984375, 1.899658203125, 2.1259765625, 2.352294921875, 2.57861328125, 2.804931640625, 3.03125, 3.257568359375, 3.48388671875, 3.710205078125, 3.9365234375, 4.162841796875, 4.38916015625, 4.615478515625, 4.841796875, 5.068115234375, 5.29443359375, 5.520751953125, 5.7470703125, 5.973388671875, 6.19970703125, 6.426025390625, 6.65234375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 3.0, 7.0, 11.0, 11.0, 19.0, 26.0, 57.0, 97.0, 118.0, 142.0, 134.0, 127.0, 100.0, 52.0, 21.0, 21.0, 12.0, 7.0, 7.0, 3.0, 1.0, 3.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1806640625, -0.17517662048339844, -0.16968917846679688, -0.1642017364501953, -0.15871429443359375, -0.1532268524169922, -0.14773941040039062, -0.14225196838378906, -0.1367645263671875, -0.13127708435058594, -0.12578964233398438, -0.12030220031738281, -0.11481475830078125, -0.10932731628417969, -0.10383987426757812, -0.09835243225097656, -0.092864990234375, -0.08737754821777344, -0.08189010620117188, -0.07640266418457031, -0.07091522216796875, -0.06542778015136719, -0.059940338134765625, -0.05445289611816406, -0.0489654541015625, -0.04347801208496094, -0.037990570068359375, -0.03250312805175781, -0.02701568603515625, -0.021528244018554688, -0.016040802001953125, -0.010553359985351562, -0.00506591796875, 0.0004215240478515625, 0.005908966064453125, 0.011396408081054688, 0.01688385009765625, 0.022371292114257812, 0.027858734130859375, 0.03334617614746094, 0.0388336181640625, 0.04432106018066406, 0.049808502197265625, 0.05529594421386719, 0.06078338623046875, 0.06627082824707031, 0.07175827026367188, 0.07724571228027344, 0.082733154296875, 0.08822059631347656, 0.09370803833007812, 0.09919548034667969, 0.10468292236328125, 0.11017036437988281, 0.11565780639648438, 0.12114524841308594, 0.1266326904296875, 0.13212013244628906, 0.13760757446289062, 0.1430950164794922, 0.14858245849609375, 0.1540699005126953, 0.15955734252929688, 0.16504478454589844, 0.1705322265625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 6.0, 2.0, 5.0, 13.0, 25.0, 25.0, 38.0, 64.0, 93.0, 138.0, 235.0, 406.0, 880.0, 1783.0, 4357.0, 14089.0, 63325.0, 1027644.0, 2972955.0, 82445.0, 17017.0, 5037.0, 1849.0, 819.0, 429.0, 236.0, 134.0, 74.0, 53.0, 34.0, 22.0, 17.0, 14.0, 8.0, 2.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.595703125, -1.5408172607421875, -1.485931396484375, -1.4310455322265625, -1.37615966796875, -1.3212738037109375, -1.266387939453125, -1.2115020751953125, -1.1566162109375, -1.1017303466796875, -1.046844482421875, -0.9919586181640625, -0.93707275390625, -0.8821868896484375, -0.827301025390625, -0.7724151611328125, -0.717529296875, -0.6626434326171875, -0.607757568359375, -0.5528717041015625, -0.49798583984375, -0.4430999755859375, -0.388214111328125, -0.3333282470703125, -0.2784423828125, -0.2235565185546875, -0.168670654296875, -0.1137847900390625, -0.05889892578125, -0.0040130615234375, 0.050872802734375, 0.1057586669921875, 0.16064453125, 0.2155303955078125, 0.270416259765625, 0.3253021240234375, 0.38018798828125, 0.4350738525390625, 0.489959716796875, 0.5448455810546875, 0.5997314453125, 0.6546173095703125, 0.709503173828125, 0.7643890380859375, 0.81927490234375, 0.8741607666015625, 0.929046630859375, 0.9839324951171875, 1.038818359375, 1.0937042236328125, 1.148590087890625, 1.2034759521484375, 1.25836181640625, 1.3132476806640625, 1.368133544921875, 1.4230194091796875, 1.4779052734375, 1.5327911376953125, 1.587677001953125, 1.6425628662109375, 1.69744873046875, 1.7523345947265625, 1.807220458984375, 1.8621063232421875, 1.9169921875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 2.0, 6.0, 5.0, 13.0, 25.0, 27.0, 32.0, 57.0, 79.0, 120.0, 170.0, 390.0, 1458.0, 899.0, 310.0, 156.0, 92.0, 68.0, 29.0, 33.0, 30.0, 16.0, 19.0, 5.0, 4.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 5.0, 1.0], "bins": [-0.3583984375, -0.3498497009277344, -0.34130096435546875, -0.3327522277832031, -0.3242034912109375, -0.3156547546386719, -0.30710601806640625, -0.2985572814941406, -0.290008544921875, -0.2814598083496094, -0.27291107177734375, -0.2643623352050781, -0.2558135986328125, -0.24726486206054688, -0.23871612548828125, -0.23016738891601562, -0.22161865234375, -0.21306991577148438, -0.20452117919921875, -0.19597244262695312, -0.1874237060546875, -0.17887496948242188, -0.17032623291015625, -0.16177749633789062, -0.153228759765625, -0.14468002319335938, -0.13613128662109375, -0.12758255004882812, -0.1190338134765625, -0.11048507690429688, -0.10193634033203125, -0.09338760375976562, -0.0848388671875, -0.07629013061523438, -0.06774139404296875, -0.059192657470703125, -0.0506439208984375, -0.042095184326171875, -0.03354644775390625, -0.024997711181640625, -0.016448974609375, -0.007900238037109375, 0.00064849853515625, 0.009197235107421875, 0.0177459716796875, 0.026294708251953125, 0.03484344482421875, 0.043392181396484375, 0.05194091796875, 0.060489654541015625, 0.06903839111328125, 0.07758712768554688, 0.0861358642578125, 0.09468460083007812, 0.10323333740234375, 0.11178207397460938, 0.120330810546875, 0.12887954711914062, 0.13742828369140625, 0.14597702026367188, 0.1545257568359375, 0.16307449340820312, 0.17162322998046875, 0.18017196655273438, 0.188720703125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 11.0, 6.0, 16.0, 32.0, 33.0, 61.0, 107.0, 168.0, 156.0, 160.0, 106.0, 59.0, 34.0, 23.0, 12.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.257053852081299, -3.1841275691986084, -3.111201286315918, -3.0382750034332275, -2.965348720550537, -2.892422676086426, -2.8194963932037354, -2.746570110321045, -2.6736438274383545, -2.600717544555664, -2.5277912616729736, -2.454864978790283, -2.381938934326172, -2.3090126514434814, -2.236086368560791, -2.1631600856781006, -2.09023380279541, -2.0173075199127197, -1.9443812370300293, -1.8714550733566284, -1.798528790473938, -1.7256025075912476, -1.6526763439178467, -1.5797500610351562, -1.5068237781524658, -1.4338974952697754, -1.360971212387085, -1.288045048713684, -1.2151187658309937, -1.1421924829483032, -1.0692663192749023, -0.9963400363922119, -0.9234137535095215, -0.850487470626831, -0.7775612473487854, -0.7046350240707397, -0.6317087411880493, -0.5587824583053589, -0.48585623502731323, -0.4129300117492676, -0.34000372886657715, -0.2670774757862091, -0.19415122270584106, -0.12122496962547302, -0.04829871654510498, 0.02462753653526306, 0.0975537896156311, 0.17048001289367676, 0.2434062957763672, 0.31633254885673523, 0.38925880193710327, 0.4621850550174713, 0.5351113080978394, 0.6080375909805298, 0.6809638142585754, 0.7538900375366211, 0.8268163204193115, 0.899742603302002, 0.9726688265800476, 1.0455950498580933, 1.1185213327407837, 1.1914476156234741, 1.264373779296875, 1.3373000621795654, 1.4102263450622559]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 4.0, 4.0, 2.0, 16.0, 6.0, 13.0, 8.0, 11.0, 16.0, 12.0, 18.0, 15.0, 21.0, 22.0, 28.0, 32.0, 40.0, 36.0, 38.0, 45.0, 32.0, 40.0, 42.0, 41.0, 46.0, 23.0, 39.0, 43.0, 40.0, 31.0, 22.0, 28.0, 29.0, 29.0, 23.0, 21.0, 16.0, 11.0, 17.0, 10.0, 13.0, 5.0, 5.0, 1.0, 3.0, 6.0, 0.0, 5.0, 2.0, 1.0, 2.0], "bins": [-0.9901532530784607, -0.9607658386230469, -0.9313783645629883, -0.9019909501075745, -0.8726034760475159, -0.843216061592102, -0.8138285875320435, -0.7844411730766296, -0.755053699016571, -0.7256662845611572, -0.6962788105010986, -0.6668913960456848, -0.6375039219856262, -0.6081165075302124, -0.5787290334701538, -0.54934161901474, -0.5199542045593262, -0.49056676030158997, -0.46117931604385376, -0.43179187178611755, -0.40240442752838135, -0.37301701307296753, -0.34362953901290894, -0.3142421245574951, -0.2848546504974365, -0.2554672062397003, -0.2260797619819641, -0.1966923177242279, -0.1673048734664917, -0.1379174441099167, -0.10852999985218048, -0.07914255559444427, -0.049755096435546875, -0.020367654040455818, 0.009019788354635239, 0.038407228887081146, 0.06779467314481735, 0.09718210995197296, 0.12656955420970917, 0.15595699846744537, 0.18534444272518158, 0.21473188698291779, 0.244119331240654, 0.273506760597229, 0.3028942048549652, 0.3322816491127014, 0.3616690933704376, 0.39105653762817383, 0.42044398188591003, 0.44983142614364624, 0.47921887040138245, 0.5086063146591187, 0.5379937291145325, 0.5673812031745911, 0.5967686176300049, 0.6261560916900635, 0.6555435061454773, 0.6849309206008911, 0.7143183946609497, 0.7437058091163635, 0.7730932831764221, 0.8024806976318359, 0.8318681716918945, 0.8612555861473083, 0.8906430602073669]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 9.0, 14.0, 8.0, 8.0, 25.0, 26.0, 33.0, 65.0, 95.0, 113.0, 218.0, 336.0, 527.0, 914.0, 1720.0, 3672.0, 11466.0, 52806.0, 362911.0, 508621.0, 80187.0, 15375.0, 4681.0, 1989.0, 1093.0, 612.0, 346.0, 195.0, 153.0, 103.0, 84.0, 44.0, 26.0, 18.0, 17.0, 16.0, 9.0, 5.0, 0.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.453125, -1.40924072265625, -1.3653564453125, -1.32147216796875, -1.277587890625, -1.23370361328125, -1.1898193359375, -1.14593505859375, -1.10205078125, -1.05816650390625, -1.0142822265625, -0.97039794921875, -0.926513671875, -0.88262939453125, -0.8387451171875, -0.79486083984375, -0.7509765625, -0.70709228515625, -0.6632080078125, -0.61932373046875, -0.575439453125, -0.53155517578125, -0.4876708984375, -0.44378662109375, -0.39990234375, -0.35601806640625, -0.3121337890625, -0.26824951171875, -0.224365234375, -0.18048095703125, -0.1365966796875, -0.09271240234375, -0.048828125, -0.00494384765625, 0.0389404296875, 0.08282470703125, 0.126708984375, 0.17059326171875, 0.2144775390625, 0.25836181640625, 0.30224609375, 0.34613037109375, 0.3900146484375, 0.43389892578125, 0.477783203125, 0.52166748046875, 0.5655517578125, 0.60943603515625, 0.6533203125, 0.69720458984375, 0.7410888671875, 0.78497314453125, 0.828857421875, 0.87274169921875, 0.9166259765625, 0.96051025390625, 1.00439453125, 1.04827880859375, 1.0921630859375, 1.13604736328125, 1.179931640625, 1.22381591796875, 1.2677001953125, 1.31158447265625, 1.35546875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 2.0, 6.0, 12.0, 6.0, 26.0, 27.0, 51.0, 59.0, 74.0, 104.0, 134.0, 110.0, 97.0, 73.0, 62.0, 58.0, 33.0, 16.0, 10.0, 12.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.182861328125, -0.17763137817382812, -0.17240142822265625, -0.16717147827148438, -0.1619415283203125, -0.15671157836914062, -0.15148162841796875, -0.14625167846679688, -0.141021728515625, -0.13579177856445312, -0.13056182861328125, -0.12533187866210938, -0.1201019287109375, -0.11487197875976562, -0.10964202880859375, -0.10441207885742188, -0.09918212890625, -0.09395217895507812, -0.08872222900390625, -0.08349227905273438, -0.0782623291015625, -0.07303237915039062, -0.06780242919921875, -0.06257247924804688, -0.057342529296875, -0.052112579345703125, -0.04688262939453125, -0.041652679443359375, -0.0364227294921875, -0.031192779541015625, -0.02596282958984375, -0.020732879638671875, -0.0155029296875, -0.010272979736328125, -0.00504302978515625, 0.000186920166015625, 0.0054168701171875, 0.010646820068359375, 0.01587677001953125, 0.021106719970703125, 0.026336669921875, 0.031566619873046875, 0.03679656982421875, 0.042026519775390625, 0.0472564697265625, 0.052486419677734375, 0.05771636962890625, 0.06294631958007812, 0.06817626953125, 0.07340621948242188, 0.07863616943359375, 0.08386611938476562, 0.0890960693359375, 0.09432601928710938, 0.09955596923828125, 0.10478591918945312, 0.110015869140625, 0.11524581909179688, 0.12047576904296875, 0.12570571899414062, 0.1309356689453125, 0.13616561889648438, 0.14139556884765625, 0.14662551879882812, 0.15185546875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 3.0, 2.0, 9.0, 10.0, 19.0, 32.0, 26.0, 46.0, 60.0, 83.0, 144.0, 175.0, 272.0, 378.0, 555.0, 850.0, 1360.0, 2721.0, 6054.0, 18528.0, 67796.0, 271656.0, 477075.0, 143977.0, 36791.0, 10705.0, 4047.0, 1887.0, 1072.0, 693.0, 438.0, 336.0, 211.0, 135.0, 95.0, 76.0, 69.0, 51.0, 39.0, 21.0, 21.0, 12.0, 10.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.052734375, -1.0167694091796875, -0.980804443359375, -0.9448394775390625, -0.90887451171875, -0.8729095458984375, -0.836944580078125, -0.8009796142578125, -0.7650146484375, -0.7290496826171875, -0.693084716796875, -0.6571197509765625, -0.62115478515625, -0.5851898193359375, -0.549224853515625, -0.5132598876953125, -0.477294921875, -0.4413299560546875, -0.405364990234375, -0.3694000244140625, -0.33343505859375, -0.2974700927734375, -0.261505126953125, -0.2255401611328125, -0.1895751953125, -0.1536102294921875, -0.117645263671875, -0.0816802978515625, -0.04571533203125, -0.0097503662109375, 0.026214599609375, 0.0621795654296875, 0.09814453125, 0.1341094970703125, 0.170074462890625, 0.2060394287109375, 0.24200439453125, 0.2779693603515625, 0.313934326171875, 0.3498992919921875, 0.3858642578125, 0.4218292236328125, 0.457794189453125, 0.4937591552734375, 0.52972412109375, 0.5656890869140625, 0.601654052734375, 0.6376190185546875, 0.673583984375, 0.7095489501953125, 0.745513916015625, 0.7814788818359375, 0.81744384765625, 0.8534088134765625, 0.889373779296875, 0.9253387451171875, 0.9613037109375, 0.9972686767578125, 1.033233642578125, 1.0691986083984375, 1.10516357421875, 1.1411285400390625, 1.177093505859375, 1.2130584716796875, 1.2490234375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 4.0, 6.0, 5.0, 11.0, 18.0, 7.0, 19.0, 19.0, 22.0, 22.0, 34.0, 29.0, 37.0, 39.0, 47.0, 44.0, 61.0, 43.0, 53.0, 62.0, 55.0, 58.0, 47.0, 53.0, 32.0, 27.0, 18.0, 29.0, 18.0, 15.0, 10.0, 11.0, 9.0, 6.0, 9.0, 5.0, 5.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59033203125, -0.5686569213867188, -0.5469818115234375, -0.5253067016601562, -0.503631591796875, -0.48195648193359375, -0.4602813720703125, -0.43860626220703125, -0.41693115234375, -0.39525604248046875, -0.3735809326171875, -0.35190582275390625, -0.330230712890625, -0.30855560302734375, -0.2868804931640625, -0.26520538330078125, -0.2435302734375, -0.22185516357421875, -0.2001800537109375, -0.17850494384765625, -0.156829833984375, -0.13515472412109375, -0.1134796142578125, -0.09180450439453125, -0.07012939453125, -0.04845428466796875, -0.0267791748046875, -0.00510406494140625, 0.016571044921875, 0.03824615478515625, 0.0599212646484375, 0.08159637451171875, 0.103271484375, 0.12494659423828125, 0.1466217041015625, 0.16829681396484375, 0.189971923828125, 0.21164703369140625, 0.2333221435546875, 0.25499725341796875, 0.27667236328125, 0.29834747314453125, 0.3200225830078125, 0.34169769287109375, 0.363372802734375, 0.38504791259765625, 0.4067230224609375, 0.42839813232421875, 0.4500732421875, 0.47174835205078125, 0.4934234619140625, 0.5150985717773438, 0.536773681640625, 0.5584487915039062, 0.5801239013671875, 0.6017990112304688, 0.62347412109375, 0.6451492309570312, 0.6668243408203125, 0.6884994506835938, 0.710174560546875, 0.7318496704101562, 0.7535247802734375, 0.7751998901367188, 0.796875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 11.0, 6.0, 21.0, 32.0, 77.0, 114.0, 231.0, 519.0, 1370.0, 3517.0, 12636.0, 77370.0, 559999.0, 340907.0, 39395.0, 7987.0, 2552.0, 936.0, 444.0, 194.0, 87.0, 48.0, 37.0, 18.0, 16.0, 6.0, 7.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78466796875, -0.760772705078125, -0.73687744140625, -0.712982177734375, -0.6890869140625, -0.665191650390625, -0.64129638671875, -0.617401123046875, -0.593505859375, -0.569610595703125, -0.54571533203125, -0.521820068359375, -0.4979248046875, -0.474029541015625, -0.45013427734375, -0.426239013671875, -0.40234375, -0.378448486328125, -0.35455322265625, -0.330657958984375, -0.3067626953125, -0.282867431640625, -0.25897216796875, -0.235076904296875, -0.211181640625, -0.187286376953125, -0.16339111328125, -0.139495849609375, -0.1156005859375, -0.091705322265625, -0.06781005859375, -0.043914794921875, -0.02001953125, 0.003875732421875, 0.02777099609375, 0.051666259765625, 0.0755615234375, 0.099456787109375, 0.12335205078125, 0.147247314453125, 0.171142578125, 0.195037841796875, 0.21893310546875, 0.242828369140625, 0.2667236328125, 0.290618896484375, 0.31451416015625, 0.338409423828125, 0.3623046875, 0.386199951171875, 0.41009521484375, 0.433990478515625, 0.4578857421875, 0.481781005859375, 0.50567626953125, 0.529571533203125, 0.553466796875, 0.577362060546875, 0.60125732421875, 0.625152587890625, 0.6490478515625, 0.672943115234375, 0.69683837890625, 0.720733642578125, 0.74462890625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 8.0, 4.0, 5.0, 9.0, 10.0, 14.0, 20.0, 15.0, 30.0, 35.0, 58.0, 56.0, 71.0, 84.0, 111.0, 84.0, 67.0, 73.0, 76.0, 37.0, 36.0, 23.0, 21.0, 20.0, 14.0, 11.0, 7.0, 3.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.00012624263763427734, -0.0001232260838150978, -0.00012020952999591827, -0.00011719297617673874, -0.0001141764223575592, -0.00011115986853837967, -0.00010814331471920013, -0.0001051267609000206, -0.00010211020708084106, -9.909365326166153e-05, -9.6077099442482e-05, -9.306054562330246e-05, -9.004399180412292e-05, -8.702743798494339e-05, -8.401088416576385e-05, -8.099433034658432e-05, -7.797777652740479e-05, -7.496122270822525e-05, -7.194466888904572e-05, -6.892811506986618e-05, -6.591156125068665e-05, -6.289500743150711e-05, -5.9878453612327576e-05, -5.686189979314804e-05, -5.3845345973968506e-05, -5.082879215478897e-05, -4.7812238335609436e-05, -4.47956845164299e-05, -4.1779130697250366e-05, -3.876257687807083e-05, -3.5746023058891296e-05, -3.272946923971176e-05, -2.9712915420532227e-05, -2.669636160135269e-05, -2.3679807782173157e-05, -2.0663253962993622e-05, -1.7646700143814087e-05, -1.4630146324634552e-05, -1.1613592505455017e-05, -8.597038686275482e-06, -5.580484867095947e-06, -2.5639310479164124e-06, 4.5262277126312256e-07, 3.4691765904426575e-06, 6.485730409622192e-06, 9.502284228801727e-06, 1.2518838047981262e-05, 1.5535391867160797e-05, 1.8551945686340332e-05, 2.1568499505519867e-05, 2.4585053324699402e-05, 2.7601607143878937e-05, 3.061816096305847e-05, 3.3634714782238007e-05, 3.665126860141754e-05, 3.9667822420597076e-05, 4.268437623977661e-05, 4.5700930058956146e-05, 4.871748387813568e-05, 5.1734037697315216e-05, 5.475059151649475e-05, 5.7767145335674286e-05, 6.078369915485382e-05, 6.380025297403336e-05, 6.681680679321289e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 7.0, 9.0, 10.0, 10.0, 12.0, 20.0, 27.0, 32.0, 55.0, 69.0, 105.0, 147.0, 276.0, 410.0, 703.0, 1307.0, 2828.0, 6751.0, 22359.0, 120397.0, 540777.0, 285796.0, 46693.0, 11309.0, 4116.0, 1860.0, 930.0, 562.0, 329.0, 162.0, 134.0, 117.0, 65.0, 59.0, 30.0, 20.0, 12.0, 13.0, 3.0, 5.0, 7.0, 5.0, 8.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.634765625, -0.6141128540039062, -0.5934600830078125, -0.5728073120117188, -0.552154541015625, -0.5315017700195312, -0.5108489990234375, -0.49019622802734375, -0.46954345703125, -0.44889068603515625, -0.4282379150390625, -0.40758514404296875, -0.386932373046875, -0.36627960205078125, -0.3456268310546875, -0.32497406005859375, -0.3043212890625, -0.28366851806640625, -0.2630157470703125, -0.24236297607421875, -0.221710205078125, -0.20105743408203125, -0.1804046630859375, -0.15975189208984375, -0.13909912109375, -0.11844635009765625, -0.0977935791015625, -0.07714080810546875, -0.056488037109375, -0.03583526611328125, -0.0151824951171875, 0.00547027587890625, 0.026123046875, 0.04677581787109375, 0.0674285888671875, 0.08808135986328125, 0.108734130859375, 0.12938690185546875, 0.1500396728515625, 0.17069244384765625, 0.19134521484375, 0.21199798583984375, 0.2326507568359375, 0.25330352783203125, 0.273956298828125, 0.29460906982421875, 0.3152618408203125, 0.33591461181640625, 0.3565673828125, 0.37722015380859375, 0.3978729248046875, 0.41852569580078125, 0.439178466796875, 0.45983123779296875, 0.4804840087890625, 0.5011367797851562, 0.52178955078125, 0.5424423217773438, 0.5630950927734375, 0.5837478637695312, 0.604400634765625, 0.6250534057617188, 0.6457061767578125, 0.6663589477539062, 0.68701171875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 7.0, 6.0, 9.0, 20.0, 20.0, 19.0, 30.0, 42.0, 53.0, 75.0, 87.0, 101.0, 88.0, 100.0, 75.0, 66.0, 50.0, 43.0, 29.0, 13.0, 18.0, 7.0, 9.0, 7.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36328125, -0.3512458801269531, -0.33921051025390625, -0.3271751403808594, -0.3151397705078125, -0.3031044006347656, -0.29106903076171875, -0.2790336608886719, -0.266998291015625, -0.2549629211425781, -0.24292755126953125, -0.23089218139648438, -0.2188568115234375, -0.20682144165039062, -0.19478607177734375, -0.18275070190429688, -0.17071533203125, -0.15867996215820312, -0.14664459228515625, -0.13460922241210938, -0.1225738525390625, -0.11053848266601562, -0.09850311279296875, -0.08646774291992188, -0.074432373046875, -0.062397003173828125, -0.05036163330078125, -0.038326263427734375, -0.0262908935546875, -0.014255523681640625, -0.00222015380859375, 0.009815216064453125, 0.0218505859375, 0.033885955810546875, 0.04592132568359375, 0.057956695556640625, 0.0699920654296875, 0.08202743530273438, 0.09406280517578125, 0.10609817504882812, 0.118133544921875, 0.13016891479492188, 0.14220428466796875, 0.15423965454101562, 0.1662750244140625, 0.17831039428710938, 0.19034576416015625, 0.20238113403320312, 0.21441650390625, 0.22645187377929688, 0.23848724365234375, 0.2505226135253906, 0.2625579833984375, 0.2745933532714844, 0.28662872314453125, 0.2986640930175781, 0.310699462890625, 0.3227348327636719, 0.33477020263671875, 0.3468055725097656, 0.3588409423828125, 0.3708763122558594, 0.38291168212890625, 0.3949470520019531, 0.406982421875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 7.0, 9.0, 16.0, 60.0, 125.0, 237.0, 262.0, 182.0, 65.0, 26.0, 14.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.279369354248047, -4.850130558013916, -4.420891284942627, -3.991652488708496, -3.5624136924743652, -3.1331746578216553, -2.7039356231689453, -2.2746968269348145, -1.8454577922821045, -1.416218876838684, -0.9869799017906189, -0.5577409267425537, -0.1285020112991333, 0.3007369041442871, 0.7299759387969971, 1.159214735031128, 1.588453769683838, 2.017692804336548, 2.4469316005706787, 2.8761706352233887, 3.3054094314575195, 3.7346484661102295, 4.1638875007629395, 4.59312629699707, 5.022365570068359, 5.45160436630249, 5.880843639373779, 6.31008243560791, 6.739321231842041, 7.168560028076172, 7.597799301147461, 8.02703857421875, 8.456276893615723, 8.885516166687012, 9.314754486083984, 9.743993759155273, 10.173233032226562, 10.602471351623535, 11.031710624694824, 11.460948944091797, 11.890188217163086, 12.319427490234375, 12.748665809631348, 13.177905082702637, 13.607144355773926, 14.036382675170898, 14.465621948242188, 14.894861221313477, 15.324100494384766, 15.753339767456055, 16.182579040527344, 16.61181640625, 17.04105567932129, 17.470294952392578, 17.899534225463867, 18.328773498535156, 18.758010864257812, 19.1872501373291, 19.61648941040039, 20.045726776123047, 20.474966049194336, 20.904205322265625, 21.333444595336914, 21.762683868408203, 22.191923141479492]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 6.0, 4.0, 7.0, 7.0, 8.0, 6.0, 13.0, 15.0, 9.0, 18.0, 19.0, 25.0, 26.0, 22.0, 32.0, 39.0, 30.0, 47.0, 33.0, 38.0, 50.0, 54.0, 47.0, 50.0, 44.0, 34.0, 29.0, 37.0, 31.0, 30.0, 33.0, 31.0, 24.0, 18.0, 15.0, 15.0, 10.0, 14.0, 6.0, 10.0, 7.0, 7.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.451831579208374, -3.325211524963379, -3.198591709136963, -3.0719716548919678, -2.9453516006469727, -2.8187317848205566, -2.6921117305755615, -2.5654916763305664, -2.4388718605041504, -2.3122518062591553, -2.1856319904327393, -2.059011936187744, -1.9323920011520386, -1.805772066116333, -1.679152011871338, -1.5525320768356323, -1.4259121417999268, -1.2992922067642212, -1.1726722717285156, -1.0460522174835205, -0.9194322824478149, -0.7928123474121094, -0.666192352771759, -0.5395723581314087, -0.4129524230957031, -0.28633245825767517, -0.15971249341964722, -0.03309252858161926, 0.09352743625640869, 0.22014737129211426, 0.3467673659324646, 0.47338736057281494, 0.6000075340270996, 0.7266274690628052, 0.8532474637031555, 0.9798674583435059, 1.1064873933792114, 1.233107328414917, 1.359727382659912, 1.4863473176956177, 1.6129672527313232, 1.7395871877670288, 1.8662071228027344, 1.9928271770477295, 2.1194472312927246, 2.2460670471191406, 2.3726871013641357, 2.499307155609131, 2.625926971435547, 2.752547025680542, 2.879166841506958, 3.005786895751953, 3.132406711578369, 3.2590267658233643, 3.3856468200683594, 3.5122666358947754, 3.6388866901397705, 3.7655067443847656, 3.8921265602111816, 4.018746376037598, 4.145366668701172, 4.271986484527588, 4.398606300354004, 4.525226593017578, 4.651846408843994]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 2.0, 2.0, 8.0, 13.0, 14.0, 14.0, 16.0, 29.0, 47.0, 72.0, 78.0, 144.0, 283.0, 481.0, 1185.0, 3145.0, 13519.0, 137933.0, 3929505.0, 92059.0, 10808.0, 2737.0, 1046.0, 479.0, 262.0, 157.0, 69.0, 46.0, 39.0, 21.0, 21.0, 16.0, 7.0, 8.0, 7.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8984375, -1.83990478515625, -1.7813720703125, -1.72283935546875, -1.664306640625, -1.60577392578125, -1.5472412109375, -1.48870849609375, -1.43017578125, -1.37164306640625, -1.3131103515625, -1.25457763671875, -1.196044921875, -1.13751220703125, -1.0789794921875, -1.02044677734375, -0.9619140625, -0.90338134765625, -0.8448486328125, -0.78631591796875, -0.727783203125, -0.66925048828125, -0.6107177734375, -0.55218505859375, -0.49365234375, -0.43511962890625, -0.3765869140625, -0.31805419921875, -0.259521484375, -0.20098876953125, -0.1424560546875, -0.08392333984375, -0.025390625, 0.03314208984375, 0.0916748046875, 0.15020751953125, 0.208740234375, 0.26727294921875, 0.3258056640625, 0.38433837890625, 0.44287109375, 0.50140380859375, 0.5599365234375, 0.61846923828125, 0.677001953125, 0.73553466796875, 0.7940673828125, 0.85260009765625, 0.9111328125, 0.96966552734375, 1.0281982421875, 1.08673095703125, 1.145263671875, 1.20379638671875, 1.2623291015625, 1.32086181640625, 1.37939453125, 1.43792724609375, 1.4964599609375, 1.55499267578125, 1.613525390625, 1.67205810546875, 1.7305908203125, 1.78912353515625, 1.84765625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 5.0, 0.0, 4.0, 4.0, 9.0, 3.0, 12.0, 18.0, 28.0, 23.0, 29.0, 50.0, 74.0, 73.0, 96.0, 84.0, 85.0, 75.0, 67.0, 66.0, 55.0, 43.0, 27.0, 22.0, 13.0, 12.0, 8.0, 6.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1763916015625, -0.1710186004638672, -0.16564559936523438, -0.16027259826660156, -0.15489959716796875, -0.14952659606933594, -0.14415359497070312, -0.1387805938720703, -0.1334075927734375, -0.1280345916748047, -0.12266159057617188, -0.11728858947753906, -0.11191558837890625, -0.10654258728027344, -0.10116958618164062, -0.09579658508300781, -0.090423583984375, -0.08505058288574219, -0.07967758178710938, -0.07430458068847656, -0.06893157958984375, -0.06355857849121094, -0.058185577392578125, -0.05281257629394531, -0.0474395751953125, -0.04206657409667969, -0.036693572998046875, -0.03132057189941406, -0.02594757080078125, -0.020574569702148438, -0.015201568603515625, -0.009828567504882812, -0.00445556640625, 0.0009174346923828125, 0.006290435791015625, 0.011663436889648438, 0.01703643798828125, 0.022409439086914062, 0.027782440185546875, 0.03315544128417969, 0.0385284423828125, 0.04390144348144531, 0.049274444580078125, 0.05464744567871094, 0.06002044677734375, 0.06539344787597656, 0.07076644897460938, 0.07613945007324219, 0.081512451171875, 0.08688545227050781, 0.09225845336914062, 0.09763145446777344, 0.10300445556640625, 0.10837745666503906, 0.11375045776367188, 0.11912345886230469, 0.1244964599609375, 0.1298694610595703, 0.13524246215820312, 0.14061546325683594, 0.14598846435546875, 0.15136146545410156, 0.15673446655273438, 0.1621074676513672, 0.16748046875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 1.0, 4.0, 10.0, 11.0, 35.0, 23.0, 43.0, 63.0, 109.0, 187.0, 311.0, 615.0, 1176.0, 2768.0, 7322.0, 23941.0, 125437.0, 3421036.0, 534140.0, 55488.0, 13269.0, 4592.0, 1817.0, 844.0, 445.0, 238.0, 130.0, 90.0, 49.0, 32.0, 18.0, 11.0, 7.0, 2.0, 8.0, 8.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.373046875, -1.329833984375, -1.28662109375, -1.243408203125, -1.2001953125, -1.156982421875, -1.11376953125, -1.070556640625, -1.02734375, -0.984130859375, -0.94091796875, -0.897705078125, -0.8544921875, -0.811279296875, -0.76806640625, -0.724853515625, -0.681640625, -0.638427734375, -0.59521484375, -0.552001953125, -0.5087890625, -0.465576171875, -0.42236328125, -0.379150390625, -0.3359375, -0.292724609375, -0.24951171875, -0.206298828125, -0.1630859375, -0.119873046875, -0.07666015625, -0.033447265625, 0.009765625, 0.052978515625, 0.09619140625, 0.139404296875, 0.1826171875, 0.225830078125, 0.26904296875, 0.312255859375, 0.35546875, 0.398681640625, 0.44189453125, 0.485107421875, 0.5283203125, 0.571533203125, 0.61474609375, 0.657958984375, 0.701171875, 0.744384765625, 0.78759765625, 0.830810546875, 0.8740234375, 0.917236328125, 0.96044921875, 1.003662109375, 1.046875, 1.090087890625, 1.13330078125, 1.176513671875, 1.2197265625, 1.262939453125, 1.30615234375, 1.349365234375, 1.392578125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 7.0, 8.0, 8.0, 13.0, 16.0, 26.0, 38.0, 44.0, 90.0, 173.0, 327.0, 1068.0, 1446.0, 350.0, 173.0, 86.0, 61.0, 36.0, 31.0, 29.0, 12.0, 9.0, 7.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.326171875, -0.3159942626953125, -0.305816650390625, -0.2956390380859375, -0.28546142578125, -0.2752838134765625, -0.265106201171875, -0.2549285888671875, -0.2447509765625, -0.2345733642578125, -0.224395751953125, -0.2142181396484375, -0.20404052734375, -0.1938629150390625, -0.183685302734375, -0.1735076904296875, -0.163330078125, -0.1531524658203125, -0.142974853515625, -0.1327972412109375, -0.12261962890625, -0.1124420166015625, -0.102264404296875, -0.0920867919921875, -0.0819091796875, -0.0717315673828125, -0.061553955078125, -0.0513763427734375, -0.04119873046875, -0.0310211181640625, -0.020843505859375, -0.0106658935546875, -0.00048828125, 0.0096893310546875, 0.019866943359375, 0.0300445556640625, 0.04022216796875, 0.0503997802734375, 0.060577392578125, 0.0707550048828125, 0.0809326171875, 0.0911102294921875, 0.101287841796875, 0.1114654541015625, 0.12164306640625, 0.1318206787109375, 0.141998291015625, 0.1521759033203125, 0.162353515625, 0.1725311279296875, 0.182708740234375, 0.1928863525390625, 0.20306396484375, 0.2132415771484375, 0.223419189453125, 0.2335968017578125, 0.2437744140625, 0.2539520263671875, 0.264129638671875, 0.2743072509765625, 0.28448486328125, 0.2946624755859375, 0.304840087890625, 0.3150177001953125, 0.3251953125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 5.0, 5.0, 9.0, 25.0, 51.0, 151.0, 184.0, 243.0, 176.0, 92.0, 37.0, 15.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0574164390563965, -1.9604787826538086, -1.8635412454605103, -1.7666035890579224, -1.669666051864624, -1.5727283954620361, -1.4757907390594482, -1.37885320186615, -1.2819156646728516, -1.1849780082702637, -1.0880404710769653, -0.9911028146743774, -0.8941652774810791, -0.7972276210784912, -0.7002900242805481, -0.603352427482605, -0.5064147710800171, -0.409477174282074, -0.31253957748413086, -0.21560195088386536, -0.11866435408592224, -0.021726757287979126, 0.07521086931228638, 0.1721484661102295, 0.2690860629081726, 0.3660236597061157, 0.46296125650405884, 0.559898853302002, 0.6568365097045898, 0.7537740468978882, 0.8507117033004761, 0.9476493000984192, 1.0445868968963623, 1.1415245532989502, 1.2384620904922485, 1.3353997468948364, 1.4323372840881348, 1.5292749404907227, 1.6262125968933105, 1.7231501340866089, 1.8200876712799072, 1.9170253276824951, 2.013962984085083, 2.110900402069092, 2.2078380584716797, 2.3047757148742676, 2.4017133712768555, 2.4986510276794434, 2.5955886840820312, 2.692526340484619, 2.789463996887207, 2.886401414871216, 2.9833390712738037, 3.0802767276763916, 3.1772143840789795, 3.2741518020629883, 3.371089458465576, 3.468027114868164, 3.564964771270752, 3.6619021892547607, 3.7588398456573486, 3.8557775020599365, 3.9527151584625244, 4.049652576446533, 4.146590232849121]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 2.0, 3.0, 3.0, 4.0, 11.0, 11.0, 12.0, 15.0, 19.0, 21.0, 26.0, 21.0, 25.0, 29.0, 34.0, 37.0, 39.0, 38.0, 35.0, 47.0, 36.0, 37.0, 33.0, 44.0, 53.0, 50.0, 44.0, 32.0, 37.0, 28.0, 31.0, 14.0, 22.0, 21.0, 11.0, 12.0, 14.0, 8.0, 6.0, 4.0, 10.0, 2.0, 6.0, 7.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.8738830089569092, -0.8464518785476685, -0.8190207481384277, -0.791589617729187, -0.7641584873199463, -0.7367273569107056, -0.7092962861061096, -0.6818651556968689, -0.6544340252876282, -0.6270028948783875, -0.5995717644691467, -0.572140634059906, -0.5447095632553101, -0.5172784328460693, -0.4898473024368286, -0.4624161720275879, -0.43498504161834717, -0.40755391120910645, -0.3801227807998657, -0.3526916801929474, -0.32526054978370667, -0.29782941937446594, -0.2703983187675476, -0.24296718835830688, -0.21553605794906616, -0.18810492753982544, -0.1606738120317459, -0.13324269652366638, -0.10581156611442566, -0.07838043570518494, -0.05094932019710541, -0.02351820468902588, 0.003912925720214844, 0.03134404867887497, 0.058775171637535095, 0.08620629459619522, 0.11363741755485535, 0.14106854796409607, 0.1684996634721756, 0.19593077898025513, 0.22336190938949585, 0.2507930397987366, 0.2782241702079773, 0.30565527081489563, 0.33308640122413635, 0.3605175316333771, 0.3879486322402954, 0.41537976264953613, 0.44281089305877686, 0.4702420234680176, 0.4976731538772583, 0.525104284286499, 0.5525354146957397, 0.5799665451049805, 0.6073976159095764, 0.6348287463188171, 0.6622598767280579, 0.6896910071372986, 0.7171221375465393, 0.74455326795578, 0.771984338760376, 0.7994154691696167, 0.8268465995788574, 0.8542777299880981, 0.8817088603973389]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 8.0, 10.0, 9.0, 17.0, 17.0, 48.0, 61.0, 104.0, 147.0, 241.0, 372.0, 615.0, 1188.0, 2753.0, 7437.0, 26133.0, 105382.0, 397785.0, 373024.0, 96630.0, 23958.0, 7110.0, 2638.0, 1194.0, 621.0, 392.0, 244.0, 142.0, 82.0, 63.0, 33.0, 38.0, 13.0, 12.0, 8.0, 6.0, 8.0, 5.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.111328125, -1.07861328125, -1.0458984375, -1.01318359375, -0.98046875, -0.94775390625, -0.9150390625, -0.88232421875, -0.849609375, -0.81689453125, -0.7841796875, -0.75146484375, -0.71875, -0.68603515625, -0.6533203125, -0.62060546875, -0.587890625, -0.55517578125, -0.5224609375, -0.48974609375, -0.45703125, -0.42431640625, -0.3916015625, -0.35888671875, -0.326171875, -0.29345703125, -0.2607421875, -0.22802734375, -0.1953125, -0.16259765625, -0.1298828125, -0.09716796875, -0.064453125, -0.03173828125, 0.0009765625, 0.03369140625, 0.06640625, 0.09912109375, 0.1318359375, 0.16455078125, 0.197265625, 0.22998046875, 0.2626953125, 0.29541015625, 0.328125, 0.36083984375, 0.3935546875, 0.42626953125, 0.458984375, 0.49169921875, 0.5244140625, 0.55712890625, 0.58984375, 0.62255859375, 0.6552734375, 0.68798828125, 0.720703125, 0.75341796875, 0.7861328125, 0.81884765625, 0.8515625, 0.88427734375, 0.9169921875, 0.94970703125, 0.982421875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 8.0, 7.0, 11.0, 8.0, 21.0, 34.0, 35.0, 43.0, 49.0, 65.0, 83.0, 85.0, 65.0, 72.0, 76.0, 56.0, 71.0, 49.0, 40.0, 33.0, 18.0, 23.0, 15.0, 8.0, 3.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1771240234375, -0.17185592651367188, -0.16658782958984375, -0.16131973266601562, -0.1560516357421875, -0.15078353881835938, -0.14551544189453125, -0.14024734497070312, -0.134979248046875, -0.12971115112304688, -0.12444305419921875, -0.11917495727539062, -0.1139068603515625, -0.10863876342773438, -0.10337066650390625, -0.09810256958007812, -0.09283447265625, -0.08756637573242188, -0.08229827880859375, -0.07703018188476562, -0.0717620849609375, -0.06649398803710938, -0.06122589111328125, -0.055957794189453125, -0.050689697265625, -0.045421600341796875, -0.04015350341796875, -0.034885406494140625, -0.0296173095703125, -0.024349212646484375, -0.01908111572265625, -0.013813018798828125, -0.008544921875, -0.003276824951171875, 0.00199127197265625, 0.007259368896484375, 0.0125274658203125, 0.017795562744140625, 0.02306365966796875, 0.028331756591796875, 0.033599853515625, 0.038867950439453125, 0.04413604736328125, 0.049404144287109375, 0.0546722412109375, 0.059940338134765625, 0.06520843505859375, 0.07047653198242188, 0.07574462890625, 0.08101272583007812, 0.08628082275390625, 0.09154891967773438, 0.0968170166015625, 0.10208511352539062, 0.10735321044921875, 0.11262130737304688, 0.117889404296875, 0.12315750122070312, 0.12842559814453125, 0.13369369506835938, 0.1389617919921875, 0.14422988891601562, 0.14949798583984375, 0.15476608276367188, 0.1600341796875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 4.0, 4.0, 8.0, 9.0, 12.0, 11.0, 23.0, 32.0, 48.0, 68.0, 73.0, 87.0, 139.0, 178.0, 246.0, 355.0, 559.0, 779.0, 1225.0, 2031.0, 4096.0, 10053.0, 29125.0, 91384.0, 261185.0, 383049.0, 173928.0, 56892.0, 18371.0, 6757.0, 2979.0, 1609.0, 1022.0, 648.0, 410.0, 300.0, 212.0, 197.0, 136.0, 93.0, 63.0, 40.0, 32.0, 33.0, 19.0, 7.0, 13.0, 5.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.76708984375, -0.7425765991210938, -0.7180633544921875, -0.6935501098632812, -0.669036865234375, -0.6445236206054688, -0.6200103759765625, -0.5954971313476562, -0.57098388671875, -0.5464706420898438, -0.5219573974609375, -0.49744415283203125, -0.472930908203125, -0.44841766357421875, -0.4239044189453125, -0.39939117431640625, -0.3748779296875, -0.35036468505859375, -0.3258514404296875, -0.30133819580078125, -0.276824951171875, -0.25231170654296875, -0.2277984619140625, -0.20328521728515625, -0.17877197265625, -0.15425872802734375, -0.1297454833984375, -0.10523223876953125, -0.080718994140625, -0.05620574951171875, -0.0316925048828125, -0.00717926025390625, 0.017333984375, 0.04184722900390625, 0.0663604736328125, 0.09087371826171875, 0.115386962890625, 0.13990020751953125, 0.1644134521484375, 0.18892669677734375, 0.21343994140625, 0.23795318603515625, 0.2624664306640625, 0.28697967529296875, 0.311492919921875, 0.33600616455078125, 0.3605194091796875, 0.38503265380859375, 0.4095458984375, 0.43405914306640625, 0.4585723876953125, 0.48308563232421875, 0.507598876953125, 0.5321121215820312, 0.5566253662109375, 0.5811386108398438, 0.60565185546875, 0.6301651000976562, 0.6546783447265625, 0.6791915893554688, 0.703704833984375, 0.7282180786132812, 0.7527313232421875, 0.7772445678710938, 0.8017578125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 7.0, 5.0, 6.0, 10.0, 15.0, 10.0, 15.0, 19.0, 15.0, 25.0, 26.0, 30.0, 40.0, 38.0, 31.0, 33.0, 50.0, 48.0, 53.0, 53.0, 54.0, 50.0, 49.0, 26.0, 30.0, 35.0, 28.0, 38.0, 28.0, 24.0, 22.0, 15.0, 21.0, 11.0, 10.0, 5.0, 11.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.59814453125, -0.5786972045898438, -0.5592498779296875, -0.5398025512695312, -0.520355224609375, -0.5009078979492188, -0.4814605712890625, -0.46201324462890625, -0.44256591796875, -0.42311859130859375, -0.4036712646484375, -0.38422393798828125, -0.364776611328125, -0.34532928466796875, -0.3258819580078125, -0.30643463134765625, -0.2869873046875, -0.26753997802734375, -0.2480926513671875, -0.22864532470703125, -0.209197998046875, -0.18975067138671875, -0.1703033447265625, -0.15085601806640625, -0.13140869140625, -0.11196136474609375, -0.0925140380859375, -0.07306671142578125, -0.053619384765625, -0.03417205810546875, -0.0147247314453125, 0.00472259521484375, 0.024169921875, 0.04361724853515625, 0.0630645751953125, 0.08251190185546875, 0.101959228515625, 0.12140655517578125, 0.1408538818359375, 0.16030120849609375, 0.17974853515625, 0.19919586181640625, 0.2186431884765625, 0.23809051513671875, 0.257537841796875, 0.27698516845703125, 0.2964324951171875, 0.31587982177734375, 0.3353271484375, 0.35477447509765625, 0.3742218017578125, 0.39366912841796875, 0.413116455078125, 0.43256378173828125, 0.4520111083984375, 0.47145843505859375, 0.49090576171875, 0.5103530883789062, 0.5298004150390625, 0.5492477416992188, 0.568695068359375, 0.5881423950195312, 0.6075897216796875, 0.6270370483398438, 0.646484375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 7.0, 9.0, 14.0, 21.0, 27.0, 31.0, 55.0, 71.0, 113.0, 235.0, 463.0, 1067.0, 2731.0, 9865.0, 55613.0, 554196.0, 375724.0, 36768.0, 7407.0, 2325.0, 878.0, 401.0, 206.0, 107.0, 66.0, 47.0, 34.0, 25.0, 13.0, 6.0, 2.0, 4.0, 7.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6904296875, -0.6687850952148438, -0.6471405029296875, -0.6254959106445312, -0.603851318359375, -0.5822067260742188, -0.5605621337890625, -0.5389175415039062, -0.51727294921875, -0.49562835693359375, -0.4739837646484375, -0.45233917236328125, -0.430694580078125, -0.40904998779296875, -0.3874053955078125, -0.36576080322265625, -0.3441162109375, -0.32247161865234375, -0.3008270263671875, -0.27918243408203125, -0.257537841796875, -0.23589324951171875, -0.2142486572265625, -0.19260406494140625, -0.17095947265625, -0.14931488037109375, -0.1276702880859375, -0.10602569580078125, -0.084381103515625, -0.06273651123046875, -0.0410919189453125, -0.01944732666015625, 0.002197265625, 0.02384185791015625, 0.0454864501953125, 0.06713104248046875, 0.088775634765625, 0.11042022705078125, 0.1320648193359375, 0.15370941162109375, 0.17535400390625, 0.19699859619140625, 0.2186431884765625, 0.24028778076171875, 0.261932373046875, 0.28357696533203125, 0.3052215576171875, 0.32686614990234375, 0.3485107421875, 0.37015533447265625, 0.3917999267578125, 0.41344451904296875, 0.435089111328125, 0.45673370361328125, 0.4783782958984375, 0.5000228881835938, 0.52166748046875, 0.5433120727539062, 0.5649566650390625, 0.5866012573242188, 0.608245849609375, 0.6298904418945312, 0.6515350341796875, 0.6731796264648438, 0.69482421875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 0.0, 4.0, 7.0, 12.0, 22.0, 17.0, 25.0, 35.0, 32.0, 55.0, 69.0, 61.0, 69.0, 97.0, 87.0, 63.0, 66.0, 46.0, 65.0, 47.0, 33.0, 29.0, 11.0, 20.0, 9.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.00010943412780761719, -0.00010684318840503693, -0.00010425224900245667, -0.0001016613095998764, -9.907037019729614e-05, -9.647943079471588e-05, -9.388849139213562e-05, -9.129755198955536e-05, -8.87066125869751e-05, -8.611567318439484e-05, -8.352473378181458e-05, -8.093379437923431e-05, -7.834285497665405e-05, -7.575191557407379e-05, -7.316097617149353e-05, -7.057003676891327e-05, -6.797909736633301e-05, -6.538815796375275e-05, -6.279721856117249e-05, -6.0206279158592224e-05, -5.761533975601196e-05, -5.50244003534317e-05, -5.243346095085144e-05, -4.984252154827118e-05, -4.725158214569092e-05, -4.466064274311066e-05, -4.2069703340530396e-05, -3.9478763937950134e-05, -3.688782453536987e-05, -3.429688513278961e-05, -3.170594573020935e-05, -2.911500632762909e-05, -2.6524066925048828e-05, -2.3933127522468567e-05, -2.1342188119888306e-05, -1.8751248717308044e-05, -1.6160309314727783e-05, -1.3569369912147522e-05, -1.097843050956726e-05, -8.387491106987e-06, -5.796551704406738e-06, -3.205612301826477e-06, -6.146728992462158e-07, 1.9762665033340454e-06, 4.567205905914307e-06, 7.158145308494568e-06, 9.749084711074829e-06, 1.234002411365509e-05, 1.4930963516235352e-05, 1.7521902918815613e-05, 2.0112842321395874e-05, 2.2703781723976135e-05, 2.5294721126556396e-05, 2.7885660529136658e-05, 3.047659993171692e-05, 3.306753933429718e-05, 3.565847873687744e-05, 3.82494181394577e-05, 4.0840357542037964e-05, 4.3431296944618225e-05, 4.6022236347198486e-05, 4.861317574977875e-05, 5.120411515235901e-05, 5.379505455493927e-05, 5.638599395751953e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 0.0, 5.0, 7.0, 11.0, 8.0, 13.0, 20.0, 32.0, 31.0, 52.0, 93.0, 142.0, 230.0, 405.0, 718.0, 1663.0, 4320.0, 13900.0, 69611.0, 585666.0, 318829.0, 37973.0, 9124.0, 2986.0, 1243.0, 588.0, 352.0, 183.0, 115.0, 62.0, 53.0, 30.0, 21.0, 19.0, 13.0, 8.0, 10.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.7119140625, -0.692047119140625, -0.67218017578125, -0.652313232421875, -0.6324462890625, -0.612579345703125, -0.59271240234375, -0.572845458984375, -0.552978515625, -0.533111572265625, -0.51324462890625, -0.493377685546875, -0.4735107421875, -0.453643798828125, -0.43377685546875, -0.413909912109375, -0.39404296875, -0.374176025390625, -0.35430908203125, -0.334442138671875, -0.3145751953125, -0.294708251953125, -0.27484130859375, -0.254974365234375, -0.235107421875, -0.215240478515625, -0.19537353515625, -0.175506591796875, -0.1556396484375, -0.135772705078125, -0.11590576171875, -0.096038818359375, -0.076171875, -0.056304931640625, -0.03643798828125, -0.016571044921875, 0.0032958984375, 0.023162841796875, 0.04302978515625, 0.062896728515625, 0.082763671875, 0.102630615234375, 0.12249755859375, 0.142364501953125, 0.1622314453125, 0.182098388671875, 0.20196533203125, 0.221832275390625, 0.24169921875, 0.261566162109375, 0.28143310546875, 0.301300048828125, 0.3211669921875, 0.341033935546875, 0.36090087890625, 0.380767822265625, 0.400634765625, 0.420501708984375, 0.44036865234375, 0.460235595703125, 0.4801025390625, 0.499969482421875, 0.51983642578125, 0.539703369140625, 0.5595703125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 8.0, 5.0, 14.0, 13.0, 13.0, 29.0, 36.0, 49.0, 76.0, 106.0, 115.0, 132.0, 112.0, 80.0, 73.0, 44.0, 31.0, 20.0, 12.0, 10.0, 7.0, 7.0, 2.0, 3.0, 0.0, 0.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.54150390625, -0.5269203186035156, -0.5123367309570312, -0.4977531433105469, -0.4831695556640625, -0.4685859680175781, -0.45400238037109375, -0.4394187927246094, -0.424835205078125, -0.4102516174316406, -0.39566802978515625, -0.3810844421386719, -0.3665008544921875, -0.3519172668457031, -0.33733367919921875, -0.3227500915527344, -0.30816650390625, -0.2935829162597656, -0.27899932861328125, -0.2644157409667969, -0.2498321533203125, -0.23524856567382812, -0.22066497802734375, -0.20608139038085938, -0.191497802734375, -0.17691421508789062, -0.16233062744140625, -0.14774703979492188, -0.1331634521484375, -0.11857986450195312, -0.10399627685546875, -0.08941268920898438, -0.0748291015625, -0.060245513916015625, -0.04566192626953125, -0.031078338623046875, -0.0164947509765625, -0.001911163330078125, 0.01267242431640625, 0.027256011962890625, 0.041839599609375, 0.056423187255859375, 0.07100677490234375, 0.08559036254882812, 0.1001739501953125, 0.11475753784179688, 0.12934112548828125, 0.14392471313476562, 0.15850830078125, 0.17309188842773438, 0.18767547607421875, 0.20225906372070312, 0.2168426513671875, 0.23142623901367188, 0.24600982666015625, 0.2605934143066406, 0.275177001953125, 0.2897605895996094, 0.30434417724609375, 0.3189277648925781, 0.3335113525390625, 0.3480949401855469, 0.36267852783203125, 0.3772621154785156, 0.391845703125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 11.0, 14.0, 24.0, 27.0, 57.0, 106.0, 123.0, 122.0, 161.0, 116.0, 72.0, 57.0, 41.0, 20.0, 21.0, 8.0, 7.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.110924243927002, -6.928389072418213, -6.745853900909424, -6.563318729400635, -6.380783557891846, -6.198248386383057, -6.015713691711426, -5.833178520202637, -5.650643348693848, -5.468108177185059, -5.2855730056762695, -5.1030378341674805, -4.920502662658691, -4.737967491149902, -4.555432319641113, -4.372897148132324, -4.190361976623535, -4.007826805114746, -3.825291633605957, -3.642756462097168, -3.460221290588379, -3.27768611907959, -3.09515118598938, -2.912616014480591, -2.7300808429718018, -2.5475456714630127, -2.3650104999542236, -2.1824755668640137, -1.999940276145935, -1.817405104637146, -1.6348700523376465, -1.4523348808288574, -1.2697997093200684, -1.0872645378112793, -0.904729425907135, -0.7221943140029907, -0.5396591424942017, -0.3571239709854126, -0.17458891868591309, 0.007946252822875977, 0.19048142433166504, 0.3730165660381317, 0.5555517077445984, 0.7380868196487427, 0.9206219911575317, 1.1031571626663208, 1.2856922149658203, 1.4682273864746094, 1.6507625579833984, 1.8332977294921875, 2.0158329010009766, 2.1983680725097656, 2.3809032440185547, 2.5634384155273438, 2.7459733486175537, 2.9285085201263428, 3.111043691635132, 3.293578863143921, 3.47611403465271, 3.65864896774292, 3.841184139251709, 4.023719310760498, 4.206254482269287, 4.388789653778076, 4.571324825286865]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 6.0, 7.0, 9.0, 9.0, 7.0, 11.0, 13.0, 14.0, 16.0, 20.0, 11.0, 22.0, 35.0, 29.0, 43.0, 39.0, 34.0, 43.0, 44.0, 50.0, 53.0, 41.0, 44.0, 35.0, 42.0, 49.0, 30.0, 32.0, 29.0, 32.0, 20.0, 21.0, 13.0, 19.0, 15.0, 13.0, 11.0, 5.0, 5.0, 12.0, 8.0, 0.0, 5.0, 3.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 1.0], "bins": [-3.5399158000946045, -3.4354758262634277, -3.33103609085083, -3.2265961170196533, -3.1221561431884766, -3.017716407775879, -2.913276433944702, -2.8088364601135254, -2.7043967247009277, -2.599956750869751, -2.4955170154571533, -2.3910770416259766, -2.286637306213379, -2.182197332382202, -2.0777573585510254, -1.9733175039291382, -1.868877649307251, -1.7644377946853638, -1.6599979400634766, -1.5555579662322998, -1.4511181116104126, -1.3466782569885254, -1.2422382831573486, -1.1377984285354614, -1.0333585739135742, -0.928918719291687, -0.824478805065155, -0.720038890838623, -0.6155990362167358, -0.5111591815948486, -0.40671926736831665, -0.30227935314178467, -0.19783949851989746, -0.09339961409568787, 0.011040270328521729, 0.11548015475273132, 0.21992003917694092, 0.3243598937988281, 0.4287998080253601, 0.5332397222518921, 0.6376795768737793, 0.7421194314956665, 0.8465593457221985, 0.9509992599487305, 1.0554391145706177, 1.1598789691925049, 1.2643189430236816, 1.3687587976455688, 1.473198652267456, 1.5776385068893433, 1.6820783615112305, 1.7865183353424072, 1.8909581899642944, 1.9953980445861816, 2.0998380184173584, 2.204277992248535, 2.308717727661133, 2.4131577014923096, 2.5175974369049072, 2.622037410736084, 2.7264771461486816, 2.8309171199798584, 2.935357093811035, 3.039796829223633, 3.1442368030548096]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 8.0, 8.0, 10.0, 9.0, 20.0, 21.0, 29.0, 42.0, 88.0, 109.0, 182.0, 350.0, 595.0, 1155.0, 2468.0, 6027.0, 18359.0, 85715.0, 3590493.0, 426200.0, 43003.0, 11437.0, 4102.0, 1731.0, 874.0, 487.0, 283.0, 163.0, 107.0, 67.0, 48.0, 30.0, 14.0, 17.0, 5.0, 8.0, 5.0, 5.0, 4.0, 6.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.017578125, -0.9845428466796875, -0.951507568359375, -0.9184722900390625, -0.88543701171875, -0.8524017333984375, -0.819366455078125, -0.7863311767578125, -0.7532958984375, -0.7202606201171875, -0.687225341796875, -0.6541900634765625, -0.62115478515625, -0.5881195068359375, -0.555084228515625, -0.5220489501953125, -0.489013671875, -0.4559783935546875, -0.422943115234375, -0.3899078369140625, -0.35687255859375, -0.3238372802734375, -0.290802001953125, -0.2577667236328125, -0.2247314453125, -0.1916961669921875, -0.158660888671875, -0.1256256103515625, -0.09259033203125, -0.0595550537109375, -0.026519775390625, 0.0065155029296875, 0.03955078125, 0.0725860595703125, 0.105621337890625, 0.1386566162109375, 0.17169189453125, 0.2047271728515625, 0.237762451171875, 0.2707977294921875, 0.3038330078125, 0.3368682861328125, 0.369903564453125, 0.4029388427734375, 0.43597412109375, 0.4690093994140625, 0.502044677734375, 0.5350799560546875, 0.568115234375, 0.6011505126953125, 0.634185791015625, 0.6672210693359375, 0.70025634765625, 0.7332916259765625, 0.766326904296875, 0.7993621826171875, 0.8323974609375, 0.8654327392578125, 0.898468017578125, 0.9315032958984375, 0.96453857421875, 0.9975738525390625, 1.030609130859375, 1.0636444091796875, 1.0966796875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 2.0, 2.0, 7.0, 11.0, 20.0, 29.0, 29.0, 43.0, 45.0, 51.0, 55.0, 79.0, 73.0, 93.0, 87.0, 65.0, 64.0, 41.0, 44.0, 36.0, 33.0, 29.0, 17.0, 10.0, 4.0, 9.0, 8.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1964111328125, -0.19086074829101562, -0.18531036376953125, -0.17975997924804688, -0.1742095947265625, -0.16865921020507812, -0.16310882568359375, -0.15755844116210938, -0.152008056640625, -0.14645767211914062, -0.14090728759765625, -0.13535690307617188, -0.1298065185546875, -0.12425613403320312, -0.11870574951171875, -0.11315536499023438, -0.10760498046875, -0.10205459594726562, -0.09650421142578125, -0.09095382690429688, -0.0854034423828125, -0.07985305786132812, -0.07430267333984375, -0.06875228881835938, -0.063201904296875, -0.057651519775390625, -0.05210113525390625, -0.046550750732421875, -0.0410003662109375, -0.035449981689453125, -0.02989959716796875, -0.024349212646484375, -0.018798828125, -0.013248443603515625, -0.00769805908203125, -0.002147674560546875, 0.0034027099609375, 0.008953094482421875, 0.01450347900390625, 0.020053863525390625, 0.025604248046875, 0.031154632568359375, 0.03670501708984375, 0.042255401611328125, 0.0478057861328125, 0.053356170654296875, 0.05890655517578125, 0.06445693969726562, 0.07000732421875, 0.07555770874023438, 0.08110809326171875, 0.08665847778320312, 0.0922088623046875, 0.09775924682617188, 0.10330963134765625, 0.10886001586914062, 0.114410400390625, 0.11996078491210938, 0.12551116943359375, 0.13106155395507812, 0.1366119384765625, 0.14216232299804688, 0.14771270751953125, 0.15326309204101562, 0.1588134765625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 8.0, 6.0, 5.0, 16.0, 21.0, 24.0, 23.0, 39.0, 59.0, 87.0, 161.0, 243.0, 437.0, 788.0, 1365.0, 2873.0, 6356.0, 17416.0, 64074.0, 500978.0, 3380105.0, 163611.0, 34856.0, 11376.0, 4560.0, 2125.0, 1139.0, 595.0, 386.0, 206.0, 111.0, 78.0, 51.0, 34.0, 30.0, 15.0, 10.0, 10.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-1.1201171875, -1.090057373046875, -1.05999755859375, -1.029937744140625, -0.9998779296875, -0.969818115234375, -0.93975830078125, -0.909698486328125, -0.879638671875, -0.849578857421875, -0.81951904296875, -0.789459228515625, -0.7593994140625, -0.729339599609375, -0.69927978515625, -0.669219970703125, -0.63916015625, -0.609100341796875, -0.57904052734375, -0.548980712890625, -0.5189208984375, -0.488861083984375, -0.45880126953125, -0.428741455078125, -0.398681640625, -0.368621826171875, -0.33856201171875, -0.308502197265625, -0.2784423828125, -0.248382568359375, -0.21832275390625, -0.188262939453125, -0.158203125, -0.128143310546875, -0.09808349609375, -0.068023681640625, -0.0379638671875, -0.007904052734375, 0.02215576171875, 0.052215576171875, 0.082275390625, 0.112335205078125, 0.14239501953125, 0.172454833984375, 0.2025146484375, 0.232574462890625, 0.26263427734375, 0.292694091796875, 0.32275390625, 0.352813720703125, 0.38287353515625, 0.412933349609375, 0.4429931640625, 0.473052978515625, 0.50311279296875, 0.533172607421875, 0.563232421875, 0.593292236328125, 0.62335205078125, 0.653411865234375, 0.6834716796875, 0.713531494140625, 0.74359130859375, 0.773651123046875, 0.8037109375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 1.0, 3.0, 8.0, 5.0, 4.0, 7.0, 14.0, 18.0, 20.0, 30.0, 48.0, 74.0, 92.0, 166.0, 359.0, 1481.0, 853.0, 315.0, 189.0, 108.0, 65.0, 55.0, 46.0, 27.0, 21.0, 13.0, 11.0, 8.0, 9.0, 5.0, 4.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.260986328125, -0.2537117004394531, -0.24643707275390625, -0.23916244506835938, -0.2318878173828125, -0.22461318969726562, -0.21733856201171875, -0.21006393432617188, -0.202789306640625, -0.19551467895507812, -0.18824005126953125, -0.18096542358398438, -0.1736907958984375, -0.16641616821289062, -0.15914154052734375, -0.15186691284179688, -0.14459228515625, -0.13731765747070312, -0.13004302978515625, -0.12276840209960938, -0.1154937744140625, -0.10821914672851562, -0.10094451904296875, -0.09366989135742188, -0.086395263671875, -0.07912063598632812, -0.07184600830078125, -0.06457138061523438, -0.0572967529296875, -0.050022125244140625, -0.04274749755859375, -0.035472869873046875, -0.0281982421875, -0.020923614501953125, -0.01364898681640625, -0.006374359130859375, 0.0009002685546875, 0.008174896240234375, 0.01544952392578125, 0.022724151611328125, 0.029998779296875, 0.037273406982421875, 0.04454803466796875, 0.051822662353515625, 0.0590972900390625, 0.06637191772460938, 0.07364654541015625, 0.08092117309570312, 0.08819580078125, 0.09547042846679688, 0.10274505615234375, 0.11001968383789062, 0.1172943115234375, 0.12456893920898438, 0.13184356689453125, 0.13911819458007812, 0.146392822265625, 0.15366744995117188, 0.16094207763671875, 0.16821670532226562, 0.1754913330078125, 0.18276596069335938, 0.19004058837890625, 0.19731521606445312, 0.20458984375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 9.0, 16.0, 35.0, 67.0, 109.0, 159.0, 173.0, 167.0, 102.0, 65.0, 46.0, 21.0, 13.0, 9.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.824238896369934, -1.7545937299728394, -1.6849486827850342, -1.6153035163879395, -1.5456583499908447, -1.4760133028030396, -1.4063681364059448, -1.3367230892181396, -1.267077922821045, -1.1974327564239502, -1.127787709236145, -1.0581425428390503, -0.9884974360466003, -0.9188523292541504, -0.8492071628570557, -0.7795620560646057, -0.7099169492721558, -0.6402718424797058, -0.5706267356872559, -0.5009815692901611, -0.4313364624977112, -0.36169135570526123, -0.2920462191104889, -0.22240108251571655, -0.1527559757232666, -0.08311085402965546, -0.013465732336044312, 0.056179389357566833, 0.12582451105117798, 0.19546961784362793, 0.26511475443840027, 0.3347598910331726, 0.4044051170349121, 0.47405022382736206, 0.543695330619812, 0.6133404970169067, 0.6829856038093567, 0.7526307106018066, 0.8222758769989014, 0.8919209837913513, 0.9615660905838013, 1.031211256980896, 1.1008563041687012, 1.170501470565796, 1.2401466369628906, 1.3097916841506958, 1.3794368505477905, 1.4490818977355957, 1.5187270641326904, 1.5883722305297852, 1.6580172777175903, 1.727662444114685, 1.7973074913024902, 1.866952657699585, 1.9365978240966797, 2.0062429904937744, 2.075888156890869, 2.145533323287964, 2.2151784896850586, 2.284823417663574, 2.354468584060669, 2.4241137504577637, 2.4937589168548584, 2.563404083251953, 2.6330490112304688]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 10.0, 4.0, 11.0, 10.0, 16.0, 15.0, 14.0, 14.0, 15.0, 18.0, 26.0, 34.0, 28.0, 33.0, 42.0, 35.0, 45.0, 41.0, 39.0, 36.0, 44.0, 37.0, 35.0, 36.0, 36.0, 38.0, 33.0, 32.0, 32.0, 30.0, 23.0, 14.0, 13.0, 14.0, 19.0, 20.0, 14.0, 8.0, 6.0, 5.0, 6.0, 3.0, 7.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.8793981075286865, -0.8544269800186157, -0.8294557929039001, -0.8044846057891846, -0.7795134782791138, -0.754542350769043, -0.7295711636543274, -0.7045999765396118, -0.679628849029541, -0.6546577215194702, -0.6296865344047546, -0.6047153472900391, -0.5797442197799683, -0.5547730922698975, -0.5298019051551819, -0.5048307180404663, -0.4798595905303955, -0.4548884332180023, -0.42991727590560913, -0.40494611859321594, -0.37997496128082275, -0.35500380396842957, -0.3300326466560364, -0.3050614893436432, -0.28009033203125, -0.2551191747188568, -0.23014801740646362, -0.20517686009407043, -0.18020570278167725, -0.15523454546928406, -0.13026338815689087, -0.10529223084449768, -0.08032107353210449, -0.055349916219711304, -0.030378758907318115, -0.005407601594924927, 0.01956355571746826, 0.04453471302986145, 0.06950587034225464, 0.09447702765464783, 0.11944818496704102, 0.1444193422794342, 0.1693904995918274, 0.19436165690422058, 0.21933281421661377, 0.24430397152900696, 0.26927512884140015, 0.29424628615379333, 0.3192174434661865, 0.3441886007785797, 0.3691597580909729, 0.3941309154033661, 0.4191020727157593, 0.44407323002815247, 0.46904438734054565, 0.49401554465293884, 0.518986701965332, 0.5439578294754028, 0.5689290165901184, 0.593900203704834, 0.6188713312149048, 0.6438424587249756, 0.6688136458396912, 0.6937848329544067, 0.7187559604644775]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 7.0, 16.0, 13.0, 19.0, 38.0, 42.0, 58.0, 79.0, 130.0, 194.0, 306.0, 602.0, 1059.0, 2133.0, 4969.0, 12742.0, 36442.0, 114086.0, 321948.0, 353987.0, 132784.0, 41793.0, 14403.0, 5472.0, 2383.0, 1193.0, 621.0, 321.0, 232.0, 142.0, 111.0, 74.0, 50.0, 24.0, 16.0, 11.0, 15.0, 9.0, 9.0, 8.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84765625, -0.8212203979492188, -0.7947845458984375, -0.7683486938476562, -0.741912841796875, -0.7154769897460938, -0.6890411376953125, -0.6626052856445312, -0.63616943359375, -0.6097335815429688, -0.5832977294921875, -0.5568618774414062, -0.530426025390625, -0.5039901733398438, -0.4775543212890625, -0.45111846923828125, -0.4246826171875, -0.39824676513671875, -0.3718109130859375, -0.34537506103515625, -0.318939208984375, -0.29250335693359375, -0.2660675048828125, -0.23963165283203125, -0.21319580078125, -0.18675994873046875, -0.1603240966796875, -0.13388824462890625, -0.107452392578125, -0.08101654052734375, -0.0545806884765625, -0.02814483642578125, -0.001708984375, 0.02472686767578125, 0.0511627197265625, 0.07759857177734375, 0.104034423828125, 0.13047027587890625, 0.1569061279296875, 0.18334197998046875, 0.20977783203125, 0.23621368408203125, 0.2626495361328125, 0.28908538818359375, 0.315521240234375, 0.34195709228515625, 0.3683929443359375, 0.39482879638671875, 0.4212646484375, 0.44770050048828125, 0.4741363525390625, 0.5005722045898438, 0.527008056640625, 0.5534439086914062, 0.5798797607421875, 0.6063156127929688, 0.63275146484375, 0.6591873168945312, 0.6856231689453125, 0.7120590209960938, 0.738494873046875, 0.7649307250976562, 0.7913665771484375, 0.8178024291992188, 0.84423828125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 3.0, 6.0, 7.0, 11.0, 20.0, 22.0, 31.0, 41.0, 40.0, 64.0, 68.0, 57.0, 91.0, 84.0, 85.0, 73.0, 56.0, 50.0, 44.0, 35.0, 31.0, 13.0, 15.0, 16.0, 8.0, 9.0, 7.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1949462890625, -0.18909072875976562, -0.18323516845703125, -0.17737960815429688, -0.1715240478515625, -0.16566848754882812, -0.15981292724609375, -0.15395736694335938, -0.148101806640625, -0.14224624633789062, -0.13639068603515625, -0.13053512573242188, -0.1246795654296875, -0.11882400512695312, -0.11296844482421875, -0.10711288452148438, -0.10125732421875, -0.09540176391601562, -0.08954620361328125, -0.08369064331054688, -0.0778350830078125, -0.07197952270507812, -0.06612396240234375, -0.060268402099609375, -0.054412841796875, -0.048557281494140625, -0.04270172119140625, -0.036846160888671875, -0.0309906005859375, -0.025135040283203125, -0.01927947998046875, -0.013423919677734375, -0.007568359375, -0.001712799072265625, 0.00414276123046875, 0.009998321533203125, 0.0158538818359375, 0.021709442138671875, 0.02756500244140625, 0.033420562744140625, 0.039276123046875, 0.045131683349609375, 0.05098724365234375, 0.056842803955078125, 0.0626983642578125, 0.06855392456054688, 0.07440948486328125, 0.08026504516601562, 0.08612060546875, 0.09197616577148438, 0.09783172607421875, 0.10368728637695312, 0.1095428466796875, 0.11539840698242188, 0.12125396728515625, 0.12710952758789062, 0.132965087890625, 0.13882064819335938, 0.14467620849609375, 0.15053176879882812, 0.1563873291015625, 0.16224288940429688, 0.16809844970703125, 0.17395401000976562, 0.1798095703125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 8.0, 7.0, 4.0, 10.0, 20.0, 15.0, 32.0, 32.0, 41.0, 73.0, 95.0, 159.0, 209.0, 317.0, 475.0, 695.0, 1152.0, 2050.0, 4570.0, 12365.0, 41545.0, 151430.0, 409794.0, 295598.0, 87980.0, 24392.0, 7855.0, 3291.0, 1583.0, 944.0, 558.0, 387.0, 277.0, 169.0, 128.0, 75.0, 73.0, 50.0, 39.0, 18.0, 14.0, 12.0, 8.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93212890625, -0.90533447265625, -0.8785400390625, -0.85174560546875, -0.824951171875, -0.79815673828125, -0.7713623046875, -0.74456787109375, -0.7177734375, -0.69097900390625, -0.6641845703125, -0.63739013671875, -0.610595703125, -0.58380126953125, -0.5570068359375, -0.53021240234375, -0.50341796875, -0.47662353515625, -0.4498291015625, -0.42303466796875, -0.396240234375, -0.36944580078125, -0.3426513671875, -0.31585693359375, -0.2890625, -0.26226806640625, -0.2354736328125, -0.20867919921875, -0.181884765625, -0.15509033203125, -0.1282958984375, -0.10150146484375, -0.07470703125, -0.04791259765625, -0.0211181640625, 0.00567626953125, 0.032470703125, 0.05926513671875, 0.0860595703125, 0.11285400390625, 0.1396484375, 0.16644287109375, 0.1932373046875, 0.22003173828125, 0.246826171875, 0.27362060546875, 0.3004150390625, 0.32720947265625, 0.35400390625, 0.38079833984375, 0.4075927734375, 0.43438720703125, 0.461181640625, 0.48797607421875, 0.5147705078125, 0.54156494140625, 0.568359375, 0.59515380859375, 0.6219482421875, 0.64874267578125, 0.675537109375, 0.70233154296875, 0.7291259765625, 0.75592041015625, 0.78271484375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 7.0, 8.0, 11.0, 12.0, 11.0, 16.0, 20.0, 24.0, 38.0, 15.0, 39.0, 29.0, 35.0, 34.0, 35.0, 47.0, 47.0, 39.0, 56.0, 45.0, 32.0, 44.0, 41.0, 40.0, 47.0, 34.0, 24.0, 24.0, 26.0, 20.0, 17.0, 17.0, 8.0, 12.0, 8.0, 8.0, 9.0, 5.0, 7.0, 3.0, 3.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5322265625, -0.5132522583007812, -0.4942779541015625, -0.47530364990234375, -0.456329345703125, -0.43735504150390625, -0.4183807373046875, -0.39940643310546875, -0.38043212890625, -0.36145782470703125, -0.3424835205078125, -0.32350921630859375, -0.304534912109375, -0.28556060791015625, -0.2665863037109375, -0.24761199951171875, -0.2286376953125, -0.20966339111328125, -0.1906890869140625, -0.17171478271484375, -0.152740478515625, -0.13376617431640625, -0.1147918701171875, -0.09581756591796875, -0.07684326171875, -0.05786895751953125, -0.0388946533203125, -0.01992034912109375, -0.000946044921875, 0.01802825927734375, 0.0370025634765625, 0.05597686767578125, 0.074951171875, 0.09392547607421875, 0.1128997802734375, 0.13187408447265625, 0.150848388671875, 0.16982269287109375, 0.1887969970703125, 0.20777130126953125, 0.22674560546875, 0.24571990966796875, 0.2646942138671875, 0.28366851806640625, 0.302642822265625, 0.32161712646484375, 0.3405914306640625, 0.35956573486328125, 0.3785400390625, 0.39751434326171875, 0.4164886474609375, 0.43546295166015625, 0.454437255859375, 0.47341156005859375, 0.4923858642578125, 0.5113601684570312, 0.53033447265625, 0.5493087768554688, 0.5682830810546875, 0.5872573852539062, 0.606231689453125, 0.6252059936523438, 0.6441802978515625, 0.6631546020507812, 0.68212890625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 6.0, 8.0, 11.0, 19.0, 32.0, 41.0, 80.0, 135.0, 275.0, 667.0, 1944.0, 7318.0, 45524.0, 484583.0, 455528.0, 42315.0, 6874.0, 1872.0, 679.0, 299.0, 150.0, 77.0, 42.0, 27.0, 12.0, 15.0, 10.0, 6.0, 8.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.537109375, -0.5172042846679688, -0.4972991943359375, -0.47739410400390625, -0.457489013671875, -0.43758392333984375, -0.4176788330078125, -0.39777374267578125, -0.37786865234375, -0.35796356201171875, -0.3380584716796875, -0.31815338134765625, -0.298248291015625, -0.27834320068359375, -0.2584381103515625, -0.23853302001953125, -0.2186279296875, -0.19872283935546875, -0.1788177490234375, -0.15891265869140625, -0.139007568359375, -0.11910247802734375, -0.0991973876953125, -0.07929229736328125, -0.05938720703125, -0.03948211669921875, -0.0195770263671875, 0.00032806396484375, 0.020233154296875, 0.04013824462890625, 0.0600433349609375, 0.07994842529296875, 0.099853515625, 0.11975860595703125, 0.1396636962890625, 0.15956878662109375, 0.179473876953125, 0.19937896728515625, 0.2192840576171875, 0.23918914794921875, 0.25909423828125, 0.27899932861328125, 0.2989044189453125, 0.31880950927734375, 0.338714599609375, 0.35861968994140625, 0.3785247802734375, 0.39842987060546875, 0.4183349609375, 0.43824005126953125, 0.4581451416015625, 0.47805023193359375, 0.497955322265625, 0.5178604125976562, 0.5377655029296875, 0.5576705932617188, 0.57757568359375, 0.5974807739257812, 0.6173858642578125, 0.6372909545898438, 0.657196044921875, 0.6771011352539062, 0.6970062255859375, 0.7169113159179688, 0.73681640625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 4.0, 8.0, 16.0, 19.0, 20.0, 39.0, 53.0, 41.0, 45.0, 55.0, 80.0, 85.0, 77.0, 73.0, 70.0, 69.0, 58.0, 42.0, 27.0, 20.0, 25.0, 23.0, 12.0, 11.0, 13.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00011855363845825195, -0.00011562090367078781, -0.00011268816888332367, -0.00010975543409585953, -0.00010682269930839539, -0.00010388996452093124, -0.0001009572297334671, -9.802449494600296e-05, -9.509176015853882e-05, -9.215902537107468e-05, -8.922629058361053e-05, -8.629355579614639e-05, -8.336082100868225e-05, -8.042808622121811e-05, -7.749535143375397e-05, -7.456261664628983e-05, -7.162988185882568e-05, -6.869714707136154e-05, -6.57644122838974e-05, -6.283167749643326e-05, -5.9898942708969116e-05, -5.6966207921504974e-05, -5.403347313404083e-05, -5.110073834657669e-05, -4.816800355911255e-05, -4.523526877164841e-05, -4.2302533984184265e-05, -3.936979919672012e-05, -3.643706440925598e-05, -3.350432962179184e-05, -3.05715948343277e-05, -2.7638860046863556e-05, -2.4706125259399414e-05, -2.1773390471935272e-05, -1.884065568447113e-05, -1.590792089700699e-05, -1.2975186109542847e-05, -1.0042451322078705e-05, -7.109716534614563e-06, -4.176981747150421e-06, -1.2442469596862793e-06, 1.6884878277778625e-06, 4.621222615242004e-06, 7.553957402706146e-06, 1.0486692190170288e-05, 1.341942697763443e-05, 1.6352161765098572e-05, 1.9284896552562714e-05, 2.2217631340026855e-05, 2.5150366127490997e-05, 2.808310091495514e-05, 3.101583570241928e-05, 3.394857048988342e-05, 3.6881305277347565e-05, 3.9814040064811707e-05, 4.274677485227585e-05, 4.567950963973999e-05, 4.861224442720413e-05, 5.1544979214668274e-05, 5.4477714002132416e-05, 5.741044878959656e-05, 6.03431835770607e-05, 6.327591836452484e-05, 6.620865315198898e-05, 6.914138793945312e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 4.0, 7.0, 10.0, 7.0, 13.0, 14.0, 36.0, 44.0, 48.0, 73.0, 103.0, 188.0, 295.0, 472.0, 1101.0, 2639.0, 8098.0, 35137.0, 300441.0, 598606.0, 79776.0, 13958.0, 4132.0, 1611.0, 712.0, 408.0, 202.0, 117.0, 76.0, 68.0, 42.0, 27.0, 21.0, 10.0, 15.0, 9.0, 7.0, 4.0, 5.0, 3.0, 6.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.51611328125, -0.498443603515625, -0.48077392578125, -0.463104248046875, -0.4454345703125, -0.427764892578125, -0.41009521484375, -0.392425537109375, -0.374755859375, -0.357086181640625, -0.33941650390625, -0.321746826171875, -0.3040771484375, -0.286407470703125, -0.26873779296875, -0.251068115234375, -0.2333984375, -0.215728759765625, -0.19805908203125, -0.180389404296875, -0.1627197265625, -0.145050048828125, -0.12738037109375, -0.109710693359375, -0.092041015625, -0.074371337890625, -0.05670166015625, -0.039031982421875, -0.0213623046875, -0.003692626953125, 0.01397705078125, 0.031646728515625, 0.04931640625, 0.066986083984375, 0.08465576171875, 0.102325439453125, 0.1199951171875, 0.137664794921875, 0.15533447265625, 0.173004150390625, 0.190673828125, 0.208343505859375, 0.22601318359375, 0.243682861328125, 0.2613525390625, 0.279022216796875, 0.29669189453125, 0.314361572265625, 0.33203125, 0.349700927734375, 0.36737060546875, 0.385040283203125, 0.4027099609375, 0.420379638671875, 0.43804931640625, 0.455718994140625, 0.473388671875, 0.491058349609375, 0.50872802734375, 0.526397705078125, 0.5440673828125, 0.561737060546875, 0.57940673828125, 0.597076416015625, 0.61474609375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 6.0, 7.0, 4.0, 13.0, 21.0, 22.0, 36.0, 39.0, 57.0, 60.0, 60.0, 63.0, 89.0, 88.0, 70.0, 79.0, 61.0, 40.0, 38.0, 18.0, 22.0, 18.0, 21.0, 9.0, 8.0, 5.0, 5.0, 4.0, 3.0, 5.0, 4.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.275146484375, -0.2665748596191406, -0.25800323486328125, -0.24943161010742188, -0.2408599853515625, -0.23228836059570312, -0.22371673583984375, -0.21514511108398438, -0.206573486328125, -0.19800186157226562, -0.18943023681640625, -0.18085861206054688, -0.1722869873046875, -0.16371536254882812, -0.15514373779296875, -0.14657211303710938, -0.13800048828125, -0.12942886352539062, -0.12085723876953125, -0.11228561401367188, -0.1037139892578125, -0.09514236450195312, -0.08657073974609375, -0.07799911499023438, -0.069427490234375, -0.060855865478515625, -0.05228424072265625, -0.043712615966796875, -0.0351409912109375, -0.026569366455078125, -0.01799774169921875, -0.009426116943359375, -0.0008544921875, 0.007717132568359375, 0.01628875732421875, 0.024860382080078125, 0.0334320068359375, 0.042003631591796875, 0.05057525634765625, 0.059146881103515625, 0.067718505859375, 0.07629013061523438, 0.08486175537109375, 0.09343338012695312, 0.1020050048828125, 0.11057662963867188, 0.11914825439453125, 0.12771987915039062, 0.13629150390625, 0.14486312866210938, 0.15343475341796875, 0.16200637817382812, 0.1705780029296875, 0.17914962768554688, 0.18772125244140625, 0.19629287719726562, 0.204864501953125, 0.21343612670898438, 0.22200775146484375, 0.23057937622070312, 0.2391510009765625, 0.24772262573242188, 0.25629425048828125, 0.2648658752441406, 0.2734375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 7.0, 10.0, 19.0, 32.0, 46.0, 59.0, 106.0, 100.0, 111.0, 115.0, 95.0, 93.0, 72.0, 51.0, 31.0, 16.0, 13.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.26450252532959, -5.103144645690918, -4.941786766052246, -4.780428409576416, -4.619070529937744, -4.457712650299072, -4.296354293823242, -4.13499641418457, -3.9736385345458984, -3.8122806549072266, -3.6509225368499756, -3.4895644187927246, -3.3282065391540527, -3.166848659515381, -3.00549054145813, -2.844132423400879, -2.682774543762207, -2.521416664123535, -2.360058546066284, -2.198700428009033, -2.0373425483703613, -1.8759845495224, -1.7146265506744385, -1.553268551826477, -1.3919105529785156, -1.2305525541305542, -1.0691945552825928, -0.9078365564346313, -0.7464785575866699, -0.5851205587387085, -0.42376255989074707, -0.26240456104278564, -0.10104656219482422, 0.06031143665313721, 0.22166943550109863, 0.38302743434906006, 0.5443854331970215, 0.7057434320449829, 0.8671014308929443, 1.0284594297409058, 1.1898174285888672, 1.3511754274368286, 1.51253342628479, 1.6738914251327515, 1.835249423980713, 1.9966074228286743, 2.1579654216766357, 2.3193235397338867, 2.4806814193725586, 2.6420392990112305, 2.8033974170684814, 2.9647555351257324, 3.1261134147644043, 3.287471294403076, 3.448829412460327, 3.610187530517578, 3.77154541015625, 3.932903289794922, 4.094261169433594, 4.255619525909424, 4.416977405548096, 4.578335285186768, 4.739693641662598, 4.9010515213012695, 5.062409400939941]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 5.0, 11.0, 15.0, 16.0, 12.0, 23.0, 26.0, 38.0, 37.0, 39.0, 45.0, 54.0, 46.0, 58.0, 68.0, 72.0, 63.0, 55.0, 59.0, 49.0, 44.0, 35.0, 22.0, 26.0, 24.0, 16.0, 10.0, 4.0, 8.0, 6.0, 5.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.008084297180176, -4.8652167320251465, -4.722349166870117, -4.579482078552246, -4.436614513397217, -4.2937469482421875, -4.150879383087158, -4.008011817932129, -3.8651442527770996, -3.7222766876220703, -3.57940936088562, -3.436541795730591, -3.2936742305755615, -3.1508069038391113, -3.007939338684082, -2.8650717735290527, -2.7222044467926025, -2.5793368816375732, -2.436469554901123, -2.2936019897460938, -2.1507344245910645, -2.007866859436035, -1.864999532699585, -1.7221319675445557, -1.579264521598816, -1.4363970756530762, -1.2935295104980469, -1.1506620645523071, -1.0077946186065674, -0.8649270534515381, -0.7220596075057983, -0.579192042350769, -0.4363245964050293, -0.2934570908546448, -0.15058961510658264, -0.007722139358520508, 0.135145366191864, 0.27801287174224854, 0.4208803176879883, 0.5637478828430176, 0.7066153287887573, 0.8494828343391418, 0.9923503398895264, 1.1352177858352661, 1.2780852317810059, 1.4209527969360352, 1.563820242881775, 1.7066878080368042, 1.849555253982544, 1.9924226999282837, 2.1352901458740234, 2.2781577110290527, 2.421025276184082, 2.5638928413391113, 2.7067601680755615, 2.849627733230591, 2.992495059967041, 3.1353626251220703, 3.2782299518585205, 3.42109751701355, 3.563965082168579, 3.7068324089050293, 3.8496999740600586, 3.992567539215088, 4.135435104370117]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 6.0, 2.0, 4.0, 5.0, 7.0, 4.0, 14.0, 11.0, 12.0, 29.0, 38.0, 72.0, 96.0, 147.0, 222.0, 342.0, 634.0, 1153.0, 2399.0, 5446.0, 13825.0, 42262.0, 203903.0, 3436573.0, 392959.0, 61961.0, 18653.0, 7065.0, 3027.0, 1455.0, 775.0, 458.0, 256.0, 165.0, 104.0, 56.0, 47.0, 35.0, 21.0, 12.0, 14.0, 11.0, 6.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.89892578125, -0.8729782104492188, -0.8470306396484375, -0.8210830688476562, -0.795135498046875, -0.7691879272460938, -0.7432403564453125, -0.7172927856445312, -0.69134521484375, -0.6653976440429688, -0.6394500732421875, -0.6135025024414062, -0.587554931640625, -0.5616073608398438, -0.5356597900390625, -0.5097122192382812, -0.4837646484375, -0.45781707763671875, -0.4318695068359375, -0.40592193603515625, -0.379974365234375, -0.35402679443359375, -0.3280792236328125, -0.30213165283203125, -0.27618408203125, -0.25023651123046875, -0.2242889404296875, -0.19834136962890625, -0.172393798828125, -0.14644622802734375, -0.1204986572265625, -0.09455108642578125, -0.068603515625, -0.04265594482421875, -0.0167083740234375, 0.00923919677734375, 0.035186767578125, 0.06113433837890625, 0.0870819091796875, 0.11302947998046875, 0.13897705078125, 0.16492462158203125, 0.1908721923828125, 0.21681976318359375, 0.242767333984375, 0.26871490478515625, 0.2946624755859375, 0.32061004638671875, 0.3465576171875, 0.37250518798828125, 0.3984527587890625, 0.42440032958984375, 0.450347900390625, 0.47629547119140625, 0.5022430419921875, 0.5281906127929688, 0.55413818359375, 0.5800857543945312, 0.6060333251953125, 0.6319808959960938, 0.657928466796875, 0.6838760375976562, 0.7098236083984375, 0.7357711791992188, 0.76171875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 7.0, 8.0, 12.0, 15.0, 12.0, 24.0, 26.0, 35.0, 60.0, 60.0, 70.0, 78.0, 73.0, 91.0, 78.0, 67.0, 67.0, 51.0, 46.0, 29.0, 20.0, 21.0, 13.0, 8.0, 10.0, 3.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.19580078125, -0.18987274169921875, -0.1839447021484375, -0.17801666259765625, -0.172088623046875, -0.16616058349609375, -0.1602325439453125, -0.15430450439453125, -0.14837646484375, -0.14244842529296875, -0.1365203857421875, -0.13059234619140625, -0.124664306640625, -0.11873626708984375, -0.1128082275390625, -0.10688018798828125, -0.1009521484375, -0.09502410888671875, -0.0890960693359375, -0.08316802978515625, -0.077239990234375, -0.07131195068359375, -0.0653839111328125, -0.05945587158203125, -0.05352783203125, -0.04759979248046875, -0.0416717529296875, -0.03574371337890625, -0.029815673828125, -0.02388763427734375, -0.0179595947265625, -0.01203155517578125, -0.006103515625, -0.00017547607421875, 0.0057525634765625, 0.01168060302734375, 0.017608642578125, 0.02353668212890625, 0.0294647216796875, 0.03539276123046875, 0.04132080078125, 0.04724884033203125, 0.0531768798828125, 0.05910491943359375, 0.065032958984375, 0.07096099853515625, 0.0768890380859375, 0.08281707763671875, 0.0887451171875, 0.09467315673828125, 0.1006011962890625, 0.10652923583984375, 0.112457275390625, 0.11838531494140625, 0.1243133544921875, 0.13024139404296875, 0.13616943359375, 0.14209747314453125, 0.1480255126953125, 0.15395355224609375, 0.159881591796875, 0.16580963134765625, 0.1717376708984375, 0.17766571044921875, 0.18359375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 3.0, 4.0, 4.0, 6.0, 6.0, 10.0, 11.0, 28.0, 38.0, 63.0, 95.0, 148.0, 210.0, 327.0, 616.0, 1136.0, 2160.0, 4462.0, 10525.0, 30521.0, 115458.0, 951449.0, 2814893.0, 193184.0, 43704.0, 14079.0, 5661.0, 2559.0, 1215.0, 661.0, 381.0, 244.0, 124.0, 97.0, 62.0, 41.0, 22.0, 22.0, 12.0, 12.0, 6.0, 10.0, 2.0, 2.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72119140625, -0.6964569091796875, -0.671722412109375, -0.6469879150390625, -0.62225341796875, -0.5975189208984375, -0.572784423828125, -0.5480499267578125, -0.5233154296875, -0.4985809326171875, -0.473846435546875, -0.4491119384765625, -0.42437744140625, -0.3996429443359375, -0.374908447265625, -0.3501739501953125, -0.325439453125, -0.3007049560546875, -0.275970458984375, -0.2512359619140625, -0.22650146484375, -0.2017669677734375, -0.177032470703125, -0.1522979736328125, -0.1275634765625, -0.1028289794921875, -0.078094482421875, -0.0533599853515625, -0.02862548828125, -0.0038909912109375, 0.020843505859375, 0.0455780029296875, 0.0703125, 0.0950469970703125, 0.119781494140625, 0.1445159912109375, 0.16925048828125, 0.1939849853515625, 0.218719482421875, 0.2434539794921875, 0.2681884765625, 0.2929229736328125, 0.317657470703125, 0.3423919677734375, 0.36712646484375, 0.3918609619140625, 0.416595458984375, 0.4413299560546875, 0.466064453125, 0.4907989501953125, 0.515533447265625, 0.5402679443359375, 0.56500244140625, 0.5897369384765625, 0.614471435546875, 0.6392059326171875, 0.6639404296875, 0.6886749267578125, 0.713409423828125, 0.7381439208984375, 0.76287841796875, 0.7876129150390625, 0.812347412109375, 0.8370819091796875, 0.86181640625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 3.0, 9.0, 3.0, 16.0, 17.0, 20.0, 36.0, 46.0, 42.0, 71.0, 110.0, 184.0, 275.0, 568.0, 1201.0, 621.0, 298.0, 175.0, 109.0, 72.0, 63.0, 32.0, 33.0, 15.0, 13.0, 10.0, 9.0, 2.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33251953125, -0.3229026794433594, -0.31328582763671875, -0.3036689758300781, -0.2940521240234375, -0.2844352722167969, -0.27481842041015625, -0.2652015686035156, -0.255584716796875, -0.24596786499023438, -0.23635101318359375, -0.22673416137695312, -0.2171173095703125, -0.20750045776367188, -0.19788360595703125, -0.18826675415039062, -0.17864990234375, -0.16903305053710938, -0.15941619873046875, -0.14979934692382812, -0.1401824951171875, -0.13056564331054688, -0.12094879150390625, -0.11133193969726562, -0.101715087890625, -0.09209823608398438, -0.08248138427734375, -0.07286453247070312, -0.0632476806640625, -0.053630828857421875, -0.04401397705078125, -0.034397125244140625, -0.0247802734375, -0.015163421630859375, -0.00554656982421875, 0.004070281982421875, 0.0136871337890625, 0.023303985595703125, 0.03292083740234375, 0.042537689208984375, 0.052154541015625, 0.061771392822265625, 0.07138824462890625, 0.08100509643554688, 0.0906219482421875, 0.10023880004882812, 0.10985565185546875, 0.11947250366210938, 0.12908935546875, 0.13870620727539062, 0.14832305908203125, 0.15793991088867188, 0.1675567626953125, 0.17717361450195312, 0.18679046630859375, 0.19640731811523438, 0.206024169921875, 0.21564102172851562, 0.22525787353515625, 0.23487472534179688, 0.2444915771484375, 0.2541084289550781, 0.26372528076171875, 0.2733421325683594, 0.282958984375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 9.0, 8.0, 9.0, 24.0, 25.0, 42.0, 58.0, 73.0, 113.0, 113.0, 126.0, 107.0, 92.0, 65.0, 50.0, 20.0, 24.0, 16.0, 11.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.068491220474243, -2.997741222381592, -2.9269909858703613, -2.85624098777771, -2.7854909896850586, -2.714740753173828, -2.6439907550811768, -2.5732407569885254, -2.502490520477295, -2.4317405223846436, -2.360990285873413, -2.2902402877807617, -2.2194902896881104, -2.148740291595459, -2.0779900550842285, -2.007240056991577, -1.9364900588989258, -1.8657399415969849, -1.7949899435043335, -1.7242398262023926, -1.6534898281097412, -1.5827397108078003, -1.5119895935058594, -1.441239595413208, -1.370489478111267, -1.2997393608093262, -1.2289893627166748, -1.1582392454147339, -1.087489128112793, -1.0167391300201416, -0.9459890127182007, -0.8752389550209045, -0.8044886589050293, -0.7337386012077332, -0.662988543510437, -0.5922384262084961, -0.5214883685112, -0.4507383108139038, -0.3799882233142853, -0.30923813581466675, -0.2384880781173706, -0.16773800551891327, -0.09698793292045593, -0.026237860321998596, 0.04451221227645874, 0.11526226997375488, 0.1860123574733734, 0.25676244497299194, 0.3275125026702881, 0.39826256036758423, 0.46901264786720276, 0.5397627353668213, 0.6105127930641174, 0.6812628507614136, 0.7520129680633545, 0.8227630257606506, 0.8935130834579468, 0.9642631411552429, 1.035013198852539, 1.10576331615448, 1.176513433456421, 1.2472634315490723, 1.3180135488510132, 1.388763666152954, 1.4595136642456055]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 7.0, 5.0, 7.0, 9.0, 14.0, 13.0, 19.0, 18.0, 10.0, 25.0, 27.0, 33.0, 24.0, 22.0, 35.0, 28.0, 41.0, 37.0, 42.0, 44.0, 41.0, 41.0, 31.0, 45.0, 39.0, 37.0, 41.0, 24.0, 26.0, 26.0, 26.0, 24.0, 13.0, 23.0, 22.0, 11.0, 13.0, 9.0, 9.0, 8.0, 10.0, 9.0, 3.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.9749810695648193, -0.9420328140258789, -0.9090846180915833, -0.8761363625526428, -0.8431881666183472, -0.8102399110794067, -0.7772916555404663, -0.7443434596061707, -0.711395263671875, -0.6784470081329346, -0.6454988121986389, -0.6125505566596985, -0.5796023607254028, -0.5466541051864624, -0.513705849647522, -0.4807576537132263, -0.4478093981742859, -0.41486117243766785, -0.3819129467010498, -0.3489646911621094, -0.3160164952278137, -0.2830682396888733, -0.25012001395225525, -0.2171717882156372, -0.18422356247901917, -0.15127533674240112, -0.11832710355520248, -0.08537887036800385, -0.0524306446313858, -0.01948241889476776, 0.013465821743011475, 0.04641404747962952, 0.07936227321624756, 0.1123104989528656, 0.14525872468948364, 0.17820696532726288, 0.21115519106388092, 0.24410341680049896, 0.2770516574382782, 0.30999988317489624, 0.3429481089115143, 0.3758963346481323, 0.40884456038475037, 0.4417927861213684, 0.47474104166030884, 0.5076892375946045, 0.5406374931335449, 0.5735857486724854, 0.606533944606781, 0.6394822001457214, 0.6724303960800171, 0.7053786516189575, 0.7383268475532532, 0.7712751030921936, 0.8042232990264893, 0.8371715545654297, 0.8701198101043701, 0.9030680656433105, 0.9360162615776062, 0.9689645171165466, 1.0019127130508423, 1.0348609685897827, 1.0678092241287231, 1.100757360458374, 1.1337056159973145]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 2.0, 7.0, 3.0, 3.0, 8.0, 10.0, 13.0, 27.0, 32.0, 40.0, 50.0, 73.0, 111.0, 155.0, 225.0, 293.0, 527.0, 835.0, 1452.0, 2647.0, 5364.0, 11409.0, 27072.0, 66924.0, 175904.0, 431007.0, 196619.0, 73062.0, 29643.0, 12584.0, 5683.0, 2780.0, 1473.0, 881.0, 560.0, 334.0, 206.0, 151.0, 114.0, 74.0, 52.0, 40.0, 22.0, 19.0, 19.0, 13.0, 8.0, 10.0, 6.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 1.0, 3.0], "bins": [-0.79638671875, -0.7719192504882812, -0.7474517822265625, -0.7229843139648438, -0.698516845703125, -0.6740493774414062, -0.6495819091796875, -0.6251144409179688, -0.60064697265625, -0.5761795043945312, -0.5517120361328125, -0.5272445678710938, -0.502777099609375, -0.47830963134765625, -0.4538421630859375, -0.42937469482421875, -0.4049072265625, -0.38043975830078125, -0.3559722900390625, -0.33150482177734375, -0.307037353515625, -0.28256988525390625, -0.2581024169921875, -0.23363494873046875, -0.20916748046875, -0.18470001220703125, -0.1602325439453125, -0.13576507568359375, -0.111297607421875, -0.08683013916015625, -0.0623626708984375, -0.03789520263671875, -0.013427734375, 0.01103973388671875, 0.0355072021484375, 0.05997467041015625, 0.084442138671875, 0.10890960693359375, 0.1333770751953125, 0.15784454345703125, 0.18231201171875, 0.20677947998046875, 0.2312469482421875, 0.25571441650390625, 0.280181884765625, 0.30464935302734375, 0.3291168212890625, 0.35358428955078125, 0.3780517578125, 0.40251922607421875, 0.4269866943359375, 0.45145416259765625, 0.475921630859375, 0.5003890991210938, 0.5248565673828125, 0.5493240356445312, 0.57379150390625, 0.5982589721679688, 0.6227264404296875, 0.6471939086914062, 0.671661376953125, 0.6961288452148438, 0.7205963134765625, 0.7450637817382812, 0.76953125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 3.0, 4.0, 4.0, 6.0, 11.0, 11.0, 14.0, 23.0, 33.0, 34.0, 55.0, 56.0, 55.0, 67.0, 75.0, 74.0, 77.0, 80.0, 69.0, 44.0, 51.0, 38.0, 31.0, 27.0, 12.0, 9.0, 10.0, 9.0, 5.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1920166015625, -0.18627166748046875, -0.1805267333984375, -0.17478179931640625, -0.169036865234375, -0.16329193115234375, -0.1575469970703125, -0.15180206298828125, -0.14605712890625, -0.14031219482421875, -0.1345672607421875, -0.12882232666015625, -0.123077392578125, -0.11733245849609375, -0.1115875244140625, -0.10584259033203125, -0.10009765625, -0.09435272216796875, -0.0886077880859375, -0.08286285400390625, -0.077117919921875, -0.07137298583984375, -0.0656280517578125, -0.05988311767578125, -0.05413818359375, -0.04839324951171875, -0.0426483154296875, -0.03690338134765625, -0.031158447265625, -0.02541351318359375, -0.0196685791015625, -0.01392364501953125, -0.0081787109375, -0.00243377685546875, 0.0033111572265625, 0.00905609130859375, 0.014801025390625, 0.02054595947265625, 0.0262908935546875, 0.03203582763671875, 0.03778076171875, 0.04352569580078125, 0.0492706298828125, 0.05501556396484375, 0.060760498046875, 0.06650543212890625, 0.0722503662109375, 0.07799530029296875, 0.083740234375, 0.08948516845703125, 0.0952301025390625, 0.10097503662109375, 0.106719970703125, 0.11246490478515625, 0.1182098388671875, 0.12395477294921875, 0.12969970703125, 0.13544464111328125, 0.1411895751953125, 0.14693450927734375, 0.152679443359375, 0.15842437744140625, 0.1641693115234375, 0.16991424560546875, 0.1756591796875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 11.0, 11.0, 6.0, 17.0, 23.0, 17.0, 28.0, 39.0, 48.0, 95.0, 111.0, 140.0, 229.0, 293.0, 508.0, 775.0, 1196.0, 2036.0, 3967.0, 8265.0, 19235.0, 48061.0, 121813.0, 338271.0, 311350.0, 112626.0, 44427.0, 18208.0, 7665.0, 3746.0, 1925.0, 1149.0, 706.0, 446.0, 316.0, 220.0, 158.0, 116.0, 81.0, 58.0, 38.0, 35.0, 24.0, 20.0, 9.0, 8.0, 9.0, 2.0, 6.0, 3.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.630859375, -0.6104812622070312, -0.5901031494140625, -0.5697250366210938, -0.549346923828125, -0.5289688110351562, -0.5085906982421875, -0.48821258544921875, -0.46783447265625, -0.44745635986328125, -0.4270782470703125, -0.40670013427734375, -0.386322021484375, -0.36594390869140625, -0.3455657958984375, -0.32518768310546875, -0.3048095703125, -0.28443145751953125, -0.2640533447265625, -0.24367523193359375, -0.223297119140625, -0.20291900634765625, -0.1825408935546875, -0.16216278076171875, -0.14178466796875, -0.12140655517578125, -0.1010284423828125, -0.08065032958984375, -0.060272216796875, -0.03989410400390625, -0.0195159912109375, 0.00086212158203125, 0.021240234375, 0.04161834716796875, 0.0619964599609375, 0.08237457275390625, 0.102752685546875, 0.12313079833984375, 0.1435089111328125, 0.16388702392578125, 0.18426513671875, 0.20464324951171875, 0.2250213623046875, 0.24539947509765625, 0.265777587890625, 0.28615570068359375, 0.3065338134765625, 0.32691192626953125, 0.3472900390625, 0.36766815185546875, 0.3880462646484375, 0.40842437744140625, 0.428802490234375, 0.44918060302734375, 0.4695587158203125, 0.48993682861328125, 0.51031494140625, 0.5306930541992188, 0.5510711669921875, 0.5714492797851562, 0.591827392578125, 0.6122055053710938, 0.6325836181640625, 0.6529617309570312, 0.67333984375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 8.0, 11.0, 5.0, 10.0, 10.0, 16.0, 14.0, 21.0, 19.0, 30.0, 23.0, 40.0, 42.0, 26.0, 45.0, 54.0, 55.0, 62.0, 52.0, 44.0, 47.0, 52.0, 38.0, 33.0, 45.0, 36.0, 32.0, 34.0, 24.0, 19.0, 17.0, 8.0, 7.0, 7.0, 6.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.8193359375, -0.7959213256835938, -0.7725067138671875, -0.7490921020507812, -0.725677490234375, -0.7022628784179688, -0.6788482666015625, -0.6554336547851562, -0.63201904296875, -0.6086044311523438, -0.5851898193359375, -0.5617752075195312, -0.538360595703125, -0.5149459838867188, -0.4915313720703125, -0.46811676025390625, -0.4447021484375, -0.42128753662109375, -0.3978729248046875, -0.37445831298828125, -0.351043701171875, -0.32762908935546875, -0.3042144775390625, -0.28079986572265625, -0.25738525390625, -0.23397064208984375, -0.2105560302734375, -0.18714141845703125, -0.163726806640625, -0.14031219482421875, -0.1168975830078125, -0.09348297119140625, -0.070068359375, -0.04665374755859375, -0.0232391357421875, 0.00017547607421875, 0.023590087890625, 0.04700469970703125, 0.0704193115234375, 0.09383392333984375, 0.11724853515625, 0.14066314697265625, 0.1640777587890625, 0.18749237060546875, 0.210906982421875, 0.23432159423828125, 0.2577362060546875, 0.28115081787109375, 0.3045654296875, 0.32798004150390625, 0.3513946533203125, 0.37480926513671875, 0.398223876953125, 0.42163848876953125, 0.4450531005859375, 0.46846771240234375, 0.49188232421875, 0.5152969360351562, 0.5387115478515625, 0.5621261596679688, 0.585540771484375, 0.6089553833007812, 0.6323699951171875, 0.6557846069335938, 0.67919921875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 4.0, 10.0, 19.0, 27.0, 26.0, 50.0, 65.0, 108.0, 182.0, 344.0, 650.0, 1458.0, 3671.0, 10588.0, 45830.0, 390195.0, 512499.0, 62505.0, 12825.0, 4215.0, 1638.0, 750.0, 363.0, 177.0, 134.0, 65.0, 41.0, 34.0, 24.0, 13.0, 9.0, 10.0, 8.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5185546875, -0.4994049072265625, -0.480255126953125, -0.4611053466796875, -0.44195556640625, -0.4228057861328125, -0.403656005859375, -0.3845062255859375, -0.3653564453125, -0.3462066650390625, -0.327056884765625, -0.3079071044921875, -0.28875732421875, -0.2696075439453125, -0.250457763671875, -0.2313079833984375, -0.212158203125, -0.1930084228515625, -0.173858642578125, -0.1547088623046875, -0.13555908203125, -0.1164093017578125, -0.097259521484375, -0.0781097412109375, -0.0589599609375, -0.0398101806640625, -0.020660400390625, -0.0015106201171875, 0.01763916015625, 0.0367889404296875, 0.055938720703125, 0.0750885009765625, 0.09423828125, 0.1133880615234375, 0.132537841796875, 0.1516876220703125, 0.17083740234375, 0.1899871826171875, 0.209136962890625, 0.2282867431640625, 0.2474365234375, 0.2665863037109375, 0.285736083984375, 0.3048858642578125, 0.32403564453125, 0.3431854248046875, 0.362335205078125, 0.3814849853515625, 0.400634765625, 0.4197845458984375, 0.438934326171875, 0.4580841064453125, 0.47723388671875, 0.4963836669921875, 0.515533447265625, 0.5346832275390625, 0.5538330078125, 0.5729827880859375, 0.592132568359375, 0.6112823486328125, 0.63043212890625, 0.6495819091796875, 0.668731689453125, 0.6878814697265625, 0.70703125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 3.0, 7.0, 11.0, 8.0, 8.0, 9.0, 20.0, 19.0, 26.0, 27.0, 24.0, 52.0, 45.0, 42.0, 68.0, 53.0, 65.0, 64.0, 57.0, 51.0, 44.0, 46.0, 38.0, 33.0, 25.0, 29.0, 29.0, 20.0, 16.0, 13.0, 7.0, 6.0, 6.0, 4.0, 7.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.507469177246094e-05, -5.302857607603073e-05, -5.0982460379600525e-05, -4.893634468317032e-05, -4.689022898674011e-05, -4.4844113290309906e-05, -4.27979975938797e-05, -4.0751881897449493e-05, -3.870576620101929e-05, -3.665965050458908e-05, -3.4613534808158875e-05, -3.256741911172867e-05, -3.052130341529846e-05, -2.8475187718868256e-05, -2.642907202243805e-05, -2.4382956326007843e-05, -2.2336840629577637e-05, -2.029072493314743e-05, -1.8244609236717224e-05, -1.6198493540287018e-05, -1.4152377843856812e-05, -1.2106262147426605e-05, -1.0060146450996399e-05, -8.014030754566193e-06, -5.967915058135986e-06, -3.92179936170578e-06, -1.8756836652755737e-06, 1.7043203115463257e-07, 2.216547727584839e-06, 4.262663424015045e-06, 6.3087791204452515e-06, 8.354894816875458e-06, 1.0401010513305664e-05, 1.244712620973587e-05, 1.4493241906166077e-05, 1.6539357602596283e-05, 1.858547329902649e-05, 2.0631588995456696e-05, 2.2677704691886902e-05, 2.4723820388317108e-05, 2.6769936084747314e-05, 2.881605178117752e-05, 3.086216747760773e-05, 3.290828317403793e-05, 3.495439887046814e-05, 3.7000514566898346e-05, 3.904663026332855e-05, 4.109274595975876e-05, 4.3138861656188965e-05, 4.518497735261917e-05, 4.723109304904938e-05, 4.9277208745479584e-05, 5.132332444190979e-05, 5.3369440138339996e-05, 5.54155558347702e-05, 5.746167153120041e-05, 5.9507787227630615e-05, 6.155390292406082e-05, 6.360001862049103e-05, 6.564613431692123e-05, 6.769225001335144e-05, 6.973836570978165e-05, 7.178448140621185e-05, 7.383059710264206e-05, 7.587671279907227e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 13.0, 8.0, 7.0, 12.0, 17.0, 37.0, 49.0, 64.0, 85.0, 139.0, 211.0, 377.0, 576.0, 1061.0, 2231.0, 4887.0, 11462.0, 36786.0, 191481.0, 571397.0, 173540.0, 33899.0, 11082.0, 4479.0, 2084.0, 1053.0, 572.0, 318.0, 214.0, 127.0, 87.0, 58.0, 44.0, 30.0, 26.0, 12.0, 11.0, 8.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.368408203125, -0.3539466857910156, -0.33948516845703125, -0.3250236511230469, -0.3105621337890625, -0.2961006164550781, -0.28163909912109375, -0.2671775817871094, -0.252716064453125, -0.23825454711914062, -0.22379302978515625, -0.20933151245117188, -0.1948699951171875, -0.18040847778320312, -0.16594696044921875, -0.15148544311523438, -0.13702392578125, -0.12256240844726562, -0.10810089111328125, -0.09363937377929688, -0.0791778564453125, -0.06471633911132812, -0.05025482177734375, -0.035793304443359375, -0.021331787109375, -0.006870269775390625, 0.00759124755859375, 0.022052764892578125, 0.0365142822265625, 0.050975799560546875, 0.06543731689453125, 0.07989883422851562, 0.0943603515625, 0.10882186889648438, 0.12328338623046875, 0.13774490356445312, 0.1522064208984375, 0.16666793823242188, 0.18112945556640625, 0.19559097290039062, 0.210052490234375, 0.22451400756835938, 0.23897552490234375, 0.2534370422363281, 0.2678985595703125, 0.2823600769042969, 0.29682159423828125, 0.3112831115722656, 0.32574462890625, 0.3402061462402344, 0.35466766357421875, 0.3691291809082031, 0.3835906982421875, 0.3980522155761719, 0.41251373291015625, 0.4269752502441406, 0.441436767578125, 0.4558982849121094, 0.47035980224609375, 0.4848213195800781, 0.4992828369140625, 0.5137443542480469, 0.5282058715820312, 0.5426673889160156, 0.55712890625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 2.0, 4.0, 5.0, 8.0, 8.0, 16.0, 18.0, 20.0, 25.0, 24.0, 53.0, 59.0, 69.0, 84.0, 117.0, 115.0, 72.0, 68.0, 52.0, 53.0, 31.0, 26.0, 13.0, 13.0, 7.0, 6.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.331787109375, -0.32123565673828125, -0.3106842041015625, -0.30013275146484375, -0.289581298828125, -0.27902984619140625, -0.2684783935546875, -0.25792694091796875, -0.24737548828125, -0.23682403564453125, -0.2262725830078125, -0.21572113037109375, -0.205169677734375, -0.19461822509765625, -0.1840667724609375, -0.17351531982421875, -0.1629638671875, -0.15241241455078125, -0.1418609619140625, -0.13130950927734375, -0.120758056640625, -0.11020660400390625, -0.0996551513671875, -0.08910369873046875, -0.07855224609375, -0.06800079345703125, -0.0574493408203125, -0.04689788818359375, -0.036346435546875, -0.02579498291015625, -0.0152435302734375, -0.00469207763671875, 0.005859375, 0.01641082763671875, 0.0269622802734375, 0.03751373291015625, 0.048065185546875, 0.05861663818359375, 0.0691680908203125, 0.07971954345703125, 0.09027099609375, 0.10082244873046875, 0.1113739013671875, 0.12192535400390625, 0.132476806640625, 0.14302825927734375, 0.1535797119140625, 0.16413116455078125, 0.1746826171875, 0.18523406982421875, 0.1957855224609375, 0.20633697509765625, 0.216888427734375, 0.22743988037109375, 0.2379913330078125, 0.24854278564453125, 0.25909423828125, 0.26964569091796875, 0.2801971435546875, 0.29074859619140625, 0.301300048828125, 0.31185150146484375, 0.3224029541015625, 0.33295440673828125, 0.343505859375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 5.0, 8.0, 21.0, 26.0, 39.0, 64.0, 83.0, 115.0, 133.0, 120.0, 101.0, 93.0, 64.0, 44.0, 30.0, 18.0, 7.0, 7.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.646726608276367, -4.46989631652832, -4.293066024780273, -4.116235733032227, -3.9394054412841797, -3.762575149536133, -3.585744619369507, -3.40891432762146, -3.232084035873413, -3.055253744125366, -2.8784234523773193, -2.7015929222106934, -2.5247626304626465, -2.3479323387145996, -2.1711020469665527, -1.9942717552185059, -1.817441463470459, -1.640611171722412, -1.4637808799743652, -1.2869504690170288, -1.110120177268982, -0.9332898855209351, -0.7564594745635986, -0.5796291828155518, -0.4027988910675049, -0.22596856951713562, -0.04913824796676636, 0.1276921033859253, 0.30452239513397217, 0.48135268688201904, 0.6581830978393555, 0.8350133895874023, 1.0118441581726074, 1.1886744499206543, 1.3655047416687012, 1.5423351526260376, 1.7191654443740845, 1.8959957361221313, 2.0728261470794678, 2.2496564388275146, 2.4264867305755615, 2.6033170223236084, 2.7801473140716553, 2.9569778442382812, 3.133808135986328, 3.310638427734375, 3.487468719482422, 3.6642990112304688, 3.8411293029785156, 4.0179595947265625, 4.194789886474609, 4.371620178222656, 4.548450469970703, 4.72528076171875, 4.902111053466797, 5.078941345214844, 5.255771636962891, 5.4326019287109375, 5.609432220458984, 5.786262512207031, 5.963092803955078, 6.139923095703125, 6.316753387451172, 6.493583679199219, 6.670414447784424]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 7.0, 9.0, 8.0, 8.0, 15.0, 13.0, 20.0, 17.0, 23.0, 21.0, 28.0, 34.0, 23.0, 38.0, 44.0, 53.0, 43.0, 48.0, 49.0, 43.0, 48.0, 57.0, 41.0, 39.0, 25.0, 33.0, 28.0, 27.0, 28.0, 21.0, 26.0, 11.0, 16.0, 10.0, 9.0, 8.0, 6.0, 8.0, 6.0, 4.0, 3.0, 2.0, 4.0, 4.0, 2.0], "bins": [-4.570374488830566, -4.450555801391602, -4.3307366371154785, -4.210917949676514, -4.091098785400391, -3.9712798595428467, -3.8514609336853027, -3.731642007827759, -3.611823081970215, -3.492004156112671, -3.372185230255127, -3.252366304397583, -3.132547378540039, -3.012728452682495, -2.892909526824951, -2.7730906009674072, -2.6532716751098633, -2.5334527492523193, -2.4136338233947754, -2.2938148975372314, -2.1739959716796875, -2.0541770458221436, -1.9343581199645996, -1.8145391941070557, -1.6947205066680908, -1.5749015808105469, -1.455082654953003, -1.335263729095459, -1.215444803237915, -1.095625877380371, -0.9758070111274719, -0.855988085269928, -0.7361690998077393, -0.6163501739501953, -0.49653124809265137, -0.3767123520374298, -0.25689342617988586, -0.1370745301246643, -0.01725560426712036, 0.10256332159042358, 0.22238224744796753, 0.3422011733055115, 0.4620200991630554, 0.5818389654159546, 0.7016578912734985, 0.8214768171310425, 0.9412957429885864, 1.0611146688461304, 1.1809335947036743, 1.3007525205612183, 1.4205714464187622, 1.5403903722763062, 1.66020929813385, 1.7800281047821045, 1.8998470306396484, 2.0196659564971924, 2.1394848823547363, 2.2593038082122803, 2.379122734069824, 2.498941659927368, 2.618760585784912, 2.738579511642456, 2.8583984375, 2.978217363357544, 3.098036289215088]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 8.0, 10.0, 13.0, 13.0, 18.0, 26.0, 28.0, 62.0, 101.0, 172.0, 331.0, 626.0, 1215.0, 2758.0, 6952.0, 19956.0, 77861.0, 1405480.0, 2562423.0, 82286.0, 20865.0, 7307.0, 2940.0, 1319.0, 627.0, 355.0, 193.0, 119.0, 75.0, 42.0, 45.0, 25.0, 10.0, 7.0, 7.0, 5.0, 2.0, 0.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91015625, -0.8798370361328125, -0.849517822265625, -0.8191986083984375, -0.78887939453125, -0.7585601806640625, -0.728240966796875, -0.6979217529296875, -0.6676025390625, -0.6372833251953125, -0.606964111328125, -0.5766448974609375, -0.54632568359375, -0.5160064697265625, -0.485687255859375, -0.4553680419921875, -0.425048828125, -0.3947296142578125, -0.364410400390625, -0.3340911865234375, -0.30377197265625, -0.2734527587890625, -0.243133544921875, -0.2128143310546875, -0.1824951171875, -0.1521759033203125, -0.121856689453125, -0.0915374755859375, -0.06121826171875, -0.0308990478515625, -0.000579833984375, 0.0297393798828125, 0.06005859375, 0.0903778076171875, 0.120697021484375, 0.1510162353515625, 0.18133544921875, 0.2116546630859375, 0.241973876953125, 0.2722930908203125, 0.3026123046875, 0.3329315185546875, 0.363250732421875, 0.3935699462890625, 0.42388916015625, 0.4542083740234375, 0.484527587890625, 0.5148468017578125, 0.545166015625, 0.5754852294921875, 0.605804443359375, 0.6361236572265625, 0.66644287109375, 0.6967620849609375, 0.727081298828125, 0.7574005126953125, 0.7877197265625, 0.8180389404296875, 0.848358154296875, 0.8786773681640625, 0.90899658203125, 0.9393157958984375, 0.969635009765625, 0.9999542236328125, 1.0302734375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 4.0, 3.0, 10.0, 9.0, 12.0, 14.0, 30.0, 24.0, 39.0, 51.0, 52.0, 74.0, 70.0, 67.0, 56.0, 79.0, 69.0, 64.0, 57.0, 46.0, 46.0, 30.0, 26.0, 13.0, 16.0, 9.0, 7.0, 4.0, 6.0, 0.0, 3.0, 1.0, 1.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1962890625, -0.19023513793945312, -0.18418121337890625, -0.17812728881835938, -0.1720733642578125, -0.16601943969726562, -0.15996551513671875, -0.15391159057617188, -0.147857666015625, -0.14180374145507812, -0.13574981689453125, -0.12969589233398438, -0.1236419677734375, -0.11758804321289062, -0.11153411865234375, -0.10548019409179688, -0.09942626953125, -0.09337234497070312, -0.08731842041015625, -0.08126449584960938, -0.0752105712890625, -0.06915664672851562, -0.06310272216796875, -0.057048797607421875, -0.050994873046875, -0.044940948486328125, -0.03888702392578125, -0.032833099365234375, -0.0267791748046875, -0.020725250244140625, -0.01467132568359375, -0.008617401123046875, -0.0025634765625, 0.003490447998046875, 0.00954437255859375, 0.015598297119140625, 0.0216522216796875, 0.027706146240234375, 0.03376007080078125, 0.039813995361328125, 0.045867919921875, 0.051921844482421875, 0.05797576904296875, 0.06402969360351562, 0.0700836181640625, 0.07613754272460938, 0.08219146728515625, 0.08824539184570312, 0.09429931640625, 0.10035324096679688, 0.10640716552734375, 0.11246109008789062, 0.1185150146484375, 0.12456893920898438, 0.13062286376953125, 0.13667678833007812, 0.142730712890625, 0.14878463745117188, 0.15483856201171875, 0.16089248657226562, 0.1669464111328125, 0.17300033569335938, 0.17905426025390625, 0.18510818481445312, 0.191162109375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 8.0, 7.0, 10.0, 12.0, 16.0, 19.0, 28.0, 33.0, 51.0, 70.0, 144.0, 276.0, 593.0, 1311.0, 3625.0, 12257.0, 56142.0, 744211.0, 3256752.0, 93162.0, 17502.0, 4811.0, 1697.0, 742.0, 365.0, 166.0, 106.0, 55.0, 45.0, 23.0, 16.0, 7.0, 4.0, 9.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.3046875, -1.2640838623046875, -1.223480224609375, -1.1828765869140625, -1.14227294921875, -1.1016693115234375, -1.061065673828125, -1.0204620361328125, -0.9798583984375, -0.9392547607421875, -0.898651123046875, -0.8580474853515625, -0.81744384765625, -0.7768402099609375, -0.736236572265625, -0.6956329345703125, -0.655029296875, -0.6144256591796875, -0.573822021484375, -0.5332183837890625, -0.49261474609375, -0.4520111083984375, -0.411407470703125, -0.3708038330078125, -0.3302001953125, -0.2895965576171875, -0.248992919921875, -0.2083892822265625, -0.16778564453125, -0.1271820068359375, -0.086578369140625, -0.0459747314453125, -0.00537109375, 0.0352325439453125, 0.075836181640625, 0.1164398193359375, 0.15704345703125, 0.1976470947265625, 0.238250732421875, 0.2788543701171875, 0.3194580078125, 0.3600616455078125, 0.400665283203125, 0.4412689208984375, 0.48187255859375, 0.5224761962890625, 0.563079833984375, 0.6036834716796875, 0.644287109375, 0.6848907470703125, 0.725494384765625, 0.7660980224609375, 0.80670166015625, 0.8473052978515625, 0.887908935546875, 0.9285125732421875, 0.9691162109375, 1.0097198486328125, 1.050323486328125, 1.0909271240234375, 1.13153076171875, 1.1721343994140625, 1.212738037109375, 1.2533416748046875, 1.2939453125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 10.0, 10.0, 5.0, 12.0, 27.0, 30.0, 40.0, 75.0, 95.0, 254.0, 818.0, 1821.0, 422.0, 175.0, 100.0, 58.0, 41.0, 30.0, 17.0, 11.0, 9.0, 7.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.56494140625, -0.5512466430664062, -0.5375518798828125, -0.5238571166992188, -0.510162353515625, -0.49646759033203125, -0.4827728271484375, -0.46907806396484375, -0.45538330078125, -0.44168853759765625, -0.4279937744140625, -0.41429901123046875, -0.400604248046875, -0.38690948486328125, -0.3732147216796875, -0.35951995849609375, -0.3458251953125, -0.33213043212890625, -0.3184356689453125, -0.30474090576171875, -0.291046142578125, -0.27735137939453125, -0.2636566162109375, -0.24996185302734375, -0.23626708984375, -0.22257232666015625, -0.2088775634765625, -0.19518280029296875, -0.181488037109375, -0.16779327392578125, -0.1540985107421875, -0.14040374755859375, -0.126708984375, -0.11301422119140625, -0.0993194580078125, -0.08562469482421875, -0.071929931640625, -0.05823516845703125, -0.0445404052734375, -0.03084564208984375, -0.01715087890625, -0.00345611572265625, 0.0102386474609375, 0.02393341064453125, 0.037628173828125, 0.05132293701171875, 0.0650177001953125, 0.07871246337890625, 0.0924072265625, 0.10610198974609375, 0.1197967529296875, 0.13349151611328125, 0.147186279296875, 0.16088104248046875, 0.1745758056640625, 0.18827056884765625, 0.20196533203125, 0.21566009521484375, 0.2293548583984375, 0.24304962158203125, 0.256744384765625, 0.27043914794921875, 0.2841339111328125, 0.29782867431640625, 0.3115234375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 1.0, 7.0, 8.0, 24.0, 27.0, 38.0, 61.0, 76.0, 117.0, 110.0, 127.0, 104.0, 89.0, 64.0, 52.0, 31.0, 27.0, 13.0, 9.0, 5.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9320218563079834, -1.8636082410812378, -1.7951946258544922, -1.7267810106277466, -1.658367395401001, -1.589953899383545, -1.5215402841567993, -1.4531266689300537, -1.384713053703308, -1.3162994384765625, -1.247885823249817, -1.1794722080230713, -1.1110587120056152, -1.04264497756958, -0.974231481552124, -0.9058178663253784, -0.8374042510986328, -0.7689906358718872, -0.7005770206451416, -0.6321634650230408, -0.5637498497962952, -0.49533623456954956, -0.42692264914512634, -0.3585090637207031, -0.2900954484939575, -0.2216818481683731, -0.1532682478427887, -0.08485464751720428, -0.016441047191619873, 0.05197256803512573, 0.12038615345954895, 0.18879973888397217, 0.2572135925292969, 0.3256272077560425, 0.3940407931804657, 0.4624543786048889, 0.5308679938316345, 0.5992816090583801, 0.667695164680481, 0.7361087799072266, 0.8045223951339722, 0.8729360103607178, 0.9413496255874634, 1.009763240814209, 1.078176736831665, 1.1465904712677002, 1.2150039672851562, 1.2834175825119019, 1.3518311977386475, 1.420244812965393, 1.4886584281921387, 1.5570720434188843, 1.6254856586456299, 1.693899154663086, 1.7623127698898315, 1.8307263851165771, 1.8991400003433228, 1.9675536155700684, 2.0359671115875244, 2.1043808460235596, 2.1727943420410156, 2.241208076477051, 2.309621572494507, 2.378035068511963, 2.446448802947998]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 4.0, 6.0, 19.0, 6.0, 9.0, 14.0, 14.0, 12.0, 22.0, 24.0, 24.0, 27.0, 20.0, 24.0, 23.0, 23.0, 33.0, 35.0, 35.0, 41.0, 28.0, 37.0, 29.0, 32.0, 52.0, 40.0, 42.0, 38.0, 26.0, 24.0, 23.0, 28.0, 22.0, 28.0, 22.0, 15.0, 20.0, 18.0, 11.0, 10.0, 7.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.9040170311927795, -0.8751654624938965, -0.8463138937950134, -0.8174623250961304, -0.7886107563972473, -0.7597591876983643, -0.7309075593948364, -0.7020560503005981, -0.6732044219970703, -0.6443528532981873, -0.6155012845993042, -0.5866497159004211, -0.5577981472015381, -0.528946578502655, -0.500095009803772, -0.47124341130256653, -0.44239187240600586, -0.4135403037071228, -0.38468873500823975, -0.3558371663093567, -0.32698559761047363, -0.2981340289115906, -0.26928243041038513, -0.24043086171150208, -0.21157929301261902, -0.18272772431373596, -0.1538761556148529, -0.12502457201480865, -0.0961730033159256, -0.06732143461704254, -0.03846985101699829, -0.009618282318115234, 0.019233226776123047, 0.0480847992002964, 0.07693637162446976, 0.10578794777393341, 0.13463951647281647, 0.16349108517169952, 0.19234266877174377, 0.22119423747062683, 0.2500458061695099, 0.27889737486839294, 0.307748943567276, 0.33660054206848145, 0.3654521107673645, 0.39430367946624756, 0.4231552481651306, 0.45200681686401367, 0.48085838556289673, 0.5097099542617798, 0.5385615229606628, 0.5674130916595459, 0.596264660358429, 0.625116229057312, 0.6539678573608398, 0.6828193664550781, 0.711670994758606, 0.740522563457489, 0.7693741321563721, 0.7982257008552551, 0.8270772695541382, 0.8559288382530212, 0.8847804069519043, 0.9136320352554321, 0.9424835443496704]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 3.0, 7.0, 15.0, 9.0, 14.0, 22.0, 34.0, 42.0, 77.0, 85.0, 138.0, 218.0, 359.0, 543.0, 920.0, 1654.0, 3164.0, 5958.0, 12507.0, 26524.0, 61250.0, 143325.0, 337166.0, 261471.0, 106854.0, 45490.0, 20271.0, 9601.0, 4846.0, 2423.0, 1293.0, 828.0, 473.0, 308.0, 175.0, 134.0, 93.0, 64.0, 50.0, 35.0, 28.0, 18.0, 19.0, 10.0, 14.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0], "bins": [-0.77294921875, -0.7494049072265625, -0.725860595703125, -0.7023162841796875, -0.67877197265625, -0.6552276611328125, -0.631683349609375, -0.6081390380859375, -0.5845947265625, -0.5610504150390625, -0.537506103515625, -0.5139617919921875, -0.49041748046875, -0.4668731689453125, -0.443328857421875, -0.4197845458984375, -0.396240234375, -0.3726959228515625, -0.349151611328125, -0.3256072998046875, -0.30206298828125, -0.2785186767578125, -0.254974365234375, -0.2314300537109375, -0.2078857421875, -0.1843414306640625, -0.160797119140625, -0.1372528076171875, -0.11370849609375, -0.0901641845703125, -0.066619873046875, -0.0430755615234375, -0.01953125, 0.0040130615234375, 0.027557373046875, 0.0511016845703125, 0.07464599609375, 0.0981903076171875, 0.121734619140625, 0.1452789306640625, 0.1688232421875, 0.1923675537109375, 0.215911865234375, 0.2394561767578125, 0.26300048828125, 0.2865447998046875, 0.310089111328125, 0.3336334228515625, 0.357177734375, 0.3807220458984375, 0.404266357421875, 0.4278106689453125, 0.45135498046875, 0.4748992919921875, 0.498443603515625, 0.5219879150390625, 0.5455322265625, 0.5690765380859375, 0.592620849609375, 0.6161651611328125, 0.63970947265625, 0.6632537841796875, 0.686798095703125, 0.7103424072265625, 0.73388671875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 6.0, 5.0, 5.0, 9.0, 5.0, 13.0, 14.0, 16.0, 24.0, 30.0, 37.0, 40.0, 56.0, 71.0, 71.0, 62.0, 56.0, 60.0, 74.0, 64.0, 54.0, 50.0, 34.0, 26.0, 29.0, 23.0, 14.0, 13.0, 17.0, 5.0, 4.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1822509765625, -0.1764698028564453, -0.17068862915039062, -0.16490745544433594, -0.15912628173828125, -0.15334510803222656, -0.14756393432617188, -0.1417827606201172, -0.1360015869140625, -0.1302204132080078, -0.12443923950195312, -0.11865806579589844, -0.11287689208984375, -0.10709571838378906, -0.10131454467773438, -0.09553337097167969, -0.089752197265625, -0.08397102355957031, -0.07818984985351562, -0.07240867614746094, -0.06662750244140625, -0.06084632873535156, -0.055065155029296875, -0.04928398132324219, -0.0435028076171875, -0.03772163391113281, -0.031940460205078125, -0.026159286499023438, -0.02037811279296875, -0.014596939086914062, -0.008815765380859375, -0.0030345916748046875, 0.00274658203125, 0.008527755737304688, 0.014308929443359375, 0.020090103149414062, 0.02587127685546875, 0.03165245056152344, 0.037433624267578125, 0.04321479797363281, 0.0489959716796875, 0.05477714538574219, 0.060558319091796875, 0.06633949279785156, 0.07212066650390625, 0.07790184020996094, 0.08368301391601562, 0.08946418762207031, 0.095245361328125, 0.10102653503417969, 0.10680770874023438, 0.11258888244628906, 0.11837005615234375, 0.12415122985839844, 0.12993240356445312, 0.1357135772705078, 0.1414947509765625, 0.1472759246826172, 0.15305709838867188, 0.15883827209472656, 0.16461944580078125, 0.17040061950683594, 0.17618179321289062, 0.1819629669189453, 0.187744140625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 6.0, 3.0, 6.0, 12.0, 17.0, 17.0, 25.0, 35.0, 50.0, 53.0, 71.0, 99.0, 133.0, 168.0, 254.0, 385.0, 579.0, 1025.0, 2001.0, 5193.0, 16869.0, 63981.0, 252561.0, 493750.0, 153628.0, 39352.0, 10856.0, 3559.0, 1509.0, 787.0, 463.0, 344.0, 211.0, 143.0, 116.0, 86.0, 66.0, 46.0, 30.0, 17.0, 11.0, 15.0, 10.0, 4.0, 6.0, 2.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.005859375, -0.9756698608398438, -0.9454803466796875, -0.9152908325195312, -0.885101318359375, -0.8549118041992188, -0.8247222900390625, -0.7945327758789062, -0.76434326171875, -0.7341537475585938, -0.7039642333984375, -0.6737747192382812, -0.643585205078125, -0.6133956909179688, -0.5832061767578125, -0.5530166625976562, -0.5228271484375, -0.49263763427734375, -0.4624481201171875, -0.43225860595703125, -0.402069091796875, -0.37187957763671875, -0.3416900634765625, -0.31150054931640625, -0.28131103515625, -0.25112152099609375, -0.2209320068359375, -0.19074249267578125, -0.160552978515625, -0.13036346435546875, -0.1001739501953125, -0.06998443603515625, -0.039794921875, -0.00960540771484375, 0.0205841064453125, 0.05077362060546875, 0.080963134765625, 0.11115264892578125, 0.1413421630859375, 0.17153167724609375, 0.20172119140625, 0.23191070556640625, 0.2621002197265625, 0.29228973388671875, 0.322479248046875, 0.35266876220703125, 0.3828582763671875, 0.41304779052734375, 0.4432373046875, 0.47342681884765625, 0.5036163330078125, 0.5338058471679688, 0.563995361328125, 0.5941848754882812, 0.6243743896484375, 0.6545639038085938, 0.68475341796875, 0.7149429321289062, 0.7451324462890625, 0.7753219604492188, 0.805511474609375, 0.8357009887695312, 0.8658905029296875, 0.8960800170898438, 0.92626953125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 7.0, 5.0, 6.0, 10.0, 13.0, 12.0, 14.0, 20.0, 12.0, 26.0, 36.0, 35.0, 24.0, 33.0, 36.0, 58.0, 39.0, 48.0, 52.0, 39.0, 49.0, 50.0, 46.0, 51.0, 36.0, 33.0, 32.0, 22.0, 20.0, 19.0, 16.0, 11.0, 16.0, 15.0, 12.0, 9.0, 4.0, 7.0, 6.0, 5.0, 3.0, 3.0, 0.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.63232421875, -0.6118392944335938, -0.5913543701171875, -0.5708694458007812, -0.550384521484375, -0.5298995971679688, -0.5094146728515625, -0.48892974853515625, -0.46844482421875, -0.44795989990234375, -0.4274749755859375, -0.40699005126953125, -0.386505126953125, -0.36602020263671875, -0.3455352783203125, -0.32505035400390625, -0.3045654296875, -0.28408050537109375, -0.2635955810546875, -0.24311065673828125, -0.222625732421875, -0.20214080810546875, -0.1816558837890625, -0.16117095947265625, -0.14068603515625, -0.12020111083984375, -0.0997161865234375, -0.07923126220703125, -0.058746337890625, -0.03826141357421875, -0.0177764892578125, 0.00270843505859375, 0.023193359375, 0.04367828369140625, 0.0641632080078125, 0.08464813232421875, 0.105133056640625, 0.12561798095703125, 0.1461029052734375, 0.16658782958984375, 0.18707275390625, 0.20755767822265625, 0.2280426025390625, 0.24852752685546875, 0.269012451171875, 0.28949737548828125, 0.3099822998046875, 0.33046722412109375, 0.3509521484375, 0.37143707275390625, 0.3919219970703125, 0.41240692138671875, 0.432891845703125, 0.45337677001953125, 0.4738616943359375, 0.49434661865234375, 0.51483154296875, 0.5353164672851562, 0.5558013916015625, 0.5762863159179688, 0.596771240234375, 0.6172561645507812, 0.6377410888671875, 0.6582260131835938, 0.6787109375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 11.0, 8.0, 9.0, 11.0, 31.0, 40.0, 63.0, 113.0, 183.0, 319.0, 516.0, 930.0, 1916.0, 4246.0, 10859.0, 36417.0, 236236.0, 631521.0, 92063.0, 20172.0, 6815.0, 2906.0, 1413.0, 722.0, 382.0, 243.0, 141.0, 83.0, 59.0, 37.0, 30.0, 11.0, 15.0, 7.0, 10.0, 3.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7958984375, -0.771240234375, -0.74658203125, -0.721923828125, -0.697265625, -0.672607421875, -0.64794921875, -0.623291015625, -0.5986328125, -0.573974609375, -0.54931640625, -0.524658203125, -0.5, -0.475341796875, -0.45068359375, -0.426025390625, -0.4013671875, -0.376708984375, -0.35205078125, -0.327392578125, -0.302734375, -0.278076171875, -0.25341796875, -0.228759765625, -0.2041015625, -0.179443359375, -0.15478515625, -0.130126953125, -0.10546875, -0.080810546875, -0.05615234375, -0.031494140625, -0.0068359375, 0.017822265625, 0.04248046875, 0.067138671875, 0.091796875, 0.116455078125, 0.14111328125, 0.165771484375, 0.1904296875, 0.215087890625, 0.23974609375, 0.264404296875, 0.2890625, 0.313720703125, 0.33837890625, 0.363037109375, 0.3876953125, 0.412353515625, 0.43701171875, 0.461669921875, 0.486328125, 0.510986328125, 0.53564453125, 0.560302734375, 0.5849609375, 0.609619140625, 0.63427734375, 0.658935546875, 0.68359375, 0.708251953125, 0.73291015625, 0.757568359375, 0.7822265625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 6.0, 7.0, 11.0, 12.0, 15.0, 24.0, 16.0, 27.0, 36.0, 30.0, 33.0, 45.0, 54.0, 61.0, 67.0, 71.0, 67.0, 63.0, 66.0, 47.0, 41.0, 33.0, 30.0, 19.0, 17.0, 16.0, 12.0, 16.0, 11.0, 9.0, 8.0, 7.0, 7.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.95125961303711e-05, -7.690489292144775e-05, -7.429718971252441e-05, -7.168948650360107e-05, -6.908178329467773e-05, -6.64740800857544e-05, -6.386637687683105e-05, -6.125867366790771e-05, -5.8650970458984375e-05, -5.6043267250061035e-05, -5.3435564041137695e-05, -5.0827860832214355e-05, -4.8220157623291016e-05, -4.5612454414367676e-05, -4.3004751205444336e-05, -4.0397047996520996e-05, -3.7789344787597656e-05, -3.5181641578674316e-05, -3.2573938369750977e-05, -2.9966235160827637e-05, -2.7358531951904297e-05, -2.4750828742980957e-05, -2.2143125534057617e-05, -1.9535422325134277e-05, -1.6927719116210938e-05, -1.4320015907287598e-05, -1.1712312698364258e-05, -9.104609489440918e-06, -6.496906280517578e-06, -3.889203071594238e-06, -1.2814998626708984e-06, 1.3262033462524414e-06, 3.933906555175781e-06, 6.541609764099121e-06, 9.149312973022461e-06, 1.17570161819458e-05, 1.436471939086914e-05, 1.697242259979248e-05, 1.958012580871582e-05, 2.218782901763916e-05, 2.47955322265625e-05, 2.740323543548584e-05, 3.001093864440918e-05, 3.261864185333252e-05, 3.522634506225586e-05, 3.78340482711792e-05, 4.044175148010254e-05, 4.304945468902588e-05, 4.565715789794922e-05, 4.826486110687256e-05, 5.08725643157959e-05, 5.348026752471924e-05, 5.608797073364258e-05, 5.869567394256592e-05, 6.130337715148926e-05, 6.39110803604126e-05, 6.651878356933594e-05, 6.912648677825928e-05, 7.173418998718262e-05, 7.434189319610596e-05, 7.69495964050293e-05, 7.955729961395264e-05, 8.216500282287598e-05, 8.477270603179932e-05, 8.738040924072266e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 7.0, 11.0, 6.0, 11.0, 16.0, 33.0, 48.0, 59.0, 107.0, 179.0, 372.0, 718.0, 1876.0, 5658.0, 25399.0, 294500.0, 663377.0, 43380.0, 8392.0, 2512.0, 865.0, 420.0, 220.0, 133.0, 83.0, 51.0, 39.0, 21.0, 13.0, 11.0, 10.0, 7.0, 2.0, 4.0, 3.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1015625, -1.066192626953125, -1.03082275390625, -0.995452880859375, -0.9600830078125, -0.924713134765625, -0.88934326171875, -0.853973388671875, -0.818603515625, -0.783233642578125, -0.74786376953125, -0.712493896484375, -0.6771240234375, -0.641754150390625, -0.60638427734375, -0.571014404296875, -0.53564453125, -0.500274658203125, -0.46490478515625, -0.429534912109375, -0.3941650390625, -0.358795166015625, -0.32342529296875, -0.288055419921875, -0.252685546875, -0.217315673828125, -0.18194580078125, -0.146575927734375, -0.1112060546875, -0.075836181640625, -0.04046630859375, -0.005096435546875, 0.0302734375, 0.065643310546875, 0.10101318359375, 0.136383056640625, 0.1717529296875, 0.207122802734375, 0.24249267578125, 0.277862548828125, 0.313232421875, 0.348602294921875, 0.38397216796875, 0.419342041015625, 0.4547119140625, 0.490081787109375, 0.52545166015625, 0.560821533203125, 0.59619140625, 0.631561279296875, 0.66693115234375, 0.702301025390625, 0.7376708984375, 0.773040771484375, 0.80841064453125, 0.843780517578125, 0.879150390625, 0.914520263671875, 0.94989013671875, 0.985260009765625, 1.0206298828125, 1.055999755859375, 1.09136962890625, 1.126739501953125, 1.162109375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 3.0, 4.0, 3.0, 2.0, 3.0, 5.0, 12.0, 12.0, 27.0, 23.0, 26.0, 49.0, 83.0, 128.0, 134.0, 140.0, 110.0, 61.0, 53.0, 32.0, 27.0, 16.0, 11.0, 14.0, 5.0, 5.0, 1.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.77783203125, -0.757293701171875, -0.73675537109375, -0.716217041015625, -0.6956787109375, -0.675140380859375, -0.65460205078125, -0.634063720703125, -0.613525390625, -0.592987060546875, -0.57244873046875, -0.551910400390625, -0.5313720703125, -0.510833740234375, -0.49029541015625, -0.469757080078125, -0.44921875, -0.428680419921875, -0.40814208984375, -0.387603759765625, -0.3670654296875, -0.346527099609375, -0.32598876953125, -0.305450439453125, -0.284912109375, -0.264373779296875, -0.24383544921875, -0.223297119140625, -0.2027587890625, -0.182220458984375, -0.16168212890625, -0.141143798828125, -0.12060546875, -0.100067138671875, -0.07952880859375, -0.058990478515625, -0.0384521484375, -0.017913818359375, 0.00262451171875, 0.023162841796875, 0.043701171875, 0.064239501953125, 0.08477783203125, 0.105316162109375, 0.1258544921875, 0.146392822265625, 0.16693115234375, 0.187469482421875, 0.2080078125, 0.228546142578125, 0.24908447265625, 0.269622802734375, 0.2901611328125, 0.310699462890625, 0.33123779296875, 0.351776123046875, 0.372314453125, 0.392852783203125, 0.41339111328125, 0.433929443359375, 0.4544677734375, 0.475006103515625, 0.49554443359375, 0.516082763671875, 0.53662109375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 8.0, 22.0, 37.0, 65.0, 88.0, 132.0, 149.0, 158.0, 131.0, 83.0, 54.0, 31.0, 22.0, 8.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.179854393005371, -5.921067714691162, -5.662281036376953, -5.403494358062744, -5.144707679748535, -4.885921478271484, -4.627134799957275, -4.368348121643066, -4.109561443328857, -3.8507747650146484, -3.5919880867004395, -3.3332016468048096, -3.0744149684906006, -2.8156282901763916, -2.5568418502807617, -2.2980551719665527, -2.0392684936523438, -1.7804818153381348, -1.5216952562332153, -1.262908697128296, -1.004122018814087, -0.7453353404998779, -0.4865487813949585, -0.22776222229003906, 0.031024456024169922, 0.28981107473373413, 0.5485976934432983, 0.8073843121528625, 1.0661709308624268, 1.3249576091766357, 1.5837441682815552, 1.8425307273864746, 2.1013174057006836, 2.3601040840148926, 2.6188907623291016, 2.8776772022247314, 3.1364638805389404, 3.3952505588531494, 3.6540369987487793, 3.9128236770629883, 4.171610355377197, 4.430397033691406, 4.689183712005615, 4.947970390319824, 5.206756591796875, 5.465543746948242, 5.724329948425293, 5.983116626739502, 6.241903305053711, 6.50068998336792, 6.759476661682129, 7.018263339996338, 7.277050018310547, 7.535836219787598, 7.794622898101807, 8.053409576416016, 8.312196731567383, 8.570982933044434, 8.8297700881958, 9.088556289672852, 9.347343444824219, 9.60612964630127, 9.864916801452637, 10.123703002929688, 10.382489204406738]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 6.0, 3.0, 11.0, 13.0, 9.0, 12.0, 22.0, 26.0, 23.0, 33.0, 26.0, 34.0, 31.0, 50.0, 48.0, 45.0, 46.0, 52.0, 50.0, 53.0, 50.0, 46.0, 51.0, 40.0, 36.0, 50.0, 33.0, 18.0, 17.0, 14.0, 18.0, 19.0, 9.0, 6.0, 3.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.043224811553955, -4.891587734222412, -4.739951133728027, -4.588314056396484, -4.436676979064941, -4.285039901733398, -4.133403301239014, -3.9817662239074707, -3.8301291465759277, -3.678492307662964, -3.526855230331421, -3.375218391418457, -3.223581314086914, -3.07194447517395, -2.9203076362609863, -2.7686705589294434, -2.6170337200164795, -2.4653968811035156, -2.3137598037719727, -2.162122964859009, -2.010485887527466, -1.858849048614502, -1.7072120904922485, -1.5555751323699951, -1.4039381742477417, -1.2523012161254883, -1.1006642580032349, -0.9490273594856262, -0.7973904013633728, -0.6457534432411194, -0.49411654472351074, -0.3424795866012573, -0.1908426284790039, -0.03920568525791168, 0.11243125796318054, 0.2640681862831116, 0.415705144405365, 0.5673421025276184, 0.718979001045227, 0.8706159591674805, 1.0222529172897339, 1.1738898754119873, 1.3255268335342407, 1.4771637916564941, 1.628800630569458, 1.780437707901001, 1.9320745468139648, 2.083711624145508, 2.2353484630584717, 2.3869853019714355, 2.5386223793029785, 2.6902592182159424, 2.8418962955474854, 2.993533134460449, 3.145170211791992, 3.296807050704956, 3.44844388961792, 3.600080728530884, 3.7517178058624268, 3.9033546447753906, 4.054991722106934, 4.206628799438477, 4.358265399932861, 4.509902477264404, 4.661539554595947]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 12.0, 9.0, 22.0, 34.0, 44.0, 82.0, 118.0, 190.0, 271.0, 501.0, 790.0, 1466.0, 2762.0, 5629.0, 12824.0, 33527.0, 114002.0, 1235311.0, 2593917.0, 128707.0, 37201.0, 13810.0, 6081.0, 2993.0, 1575.0, 935.0, 529.0, 324.0, 211.0, 138.0, 73.0, 48.0, 34.0, 34.0, 20.0, 15.0, 6.0, 7.0, 5.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7705078125, -0.7439804077148438, -0.7174530029296875, -0.6909255981445312, -0.664398193359375, -0.6378707885742188, -0.6113433837890625, -0.5848159790039062, -0.55828857421875, -0.5317611694335938, -0.5052337646484375, -0.47870635986328125, -0.452178955078125, -0.42565155029296875, -0.3991241455078125, -0.37259674072265625, -0.3460693359375, -0.31954193115234375, -0.2930145263671875, -0.26648712158203125, -0.239959716796875, -0.21343231201171875, -0.1869049072265625, -0.16037750244140625, -0.13385009765625, -0.10732269287109375, -0.0807952880859375, -0.05426788330078125, -0.027740478515625, -0.00121307373046875, 0.0253143310546875, 0.05184173583984375, 0.078369140625, 0.10489654541015625, 0.1314239501953125, 0.15795135498046875, 0.184478759765625, 0.21100616455078125, 0.2375335693359375, 0.26406097412109375, 0.29058837890625, 0.31711578369140625, 0.3436431884765625, 0.37017059326171875, 0.396697998046875, 0.42322540283203125, 0.4497528076171875, 0.47628021240234375, 0.5028076171875, 0.5293350219726562, 0.5558624267578125, 0.5823898315429688, 0.608917236328125, 0.6354446411132812, 0.6619720458984375, 0.6884994506835938, 0.71502685546875, 0.7415542602539062, 0.7680816650390625, 0.7946090698242188, 0.821136474609375, 0.8476638793945312, 0.8741912841796875, 0.9007186889648438, 0.92724609375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 9.0, 7.0, 5.0, 17.0, 17.0, 10.0, 14.0, 23.0, 20.0, 40.0, 36.0, 53.0, 42.0, 62.0, 71.0, 64.0, 74.0, 68.0, 58.0, 54.0, 45.0, 38.0, 32.0, 22.0, 30.0, 26.0, 11.0, 15.0, 6.0, 10.0, 7.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1795654296875, -0.1735706329345703, -0.16757583618164062, -0.16158103942871094, -0.15558624267578125, -0.14959144592285156, -0.14359664916992188, -0.1376018524169922, -0.1316070556640625, -0.1256122589111328, -0.11961746215820312, -0.11362266540527344, -0.10762786865234375, -0.10163307189941406, -0.09563827514648438, -0.08964347839355469, -0.083648681640625, -0.07765388488769531, -0.07165908813476562, -0.06566429138183594, -0.05966949462890625, -0.05367469787597656, -0.047679901123046875, -0.04168510437011719, -0.0356903076171875, -0.029695510864257812, -0.023700714111328125, -0.017705917358398438, -0.01171112060546875, -0.0057163238525390625, 0.000278472900390625, 0.0062732696533203125, 0.01226806640625, 0.018262863159179688, 0.024257659912109375, 0.030252456665039062, 0.03624725341796875, 0.04224205017089844, 0.048236846923828125, 0.05423164367675781, 0.0602264404296875, 0.06622123718261719, 0.07221603393554688, 0.07821083068847656, 0.08420562744140625, 0.09020042419433594, 0.09619522094726562, 0.10219001770019531, 0.108184814453125, 0.11417961120605469, 0.12017440795898438, 0.12616920471191406, 0.13216400146484375, 0.13815879821777344, 0.14415359497070312, 0.1501483917236328, 0.1561431884765625, 0.1621379852294922, 0.16813278198242188, 0.17412757873535156, 0.18012237548828125, 0.18611717224121094, 0.19211196899414062, 0.1981067657470703, 0.2041015625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 8.0, 8.0, 12.0, 21.0, 30.0, 43.0, 54.0, 90.0, 143.0, 198.0, 328.0, 513.0, 767.0, 1324.0, 2246.0, 4124.0, 8041.0, 17003.0, 40537.0, 120759.0, 643961.0, 2950310.0, 277507.0, 72782.0, 27477.0, 12038.0, 5930.0, 3224.0, 1790.0, 1110.0, 658.0, 444.0, 266.0, 195.0, 110.0, 90.0, 44.0, 38.0, 20.0, 15.0, 10.0, 3.0, 2.0, 6.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.80712890625, -0.7854843139648438, -0.7638397216796875, -0.7421951293945312, -0.720550537109375, -0.6989059448242188, -0.6772613525390625, -0.6556167602539062, -0.63397216796875, -0.6123275756835938, -0.5906829833984375, -0.5690383911132812, -0.547393798828125, -0.5257492065429688, -0.5041046142578125, -0.48246002197265625, -0.4608154296875, -0.43917083740234375, -0.4175262451171875, -0.39588165283203125, -0.374237060546875, -0.35259246826171875, -0.3309478759765625, -0.30930328369140625, -0.28765869140625, -0.26601409912109375, -0.2443695068359375, -0.22272491455078125, -0.201080322265625, -0.17943572998046875, -0.1577911376953125, -0.13614654541015625, -0.114501953125, -0.09285736083984375, -0.0712127685546875, -0.04956817626953125, -0.027923583984375, -0.00627899169921875, 0.0153656005859375, 0.03701019287109375, 0.05865478515625, 0.08029937744140625, 0.1019439697265625, 0.12358856201171875, 0.145233154296875, 0.16687774658203125, 0.1885223388671875, 0.21016693115234375, 0.2318115234375, 0.25345611572265625, 0.2751007080078125, 0.29674530029296875, 0.318389892578125, 0.34003448486328125, 0.3616790771484375, 0.38332366943359375, 0.40496826171875, 0.42661285400390625, 0.4482574462890625, 0.46990203857421875, 0.491546630859375, 0.5131912231445312, 0.5348358154296875, 0.5564804077148438, 0.578125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 3.0, 10.0, 9.0, 14.0, 10.0, 11.0, 27.0, 28.0, 27.0, 42.0, 75.0, 99.0, 165.0, 244.0, 481.0, 1275.0, 719.0, 265.0, 173.0, 104.0, 79.0, 52.0, 34.0, 25.0, 16.0, 23.0, 11.0, 8.0, 9.0, 5.0, 8.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.31494140625, -0.3039703369140625, -0.292999267578125, -0.2820281982421875, -0.27105712890625, -0.2600860595703125, -0.249114990234375, -0.2381439208984375, -0.2271728515625, -0.2162017822265625, -0.205230712890625, -0.1942596435546875, -0.18328857421875, -0.1723175048828125, -0.161346435546875, -0.1503753662109375, -0.139404296875, -0.1284332275390625, -0.117462158203125, -0.1064910888671875, -0.09552001953125, -0.0845489501953125, -0.073577880859375, -0.0626068115234375, -0.0516357421875, -0.0406646728515625, -0.029693603515625, -0.0187225341796875, -0.00775146484375, 0.0032196044921875, 0.014190673828125, 0.0251617431640625, 0.0361328125, 0.0471038818359375, 0.058074951171875, 0.0690460205078125, 0.08001708984375, 0.0909881591796875, 0.101959228515625, 0.1129302978515625, 0.1239013671875, 0.1348724365234375, 0.145843505859375, 0.1568145751953125, 0.16778564453125, 0.1787567138671875, 0.189727783203125, 0.2006988525390625, 0.211669921875, 0.2226409912109375, 0.233612060546875, 0.2445831298828125, 0.25555419921875, 0.2665252685546875, 0.277496337890625, 0.2884674072265625, 0.2994384765625, 0.3104095458984375, 0.321380615234375, 0.3323516845703125, 0.34332275390625, 0.3542938232421875, 0.365264892578125, 0.3762359619140625, 0.38720703125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 10.0, 9.0, 12.0, 38.0, 39.0, 82.0, 122.0, 121.0, 130.0, 131.0, 96.0, 83.0, 55.0, 39.0, 13.0, 10.0, 3.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0203566551208496, -2.920823097229004, -2.821289539337158, -2.7217559814453125, -2.622222661972046, -2.5226891040802, -2.4231555461883545, -2.323621988296509, -2.224088668823242, -2.1245551109313965, -2.025021553039551, -1.9254881143569946, -1.8259546756744385, -1.7264211177825928, -1.626887559890747, -1.5273540019989014, -1.4278204441070557, -1.32828688621521, -1.2287534475326538, -1.129219889640808, -1.029686450958252, -0.9301528930664062, -0.8306193351745605, -0.7310858368873596, -0.6315523386001587, -0.5320188403129578, -0.43248531222343445, -0.33295178413391113, -0.2334182858467102, -0.13388478755950928, -0.034351229667663574, 0.06518226861953735, 0.16471576690673828, 0.2642492651939392, 0.3637827932834625, 0.46331632137298584, 0.5628498196601868, 0.6623833179473877, 0.7619168758392334, 0.8614503741264343, 0.9609838724136353, 1.060517430305481, 1.160050868988037, 1.2595844268798828, 1.3591179847717285, 1.4586514234542847, 1.5581849813461304, 1.6577184200286865, 1.7572519779205322, 1.856785535812378, 1.956318974494934, 2.0558524131774902, 2.155385971069336, 2.2549195289611816, 2.3544530868530273, 2.453986644744873, 2.5535202026367188, 2.6530537605285645, 2.75258731842041, 2.852120876312256, 2.9516541957855225, 3.051187753677368, 3.150721311569214, 3.2502548694610596, 3.349788188934326]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 8.0, 9.0, 10.0, 11.0, 20.0, 17.0, 25.0, 21.0, 22.0, 35.0, 22.0, 32.0, 35.0, 36.0, 31.0, 39.0, 36.0, 44.0, 46.0, 43.0, 46.0, 44.0, 55.0, 34.0, 34.0, 38.0, 32.0, 29.0, 32.0, 20.0, 17.0, 19.0, 9.0, 9.0, 10.0, 8.0, 7.0, 3.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4160257577896118, -1.3683379888534546, -1.3206502199172974, -1.2729624509811401, -1.225274682044983, -1.1775869131088257, -1.129899263381958, -1.0822114944458008, -1.0345237255096436, -0.9868359565734863, -0.9391481876373291, -0.8914604187011719, -0.8437726497650146, -0.7960848808288574, -0.748397171497345, -0.7007094025611877, -0.6530215740203857, -0.6053338050842285, -0.5576460361480713, -0.5099582672119141, -0.4622705280780792, -0.414582759141922, -0.36689502000808716, -0.31920725107192993, -0.2715194821357727, -0.22383171319961548, -0.17614395916461945, -0.1284562051296234, -0.08076843619346619, -0.03308066725730896, 0.014607071876525879, 0.062294840812683105, 0.10998249053955078, 0.157670259475708, 0.20535801351070404, 0.2530457675457001, 0.3007335364818573, 0.3484213054180145, 0.39610904455184937, 0.4437968134880066, 0.4914845824241638, 0.539172351360321, 0.5868601202964783, 0.6345478296279907, 0.682235598564148, 0.7299233675003052, 0.7776111364364624, 0.8252989053726196, 0.8729866743087769, 0.9206744432449341, 0.9683622121810913, 1.0160499811172485, 1.0637377500534058, 1.111425518989563, 1.1591131687164307, 1.206800937652588, 1.2544887065887451, 1.3021764755249023, 1.3498642444610596, 1.3975520133972168, 1.445239782333374, 1.4929275512695312, 1.5406153202056885, 1.5883030891418457, 1.635990858078003]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 9.0, 9.0, 11.0, 11.0, 22.0, 36.0, 53.0, 70.0, 78.0, 122.0, 191.0, 330.0, 550.0, 899.0, 1488.0, 2725.0, 5104.0, 10097.0, 21013.0, 46015.0, 117430.0, 577888.0, 159687.0, 54814.0, 24831.0, 11763.0, 5836.0, 3217.0, 1674.0, 1015.0, 553.0, 351.0, 200.0, 149.0, 102.0, 60.0, 47.0, 31.0, 24.0, 18.0, 14.0, 6.0, 5.0, 1.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.97021484375, -0.9421768188476562, -0.9141387939453125, -0.8861007690429688, -0.858062744140625, -0.8300247192382812, -0.8019866943359375, -0.7739486694335938, -0.74591064453125, -0.7178726196289062, -0.6898345947265625, -0.6617965698242188, -0.633758544921875, -0.6057205200195312, -0.5776824951171875, -0.5496444702148438, -0.5216064453125, -0.49356842041015625, -0.4655303955078125, -0.43749237060546875, -0.409454345703125, -0.38141632080078125, -0.3533782958984375, -0.32534027099609375, -0.29730224609375, -0.26926422119140625, -0.2412261962890625, -0.21318817138671875, -0.185150146484375, -0.15711212158203125, -0.1290740966796875, -0.10103607177734375, -0.072998046875, -0.04496002197265625, -0.0169219970703125, 0.01111602783203125, 0.039154052734375, 0.06719207763671875, 0.0952301025390625, 0.12326812744140625, 0.15130615234375, 0.17934417724609375, 0.2073822021484375, 0.23542022705078125, 0.263458251953125, 0.29149627685546875, 0.3195343017578125, 0.34757232666015625, 0.3756103515625, 0.40364837646484375, 0.4316864013671875, 0.45972442626953125, 0.487762451171875, 0.5158004760742188, 0.5438385009765625, 0.5718765258789062, 0.59991455078125, 0.6279525756835938, 0.6559906005859375, 0.6840286254882812, 0.712066650390625, 0.7401046752929688, 0.7681427001953125, 0.7961807250976562, 0.82421875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 8.0, 5.0, 7.0, 14.0, 15.0, 14.0, 12.0, 21.0, 18.0, 20.0, 36.0, 52.0, 37.0, 47.0, 64.0, 67.0, 71.0, 53.0, 60.0, 60.0, 53.0, 42.0, 32.0, 35.0, 28.0, 24.0, 24.0, 24.0, 13.0, 13.0, 7.0, 7.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18017578125, -0.174346923828125, -0.16851806640625, -0.162689208984375, -0.1568603515625, -0.151031494140625, -0.14520263671875, -0.139373779296875, -0.133544921875, -0.127716064453125, -0.12188720703125, -0.116058349609375, -0.1102294921875, -0.104400634765625, -0.09857177734375, -0.092742919921875, -0.0869140625, -0.081085205078125, -0.07525634765625, -0.069427490234375, -0.0635986328125, -0.057769775390625, -0.05194091796875, -0.046112060546875, -0.040283203125, -0.034454345703125, -0.02862548828125, -0.022796630859375, -0.0169677734375, -0.011138916015625, -0.00531005859375, 0.000518798828125, 0.00634765625, 0.012176513671875, 0.01800537109375, 0.023834228515625, 0.0296630859375, 0.035491943359375, 0.04132080078125, 0.047149658203125, 0.052978515625, 0.058807373046875, 0.06463623046875, 0.070465087890625, 0.0762939453125, 0.082122802734375, 0.08795166015625, 0.093780517578125, 0.099609375, 0.105438232421875, 0.11126708984375, 0.117095947265625, 0.1229248046875, 0.128753662109375, 0.13458251953125, 0.140411376953125, 0.146240234375, 0.152069091796875, 0.15789794921875, 0.163726806640625, 0.1695556640625, 0.175384521484375, 0.18121337890625, 0.187042236328125, 0.19287109375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 10.0, 4.0, 4.0, 11.0, 12.0, 20.0, 37.0, 33.0, 41.0, 58.0, 91.0, 109.0, 178.0, 240.0, 342.0, 523.0, 1008.0, 2180.0, 5904.0, 19402.0, 75875.0, 642629.0, 236374.0, 43890.0, 11927.0, 3792.0, 1573.0, 762.0, 456.0, 279.0, 220.0, 152.0, 109.0, 93.0, 49.0, 47.0, 35.0, 22.0, 16.0, 16.0, 8.0, 9.0, 10.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2041015625, -1.1662445068359375, -1.128387451171875, -1.0905303955078125, -1.05267333984375, -1.0148162841796875, -0.976959228515625, -0.9391021728515625, -0.9012451171875, -0.8633880615234375, -0.825531005859375, -0.7876739501953125, -0.74981689453125, -0.7119598388671875, -0.674102783203125, -0.6362457275390625, -0.598388671875, -0.5605316162109375, -0.522674560546875, -0.4848175048828125, -0.44696044921875, -0.4091033935546875, -0.371246337890625, -0.3333892822265625, -0.2955322265625, -0.2576751708984375, -0.219818115234375, -0.1819610595703125, -0.14410400390625, -0.1062469482421875, -0.068389892578125, -0.0305328369140625, 0.00732421875, 0.0451812744140625, 0.083038330078125, 0.1208953857421875, 0.15875244140625, 0.1966094970703125, 0.234466552734375, 0.2723236083984375, 0.3101806640625, 0.3480377197265625, 0.385894775390625, 0.4237518310546875, 0.46160888671875, 0.4994659423828125, 0.537322998046875, 0.5751800537109375, 0.613037109375, 0.6508941650390625, 0.688751220703125, 0.7266082763671875, 0.76446533203125, 0.8023223876953125, 0.840179443359375, 0.8780364990234375, 0.9158935546875, 0.9537506103515625, 0.991607666015625, 1.0294647216796875, 1.06732177734375, 1.1051788330078125, 1.143035888671875, 1.1808929443359375, 1.21875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 10.0, 12.0, 7.0, 12.0, 19.0, 25.0, 49.0, 27.0, 48.0, 62.0, 78.0, 72.0, 77.0, 54.0, 68.0, 63.0, 57.0, 60.0, 41.0, 35.0, 15.0, 34.0, 19.0, 10.0, 14.0, 8.0, 6.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2080078125, -1.1754379272460938, -1.1428680419921875, -1.1102981567382812, -1.077728271484375, -1.0451583862304688, -1.0125885009765625, -0.9800186157226562, -0.94744873046875, -0.9148788452148438, -0.8823089599609375, -0.8497390747070312, -0.817169189453125, -0.7845993041992188, -0.7520294189453125, -0.7194595336914062, -0.6868896484375, -0.6543197631835938, -0.6217498779296875, -0.5891799926757812, -0.556610107421875, -0.5240402221679688, -0.4914703369140625, -0.45890045166015625, -0.42633056640625, -0.39376068115234375, -0.3611907958984375, -0.32862091064453125, -0.296051025390625, -0.26348114013671875, -0.2309112548828125, -0.19834136962890625, -0.165771484375, -0.13320159912109375, -0.1006317138671875, -0.06806182861328125, -0.035491943359375, -0.00292205810546875, 0.0296478271484375, 0.06221771240234375, 0.09478759765625, 0.12735748291015625, 0.1599273681640625, 0.19249725341796875, 0.225067138671875, 0.25763702392578125, 0.2902069091796875, 0.32277679443359375, 0.3553466796875, 0.38791656494140625, 0.4204864501953125, 0.45305633544921875, 0.485626220703125, 0.5181961059570312, 0.5507659912109375, 0.5833358764648438, 0.61590576171875, 0.6484756469726562, 0.6810455322265625, 0.7136154174804688, 0.746185302734375, 0.7787551879882812, 0.8113250732421875, 0.8438949584960938, 0.87646484375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 5.0, 1.0, 6.0, 10.0, 11.0, 11.0, 25.0, 28.0, 42.0, 88.0, 139.0, 313.0, 1033.0, 5274.0, 52576.0, 851538.0, 124897.0, 9999.0, 1669.0, 438.0, 185.0, 89.0, 55.0, 35.0, 23.0, 16.0, 13.0, 12.0, 6.0, 3.0, 8.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0283203125, -0.9977645874023438, -0.9672088623046875, -0.9366531372070312, -0.906097412109375, -0.8755416870117188, -0.8449859619140625, -0.8144302368164062, -0.78387451171875, -0.7533187866210938, -0.7227630615234375, -0.6922073364257812, -0.661651611328125, -0.6310958862304688, -0.6005401611328125, -0.5699844360351562, -0.5394287109375, -0.5088729858398438, -0.4783172607421875, -0.44776153564453125, -0.417205810546875, -0.38665008544921875, -0.3560943603515625, -0.32553863525390625, -0.29498291015625, -0.26442718505859375, -0.2338714599609375, -0.20331573486328125, -0.172760009765625, -0.14220428466796875, -0.1116485595703125, -0.08109283447265625, -0.050537109375, -0.01998138427734375, 0.0105743408203125, 0.04113006591796875, 0.071685791015625, 0.10224151611328125, 0.1327972412109375, 0.16335296630859375, 0.19390869140625, 0.22446441650390625, 0.2550201416015625, 0.28557586669921875, 0.316131591796875, 0.34668731689453125, 0.3772430419921875, 0.40779876708984375, 0.4383544921875, 0.46891021728515625, 0.4994659423828125, 0.5300216674804688, 0.560577392578125, 0.5911331176757812, 0.6216888427734375, 0.6522445678710938, 0.68280029296875, 0.7133560180664062, 0.7439117431640625, 0.7744674682617188, 0.805023193359375, 0.8355789184570312, 0.8661346435546875, 0.8966903686523438, 0.92724609375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 12.0, 12.0, 16.0, 19.0, 30.0, 26.0, 38.0, 47.0, 78.0, 81.0, 108.0, 106.0, 107.0, 79.0, 59.0, 31.0, 36.0, 29.0, 24.0, 20.0, 8.0, 6.0, 6.0, 9.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010538101196289062, -0.00010199286043643951, -9.86047089099884e-05, -9.521655738353729e-05, -9.182840585708618e-05, -8.844025433063507e-05, -8.505210280418396e-05, -8.166395127773285e-05, -7.827579975128174e-05, -7.488764822483063e-05, -7.149949669837952e-05, -6.81113451719284e-05, -6.47231936454773e-05, -6.133504211902618e-05, -5.794689059257507e-05, -5.455873906612396e-05, -5.117058753967285e-05, -4.778243601322174e-05, -4.439428448677063e-05, -4.100613296031952e-05, -3.761798143386841e-05, -3.42298299074173e-05, -3.0841678380966187e-05, -2.7453526854515076e-05, -2.4065375328063965e-05, -2.0677223801612854e-05, -1.7289072275161743e-05, -1.3900920748710632e-05, -1.0512769222259521e-05, -7.124617695808411e-06, -3.7364661693573e-06, -3.4831464290618896e-07, 3.039836883544922e-06, 6.427988409996033e-06, 9.816139936447144e-06, 1.3204291462898254e-05, 1.6592442989349365e-05, 1.9980594515800476e-05, 2.3368746042251587e-05, 2.6756897568702698e-05, 3.014504909515381e-05, 3.353320062160492e-05, 3.692135214805603e-05, 4.030950367450714e-05, 4.369765520095825e-05, 4.708580672740936e-05, 5.0473958253860474e-05, 5.3862109780311584e-05, 5.7250261306762695e-05, 6.0638412833213806e-05, 6.402656435966492e-05, 6.741471588611603e-05, 7.080286741256714e-05, 7.419101893901825e-05, 7.757917046546936e-05, 8.096732199192047e-05, 8.435547351837158e-05, 8.774362504482269e-05, 9.11317765712738e-05, 9.451992809772491e-05, 9.790807962417603e-05, 0.00010129623115062714, 0.00010468438267707825, 0.00010807253420352936, 0.00011146068572998047]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 15.0, 10.0, 5.0, 8.0, 12.0, 18.0, 20.0, 32.0, 35.0, 84.0, 134.0, 247.0, 560.0, 1443.0, 7103.0, 103874.0, 885714.0, 42907.0, 4259.0, 1073.0, 432.0, 223.0, 125.0, 58.0, 42.0, 24.0, 21.0, 18.0, 13.0, 10.0, 10.0, 8.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0419921875, -1.0107574462890625, -0.979522705078125, -0.9482879638671875, -0.91705322265625, -0.8858184814453125, -0.854583740234375, -0.8233489990234375, -0.7921142578125, -0.7608795166015625, -0.729644775390625, -0.6984100341796875, -0.66717529296875, -0.6359405517578125, -0.604705810546875, -0.5734710693359375, -0.542236328125, -0.5110015869140625, -0.479766845703125, -0.4485321044921875, -0.41729736328125, -0.3860626220703125, -0.354827880859375, -0.3235931396484375, -0.2923583984375, -0.2611236572265625, -0.229888916015625, -0.1986541748046875, -0.16741943359375, -0.1361846923828125, -0.104949951171875, -0.0737152099609375, -0.04248046875, -0.0112457275390625, 0.019989013671875, 0.0512237548828125, 0.08245849609375, 0.1136932373046875, 0.144927978515625, 0.1761627197265625, 0.2073974609375, 0.2386322021484375, 0.269866943359375, 0.3011016845703125, 0.33233642578125, 0.3635711669921875, 0.394805908203125, 0.4260406494140625, 0.457275390625, 0.4885101318359375, 0.519744873046875, 0.5509796142578125, 0.58221435546875, 0.6134490966796875, 0.644683837890625, 0.6759185791015625, 0.7071533203125, 0.7383880615234375, 0.769622802734375, 0.8008575439453125, 0.83209228515625, 0.8633270263671875, 0.894561767578125, 0.9257965087890625, 0.95703125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 2.0, 4.0, 4.0, 10.0, 5.0, 16.0, 20.0, 40.0, 47.0, 119.0, 225.0, 207.0, 143.0, 57.0, 30.0, 19.0, 15.0, 7.0, 6.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.431640625, -0.4129180908203125, -0.394195556640625, -0.3754730224609375, -0.35675048828125, -0.3380279541015625, -0.319305419921875, -0.3005828857421875, -0.2818603515625, -0.2631378173828125, -0.244415283203125, -0.2256927490234375, -0.20697021484375, -0.1882476806640625, -0.169525146484375, -0.1508026123046875, -0.132080078125, -0.1133575439453125, -0.094635009765625, -0.0759124755859375, -0.05718994140625, -0.0384674072265625, -0.019744873046875, -0.0010223388671875, 0.0177001953125, 0.0364227294921875, 0.055145263671875, 0.0738677978515625, 0.09259033203125, 0.1113128662109375, 0.130035400390625, 0.1487579345703125, 0.16748046875, 0.1862030029296875, 0.204925537109375, 0.2236480712890625, 0.24237060546875, 0.2610931396484375, 0.279815673828125, 0.2985382080078125, 0.3172607421875, 0.3359832763671875, 0.354705810546875, 0.3734283447265625, 0.39215087890625, 0.4108734130859375, 0.429595947265625, 0.4483184814453125, 0.467041015625, 0.4857635498046875, 0.504486083984375, 0.5232086181640625, 0.54193115234375, 0.5606536865234375, 0.579376220703125, 0.5980987548828125, 0.6168212890625, 0.6355438232421875, 0.654266357421875, 0.6729888916015625, 0.69171142578125, 0.7104339599609375, 0.729156494140625, 0.7478790283203125, 0.7666015625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 8.0, 24.0, 82.0, 220.0, 303.0, 218.0, 102.0, 31.0, 7.0, 7.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.39349365234375, -19.94576644897461, -19.498037338256836, -19.050310134887695, -18.602582931518555, -18.15485382080078, -17.70712661743164, -17.2593994140625, -16.81167221069336, -16.36394500732422, -15.916216850280762, -15.468488693237305, -15.020761489868164, -14.573033332824707, -14.12530517578125, -13.67757797241211, -13.229848861694336, -12.782120704650879, -12.334393501281738, -11.886665344238281, -11.43893814086914, -10.991209983825684, -10.543481826782227, -10.095754623413086, -9.648026466369629, -9.200298309326172, -8.752571105957031, -8.304842948913574, -7.857115268707275, -7.409387588500977, -6.9616594314575195, -6.513931751251221, -6.066204071044922, -5.618476390838623, -5.170748710632324, -4.723020553588867, -4.275292873382568, -3.8275651931762695, -3.3798372745513916, -2.9321093559265137, -2.484381675720215, -2.036653995513916, -1.588926076889038, -1.1411982774734497, -0.6934704780578613, -0.2457427978515625, 0.20198512077331543, 0.6497130393981934, 1.0974407196044922, 1.5451685190200806, 1.992896318435669, 2.440624237060547, 2.8883519172668457, 3.3360795974731445, 3.7838075160980225, 4.2315354347229, 4.679263114929199, 5.126990795135498, 5.574718475341797, 6.022446632385254, 6.470174312591553, 6.917901992797852, 7.365630149841309, 7.813357830047607, 8.261085510253906]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 9.0, 5.0, 9.0, 2.0, 20.0, 13.0, 18.0, 15.0, 23.0, 23.0, 23.0, 27.0, 30.0, 48.0, 41.0, 31.0, 48.0, 46.0, 46.0, 55.0, 39.0, 46.0, 36.0, 35.0, 40.0, 48.0, 27.0, 29.0, 28.0, 23.0, 23.0, 19.0, 18.0, 16.0, 8.0, 9.0, 7.0, 6.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.3596577644348145, -3.239802122116089, -3.1199464797973633, -3.0000905990600586, -2.880234956741333, -2.7603793144226074, -2.640523672103882, -2.5206680297851562, -2.4008121490478516, -2.280956506729126, -2.1611008644104004, -2.0412449836730957, -1.9213893413543701, -1.8015336990356445, -1.681678056716919, -1.5618222951889038, -1.4419666528701782, -1.3221110105514526, -1.2022552490234375, -1.082399606704712, -0.9625438451766968, -0.8426882028579712, -0.7228325009346008, -0.6029767990112305, -0.4831210970878601, -0.36326539516448975, -0.24340970814228058, -0.12355402112007141, -0.00369831919670105, 0.11615735292434692, 0.23601305484771729, 0.35586875677108765, 0.475724458694458, 0.5955801606178284, 0.7154358625411987, 0.8352915048599243, 0.9551472663879395, 1.075002908706665, 1.1948585510253906, 1.3147143125534058, 1.434570074081421, 1.5544257164001465, 1.6742814779281616, 1.7941371202468872, 1.9139928817749023, 2.033848524093628, 2.1537041664123535, 2.273560047149658, 2.3934154510498047, 2.5132710933685303, 2.633126735687256, 2.7529826164245605, 2.872838258743286, 2.9926939010620117, 3.1125495433807373, 3.232405185699463, 3.3522610664367676, 3.472116708755493, 3.5919723510742188, 3.7118282318115234, 3.831683874130249, 3.9515395164489746, 4.071395397186279, 4.191250801086426, 4.3111066818237305]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 5.0, 11.0, 5.0, 10.0, 8.0, 27.0, 32.0, 24.0, 56.0, 67.0, 135.0, 221.0, 341.0, 561.0, 988.0, 1657.0, 3086.0, 5729.0, 12022.0, 27505.0, 74353.0, 375239.0, 3404553.0, 193483.0, 51737.0, 21033.0, 10042.0, 4863.0, 2661.0, 1522.0, 914.0, 471.0, 304.0, 222.0, 121.0, 79.0, 63.0, 30.0, 31.0, 33.0, 13.0, 6.0, 4.0, 9.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80517578125, -0.7794876098632812, -0.7537994384765625, -0.7281112670898438, -0.702423095703125, -0.6767349243164062, -0.6510467529296875, -0.6253585815429688, -0.59967041015625, -0.5739822387695312, -0.5482940673828125, -0.5226058959960938, -0.496917724609375, -0.47122955322265625, -0.4455413818359375, -0.41985321044921875, -0.3941650390625, -0.36847686767578125, -0.3427886962890625, -0.31710052490234375, -0.291412353515625, -0.26572418212890625, -0.2400360107421875, -0.21434783935546875, -0.18865966796875, -0.16297149658203125, -0.1372833251953125, -0.11159515380859375, -0.085906982421875, -0.06021881103515625, -0.0345306396484375, -0.00884246826171875, 0.016845703125, 0.04253387451171875, 0.0682220458984375, 0.09391021728515625, 0.119598388671875, 0.14528656005859375, 0.1709747314453125, 0.19666290283203125, 0.22235107421875, 0.24803924560546875, 0.2737274169921875, 0.29941558837890625, 0.325103759765625, 0.35079193115234375, 0.3764801025390625, 0.40216827392578125, 0.4278564453125, 0.45354461669921875, 0.4792327880859375, 0.5049209594726562, 0.530609130859375, 0.5562973022460938, 0.5819854736328125, 0.6076736450195312, 0.63336181640625, 0.6590499877929688, 0.6847381591796875, 0.7104263305664062, 0.736114501953125, 0.7618026733398438, 0.7874908447265625, 0.8131790161132812, 0.8388671875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 3.0, 4.0, 12.0, 14.0, 6.0, 12.0, 22.0, 17.0, 18.0, 23.0, 41.0, 35.0, 50.0, 68.0, 51.0, 57.0, 67.0, 57.0, 63.0, 64.0, 40.0, 47.0, 33.0, 35.0, 28.0, 25.0, 27.0, 14.0, 17.0, 13.0, 6.0, 9.0, 7.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2149658203125, -0.20843887329101562, -0.20191192626953125, -0.19538497924804688, -0.1888580322265625, -0.18233108520507812, -0.17580413818359375, -0.16927719116210938, -0.162750244140625, -0.15622329711914062, -0.14969635009765625, -0.14316940307617188, -0.1366424560546875, -0.13011550903320312, -0.12358856201171875, -0.11706161499023438, -0.11053466796875, -0.10400772094726562, -0.09748077392578125, -0.09095382690429688, -0.0844268798828125, -0.07789993286132812, -0.07137298583984375, -0.06484603881835938, -0.058319091796875, -0.051792144775390625, -0.04526519775390625, -0.038738250732421875, -0.0322113037109375, -0.025684356689453125, -0.01915740966796875, -0.012630462646484375, -0.006103515625, 0.000423431396484375, 0.00695037841796875, 0.013477325439453125, 0.0200042724609375, 0.026531219482421875, 0.03305816650390625, 0.039585113525390625, 0.046112060546875, 0.052639007568359375, 0.05916595458984375, 0.06569290161132812, 0.0722198486328125, 0.07874679565429688, 0.08527374267578125, 0.09180068969726562, 0.09832763671875, 0.10485458374023438, 0.11138153076171875, 0.11790847778320312, 0.1244354248046875, 0.13096237182617188, 0.13748931884765625, 0.14401626586914062, 0.150543212890625, 0.15707015991210938, 0.16359710693359375, 0.17012405395507812, 0.1766510009765625, 0.18317794799804688, 0.18970489501953125, 0.19623184204101562, 0.2027587890625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 7.0, 17.0, 15.0, 34.0, 44.0, 58.0, 112.0, 179.0, 260.0, 449.0, 775.0, 1407.0, 2675.0, 5217.0, 11943.0, 31698.0, 124015.0, 2944289.0, 936495.0, 89112.0, 25437.0, 10022.0, 4560.0, 2355.0, 1291.0, 697.0, 389.0, 255.0, 169.0, 115.0, 70.0, 46.0, 23.0, 20.0, 7.0, 8.0, 9.0, 5.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.076171875, -1.0444259643554688, -1.0126800537109375, -0.9809341430664062, -0.949188232421875, -0.9174423217773438, -0.8856964111328125, -0.8539505004882812, -0.82220458984375, -0.7904586791992188, -0.7587127685546875, -0.7269668579101562, -0.695220947265625, -0.6634750366210938, -0.6317291259765625, -0.5999832153320312, -0.5682373046875, -0.5364913940429688, -0.5047454833984375, -0.47299957275390625, -0.441253662109375, -0.40950775146484375, -0.3777618408203125, -0.34601593017578125, -0.31427001953125, -0.28252410888671875, -0.2507781982421875, -0.21903228759765625, -0.187286376953125, -0.15554046630859375, -0.1237945556640625, -0.09204864501953125, -0.060302734375, -0.02855682373046875, 0.0031890869140625, 0.03493499755859375, 0.066680908203125, 0.09842681884765625, 0.1301727294921875, 0.16191864013671875, 0.19366455078125, 0.22541046142578125, 0.2571563720703125, 0.28890228271484375, 0.320648193359375, 0.35239410400390625, 0.3841400146484375, 0.41588592529296875, 0.4476318359375, 0.47937774658203125, 0.5111236572265625, 0.5428695678710938, 0.574615478515625, 0.6063613891601562, 0.6381072998046875, 0.6698532104492188, 0.70159912109375, 0.7333450317382812, 0.7650909423828125, 0.7968368530273438, 0.828582763671875, 0.8603286743164062, 0.8920745849609375, 0.9238204956054688, 0.95556640625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 8.0, 5.0, 4.0, 7.0, 11.0, 20.0, 25.0, 33.0, 47.0, 77.0, 147.0, 306.0, 1121.0, 1627.0, 288.0, 137.0, 68.0, 49.0, 27.0, 19.0, 11.0, 11.0, 9.0, 6.0, 8.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.441162109375, -0.4254493713378906, -0.40973663330078125, -0.3940238952636719, -0.3783111572265625, -0.3625984191894531, -0.34688568115234375, -0.3311729431152344, -0.315460205078125, -0.2997474670410156, -0.28403472900390625, -0.2683219909667969, -0.2526092529296875, -0.23689651489257812, -0.22118377685546875, -0.20547103881835938, -0.18975830078125, -0.17404556274414062, -0.15833282470703125, -0.14262008666992188, -0.1269073486328125, -0.11119461059570312, -0.09548187255859375, -0.07976913452148438, -0.064056396484375, -0.048343658447265625, -0.03263092041015625, -0.016918182373046875, -0.0012054443359375, 0.014507293701171875, 0.03022003173828125, 0.045932769775390625, 0.0616455078125, 0.07735824584960938, 0.09307098388671875, 0.10878372192382812, 0.1244964599609375, 0.14020919799804688, 0.15592193603515625, 0.17163467407226562, 0.187347412109375, 0.20306015014648438, 0.21877288818359375, 0.23448562622070312, 0.2501983642578125, 0.2659111022949219, 0.28162384033203125, 0.2973365783691406, 0.31304931640625, 0.3287620544433594, 0.34447479248046875, 0.3601875305175781, 0.3759002685546875, 0.3916130065917969, 0.40732574462890625, 0.4230384826660156, 0.438751220703125, 0.4544639587402344, 0.47017669677734375, 0.4858894348144531, 0.5016021728515625, 0.5173149108886719, 0.5330276489257812, 0.5487403869628906, 0.564453125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 12.0, 20.0, 66.0, 86.0, 119.0, 166.0, 166.0, 139.0, 105.0, 52.0, 28.0, 18.0, 8.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8368101119995117, -3.7227165699005127, -3.6086230278015137, -3.4945294857025146, -3.3804359436035156, -3.2663421630859375, -3.1522486209869385, -3.0381550788879395, -2.9240615367889404, -2.8099679946899414, -2.6958744525909424, -2.5817809104919434, -2.4676871299743652, -2.3535938262939453, -2.239500045776367, -2.125406503677368, -2.011312961578369, -1.8972194194793701, -1.783125877380371, -1.6690322160720825, -1.5549386739730835, -1.4408451318740845, -1.326751470565796, -1.2126579284667969, -1.0985643863677979, -0.9844708442687988, -0.870377242565155, -0.7562836408615112, -0.6421900987625122, -0.5280965566635132, -0.4140029549598694, -0.2999093532562256, -0.18581557273864746, -0.07172200083732605, 0.04237157106399536, 0.15646514296531677, 0.2705587148666382, 0.3846522569656372, 0.498745858669281, 0.6128394603729248, 0.7269330024719238, 0.8410265445709229, 0.9551201462745667, 1.0692137479782104, 1.1833072900772095, 1.2974008321762085, 1.411494493484497, 1.525588035583496, 1.6396815776824951, 1.7537751197814941, 1.8678686618804932, 1.9819623231887817, 2.0960559844970703, 2.2101492881774902, 2.3242430686950684, 2.4383366107940674, 2.5524301528930664, 2.6665236949920654, 2.7806172370910645, 2.8947107791900635, 3.0088043212890625, 3.1228981018066406, 3.2369916439056396, 3.3510851860046387, 3.4651787281036377]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 1.0, 6.0, 7.0, 8.0, 4.0, 11.0, 15.0, 18.0, 17.0, 25.0, 27.0, 16.0, 34.0, 43.0, 32.0, 30.0, 37.0, 42.0, 28.0, 49.0, 54.0, 46.0, 46.0, 41.0, 44.0, 39.0, 34.0, 30.0, 29.0, 33.0, 22.0, 27.0, 19.0, 20.0, 20.0, 9.0, 12.0, 8.0, 6.0, 5.0, 1.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.5805082321166992, -1.5368040800094604, -1.4931000471115112, -1.4493958950042725, -1.4056917428970337, -1.361987590789795, -1.3182835578918457, -1.274579405784607, -1.2308752536773682, -1.1871711015701294, -1.1434670686721802, -1.0997629165649414, -1.0560587644577026, -1.0123546123504639, -0.9686505794525146, -0.9249464273452759, -0.8812423944473267, -0.8375383019447327, -0.7938341498374939, -0.7501300573348999, -0.7064259052276611, -0.6627218127250671, -0.6190177202224731, -0.5753135681152344, -0.5316094756126404, -0.487905353307724, -0.4442012310028076, -0.4004971385002136, -0.35679301619529724, -0.31308889389038086, -0.26938480138778687, -0.22568067908287048, -0.1819765567779541, -0.13827243447303772, -0.09456832706928253, -0.050864219665527344, -0.007160097360610962, 0.03654402494430542, 0.08024811744689941, 0.1239522397518158, 0.16765636205673218, 0.21136048436164856, 0.25506460666656494, 0.29876869916915894, 0.3424728214740753, 0.3861769437789917, 0.4298810362815857, 0.4735851585865021, 0.5172892808914185, 0.5609933733940125, 0.6046975255012512, 0.6484016180038452, 0.692105770111084, 0.735809862613678, 0.779513955116272, 0.8232181072235107, 0.8669221997261047, 0.9106262922286987, 0.9543304443359375, 0.9980345368385315, 1.0417386293411255, 1.0854427814483643, 1.1291468143463135, 1.1728509664535522, 1.216555118560791]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 7.0, 4.0, 5.0, 6.0, 9.0, 8.0, 14.0, 22.0, 18.0, 23.0, 35.0, 64.0, 85.0, 117.0, 153.0, 269.0, 442.0, 708.0, 1220.0, 2320.0, 4180.0, 7684.0, 15031.0, 30029.0, 68012.0, 297630.0, 451774.0, 93480.0, 36320.0, 18109.0, 9245.0, 5106.0, 2695.0, 1462.0, 870.0, 499.0, 311.0, 191.0, 126.0, 101.0, 42.0, 33.0, 28.0, 21.0, 23.0, 7.0, 8.0, 7.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.7392578125, -0.7162551879882812, -0.6932525634765625, -0.6702499389648438, -0.647247314453125, -0.6242446899414062, -0.6012420654296875, -0.5782394409179688, -0.55523681640625, -0.5322341918945312, -0.5092315673828125, -0.48622894287109375, -0.463226318359375, -0.44022369384765625, -0.4172210693359375, -0.39421844482421875, -0.3712158203125, -0.34821319580078125, -0.3252105712890625, -0.30220794677734375, -0.279205322265625, -0.25620269775390625, -0.2332000732421875, -0.21019744873046875, -0.18719482421875, -0.16419219970703125, -0.1411895751953125, -0.11818695068359375, -0.095184326171875, -0.07218170166015625, -0.0491790771484375, -0.02617645263671875, -0.003173828125, 0.01982879638671875, 0.0428314208984375, 0.06583404541015625, 0.088836669921875, 0.11183929443359375, 0.1348419189453125, 0.15784454345703125, 0.18084716796875, 0.20384979248046875, 0.2268524169921875, 0.24985504150390625, 0.272857666015625, 0.29586029052734375, 0.3188629150390625, 0.34186553955078125, 0.3648681640625, 0.38787078857421875, 0.4108734130859375, 0.43387603759765625, 0.456878662109375, 0.47988128662109375, 0.5028839111328125, 0.5258865356445312, 0.54888916015625, 0.5718917846679688, 0.5948944091796875, 0.6178970336914062, 0.640899658203125, 0.6639022827148438, 0.6869049072265625, 0.7099075317382812, 0.73291015625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 5.0, 9.0, 7.0, 9.0, 12.0, 10.0, 17.0, 19.0, 14.0, 31.0, 22.0, 33.0, 40.0, 49.0, 43.0, 67.0, 65.0, 52.0, 46.0, 47.0, 64.0, 48.0, 43.0, 30.0, 30.0, 28.0, 33.0, 24.0, 29.0, 16.0, 14.0, 14.0, 11.0, 6.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2091064453125, -0.20276832580566406, -0.19643020629882812, -0.1900920867919922, -0.18375396728515625, -0.1774158477783203, -0.17107772827148438, -0.16473960876464844, -0.1584014892578125, -0.15206336975097656, -0.14572525024414062, -0.1393871307373047, -0.13304901123046875, -0.1267108917236328, -0.12037277221679688, -0.11403465270996094, -0.107696533203125, -0.10135841369628906, -0.09502029418945312, -0.08868217468261719, -0.08234405517578125, -0.07600593566894531, -0.06966781616210938, -0.06332969665527344, -0.0569915771484375, -0.05065345764160156, -0.044315338134765625, -0.03797721862792969, -0.03163909912109375, -0.025300979614257812, -0.018962860107421875, -0.012624740600585938, -0.00628662109375, 5.14984130859375e-05, 0.006389617919921875, 0.012727737426757812, 0.01906585693359375, 0.025403976440429688, 0.031742095947265625, 0.03808021545410156, 0.0444183349609375, 0.05075645446777344, 0.057094573974609375, 0.06343269348144531, 0.06977081298828125, 0.07610893249511719, 0.08244705200195312, 0.08878517150878906, 0.095123291015625, 0.10146141052246094, 0.10779953002929688, 0.11413764953613281, 0.12047576904296875, 0.1268138885498047, 0.13315200805664062, 0.13949012756347656, 0.1458282470703125, 0.15216636657714844, 0.15850448608398438, 0.1648426055908203, 0.17118072509765625, 0.1775188446044922, 0.18385696411132812, 0.19019508361816406, 0.196533203125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 4.0, 7.0, 12.0, 17.0, 12.0, 35.0, 42.0, 62.0, 84.0, 118.0, 189.0, 352.0, 674.0, 1308.0, 2865.0, 6974.0, 17620.0, 46585.0, 239214.0, 616334.0, 72534.0, 25656.0, 10088.0, 3960.0, 1795.0, 888.0, 431.0, 234.0, 147.0, 104.0, 59.0, 47.0, 27.0, 16.0, 16.0, 14.0, 7.0, 4.0, 4.0, 1.0, 2.0, 6.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.97705078125, -0.9457321166992188, -0.9144134521484375, -0.8830947875976562, -0.851776123046875, -0.8204574584960938, -0.7891387939453125, -0.7578201293945312, -0.72650146484375, -0.6951828002929688, -0.6638641357421875, -0.6325454711914062, -0.601226806640625, -0.5699081420898438, -0.5385894775390625, -0.5072708129882812, -0.4759521484375, -0.44463348388671875, -0.4133148193359375, -0.38199615478515625, -0.350677490234375, -0.31935882568359375, -0.2880401611328125, -0.25672149658203125, -0.22540283203125, -0.19408416748046875, -0.1627655029296875, -0.13144683837890625, -0.100128173828125, -0.06880950927734375, -0.0374908447265625, -0.00617218017578125, 0.025146484375, 0.05646514892578125, 0.0877838134765625, 0.11910247802734375, 0.150421142578125, 0.18173980712890625, 0.2130584716796875, 0.24437713623046875, 0.27569580078125, 0.30701446533203125, 0.3383331298828125, 0.36965179443359375, 0.400970458984375, 0.43228912353515625, 0.4636077880859375, 0.49492645263671875, 0.5262451171875, 0.5575637817382812, 0.5888824462890625, 0.6202011108398438, 0.651519775390625, 0.6828384399414062, 0.7141571044921875, 0.7454757690429688, 0.77679443359375, 0.8081130981445312, 0.8394317626953125, 0.8707504272460938, 0.902069091796875, 0.9333877563476562, 0.9647064208984375, 0.9960250854492188, 1.02734375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 4.0, 9.0, 11.0, 8.0, 24.0, 16.0, 32.0, 30.0, 36.0, 40.0, 59.0, 71.0, 61.0, 80.0, 68.0, 58.0, 76.0, 66.0, 45.0, 42.0, 43.0, 19.0, 29.0, 15.0, 11.0, 9.0, 10.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.099609375, -1.061920166015625, -1.02423095703125, -0.986541748046875, -0.9488525390625, -0.911163330078125, -0.87347412109375, -0.835784912109375, -0.798095703125, -0.760406494140625, -0.72271728515625, -0.685028076171875, -0.6473388671875, -0.609649658203125, -0.57196044921875, -0.534271240234375, -0.49658203125, -0.458892822265625, -0.42120361328125, -0.383514404296875, -0.3458251953125, -0.308135986328125, -0.27044677734375, -0.232757568359375, -0.195068359375, -0.157379150390625, -0.11968994140625, -0.082000732421875, -0.0443115234375, -0.006622314453125, 0.03106689453125, 0.068756103515625, 0.1064453125, 0.144134521484375, 0.18182373046875, 0.219512939453125, 0.2572021484375, 0.294891357421875, 0.33258056640625, 0.370269775390625, 0.407958984375, 0.445648193359375, 0.48333740234375, 0.521026611328125, 0.5587158203125, 0.596405029296875, 0.63409423828125, 0.671783447265625, 0.70947265625, 0.747161865234375, 0.78485107421875, 0.822540283203125, 0.8602294921875, 0.897918701171875, 0.93560791015625, 0.973297119140625, 1.010986328125, 1.048675537109375, 1.08636474609375, 1.124053955078125, 1.1617431640625, 1.199432373046875, 1.23712158203125, 1.274810791015625, 1.3125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 3.0, 2.0, 7.0, 13.0, 17.0, 14.0, 18.0, 29.0, 44.0, 76.0, 134.0, 243.0, 475.0, 853.0, 1754.0, 3641.0, 8097.0, 21505.0, 82183.0, 554608.0, 298635.0, 49749.0, 14762.0, 6032.0, 2703.0, 1370.0, 678.0, 349.0, 195.0, 125.0, 80.0, 41.0, 24.0, 22.0, 22.0, 15.0, 6.0, 8.0, 8.0, 5.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43408203125, -0.4200019836425781, -0.40592193603515625, -0.3918418884277344, -0.3777618408203125, -0.3636817932128906, -0.34960174560546875, -0.3355216979980469, -0.321441650390625, -0.3073616027832031, -0.29328155517578125, -0.2792015075683594, -0.2651214599609375, -0.2510414123535156, -0.23696136474609375, -0.22288131713867188, -0.20880126953125, -0.19472122192382812, -0.18064117431640625, -0.16656112670898438, -0.1524810791015625, -0.13840103149414062, -0.12432098388671875, -0.11024093627929688, -0.096160888671875, -0.08208084106445312, -0.06800079345703125, -0.053920745849609375, -0.0398406982421875, -0.025760650634765625, -0.01168060302734375, 0.002399444580078125, 0.0164794921875, 0.030559539794921875, 0.04463958740234375, 0.058719635009765625, 0.0727996826171875, 0.08687973022460938, 0.10095977783203125, 0.11503982543945312, 0.129119873046875, 0.14319992065429688, 0.15727996826171875, 0.17136001586914062, 0.1854400634765625, 0.19952011108398438, 0.21360015869140625, 0.22768020629882812, 0.24176025390625, 0.2558403015136719, 0.26992034912109375, 0.2840003967285156, 0.2980804443359375, 0.3121604919433594, 0.32624053955078125, 0.3403205871582031, 0.354400634765625, 0.3684806823730469, 0.38256072998046875, 0.3966407775878906, 0.4107208251953125, 0.4248008728027344, 0.43888092041015625, 0.4529609680175781, 0.467041015625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 7.0, 6.0, 11.0, 9.0, 10.0, 27.0, 40.0, 62.0, 77.0, 134.0, 172.0, 157.0, 111.0, 63.0, 45.0, 23.0, 23.0, 9.0, 3.0, 4.0, 4.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001748800277709961, -0.00017011351883411407, -0.00016534700989723206, -0.00016058050096035004, -0.00015581399202346802, -0.000151047483086586, -0.00014628097414970398, -0.00014151446521282196, -0.00013674795627593994, -0.00013198144733905792, -0.0001272149384021759, -0.00012244842946529388, -0.00011768192052841187, -0.00011291541159152985, -0.00010814890265464783, -0.00010338239371776581, -9.861588478088379e-05, -9.384937584400177e-05, -8.908286690711975e-05, -8.431635797023773e-05, -7.954984903335571e-05, -7.47833400964737e-05, -7.001683115959167e-05, -6.525032222270966e-05, -6.048381328582764e-05, -5.571730434894562e-05, -5.09507954120636e-05, -4.618428647518158e-05, -4.141777753829956e-05, -3.665126860141754e-05, -3.188475966453552e-05, -2.7118250727653503e-05, -2.2351741790771484e-05, -1.7585232853889465e-05, -1.2818723917007446e-05, -8.052214980125427e-06, -3.285706043243408e-06, 1.4808028936386108e-06, 6.24731183052063e-06, 1.1013820767402649e-05, 1.5780329704284668e-05, 2.0546838641166687e-05, 2.5313347578048706e-05, 3.0079856514930725e-05, 3.4846365451812744e-05, 3.961287438869476e-05, 4.437938332557678e-05, 4.91458922624588e-05, 5.391240119934082e-05, 5.867891013622284e-05, 6.344541907310486e-05, 6.821192800998688e-05, 7.29784369468689e-05, 7.774494588375092e-05, 8.251145482063293e-05, 8.727796375751495e-05, 9.204447269439697e-05, 9.681098163127899e-05, 0.00010157749056816101, 0.00010634399950504303, 0.00011111050844192505, 0.00011587701737880707, 0.00012064352631568909, 0.0001254100352525711, 0.00013017654418945312]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 8.0, 12.0, 17.0, 19.0, 30.0, 47.0, 85.0, 133.0, 275.0, 563.0, 1304.0, 3701.0, 16143.0, 256115.0, 734797.0, 26928.0, 5291.0, 1711.0, 626.0, 328.0, 167.0, 77.0, 65.0, 48.0, 19.0, 14.0, 4.0, 9.0, 6.0, 3.0, 7.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0009765625, -0.9677581787109375, -0.934539794921875, -0.9013214111328125, -0.86810302734375, -0.8348846435546875, -0.801666259765625, -0.7684478759765625, -0.7352294921875, -0.7020111083984375, -0.668792724609375, -0.6355743408203125, -0.60235595703125, -0.5691375732421875, -0.535919189453125, -0.5027008056640625, -0.469482421875, -0.4362640380859375, -0.403045654296875, -0.3698272705078125, -0.33660888671875, -0.3033905029296875, -0.270172119140625, -0.2369537353515625, -0.2037353515625, -0.1705169677734375, -0.137298583984375, -0.1040802001953125, -0.07086181640625, -0.0376434326171875, -0.004425048828125, 0.0287933349609375, 0.06201171875, 0.0952301025390625, 0.128448486328125, 0.1616668701171875, 0.19488525390625, 0.2281036376953125, 0.261322021484375, 0.2945404052734375, 0.3277587890625, 0.3609771728515625, 0.394195556640625, 0.4274139404296875, 0.46063232421875, 0.4938507080078125, 0.527069091796875, 0.5602874755859375, 0.593505859375, 0.6267242431640625, 0.659942626953125, 0.6931610107421875, 0.72637939453125, 0.7595977783203125, 0.792816162109375, 0.8260345458984375, 0.8592529296875, 0.8924713134765625, 0.925689697265625, 0.9589080810546875, 0.99212646484375, 1.0253448486328125, 1.058563232421875, 1.0917816162109375, 1.125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 2.0, 6.0, 4.0, 3.0, 19.0, 10.0, 28.0, 29.0, 53.0, 83.0, 144.0, 177.0, 157.0, 107.0, 65.0, 35.0, 18.0, 19.0, 5.0, 11.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.779296875, -0.7609519958496094, -0.7426071166992188, -0.7242622375488281, -0.7059173583984375, -0.6875724792480469, -0.6692276000976562, -0.6508827209472656, -0.632537841796875, -0.6141929626464844, -0.5958480834960938, -0.5775032043457031, -0.5591583251953125, -0.5408134460449219, -0.5224685668945312, -0.5041236877441406, -0.48577880859375, -0.4674339294433594, -0.44908905029296875, -0.4307441711425781, -0.4123992919921875, -0.3940544128417969, -0.37570953369140625, -0.3573646545410156, -0.339019775390625, -0.3206748962402344, -0.30233001708984375, -0.2839851379394531, -0.2656402587890625, -0.24729537963867188, -0.22895050048828125, -0.21060562133789062, -0.1922607421875, -0.17391586303710938, -0.15557098388671875, -0.13722610473632812, -0.1188812255859375, -0.10053634643554688, -0.08219146728515625, -0.06384658813476562, -0.045501708984375, -0.027156829833984375, -0.00881195068359375, 0.009532928466796875, 0.0278778076171875, 0.046222686767578125, 0.06456756591796875, 0.08291244506835938, 0.10125732421875, 0.11960220336914062, 0.13794708251953125, 0.15629196166992188, 0.1746368408203125, 0.19298171997070312, 0.21132659912109375, 0.22967147827148438, 0.248016357421875, 0.2663612365722656, 0.28470611572265625, 0.3030509948730469, 0.3213958740234375, 0.3397407531738281, 0.35808563232421875, 0.3764305114746094, 0.394775390625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 9.0, 33.0, 198.0, 446.0, 269.0, 52.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.475545883178711, -12.710570335388184, -11.945594787597656, -11.180619239807129, -10.415643692016602, -9.650668144226074, -8.885692596435547, -8.12071704864502, -7.355741500854492, -6.590765953063965, -5.8257904052734375, -5.06081485748291, -4.295839309692383, -3.5308637619018555, -2.765888214111328, -2.000912666320801, -1.2359371185302734, -0.4709615707397461, 0.29401397705078125, 1.0589895248413086, 1.823965072631836, 2.5889406204223633, 3.3539161682128906, 4.118891716003418, 4.883867263793945, 5.648842811584473, 6.413818359375, 7.178793907165527, 7.943769454956055, 8.708745002746582, 9.47372055053711, 10.238696098327637, 11.003669738769531, 11.768645286560059, 12.533620834350586, 13.298596382141113, 14.06357192993164, 14.828547477722168, 15.593523025512695, 16.358497619628906, 17.12347412109375, 17.888450622558594, 18.653425216674805, 19.418399810791016, 20.18337631225586, 20.948352813720703, 21.713327407836914, 22.478302001953125, 23.24327850341797, 24.008255004882812, 24.773229598999023, 25.538204193115234, 26.303180694580078, 27.068157196044922, 27.833131790161133, 28.598106384277344, 29.363082885742188, 30.12805938720703, 30.893033981323242, 31.658008575439453, 32.4229850769043, 33.18796157836914, 33.95293426513672, 34.71791076660156, 35.482887268066406]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 8.0, 2.0, 8.0, 7.0, 13.0, 12.0, 12.0, 9.0, 19.0, 19.0, 27.0, 22.0, 31.0, 25.0, 42.0, 24.0, 31.0, 30.0, 40.0, 53.0, 33.0, 40.0, 37.0, 37.0, 35.0, 41.0, 36.0, 34.0, 36.0, 31.0, 26.0, 20.0, 17.0, 24.0, 25.0, 13.0, 19.0, 9.0, 10.0, 11.0, 6.0, 7.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0], "bins": [-3.937411308288574, -3.823683977127075, -3.709956407546997, -3.596229076385498, -3.482501745223999, -3.368774175643921, -3.255046844482422, -3.1413192749023438, -3.0275919437408447, -2.9138646125793457, -2.8001370429992676, -2.6864097118377686, -2.5726823806762695, -2.4589548110961914, -2.3452274799346924, -2.2315001487731934, -2.1177725791931152, -2.004045248031616, -1.8903177976608276, -1.776590347290039, -1.6628628969192505, -1.549135446548462, -1.435408115386963, -1.3216806650161743, -1.2079534530639648, -1.0942260026931763, -0.9804986119270325, -0.8667712211608887, -0.7530437707901001, -0.6393163800239563, -0.5255889892578125, -0.4118615388870239, -0.29813408851623535, -0.18440666794776917, -0.07067926228046417, 0.04304814338684082, 0.156775563955307, 0.2705029845237732, 0.384230375289917, 0.49795782566070557, 0.6116852164268494, 0.7254126071929932, 0.8391400575637817, 0.9528674483299255, 1.0665948390960693, 1.180322289466858, 1.2940497398376465, 1.4077770709991455, 1.521504521369934, 1.6352319717407227, 1.7489593029022217, 1.8626867532730103, 1.9764142036437988, 2.090141534805298, 2.203868865966797, 2.317596435546875, 2.431323766708374, 2.545051097869873, 2.658778667449951, 2.77250599861145, 2.886233329772949, 2.9999608993530273, 3.1136882305145264, 3.2274155616760254, 3.3411431312561035]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 8.0, 4.0, 13.0, 11.0, 36.0, 55.0, 74.0, 117.0, 191.0, 320.0, 487.0, 845.0, 1483.0, 3053.0, 6009.0, 12458.0, 30109.0, 91436.0, 855775.0, 3017956.0, 111066.0, 34155.0, 14183.0, 6780.0, 3342.0, 1792.0, 973.0, 609.0, 353.0, 190.0, 145.0, 91.0, 49.0, 41.0, 25.0, 15.0, 10.0, 4.0, 7.0, 6.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0966796875, -1.060211181640625, -1.02374267578125, -0.987274169921875, -0.9508056640625, -0.914337158203125, -0.87786865234375, -0.841400146484375, -0.804931640625, -0.768463134765625, -0.73199462890625, -0.695526123046875, -0.6590576171875, -0.622589111328125, -0.58612060546875, -0.549652099609375, -0.51318359375, -0.476715087890625, -0.44024658203125, -0.403778076171875, -0.3673095703125, -0.330841064453125, -0.29437255859375, -0.257904052734375, -0.221435546875, -0.184967041015625, -0.14849853515625, -0.112030029296875, -0.0755615234375, -0.039093017578125, -0.00262451171875, 0.033843994140625, 0.0703125, 0.106781005859375, 0.14324951171875, 0.179718017578125, 0.2161865234375, 0.252655029296875, 0.28912353515625, 0.325592041015625, 0.362060546875, 0.398529052734375, 0.43499755859375, 0.471466064453125, 0.5079345703125, 0.544403076171875, 0.58087158203125, 0.617340087890625, 0.65380859375, 0.690277099609375, 0.72674560546875, 0.763214111328125, 0.7996826171875, 0.836151123046875, 0.87261962890625, 0.909088134765625, 0.945556640625, 0.982025146484375, 1.01849365234375, 1.054962158203125, 1.0914306640625, 1.127899169921875, 1.16436767578125, 1.200836181640625, 1.2373046875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 4.0, 3.0, 6.0, 12.0, 10.0, 9.0, 19.0, 22.0, 20.0, 17.0, 26.0, 30.0, 33.0, 47.0, 65.0, 46.0, 47.0, 60.0, 53.0, 54.0, 60.0, 50.0, 33.0, 29.0, 25.0, 45.0, 31.0, 32.0, 15.0, 21.0, 15.0, 11.0, 8.0, 7.0, 8.0, 9.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2181396484375, -0.2117900848388672, -0.20544052124023438, -0.19909095764160156, -0.19274139404296875, -0.18639183044433594, -0.18004226684570312, -0.1736927032470703, -0.1673431396484375, -0.1609935760498047, -0.15464401245117188, -0.14829444885253906, -0.14194488525390625, -0.13559532165527344, -0.12924575805664062, -0.12289619445800781, -0.116546630859375, -0.11019706726074219, -0.10384750366210938, -0.09749794006347656, -0.09114837646484375, -0.08479881286621094, -0.07844924926757812, -0.07209968566894531, -0.0657501220703125, -0.05940055847167969, -0.053050994873046875, -0.04670143127441406, -0.04035186767578125, -0.03400230407714844, -0.027652740478515625, -0.021303176879882812, -0.01495361328125, -0.008604049682617188, -0.002254486083984375, 0.0040950775146484375, 0.01044464111328125, 0.016794204711914062, 0.023143768310546875, 0.029493331909179688, 0.0358428955078125, 0.04219245910644531, 0.048542022705078125, 0.05489158630371094, 0.06124114990234375, 0.06759071350097656, 0.07394027709960938, 0.08028984069824219, 0.086639404296875, 0.09298896789550781, 0.09933853149414062, 0.10568809509277344, 0.11203765869140625, 0.11838722229003906, 0.12473678588867188, 0.1310863494873047, 0.1374359130859375, 0.1437854766845703, 0.15013504028320312, 0.15648460388183594, 0.16283416748046875, 0.16918373107910156, 0.17553329467773438, 0.1818828582763672, 0.188232421875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 3.0, 8.0, 11.0, 30.0, 37.0, 40.0, 65.0, 104.0, 141.0, 246.0, 364.0, 568.0, 975.0, 1717.0, 3199.0, 6827.0, 17280.0, 53633.0, 301625.0, 3563438.0, 177525.0, 40352.0, 13840.0, 5613.0, 2688.0, 1508.0, 832.0, 521.0, 337.0, 240.0, 144.0, 112.0, 76.0, 49.0, 25.0, 33.0, 20.0, 12.0, 11.0, 9.0, 6.0, 1.0, 5.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3564453125, -1.311798095703125, -1.26715087890625, -1.222503662109375, -1.1778564453125, -1.133209228515625, -1.08856201171875, -1.043914794921875, -0.999267578125, -0.954620361328125, -0.90997314453125, -0.865325927734375, -0.8206787109375, -0.776031494140625, -0.73138427734375, -0.686737060546875, -0.64208984375, -0.597442626953125, -0.55279541015625, -0.508148193359375, -0.4635009765625, -0.418853759765625, -0.37420654296875, -0.329559326171875, -0.284912109375, -0.240264892578125, -0.19561767578125, -0.150970458984375, -0.1063232421875, -0.061676025390625, -0.01702880859375, 0.027618408203125, 0.072265625, 0.116912841796875, 0.16156005859375, 0.206207275390625, 0.2508544921875, 0.295501708984375, 0.34014892578125, 0.384796142578125, 0.429443359375, 0.474090576171875, 0.51873779296875, 0.563385009765625, 0.6080322265625, 0.652679443359375, 0.69732666015625, 0.741973876953125, 0.78662109375, 0.831268310546875, 0.87591552734375, 0.920562744140625, 0.9652099609375, 1.009857177734375, 1.05450439453125, 1.099151611328125, 1.143798828125, 1.188446044921875, 1.23309326171875, 1.277740478515625, 1.3223876953125, 1.367034912109375, 1.41168212890625, 1.456329345703125, 1.5009765625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 7.0, 12.0, 10.0, 21.0, 23.0, 41.0, 67.0, 90.0, 179.0, 588.0, 2270.0, 352.0, 141.0, 86.0, 60.0, 38.0, 24.0, 13.0, 11.0, 11.0, 4.0, 10.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50537109375, -0.48542022705078125, -0.4654693603515625, -0.44551849365234375, -0.425567626953125, -0.40561676025390625, -0.3856658935546875, -0.36571502685546875, -0.34576416015625, -0.32581329345703125, -0.3058624267578125, -0.28591156005859375, -0.265960693359375, -0.24600982666015625, -0.2260589599609375, -0.20610809326171875, -0.1861572265625, -0.16620635986328125, -0.1462554931640625, -0.12630462646484375, -0.106353759765625, -0.08640289306640625, -0.0664520263671875, -0.04650115966796875, -0.02655029296875, -0.00659942626953125, 0.0133514404296875, 0.03330230712890625, 0.053253173828125, 0.07320404052734375, 0.0931549072265625, 0.11310577392578125, 0.133056640625, 0.15300750732421875, 0.1729583740234375, 0.19290924072265625, 0.212860107421875, 0.23281097412109375, 0.2527618408203125, 0.27271270751953125, 0.29266357421875, 0.31261444091796875, 0.3325653076171875, 0.35251617431640625, 0.372467041015625, 0.39241790771484375, 0.4123687744140625, 0.43231964111328125, 0.4522705078125, 0.47222137451171875, 0.4921722412109375, 0.5121231079101562, 0.532073974609375, 0.5520248413085938, 0.5719757080078125, 0.5919265747070312, 0.61187744140625, 0.6318283081054688, 0.6517791748046875, 0.6717300415039062, 0.691680908203125, 0.7116317749023438, 0.7315826416015625, 0.7515335083007812, 0.771484375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 4.0, 7.0, 11.0, 24.0, 67.0, 96.0, 173.0, 204.0, 174.0, 114.0, 74.0, 30.0, 12.0, 11.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.65437650680542, -5.490328788757324, -5.32628059387207, -5.162232398986816, -4.998184680938721, -4.834136962890625, -4.670088768005371, -4.506040573120117, -4.3419928550720215, -4.177945137023926, -4.013896942138672, -3.849848985671997, -3.6858010292053223, -3.5217530727386475, -3.3577051162719727, -3.193657159805298, -3.029609203338623, -2.8655612468719482, -2.7015132904052734, -2.5374653339385986, -2.373417377471924, -2.209369421005249, -2.045321464538574, -1.8812735080718994, -1.7172255516052246, -1.5531775951385498, -1.389129638671875, -1.2250816822052002, -1.0610337257385254, -0.8969857692718506, -0.7329378128051758, -0.568889856338501, -0.40484142303466797, -0.24079346656799316, -0.07674551010131836, 0.08730244636535645, 0.25135040283203125, 0.41539835929870605, 0.5794463157653809, 0.7434942722320557, 0.9075422286987305, 1.0715901851654053, 1.23563814163208, 1.3996860980987549, 1.5637340545654297, 1.7277820110321045, 1.8918299674987793, 2.055877923965454, 2.219925880432129, 2.3839738368988037, 2.5480217933654785, 2.7120697498321533, 2.876117706298828, 3.040165662765503, 3.2042136192321777, 3.3682615756988525, 3.5323095321655273, 3.696357488632202, 3.860405445098877, 4.024453163146973, 4.188501358032227, 4.3525495529174805, 4.516597270965576, 4.680644989013672, 4.844693183898926]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 7.0, 5.0, 7.0, 3.0, 12.0, 11.0, 16.0, 19.0, 15.0, 20.0, 25.0, 34.0, 20.0, 34.0, 33.0, 44.0, 33.0, 50.0, 43.0, 57.0, 45.0, 66.0, 64.0, 44.0, 40.0, 41.0, 19.0, 34.0, 32.0, 32.0, 21.0, 14.0, 16.0, 9.0, 9.0, 12.0, 9.0, 6.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.27410888671875, -2.212641954421997, -2.151174783706665, -2.089707851409912, -2.02824068069458, -1.9667736291885376, -1.9053065776824951, -1.8438395261764526, -1.7823724746704102, -1.7209054231643677, -1.6594383716583252, -1.5979713201522827, -1.5365042686462402, -1.4750372171401978, -1.4135701656341553, -1.3521031141281128, -1.2906360626220703, -1.2291690111160278, -1.1677019596099854, -1.1062349081039429, -1.0447678565979004, -0.9833008050918579, -0.9218337535858154, -0.860366702079773, -0.79889976978302, -0.7374327182769775, -0.6759656667709351, -0.6144986152648926, -0.5530315637588501, -0.49156454205513, -0.4300974905490875, -0.36863043904304504, -0.3071633577346802, -0.2456963062286377, -0.18422925472259521, -0.12276221811771393, -0.06129516661167145, 0.00017186999320983887, 0.06163892149925232, 0.1231059730052948, 0.18457302451133728, 0.24604007601737976, 0.30750712752342224, 0.36897414922714233, 0.4304412007331848, 0.4919082522392273, 0.5533753037452698, 0.6148423552513123, 0.6763094067573547, 0.7377764582633972, 0.7992435097694397, 0.8607105612754822, 0.9221776127815247, 0.9836446046829224, 1.0451116561889648, 1.1065787076950073, 1.1680457592010498, 1.2295128107070923, 1.2909798622131348, 1.3524469137191772, 1.4139139652252197, 1.4753810167312622, 1.5368480682373047, 1.5983151197433472, 1.6597821712493896]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 6.0, 1.0, 11.0, 6.0, 17.0, 12.0, 18.0, 30.0, 50.0, 70.0, 102.0, 157.0, 255.0, 445.0, 766.0, 1324.0, 2371.0, 4532.0, 8998.0, 18083.0, 37368.0, 74234.0, 148231.0, 329409.0, 217868.0, 101592.0, 51298.0, 25264.0, 12523.0, 6273.0, 3183.0, 1718.0, 985.0, 500.0, 314.0, 187.0, 118.0, 78.0, 50.0, 37.0, 16.0, 18.0, 16.0, 11.0, 9.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7158203125, -0.691741943359375, -0.66766357421875, -0.643585205078125, -0.6195068359375, -0.595428466796875, -0.57135009765625, -0.547271728515625, -0.523193359375, -0.499114990234375, -0.47503662109375, -0.450958251953125, -0.4268798828125, -0.402801513671875, -0.37872314453125, -0.354644775390625, -0.33056640625, -0.306488037109375, -0.28240966796875, -0.258331298828125, -0.2342529296875, -0.210174560546875, -0.18609619140625, -0.162017822265625, -0.137939453125, -0.113861083984375, -0.08978271484375, -0.065704345703125, -0.0416259765625, -0.017547607421875, 0.00653076171875, 0.030609130859375, 0.0546875, 0.078765869140625, 0.10284423828125, 0.126922607421875, 0.1510009765625, 0.175079345703125, 0.19915771484375, 0.223236083984375, 0.247314453125, 0.271392822265625, 0.29547119140625, 0.319549560546875, 0.3436279296875, 0.367706298828125, 0.39178466796875, 0.415863037109375, 0.43994140625, 0.464019775390625, 0.48809814453125, 0.512176513671875, 0.5362548828125, 0.560333251953125, 0.58441162109375, 0.608489990234375, 0.632568359375, 0.656646728515625, 0.68072509765625, 0.704803466796875, 0.7288818359375, 0.752960205078125, 0.77703857421875, 0.801116943359375, 0.8251953125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 0.0, 5.0, 0.0, 6.0, 4.0, 6.0, 3.0, 7.0, 13.0, 9.0, 12.0, 14.0, 26.0, 31.0, 24.0, 35.0, 33.0, 43.0, 33.0, 46.0, 50.0, 44.0, 51.0, 50.0, 48.0, 51.0, 48.0, 47.0, 38.0, 24.0, 31.0, 29.0, 24.0, 23.0, 22.0, 16.0, 12.0, 13.0, 6.0, 7.0, 3.0, 3.0, 5.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.2303466796875, -0.2235736846923828, -0.21680068969726562, -0.21002769470214844, -0.20325469970703125, -0.19648170471191406, -0.18970870971679688, -0.1829357147216797, -0.1761627197265625, -0.1693897247314453, -0.16261672973632812, -0.15584373474121094, -0.14907073974609375, -0.14229774475097656, -0.13552474975585938, -0.1287517547607422, -0.121978759765625, -0.11520576477050781, -0.10843276977539062, -0.10165977478027344, -0.09488677978515625, -0.08811378479003906, -0.08134078979492188, -0.07456779479980469, -0.0677947998046875, -0.06102180480957031, -0.054248809814453125, -0.04747581481933594, -0.04070281982421875, -0.03392982482910156, -0.027156829833984375, -0.020383834838867188, -0.01361083984375, -0.0068378448486328125, -6.4849853515625e-05, 0.0067081451416015625, 0.01348114013671875, 0.020254135131835938, 0.027027130126953125, 0.03380012512207031, 0.0405731201171875, 0.04734611511230469, 0.054119110107421875, 0.06089210510253906, 0.06766510009765625, 0.07443809509277344, 0.08121109008789062, 0.08798408508300781, 0.094757080078125, 0.10153007507324219, 0.10830307006835938, 0.11507606506347656, 0.12184906005859375, 0.12862205505371094, 0.13539505004882812, 0.1421680450439453, 0.1489410400390625, 0.1557140350341797, 0.16248703002929688, 0.16926002502441406, 0.17603302001953125, 0.18280601501464844, 0.18957901000976562, 0.1963520050048828, 0.203125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 5.0, 6.0, 3.0, 3.0, 4.0, 4.0, 10.0, 11.0, 17.0, 24.0, 28.0, 40.0, 53.0, 77.0, 78.0, 131.0, 180.0, 240.0, 327.0, 493.0, 778.0, 1374.0, 3277.0, 10656.0, 44181.0, 197474.0, 587874.0, 152412.0, 34170.0, 8338.0, 2673.0, 1232.0, 719.0, 468.0, 320.0, 212.0, 144.0, 134.0, 80.0, 76.0, 63.0, 40.0, 32.0, 23.0, 19.0, 13.0, 10.0, 9.0, 5.0, 10.0, 6.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.2001953125, -1.159393310546875, -1.11859130859375, -1.077789306640625, -1.0369873046875, -0.996185302734375, -0.95538330078125, -0.914581298828125, -0.873779296875, -0.832977294921875, -0.79217529296875, -0.751373291015625, -0.7105712890625, -0.669769287109375, -0.62896728515625, -0.588165283203125, -0.54736328125, -0.506561279296875, -0.46575927734375, -0.424957275390625, -0.3841552734375, -0.343353271484375, -0.30255126953125, -0.261749267578125, -0.220947265625, -0.180145263671875, -0.13934326171875, -0.098541259765625, -0.0577392578125, -0.016937255859375, 0.02386474609375, 0.064666748046875, 0.10546875, 0.146270751953125, 0.18707275390625, 0.227874755859375, 0.2686767578125, 0.309478759765625, 0.35028076171875, 0.391082763671875, 0.431884765625, 0.472686767578125, 0.51348876953125, 0.554290771484375, 0.5950927734375, 0.635894775390625, 0.67669677734375, 0.717498779296875, 0.75830078125, 0.799102783203125, 0.83990478515625, 0.880706787109375, 0.9215087890625, 0.962310791015625, 1.00311279296875, 1.043914794921875, 1.084716796875, 1.125518798828125, 1.16632080078125, 1.207122802734375, 1.2479248046875, 1.288726806640625, 1.32952880859375, 1.370330810546875, 1.4111328125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 4.0, 4.0, 7.0, 14.0, 12.0, 10.0, 17.0, 14.0, 29.0, 31.0, 38.0, 40.0, 52.0, 44.0, 52.0, 49.0, 49.0, 60.0, 57.0, 53.0, 54.0, 49.0, 42.0, 37.0, 38.0, 23.0, 29.0, 16.0, 15.0, 9.0, 15.0, 8.0, 8.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.384765625, -1.34344482421875, -1.3021240234375, -1.26080322265625, -1.219482421875, -1.17816162109375, -1.1368408203125, -1.09552001953125, -1.05419921875, -1.01287841796875, -0.9715576171875, -0.93023681640625, -0.888916015625, -0.84759521484375, -0.8062744140625, -0.76495361328125, -0.7236328125, -0.68231201171875, -0.6409912109375, -0.59967041015625, -0.558349609375, -0.51702880859375, -0.4757080078125, -0.43438720703125, -0.39306640625, -0.35174560546875, -0.3104248046875, -0.26910400390625, -0.227783203125, -0.18646240234375, -0.1451416015625, -0.10382080078125, -0.0625, -0.02117919921875, 0.0201416015625, 0.06146240234375, 0.102783203125, 0.14410400390625, 0.1854248046875, 0.22674560546875, 0.26806640625, 0.30938720703125, 0.3507080078125, 0.39202880859375, 0.433349609375, 0.47467041015625, 0.5159912109375, 0.55731201171875, 0.5986328125, 0.63995361328125, 0.6812744140625, 0.72259521484375, 0.763916015625, 0.80523681640625, 0.8465576171875, 0.88787841796875, 0.92919921875, 0.97052001953125, 1.0118408203125, 1.05316162109375, 1.094482421875, 1.13580322265625, 1.1771240234375, 1.21844482421875, 1.259765625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 6.0, 4.0, 2.0, 13.0, 11.0, 14.0, 20.0, 18.0, 29.0, 35.0, 59.0, 90.0, 87.0, 151.0, 274.0, 531.0, 1510.0, 6105.0, 67898.0, 916959.0, 46978.0, 5165.0, 1371.0, 450.0, 241.0, 160.0, 105.0, 69.0, 50.0, 32.0, 31.0, 25.0, 12.0, 15.0, 14.0, 11.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.103515625, -2.03662109375, -1.9697265625, -1.90283203125, -1.8359375, -1.76904296875, -1.7021484375, -1.63525390625, -1.568359375, -1.50146484375, -1.4345703125, -1.36767578125, -1.30078125, -1.23388671875, -1.1669921875, -1.10009765625, -1.033203125, -0.96630859375, -0.8994140625, -0.83251953125, -0.765625, -0.69873046875, -0.6318359375, -0.56494140625, -0.498046875, -0.43115234375, -0.3642578125, -0.29736328125, -0.23046875, -0.16357421875, -0.0966796875, -0.02978515625, 0.037109375, 0.10400390625, 0.1708984375, 0.23779296875, 0.3046875, 0.37158203125, 0.4384765625, 0.50537109375, 0.572265625, 0.63916015625, 0.7060546875, 0.77294921875, 0.83984375, 0.90673828125, 0.9736328125, 1.04052734375, 1.107421875, 1.17431640625, 1.2412109375, 1.30810546875, 1.375, 1.44189453125, 1.5087890625, 1.57568359375, 1.642578125, 1.70947265625, 1.7763671875, 1.84326171875, 1.91015625, 1.97705078125, 2.0439453125, 2.11083984375, 2.177734375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 11.0, 12.0, 20.0, 32.0, 29.0, 61.0, 74.0, 112.0, 164.0, 166.0, 81.0, 45.0, 45.0, 39.0, 27.0, 18.0, 15.0, 11.0, 11.0, 4.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.00017178058624267578, -0.00016698800027370453, -0.00016219541430473328, -0.00015740282833576202, -0.00015261024236679077, -0.00014781765639781952, -0.00014302507042884827, -0.00013823248445987701, -0.00013343989849090576, -0.0001286473125219345, -0.00012385472655296326, -0.000119062140583992, -0.00011426955461502075, -0.0001094769686460495, -0.00010468438267707825, -9.9891796708107e-05, -9.509921073913574e-05, -9.030662477016449e-05, -8.551403880119324e-05, -8.072145283222198e-05, -7.592886686325073e-05, -7.113628089427948e-05, -6.634369492530823e-05, -6.155110895633698e-05, -5.675852298736572e-05, -5.196593701839447e-05, -4.717335104942322e-05, -4.2380765080451965e-05, -3.758817911148071e-05, -3.279559314250946e-05, -2.8003007173538208e-05, -2.3210421204566956e-05, -1.8417835235595703e-05, -1.362524926662445e-05, -8.832663297653198e-06, -4.040077328681946e-06, 7.525086402893066e-07, 5.545094609260559e-06, 1.0337680578231812e-05, 1.5130266547203064e-05, 1.9922852516174316e-05, 2.471543848514557e-05, 2.950802445411682e-05, 3.4300610423088074e-05, 3.9093196392059326e-05, 4.388578236103058e-05, 4.867836833000183e-05, 5.3470954298973083e-05, 5.8263540267944336e-05, 6.305612623691559e-05, 6.784871220588684e-05, 7.26412981748581e-05, 7.743388414382935e-05, 8.22264701128006e-05, 8.701905608177185e-05, 9.18116420507431e-05, 9.660422801971436e-05, 0.00010139681398868561, 0.00010618939995765686, 0.00011098198592662811, 0.00011577457189559937, 0.00012056715786457062, 0.00012535974383354187, 0.00013015232980251312, 0.00013494491577148438]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 1.0, 6.0, 7.0, 4.0, 5.0, 5.0, 6.0, 22.0, 20.0, 26.0, 35.0, 49.0, 81.0, 171.0, 353.0, 793.0, 2083.0, 7725.0, 91505.0, 895804.0, 41437.0, 5468.0, 1634.0, 643.0, 280.0, 118.0, 82.0, 42.0, 29.0, 25.0, 13.0, 16.0, 18.0, 8.0, 10.0, 7.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.8349609375, -1.7725067138671875, -1.710052490234375, -1.6475982666015625, -1.58514404296875, -1.5226898193359375, -1.460235595703125, -1.3977813720703125, -1.3353271484375, -1.2728729248046875, -1.210418701171875, -1.1479644775390625, -1.08551025390625, -1.0230560302734375, -0.960601806640625, -0.8981475830078125, -0.835693359375, -0.7732391357421875, -0.710784912109375, -0.6483306884765625, -0.58587646484375, -0.5234222412109375, -0.460968017578125, -0.3985137939453125, -0.3360595703125, -0.2736053466796875, -0.211151123046875, -0.1486968994140625, -0.08624267578125, -0.0237884521484375, 0.038665771484375, 0.1011199951171875, 0.16357421875, 0.2260284423828125, 0.288482666015625, 0.3509368896484375, 0.41339111328125, 0.4758453369140625, 0.538299560546875, 0.6007537841796875, 0.6632080078125, 0.7256622314453125, 0.788116455078125, 0.8505706787109375, 0.91302490234375, 0.9754791259765625, 1.037933349609375, 1.1003875732421875, 1.162841796875, 1.2252960205078125, 1.287750244140625, 1.3502044677734375, 1.41265869140625, 1.4751129150390625, 1.537567138671875, 1.6000213623046875, 1.6624755859375, 1.7249298095703125, 1.787384033203125, 1.8498382568359375, 1.91229248046875, 1.9747467041015625, 2.037200927734375, 2.0996551513671875, 2.162109375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 3.0, 9.0, 14.0, 24.0, 34.0, 42.0, 100.0, 146.0, 268.0, 130.0, 80.0, 47.0, 24.0, 18.0, 13.0, 9.0, 10.0, 3.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.373046875, -1.33319091796875, -1.2933349609375, -1.25347900390625, -1.213623046875, -1.17376708984375, -1.1339111328125, -1.09405517578125, -1.05419921875, -1.01434326171875, -0.9744873046875, -0.93463134765625, -0.894775390625, -0.85491943359375, -0.8150634765625, -0.77520751953125, -0.7353515625, -0.69549560546875, -0.6556396484375, -0.61578369140625, -0.575927734375, -0.53607177734375, -0.4962158203125, -0.45635986328125, -0.41650390625, -0.37664794921875, -0.3367919921875, -0.29693603515625, -0.257080078125, -0.21722412109375, -0.1773681640625, -0.13751220703125, -0.09765625, -0.05780029296875, -0.0179443359375, 0.02191162109375, 0.061767578125, 0.10162353515625, 0.1414794921875, 0.18133544921875, 0.22119140625, 0.26104736328125, 0.3009033203125, 0.34075927734375, 0.380615234375, 0.42047119140625, 0.4603271484375, 0.50018310546875, 0.5400390625, 0.57989501953125, 0.6197509765625, 0.65960693359375, 0.699462890625, 0.73931884765625, 0.7791748046875, 0.81903076171875, 0.85888671875, 0.89874267578125, 0.9385986328125, 0.97845458984375, 1.018310546875, 1.05816650390625, 1.0980224609375, 1.13787841796875, 1.177734375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 16.0, 29.0, 40.0, 84.0, 160.0, 155.0, 173.0, 135.0, 74.0, 57.0, 33.0, 19.0, 12.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.351655960083008, -12.918238639831543, -12.484822273254395, -12.05140495300293, -11.617987632751465, -11.184571266174316, -10.751153945922852, -10.317737579345703, -9.884320259094238, -9.450902938842773, -9.017486572265625, -8.58406925201416, -8.150651931762695, -7.717235565185547, -7.283818244934082, -6.850401401519775, -6.4169840812683105, -5.983567237854004, -5.550149917602539, -5.116733074188232, -4.683316230773926, -4.249898910522461, -3.8164820671081543, -3.3830652236938477, -2.949648141860962, -2.516231060028076, -2.0828142166137695, -1.6493971347808838, -1.2159801721572876, -0.7825632095336914, -0.34914612770080566, 0.08427071571350098, 0.5176877975463867, 0.9511047601699829, 1.384521722793579, 1.8179388046264648, 2.2513556480407715, 2.6847727298736572, 3.118189811706543, 3.5516066551208496, 3.9850237369537354, 4.418440818786621, 4.851857662200928, 5.285274505615234, 5.718691825866699, 6.152108669281006, 6.5855255126953125, 7.018942832946777, 7.452359676361084, 7.885776519775391, 8.319193840026855, 8.75261116027832, 9.186027526855469, 9.619444847106934, 10.052862167358398, 10.486278533935547, 10.919695854187012, 11.353113174438477, 11.786529541015625, 12.21994686126709, 12.653364181518555, 13.086780548095703, 13.520197868347168, 13.953615188598633, 14.387031555175781]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 1.0, 5.0, 6.0, 4.0, 8.0, 7.0, 18.0, 11.0, 25.0, 22.0, 28.0, 26.0, 21.0, 31.0, 34.0, 51.0, 39.0, 48.0, 43.0, 41.0, 52.0, 55.0, 38.0, 43.0, 44.0, 39.0, 39.0, 32.0, 24.0, 32.0, 21.0, 17.0, 11.0, 17.0, 16.0, 13.0, 8.0, 4.0, 4.0, 6.0, 6.0, 2.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.146567344665527, -5.936808109283447, -5.727048873901367, -5.517289161682129, -5.307529926300049, -5.097770690917969, -4.888011455535889, -4.678252220153809, -4.46849250793457, -4.25873327255249, -4.04897403717041, -3.839214563369751, -3.629455089569092, -3.4196958541870117, -3.2099366188049316, -3.0001771450042725, -2.7904179096221924, -2.5806586742401123, -2.370899200439453, -2.161139965057373, -1.9513804912567139, -1.7416212558746338, -1.5318619012832642, -1.3221025466918945, -1.112343192100525, -0.9025838375091553, -0.6928244829177856, -0.4830651879310608, -0.27330583333969116, -0.06354653835296631, 0.14621281623840332, 0.35597217082977295, 0.5657315254211426, 0.7754908800125122, 0.9852502346038818, 1.195009469985962, 1.404768943786621, 1.6145281791687012, 1.8242875337600708, 2.0340468883514404, 2.2438063621520996, 2.4535655975341797, 2.663325071334839, 2.873084306716919, 3.082843780517578, 3.292603015899658, 3.5023622512817383, 3.7121217250823975, 3.9218809604644775, 4.131640434265137, 4.341399669647217, 4.551158905029297, 4.760918140411377, 4.970677375793457, 5.180437088012695, 5.390196323394775, 5.5999555587768555, 5.8097147941589355, 6.019474029541016, 6.229233741760254, 6.438992977142334, 6.648752212524414, 6.858511447906494, 7.068270683288574, 7.2780303955078125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 10.0, 14.0, 12.0, 27.0, 35.0, 58.0, 69.0, 115.0, 142.0, 255.0, 437.0, 692.0, 1263.0, 2375.0, 4686.0, 10268.0, 24711.0, 72237.0, 357328.0, 3392551.0, 232007.0, 56300.0, 20299.0, 8770.0, 4225.0, 2208.0, 1235.0, 712.0, 424.0, 242.0, 179.0, 116.0, 86.0, 61.0, 45.0, 28.0, 18.0, 11.0, 11.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2197265625, -1.1782379150390625, -1.136749267578125, -1.0952606201171875, -1.05377197265625, -1.0122833251953125, -0.970794677734375, -0.9293060302734375, -0.8878173828125, -0.8463287353515625, -0.804840087890625, -0.7633514404296875, -0.72186279296875, -0.6803741455078125, -0.638885498046875, -0.5973968505859375, -0.555908203125, -0.5144195556640625, -0.472930908203125, -0.4314422607421875, -0.38995361328125, -0.3484649658203125, -0.306976318359375, -0.2654876708984375, -0.2239990234375, -0.1825103759765625, -0.141021728515625, -0.0995330810546875, -0.05804443359375, -0.0165557861328125, 0.024932861328125, 0.0664215087890625, 0.10791015625, 0.1493988037109375, 0.190887451171875, 0.2323760986328125, 0.27386474609375, 0.3153533935546875, 0.356842041015625, 0.3983306884765625, 0.4398193359375, 0.4813079833984375, 0.522796630859375, 0.5642852783203125, 0.60577392578125, 0.6472625732421875, 0.688751220703125, 0.7302398681640625, 0.771728515625, 0.8132171630859375, 0.854705810546875, 0.8961944580078125, 0.93768310546875, 0.9791717529296875, 1.020660400390625, 1.0621490478515625, 1.1036376953125, 1.1451263427734375, 1.186614990234375, 1.2281036376953125, 1.26959228515625, 1.3110809326171875, 1.352569580078125, 1.3940582275390625, 1.435546875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 2.0, 10.0, 5.0, 8.0, 9.0, 18.0, 15.0, 20.0, 23.0, 31.0, 37.0, 31.0, 41.0, 39.0, 51.0, 35.0, 45.0, 46.0, 60.0, 54.0, 48.0, 41.0, 58.0, 36.0, 42.0, 40.0, 26.0, 27.0, 22.0, 16.0, 15.0, 6.0, 13.0, 6.0, 5.0, 4.0, 8.0, 1.0, 0.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2467041015625, -0.2385730743408203, -0.23044204711914062, -0.22231101989746094, -0.21417999267578125, -0.20604896545410156, -0.19791793823242188, -0.1897869110107422, -0.1816558837890625, -0.1735248565673828, -0.16539382934570312, -0.15726280212402344, -0.14913177490234375, -0.14100074768066406, -0.13286972045898438, -0.12473869323730469, -0.116607666015625, -0.10847663879394531, -0.10034561157226562, -0.09221458435058594, -0.08408355712890625, -0.07595252990722656, -0.06782150268554688, -0.05969047546386719, -0.0515594482421875, -0.04342842102050781, -0.035297393798828125, -0.027166366577148438, -0.01903533935546875, -0.010904312133789062, -0.002773284912109375, 0.0053577423095703125, 0.01348876953125, 0.021619796752929688, 0.029750823974609375, 0.03788185119628906, 0.04601287841796875, 0.05414390563964844, 0.062274932861328125, 0.07040596008300781, 0.0785369873046875, 0.08666801452636719, 0.09479904174804688, 0.10293006896972656, 0.11106109619140625, 0.11919212341308594, 0.12732315063476562, 0.1354541778564453, 0.143585205078125, 0.1517162322998047, 0.15984725952148438, 0.16797828674316406, 0.17610931396484375, 0.18424034118652344, 0.19237136840820312, 0.2005023956298828, 0.2086334228515625, 0.2167644500732422, 0.22489547729492188, 0.23302650451660156, 0.24115753173828125, 0.24928855895996094, 0.2574195861816406, 0.2655506134033203, 0.273681640625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 2.0, 6.0, 10.0, 9.0, 13.0, 22.0, 26.0, 43.0, 42.0, 48.0, 82.0, 120.0, 135.0, 217.0, 306.0, 525.0, 877.0, 1511.0, 3198.0, 7457.0, 20569.0, 70791.0, 467708.0, 3347035.0, 204188.0, 44169.0, 14073.0, 5373.0, 2446.0, 1216.0, 689.0, 421.0, 266.0, 182.0, 140.0, 111.0, 75.0, 58.0, 37.0, 29.0, 21.0, 12.0, 9.0, 10.0, 2.0, 5.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.59765625, -1.5466461181640625, -1.495635986328125, -1.4446258544921875, -1.39361572265625, -1.3426055908203125, -1.291595458984375, -1.2405853271484375, -1.1895751953125, -1.1385650634765625, -1.087554931640625, -1.0365447998046875, -0.98553466796875, -0.9345245361328125, -0.883514404296875, -0.8325042724609375, -0.781494140625, -0.7304840087890625, -0.679473876953125, -0.6284637451171875, -0.57745361328125, -0.5264434814453125, -0.475433349609375, -0.4244232177734375, -0.3734130859375, -0.3224029541015625, -0.271392822265625, -0.2203826904296875, -0.16937255859375, -0.1183624267578125, -0.067352294921875, -0.0163421630859375, 0.03466796875, 0.0856781005859375, 0.136688232421875, 0.1876983642578125, 0.23870849609375, 0.2897186279296875, 0.340728759765625, 0.3917388916015625, 0.4427490234375, 0.4937591552734375, 0.544769287109375, 0.5957794189453125, 0.64678955078125, 0.6977996826171875, 0.748809814453125, 0.7998199462890625, 0.850830078125, 0.9018402099609375, 0.952850341796875, 1.0038604736328125, 1.05487060546875, 1.1058807373046875, 1.156890869140625, 1.2079010009765625, 1.2589111328125, 1.3099212646484375, 1.360931396484375, 1.4119415283203125, 1.46295166015625, 1.5139617919921875, 1.564971923828125, 1.6159820556640625, 1.6669921875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 4.0, 7.0, 9.0, 15.0, 26.0, 51.0, 101.0, 186.0, 645.0, 2180.0, 437.0, 183.0, 107.0, 45.0, 40.0, 17.0, 5.0, 7.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.07421875, -1.033447265625, -0.99267578125, -0.951904296875, -0.9111328125, -0.870361328125, -0.82958984375, -0.788818359375, -0.748046875, -0.707275390625, -0.66650390625, -0.625732421875, -0.5849609375, -0.544189453125, -0.50341796875, -0.462646484375, -0.421875, -0.381103515625, -0.34033203125, -0.299560546875, -0.2587890625, -0.218017578125, -0.17724609375, -0.136474609375, -0.095703125, -0.054931640625, -0.01416015625, 0.026611328125, 0.0673828125, 0.108154296875, 0.14892578125, 0.189697265625, 0.23046875, 0.271240234375, 0.31201171875, 0.352783203125, 0.3935546875, 0.434326171875, 0.47509765625, 0.515869140625, 0.556640625, 0.597412109375, 0.63818359375, 0.678955078125, 0.7197265625, 0.760498046875, 0.80126953125, 0.842041015625, 0.8828125, 0.923583984375, 0.96435546875, 1.005126953125, 1.0458984375, 1.086669921875, 1.12744140625, 1.168212890625, 1.208984375, 1.249755859375, 1.29052734375, 1.331298828125, 1.3720703125, 1.412841796875, 1.45361328125, 1.494384765625, 1.53515625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 17.0, 67.0, 243.0, 390.0, 224.0, 50.0, 13.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.677103042602539, -12.157782554626465, -11.63846206665039, -11.119141578674316, -10.599821090698242, -10.080500602722168, -9.561180114746094, -9.04185962677002, -8.522539138793945, -8.003218650817871, -7.483898162841797, -6.964577674865723, -6.445257186889648, -5.925936698913574, -5.4066162109375, -4.887295722961426, -4.367975234985352, -3.8486547470092773, -3.329334259033203, -2.810013771057129, -2.2906932830810547, -1.7713727951049805, -1.2520523071289062, -0.732731819152832, -0.2134113311767578, 0.3059091567993164, 0.8252296447753906, 1.3445501327514648, 1.863870620727539, 2.3831911087036133, 2.9025115966796875, 3.4218320846557617, 3.9411544799804688, 4.460474967956543, 4.979795455932617, 5.499115943908691, 6.018436431884766, 6.53775691986084, 7.057077407836914, 7.576397895812988, 8.095718383789062, 8.615038871765137, 9.134359359741211, 9.653679847717285, 10.17300033569336, 10.692320823669434, 11.211641311645508, 11.730961799621582, 12.250282287597656, 12.76960277557373, 13.288923263549805, 13.808243751525879, 14.327564239501953, 14.846884727478027, 15.366205215454102, 15.885525703430176, 16.40484619140625, 16.92416763305664, 17.4434871673584, 17.962806701660156, 18.482128143310547, 19.001449584960938, 19.520769119262695, 20.040088653564453, 20.559410095214844]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 10.0, 7.0, 8.0, 14.0, 11.0, 13.0, 22.0, 22.0, 23.0, 39.0, 44.0, 43.0, 45.0, 53.0, 60.0, 64.0, 46.0, 49.0, 53.0, 47.0, 55.0, 42.0, 38.0, 43.0, 35.0, 20.0, 16.0, 19.0, 16.0, 10.0, 10.0, 11.0, 9.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.6291866302490234, -2.518465042114258, -2.407743215560913, -2.2970216274261475, -2.186300039291382, -2.075578212738037, -1.9648566246032715, -1.8541350364685059, -1.7434133291244507, -1.6326916217803955, -1.5219700336456299, -1.4112483263015747, -1.3005266189575195, -1.189805030822754, -1.0790833234786987, -0.9683616757392883, -0.8576400279998779, -0.7469183802604675, -0.6361967325210571, -0.525475025177002, -0.41475337743759155, -0.30403172969818115, -0.19331002235412598, -0.08258837461471558, 0.028133273124694824, 0.13885493576526642, 0.249576598405838, 0.3602982759475708, 0.4710199236869812, 0.5817415714263916, 0.6924632787704468, 0.8031849265098572, 0.9139065742492676, 1.0246282815933228, 1.1353498697280884, 1.2460715770721436, 1.3567931652069092, 1.4675148725509644, 1.5782365798950195, 1.6889581680297852, 1.7996798753738403, 1.9104015827178955, 2.021123170852661, 2.131844997406006, 2.2425665855407715, 2.353288173675537, 2.4640097618103027, 2.5747315883636475, 2.685453176498413, 2.7961747646331787, 2.9068965911865234, 3.017618179321289, 3.1283397674560547, 3.2390613555908203, 3.349783182144165, 3.4605047702789307, 3.5712265968322754, 3.681948184967041, 3.7926700115203857, 3.9033915996551514, 4.014113426208496, 4.124835014343262, 4.235556602478027, 4.346278190612793, 4.456999778747559]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 9.0, 13.0, 19.0, 23.0, 38.0, 43.0, 97.0, 170.0, 259.0, 540.0, 1115.0, 2500.0, 5868.0, 14363.0, 38660.0, 115951.0, 328734.0, 345237.0, 126285.0, 41935.0, 15441.0, 6104.0, 2633.0, 1200.0, 597.0, 305.0, 160.0, 70.0, 57.0, 35.0, 20.0, 20.0, 14.0, 10.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1171875, -1.0811920166015625, -1.045196533203125, -1.0092010498046875, -0.97320556640625, -0.9372100830078125, -0.901214599609375, -0.8652191162109375, -0.8292236328125, -0.7932281494140625, -0.757232666015625, -0.7212371826171875, -0.68524169921875, -0.6492462158203125, -0.613250732421875, -0.5772552490234375, -0.541259765625, -0.5052642822265625, -0.469268798828125, -0.4332733154296875, -0.39727783203125, -0.3612823486328125, -0.325286865234375, -0.2892913818359375, -0.2532958984375, -0.2173004150390625, -0.181304931640625, -0.1453094482421875, -0.10931396484375, -0.0733184814453125, -0.037322998046875, -0.0013275146484375, 0.03466796875, 0.0706634521484375, 0.106658935546875, 0.1426544189453125, 0.17864990234375, 0.2146453857421875, 0.250640869140625, 0.2866363525390625, 0.3226318359375, 0.3586273193359375, 0.394622802734375, 0.4306182861328125, 0.46661376953125, 0.5026092529296875, 0.538604736328125, 0.5746002197265625, 0.610595703125, 0.6465911865234375, 0.682586669921875, 0.7185821533203125, 0.75457763671875, 0.7905731201171875, 0.826568603515625, 0.8625640869140625, 0.8985595703125, 0.9345550537109375, 0.970550537109375, 1.0065460205078125, 1.04254150390625, 1.0785369873046875, 1.114532470703125, 1.1505279541015625, 1.1865234375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 5.0, 3.0, 2.0, 12.0, 13.0, 13.0, 8.0, 26.0, 27.0, 26.0, 44.0, 36.0, 39.0, 39.0, 47.0, 46.0, 35.0, 44.0, 52.0, 49.0, 54.0, 51.0, 52.0, 41.0, 31.0, 37.0, 32.0, 30.0, 20.0, 15.0, 9.0, 13.0, 11.0, 10.0, 6.0, 2.0, 4.0, 3.0, 1.0, 6.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.261962890625, -0.2530517578125, -0.244140625, -0.2352294921875, -0.226318359375, -0.2174072265625, -0.20849609375, -0.1995849609375, -0.190673828125, -0.1817626953125, -0.1728515625, -0.1639404296875, -0.155029296875, -0.1461181640625, -0.13720703125, -0.1282958984375, -0.119384765625, -0.1104736328125, -0.1015625, -0.0926513671875, -0.083740234375, -0.0748291015625, -0.06591796875, -0.0570068359375, -0.048095703125, -0.0391845703125, -0.0302734375, -0.0213623046875, -0.012451171875, -0.0035400390625, 0.00537109375, 0.0142822265625, 0.023193359375, 0.0321044921875, 0.041015625, 0.0499267578125, 0.058837890625, 0.0677490234375, 0.07666015625, 0.0855712890625, 0.094482421875, 0.1033935546875, 0.1123046875, 0.1212158203125, 0.130126953125, 0.1390380859375, 0.14794921875, 0.1568603515625, 0.165771484375, 0.1746826171875, 0.18359375, 0.1925048828125, 0.201416015625, 0.2103271484375, 0.21923828125, 0.2281494140625, 0.237060546875, 0.2459716796875, 0.2548828125, 0.2637939453125, 0.272705078125, 0.2816162109375, 0.29052734375, 0.2994384765625, 0.308349609375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 6.0, 0.0, 6.0, 7.0, 7.0, 8.0, 12.0, 19.0, 20.0, 42.0, 38.0, 53.0, 95.0, 135.0, 186.0, 279.0, 416.0, 740.0, 1410.0, 3427.0, 12177.0, 63610.0, 446426.0, 438749.0, 61842.0, 12001.0, 3328.0, 1403.0, 741.0, 424.0, 270.0, 179.0, 137.0, 88.0, 78.0, 49.0, 33.0, 37.0, 21.0, 18.0, 7.0, 9.0, 7.0, 6.0, 2.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.73046875, -1.6727752685546875, -1.615081787109375, -1.5573883056640625, -1.49969482421875, -1.4420013427734375, -1.384307861328125, -1.3266143798828125, -1.2689208984375, -1.2112274169921875, -1.153533935546875, -1.0958404541015625, -1.03814697265625, -0.9804534912109375, -0.922760009765625, -0.8650665283203125, -0.807373046875, -0.7496795654296875, -0.691986083984375, -0.6342926025390625, -0.57659912109375, -0.5189056396484375, -0.461212158203125, -0.4035186767578125, -0.3458251953125, -0.2881317138671875, -0.230438232421875, -0.1727447509765625, -0.11505126953125, -0.0573577880859375, 0.000335693359375, 0.0580291748046875, 0.11572265625, 0.1734161376953125, 0.231109619140625, 0.2888031005859375, 0.34649658203125, 0.4041900634765625, 0.461883544921875, 0.5195770263671875, 0.5772705078125, 0.6349639892578125, 0.692657470703125, 0.7503509521484375, 0.80804443359375, 0.8657379150390625, 0.923431396484375, 0.9811248779296875, 1.038818359375, 1.0965118408203125, 1.154205322265625, 1.2118988037109375, 1.26959228515625, 1.3272857666015625, 1.384979248046875, 1.4426727294921875, 1.5003662109375, 1.5580596923828125, 1.615753173828125, 1.6734466552734375, 1.73114013671875, 1.7888336181640625, 1.846527099609375, 1.9042205810546875, 1.9619140625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 5.0, 4.0, 7.0, 6.0, 6.0, 13.0, 14.0, 14.0, 34.0, 23.0, 22.0, 18.0, 33.0, 33.0, 37.0, 45.0, 50.0, 44.0, 61.0, 54.0, 61.0, 44.0, 50.0, 43.0, 46.0, 38.0, 32.0, 28.0, 25.0, 19.0, 22.0, 11.0, 12.0, 11.0, 9.0, 7.0, 5.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8232421875, -1.7716217041015625, -1.720001220703125, -1.6683807373046875, -1.61676025390625, -1.5651397705078125, -1.513519287109375, -1.4618988037109375, -1.4102783203125, -1.3586578369140625, -1.307037353515625, -1.2554168701171875, -1.20379638671875, -1.1521759033203125, -1.100555419921875, -1.0489349365234375, -0.997314453125, -0.9456939697265625, -0.894073486328125, -0.8424530029296875, -0.79083251953125, -0.7392120361328125, -0.687591552734375, -0.6359710693359375, -0.5843505859375, -0.5327301025390625, -0.481109619140625, -0.4294891357421875, -0.37786865234375, -0.3262481689453125, -0.274627685546875, -0.2230072021484375, -0.17138671875, -0.1197662353515625, -0.068145751953125, -0.0165252685546875, 0.03509521484375, 0.0867156982421875, 0.138336181640625, 0.1899566650390625, 0.2415771484375, 0.2931976318359375, 0.344818115234375, 0.3964385986328125, 0.44805908203125, 0.4996795654296875, 0.551300048828125, 0.6029205322265625, 0.654541015625, 0.7061614990234375, 0.757781982421875, 0.8094024658203125, 0.86102294921875, 0.9126434326171875, 0.964263916015625, 1.0158843994140625, 1.0675048828125, 1.1191253662109375, 1.170745849609375, 1.2223663330078125, 1.27398681640625, 1.3256072998046875, 1.377227783203125, 1.4288482666015625, 1.48046875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 5.0, 9.0, 7.0, 8.0, 17.0, 17.0, 25.0, 46.0, 56.0, 58.0, 88.0, 158.0, 259.0, 361.0, 716.0, 1396.0, 3061.0, 8567.0, 36592.0, 248366.0, 598582.0, 119151.0, 20482.0, 5802.0, 2259.0, 970.0, 552.0, 334.0, 198.0, 132.0, 85.0, 62.0, 38.0, 18.0, 21.0, 24.0, 10.0, 7.0, 7.0, 6.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7822265625, -0.7572479248046875, -0.732269287109375, -0.7072906494140625, -0.68231201171875, -0.6573333740234375, -0.632354736328125, -0.6073760986328125, -0.5823974609375, -0.5574188232421875, -0.532440185546875, -0.5074615478515625, -0.48248291015625, -0.4575042724609375, -0.432525634765625, -0.4075469970703125, -0.382568359375, -0.3575897216796875, -0.332611083984375, -0.3076324462890625, -0.28265380859375, -0.2576751708984375, -0.232696533203125, -0.2077178955078125, -0.1827392578125, -0.1577606201171875, -0.132781982421875, -0.1078033447265625, -0.08282470703125, -0.0578460693359375, -0.032867431640625, -0.0078887939453125, 0.01708984375, 0.0420684814453125, 0.067047119140625, 0.0920257568359375, 0.11700439453125, 0.1419830322265625, 0.166961669921875, 0.1919403076171875, 0.2169189453125, 0.2418975830078125, 0.266876220703125, 0.2918548583984375, 0.31683349609375, 0.3418121337890625, 0.366790771484375, 0.3917694091796875, 0.416748046875, 0.4417266845703125, 0.466705322265625, 0.4916839599609375, 0.51666259765625, 0.5416412353515625, 0.566619873046875, 0.5915985107421875, 0.6165771484375, 0.6415557861328125, 0.666534423828125, 0.6915130615234375, 0.71649169921875, 0.7414703369140625, 0.766448974609375, 0.7914276123046875, 0.81640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 10.0, 15.0, 19.0, 18.0, 33.0, 31.0, 49.0, 58.0, 75.0, 79.0, 80.0, 80.0, 60.0, 63.0, 59.0, 52.0, 53.0, 38.0, 30.0, 18.0, 26.0, 13.0, 17.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.00013113021850585938, -0.00012769736349582672, -0.00012426450848579407, -0.00012083165347576141, -0.00011739879846572876, -0.0001139659434556961, -0.00011053308844566345, -0.0001071002334356308, -0.00010366737842559814, -0.00010023452341556549, -9.680166840553284e-05, -9.336881339550018e-05, -8.993595838546753e-05, -8.650310337543488e-05, -8.307024836540222e-05, -7.963739335536957e-05, -7.620453834533691e-05, -7.277168333530426e-05, -6.93388283252716e-05, -6.590597331523895e-05, -6.24731183052063e-05, -5.9040263295173645e-05, -5.560740828514099e-05, -5.217455327510834e-05, -4.8741698265075684e-05, -4.530884325504303e-05, -4.1875988245010376e-05, -3.844313323497772e-05, -3.501027822494507e-05, -3.1577423214912415e-05, -2.814456820487976e-05, -2.4711713194847107e-05, -2.1278858184814453e-05, -1.78460031747818e-05, -1.4413148164749146e-05, -1.0980293154716492e-05, -7.547438144683838e-06, -4.114583134651184e-06, -6.817281246185303e-07, 2.7511268854141235e-06, 6.183981895446777e-06, 9.616836905479431e-06, 1.3049691915512085e-05, 1.648254692554474e-05, 1.9915401935577393e-05, 2.3348256945610046e-05, 2.67811119556427e-05, 3.0213966965675354e-05, 3.364682197570801e-05, 3.707967698574066e-05, 4.0512531995773315e-05, 4.394538700580597e-05, 4.737824201583862e-05, 5.081109702587128e-05, 5.424395203590393e-05, 5.7676807045936584e-05, 6.110966205596924e-05, 6.454251706600189e-05, 6.797537207603455e-05, 7.14082270860672e-05, 7.484108209609985e-05, 7.827393710613251e-05, 8.170679211616516e-05, 8.513964712619781e-05, 8.857250213623047e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 8.0, 5.0, 5.0, 15.0, 21.0, 25.0, 40.0, 70.0, 91.0, 145.0, 304.0, 647.0, 1415.0, 4150.0, 17266.0, 173404.0, 739662.0, 94024.0, 11670.0, 3270.0, 1173.0, 474.0, 245.0, 136.0, 89.0, 54.0, 35.0, 23.0, 21.0, 16.0, 10.0, 11.0, 4.0, 5.0, 1.0, 3.0, 3.0, 5.0, 1.0, 0.0, 2.0], "bins": [-1.37890625, -1.3438949584960938, -1.3088836669921875, -1.2738723754882812, -1.238861083984375, -1.2038497924804688, -1.1688385009765625, -1.1338272094726562, -1.09881591796875, -1.0638046264648438, -1.0287933349609375, -0.9937820434570312, -0.958770751953125, -0.9237594604492188, -0.8887481689453125, -0.8537368774414062, -0.8187255859375, -0.7837142944335938, -0.7487030029296875, -0.7136917114257812, -0.678680419921875, -0.6436691284179688, -0.6086578369140625, -0.5736465454101562, -0.53863525390625, -0.5036239624023438, -0.4686126708984375, -0.43360137939453125, -0.398590087890625, -0.36357879638671875, -0.3285675048828125, -0.29355621337890625, -0.258544921875, -0.22353363037109375, -0.1885223388671875, -0.15351104736328125, -0.118499755859375, -0.08348846435546875, -0.0484771728515625, -0.01346588134765625, 0.02154541015625, 0.05655670166015625, 0.0915679931640625, 0.12657928466796875, 0.161590576171875, 0.19660186767578125, 0.2316131591796875, 0.26662445068359375, 0.3016357421875, 0.33664703369140625, 0.3716583251953125, 0.40666961669921875, 0.441680908203125, 0.47669219970703125, 0.5117034912109375, 0.5467147827148438, 0.58172607421875, 0.6167373657226562, 0.6517486572265625, 0.6867599487304688, 0.721771240234375, 0.7567825317382812, 0.7917938232421875, 0.8268051147460938, 0.86181640625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 6.0, 1.0, 6.0, 3.0, 1.0, 6.0, 9.0, 14.0, 16.0, 31.0, 30.0, 34.0, 53.0, 70.0, 97.0, 103.0, 89.0, 111.0, 77.0, 64.0, 36.0, 41.0, 30.0, 16.0, 14.0, 11.0, 8.0, 7.0, 8.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.548828125, -0.5277633666992188, -0.5066986083984375, -0.48563385009765625, -0.464569091796875, -0.44350433349609375, -0.4224395751953125, -0.40137481689453125, -0.38031005859375, -0.35924530029296875, -0.3381805419921875, -0.31711578369140625, -0.296051025390625, -0.27498626708984375, -0.2539215087890625, -0.23285675048828125, -0.2117919921875, -0.19072723388671875, -0.1696624755859375, -0.14859771728515625, -0.127532958984375, -0.10646820068359375, -0.0854034423828125, -0.06433868408203125, -0.04327392578125, -0.02220916748046875, -0.0011444091796875, 0.01992034912109375, 0.040985107421875, 0.06204986572265625, 0.0831146240234375, 0.10417938232421875, 0.125244140625, 0.14630889892578125, 0.1673736572265625, 0.18843841552734375, 0.209503173828125, 0.23056793212890625, 0.2516326904296875, 0.27269744873046875, 0.29376220703125, 0.31482696533203125, 0.3358917236328125, 0.35695648193359375, 0.378021240234375, 0.39908599853515625, 0.4201507568359375, 0.44121551513671875, 0.4622802734375, 0.48334503173828125, 0.5044097900390625, 0.5254745483398438, 0.546539306640625, 0.5676040649414062, 0.5886688232421875, 0.6097335815429688, 0.63079833984375, 0.6518630981445312, 0.6729278564453125, 0.6939926147460938, 0.715057373046875, 0.7361221313476562, 0.7571868896484375, 0.7782516479492188, 0.79931640625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 10.0, 11.0, 33.0, 63.0, 102.0, 155.0, 168.0, 144.0, 132.0, 69.0, 57.0, 29.0, 20.0, 8.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.308833122253418, -4.918044567108154, -4.527256488800049, -4.136467933654785, -3.7456796169281006, -3.354891300201416, -2.9641027450561523, -2.5733144283294678, -2.182526111602783, -1.7917377948760986, -1.4009493589401245, -1.0101609230041504, -0.6193726062774658, -0.22858428955078125, 0.16220426559448242, 0.552992582321167, 0.9437808990478516, 1.3345692157745361, 1.7253576517105103, 2.1161460876464844, 2.506934404373169, 2.8977227210998535, 3.288511276245117, 3.6792995929718018, 4.070087909698486, 4.46087646484375, 4.8516645431518555, 5.242453098297119, 5.633241653442383, 6.024029731750488, 6.414818286895752, 6.805606842041016, 7.196393966674805, 7.587182521820068, 7.977970600128174, 8.368759155273438, 8.759547233581543, 9.150335311889648, 9.54112434387207, 9.931912422180176, 10.322700500488281, 10.713488578796387, 11.104277610778809, 11.495065689086914, 11.88585376739502, 12.276641845703125, 12.667430877685547, 13.058218955993652, 13.449007987976074, 13.83979606628418, 14.230585098266602, 14.621373176574707, 15.012161254882812, 15.402950286865234, 15.79373836517334, 16.184526443481445, 16.575315475463867, 16.96610450744629, 17.356891632080078, 17.7476806640625, 18.138469696044922, 18.52925682067871, 18.920045852661133, 19.310834884643555, 19.701622009277344]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 4.0, 6.0, 8.0, 4.0, 14.0, 11.0, 14.0, 14.0, 21.0, 29.0, 27.0, 45.0, 31.0, 39.0, 41.0, 52.0, 47.0, 52.0, 59.0, 62.0, 54.0, 51.0, 47.0, 38.0, 60.0, 28.0, 25.0, 19.0, 21.0, 24.0, 9.0, 14.0, 8.0, 8.0, 7.0, 3.0, 3.0, 4.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.653554916381836, -7.374362468719482, -7.095170021057129, -6.815977573394775, -6.536785125732422, -6.25759220123291, -5.978399753570557, -5.699207305908203, -5.42001485824585, -5.140822410583496, -4.861629962921143, -4.582437515258789, -4.303244590759277, -4.024052619934082, -3.7448596954345703, -3.465667247772217, -3.1864748001098633, -2.9072823524475098, -2.6280899047851562, -2.3488972187042236, -2.06970477104187, -1.7905123233795166, -1.5113197565078735, -1.2321271896362305, -0.952934741973877, -0.6737422347068787, -0.39454972743988037, -0.11535722017288208, 0.1638352870941162, 0.4430277347564697, 0.7222203016281128, 1.0014128684997559, 1.280604362487793, 1.5597968101501465, 1.8389893770217896, 2.1181819438934326, 2.397374391555786, 2.6765668392181396, 2.9557595252990723, 3.234951972961426, 3.5141444206237793, 3.793336868286133, 4.072529315948486, 4.35172176361084, 4.630914688110352, 4.910106658935547, 5.189299583435059, 5.468492031097412, 5.747684478759766, 6.026876926422119, 6.306069374084473, 6.585261821746826, 6.86445426940918, 7.143647193908691, 7.422839641571045, 7.702032089233398, 7.981224536895752, 8.260416984558105, 8.539609909057617, 8.818801879882812, 9.097994804382324, 9.37718677520752, 9.656379699707031, 9.935571670532227, 10.214764595031738]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 3.0, 8.0, 10.0, 11.0, 11.0, 17.0, 23.0, 32.0, 36.0, 57.0, 70.0, 136.0, 273.0, 400.0, 676.0, 1188.0, 2578.0, 6901.0, 30807.0, 4021132.0, 109261.0, 12822.0, 3855.0, 1696.0, 908.0, 511.0, 288.0, 170.0, 95.0, 76.0, 63.0, 41.0, 32.0, 28.0, 16.0, 10.0, 7.0, 4.0, 7.0, 8.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.330078125, -2.248992919921875, -2.16790771484375, -2.086822509765625, -2.0057373046875, -1.924652099609375, -1.84356689453125, -1.762481689453125, -1.681396484375, -1.600311279296875, -1.51922607421875, -1.438140869140625, -1.3570556640625, -1.275970458984375, -1.19488525390625, -1.113800048828125, -1.03271484375, -0.951629638671875, -0.87054443359375, -0.789459228515625, -0.7083740234375, -0.627288818359375, -0.54620361328125, -0.465118408203125, -0.384033203125, -0.302947998046875, -0.22186279296875, -0.140777587890625, -0.0596923828125, 0.021392822265625, 0.10247802734375, 0.183563232421875, 0.2646484375, 0.345733642578125, 0.42681884765625, 0.507904052734375, 0.5889892578125, 0.670074462890625, 0.75115966796875, 0.832244873046875, 0.913330078125, 0.994415283203125, 1.07550048828125, 1.156585693359375, 1.2376708984375, 1.318756103515625, 1.39984130859375, 1.480926513671875, 1.56201171875, 1.643096923828125, 1.72418212890625, 1.805267333984375, 1.8863525390625, 1.967437744140625, 2.04852294921875, 2.129608154296875, 2.210693359375, 2.291778564453125, 2.37286376953125, 2.453948974609375, 2.5350341796875, 2.616119384765625, 2.69720458984375, 2.778289794921875, 2.859375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 2.0, 6.0, 8.0, 4.0, 10.0, 18.0, 18.0, 19.0, 24.0, 30.0, 29.0, 39.0, 51.0, 46.0, 48.0, 58.0, 49.0, 63.0, 50.0, 41.0, 59.0, 44.0, 45.0, 40.0, 36.0, 28.0, 27.0, 21.0, 15.0, 15.0, 14.0, 10.0, 10.0, 6.0, 3.0, 3.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31005859375, -0.2992897033691406, -0.28852081298828125, -0.2777519226074219, -0.2669830322265625, -0.2562141418457031, -0.24544525146484375, -0.23467636108398438, -0.223907470703125, -0.21313858032226562, -0.20236968994140625, -0.19160079956054688, -0.1808319091796875, -0.17006301879882812, -0.15929412841796875, -0.14852523803710938, -0.13775634765625, -0.12698745727539062, -0.11621856689453125, -0.10544967651367188, -0.0946807861328125, -0.08391189575195312, -0.07314300537109375, -0.062374114990234375, -0.051605224609375, -0.040836334228515625, -0.03006744384765625, -0.019298553466796875, -0.0085296630859375, 0.002239227294921875, 0.01300811767578125, 0.023777008056640625, 0.0345458984375, 0.045314788818359375, 0.05608367919921875, 0.06685256958007812, 0.0776214599609375, 0.08839035034179688, 0.09915924072265625, 0.10992813110351562, 0.120697021484375, 0.13146591186523438, 0.14223480224609375, 0.15300369262695312, 0.1637725830078125, 0.17454147338867188, 0.18531036376953125, 0.19607925415039062, 0.20684814453125, 0.21761703491210938, 0.22838592529296875, 0.23915481567382812, 0.2499237060546875, 0.2606925964355469, 0.27146148681640625, 0.2822303771972656, 0.292999267578125, 0.3037681579589844, 0.31453704833984375, 0.3253059387207031, 0.3360748291015625, 0.3468437194824219, 0.35761260986328125, 0.3683815002441406, 0.379150390625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 4.0, 5.0, 5.0, 6.0, 9.0, 7.0, 17.0, 26.0, 21.0, 34.0, 62.0, 74.0, 120.0, 172.0, 273.0, 467.0, 803.0, 1540.0, 3094.0, 8267.0, 39893.0, 4050733.0, 70569.0, 10545.0, 3755.0, 1626.0, 815.0, 464.0, 260.0, 181.0, 117.0, 70.0, 59.0, 36.0, 40.0, 19.0, 22.0, 20.0, 15.0, 7.0, 7.0, 8.0, 8.0, 4.0, 1.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.8515625, -2.758392333984375, -2.66522216796875, -2.572052001953125, -2.4788818359375, -2.385711669921875, -2.29254150390625, -2.199371337890625, -2.106201171875, -2.013031005859375, -1.91986083984375, -1.826690673828125, -1.7335205078125, -1.640350341796875, -1.54718017578125, -1.454010009765625, -1.36083984375, -1.267669677734375, -1.17449951171875, -1.081329345703125, -0.9881591796875, -0.894989013671875, -0.80181884765625, -0.708648681640625, -0.615478515625, -0.522308349609375, -0.42913818359375, -0.335968017578125, -0.2427978515625, -0.149627685546875, -0.05645751953125, 0.036712646484375, 0.1298828125, 0.223052978515625, 0.31622314453125, 0.409393310546875, 0.5025634765625, 0.595733642578125, 0.68890380859375, 0.782073974609375, 0.875244140625, 0.968414306640625, 1.06158447265625, 1.154754638671875, 1.2479248046875, 1.341094970703125, 1.43426513671875, 1.527435302734375, 1.62060546875, 1.713775634765625, 1.80694580078125, 1.900115966796875, 1.9932861328125, 2.086456298828125, 2.17962646484375, 2.272796630859375, 2.365966796875, 2.459136962890625, 2.55230712890625, 2.645477294921875, 2.7386474609375, 2.831817626953125, 2.92498779296875, 3.018157958984375, 3.111328125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 4.0, 3.0, 2.0, 6.0, 6.0, 18.0, 34.0, 83.0, 3608.0, 243.0, 37.0, 21.0, 9.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6826171875, -0.6538238525390625, -0.625030517578125, -0.5962371826171875, -0.56744384765625, -0.5386505126953125, -0.509857177734375, -0.4810638427734375, -0.4522705078125, -0.4234771728515625, -0.394683837890625, -0.3658905029296875, -0.33709716796875, -0.3083038330078125, -0.279510498046875, -0.2507171630859375, -0.221923828125, -0.1931304931640625, -0.164337158203125, -0.1355438232421875, -0.10675048828125, -0.0779571533203125, -0.049163818359375, -0.0203704833984375, 0.0084228515625, 0.0372161865234375, 0.066009521484375, 0.0948028564453125, 0.12359619140625, 0.1523895263671875, 0.181182861328125, 0.2099761962890625, 0.23876953125, 0.2675628662109375, 0.296356201171875, 0.3251495361328125, 0.35394287109375, 0.3827362060546875, 0.411529541015625, 0.4403228759765625, 0.4691162109375, 0.4979095458984375, 0.526702880859375, 0.5554962158203125, 0.58428955078125, 0.6130828857421875, 0.641876220703125, 0.6706695556640625, 0.699462890625, 0.7282562255859375, 0.757049560546875, 0.7858428955078125, 0.81463623046875, 0.8434295654296875, 0.872222900390625, 0.9010162353515625, 0.9298095703125, 0.9586029052734375, 0.987396240234375, 1.0161895751953125, 1.04498291015625, 1.0737762451171875, 1.102569580078125, 1.1313629150390625, 1.16015625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 8.0, 6.0, 9.0, 19.0, 30.0, 41.0, 61.0, 101.0, 142.0, 131.0, 137.0, 121.0, 75.0, 41.0, 33.0, 19.0, 6.0, 10.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7955703735351562, -2.7245702743530273, -2.6535699367523193, -2.5825695991516113, -2.5115694999694824, -2.4405694007873535, -2.3695690631866455, -2.2985687255859375, -2.2275686264038086, -2.1565685272216797, -2.0855681896209717, -2.0145678520202637, -1.9435677528381348, -1.8725675344467163, -1.8015673160552979, -1.7305670976638794, -1.659566879272461, -1.5885666608810425, -1.517566442489624, -1.4465662240982056, -1.375566005706787, -1.3045657873153687, -1.2335655689239502, -1.1625653505325317, -1.0915651321411133, -1.0205649137496948, -0.9495646953582764, -0.8785644769668579, -0.8075642585754395, -0.736564040184021, -0.6655638217926025, -0.5945636034011841, -0.5235631465911865, -0.45256292819976807, -0.3815627098083496, -0.31056249141693115, -0.2395622730255127, -0.16856205463409424, -0.09756183624267578, -0.026561617851257324, 0.04443860054016113, 0.11543881893157959, 0.18643903732299805, 0.2574392557144165, 0.32843947410583496, 0.3994396924972534, 0.4704399108886719, 0.5414401292800903, 0.6124403476715088, 0.6834405660629272, 0.7544407844543457, 0.8254410028457642, 0.8964412212371826, 0.9674414396286011, 1.0384416580200195, 1.109441876411438, 1.1804420948028564, 1.251442313194275, 1.3224425315856934, 1.3934427499771118, 1.4644429683685303, 1.5354431867599487, 1.6064434051513672, 1.6774436235427856, 1.748443841934204]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 9.0, 11.0, 9.0, 15.0, 8.0, 15.0, 28.0, 26.0, 37.0, 37.0, 45.0, 35.0, 42.0, 51.0, 45.0, 46.0, 47.0, 42.0, 36.0, 39.0, 38.0, 37.0, 38.0, 45.0, 32.0, 36.0, 27.0, 25.0, 21.0, 10.0, 16.0, 14.0, 8.0, 8.0, 7.0, 6.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3777682781219482, -1.3389514684677124, -1.3001347780227661, -1.2613179683685303, -1.222501277923584, -1.1836844682693481, -1.1448677778244019, -1.106050968170166, -1.0672342777252197, -1.0284174680709839, -0.9896007776260376, -0.9507840275764465, -0.9119672775268555, -0.8731504678726196, -0.8343337178230286, -0.7955169677734375, -0.7567001581192017, -0.7178834080696106, -0.6790666580200195, -0.6402499079704285, -0.6014331579208374, -0.5626163482666016, -0.5237995982170105, -0.48498284816741943, -0.44616609811782837, -0.4073493480682373, -0.36853259801864624, -0.3297158181667328, -0.2908990681171417, -0.25208231806755066, -0.2132655531167984, -0.17444878816604614, -0.13563191890716553, -0.09681516140699387, -0.057998403906822205, -0.019181646406650543, 0.019635111093521118, 0.05845186114311218, 0.09726862609386444, 0.1360853910446167, 0.17490214109420776, 0.21371889114379883, 0.2525356411933899, 0.29135242104530334, 0.3301691710948944, 0.3689859211444855, 0.4078027009963989, 0.44661945104599, 0.48543620109558105, 0.5242529511451721, 0.5630697011947632, 0.6018864512443542, 0.6407032012939453, 0.6795200109481812, 0.7183367609977722, 0.7571535110473633, 0.7959702610969543, 0.8347870111465454, 0.8736037611961365, 0.9124205112457275, 0.9512373208999634, 0.9900540113449097, 1.0288708209991455, 1.0676875114440918, 1.1065043210983276]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 8.0, 6.0, 5.0, 8.0, 16.0, 22.0, 35.0, 55.0, 63.0, 122.0, 208.0, 404.0, 737.0, 1529.0, 3284.0, 6992.0, 16512.0, 37839.0, 85060.0, 179076.0, 280804.0, 226227.0, 115687.0, 52188.0, 22848.0, 9951.0, 4462.0, 2218.0, 1002.0, 532.0, 270.0, 145.0, 74.0, 52.0, 37.0, 22.0, 12.0, 11.0, 15.0, 6.0, 7.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.90966796875, -0.880035400390625, -0.85040283203125, -0.820770263671875, -0.7911376953125, -0.761505126953125, -0.73187255859375, -0.702239990234375, -0.672607421875, -0.642974853515625, -0.61334228515625, -0.583709716796875, -0.5540771484375, -0.524444580078125, -0.49481201171875, -0.465179443359375, -0.435546875, -0.405914306640625, -0.37628173828125, -0.346649169921875, -0.3170166015625, -0.287384033203125, -0.25775146484375, -0.228118896484375, -0.198486328125, -0.168853759765625, -0.13922119140625, -0.109588623046875, -0.0799560546875, -0.050323486328125, -0.02069091796875, 0.008941650390625, 0.03857421875, 0.068206787109375, 0.09783935546875, 0.127471923828125, 0.1571044921875, 0.186737060546875, 0.21636962890625, 0.246002197265625, 0.275634765625, 0.305267333984375, 0.33489990234375, 0.364532470703125, 0.3941650390625, 0.423797607421875, 0.45343017578125, 0.483062744140625, 0.5126953125, 0.542327880859375, 0.57196044921875, 0.601593017578125, 0.6312255859375, 0.660858154296875, 0.69049072265625, 0.720123291015625, 0.749755859375, 0.779388427734375, 0.80902099609375, 0.838653564453125, 0.8682861328125, 0.897918701171875, 0.92755126953125, 0.957183837890625, 0.98681640625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 4.0, 6.0, 9.0, 6.0, 11.0, 8.0, 9.0, 15.0, 19.0, 17.0, 31.0, 26.0, 33.0, 36.0, 50.0, 42.0, 46.0, 42.0, 65.0, 50.0, 54.0, 50.0, 46.0, 45.0, 41.0, 36.0, 30.0, 25.0, 22.0, 22.0, 19.0, 21.0, 17.0, 11.0, 6.0, 11.0, 4.0, 3.0, 5.0, 3.0, 6.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.360595703125, -0.3488197326660156, -0.33704376220703125, -0.3252677917480469, -0.3134918212890625, -0.3017158508300781, -0.28993988037109375, -0.2781639099121094, -0.266387939453125, -0.2546119689941406, -0.24283599853515625, -0.23106002807617188, -0.2192840576171875, -0.20750808715820312, -0.19573211669921875, -0.18395614624023438, -0.17218017578125, -0.16040420532226562, -0.14862823486328125, -0.13685226440429688, -0.1250762939453125, -0.11330032348632812, -0.10152435302734375, -0.08974838256835938, -0.077972412109375, -0.06619644165039062, -0.05442047119140625, -0.042644500732421875, -0.0308685302734375, -0.019092559814453125, -0.00731658935546875, 0.004459381103515625, 0.0162353515625, 0.028011322021484375, 0.03978729248046875, 0.051563262939453125, 0.0633392333984375, 0.07511520385742188, 0.08689117431640625, 0.09866714477539062, 0.110443115234375, 0.12221908569335938, 0.13399505615234375, 0.14577102661132812, 0.1575469970703125, 0.16932296752929688, 0.18109893798828125, 0.19287490844726562, 0.20465087890625, 0.21642684936523438, 0.22820281982421875, 0.23997879028320312, 0.2517547607421875, 0.2635307312011719, 0.27530670166015625, 0.2870826721191406, 0.298858642578125, 0.3106346130371094, 0.32241058349609375, 0.3341865539550781, 0.3459625244140625, 0.3577384948730469, 0.36951446533203125, 0.3812904357910156, 0.39306640625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 6.0, 6.0, 9.0, 16.0, 17.0, 20.0, 40.0, 47.0, 91.0, 118.0, 154.0, 256.0, 375.0, 557.0, 1157.0, 2591.0, 10050.0, 71700.0, 561160.0, 349576.0, 39738.0, 6392.0, 1901.0, 900.0, 519.0, 370.0, 233.0, 159.0, 135.0, 88.0, 56.0, 32.0, 33.0, 14.0, 19.0, 10.0, 5.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1953125, -2.128509521484375, -2.06170654296875, -1.994903564453125, -1.9281005859375, -1.861297607421875, -1.79449462890625, -1.727691650390625, -1.660888671875, -1.594085693359375, -1.52728271484375, -1.460479736328125, -1.3936767578125, -1.326873779296875, -1.26007080078125, -1.193267822265625, -1.12646484375, -1.059661865234375, -0.99285888671875, -0.926055908203125, -0.8592529296875, -0.792449951171875, -0.72564697265625, -0.658843994140625, -0.592041015625, -0.525238037109375, -0.45843505859375, -0.391632080078125, -0.3248291015625, -0.258026123046875, -0.19122314453125, -0.124420166015625, -0.0576171875, 0.009185791015625, 0.07598876953125, 0.142791748046875, 0.2095947265625, 0.276397705078125, 0.34320068359375, 0.410003662109375, 0.476806640625, 0.543609619140625, 0.61041259765625, 0.677215576171875, 0.7440185546875, 0.810821533203125, 0.87762451171875, 0.944427490234375, 1.01123046875, 1.078033447265625, 1.14483642578125, 1.211639404296875, 1.2784423828125, 1.345245361328125, 1.41204833984375, 1.478851318359375, 1.545654296875, 1.612457275390625, 1.67926025390625, 1.746063232421875, 1.8128662109375, 1.879669189453125, 1.94647216796875, 2.013275146484375, 2.080078125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 7.0, 7.0, 9.0, 11.0, 9.0, 18.0, 17.0, 21.0, 27.0, 26.0, 44.0, 42.0, 59.0, 46.0, 49.0, 59.0, 61.0, 54.0, 51.0, 56.0, 53.0, 46.0, 33.0, 34.0, 25.0, 32.0, 26.0, 17.0, 16.0, 11.0, 7.0, 8.0, 3.0, 6.0, 10.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.47265625, -2.40533447265625, -2.3380126953125, -2.27069091796875, -2.203369140625, -2.13604736328125, -2.0687255859375, -2.00140380859375, -1.93408203125, -1.86676025390625, -1.7994384765625, -1.73211669921875, -1.664794921875, -1.59747314453125, -1.5301513671875, -1.46282958984375, -1.3955078125, -1.32818603515625, -1.2608642578125, -1.19354248046875, -1.126220703125, -1.05889892578125, -0.9915771484375, -0.92425537109375, -0.85693359375, -0.78961181640625, -0.7222900390625, -0.65496826171875, -0.587646484375, -0.52032470703125, -0.4530029296875, -0.38568115234375, -0.318359375, -0.25103759765625, -0.1837158203125, -0.11639404296875, -0.049072265625, 0.01824951171875, 0.0855712890625, 0.15289306640625, 0.22021484375, 0.28753662109375, 0.3548583984375, 0.42218017578125, 0.489501953125, 0.55682373046875, 0.6241455078125, 0.69146728515625, 0.7587890625, 0.82611083984375, 0.8934326171875, 0.96075439453125, 1.028076171875, 1.09539794921875, 1.1627197265625, 1.23004150390625, 1.29736328125, 1.36468505859375, 1.4320068359375, 1.49932861328125, 1.566650390625, 1.63397216796875, 1.7012939453125, 1.76861572265625, 1.8359375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 11.0, 14.0, 23.0, 32.0, 49.0, 169.0, 292.0, 731.0, 2308.0, 9241.0, 87238.0, 867487.0, 69181.0, 8490.0, 2106.0, 654.0, 261.0, 121.0, 61.0, 29.0, 13.0, 11.0, 8.0, 8.0, 6.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.35546875, -2.2986602783203125, -2.241851806640625, -2.1850433349609375, -2.12823486328125, -2.0714263916015625, -2.014617919921875, -1.9578094482421875, -1.9010009765625, -1.8441925048828125, -1.787384033203125, -1.7305755615234375, -1.67376708984375, -1.6169586181640625, -1.560150146484375, -1.5033416748046875, -1.446533203125, -1.3897247314453125, -1.332916259765625, -1.2761077880859375, -1.21929931640625, -1.1624908447265625, -1.105682373046875, -1.0488739013671875, -0.9920654296875, -0.9352569580078125, -0.878448486328125, -0.8216400146484375, -0.76483154296875, -0.7080230712890625, -0.651214599609375, -0.5944061279296875, -0.53759765625, -0.4807891845703125, -0.423980712890625, -0.3671722412109375, -0.31036376953125, -0.2535552978515625, -0.196746826171875, -0.1399383544921875, -0.0831298828125, -0.0263214111328125, 0.030487060546875, 0.0872955322265625, 0.14410400390625, 0.2009124755859375, 0.257720947265625, 0.3145294189453125, 0.371337890625, 0.4281463623046875, 0.484954833984375, 0.5417633056640625, 0.59857177734375, 0.6553802490234375, 0.712188720703125, 0.7689971923828125, 0.8258056640625, 0.8826141357421875, 0.939422607421875, 0.9962310791015625, 1.05303955078125, 1.1098480224609375, 1.166656494140625, 1.2234649658203125, 1.2802734375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 4.0, 8.0, 7.0, 6.0, 11.0, 11.0, 25.0, 34.0, 42.0, 34.0, 51.0, 74.0, 80.0, 89.0, 87.0, 84.0, 78.0, 54.0, 54.0, 43.0, 28.0, 14.0, 17.0, 16.0, 13.0, 7.0, 4.0, 5.0, 7.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001220703125, -0.00011828355491161346, -0.00011449679732322693, -0.00011071003973484039, -0.00010692328214645386, -0.00010313652455806732, -9.934976696968079e-05, -9.556300938129425e-05, -9.177625179290771e-05, -8.798949420452118e-05, -8.420273661613464e-05, -8.041597902774811e-05, -7.662922143936157e-05, -7.284246385097504e-05, -6.90557062625885e-05, -6.526894867420197e-05, -6.148219108581543e-05, -5.7695433497428894e-05, -5.390867590904236e-05, -5.012191832065582e-05, -4.633516073226929e-05, -4.254840314388275e-05, -3.8761645555496216e-05, -3.497488796710968e-05, -3.1188130378723145e-05, -2.740137279033661e-05, -2.3614615201950073e-05, -1.9827857613563538e-05, -1.6041100025177002e-05, -1.2254342436790466e-05, -8.46758484840393e-06, -4.680827260017395e-06, -8.940696716308594e-07, 2.8926879167556763e-06, 6.679445505142212e-06, 1.0466203093528748e-05, 1.4252960681915283e-05, 1.803971827030182e-05, 2.1826475858688354e-05, 2.561323344707489e-05, 2.9399991035461426e-05, 3.318674862384796e-05, 3.69735062122345e-05, 4.076026380062103e-05, 4.454702138900757e-05, 4.8333778977394104e-05, 5.212053656578064e-05, 5.5907294154167175e-05, 5.969405174255371e-05, 6.348080933094025e-05, 6.726756691932678e-05, 7.105432450771332e-05, 7.484108209609985e-05, 7.862783968448639e-05, 8.241459727287292e-05, 8.620135486125946e-05, 8.9988112449646e-05, 9.377487003803253e-05, 9.756162762641907e-05, 0.0001013483852148056, 0.00010513514280319214, 0.00010892190039157867, 0.00011270865797996521, 0.00011649541556835175, 0.00012028217315673828]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 7.0, 3.0, 4.0, 13.0, 7.0, 13.0, 12.0, 24.0, 36.0, 44.0, 89.0, 122.0, 218.0, 402.0, 875.0, 2196.0, 6608.0, 27394.0, 304737.0, 640997.0, 49816.0, 9456.0, 3065.0, 1150.0, 503.0, 269.0, 166.0, 87.0, 64.0, 55.0, 27.0, 16.0, 20.0, 13.0, 9.0, 8.0, 6.0, 5.0, 7.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3154296875, -1.27691650390625, -1.2384033203125, -1.19989013671875, -1.161376953125, -1.12286376953125, -1.0843505859375, -1.04583740234375, -1.00732421875, -0.96881103515625, -0.9302978515625, -0.89178466796875, -0.853271484375, -0.81475830078125, -0.7762451171875, -0.73773193359375, -0.69921875, -0.66070556640625, -0.6221923828125, -0.58367919921875, -0.545166015625, -0.50665283203125, -0.4681396484375, -0.42962646484375, -0.39111328125, -0.35260009765625, -0.3140869140625, -0.27557373046875, -0.237060546875, -0.19854736328125, -0.1600341796875, -0.12152099609375, -0.0830078125, -0.04449462890625, -0.0059814453125, 0.03253173828125, 0.071044921875, 0.10955810546875, 0.1480712890625, 0.18658447265625, 0.22509765625, 0.26361083984375, 0.3021240234375, 0.34063720703125, 0.379150390625, 0.41766357421875, 0.4561767578125, 0.49468994140625, 0.533203125, 0.57171630859375, 0.6102294921875, 0.64874267578125, 0.687255859375, 0.72576904296875, 0.7642822265625, 0.80279541015625, 0.84130859375, 0.87982177734375, 0.9183349609375, 0.95684814453125, 0.995361328125, 1.03387451171875, 1.0723876953125, 1.11090087890625, 1.1494140625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 4.0, 6.0, 3.0, 4.0, 7.0, 14.0, 10.0, 17.0, 13.0, 20.0, 29.0, 50.0, 70.0, 102.0, 103.0, 134.0, 114.0, 90.0, 56.0, 48.0, 35.0, 25.0, 15.0, 12.0, 4.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0361328125, -1.0060806274414062, -0.9760284423828125, -0.9459762573242188, -0.915924072265625, -0.8858718872070312, -0.8558197021484375, -0.8257675170898438, -0.79571533203125, -0.7656631469726562, -0.7356109619140625, -0.7055587768554688, -0.675506591796875, -0.6454544067382812, -0.6154022216796875, -0.5853500366210938, -0.5552978515625, -0.5252456665039062, -0.4951934814453125, -0.46514129638671875, -0.435089111328125, -0.40503692626953125, -0.3749847412109375, -0.34493255615234375, -0.31488037109375, -0.28482818603515625, -0.2547760009765625, -0.22472381591796875, -0.194671630859375, -0.16461944580078125, -0.1345672607421875, -0.10451507568359375, -0.074462890625, -0.04441070556640625, -0.0143585205078125, 0.01569366455078125, 0.045745849609375, 0.07579803466796875, 0.1058502197265625, 0.13590240478515625, 0.16595458984375, 0.19600677490234375, 0.2260589599609375, 0.25611114501953125, 0.286163330078125, 0.31621551513671875, 0.3462677001953125, 0.37631988525390625, 0.4063720703125, 0.43642425537109375, 0.4664764404296875, 0.49652862548828125, 0.526580810546875, 0.5566329956054688, 0.5866851806640625, 0.6167373657226562, 0.64678955078125, 0.6768417358398438, 0.7068939208984375, 0.7369461059570312, 0.766998291015625, 0.7970504760742188, 0.8271026611328125, 0.8571548461914062, 0.88720703125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 13.0, 14.0, 22.0, 31.0, 50.0, 79.0, 92.0, 105.0, 108.0, 100.0, 92.0, 86.0, 53.0, 43.0, 25.0, 27.0, 19.0, 11.0, 5.0, 9.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.044634819030762, -7.720362186431885, -7.39608907699585, -7.071816444396973, -6.7475433349609375, -6.4232707023620605, -6.098998069763184, -5.774724960327148, -5.4504523277282715, -5.1261796951293945, -4.801906585693359, -4.477633953094482, -4.1533613204956055, -3.8290882110595703, -3.5048155784606934, -3.1805427074432373, -2.8562698364257812, -2.531996965408325, -2.207724094390869, -1.8834514617919922, -1.5591785907745361, -1.23490571975708, -0.9106329679489136, -0.5863602161407471, -0.262087345123291, 0.062185466289520264, 0.38645827770233154, 0.7107310891151428, 1.035003900527954, 1.3592767715454102, 1.6835495233535767, 2.007822275161743, 2.3320960998535156, 2.6563689708709717, 2.9806418418884277, 3.3049144744873047, 3.6291873455047607, 3.953460216522217, 4.277732849121094, 4.602005958557129, 4.926278591156006, 5.250551223754883, 5.574824333190918, 5.899096965789795, 6.223369598388672, 6.547642707824707, 6.871915340423584, 7.196187973022461, 7.520461082458496, 7.844733715057373, 8.16900634765625, 8.493279457092285, 8.81755256652832, 9.141824722290039, 9.466097831726074, 9.79037094116211, 10.114643096923828, 10.438916206359863, 10.763188362121582, 11.087461471557617, 11.411734580993652, 11.736007690429688, 12.060279846191406, 12.384552955627441, 12.708826065063477]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 2.0, 3.0, 6.0, 10.0, 5.0, 7.0, 12.0, 13.0, 13.0, 12.0, 22.0, 23.0, 29.0, 33.0, 30.0, 27.0, 36.0, 32.0, 47.0, 50.0, 52.0, 53.0, 41.0, 43.0, 42.0, 46.0, 39.0, 38.0, 38.0, 36.0, 28.0, 29.0, 24.0, 12.0, 13.0, 15.0, 12.0, 5.0, 4.0, 7.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.243448257446289, -7.964699745178223, -7.685951232910156, -7.407202243804932, -7.128453731536865, -6.849705219268799, -6.570956230163574, -6.292207717895508, -6.013459205627441, -5.734710693359375, -5.455962181091309, -5.177213191986084, -4.898464679718018, -4.619716167449951, -4.340967178344727, -4.06221866607666, -3.7834701538085938, -3.5047216415405273, -3.225972890853882, -2.9472241401672363, -2.66847562789917, -2.3897271156311035, -2.110978364944458, -1.832229733467102, -1.553481101989746, -1.2747324705123901, -0.9959838390350342, -0.7172352075576782, -0.43848657608032227, -0.1597379446029663, 0.11901068687438965, 0.3977593183517456, 0.6765079498291016, 0.9552565813064575, 1.2340052127838135, 1.5127538442611694, 1.7915024757385254, 2.070250988006592, 2.3489997386932373, 2.627748489379883, 2.906497001647949, 3.1852455139160156, 3.463994264602661, 3.7427430152893066, 4.021491527557373, 4.3002400398254395, 4.578989028930664, 4.8577375411987305, 5.136486053466797, 5.415234565734863, 5.69398307800293, 5.972732067108154, 6.251480579376221, 6.530229091644287, 6.808978080749512, 7.087726593017578, 7.3664751052856445, 7.645223617553711, 7.923972129821777, 8.202720642089844, 8.481470108032227, 8.760218620300293, 9.03896713256836, 9.317715644836426, 9.596464157104492]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 0.0, 4.0, 1.0, 6.0, 2.0, 7.0, 9.0, 12.0, 14.0, 13.0, 24.0, 33.0, 47.0, 53.0, 58.0, 108.0, 151.0, 203.0, 338.0, 608.0, 1113.0, 2161.0, 4897.0, 14008.0, 75622.0, 4013202.0, 59699.0, 12783.0, 4415.0, 2048.0, 1024.0, 553.0, 332.0, 196.0, 147.0, 107.0, 70.0, 55.0, 44.0, 26.0, 27.0, 21.0, 11.0, 8.0, 8.0, 7.0, 3.0, 2.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9619140625, -1.8929595947265625, -1.824005126953125, -1.7550506591796875, -1.68609619140625, -1.6171417236328125, -1.548187255859375, -1.4792327880859375, -1.4102783203125, -1.3413238525390625, -1.272369384765625, -1.2034149169921875, -1.13446044921875, -1.0655059814453125, -0.996551513671875, -0.9275970458984375, -0.858642578125, -0.7896881103515625, -0.720733642578125, -0.6517791748046875, -0.58282470703125, -0.5138702392578125, -0.444915771484375, -0.3759613037109375, -0.3070068359375, -0.2380523681640625, -0.169097900390625, -0.1001434326171875, -0.03118896484375, 0.0377655029296875, 0.106719970703125, 0.1756744384765625, 0.24462890625, 0.3135833740234375, 0.382537841796875, 0.4514923095703125, 0.52044677734375, 0.5894012451171875, 0.658355712890625, 0.7273101806640625, 0.7962646484375, 0.8652191162109375, 0.934173583984375, 1.0031280517578125, 1.07208251953125, 1.1410369873046875, 1.209991455078125, 1.2789459228515625, 1.347900390625, 1.4168548583984375, 1.485809326171875, 1.5547637939453125, 1.62371826171875, 1.6926727294921875, 1.761627197265625, 1.8305816650390625, 1.8995361328125, 1.9684906005859375, 2.037445068359375, 2.1063995361328125, 2.17535400390625, 2.2443084716796875, 2.313262939453125, 2.3822174072265625, 2.451171875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 7.0, 3.0, 7.0, 6.0, 6.0, 6.0, 15.0, 10.0, 16.0, 13.0, 24.0, 33.0, 38.0, 36.0, 42.0, 39.0, 48.0, 52.0, 51.0, 49.0, 50.0, 50.0, 54.0, 31.0, 45.0, 40.0, 34.0, 46.0, 21.0, 25.0, 14.0, 13.0, 13.0, 16.0, 10.0, 8.0, 9.0, 4.0, 4.0, 3.0, 4.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.412841796875, -0.4010734558105469, -0.38930511474609375, -0.3775367736816406, -0.3657684326171875, -0.3540000915527344, -0.34223175048828125, -0.3304634094238281, -0.318695068359375, -0.3069267272949219, -0.29515838623046875, -0.2833900451660156, -0.2716217041015625, -0.2598533630371094, -0.24808502197265625, -0.23631668090820312, -0.22454833984375, -0.21277999877929688, -0.20101165771484375, -0.18924331665039062, -0.1774749755859375, -0.16570663452148438, -0.15393829345703125, -0.14216995239257812, -0.130401611328125, -0.11863327026367188, -0.10686492919921875, -0.09509658813476562, -0.0833282470703125, -0.07155990600585938, -0.05979156494140625, -0.048023223876953125, -0.0362548828125, -0.024486541748046875, -0.01271820068359375, -0.000949859619140625, 0.0108184814453125, 0.022586822509765625, 0.03435516357421875, 0.046123504638671875, 0.057891845703125, 0.06966018676757812, 0.08142852783203125, 0.09319686889648438, 0.1049652099609375, 0.11673355102539062, 0.12850189208984375, 0.14027023315429688, 0.15203857421875, 0.16380691528320312, 0.17557525634765625, 0.18734359741210938, 0.1991119384765625, 0.21088027954101562, 0.22264862060546875, 0.23441696166992188, 0.246185302734375, 0.2579536437988281, 0.26972198486328125, 0.2814903259277344, 0.2932586669921875, 0.3050270080566406, 0.31679534912109375, 0.3285636901855469, 0.34033203125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 9.0, 4.0, 4.0, 13.0, 15.0, 15.0, 32.0, 35.0, 45.0, 61.0, 82.0, 113.0, 161.0, 201.0, 275.0, 430.0, 620.0, 993.0, 1831.0, 3472.0, 8492.0, 37761.0, 3948758.0, 162274.0, 16834.0, 5474.0, 2436.0, 1334.0, 748.0, 480.0, 357.0, 229.0, 177.0, 133.0, 92.0, 69.0, 49.0, 43.0, 35.0, 24.0, 22.0, 13.0, 11.0, 10.0, 8.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.35546875, -2.276336669921875, -2.19720458984375, -2.118072509765625, -2.0389404296875, -1.959808349609375, -1.88067626953125, -1.801544189453125, -1.722412109375, -1.643280029296875, -1.56414794921875, -1.485015869140625, -1.4058837890625, -1.326751708984375, -1.24761962890625, -1.168487548828125, -1.08935546875, -1.010223388671875, -0.93109130859375, -0.851959228515625, -0.7728271484375, -0.693695068359375, -0.61456298828125, -0.535430908203125, -0.456298828125, -0.377166748046875, -0.29803466796875, -0.218902587890625, -0.1397705078125, -0.060638427734375, 0.01849365234375, 0.097625732421875, 0.1767578125, 0.255889892578125, 0.33502197265625, 0.414154052734375, 0.4932861328125, 0.572418212890625, 0.65155029296875, 0.730682373046875, 0.809814453125, 0.888946533203125, 0.96807861328125, 1.047210693359375, 1.1263427734375, 1.205474853515625, 1.28460693359375, 1.363739013671875, 1.44287109375, 1.522003173828125, 1.60113525390625, 1.680267333984375, 1.7593994140625, 1.838531494140625, 1.91766357421875, 1.996795654296875, 2.075927734375, 2.155059814453125, 2.23419189453125, 2.313323974609375, 2.3924560546875, 2.471588134765625, 2.55072021484375, 2.629852294921875, 2.708984375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 11.0, 4.0, 9.0, 23.0, 40.0, 120.0, 3074.0, 624.0, 91.0, 38.0, 11.0, 9.0, 6.0, 7.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4814453125, -0.457305908203125, -0.43316650390625, -0.409027099609375, -0.3848876953125, -0.360748291015625, -0.33660888671875, -0.312469482421875, -0.288330078125, -0.264190673828125, -0.24005126953125, -0.215911865234375, -0.1917724609375, -0.167633056640625, -0.14349365234375, -0.119354248046875, -0.09521484375, -0.071075439453125, -0.04693603515625, -0.022796630859375, 0.0013427734375, 0.025482177734375, 0.04962158203125, 0.073760986328125, 0.097900390625, 0.122039794921875, 0.14617919921875, 0.170318603515625, 0.1944580078125, 0.218597412109375, 0.24273681640625, 0.266876220703125, 0.291015625, 0.315155029296875, 0.33929443359375, 0.363433837890625, 0.3875732421875, 0.411712646484375, 0.43585205078125, 0.459991455078125, 0.484130859375, 0.508270263671875, 0.53240966796875, 0.556549072265625, 0.5806884765625, 0.604827880859375, 0.62896728515625, 0.653106689453125, 0.67724609375, 0.701385498046875, 0.72552490234375, 0.749664306640625, 0.7738037109375, 0.797943115234375, 0.82208251953125, 0.846221923828125, 0.870361328125, 0.894500732421875, 0.91864013671875, 0.942779541015625, 0.9669189453125, 0.991058349609375, 1.01519775390625, 1.039337158203125, 1.0634765625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 17.0, 17.0, 17.0, 21.0, 46.0, 62.0, 86.0, 114.0, 111.0, 120.0, 112.0, 72.0, 62.0, 34.0, 44.0, 25.0, 21.0, 10.0, 4.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.56131649017334, -2.488560914993286, -2.4158055782318115, -2.343050003051758, -2.270294427871704, -2.1975388526916504, -2.124783515930176, -2.052027940750122, -1.9792723655700684, -1.9065169095993042, -1.8337613344192505, -1.7610058784484863, -1.6882503032684326, -1.6154948472976685, -1.5427393913269043, -1.4699838161468506, -1.3972283601760864, -1.3244729042053223, -1.2517173290252686, -1.1789618730545044, -1.1062062978744507, -1.0334508419036865, -0.9606953263282776, -0.8879398107528687, -0.8151842951774597, -0.7424287796020508, -0.6696732640266418, -0.5969177484512329, -0.5241622924804688, -0.4514067471027374, -0.3786512613296509, -0.30589574575424194, -0.233140230178833, -0.16038471460342407, -0.08762921392917633, -0.014873713254928589, 0.05788180232048035, 0.13063731789588928, 0.20339280366897583, 0.27614831924438477, 0.3489038348197937, 0.42165935039520264, 0.4944148659706116, 0.5671703815460205, 0.6399258375167847, 0.7126814126968384, 0.7854368686676025, 0.8581923842430115, 0.9309478998184204, 1.0037033557891846, 1.0764589309692383, 1.1492143869400024, 1.2219699621200562, 1.2947254180908203, 1.367480993270874, 1.4402364492416382, 1.5129919052124023, 1.5857473611831665, 1.6585029363632202, 1.7312583923339844, 1.804013967514038, 1.8767694234848022, 1.9495248794555664, 2.02228045463562, 2.095036029815674]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 8.0, 9.0, 10.0, 12.0, 13.0, 18.0, 20.0, 18.0, 29.0, 33.0, 31.0, 36.0, 37.0, 40.0, 50.0, 51.0, 51.0, 48.0, 48.0, 56.0, 55.0, 40.0, 43.0, 36.0, 41.0, 27.0, 26.0, 22.0, 23.0, 21.0, 4.0, 9.0, 8.0, 11.0, 3.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1754859685897827, -1.1310497522354126, -1.0866135358810425, -1.042177438735962, -0.997741162776947, -0.9533050060272217, -0.9088687896728516, -0.8644325733184814, -0.8199963569641113, -0.7755601406097412, -0.7311239838600159, -0.6866877675056458, -0.6422515511512756, -0.5978153944015503, -0.5533791780471802, -0.5089429616928101, -0.4645068049430847, -0.420070618391037, -0.37563440203666687, -0.33119821548461914, -0.286761999130249, -0.2423258125782013, -0.19788962602615356, -0.15345340967178345, -0.10901722311973572, -0.0645810216665268, -0.020144827663898468, 0.02429136633872986, 0.06872756779193878, 0.1131637692451477, 0.15759995579719543, 0.20203617215156555, 0.24647235870361328, 0.290908545255661, 0.33534476161003113, 0.37978094816207886, 0.424217164516449, 0.4686533510684967, 0.5130895376205444, 0.5575257539749146, 0.6019619703292847, 0.6463981866836548, 0.6908343434333801, 0.7352705597877502, 0.7797067761421204, 0.8241429328918457, 0.8685791492462158, 0.9130153656005859, 0.9574515223503113, 1.0018876791000366, 1.0463238954544067, 1.0907601118087769, 1.135196328163147, 1.179632544517517, 1.2240686416625977, 1.2685048580169678, 1.312941074371338, 1.357377290725708, 1.4018135070800781, 1.4462497234344482, 1.4906858205795288, 1.535122036933899, 1.579558253288269, 1.6239944696426392, 1.6684306859970093]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 7.0, 6.0, 7.0, 8.0, 12.0, 11.0, 14.0, 33.0, 43.0, 47.0, 72.0, 120.0, 145.0, 229.0, 336.0, 524.0, 807.0, 1374.0, 2343.0, 4290.0, 7446.0, 13934.0, 26730.0, 51705.0, 100588.0, 181427.0, 243260.0, 189141.0, 106772.0, 55155.0, 28321.0, 14833.0, 7876.0, 4387.0, 2443.0, 1524.0, 905.0, 532.0, 354.0, 242.0, 189.0, 106.0, 77.0, 51.0, 41.0, 26.0, 16.0, 16.0, 6.0, 7.0, 6.0, 6.0, 6.0, 1.0, 4.0, 3.0], "bins": [-0.6494140625, -0.630615234375, -0.61181640625, -0.593017578125, -0.57421875, -0.555419921875, -0.53662109375, -0.517822265625, -0.4990234375, -0.480224609375, -0.46142578125, -0.442626953125, -0.423828125, -0.405029296875, -0.38623046875, -0.367431640625, -0.3486328125, -0.329833984375, -0.31103515625, -0.292236328125, -0.2734375, -0.254638671875, -0.23583984375, -0.217041015625, -0.1982421875, -0.179443359375, -0.16064453125, -0.141845703125, -0.123046875, -0.104248046875, -0.08544921875, -0.066650390625, -0.0478515625, -0.029052734375, -0.01025390625, 0.008544921875, 0.02734375, 0.046142578125, 0.06494140625, 0.083740234375, 0.1025390625, 0.121337890625, 0.14013671875, 0.158935546875, 0.177734375, 0.196533203125, 0.21533203125, 0.234130859375, 0.2529296875, 0.271728515625, 0.29052734375, 0.309326171875, 0.328125, 0.346923828125, 0.36572265625, 0.384521484375, 0.4033203125, 0.422119140625, 0.44091796875, 0.459716796875, 0.478515625, 0.497314453125, 0.51611328125, 0.534912109375, 0.5537109375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 5.0, 6.0, 4.0, 9.0, 10.0, 13.0, 9.0, 7.0, 18.0, 15.0, 22.0, 24.0, 25.0, 28.0, 43.0, 44.0, 36.0, 51.0, 60.0, 41.0, 45.0, 37.0, 44.0, 41.0, 33.0, 43.0, 38.0, 42.0, 37.0, 26.0, 21.0, 17.0, 21.0, 10.0, 13.0, 13.0, 7.0, 6.0, 7.0, 5.0, 2.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.38330078125, -0.37122344970703125, -0.3591461181640625, -0.34706878662109375, -0.334991455078125, -0.32291412353515625, -0.3108367919921875, -0.29875946044921875, -0.28668212890625, -0.27460479736328125, -0.2625274658203125, -0.25045013427734375, -0.238372802734375, -0.22629547119140625, -0.2142181396484375, -0.20214080810546875, -0.1900634765625, -0.17798614501953125, -0.1659088134765625, -0.15383148193359375, -0.141754150390625, -0.12967681884765625, -0.1175994873046875, -0.10552215576171875, -0.09344482421875, -0.08136749267578125, -0.0692901611328125, -0.05721282958984375, -0.045135498046875, -0.03305816650390625, -0.0209808349609375, -0.00890350341796875, 0.003173828125, 0.01525115966796875, 0.0273284912109375, 0.03940582275390625, 0.051483154296875, 0.06356048583984375, 0.0756378173828125, 0.08771514892578125, 0.09979248046875, 0.11186981201171875, 0.1239471435546875, 0.13602447509765625, 0.148101806640625, 0.16017913818359375, 0.1722564697265625, 0.18433380126953125, 0.1964111328125, 0.20848846435546875, 0.2205657958984375, 0.23264312744140625, 0.244720458984375, 0.25679779052734375, 0.2688751220703125, 0.28095245361328125, 0.29302978515625, 0.30510711669921875, 0.3171844482421875, 0.32926177978515625, 0.341339111328125, 0.35341644287109375, 0.3654937744140625, 0.37757110595703125, 0.3896484375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 0.0, 4.0, 4.0, 8.0, 3.0, 8.0, 9.0, 13.0, 19.0, 33.0, 43.0, 73.0, 92.0, 147.0, 193.0, 323.0, 449.0, 731.0, 1414.0, 3508.0, 17547.0, 212433.0, 726620.0, 71400.0, 8342.0, 2287.0, 1069.0, 590.0, 364.0, 255.0, 157.0, 123.0, 81.0, 75.0, 36.0, 28.0, 26.0, 13.0, 11.0, 7.0, 2.0, 9.0, 4.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.693359375, -1.626434326171875, -1.55950927734375, -1.492584228515625, -1.4256591796875, -1.358734130859375, -1.29180908203125, -1.224884033203125, -1.157958984375, -1.091033935546875, -1.02410888671875, -0.957183837890625, -0.8902587890625, -0.823333740234375, -0.75640869140625, -0.689483642578125, -0.62255859375, -0.555633544921875, -0.48870849609375, -0.421783447265625, -0.3548583984375, -0.287933349609375, -0.22100830078125, -0.154083251953125, -0.087158203125, -0.020233154296875, 0.04669189453125, 0.113616943359375, 0.1805419921875, 0.247467041015625, 0.31439208984375, 0.381317138671875, 0.4482421875, 0.515167236328125, 0.58209228515625, 0.649017333984375, 0.7159423828125, 0.782867431640625, 0.84979248046875, 0.916717529296875, 0.983642578125, 1.050567626953125, 1.11749267578125, 1.184417724609375, 1.2513427734375, 1.318267822265625, 1.38519287109375, 1.452117919921875, 1.51904296875, 1.585968017578125, 1.65289306640625, 1.719818115234375, 1.7867431640625, 1.853668212890625, 1.92059326171875, 1.987518310546875, 2.054443359375, 2.121368408203125, 2.18829345703125, 2.255218505859375, 2.3221435546875, 2.389068603515625, 2.45599365234375, 2.522918701171875, 2.58984375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 7.0, 10.0, 8.0, 13.0, 18.0, 22.0, 24.0, 24.0, 35.0, 42.0, 44.0, 59.0, 47.0, 51.0, 60.0, 63.0, 48.0, 46.0, 53.0, 40.0, 47.0, 55.0, 31.0, 28.0, 31.0, 12.0, 18.0, 13.0, 10.0, 9.0, 6.0, 7.0, 2.0, 7.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.703125, -2.62457275390625, -2.5460205078125, -2.46746826171875, -2.388916015625, -2.31036376953125, -2.2318115234375, -2.15325927734375, -2.07470703125, -1.99615478515625, -1.9176025390625, -1.83905029296875, -1.760498046875, -1.68194580078125, -1.6033935546875, -1.52484130859375, -1.4462890625, -1.36773681640625, -1.2891845703125, -1.21063232421875, -1.132080078125, -1.05352783203125, -0.9749755859375, -0.89642333984375, -0.81787109375, -0.73931884765625, -0.6607666015625, -0.58221435546875, -0.503662109375, -0.42510986328125, -0.3465576171875, -0.26800537109375, -0.189453125, -0.11090087890625, -0.0323486328125, 0.04620361328125, 0.124755859375, 0.20330810546875, 0.2818603515625, 0.36041259765625, 0.43896484375, 0.51751708984375, 0.5960693359375, 0.67462158203125, 0.753173828125, 0.83172607421875, 0.9102783203125, 0.98883056640625, 1.0673828125, 1.14593505859375, 1.2244873046875, 1.30303955078125, 1.381591796875, 1.46014404296875, 1.5386962890625, 1.61724853515625, 1.69580078125, 1.77435302734375, 1.8529052734375, 1.93145751953125, 2.010009765625, 2.08856201171875, 2.1671142578125, 2.24566650390625, 2.32421875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 10.0, 15.0, 13.0, 26.0, 59.0, 131.0, 228.0, 557.0, 1919.0, 14793.0, 755534.0, 265650.0, 7433.0, 1328.0, 430.0, 193.0, 112.0, 56.0, 18.0, 16.0, 12.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.638671875, -2.577117919921875, -2.51556396484375, -2.454010009765625, -2.3924560546875, -2.330902099609375, -2.26934814453125, -2.207794189453125, -2.146240234375, -2.084686279296875, -2.02313232421875, -1.961578369140625, -1.9000244140625, -1.838470458984375, -1.77691650390625, -1.715362548828125, -1.65380859375, -1.592254638671875, -1.53070068359375, -1.469146728515625, -1.4075927734375, -1.346038818359375, -1.28448486328125, -1.222930908203125, -1.161376953125, -1.099822998046875, -1.03826904296875, -0.976715087890625, -0.9151611328125, -0.853607177734375, -0.79205322265625, -0.730499267578125, -0.6689453125, -0.607391357421875, -0.54583740234375, -0.484283447265625, -0.4227294921875, -0.361175537109375, -0.29962158203125, -0.238067626953125, -0.176513671875, -0.114959716796875, -0.05340576171875, 0.008148193359375, 0.0697021484375, 0.131256103515625, 0.19281005859375, 0.254364013671875, 0.31591796875, 0.377471923828125, 0.43902587890625, 0.500579833984375, 0.5621337890625, 0.623687744140625, 0.68524169921875, 0.746795654296875, 0.808349609375, 0.869903564453125, 0.93145751953125, 0.993011474609375, 1.0545654296875, 1.116119384765625, 1.17767333984375, 1.239227294921875, 1.30078125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 6.0, 5.0, 15.0, 20.0, 31.0, 32.0, 55.0, 74.0, 85.0, 140.0, 131.0, 116.0, 92.0, 63.0, 36.0, 33.0, 18.0, 14.0, 8.0, 11.0, 8.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001087188720703125, -0.00010341592133045197, -9.811297059059143e-05, -9.28100198507309e-05, -8.750706911087036e-05, -8.220411837100983e-05, -7.690116763114929e-05, -7.159821689128876e-05, -6.629526615142822e-05, -6.099231541156769e-05, -5.568936467170715e-05, -5.038641393184662e-05, -4.5083463191986084e-05, -3.978051245212555e-05, -3.4477561712265015e-05, -2.917461097240448e-05, -2.3871660232543945e-05, -1.856870949268341e-05, -1.3265758752822876e-05, -7.962808012962341e-06, -2.6598572731018066e-06, 2.643093466758728e-06, 7.946044206619263e-06, 1.3248994946479797e-05, 1.8551945686340332e-05, 2.3854896426200867e-05, 2.91578471660614e-05, 3.4460797905921936e-05, 3.976374864578247e-05, 4.5066699385643005e-05, 5.036965012550354e-05, 5.5672600865364075e-05, 6.097555160522461e-05, 6.627850234508514e-05, 7.158145308494568e-05, 7.688440382480621e-05, 8.218735456466675e-05, 8.749030530452728e-05, 9.279325604438782e-05, 9.809620678424835e-05, 0.00010339915752410889, 0.00010870210826396942, 0.00011400505900382996, 0.00011930800974369049, 0.00012461096048355103, 0.00012991391122341156, 0.0001352168619632721, 0.00014051981270313263, 0.00014582276344299316, 0.0001511257141828537, 0.00015642866492271423, 0.00016173161566257477, 0.0001670345664024353, 0.00017233751714229584, 0.00017764046788215637, 0.0001829434186220169, 0.00018824636936187744, 0.00019354932010173798, 0.0001988522708415985, 0.00020415522158145905, 0.00020945817232131958, 0.00021476112306118011, 0.00022006407380104065, 0.00022536702454090118, 0.00023066997528076172]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 6.0, 10.0, 20.0, 42.0, 87.0, 222.0, 660.0, 3054.0, 93590.0, 935333.0, 13524.0, 1357.0, 382.0, 145.0, 58.0, 27.0, 16.0, 8.0, 6.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.431640625, -3.346435546875, -3.26123046875, -3.176025390625, -3.0908203125, -3.005615234375, -2.92041015625, -2.835205078125, -2.75, -2.664794921875, -2.57958984375, -2.494384765625, -2.4091796875, -2.323974609375, -2.23876953125, -2.153564453125, -2.068359375, -1.983154296875, -1.89794921875, -1.812744140625, -1.7275390625, -1.642333984375, -1.55712890625, -1.471923828125, -1.38671875, -1.301513671875, -1.21630859375, -1.131103515625, -1.0458984375, -0.960693359375, -0.87548828125, -0.790283203125, -0.705078125, -0.619873046875, -0.53466796875, -0.449462890625, -0.3642578125, -0.279052734375, -0.19384765625, -0.108642578125, -0.0234375, 0.061767578125, 0.14697265625, 0.232177734375, 0.3173828125, 0.402587890625, 0.48779296875, 0.572998046875, 0.658203125, 0.743408203125, 0.82861328125, 0.913818359375, 0.9990234375, 1.084228515625, 1.16943359375, 1.254638671875, 1.33984375, 1.425048828125, 1.51025390625, 1.595458984375, 1.6806640625, 1.765869140625, 1.85107421875, 1.936279296875, 2.021484375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 13.0, 24.0, 29.0, 73.0, 124.0, 184.0, 178.0, 159.0, 104.0, 60.0, 28.0, 17.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.908203125, -0.84503173828125, -0.7818603515625, -0.71868896484375, -0.655517578125, -0.59234619140625, -0.5291748046875, -0.46600341796875, -0.40283203125, -0.33966064453125, -0.2764892578125, -0.21331787109375, -0.150146484375, -0.08697509765625, -0.0238037109375, 0.03936767578125, 0.1025390625, 0.16571044921875, 0.2288818359375, 0.29205322265625, 0.355224609375, 0.41839599609375, 0.4815673828125, 0.54473876953125, 0.60791015625, 0.67108154296875, 0.7342529296875, 0.79742431640625, 0.860595703125, 0.92376708984375, 0.9869384765625, 1.05010986328125, 1.11328125, 1.17645263671875, 1.2396240234375, 1.30279541015625, 1.365966796875, 1.42913818359375, 1.4923095703125, 1.55548095703125, 1.61865234375, 1.68182373046875, 1.7449951171875, 1.80816650390625, 1.871337890625, 1.93450927734375, 1.9976806640625, 2.06085205078125, 2.1240234375, 2.18719482421875, 2.2503662109375, 2.31353759765625, 2.376708984375, 2.43988037109375, 2.5030517578125, 2.56622314453125, 2.62939453125, 2.69256591796875, 2.7557373046875, 2.81890869140625, 2.882080078125, 2.94525146484375, 3.0084228515625, 3.07159423828125, 3.134765625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 8.0, 38.0, 244.0, 488.0, 190.0, 32.0, 10.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.351675033569336, -24.841657638549805, -23.331642150878906, -21.821624755859375, -20.311607360839844, -18.801589965820312, -17.291574478149414, -15.781557083129883, -14.271540641784668, -12.761524200439453, -11.251506805419922, -9.741490364074707, -8.231473922729492, -6.721456527709961, -5.211440086364746, -3.701422691345215, -2.19140625, -0.6813894510269165, 0.828627347946167, 2.338644027709961, 3.848660945892334, 5.358677864074707, 6.868694305419922, 8.378711700439453, 9.888728141784668, 11.398744583129883, 12.908761978149414, 14.418778419494629, 15.928794860839844, 17.438812255859375, 18.948829650878906, 20.458847045898438, 21.968860626220703, 23.478878021240234, 24.988893508911133, 26.498910903930664, 28.008928298950195, 29.518943786621094, 31.028961181640625, 32.538978576660156, 34.04899597167969, 35.55901336669922, 37.06903076171875, 38.57904815673828, 40.08906173706055, 41.59907913208008, 43.10909652709961, 44.61911392211914, 46.129127502441406, 47.63914489746094, 49.14916229248047, 50.6591796875, 52.169193267822266, 53.6792106628418, 55.18922805786133, 56.69924545288086, 58.20926284790039, 59.71928024291992, 61.22929763793945, 62.73931121826172, 64.24932861328125, 65.75934600830078, 67.26936340332031, 68.77938079833984, 70.28939819335938]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 5.0, 7.0, 8.0, 12.0, 8.0, 10.0, 20.0, 18.0, 25.0, 19.0, 31.0, 25.0, 30.0, 37.0, 45.0, 40.0, 51.0, 51.0, 39.0, 46.0, 47.0, 34.0, 45.0, 48.0, 40.0, 39.0, 33.0, 24.0, 21.0, 22.0, 16.0, 20.0, 13.0, 13.0, 13.0, 4.0, 6.0, 6.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0], "bins": [-10.644567489624023, -10.355752944946289, -10.066938400268555, -9.77812385559082, -9.489309310913086, -9.200495719909668, -8.911681175231934, -8.6228666305542, -8.334052085876465, -8.04523754119873, -7.756422996520996, -7.46760892868042, -7.1787943840026855, -6.889979839324951, -6.601165771484375, -6.312351226806641, -6.023536682128906, -5.734722137451172, -5.4459075927734375, -5.157093524932861, -4.868278980255127, -4.579464435577393, -4.290650367736816, -4.001835823059082, -3.7130212783813477, -3.4242067337036133, -3.135392427444458, -2.8465781211853027, -2.5577635765075684, -2.268949031829834, -1.9801347255706787, -1.6913204193115234, -1.402505874633789, -1.1136914491653442, -0.8248770236968994, -0.5360625982284546, -0.24724817276000977, 0.04156625270843506, 0.3303806781768799, 0.6191949844360352, 0.9080095291137695, 1.1968239545822144, 1.4856383800506592, 1.774452805519104, 2.063267230987549, 2.352081775665283, 2.6408960819244385, 2.9297103881835938, 3.218524932861328, 3.5073394775390625, 3.7961537837982178, 4.084968090057373, 4.373782634735107, 4.662597179412842, 4.951411247253418, 5.240225791931152, 5.529040336608887, 5.817854881286621, 6.1066694259643555, 6.395483493804932, 6.684298038482666, 6.9731125831604, 7.261926651000977, 7.550741195678711, 7.839555740356445]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 9.0, 14.0, 20.0, 17.0, 23.0, 31.0, 37.0, 48.0, 64.0, 92.0, 169.0, 292.0, 555.0, 1237.0, 4228.0, 52722.0, 4121125.0, 9781.0, 1983.0, 794.0, 358.0, 217.0, 121.0, 88.0, 57.0, 44.0, 39.0, 25.0, 21.0, 10.0, 17.0, 8.0, 10.0, 7.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.06640625, -3.94403076171875, -3.8216552734375, -3.69927978515625, -3.576904296875, -3.45452880859375, -3.3321533203125, -3.20977783203125, -3.08740234375, -2.96502685546875, -2.8426513671875, -2.72027587890625, -2.597900390625, -2.47552490234375, -2.3531494140625, -2.23077392578125, -2.1083984375, -1.98602294921875, -1.8636474609375, -1.74127197265625, -1.618896484375, -1.49652099609375, -1.3741455078125, -1.25177001953125, -1.12939453125, -1.00701904296875, -0.8846435546875, -0.76226806640625, -0.639892578125, -0.51751708984375, -0.3951416015625, -0.27276611328125, -0.150390625, -0.02801513671875, 0.0943603515625, 0.21673583984375, 0.339111328125, 0.46148681640625, 0.5838623046875, 0.70623779296875, 0.82861328125, 0.95098876953125, 1.0733642578125, 1.19573974609375, 1.318115234375, 1.44049072265625, 1.5628662109375, 1.68524169921875, 1.8076171875, 1.92999267578125, 2.0523681640625, 2.17474365234375, 2.297119140625, 2.41949462890625, 2.5418701171875, 2.66424560546875, 2.78662109375, 2.90899658203125, 3.0313720703125, 3.15374755859375, 3.276123046875, 3.39849853515625, 3.5208740234375, 3.64324951171875, 3.765625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 10.0, 9.0, 8.0, 20.0, 14.0, 21.0, 26.0, 27.0, 36.0, 42.0, 47.0, 54.0, 45.0, 50.0, 53.0, 62.0, 65.0, 55.0, 46.0, 41.0, 47.0, 48.0, 33.0, 32.0, 22.0, 18.0, 16.0, 12.0, 6.0, 8.0, 3.0, 0.0, 6.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.453857421875, -0.4383201599121094, -0.42278289794921875, -0.4072456359863281, -0.3917083740234375, -0.3761711120605469, -0.36063385009765625, -0.3450965881347656, -0.329559326171875, -0.3140220642089844, -0.29848480224609375, -0.2829475402832031, -0.2674102783203125, -0.2518730163574219, -0.23633575439453125, -0.22079849243164062, -0.20526123046875, -0.18972396850585938, -0.17418670654296875, -0.15864944458007812, -0.1431121826171875, -0.12757492065429688, -0.11203765869140625, -0.09650039672851562, -0.080963134765625, -0.06542587280273438, -0.04988861083984375, -0.034351348876953125, -0.0188140869140625, -0.003276824951171875, 0.01226043701171875, 0.027797698974609375, 0.0433349609375, 0.058872222900390625, 0.07440948486328125, 0.08994674682617188, 0.1054840087890625, 0.12102127075195312, 0.13655853271484375, 0.15209579467773438, 0.167633056640625, 0.18317031860351562, 0.19870758056640625, 0.21424484252929688, 0.2297821044921875, 0.24531936645507812, 0.26085662841796875, 0.2763938903808594, 0.29193115234375, 0.3074684143066406, 0.32300567626953125, 0.3385429382324219, 0.3540802001953125, 0.3696174621582031, 0.38515472412109375, 0.4006919860839844, 0.416229248046875, 0.4317665100097656, 0.44730377197265625, 0.4628410339355469, 0.4783782958984375, 0.4939155578613281, 0.5094528198242188, 0.5249900817871094, 0.54052734375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 7.0, 2.0, 7.0, 12.0, 10.0, 23.0, 12.0, 24.0, 31.0, 61.0, 93.0, 131.0, 162.0, 291.0, 469.0, 778.0, 1440.0, 2786.0, 5812.0, 19814.0, 3693672.0, 439048.0, 18173.0, 5600.0, 2577.0, 1320.0, 680.0, 441.0, 263.0, 177.0, 104.0, 71.0, 61.0, 42.0, 22.0, 24.0, 20.0, 10.0, 4.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8857421875, -1.82855224609375, -1.7713623046875, -1.71417236328125, -1.656982421875, -1.59979248046875, -1.5426025390625, -1.48541259765625, -1.42822265625, -1.37103271484375, -1.3138427734375, -1.25665283203125, -1.199462890625, -1.14227294921875, -1.0850830078125, -1.02789306640625, -0.970703125, -0.91351318359375, -0.8563232421875, -0.79913330078125, -0.741943359375, -0.68475341796875, -0.6275634765625, -0.57037353515625, -0.51318359375, -0.45599365234375, -0.3988037109375, -0.34161376953125, -0.284423828125, -0.22723388671875, -0.1700439453125, -0.11285400390625, -0.0556640625, 0.00152587890625, 0.0587158203125, 0.11590576171875, 0.173095703125, 0.23028564453125, 0.2874755859375, 0.34466552734375, 0.40185546875, 0.45904541015625, 0.5162353515625, 0.57342529296875, 0.630615234375, 0.68780517578125, 0.7449951171875, 0.80218505859375, 0.859375, 0.91656494140625, 0.9737548828125, 1.03094482421875, 1.088134765625, 1.14532470703125, 1.2025146484375, 1.25970458984375, 1.31689453125, 1.37408447265625, 1.4312744140625, 1.48846435546875, 1.545654296875, 1.60284423828125, 1.6600341796875, 1.71722412109375, 1.7744140625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 2.0, 5.0, 3.0, 5.0, 6.0, 19.0, 32.0, 57.0, 311.0, 3458.0, 97.0, 40.0, 13.0, 12.0, 3.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6845703125, -0.6690673828125, -0.653564453125, -0.6380615234375, -0.62255859375, -0.6070556640625, -0.591552734375, -0.5760498046875, -0.560546875, -0.5450439453125, -0.529541015625, -0.5140380859375, -0.49853515625, -0.4830322265625, -0.467529296875, -0.4520263671875, -0.4365234375, -0.4210205078125, -0.405517578125, -0.3900146484375, -0.37451171875, -0.3590087890625, -0.343505859375, -0.3280029296875, -0.3125, -0.2969970703125, -0.281494140625, -0.2659912109375, -0.25048828125, -0.2349853515625, -0.219482421875, -0.2039794921875, -0.1884765625, -0.1729736328125, -0.157470703125, -0.1419677734375, -0.12646484375, -0.1109619140625, -0.095458984375, -0.0799560546875, -0.064453125, -0.0489501953125, -0.033447265625, -0.0179443359375, -0.00244140625, 0.0130615234375, 0.028564453125, 0.0440673828125, 0.0595703125, 0.0750732421875, 0.090576171875, 0.1060791015625, 0.12158203125, 0.1370849609375, 0.152587890625, 0.1680908203125, 0.18359375, 0.1990966796875, 0.214599609375, 0.2301025390625, 0.24560546875, 0.2611083984375, 0.276611328125, 0.2921142578125, 0.3076171875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 10.0, 6.0, 9.0, 16.0, 31.0, 43.0, 66.0, 112.0, 121.0, 151.0, 146.0, 116.0, 81.0, 37.0, 19.0, 12.0, 9.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7086793184280396, -1.6549272537231445, -1.6011751890182495, -1.5474231243133545, -1.493671178817749, -1.439919114112854, -1.386167049407959, -1.332414984703064, -1.278662919998169, -1.224910855293274, -1.171158790588379, -1.1174068450927734, -1.0636547803878784, -1.0099027156829834, -0.9561506509780884, -0.9023985862731934, -0.8486466407775879, -0.7948945760726929, -0.7411425709724426, -0.6873905062675476, -0.6336385011672974, -0.5798864364624023, -0.5261343717575073, -0.4723823368549347, -0.41863030195236206, -0.36487826704978943, -0.3111262321472168, -0.2573741674423218, -0.20362213253974915, -0.1498700976371765, -0.0961180329322815, -0.04236599802970886, 0.011385917663574219, 0.06513796001672745, 0.11889000236988068, 0.1726420521736145, 0.22639408707618713, 0.28014612197875977, 0.3338981866836548, 0.3876502215862274, 0.44140225648880005, 0.4951542913913727, 0.5489063262939453, 0.6026583909988403, 0.6564104557037354, 0.7101624608039856, 0.7639145255088806, 0.8176665306091309, 0.8714185953140259, 0.9251706600189209, 0.9789226651191711, 1.032674789428711, 1.0864267349243164, 1.1401787996292114, 1.1939308643341064, 1.2476829290390015, 1.3014349937438965, 1.3551870584487915, 1.4089391231536865, 1.462691068649292, 1.516443133354187, 1.570195198059082, 1.623947262763977, 1.677699327468872, 1.7314512729644775]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 5.0, 6.0, 7.0, 10.0, 8.0, 11.0, 21.0, 28.0, 19.0, 19.0, 29.0, 20.0, 18.0, 37.0, 29.0, 40.0, 38.0, 38.0, 36.0, 27.0, 39.0, 35.0, 49.0, 41.0, 33.0, 40.0, 29.0, 35.0, 33.0, 20.0, 27.0, 26.0, 29.0, 17.0, 20.0, 15.0, 11.0, 15.0, 6.0, 12.0, 6.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8688673973083496, -0.8430164456367493, -0.8171655535697937, -0.7913146018981934, -0.765463650226593, -0.7396126985549927, -0.7137618064880371, -0.6879108548164368, -0.6620599031448364, -0.6362089514732361, -0.6103580594062805, -0.5845071077346802, -0.5586561560630798, -0.5328052043914795, -0.5069543123245239, -0.4811033606529236, -0.45525243878364563, -0.4294015169143677, -0.40355056524276733, -0.3776996433734894, -0.35184869170188904, -0.3259977698326111, -0.30014681816101074, -0.2742958962917328, -0.24844495952129364, -0.2225940227508545, -0.19674308598041534, -0.1708921492099762, -0.14504122734069824, -0.1191902905702591, -0.09333935379981995, -0.0674884170293808, -0.04163748025894165, -0.01578654535114765, 0.010064389556646347, 0.0359153226017952, 0.061766259372234344, 0.0876171886920929, 0.11346812546253204, 0.1393190622329712, 0.16516999900341034, 0.1910209357738495, 0.21687187254428864, 0.24272280931472778, 0.26857373118400574, 0.2944246530532837, 0.32027560472488403, 0.3461265563964844, 0.37197747826576233, 0.3978284001350403, 0.4236793518066406, 0.4495302736759186, 0.4753812253475189, 0.5012321472167969, 0.5270830988883972, 0.5529340505599976, 0.5787849426269531, 0.6046358942985535, 0.630486786365509, 0.6563377380371094, 0.6821886897087097, 0.7080396413803101, 0.7338905334472656, 0.759741485118866, 0.7855924367904663]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 5.0, 3.0, 16.0, 11.0, 20.0, 35.0, 44.0, 56.0, 99.0, 123.0, 248.0, 377.0, 717.0, 1202.0, 2236.0, 4316.0, 8675.0, 17259.0, 35602.0, 73660.0, 148180.0, 257076.0, 240107.0, 131238.0, 64933.0, 31091.0, 15064.0, 7556.0, 3859.0, 2015.0, 1101.0, 598.0, 368.0, 239.0, 111.0, 82.0, 70.0, 45.0, 36.0, 18.0, 23.0, 8.0, 6.0, 7.0, 3.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.58154296875, -0.5627288818359375, -0.543914794921875, -0.5251007080078125, -0.50628662109375, -0.4874725341796875, -0.468658447265625, -0.4498443603515625, -0.4310302734375, -0.4122161865234375, -0.393402099609375, -0.3745880126953125, -0.35577392578125, -0.3369598388671875, -0.318145751953125, -0.2993316650390625, -0.280517578125, -0.2617034912109375, -0.242889404296875, -0.2240753173828125, -0.20526123046875, -0.1864471435546875, -0.167633056640625, -0.1488189697265625, -0.1300048828125, -0.1111907958984375, -0.092376708984375, -0.0735626220703125, -0.05474853515625, -0.0359344482421875, -0.017120361328125, 0.0016937255859375, 0.0205078125, 0.0393218994140625, 0.058135986328125, 0.0769500732421875, 0.09576416015625, 0.1145782470703125, 0.133392333984375, 0.1522064208984375, 0.1710205078125, 0.1898345947265625, 0.208648681640625, 0.2274627685546875, 0.24627685546875, 0.2650909423828125, 0.283905029296875, 0.3027191162109375, 0.321533203125, 0.3403472900390625, 0.359161376953125, 0.3779754638671875, 0.39678955078125, 0.4156036376953125, 0.434417724609375, 0.4532318115234375, 0.4720458984375, 0.4908599853515625, 0.509674072265625, 0.5284881591796875, 0.54730224609375, 0.5661163330078125, 0.584930419921875, 0.6037445068359375, 0.62255859375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 8.0, 3.0, 4.0, 5.0, 13.0, 10.0, 16.0, 12.0, 26.0, 26.0, 30.0, 39.0, 35.0, 56.0, 53.0, 39.0, 57.0, 64.0, 59.0, 57.0, 43.0, 47.0, 41.0, 62.0, 33.0, 36.0, 23.0, 21.0, 20.0, 13.0, 7.0, 11.0, 7.0, 6.0, 3.0, 4.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.505859375, -0.49002838134765625, -0.4741973876953125, -0.45836639404296875, -0.442535400390625, -0.42670440673828125, -0.4108734130859375, -0.39504241943359375, -0.37921142578125, -0.36338043212890625, -0.3475494384765625, -0.33171844482421875, -0.315887451171875, -0.30005645751953125, -0.2842254638671875, -0.26839447021484375, -0.2525634765625, -0.23673248291015625, -0.2209014892578125, -0.20507049560546875, -0.189239501953125, -0.17340850830078125, -0.1575775146484375, -0.14174652099609375, -0.12591552734375, -0.11008453369140625, -0.0942535400390625, -0.07842254638671875, -0.062591552734375, -0.04676055908203125, -0.0309295654296875, -0.01509857177734375, 0.000732421875, 0.01656341552734375, 0.0323944091796875, 0.04822540283203125, 0.064056396484375, 0.07988739013671875, 0.0957183837890625, 0.11154937744140625, 0.12738037109375, 0.14321136474609375, 0.1590423583984375, 0.17487335205078125, 0.190704345703125, 0.20653533935546875, 0.2223663330078125, 0.23819732666015625, 0.2540283203125, 0.26985931396484375, 0.2856903076171875, 0.30152130126953125, 0.317352294921875, 0.33318328857421875, 0.3490142822265625, 0.36484527587890625, 0.38067626953125, 0.39650726318359375, 0.4123382568359375, 0.42816925048828125, 0.444000244140625, 0.45983123779296875, 0.4756622314453125, 0.49149322509765625, 0.50732421875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 7.0, 2.0, 8.0, 12.0, 15.0, 21.0, 24.0, 36.0, 91.0, 127.0, 197.0, 303.0, 451.0, 812.0, 1683.0, 5106.0, 51014.0, 833736.0, 141304.0, 8964.0, 2171.0, 1009.0, 567.0, 326.0, 220.0, 135.0, 74.0, 45.0, 46.0, 18.0, 14.0, 20.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8232421875, -1.7548370361328125, -1.686431884765625, -1.6180267333984375, -1.54962158203125, -1.4812164306640625, -1.412811279296875, -1.3444061279296875, -1.2760009765625, -1.2075958251953125, -1.139190673828125, -1.0707855224609375, -1.00238037109375, -0.9339752197265625, -0.865570068359375, -0.7971649169921875, -0.728759765625, -0.6603546142578125, -0.591949462890625, -0.5235443115234375, -0.45513916015625, -0.3867340087890625, -0.318328857421875, -0.2499237060546875, -0.1815185546875, -0.1131134033203125, -0.044708251953125, 0.0236968994140625, 0.09210205078125, 0.1605072021484375, 0.228912353515625, 0.2973175048828125, 0.36572265625, 0.4341278076171875, 0.502532958984375, 0.5709381103515625, 0.63934326171875, 0.7077484130859375, 0.776153564453125, 0.8445587158203125, 0.9129638671875, 0.9813690185546875, 1.049774169921875, 1.1181793212890625, 1.18658447265625, 1.2549896240234375, 1.323394775390625, 1.3917999267578125, 1.460205078125, 1.5286102294921875, 1.597015380859375, 1.6654205322265625, 1.73382568359375, 1.8022308349609375, 1.870635986328125, 1.9390411376953125, 2.0074462890625, 2.0758514404296875, 2.144256591796875, 2.2126617431640625, 2.28106689453125, 2.3494720458984375, 2.417877197265625, 2.4862823486328125, 2.5546875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 6.0, 5.0, 5.0, 8.0, 7.0, 16.0, 14.0, 21.0, 16.0, 21.0, 32.0, 37.0, 33.0, 30.0, 41.0, 37.0, 50.0, 55.0, 39.0, 48.0, 52.0, 46.0, 45.0, 50.0, 51.0, 40.0, 35.0, 28.0, 22.0, 16.0, 19.0, 17.0, 14.0, 9.0, 8.0, 7.0, 8.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 4.0, 2.0], "bins": [-2.423828125, -2.3602294921875, -2.296630859375, -2.2330322265625, -2.16943359375, -2.1058349609375, -2.042236328125, -1.9786376953125, -1.9150390625, -1.8514404296875, -1.787841796875, -1.7242431640625, -1.66064453125, -1.5970458984375, -1.533447265625, -1.4698486328125, -1.40625, -1.3426513671875, -1.279052734375, -1.2154541015625, -1.15185546875, -1.0882568359375, -1.024658203125, -0.9610595703125, -0.8974609375, -0.8338623046875, -0.770263671875, -0.7066650390625, -0.64306640625, -0.5794677734375, -0.515869140625, -0.4522705078125, -0.388671875, -0.3250732421875, -0.261474609375, -0.1978759765625, -0.13427734375, -0.0706787109375, -0.007080078125, 0.0565185546875, 0.1201171875, 0.1837158203125, 0.247314453125, 0.3109130859375, 0.37451171875, 0.4381103515625, 0.501708984375, 0.5653076171875, 0.62890625, 0.6925048828125, 0.756103515625, 0.8197021484375, 0.88330078125, 0.9468994140625, 1.010498046875, 1.0740966796875, 1.1376953125, 1.2012939453125, 1.264892578125, 1.3284912109375, 1.39208984375, 1.4556884765625, 1.519287109375, 1.5828857421875, 1.646484375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 2.0, 2.0, 7.0, 3.0, 8.0, 15.0, 20.0, 35.0, 49.0, 101.0, 162.0, 292.0, 595.0, 1534.0, 4786.0, 37469.0, 868196.0, 122702.0, 8729.0, 2160.0, 849.0, 381.0, 192.0, 86.0, 63.0, 45.0, 25.0, 9.0, 14.0, 6.0, 5.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.607421875, -1.56475830078125, -1.5220947265625, -1.47943115234375, -1.436767578125, -1.39410400390625, -1.3514404296875, -1.30877685546875, -1.26611328125, -1.22344970703125, -1.1807861328125, -1.13812255859375, -1.095458984375, -1.05279541015625, -1.0101318359375, -0.96746826171875, -0.9248046875, -0.88214111328125, -0.8394775390625, -0.79681396484375, -0.754150390625, -0.71148681640625, -0.6688232421875, -0.62615966796875, -0.58349609375, -0.54083251953125, -0.4981689453125, -0.45550537109375, -0.412841796875, -0.37017822265625, -0.3275146484375, -0.28485107421875, -0.2421875, -0.19952392578125, -0.1568603515625, -0.11419677734375, -0.071533203125, -0.02886962890625, 0.0137939453125, 0.05645751953125, 0.09912109375, 0.14178466796875, 0.1844482421875, 0.22711181640625, 0.269775390625, 0.31243896484375, 0.3551025390625, 0.39776611328125, 0.4404296875, 0.48309326171875, 0.5257568359375, 0.56842041015625, 0.611083984375, 0.65374755859375, 0.6964111328125, 0.73907470703125, 0.78173828125, 0.82440185546875, 0.8670654296875, 0.90972900390625, 0.952392578125, 0.99505615234375, 1.0377197265625, 1.08038330078125, 1.123046875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 11.0, 3.0, 5.0, 6.0, 4.0, 7.0, 13.0, 12.0, 11.0, 25.0, 20.0, 22.0, 29.0, 35.0, 44.0, 62.0, 71.0, 83.0, 84.0, 84.0, 68.0, 58.0, 59.0, 32.0, 27.0, 21.0, 14.0, 25.0, 19.0, 8.0, 6.0, 5.0, 5.0, 10.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0], "bins": [-9.942054748535156e-05, -9.684357792139053e-05, -9.42666083574295e-05, -9.168963879346848e-05, -8.911266922950745e-05, -8.653569966554642e-05, -8.395873010158539e-05, -8.138176053762436e-05, -7.880479097366333e-05, -7.62278214097023e-05, -7.365085184574127e-05, -7.107388228178024e-05, -6.849691271781921e-05, -6.591994315385818e-05, -6.334297358989716e-05, -6.076600402593613e-05, -5.81890344619751e-05, -5.561206489801407e-05, -5.303509533405304e-05, -5.045812577009201e-05, -4.788115620613098e-05, -4.530418664216995e-05, -4.272721707820892e-05, -4.0150247514247894e-05, -3.7573277950286865e-05, -3.4996308386325836e-05, -3.241933882236481e-05, -2.9842369258403778e-05, -2.726539969444275e-05, -2.468843013048172e-05, -2.211146056652069e-05, -1.9534491002559662e-05, -1.6957521438598633e-05, -1.4380551874637604e-05, -1.1803582310676575e-05, -9.226612746715546e-06, -6.649643182754517e-06, -4.0726736187934875e-06, -1.4957040548324585e-06, 1.0812655091285706e-06, 3.6582350730895996e-06, 6.235204637050629e-06, 8.812174201011658e-06, 1.1389143764972687e-05, 1.3966113328933716e-05, 1.6543082892894745e-05, 1.9120052456855774e-05, 2.1697022020816803e-05, 2.4273991584777832e-05, 2.685096114873886e-05, 2.942793071269989e-05, 3.200490027666092e-05, 3.458186984062195e-05, 3.715883940458298e-05, 3.9735808968544006e-05, 4.2312778532505035e-05, 4.4889748096466064e-05, 4.7466717660427094e-05, 5.004368722438812e-05, 5.262065678834915e-05, 5.519762635231018e-05, 5.777459591627121e-05, 6.035156548023224e-05, 6.292853504419327e-05, 6.55055046081543e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 1.0, 5.0, 4.0, 4.0, 8.0, 22.0, 34.0, 38.0, 68.0, 127.0, 231.0, 453.0, 1123.0, 3426.0, 17839.0, 522381.0, 480206.0, 17194.0, 3293.0, 1096.0, 471.0, 228.0, 113.0, 77.0, 33.0, 25.0, 15.0, 15.0, 10.0, 8.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.01171875, -0.9712371826171875, -0.930755615234375, -0.8902740478515625, -0.84979248046875, -0.8093109130859375, -0.768829345703125, -0.7283477783203125, -0.6878662109375, -0.6473846435546875, -0.606903076171875, -0.5664215087890625, -0.52593994140625, -0.4854583740234375, -0.444976806640625, -0.4044952392578125, -0.364013671875, -0.3235321044921875, -0.283050537109375, -0.2425689697265625, -0.20208740234375, -0.1616058349609375, -0.121124267578125, -0.0806427001953125, -0.0401611328125, 0.0003204345703125, 0.040802001953125, 0.0812835693359375, 0.12176513671875, 0.1622467041015625, 0.202728271484375, 0.2432098388671875, 0.28369140625, 0.3241729736328125, 0.364654541015625, 0.4051361083984375, 0.44561767578125, 0.4860992431640625, 0.526580810546875, 0.5670623779296875, 0.6075439453125, 0.6480255126953125, 0.688507080078125, 0.7289886474609375, 0.76947021484375, 0.8099517822265625, 0.850433349609375, 0.8909149169921875, 0.931396484375, 0.9718780517578125, 1.012359619140625, 1.0528411865234375, 1.09332275390625, 1.1338043212890625, 1.174285888671875, 1.2147674560546875, 1.2552490234375, 1.2957305908203125, 1.336212158203125, 1.3766937255859375, 1.41717529296875, 1.4576568603515625, 1.498138427734375, 1.5386199951171875, 1.5791015625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 2.0, 2.0, 6.0, 10.0, 8.0, 18.0, 21.0, 25.0, 70.0, 68.0, 108.0, 112.0, 135.0, 111.0, 97.0, 65.0, 51.0, 24.0, 23.0, 10.0, 12.0, 4.0, 6.0, 4.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2939453125, -1.2633132934570312, -1.2326812744140625, -1.2020492553710938, -1.171417236328125, -1.1407852172851562, -1.1101531982421875, -1.0795211791992188, -1.04888916015625, -1.0182571411132812, -0.9876251220703125, -0.9569931030273438, -0.926361083984375, -0.8957290649414062, -0.8650970458984375, -0.8344650268554688, -0.8038330078125, -0.7732009887695312, -0.7425689697265625, -0.7119369506835938, -0.681304931640625, -0.6506729125976562, -0.6200408935546875, -0.5894088745117188, -0.55877685546875, -0.5281448364257812, -0.4975128173828125, -0.46688079833984375, -0.436248779296875, -0.40561676025390625, -0.3749847412109375, -0.34435272216796875, -0.313720703125, -0.28308868408203125, -0.2524566650390625, -0.22182464599609375, -0.191192626953125, -0.16056060791015625, -0.1299285888671875, -0.09929656982421875, -0.06866455078125, -0.03803253173828125, -0.0074005126953125, 0.02323150634765625, 0.053863525390625, 0.08449554443359375, 0.1151275634765625, 0.14575958251953125, 0.1763916015625, 0.20702362060546875, 0.2376556396484375, 0.26828765869140625, 0.298919677734375, 0.32955169677734375, 0.3601837158203125, 0.39081573486328125, 0.42144775390625, 0.45207977294921875, 0.4827117919921875, 0.5133438110351562, 0.543975830078125, 0.5746078491210938, 0.6052398681640625, 0.6358718872070312, 0.66650390625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 12.0, 44.0, 147.0, 258.0, 293.0, 155.0, 53.0, 19.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.590126037597656, -21.812021255493164, -21.03391456604004, -20.255809783935547, -19.477703094482422, -18.69959831237793, -17.921493530273438, -17.143386840820312, -16.365280151367188, -15.587174415588379, -14.80906867980957, -14.030963897705078, -13.252857208251953, -12.474752426147461, -11.696646690368652, -10.918540954589844, -10.140436172485352, -9.362330436706543, -8.584224700927734, -7.806119441986084, -7.028013706207275, -6.249907970428467, -5.471802711486816, -4.693696975708008, -3.915591239929199, -3.1374855041503906, -2.359380006790161, -1.5812745094299316, -0.803168773651123, -0.025063037872314453, 0.7530422210693359, 1.5311479568481445, 2.309253692626953, 3.0873594284057617, 3.865464925765991, 4.643570423126221, 5.421676158905029, 6.199781894683838, 6.977887153625488, 7.755992889404297, 8.534098625183105, 9.312204360961914, 10.090310096740723, 10.868415832519531, 11.646520614624023, 12.424627304077148, 13.20273208618164, 13.98083782196045, 14.758943557739258, 15.537049293518066, 16.315155029296875, 17.093259811401367, 17.871366500854492, 18.649471282958984, 19.42757797241211, 20.2056827545166, 20.983787536621094, 21.761892318725586, 22.53999900817871, 23.318103790283203, 24.096210479736328, 24.87431526184082, 25.652420043945312, 26.430526733398438, 27.208633422851562]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 10.0, 12.0, 14.0, 9.0, 21.0, 25.0, 19.0, 39.0, 24.0, 36.0, 37.0, 34.0, 62.0, 63.0, 59.0, 68.0, 62.0, 50.0, 48.0, 40.0, 48.0, 36.0, 38.0, 27.0, 26.0, 21.0, 11.0, 15.0, 10.0, 7.0, 11.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.657814025878906, -10.325438499450684, -9.993062973022461, -9.660687446594238, -9.328311920166016, -8.995935440063477, -8.66356086730957, -8.331184387207031, -7.998808860778809, -7.666433334350586, -7.334057807922363, -7.001682281494141, -6.66930627822876, -6.336930751800537, -6.0045552253723145, -5.672179222106934, -5.339804172515869, -5.0074286460876465, -4.675053119659424, -4.342677116394043, -4.01030158996582, -3.6779260635375977, -3.345550537109375, -3.0131747722625732, -2.6807992458343506, -2.348423719406128, -2.016047954559326, -1.6836724281311035, -1.3512967824935913, -1.018921136856079, -0.6865456104278564, -0.3541698455810547, -0.02179431915283203, 0.3105812966823578, 0.6429569125175476, 0.975332498550415, 1.3077081441879272, 1.6400837898254395, 1.972459316253662, 2.304835081100464, 2.6372106075286865, 2.969586133956909, 3.301961898803711, 3.6343374252319336, 3.9667129516601562, 4.299088478088379, 4.631464004516602, 4.963840007781982, 5.296215534210205, 5.628591060638428, 5.96096658706665, 6.293342590332031, 6.625718116760254, 6.958093643188477, 7.290469169616699, 7.622844696044922, 7.9552202224731445, 8.287595748901367, 8.61997127532959, 8.952346801757812, 9.284722328186035, 9.617097854614258, 9.949474334716797, 10.28184986114502, 10.614225387573242]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 11.0, 12.0, 10.0, 22.0, 36.0, 44.0, 47.0, 88.0, 163.0, 212.0, 372.0, 584.0, 1020.0, 1821.0, 3668.0, 8172.0, 24554.0, 193056.0, 3886822.0, 49714.0, 12963.0, 5163.0, 2449.0, 1289.0, 725.0, 435.0, 266.0, 184.0, 101.0, 75.0, 62.0, 40.0, 28.0, 19.0, 15.0, 10.0, 9.0, 7.0, 3.0, 2.0, 7.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4375, -1.3883209228515625, -1.339141845703125, -1.2899627685546875, -1.24078369140625, -1.1916046142578125, -1.142425537109375, -1.0932464599609375, -1.0440673828125, -0.9948883056640625, -0.945709228515625, -0.8965301513671875, -0.84735107421875, -0.7981719970703125, -0.748992919921875, -0.6998138427734375, -0.650634765625, -0.6014556884765625, -0.552276611328125, -0.5030975341796875, -0.45391845703125, -0.4047393798828125, -0.355560302734375, -0.3063812255859375, -0.2572021484375, -0.2080230712890625, -0.158843994140625, -0.1096649169921875, -0.06048583984375, -0.0113067626953125, 0.037872314453125, 0.0870513916015625, 0.13623046875, 0.1854095458984375, 0.234588623046875, 0.2837677001953125, 0.33294677734375, 0.3821258544921875, 0.431304931640625, 0.4804840087890625, 0.5296630859375, 0.5788421630859375, 0.628021240234375, 0.6772003173828125, 0.72637939453125, 0.7755584716796875, 0.824737548828125, 0.8739166259765625, 0.923095703125, 0.9722747802734375, 1.021453857421875, 1.0706329345703125, 1.11981201171875, 1.1689910888671875, 1.218170166015625, 1.2673492431640625, 1.3165283203125, 1.3657073974609375, 1.414886474609375, 1.4640655517578125, 1.51324462890625, 1.5624237060546875, 1.611602783203125, 1.6607818603515625, 1.7099609375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 6.0, 5.0, 7.0, 7.0, 8.0, 14.0, 13.0, 11.0, 19.0, 29.0, 36.0, 43.0, 40.0, 40.0, 55.0, 47.0, 40.0, 64.0, 58.0, 66.0, 59.0, 48.0, 50.0, 44.0, 45.0, 25.0, 28.0, 20.0, 18.0, 16.0, 15.0, 3.0, 4.0, 8.0, 3.0, 6.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.5263671875, -0.5108528137207031, -0.49533843994140625, -0.4798240661621094, -0.4643096923828125, -0.4487953186035156, -0.43328094482421875, -0.4177665710449219, -0.402252197265625, -0.3867378234863281, -0.37122344970703125, -0.3557090759277344, -0.3401947021484375, -0.3246803283691406, -0.30916595458984375, -0.2936515808105469, -0.27813720703125, -0.2626228332519531, -0.24710845947265625, -0.23159408569335938, -0.2160797119140625, -0.20056533813476562, -0.18505096435546875, -0.16953659057617188, -0.154022216796875, -0.13850784301757812, -0.12299346923828125, -0.10747909545898438, -0.0919647216796875, -0.07645034790039062, -0.06093597412109375, -0.045421600341796875, -0.0299072265625, -0.014392852783203125, 0.00112152099609375, 0.016635894775390625, 0.0321502685546875, 0.047664642333984375, 0.06317901611328125, 0.07869338989257812, 0.094207763671875, 0.10972213745117188, 0.12523651123046875, 0.14075088500976562, 0.1562652587890625, 0.17177963256835938, 0.18729400634765625, 0.20280838012695312, 0.21832275390625, 0.23383712768554688, 0.24935150146484375, 0.2648658752441406, 0.2803802490234375, 0.2958946228027344, 0.31140899658203125, 0.3269233703613281, 0.342437744140625, 0.3579521179199219, 0.37346649169921875, 0.3889808654785156, 0.4044952392578125, 0.4200096130371094, 0.43552398681640625, 0.4510383605957031, 0.466552734375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 6.0, 7.0, 12.0, 8.0, 13.0, 20.0, 36.0, 29.0, 54.0, 106.0, 129.0, 218.0, 411.0, 659.0, 1331.0, 3155.0, 11069.0, 81828.0, 4032003.0, 49308.0, 8551.0, 2638.0, 1124.0, 609.0, 346.0, 203.0, 121.0, 83.0, 63.0, 37.0, 31.0, 16.0, 15.0, 11.0, 8.0, 4.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.037109375, -1.9599609375, -1.8828125, -1.8056640625, -1.728515625, -1.6513671875, -1.57421875, -1.4970703125, -1.419921875, -1.3427734375, -1.265625, -1.1884765625, -1.111328125, -1.0341796875, -0.95703125, -0.8798828125, -0.802734375, -0.7255859375, -0.6484375, -0.5712890625, -0.494140625, -0.4169921875, -0.33984375, -0.2626953125, -0.185546875, -0.1083984375, -0.03125, 0.0458984375, 0.123046875, 0.2001953125, 0.27734375, 0.3544921875, 0.431640625, 0.5087890625, 0.5859375, 0.6630859375, 0.740234375, 0.8173828125, 0.89453125, 0.9716796875, 1.048828125, 1.1259765625, 1.203125, 1.2802734375, 1.357421875, 1.4345703125, 1.51171875, 1.5888671875, 1.666015625, 1.7431640625, 1.8203125, 1.8974609375, 1.974609375, 2.0517578125, 2.12890625, 2.2060546875, 2.283203125, 2.3603515625, 2.4375, 2.5146484375, 2.591796875, 2.6689453125, 2.74609375, 2.8232421875, 2.900390625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 1.0, 3.0, 6.0, 6.0, 8.0, 14.0, 34.0, 69.0, 206.0, 3318.0, 249.0, 73.0, 34.0, 26.0, 14.0, 6.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57666015625, -0.5437850952148438, -0.5109100341796875, -0.47803497314453125, -0.445159912109375, -0.41228485107421875, -0.3794097900390625, -0.34653472900390625, -0.31365966796875, -0.28078460693359375, -0.2479095458984375, -0.21503448486328125, -0.182159423828125, -0.14928436279296875, -0.1164093017578125, -0.08353424072265625, -0.0506591796875, -0.01778411865234375, 0.0150909423828125, 0.04796600341796875, 0.080841064453125, 0.11371612548828125, 0.1465911865234375, 0.17946624755859375, 0.21234130859375, 0.24521636962890625, 0.2780914306640625, 0.31096649169921875, 0.343841552734375, 0.37671661376953125, 0.4095916748046875, 0.44246673583984375, 0.475341796875, 0.5082168579101562, 0.5410919189453125, 0.5739669799804688, 0.606842041015625, 0.6397171020507812, 0.6725921630859375, 0.7054672241210938, 0.73834228515625, 0.7712173461914062, 0.8040924072265625, 0.8369674682617188, 0.869842529296875, 0.9027175903320312, 0.9355926513671875, 0.9684677124023438, 1.0013427734375, 1.0342178344726562, 1.0670928955078125, 1.0999679565429688, 1.132843017578125, 1.1657180786132812, 1.1985931396484375, 1.2314682006835938, 1.26434326171875, 1.2972183227539062, 1.3300933837890625, 1.3629684448242188, 1.395843505859375, 1.4287185668945312, 1.4615936279296875, 1.4944686889648438, 1.52734375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 7.0, 6.0, 9.0, 9.0, 12.0, 18.0, 28.0, 32.0, 51.0, 72.0, 96.0, 103.0, 110.0, 85.0, 90.0, 79.0, 44.0, 42.0, 29.0, 20.0, 15.0, 10.0, 7.0, 5.0, 4.0, 4.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2522943019866943, -3.170741558074951, -3.089188575744629, -3.0076355934143066, -2.9260828495025635, -2.8445301055908203, -2.762977123260498, -2.681424140930176, -2.5998713970184326, -2.5183186531066895, -2.436765670776367, -2.355212688446045, -2.2736599445343018, -2.1921072006225586, -2.1105542182922363, -2.029001235961914, -1.947448492050171, -1.8658956289291382, -1.7843427658081055, -1.7027899026870728, -1.62123703956604, -1.5396841764450073, -1.4581313133239746, -1.376578450202942, -1.2950255870819092, -1.2134727239608765, -1.1319198608398438, -1.050366997718811, -0.9688141345977783, -0.8872612714767456, -0.8057084083557129, -0.7241555452346802, -0.6426024436950684, -0.5610495805740356, -0.47949671745300293, -0.3979438543319702, -0.3163909912109375, -0.23483812808990479, -0.15328526496887207, -0.07173240184783936, 0.00982046127319336, 0.09137332439422607, 0.1729261875152588, 0.2544790506362915, 0.3360319137573242, 0.41758477687835693, 0.49913763999938965, 0.5806905031204224, 0.6622433662414551, 0.7437962293624878, 0.8253490924835205, 0.9069019556045532, 0.9884548187255859, 1.0700076818466187, 1.1515605449676514, 1.233113408088684, 1.3146662712097168, 1.3962191343307495, 1.4777719974517822, 1.559324860572815, 1.6408777236938477, 1.7224305868148804, 1.803983449935913, 1.8855363130569458, 1.9670891761779785]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 8.0, 5.0, 15.0, 12.0, 17.0, 14.0, 13.0, 12.0, 33.0, 27.0, 33.0, 45.0, 40.0, 33.0, 47.0, 44.0, 51.0, 38.0, 36.0, 40.0, 44.0, 46.0, 39.0, 42.0, 40.0, 43.0, 34.0, 29.0, 19.0, 13.0, 20.0, 12.0, 11.0, 10.0, 9.0, 13.0, 8.0, 2.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8936500549316406, -1.8366466760635376, -1.7796432971954346, -1.7226399183273315, -1.6656365394592285, -1.608633279800415, -1.5516297817230225, -1.494626522064209, -1.437623143196106, -1.380619764328003, -1.3236163854599, -1.2666130065917969, -1.2096096277236938, -1.1526062488555908, -1.0956029891967773, -1.0385996103286743, -0.9815961718559265, -0.9245927929878235, -0.8675894141197205, -0.8105860948562622, -0.7535827159881592, -0.6965793371200562, -0.6395759582519531, -0.5825725793838501, -0.5255692005157471, -0.46856582164764404, -0.4115624725818634, -0.3545590937137604, -0.29755574464797974, -0.2405523657798767, -0.18354898691177368, -0.12654563784599304, -0.0695422887802124, -0.01253892108798027, 0.04446444660425186, 0.10146781802177429, 0.15847118198871613, 0.21547454595565796, 0.272477924823761, 0.3294812738895416, 0.38648465275764465, 0.4434880316257477, 0.5004913806915283, 0.5574947595596313, 0.6144981384277344, 0.6715015172958374, 0.7285048961639404, 0.7855082154273987, 0.8425115942955017, 0.8995149731636047, 0.9565183520317078, 1.013521671295166, 1.070525050163269, 1.127528429031372, 1.184531807899475, 1.2415351867675781, 1.2985385656356812, 1.3555419445037842, 1.4125453233718872, 1.4695487022399902, 1.5265520811080933, 1.5835554599761963, 1.6405587196350098, 1.6975620985031128, 1.7545654773712158]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 7.0, 5.0, 6.0, 10.0, 14.0, 24.0, 37.0, 51.0, 72.0, 144.0, 220.0, 351.0, 651.0, 1260.0, 2442.0, 5155.0, 11712.0, 27132.0, 66396.0, 162842.0, 371965.0, 234764.0, 94580.0, 38649.0, 16010.0, 7032.0, 3349.0, 1626.0, 853.0, 479.0, 281.0, 166.0, 88.0, 61.0, 51.0, 31.0, 19.0, 9.0, 6.0, 3.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.099609375, -1.06597900390625, -1.0323486328125, -0.99871826171875, -0.965087890625, -0.93145751953125, -0.8978271484375, -0.86419677734375, -0.83056640625, -0.79693603515625, -0.7633056640625, -0.72967529296875, -0.696044921875, -0.66241455078125, -0.6287841796875, -0.59515380859375, -0.5615234375, -0.52789306640625, -0.4942626953125, -0.46063232421875, -0.427001953125, -0.39337158203125, -0.3597412109375, -0.32611083984375, -0.29248046875, -0.25885009765625, -0.2252197265625, -0.19158935546875, -0.157958984375, -0.12432861328125, -0.0906982421875, -0.05706787109375, -0.0234375, 0.01019287109375, 0.0438232421875, 0.07745361328125, 0.111083984375, 0.14471435546875, 0.1783447265625, 0.21197509765625, 0.24560546875, 0.27923583984375, 0.3128662109375, 0.34649658203125, 0.380126953125, 0.41375732421875, 0.4473876953125, 0.48101806640625, 0.5146484375, 0.54827880859375, 0.5819091796875, 0.61553955078125, 0.649169921875, 0.68280029296875, 0.7164306640625, 0.75006103515625, 0.78369140625, 0.81732177734375, 0.8509521484375, 0.88458251953125, 0.918212890625, 0.95184326171875, 0.9854736328125, 1.01910400390625, 1.052734375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 1.0, 2.0, 5.0, 7.0, 6.0, 12.0, 11.0, 9.0, 16.0, 28.0, 26.0, 25.0, 38.0, 40.0, 53.0, 43.0, 48.0, 47.0, 50.0, 58.0, 49.0, 58.0, 49.0, 50.0, 46.0, 38.0, 37.0, 30.0, 24.0, 19.0, 22.0, 19.0, 13.0, 5.0, 6.0, 2.0, 5.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.54541015625, -0.529052734375, -0.5126953125, -0.496337890625, -0.47998046875, -0.463623046875, -0.447265625, -0.430908203125, -0.41455078125, -0.398193359375, -0.3818359375, -0.365478515625, -0.34912109375, -0.332763671875, -0.31640625, -0.300048828125, -0.28369140625, -0.267333984375, -0.2509765625, -0.234619140625, -0.21826171875, -0.201904296875, -0.185546875, -0.169189453125, -0.15283203125, -0.136474609375, -0.1201171875, -0.103759765625, -0.08740234375, -0.071044921875, -0.0546875, -0.038330078125, -0.02197265625, -0.005615234375, 0.0107421875, 0.027099609375, 0.04345703125, 0.059814453125, 0.076171875, 0.092529296875, 0.10888671875, 0.125244140625, 0.1416015625, 0.157958984375, 0.17431640625, 0.190673828125, 0.20703125, 0.223388671875, 0.23974609375, 0.256103515625, 0.2724609375, 0.288818359375, 0.30517578125, 0.321533203125, 0.337890625, 0.354248046875, 0.37060546875, 0.386962890625, 0.4033203125, 0.419677734375, 0.43603515625, 0.452392578125, 0.46875, 0.485107421875, 0.50146484375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 5.0, 7.0, 9.0, 12.0, 14.0, 13.0, 31.0, 42.0, 70.0, 80.0, 129.0, 211.0, 314.0, 560.0, 955.0, 2123.0, 6782.0, 50580.0, 705757.0, 254317.0, 19318.0, 3871.0, 1454.0, 733.0, 398.0, 255.0, 165.0, 109.0, 66.0, 47.0, 27.0, 39.0, 16.0, 11.0, 8.0, 7.0, 4.0, 1.0, 9.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.68359375, -2.608612060546875, -2.53363037109375, -2.458648681640625, -2.3836669921875, -2.308685302734375, -2.23370361328125, -2.158721923828125, -2.083740234375, -2.008758544921875, -1.93377685546875, -1.858795166015625, -1.7838134765625, -1.708831787109375, -1.63385009765625, -1.558868408203125, -1.48388671875, -1.408905029296875, -1.33392333984375, -1.258941650390625, -1.1839599609375, -1.108978271484375, -1.03399658203125, -0.959014892578125, -0.884033203125, -0.809051513671875, -0.73406982421875, -0.659088134765625, -0.5841064453125, -0.509124755859375, -0.43414306640625, -0.359161376953125, -0.2841796875, -0.209197998046875, -0.13421630859375, -0.059234619140625, 0.0157470703125, 0.090728759765625, 0.16571044921875, 0.240692138671875, 0.315673828125, 0.390655517578125, 0.46563720703125, 0.540618896484375, 0.6156005859375, 0.690582275390625, 0.76556396484375, 0.840545654296875, 0.91552734375, 0.990509033203125, 1.06549072265625, 1.140472412109375, 1.2154541015625, 1.290435791015625, 1.36541748046875, 1.440399169921875, 1.515380859375, 1.590362548828125, 1.66534423828125, 1.740325927734375, 1.8153076171875, 1.890289306640625, 1.96527099609375, 2.040252685546875, 2.115234375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 1.0, 7.0, 11.0, 12.0, 17.0, 19.0, 15.0, 29.0, 38.0, 43.0, 36.0, 46.0, 51.0, 62.0, 67.0, 62.0, 58.0, 59.0, 56.0, 50.0, 50.0, 38.0, 37.0, 24.0, 27.0, 28.0, 11.0, 15.0, 9.0, 8.0, 6.0, 3.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.12109375, -3.0429840087890625, -2.964874267578125, -2.8867645263671875, -2.80865478515625, -2.7305450439453125, -2.652435302734375, -2.5743255615234375, -2.4962158203125, -2.4181060791015625, -2.339996337890625, -2.2618865966796875, -2.18377685546875, -2.1056671142578125, -2.027557373046875, -1.9494476318359375, -1.871337890625, -1.7932281494140625, -1.715118408203125, -1.6370086669921875, -1.55889892578125, -1.4807891845703125, -1.402679443359375, -1.3245697021484375, -1.2464599609375, -1.1683502197265625, -1.090240478515625, -1.0121307373046875, -0.93402099609375, -0.8559112548828125, -0.777801513671875, -0.6996917724609375, -0.62158203125, -0.5434722900390625, -0.465362548828125, -0.3872528076171875, -0.30914306640625, -0.2310333251953125, -0.152923583984375, -0.0748138427734375, 0.0032958984375, 0.0814056396484375, 0.159515380859375, 0.2376251220703125, 0.31573486328125, 0.3938446044921875, 0.471954345703125, 0.5500640869140625, 0.628173828125, 0.7062835693359375, 0.784393310546875, 0.8625030517578125, 0.94061279296875, 1.0187225341796875, 1.096832275390625, 1.1749420166015625, 1.2530517578125, 1.3311614990234375, 1.409271240234375, 1.4873809814453125, 1.56549072265625, 1.6436004638671875, 1.721710205078125, 1.7998199462890625, 1.8779296875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 6.0, 9.0, 17.0, 30.0, 52.0, 96.0, 163.0, 357.0, 732.0, 2488.0, 13861.0, 206136.0, 767006.0, 49687.0, 5570.0, 1375.0, 510.0, 202.0, 97.0, 57.0, 32.0, 16.0, 13.0, 9.0, 14.0, 4.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.07421875, -1.046142578125, -1.01806640625, -0.989990234375, -0.9619140625, -0.933837890625, -0.90576171875, -0.877685546875, -0.849609375, -0.821533203125, -0.79345703125, -0.765380859375, -0.7373046875, -0.709228515625, -0.68115234375, -0.653076171875, -0.625, -0.596923828125, -0.56884765625, -0.540771484375, -0.5126953125, -0.484619140625, -0.45654296875, -0.428466796875, -0.400390625, -0.372314453125, -0.34423828125, -0.316162109375, -0.2880859375, -0.260009765625, -0.23193359375, -0.203857421875, -0.17578125, -0.147705078125, -0.11962890625, -0.091552734375, -0.0634765625, -0.035400390625, -0.00732421875, 0.020751953125, 0.048828125, 0.076904296875, 0.10498046875, 0.133056640625, 0.1611328125, 0.189208984375, 0.21728515625, 0.245361328125, 0.2734375, 0.301513671875, 0.32958984375, 0.357666015625, 0.3857421875, 0.413818359375, 0.44189453125, 0.469970703125, 0.498046875, 0.526123046875, 0.55419921875, 0.582275390625, 0.6103515625, 0.638427734375, 0.66650390625, 0.694580078125, 0.72265625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 10.0, 11.0, 15.0, 15.0, 18.0, 34.0, 40.0, 41.0, 65.0, 78.0, 146.0, 135.0, 87.0, 65.0, 48.0, 44.0, 36.0, 36.0, 12.0, 13.0, 8.0, 8.0, 4.0, 9.0, 3.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.250640869140625e-05, -8.81291925907135e-05, -8.375197649002075e-05, -7.9374760389328e-05, -7.499754428863525e-05, -7.06203281879425e-05, -6.624311208724976e-05, -6.186589598655701e-05, -5.748867988586426e-05, -5.311146378517151e-05, -4.873424768447876e-05, -4.435703158378601e-05, -3.997981548309326e-05, -3.560259938240051e-05, -3.1225383281707764e-05, -2.6848167181015015e-05, -2.2470951080322266e-05, -1.8093734979629517e-05, -1.3716518878936768e-05, -9.339302778244019e-06, -4.9620866775512695e-06, -5.848705768585205e-07, 3.7923455238342285e-06, 8.169561624526978e-06, 1.2546777725219727e-05, 1.6923993825912476e-05, 2.1301209926605225e-05, 2.5678426027297974e-05, 3.0055642127990723e-05, 3.443285822868347e-05, 3.881007432937622e-05, 4.318729043006897e-05, 4.756450653076172e-05, 5.194172263145447e-05, 5.631893873214722e-05, 6.0696154832839966e-05, 6.507337093353271e-05, 6.945058703422546e-05, 7.382780313491821e-05, 7.820501923561096e-05, 8.258223533630371e-05, 8.695945143699646e-05, 9.133666753768921e-05, 9.571388363838196e-05, 0.00010009109973907471, 0.00010446831583976746, 0.0001088455319404602, 0.00011322274804115295, 0.0001175999641418457, 0.00012197718024253845, 0.0001263543963432312, 0.00013073161244392395, 0.0001351088285446167, 0.00013948604464530945, 0.0001438632607460022, 0.00014824047684669495, 0.0001526176929473877, 0.00015699490904808044, 0.0001613721251487732, 0.00016574934124946594, 0.0001701265573501587, 0.00017450377345085144, 0.0001788809895515442, 0.00018325820565223694, 0.0001876354217529297]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 2.0, 7.0, 7.0, 23.0, 34.0, 79.0, 122.0, 285.0, 663.0, 2136.0, 12529.0, 436711.0, 577634.0, 14835.0, 2206.0, 717.0, 263.0, 120.0, 86.0, 43.0, 20.0, 10.0, 9.0, 7.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85595703125, -0.8187942504882812, -0.7816314697265625, -0.7444686889648438, -0.707305908203125, -0.6701431274414062, -0.6329803466796875, -0.5958175659179688, -0.55865478515625, -0.5214920043945312, -0.4843292236328125, -0.44716644287109375, -0.410003662109375, -0.37284088134765625, -0.3356781005859375, -0.29851531982421875, -0.2613525390625, -0.22418975830078125, -0.1870269775390625, -0.14986419677734375, -0.112701416015625, -0.07553863525390625, -0.0383758544921875, -0.00121307373046875, 0.03594970703125, 0.07311248779296875, 0.1102752685546875, 0.14743804931640625, 0.184600830078125, 0.22176361083984375, 0.2589263916015625, 0.29608917236328125, 0.333251953125, 0.37041473388671875, 0.4075775146484375, 0.44474029541015625, 0.481903076171875, 0.5190658569335938, 0.5562286376953125, 0.5933914184570312, 0.63055419921875, 0.6677169799804688, 0.7048797607421875, 0.7420425415039062, 0.779205322265625, 0.8163681030273438, 0.8535308837890625, 0.8906936645507812, 0.9278564453125, 0.9650192260742188, 1.0021820068359375, 1.0393447875976562, 1.076507568359375, 1.1136703491210938, 1.1508331298828125, 1.1879959106445312, 1.22515869140625, 1.2623214721679688, 1.2994842529296875, 1.3366470336914062, 1.373809814453125, 1.4109725952148438, 1.4481353759765625, 1.4852981567382812, 1.5224609375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 8.0, 11.0, 6.0, 17.0, 21.0, 17.0, 37.0, 41.0, 49.0, 67.0, 82.0, 70.0, 82.0, 72.0, 87.0, 79.0, 53.0, 40.0, 30.0, 18.0, 17.0, 15.0, 15.0, 10.0, 4.0, 13.0, 5.0, 4.0, 4.0, 4.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.55224609375, -0.5363540649414062, -0.5204620361328125, -0.5045700073242188, -0.488677978515625, -0.47278594970703125, -0.4568939208984375, -0.44100189208984375, -0.42510986328125, -0.40921783447265625, -0.3933258056640625, -0.37743377685546875, -0.361541748046875, -0.34564971923828125, -0.3297576904296875, -0.31386566162109375, -0.2979736328125, -0.28208160400390625, -0.2661895751953125, -0.25029754638671875, -0.234405517578125, -0.21851348876953125, -0.2026214599609375, -0.18672943115234375, -0.17083740234375, -0.15494537353515625, -0.1390533447265625, -0.12316131591796875, -0.107269287109375, -0.09137725830078125, -0.0754852294921875, -0.05959320068359375, -0.043701171875, -0.02780914306640625, -0.0119171142578125, 0.00397491455078125, 0.019866943359375, 0.03575897216796875, 0.0516510009765625, 0.06754302978515625, 0.08343505859375, 0.09932708740234375, 0.1152191162109375, 0.13111114501953125, 0.147003173828125, 0.16289520263671875, 0.1787872314453125, 0.19467926025390625, 0.2105712890625, 0.22646331787109375, 0.2423553466796875, 0.25824737548828125, 0.274139404296875, 0.29003143310546875, 0.3059234619140625, 0.32181549072265625, 0.33770751953125, 0.35359954833984375, 0.3694915771484375, 0.38538360595703125, 0.401275634765625, 0.41716766357421875, 0.4330596923828125, 0.44895172119140625, 0.46484375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 9.0, 15.0, 38.0, 76.0, 107.0, 152.0, 199.0, 174.0, 116.0, 75.0, 18.0, 12.0, 9.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.351943969726562, -17.83788299560547, -17.323820114135742, -16.80975914001465, -16.295698165893555, -15.781636238098145, -15.267574310302734, -14.75351333618164, -14.239452362060547, -13.725390434265137, -13.211329460144043, -12.697267532348633, -12.183206558227539, -11.669144630432129, -11.155082702636719, -10.641021728515625, -10.126959800720215, -9.612897872924805, -9.098836898803711, -8.5847749710083, -8.070713996887207, -7.556652069091797, -7.042590618133545, -6.528529167175293, -6.014467716217041, -5.500406265258789, -4.986344814300537, -4.472283363342285, -3.958221673965454, -3.444160223007202, -2.930098533630371, -2.416037082672119, -1.9019765853881836, -1.3879151344299316, -0.8738535642623901, -0.35979199409484863, 0.15426945686340332, 0.6683309078216553, 1.1823925971984863, 1.6964540481567383, 2.2105154991149902, 2.724576950073242, 3.238638401031494, 3.752700090408325, 4.266761779785156, 4.78082275390625, 5.29488468170166, 5.808946132659912, 6.323007583618164, 6.837069034576416, 7.351130485534668, 7.865192413330078, 8.379253387451172, 8.893315315246582, 9.407377243041992, 9.921438217163086, 10.43549919128418, 10.94956111907959, 11.463622093200684, 11.977684020996094, 12.491744995117188, 13.005806922912598, 13.519868850708008, 14.033929824829102, 14.547991752624512]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 3.0, 13.0, 8.0, 10.0, 11.0, 8.0, 19.0, 25.0, 20.0, 23.0, 27.0, 36.0, 28.0, 49.0, 41.0, 54.0, 49.0, 42.0, 54.0, 47.0, 48.0, 42.0, 54.0, 36.0, 37.0, 38.0, 19.0, 23.0, 25.0, 13.0, 23.0, 11.0, 12.0, 11.0, 12.0, 3.0, 4.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.484269142150879, -8.211313247680664, -7.938357353210449, -7.665400981903076, -7.392445087432861, -7.1194891929626465, -6.846532821655273, -6.573576927185059, -6.300621032714844, -6.027665138244629, -5.754709243774414, -5.481752872467041, -5.208796977996826, -4.935841083526611, -4.662884712219238, -4.389928817749023, -4.116972923278809, -3.8440170288085938, -3.5710608959198, -3.298104763031006, -3.025148868560791, -2.752192974090576, -2.4792368412017822, -2.2062807083129883, -1.9333248138427734, -1.660368800163269, -1.3874127864837646, -1.1144567728042603, -0.8415007591247559, -0.5685447454452515, -0.29558873176574707, -0.022632718086242676, 0.2503232955932617, 0.5232793092727661, 0.7962353229522705, 1.069191336631775, 1.3421473503112793, 1.6151033639907837, 1.888059377670288, 2.161015510559082, 2.433971405029297, 2.7069272994995117, 2.9798834323883057, 3.2528395652770996, 3.5257954597473145, 3.7987513542175293, 4.071707725524902, 4.344663619995117, 4.617619514465332, 4.890575408935547, 5.163531303405762, 5.436487674713135, 5.70944356918335, 5.9823994636535645, 6.2553558349609375, 6.528311729431152, 6.801267623901367, 7.074223518371582, 7.347179412841797, 7.62013578414917, 7.893091678619385, 8.166048049926758, 8.439003944396973, 8.711959838867188, 8.984915733337402]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 15.0, 19.0, 19.0, 52.0, 52.0, 96.0, 138.0, 231.0, 324.0, 573.0, 941.0, 1558.0, 2780.0, 5039.0, 9411.0, 18822.0, 43338.0, 126579.0, 829711.0, 2733288.0, 289487.0, 73497.0, 28773.0, 13513.0, 6953.0, 3716.0, 2111.0, 1212.0, 752.0, 454.0, 279.0, 180.0, 112.0, 101.0, 44.0, 35.0, 28.0, 19.0, 10.0, 12.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6943359375, -0.6713943481445312, -0.6484527587890625, -0.6255111694335938, -0.602569580078125, -0.5796279907226562, -0.5566864013671875, -0.5337448120117188, -0.51080322265625, -0.48786163330078125, -0.4649200439453125, -0.44197845458984375, -0.419036865234375, -0.39609527587890625, -0.3731536865234375, -0.35021209716796875, -0.3272705078125, -0.30432891845703125, -0.2813873291015625, -0.25844573974609375, -0.235504150390625, -0.21256256103515625, -0.1896209716796875, -0.16667938232421875, -0.14373779296875, -0.12079620361328125, -0.0978546142578125, -0.07491302490234375, -0.051971435546875, -0.02902984619140625, -0.0060882568359375, 0.01685333251953125, 0.039794921875, 0.06273651123046875, 0.0856781005859375, 0.10861968994140625, 0.131561279296875, 0.15450286865234375, 0.1774444580078125, 0.20038604736328125, 0.22332763671875, 0.24626922607421875, 0.2692108154296875, 0.29215240478515625, 0.315093994140625, 0.33803558349609375, 0.3609771728515625, 0.38391876220703125, 0.4068603515625, 0.42980194091796875, 0.4527435302734375, 0.47568511962890625, 0.498626708984375, 0.5215682983398438, 0.5445098876953125, 0.5674514770507812, 0.59039306640625, 0.6133346557617188, 0.6362762451171875, 0.6592178344726562, 0.682159423828125, 0.7051010131835938, 0.7280426025390625, 0.7509841918945312, 0.77392578125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 7.0, 4.0, 0.0, 11.0, 8.0, 11.0, 15.0, 19.0, 22.0, 16.0, 21.0, 25.0, 23.0, 32.0, 32.0, 32.0, 41.0, 38.0, 45.0, 40.0, 43.0, 47.0, 43.0, 52.0, 39.0, 41.0, 38.0, 40.0, 44.0, 22.0, 27.0, 32.0, 18.0, 12.0, 15.0, 11.0, 7.0, 8.0, 4.0, 9.0, 4.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.437744140625, -0.42522430419921875, -0.4127044677734375, -0.40018463134765625, -0.387664794921875, -0.37514495849609375, -0.3626251220703125, -0.35010528564453125, -0.33758544921875, -0.32506561279296875, -0.3125457763671875, -0.30002593994140625, -0.287506103515625, -0.27498626708984375, -0.2624664306640625, -0.24994659423828125, -0.2374267578125, -0.22490692138671875, -0.2123870849609375, -0.19986724853515625, -0.187347412109375, -0.17482757568359375, -0.1623077392578125, -0.14978790283203125, -0.13726806640625, -0.12474822998046875, -0.1122283935546875, -0.09970855712890625, -0.087188720703125, -0.07466888427734375, -0.0621490478515625, -0.04962921142578125, -0.037109375, -0.02458953857421875, -0.0120697021484375, 0.00045013427734375, 0.012969970703125, 0.02548980712890625, 0.0380096435546875, 0.05052947998046875, 0.06304931640625, 0.07556915283203125, 0.0880889892578125, 0.10060882568359375, 0.113128662109375, 0.12564849853515625, 0.1381683349609375, 0.15068817138671875, 0.1632080078125, 0.17572784423828125, 0.1882476806640625, 0.20076751708984375, 0.213287353515625, 0.22580718994140625, 0.2383270263671875, 0.25084686279296875, 0.26336669921875, 0.27588653564453125, 0.2884063720703125, 0.30092620849609375, 0.313446044921875, 0.32596588134765625, 0.3384857177734375, 0.35100555419921875, 0.363525390625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 9.0, 13.0, 12.0, 24.0, 55.0, 63.0, 125.0, 273.0, 594.0, 1407.0, 4335.0, 17181.0, 122265.0, 3611047.0, 391326.0, 34503.0, 7401.0, 2188.0, 769.0, 284.0, 178.0, 92.0, 40.0, 27.0, 29.0, 15.0, 6.0, 7.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8837890625, -1.827880859375, -1.77197265625, -1.716064453125, -1.66015625, -1.604248046875, -1.54833984375, -1.492431640625, -1.4365234375, -1.380615234375, -1.32470703125, -1.268798828125, -1.212890625, -1.156982421875, -1.10107421875, -1.045166015625, -0.9892578125, -0.933349609375, -0.87744140625, -0.821533203125, -0.765625, -0.709716796875, -0.65380859375, -0.597900390625, -0.5419921875, -0.486083984375, -0.43017578125, -0.374267578125, -0.318359375, -0.262451171875, -0.20654296875, -0.150634765625, -0.0947265625, -0.038818359375, 0.01708984375, 0.072998046875, 0.12890625, 0.184814453125, 0.24072265625, 0.296630859375, 0.3525390625, 0.408447265625, 0.46435546875, 0.520263671875, 0.576171875, 0.632080078125, 0.68798828125, 0.743896484375, 0.7998046875, 0.855712890625, 0.91162109375, 0.967529296875, 1.0234375, 1.079345703125, 1.13525390625, 1.191162109375, 1.2470703125, 1.302978515625, 1.35888671875, 1.414794921875, 1.470703125, 1.526611328125, 1.58251953125, 1.638427734375, 1.6943359375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 2.0, 1.0, 7.0, 8.0, 6.0, 11.0, 19.0, 31.0, 50.0, 79.0, 140.0, 312.0, 1029.0, 1383.0, 480.0, 200.0, 108.0, 80.0, 42.0, 27.0, 25.0, 8.0, 10.0, 8.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.41015625, -2.3516082763671875, -2.293060302734375, -2.2345123291015625, -2.17596435546875, -2.1174163818359375, -2.058868408203125, -2.0003204345703125, -1.9417724609375, -1.8832244873046875, -1.824676513671875, -1.7661285400390625, -1.70758056640625, -1.6490325927734375, -1.590484619140625, -1.5319366455078125, -1.473388671875, -1.4148406982421875, -1.356292724609375, -1.2977447509765625, -1.23919677734375, -1.1806488037109375, -1.122100830078125, -1.0635528564453125, -1.0050048828125, -0.9464569091796875, -0.887908935546875, -0.8293609619140625, -0.77081298828125, -0.7122650146484375, -0.653717041015625, -0.5951690673828125, -0.53662109375, -0.4780731201171875, -0.419525146484375, -0.3609771728515625, -0.30242919921875, -0.2438812255859375, -0.185333251953125, -0.1267852783203125, -0.0682373046875, -0.0096893310546875, 0.048858642578125, 0.1074066162109375, 0.16595458984375, 0.2245025634765625, 0.283050537109375, 0.3415985107421875, 0.400146484375, 0.4586944580078125, 0.517242431640625, 0.5757904052734375, 0.63433837890625, 0.6928863525390625, 0.751434326171875, 0.8099822998046875, 0.8685302734375, 0.9270782470703125, 0.985626220703125, 1.0441741943359375, 1.10272216796875, 1.1612701416015625, 1.219818115234375, 1.2783660888671875, 1.3369140625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 16.0, 34.0, 95.0, 251.0, 312.0, 168.0, 68.0, 24.0, 19.0, 5.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.06901931762695, -31.37401580810547, -30.679012298583984, -29.9840087890625, -29.289005279541016, -28.59400177001953, -27.898998260498047, -27.203996658325195, -26.50899314880371, -25.813989639282227, -25.118986129760742, -24.423982620239258, -23.728979110717773, -23.033977508544922, -22.338973999023438, -21.643970489501953, -20.94896697998047, -20.253963470458984, -19.5589599609375, -18.863956451416016, -18.16895294189453, -17.473949432373047, -16.778945922851562, -16.08394432067871, -15.388938903808594, -14.69393539428711, -13.998931884765625, -13.30392837524414, -12.608925819396973, -11.913922309875488, -11.218918800354004, -10.523916244506836, -9.828911781311035, -9.13390827178955, -8.438904762268066, -7.74390172958374, -7.048898696899414, -6.35389518737793, -5.658891677856445, -4.963888645172119, -4.268885135650635, -3.5738818645477295, -2.878878593444824, -2.18387508392334, -1.4888718128204346, -0.7938685417175293, -0.09886503219604492, 0.5961380004882812, 1.2911415100097656, 1.986144781112671, 2.681148052215576, 3.3761515617370605, 4.071154594421387, 4.766158103942871, 5.4611616134643555, 6.156164646148682, 6.851168155670166, 7.54617166519165, 8.241174697875977, 8.936178207397461, 9.631181716918945, 10.32618522644043, 11.021188735961914, 11.716191291809082, 12.411194801330566]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 7.0, 6.0, 7.0, 7.0, 9.0, 14.0, 21.0, 19.0, 15.0, 40.0, 42.0, 31.0, 30.0, 37.0, 41.0, 44.0, 45.0, 46.0, 49.0, 36.0, 46.0, 39.0, 37.0, 31.0, 38.0, 33.0, 17.0, 27.0, 27.0, 24.0, 12.0, 21.0, 21.0, 17.0, 6.0, 10.0, 13.0, 6.0, 5.0, 9.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-5.811435699462891, -5.646458148956299, -5.481480121612549, -5.316502571105957, -5.151524543762207, -4.986546993255615, -4.821569442749023, -4.656591415405273, -4.491613864898682, -4.32663631439209, -4.16165828704834, -3.996680736541748, -3.831702947616577, -3.6667251586914062, -3.5017473697662354, -3.3367695808410645, -3.1717917919158936, -3.0068140029907227, -2.8418362140655518, -2.676858425140381, -2.511880874633789, -2.346903085708618, -2.1819252967834473, -2.0169477462768555, -1.851969838142395, -1.6869920492172241, -1.5220143795013428, -1.3570365905761719, -1.192058801651001, -1.0270811319351196, -0.8621033430099487, -0.6971256732940674, -0.5321478843688965, -0.36717015504837036, -0.20219239592552185, -0.03721463680267334, 0.12776309251785278, 0.2927408218383789, 0.4577186107635498, 0.6226962804794312, 0.787674069404602, 0.9526517987251282, 1.1176295280456543, 1.2826073169708252, 1.447585105895996, 1.6125627756118774, 1.7775405645370483, 1.9425182342529297, 2.1074960231781006, 2.2724738121032715, 2.4374516010284424, 2.6024293899536133, 2.767406940460205, 2.932384729385376, 3.097362518310547, 3.2623400688171387, 3.4273180961608887, 3.5922958850860596, 3.7572736740112305, 3.9222512245178223, 4.087229251861572, 4.252206802368164, 4.417184829711914, 4.582162380218506, 4.747139930725098]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 4.0, 4.0, 8.0, 14.0, 20.0, 23.0, 45.0, 51.0, 74.0, 96.0, 174.0, 186.0, 315.0, 526.0, 707.0, 1139.0, 1680.0, 2708.0, 4670.0, 8175.0, 15483.0, 29830.0, 61942.0, 150159.0, 363392.0, 232953.0, 87633.0, 40347.0, 20309.0, 10489.0, 6024.0, 3378.0, 2078.0, 1327.0, 835.0, 560.0, 373.0, 249.0, 182.0, 131.0, 73.0, 69.0, 38.0, 19.0, 15.0, 11.0, 14.0, 9.0, 6.0, 5.0, 2.0, 2.0, 5.0, 0.0, 2.0, 1.0], "bins": [-0.7978515625, -0.7734603881835938, -0.7490692138671875, -0.7246780395507812, -0.700286865234375, -0.6758956909179688, -0.6515045166015625, -0.6271133422851562, -0.60272216796875, -0.5783309936523438, -0.5539398193359375, -0.5295486450195312, -0.505157470703125, -0.48076629638671875, -0.4563751220703125, -0.43198394775390625, -0.4075927734375, -0.38320159912109375, -0.3588104248046875, -0.33441925048828125, -0.310028076171875, -0.28563690185546875, -0.2612457275390625, -0.23685455322265625, -0.21246337890625, -0.18807220458984375, -0.1636810302734375, -0.13928985595703125, -0.114898681640625, -0.09050750732421875, -0.0661163330078125, -0.04172515869140625, -0.017333984375, 0.00705718994140625, 0.0314483642578125, 0.05583953857421875, 0.080230712890625, 0.10462188720703125, 0.1290130615234375, 0.15340423583984375, 0.17779541015625, 0.20218658447265625, 0.2265777587890625, 0.25096893310546875, 0.275360107421875, 0.29975128173828125, 0.3241424560546875, 0.34853363037109375, 0.3729248046875, 0.39731597900390625, 0.4217071533203125, 0.44609832763671875, 0.470489501953125, 0.49488067626953125, 0.5192718505859375, 0.5436630249023438, 0.56805419921875, 0.5924453735351562, 0.6168365478515625, 0.6412277221679688, 0.665618896484375, 0.6900100708007812, 0.7144012451171875, 0.7387924194335938, 0.76318359375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 3.0, 3.0, 5.0, 9.0, 10.0, 10.0, 12.0, 20.0, 15.0, 23.0, 30.0, 26.0, 27.0, 44.0, 32.0, 50.0, 35.0, 47.0, 35.0, 46.0, 41.0, 39.0, 51.0, 53.0, 36.0, 35.0, 36.0, 31.0, 20.0, 35.0, 31.0, 20.0, 15.0, 8.0, 16.0, 12.0, 9.0, 9.0, 8.0, 3.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.414306640625, -0.4022560119628906, -0.39020538330078125, -0.3781547546386719, -0.3661041259765625, -0.3540534973144531, -0.34200286865234375, -0.3299522399902344, -0.317901611328125, -0.3058509826660156, -0.29380035400390625, -0.2817497253417969, -0.2696990966796875, -0.2576484680175781, -0.24559783935546875, -0.23354721069335938, -0.22149658203125, -0.20944595336914062, -0.19739532470703125, -0.18534469604492188, -0.1732940673828125, -0.16124343872070312, -0.14919281005859375, -0.13714218139648438, -0.125091552734375, -0.11304092407226562, -0.10099029541015625, -0.08893966674804688, -0.0768890380859375, -0.06483840942382812, -0.05278778076171875, -0.040737152099609375, -0.0286865234375, -0.016635894775390625, -0.00458526611328125, 0.007465362548828125, 0.0195159912109375, 0.031566619873046875, 0.04361724853515625, 0.055667877197265625, 0.067718505859375, 0.07976913452148438, 0.09181976318359375, 0.10387039184570312, 0.1159210205078125, 0.12797164916992188, 0.14002227783203125, 0.15207290649414062, 0.16412353515625, 0.17617416381835938, 0.18822479248046875, 0.20027542114257812, 0.2123260498046875, 0.22437667846679688, 0.23642730712890625, 0.24847793579101562, 0.260528564453125, 0.2725791931152344, 0.28462982177734375, 0.2966804504394531, 0.3087310791015625, 0.3207817077636719, 0.33283233642578125, 0.3448829650878906, 0.35693359375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 8.0, 11.0, 16.0, 22.0, 29.0, 40.0, 70.0, 119.0, 183.0, 355.0, 565.0, 1187.0, 3178.0, 15823.0, 290892.0, 702343.0, 26235.0, 4325.0, 1532.0, 696.0, 355.0, 184.0, 137.0, 91.0, 50.0, 42.0, 22.0, 24.0, 10.0, 7.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-3.525390625, -3.4436187744140625, -3.361846923828125, -3.2800750732421875, -3.19830322265625, -3.1165313720703125, -3.034759521484375, -2.9529876708984375, -2.8712158203125, -2.7894439697265625, -2.707672119140625, -2.6259002685546875, -2.54412841796875, -2.4623565673828125, -2.380584716796875, -2.2988128662109375, -2.217041015625, -2.1352691650390625, -2.053497314453125, -1.9717254638671875, -1.88995361328125, -1.8081817626953125, -1.726409912109375, -1.6446380615234375, -1.5628662109375, -1.4810943603515625, -1.399322509765625, -1.3175506591796875, -1.23577880859375, -1.1540069580078125, -1.072235107421875, -0.9904632568359375, -0.90869140625, -0.8269195556640625, -0.745147705078125, -0.6633758544921875, -0.58160400390625, -0.4998321533203125, -0.418060302734375, -0.3362884521484375, -0.2545166015625, -0.1727447509765625, -0.090972900390625, -0.0092010498046875, 0.07257080078125, 0.1543426513671875, 0.236114501953125, 0.3178863525390625, 0.399658203125, 0.4814300537109375, 0.563201904296875, 0.6449737548828125, 0.72674560546875, 0.8085174560546875, 0.890289306640625, 0.9720611572265625, 1.0538330078125, 1.1356048583984375, 1.217376708984375, 1.2991485595703125, 1.38092041015625, 1.4626922607421875, 1.544464111328125, 1.6262359619140625, 1.7080078125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 1.0, 3.0, 6.0, 8.0, 8.0, 8.0, 10.0, 9.0, 19.0, 23.0, 20.0, 27.0, 22.0, 19.0, 33.0, 35.0, 31.0, 49.0, 34.0, 37.0, 46.0, 45.0, 41.0, 43.0, 46.0, 36.0, 37.0, 39.0, 29.0, 26.0, 25.0, 23.0, 20.0, 18.0, 20.0, 17.0, 20.0, 15.0, 10.0, 12.0, 4.0, 4.0, 12.0, 3.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4658203125, -1.4160919189453125, -1.366363525390625, -1.3166351318359375, -1.26690673828125, -1.2171783447265625, -1.167449951171875, -1.1177215576171875, -1.0679931640625, -1.0182647705078125, -0.968536376953125, -0.9188079833984375, -0.86907958984375, -0.8193511962890625, -0.769622802734375, -0.7198944091796875, -0.670166015625, -0.6204376220703125, -0.570709228515625, -0.5209808349609375, -0.47125244140625, -0.4215240478515625, -0.371795654296875, -0.3220672607421875, -0.2723388671875, -0.2226104736328125, -0.172882080078125, -0.1231536865234375, -0.07342529296875, -0.0236968994140625, 0.026031494140625, 0.0757598876953125, 0.12548828125, 0.1752166748046875, 0.224945068359375, 0.2746734619140625, 0.32440185546875, 0.3741302490234375, 0.423858642578125, 0.4735870361328125, 0.5233154296875, 0.5730438232421875, 0.622772216796875, 0.6725006103515625, 0.72222900390625, 0.7719573974609375, 0.821685791015625, 0.8714141845703125, 0.921142578125, 0.9708709716796875, 1.020599365234375, 1.0703277587890625, 1.12005615234375, 1.1697845458984375, 1.219512939453125, 1.2692413330078125, 1.3189697265625, 1.3686981201171875, 1.418426513671875, 1.4681549072265625, 1.51788330078125, 1.5676116943359375, 1.617340087890625, 1.6670684814453125, 1.716796875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 6.0, 3.0, 2.0, 2.0, 9.0, 10.0, 8.0, 15.0, 34.0, 38.0, 56.0, 86.0, 131.0, 223.0, 508.0, 1282.0, 4100.0, 19070.0, 178930.0, 770038.0, 60354.0, 9499.0, 2425.0, 855.0, 357.0, 183.0, 107.0, 72.0, 46.0, 27.0, 16.0, 18.0, 14.0, 4.0, 4.0, 8.0, 6.0, 4.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.93994140625, -0.9125289916992188, -0.8851165771484375, -0.8577041625976562, -0.830291748046875, -0.8028793334960938, -0.7754669189453125, -0.7480545043945312, -0.72064208984375, -0.6932296752929688, -0.6658172607421875, -0.6384048461914062, -0.610992431640625, -0.5835800170898438, -0.5561676025390625, -0.5287551879882812, -0.5013427734375, -0.47393035888671875, -0.4465179443359375, -0.41910552978515625, -0.391693115234375, -0.36428070068359375, -0.3368682861328125, -0.30945587158203125, -0.28204345703125, -0.25463104248046875, -0.2272186279296875, -0.19980621337890625, -0.172393798828125, -0.14498138427734375, -0.1175689697265625, -0.09015655517578125, -0.062744140625, -0.03533172607421875, -0.0079193115234375, 0.01949310302734375, 0.046905517578125, 0.07431793212890625, 0.1017303466796875, 0.12914276123046875, 0.15655517578125, 0.18396759033203125, 0.2113800048828125, 0.23879241943359375, 0.266204833984375, 0.29361724853515625, 0.3210296630859375, 0.34844207763671875, 0.3758544921875, 0.40326690673828125, 0.4306793212890625, 0.45809173583984375, 0.485504150390625, 0.5129165649414062, 0.5403289794921875, 0.5677413940429688, 0.59515380859375, 0.6225662231445312, 0.6499786376953125, 0.6773910522460938, 0.704803466796875, 0.7322158813476562, 0.7596282958984375, 0.7870407104492188, 0.814453125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 7.0, 5.0, 3.0, 4.0, 5.0, 12.0, 13.0, 12.0, 20.0, 26.0, 39.0, 39.0, 44.0, 84.0, 111.0, 152.0, 120.0, 87.0, 62.0, 45.0, 28.0, 27.0, 13.0, 11.0, 10.0, 7.0, 6.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015616416931152344, -0.0001513790339231491, -0.00014659389853477478, -0.00014180876314640045, -0.00013702362775802612, -0.0001322384923696518, -0.00012745335698127747, -0.00012266822159290314, -0.00011788308620452881, -0.00011309795081615448, -0.00010831281542778015, -0.00010352768003940582, -9.87425446510315e-05, -9.395740926265717e-05, -8.917227387428284e-05, -8.438713848590851e-05, -7.960200309753418e-05, -7.481686770915985e-05, -7.003173232078552e-05, -6.52465969324112e-05, -6.0461461544036865e-05, -5.567632615566254e-05, -5.089119076728821e-05, -4.610605537891388e-05, -4.132091999053955e-05, -3.653578460216522e-05, -3.1750649213790894e-05, -2.6965513825416565e-05, -2.2180378437042236e-05, -1.7395243048667908e-05, -1.2610107660293579e-05, -7.82497227191925e-06, -3.039836883544922e-06, 1.7452985048294067e-06, 6.530433893203735e-06, 1.1315569281578064e-05, 1.6100704669952393e-05, 2.088584005832672e-05, 2.567097544670105e-05, 3.045611083507538e-05, 3.524124622344971e-05, 4.0026381611824036e-05, 4.4811517000198364e-05, 4.959665238857269e-05, 5.438178777694702e-05, 5.916692316532135e-05, 6.395205855369568e-05, 6.873719394207001e-05, 7.352232933044434e-05, 7.830746471881866e-05, 8.309260010719299e-05, 8.787773549556732e-05, 9.266287088394165e-05, 9.744800627231598e-05, 0.00010223314166069031, 0.00010701827704906464, 0.00011180341243743896, 0.0001165885478258133, 0.00012137368321418762, 0.00012615881860256195, 0.00013094395399093628, 0.0001357290893793106, 0.00014051422476768494, 0.00014529936015605927, 0.0001500844955444336]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 3.0, 6.0, 9.0, 12.0, 17.0, 19.0, 26.0, 34.0, 37.0, 67.0, 68.0, 127.0, 239.0, 342.0, 493.0, 973.0, 2062.0, 5295.0, 20831.0, 164623.0, 736617.0, 93607.0, 14755.0, 4296.0, 1778.0, 839.0, 477.0, 295.0, 162.0, 110.0, 88.0, 59.0, 37.0, 22.0, 35.0, 10.0, 18.0, 11.0, 8.0, 10.0, 9.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.619140625, -0.5973281860351562, -0.5755157470703125, -0.5537033081054688, -0.531890869140625, -0.5100784301757812, -0.4882659912109375, -0.46645355224609375, -0.44464111328125, -0.42282867431640625, -0.4010162353515625, -0.37920379638671875, -0.357391357421875, -0.33557891845703125, -0.3137664794921875, -0.29195404052734375, -0.2701416015625, -0.24832916259765625, -0.2265167236328125, -0.20470428466796875, -0.182891845703125, -0.16107940673828125, -0.1392669677734375, -0.11745452880859375, -0.09564208984375, -0.07382965087890625, -0.0520172119140625, -0.03020477294921875, -0.008392333984375, 0.01342010498046875, 0.0352325439453125, 0.05704498291015625, 0.078857421875, 0.10066986083984375, 0.1224822998046875, 0.14429473876953125, 0.166107177734375, 0.18791961669921875, 0.2097320556640625, 0.23154449462890625, 0.25335693359375, 0.27516937255859375, 0.2969818115234375, 0.31879425048828125, 0.340606689453125, 0.36241912841796875, 0.3842315673828125, 0.40604400634765625, 0.4278564453125, 0.44966888427734375, 0.4714813232421875, 0.49329376220703125, 0.515106201171875, 0.5369186401367188, 0.5587310791015625, 0.5805435180664062, 0.60235595703125, 0.6241683959960938, 0.6459808349609375, 0.6677932739257812, 0.689605712890625, 0.7114181518554688, 0.7332305908203125, 0.7550430297851562, 0.77685546875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 7.0, 3.0, 6.0, 8.0, 11.0, 15.0, 17.0, 15.0, 25.0, 44.0, 40.0, 63.0, 79.0, 62.0, 72.0, 84.0, 66.0, 74.0, 67.0, 60.0, 43.0, 37.0, 16.0, 25.0, 14.0, 12.0, 15.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7080078125, -0.6873855590820312, -0.6667633056640625, -0.6461410522460938, -0.625518798828125, -0.6048965454101562, -0.5842742919921875, -0.5636520385742188, -0.54302978515625, -0.5224075317382812, -0.5017852783203125, -0.48116302490234375, -0.460540771484375, -0.43991851806640625, -0.4192962646484375, -0.39867401123046875, -0.3780517578125, -0.35742950439453125, -0.3368072509765625, -0.31618499755859375, -0.295562744140625, -0.27494049072265625, -0.2543182373046875, -0.23369598388671875, -0.21307373046875, -0.19245147705078125, -0.1718292236328125, -0.15120697021484375, -0.130584716796875, -0.10996246337890625, -0.0893402099609375, -0.06871795654296875, -0.048095703125, -0.02747344970703125, -0.0068511962890625, 0.01377105712890625, 0.034393310546875, 0.05501556396484375, 0.0756378173828125, 0.09626007080078125, 0.11688232421875, 0.13750457763671875, 0.1581268310546875, 0.17874908447265625, 0.199371337890625, 0.21999359130859375, 0.2406158447265625, 0.26123809814453125, 0.2818603515625, 0.30248260498046875, 0.3231048583984375, 0.34372711181640625, 0.364349365234375, 0.38497161865234375, 0.4055938720703125, 0.42621612548828125, 0.44683837890625, 0.46746063232421875, 0.4880828857421875, 0.5087051391601562, 0.529327392578125, 0.5499496459960938, 0.5705718994140625, 0.5911941528320312, 0.61181640625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 7.0, 3.0, 7.0, 8.0, 17.0, 40.0, 86.0, 160.0, 215.0, 169.0, 134.0, 84.0, 37.0, 22.0, 7.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.028270721435547, -18.572021484375, -18.115774154663086, -17.65952491760254, -17.203275680541992, -16.747028350830078, -16.29077911376953, -15.834529876708984, -15.378281593322754, -14.922033309936523, -14.465784072875977, -14.009535789489746, -13.553287506103516, -13.097038269042969, -12.640789985656738, -12.184541702270508, -11.728292465209961, -11.27204418182373, -10.815794944763184, -10.359546661376953, -9.903297424316406, -9.447049140930176, -8.990800857543945, -8.534551620483398, -8.078303337097168, -7.622054576873779, -7.165805816650391, -6.70955753326416, -6.2533087730407715, -5.797060012817383, -5.340811729431152, -4.884562969207764, -4.428315162658691, -3.9720664024353027, -3.515817880630493, -3.0595693588256836, -2.603320598602295, -2.1470718383789062, -1.6908233165740967, -1.234574794769287, -0.7783260345458984, -0.3220773935317993, 0.1341712474822998, 0.5904198884963989, 1.046668529510498, 1.5029172897338867, 1.9591658115386963, 2.415414333343506, 2.8716630935668945, 3.327911853790283, 3.7841603755950928, 4.240408897399902, 4.696657657623291, 5.15290641784668, 5.60915470123291, 6.065403461456299, 6.5216522216796875, 6.977900981903076, 7.434149742126465, 7.890398025512695, 8.346647262573242, 8.802895545959473, 9.259143829345703, 9.71539306640625, 10.17164134979248]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 3.0, 8.0, 8.0, 7.0, 18.0, 12.0, 8.0, 13.0, 21.0, 20.0, 36.0, 25.0, 31.0, 27.0, 31.0, 45.0, 52.0, 58.0, 70.0, 46.0, 60.0, 42.0, 47.0, 44.0, 39.0, 35.0, 28.0, 24.0, 27.0, 29.0, 7.0, 12.0, 13.0, 6.0, 13.0, 8.0, 9.0, 10.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.913268089294434, -7.674967288970947, -7.436666488647461, -7.198365688323975, -6.960064888000488, -6.721764087677002, -6.483463287353516, -6.245162010192871, -6.006861686706543, -5.768560886383057, -5.53026008605957, -5.291959285736084, -5.053658485412598, -4.815357685089111, -4.577056884765625, -4.3387556076049805, -4.100454807281494, -3.862154006958008, -3.6238532066345215, -3.385552406311035, -3.147251605987549, -2.9089508056640625, -2.670649766921997, -2.4323489665985107, -2.1940481662750244, -1.955747365951538, -1.7174465656280518, -1.4791456460952759, -1.2408448457717896, -1.0025440454483032, -0.7642431259155273, -0.525942325592041, -0.2876415252685547, -0.04934069514274597, 0.18896013498306274, 0.42726099491119385, 0.6655617952346802, 0.9038625955581665, 1.1421635150909424, 1.3804643154144287, 1.618765115737915, 1.8570659160614014, 2.0953667163848877, 2.333667755126953, 2.5719685554504395, 2.810269355773926, 3.048570156097412, 3.2868709564208984, 3.5251717567443848, 3.763472557067871, 4.001773357391357, 4.240074157714844, 4.47837495803833, 4.716675758361816, 4.954977035522461, 5.193277359008789, 5.431578636169434, 5.66987943649292, 5.908180236816406, 6.146481037139893, 6.384781837463379, 6.623082637786865, 6.861383438110352, 7.099684715270996, 7.337985038757324]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 2.0, 4.0, 6.0, 11.0, 10.0, 12.0, 10.0, 20.0, 26.0, 36.0, 46.0, 57.0, 78.0, 124.0, 157.0, 522.0, 5791.0, 3633993.0, 548781.0, 3539.0, 431.0, 175.0, 124.0, 71.0, 64.0, 50.0, 33.0, 31.0, 18.0, 13.0, 13.0, 11.0, 9.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0], "bins": [-5.41796875, -5.285552978515625, -5.15313720703125, -5.020721435546875, -4.8883056640625, -4.755889892578125, -4.62347412109375, -4.491058349609375, -4.358642578125, -4.226226806640625, -4.09381103515625, -3.961395263671875, -3.8289794921875, -3.696563720703125, -3.56414794921875, -3.431732177734375, -3.29931640625, -3.166900634765625, -3.03448486328125, -2.902069091796875, -2.7696533203125, -2.637237548828125, -2.50482177734375, -2.372406005859375, -2.239990234375, -2.107574462890625, -1.97515869140625, -1.842742919921875, -1.7103271484375, -1.577911376953125, -1.44549560546875, -1.313079833984375, -1.1806640625, -1.048248291015625, -0.91583251953125, -0.783416748046875, -0.6510009765625, -0.518585205078125, -0.38616943359375, -0.253753662109375, -0.121337890625, 0.011077880859375, 0.14349365234375, 0.275909423828125, 0.4083251953125, 0.540740966796875, 0.67315673828125, 0.805572509765625, 0.93798828125, 1.070404052734375, 1.20281982421875, 1.335235595703125, 1.4676513671875, 1.600067138671875, 1.73248291015625, 1.864898681640625, 1.997314453125, 2.129730224609375, 2.26214599609375, 2.394561767578125, 2.5269775390625, 2.659393310546875, 2.79180908203125, 2.924224853515625, 3.056640625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 4.0, 10.0, 5.0, 6.0, 13.0, 8.0, 6.0, 15.0, 9.0, 22.0, 22.0, 26.0, 29.0, 33.0, 39.0, 36.0, 39.0, 38.0, 41.0, 40.0, 46.0, 41.0, 48.0, 47.0, 40.0, 34.0, 33.0, 33.0, 33.0, 29.0, 30.0, 18.0, 21.0, 20.0, 17.0, 18.0, 13.0, 9.0, 6.0, 6.0, 2.0, 6.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.4208984375, -0.408905029296875, -0.39691162109375, -0.384918212890625, -0.3729248046875, -0.360931396484375, -0.34893798828125, -0.336944580078125, -0.324951171875, -0.312957763671875, -0.30096435546875, -0.288970947265625, -0.2769775390625, -0.264984130859375, -0.25299072265625, -0.240997314453125, -0.22900390625, -0.217010498046875, -0.20501708984375, -0.193023681640625, -0.1810302734375, -0.169036865234375, -0.15704345703125, -0.145050048828125, -0.133056640625, -0.121063232421875, -0.10906982421875, -0.097076416015625, -0.0850830078125, -0.073089599609375, -0.06109619140625, -0.049102783203125, -0.037109375, -0.025115966796875, -0.01312255859375, -0.001129150390625, 0.0108642578125, 0.022857666015625, 0.03485107421875, 0.046844482421875, 0.058837890625, 0.070831298828125, 0.08282470703125, 0.094818115234375, 0.1068115234375, 0.118804931640625, 0.13079833984375, 0.142791748046875, 0.15478515625, 0.166778564453125, 0.17877197265625, 0.190765380859375, 0.2027587890625, 0.214752197265625, 0.22674560546875, 0.238739013671875, 0.250732421875, 0.262725830078125, 0.27471923828125, 0.286712646484375, 0.2987060546875, 0.310699462890625, 0.32269287109375, 0.334686279296875, 0.3466796875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 5.0, 8.0, 9.0, 10.0, 10.0, 23.0, 26.0, 37.0, 51.0, 74.0, 133.0, 179.0, 357.0, 670.0, 1391.0, 3621.0, 11198.0, 48686.0, 473145.0, 3432366.0, 181965.0, 28625.0, 7387.0, 2469.0, 905.0, 417.0, 215.0, 100.0, 53.0, 44.0, 36.0, 30.0, 10.0, 5.0, 9.0, 9.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3046875, -1.2630462646484375, -1.221405029296875, -1.1797637939453125, -1.13812255859375, -1.0964813232421875, -1.054840087890625, -1.0131988525390625, -0.9715576171875, -0.9299163818359375, -0.888275146484375, -0.8466339111328125, -0.80499267578125, -0.7633514404296875, -0.721710205078125, -0.6800689697265625, -0.638427734375, -0.5967864990234375, -0.555145263671875, -0.5135040283203125, -0.47186279296875, -0.4302215576171875, -0.388580322265625, -0.3469390869140625, -0.3052978515625, -0.2636566162109375, -0.222015380859375, -0.1803741455078125, -0.13873291015625, -0.0970916748046875, -0.055450439453125, -0.0138092041015625, 0.02783203125, 0.0694732666015625, 0.111114501953125, 0.1527557373046875, 0.19439697265625, 0.2360382080078125, 0.277679443359375, 0.3193206787109375, 0.3609619140625, 0.4026031494140625, 0.444244384765625, 0.4858856201171875, 0.52752685546875, 0.5691680908203125, 0.610809326171875, 0.6524505615234375, 0.694091796875, 0.7357330322265625, 0.777374267578125, 0.8190155029296875, 0.86065673828125, 0.9022979736328125, 0.943939208984375, 0.9855804443359375, 1.0272216796875, 1.0688629150390625, 1.110504150390625, 1.1521453857421875, 1.19378662109375, 1.2354278564453125, 1.277069091796875, 1.3187103271484375, 1.3603515625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 9.0, 9.0, 11.0, 27.0, 63.0, 86.0, 138.0, 279.0, 740.0, 1440.0, 669.0, 253.0, 133.0, 73.0, 54.0, 33.0, 21.0, 12.0, 5.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-2.369140625, -2.3170318603515625, -2.264923095703125, -2.2128143310546875, -2.16070556640625, -2.1085968017578125, -2.056488037109375, -2.0043792724609375, -1.9522705078125, -1.9001617431640625, -1.848052978515625, -1.7959442138671875, -1.74383544921875, -1.6917266845703125, -1.639617919921875, -1.5875091552734375, -1.535400390625, -1.4832916259765625, -1.431182861328125, -1.3790740966796875, -1.32696533203125, -1.2748565673828125, -1.222747802734375, -1.1706390380859375, -1.1185302734375, -1.0664215087890625, -1.014312744140625, -0.9622039794921875, -0.91009521484375, -0.8579864501953125, -0.805877685546875, -0.7537689208984375, -0.70166015625, -0.6495513916015625, -0.597442626953125, -0.5453338623046875, -0.49322509765625, -0.4411163330078125, -0.389007568359375, -0.3368988037109375, -0.2847900390625, -0.2326812744140625, -0.180572509765625, -0.1284637451171875, -0.07635498046875, -0.0242462158203125, 0.027862548828125, 0.0799713134765625, 0.132080078125, 0.1841888427734375, 0.236297607421875, 0.2884063720703125, 0.34051513671875, 0.3926239013671875, 0.444732666015625, 0.4968414306640625, 0.5489501953125, 0.6010589599609375, 0.653167724609375, 0.7052764892578125, 0.75738525390625, 0.8094940185546875, 0.861602783203125, 0.9137115478515625, 0.9658203125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 13.0, 16.0, 28.0, 55.0, 124.0, 187.0, 185.0, 152.0, 96.0, 53.0, 38.0, 17.0, 11.0, 7.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.813339233398438, -11.494658470153809, -11.17597770690918, -10.857297897338867, -10.538617134094238, -10.21993637084961, -9.90125560760498, -9.582574844360352, -9.263895034790039, -8.94521427154541, -8.626533508300781, -8.307853698730469, -7.98917293548584, -7.670492172241211, -7.351811408996582, -7.033130645751953, -6.714449882507324, -6.395769119262695, -6.077088832855225, -5.758408069610596, -5.439727783203125, -5.121047019958496, -4.802366256713867, -4.483685493469238, -4.165005207061768, -3.8463246822357178, -3.527644157409668, -3.208963394165039, -2.8902828693389893, -2.5716023445129395, -2.2529215812683105, -1.9342410564422607, -1.615560531616211, -1.2968800067901611, -0.9781993627548218, -0.6595187783241272, -0.3408381938934326, -0.022157669067382812, 0.29652297496795654, 0.6152036190032959, 0.9338841438293457, 1.2525646686553955, 1.5712453126907349, 1.8899259567260742, 2.208606481552124, 2.527287006378174, 2.8459677696228027, 3.1646482944488525, 3.4833288192749023, 3.802009344100952, 4.120689868927002, 4.439370632171631, 4.758050918579102, 5.0767316818237305, 5.395412445068359, 5.714093208312988, 6.032773494720459, 6.351454257965088, 6.670134544372559, 6.9888153076171875, 7.307496070861816, 7.626176357269287, 7.944857120513916, 8.263537406921387, 8.582218170166016]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 6.0, 1.0, 4.0, 7.0, 9.0, 7.0, 6.0, 11.0, 17.0, 24.0, 21.0, 38.0, 40.0, 34.0, 48.0, 49.0, 51.0, 55.0, 47.0, 63.0, 43.0, 55.0, 37.0, 49.0, 34.0, 42.0, 29.0, 31.0, 29.0, 19.0, 18.0, 19.0, 13.0, 11.0, 10.0, 10.0, 5.0, 6.0, 2.0, 6.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.70717716217041, -5.5248870849609375, -5.342596530914307, -5.160306453704834, -4.978015899658203, -4.7957258224487305, -4.613435745239258, -4.431145668029785, -4.248855113983154, -4.066565036773682, -3.884274482727051, -3.701984405517578, -3.5196940898895264, -3.3374037742614746, -3.155113697052002, -2.97282338142395, -2.7905330657958984, -2.6082427501678467, -2.425952434539795, -2.2436623573303223, -2.0613720417022705, -1.8790817260742188, -1.6967915296554565, -1.5145013332366943, -1.3322110176086426, -1.1499207019805908, -0.9676305055618286, -0.7853402495384216, -0.6030499935150146, -0.42075973749160767, -0.23846948146820068, -0.05617928504943848, 0.12611103057861328, 0.30840128660202026, 0.49069154262542725, 0.6729817986488342, 0.8552720546722412, 1.037562370300293, 1.2198525667190552, 1.4021427631378174, 1.5844330787658691, 1.766723394393921, 1.949013590812683, 2.1313037872314453, 2.313594102859497, 2.495884418487549, 2.6781744956970215, 2.8604648113250732, 3.042755126953125, 3.2250454425811768, 3.4073357582092285, 3.589625835418701, 3.771916151046753, 3.9542064666748047, 4.136496543884277, 4.31878662109375, 4.501077175140381, 4.6833672523498535, 4.865657806396484, 5.047947883605957, 5.23023796081543, 5.4125285148620605, 5.594818592071533, 5.777109146118164, 5.959399223327637]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 9.0, 8.0, 9.0, 19.0, 33.0, 36.0, 52.0, 89.0, 129.0, 156.0, 226.0, 346.0, 565.0, 845.0, 1353.0, 2293.0, 3894.0, 6750.0, 13094.0, 27481.0, 68738.0, 211975.0, 421322.0, 178070.0, 59245.0, 24675.0, 11877.0, 6239.0, 3449.0, 1996.0, 1233.0, 774.0, 515.0, 322.0, 205.0, 153.0, 96.0, 73.0, 63.0, 45.0, 26.0, 24.0, 9.0, 8.0, 9.0, 8.0, 4.0, 4.0, 2.0, 0.0, 4.0, 2.0], "bins": [-0.859375, -0.83441162109375, -0.8094482421875, -0.78448486328125, -0.759521484375, -0.73455810546875, -0.7095947265625, -0.68463134765625, -0.65966796875, -0.63470458984375, -0.6097412109375, -0.58477783203125, -0.559814453125, -0.53485107421875, -0.5098876953125, -0.48492431640625, -0.4599609375, -0.43499755859375, -0.4100341796875, -0.38507080078125, -0.360107421875, -0.33514404296875, -0.3101806640625, -0.28521728515625, -0.26025390625, -0.23529052734375, -0.2103271484375, -0.18536376953125, -0.160400390625, -0.13543701171875, -0.1104736328125, -0.08551025390625, -0.060546875, -0.03558349609375, -0.0106201171875, 0.01434326171875, 0.039306640625, 0.06427001953125, 0.0892333984375, 0.11419677734375, 0.13916015625, 0.16412353515625, 0.1890869140625, 0.21405029296875, 0.239013671875, 0.26397705078125, 0.2889404296875, 0.31390380859375, 0.3388671875, 0.36383056640625, 0.3887939453125, 0.41375732421875, 0.438720703125, 0.46368408203125, 0.4886474609375, 0.51361083984375, 0.53857421875, 0.56353759765625, 0.5885009765625, 0.61346435546875, 0.638427734375, 0.66339111328125, 0.6883544921875, 0.71331787109375, 0.73828125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 7.0, 2.0, 7.0, 4.0, 7.0, 12.0, 8.0, 11.0, 13.0, 19.0, 18.0, 20.0, 30.0, 29.0, 31.0, 35.0, 36.0, 37.0, 49.0, 43.0, 37.0, 44.0, 49.0, 38.0, 42.0, 31.0, 39.0, 43.0, 26.0, 36.0, 34.0, 33.0, 26.0, 14.0, 17.0, 15.0, 16.0, 9.0, 11.0, 8.0, 3.0, 3.0, 3.0, 6.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.39990234375, -0.38779449462890625, -0.3756866455078125, -0.36357879638671875, -0.351470947265625, -0.33936309814453125, -0.3272552490234375, -0.31514739990234375, -0.30303955078125, -0.29093170166015625, -0.2788238525390625, -0.26671600341796875, -0.254608154296875, -0.24250030517578125, -0.2303924560546875, -0.21828460693359375, -0.2061767578125, -0.19406890869140625, -0.1819610595703125, -0.16985321044921875, -0.157745361328125, -0.14563751220703125, -0.1335296630859375, -0.12142181396484375, -0.10931396484375, -0.09720611572265625, -0.0850982666015625, -0.07299041748046875, -0.060882568359375, -0.04877471923828125, -0.0366668701171875, -0.02455902099609375, -0.012451171875, -0.00034332275390625, 0.0117645263671875, 0.02387237548828125, 0.035980224609375, 0.04808807373046875, 0.0601959228515625, 0.07230377197265625, 0.08441162109375, 0.09651947021484375, 0.1086273193359375, 0.12073516845703125, 0.132843017578125, 0.14495086669921875, 0.1570587158203125, 0.16916656494140625, 0.1812744140625, 0.19338226318359375, 0.2054901123046875, 0.21759796142578125, 0.229705810546875, 0.24181365966796875, 0.2539215087890625, 0.26602935791015625, 0.27813720703125, 0.29024505615234375, 0.3023529052734375, 0.31446075439453125, 0.326568603515625, 0.33867645263671875, 0.3507843017578125, 0.36289215087890625, 0.375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 6.0, 3.0, 12.0, 3.0, 11.0, 13.0, 18.0, 22.0, 35.0, 44.0, 55.0, 95.0, 119.0, 210.0, 312.0, 428.0, 792.0, 1408.0, 3051.0, 8112.0, 28551.0, 154572.0, 688934.0, 123544.0, 24773.0, 7256.0, 2836.0, 1355.0, 694.0, 404.0, 250.0, 193.0, 138.0, 80.0, 56.0, 39.0, 30.0, 24.0, 19.0, 5.0, 14.0, 14.0, 6.0, 11.0, 1.0, 1.0, 0.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-1.3291015625, -1.286834716796875, -1.24456787109375, -1.202301025390625, -1.1600341796875, -1.117767333984375, -1.07550048828125, -1.033233642578125, -0.990966796875, -0.948699951171875, -0.90643310546875, -0.864166259765625, -0.8218994140625, -0.779632568359375, -0.73736572265625, -0.695098876953125, -0.65283203125, -0.610565185546875, -0.56829833984375, -0.526031494140625, -0.4837646484375, -0.441497802734375, -0.39923095703125, -0.356964111328125, -0.314697265625, -0.272430419921875, -0.23016357421875, -0.187896728515625, -0.1456298828125, -0.103363037109375, -0.06109619140625, -0.018829345703125, 0.0234375, 0.065704345703125, 0.10797119140625, 0.150238037109375, 0.1925048828125, 0.234771728515625, 0.27703857421875, 0.319305419921875, 0.361572265625, 0.403839111328125, 0.44610595703125, 0.488372802734375, 0.5306396484375, 0.572906494140625, 0.61517333984375, 0.657440185546875, 0.69970703125, 0.741973876953125, 0.78424072265625, 0.826507568359375, 0.8687744140625, 0.911041259765625, 0.95330810546875, 0.995574951171875, 1.037841796875, 1.080108642578125, 1.12237548828125, 1.164642333984375, 1.2069091796875, 1.249176025390625, 1.29144287109375, 1.333709716796875, 1.3759765625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 8.0, 4.0, 8.0, 9.0, 8.0, 10.0, 27.0, 15.0, 20.0, 23.0, 40.0, 47.0, 43.0, 50.0, 52.0, 32.0, 63.0, 53.0, 60.0, 47.0, 50.0, 32.0, 32.0, 49.0, 37.0, 28.0, 15.0, 26.0, 13.0, 23.0, 15.0, 11.0, 11.0, 7.0, 5.0, 10.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8134765625, -1.75640869140625, -1.6993408203125, -1.64227294921875, -1.585205078125, -1.52813720703125, -1.4710693359375, -1.41400146484375, -1.35693359375, -1.29986572265625, -1.2427978515625, -1.18572998046875, -1.128662109375, -1.07159423828125, -1.0145263671875, -0.95745849609375, -0.900390625, -0.84332275390625, -0.7862548828125, -0.72918701171875, -0.672119140625, -0.61505126953125, -0.5579833984375, -0.50091552734375, -0.44384765625, -0.38677978515625, -0.3297119140625, -0.27264404296875, -0.215576171875, -0.15850830078125, -0.1014404296875, -0.04437255859375, 0.0126953125, 0.06976318359375, 0.1268310546875, 0.18389892578125, 0.240966796875, 0.29803466796875, 0.3551025390625, 0.41217041015625, 0.46923828125, 0.52630615234375, 0.5833740234375, 0.64044189453125, 0.697509765625, 0.75457763671875, 0.8116455078125, 0.86871337890625, 0.92578125, 0.98284912109375, 1.0399169921875, 1.09698486328125, 1.154052734375, 1.21112060546875, 1.2681884765625, 1.32525634765625, 1.38232421875, 1.43939208984375, 1.4964599609375, 1.55352783203125, 1.610595703125, 1.66766357421875, 1.7247314453125, 1.78179931640625, 1.8388671875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 12.0, 33.0, 33.0, 55.0, 94.0, 179.0, 384.0, 819.0, 2499.0, 11177.0, 103779.0, 821348.0, 93571.0, 10652.0, 2375.0, 788.0, 333.0, 172.0, 91.0, 50.0, 31.0, 33.0, 13.0, 9.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87548828125, -0.8476791381835938, -0.8198699951171875, -0.7920608520507812, -0.764251708984375, -0.7364425659179688, -0.7086334228515625, -0.6808242797851562, -0.65301513671875, -0.6252059936523438, -0.5973968505859375, -0.5695877075195312, -0.541778564453125, -0.5139694213867188, -0.4861602783203125, -0.45835113525390625, -0.4305419921875, -0.40273284912109375, -0.3749237060546875, -0.34711456298828125, -0.319305419921875, -0.29149627685546875, -0.2636871337890625, -0.23587799072265625, -0.20806884765625, -0.18025970458984375, -0.1524505615234375, -0.12464141845703125, -0.096832275390625, -0.06902313232421875, -0.0412139892578125, -0.01340484619140625, 0.014404296875, 0.04221343994140625, 0.0700225830078125, 0.09783172607421875, 0.125640869140625, 0.15345001220703125, 0.1812591552734375, 0.20906829833984375, 0.23687744140625, 0.26468658447265625, 0.2924957275390625, 0.32030487060546875, 0.348114013671875, 0.37592315673828125, 0.4037322998046875, 0.43154144287109375, 0.4593505859375, 0.48715972900390625, 0.5149688720703125, 0.5427780151367188, 0.570587158203125, 0.5983963012695312, 0.6262054443359375, 0.6540145874023438, 0.68182373046875, 0.7096328735351562, 0.7374420166015625, 0.7652511596679688, 0.793060302734375, 0.8208694458007812, 0.8486785888671875, 0.8764877319335938, 0.904296875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 6.0, 1.0, 7.0, 9.0, 15.0, 23.0, 21.0, 35.0, 69.0, 99.0, 124.0, 141.0, 132.0, 97.0, 67.0, 50.0, 29.0, 17.0, 14.0, 20.0, 11.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014865398406982422, -0.00014394335448741913, -0.00013923272490501404, -0.00013452209532260895, -0.00012981146574020386, -0.00012510083615779877, -0.00012039020657539368, -0.00011567957699298859, -0.0001109689474105835, -0.0001062583178281784, -0.00010154768824577332, -9.683705866336823e-05, -9.212642908096313e-05, -8.741579949855804e-05, -8.270516991615295e-05, -7.799454033374786e-05, -7.328391075134277e-05, -6.857328116893768e-05, -6.386265158653259e-05, -5.91520220041275e-05, -5.444139242172241e-05, -4.973076283931732e-05, -4.502013325691223e-05, -4.030950367450714e-05, -3.559887409210205e-05, -3.088824450969696e-05, -2.617761492729187e-05, -2.146698534488678e-05, -1.675635576248169e-05, -1.2045726180076599e-05, -7.335096597671509e-06, -2.6244670152664185e-06, 2.086162567138672e-06, 6.796792149543762e-06, 1.1507421731948853e-05, 1.6218051314353943e-05, 2.0928680896759033e-05, 2.5639310479164124e-05, 3.0349940061569214e-05, 3.5060569643974304e-05, 3.9771199226379395e-05, 4.4481828808784485e-05, 4.9192458391189575e-05, 5.3903087973594666e-05, 5.8613717555999756e-05, 6.332434713840485e-05, 6.803497672080994e-05, 7.274560630321503e-05, 7.745623588562012e-05, 8.216686546802521e-05, 8.68774950504303e-05, 9.158812463283539e-05, 9.629875421524048e-05, 0.00010100938379764557, 0.00010572001338005066, 0.00011043064296245575, 0.00011514127254486084, 0.00011985190212726593, 0.00012456253170967102, 0.0001292731612920761, 0.0001339837908744812, 0.0001386944204568863, 0.00014340505003929138, 0.00014811567962169647, 0.00015282630920410156]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 6.0, 5.0, 8.0, 6.0, 10.0, 15.0, 29.0, 25.0, 69.0, 118.0, 196.0, 356.0, 939.0, 2834.0, 11979.0, 120184.0, 813939.0, 84034.0, 9785.0, 2380.0, 840.0, 331.0, 176.0, 101.0, 70.0, 46.0, 29.0, 9.0, 10.0, 8.0, 8.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8828125, -0.857177734375, -0.83154296875, -0.805908203125, -0.7802734375, -0.754638671875, -0.72900390625, -0.703369140625, -0.677734375, -0.652099609375, -0.62646484375, -0.600830078125, -0.5751953125, -0.549560546875, -0.52392578125, -0.498291015625, -0.47265625, -0.447021484375, -0.42138671875, -0.395751953125, -0.3701171875, -0.344482421875, -0.31884765625, -0.293212890625, -0.267578125, -0.241943359375, -0.21630859375, -0.190673828125, -0.1650390625, -0.139404296875, -0.11376953125, -0.088134765625, -0.0625, -0.036865234375, -0.01123046875, 0.014404296875, 0.0400390625, 0.065673828125, 0.09130859375, 0.116943359375, 0.142578125, 0.168212890625, 0.19384765625, 0.219482421875, 0.2451171875, 0.270751953125, 0.29638671875, 0.322021484375, 0.34765625, 0.373291015625, 0.39892578125, 0.424560546875, 0.4501953125, 0.475830078125, 0.50146484375, 0.527099609375, 0.552734375, 0.578369140625, 0.60400390625, 0.629638671875, 0.6552734375, 0.680908203125, 0.70654296875, 0.732177734375, 0.7578125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 2.0, 3.0, 0.0, 3.0, 9.0, 4.0, 11.0, 13.0, 12.0, 17.0, 36.0, 33.0, 81.0, 81.0, 113.0, 120.0, 113.0, 96.0, 69.0, 51.0, 54.0, 34.0, 18.0, 11.0, 6.0, 7.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7978515625, -0.7727813720703125, -0.747711181640625, -0.7226409912109375, -0.69757080078125, -0.6725006103515625, -0.647430419921875, -0.6223602294921875, -0.5972900390625, -0.5722198486328125, -0.547149658203125, -0.5220794677734375, -0.49700927734375, -0.4719390869140625, -0.446868896484375, -0.4217987060546875, -0.396728515625, -0.3716583251953125, -0.346588134765625, -0.3215179443359375, -0.29644775390625, -0.2713775634765625, -0.246307373046875, -0.2212371826171875, -0.1961669921875, -0.1710968017578125, -0.146026611328125, -0.1209564208984375, -0.09588623046875, -0.0708160400390625, -0.045745849609375, -0.0206756591796875, 0.00439453125, 0.0294647216796875, 0.054534912109375, 0.0796051025390625, 0.10467529296875, 0.1297454833984375, 0.154815673828125, 0.1798858642578125, 0.2049560546875, 0.2300262451171875, 0.255096435546875, 0.2801666259765625, 0.30523681640625, 0.3303070068359375, 0.355377197265625, 0.3804473876953125, 0.405517578125, 0.4305877685546875, 0.455657958984375, 0.4807281494140625, 0.50579833984375, 0.5308685302734375, 0.555938720703125, 0.5810089111328125, 0.6060791015625, 0.6311492919921875, 0.656219482421875, 0.6812896728515625, 0.70635986328125, 0.7314300537109375, 0.756500244140625, 0.7815704345703125, 0.806640625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 7.0, 7.0, 22.0, 90.0, 284.0, 347.0, 167.0, 46.0, 12.0, 11.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.624963760375977, -11.888132095336914, -11.151300430297852, -10.414468765258789, -9.677637100219727, -8.940805435180664, -8.203972816467285, -7.467141151428223, -6.73030948638916, -5.993477821350098, -5.256646156311035, -4.5198140144348145, -3.782982349395752, -3.0461506843566895, -2.3093185424804688, -1.5724868774414062, -0.8356552124023438, -0.0988234281539917, 0.6380083560943604, 1.374840259552002, 2.1116719245910645, 2.848503589630127, 3.5853357315063477, 4.32216739654541, 5.058999061584473, 5.795830726623535, 6.532662391662598, 7.269494533538818, 8.006326675415039, 8.743158340454102, 9.479990005493164, 10.216821670532227, 10.953655242919922, 11.690486907958984, 12.427318572998047, 13.16415023803711, 13.900981903076172, 14.637813568115234, 15.374646186828613, 16.11147689819336, 16.848308563232422, 17.585140228271484, 18.321971893310547, 19.05880355834961, 19.795635223388672, 20.532466888427734, 21.269298553466797, 22.00613021850586, 22.742963790893555, 23.479795455932617, 24.21662712097168, 24.953458786010742, 25.690290451049805, 26.427122116088867, 27.163955688476562, 27.900787353515625, 28.637619018554688, 29.37445068359375, 30.111282348632812, 30.848114013671875, 31.584945678710938, 32.32177734375, 33.05860900878906, 33.795440673828125, 34.53227233886719]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 12.0, 5.0, 12.0, 16.0, 15.0, 21.0, 22.0, 33.0, 35.0, 44.0, 42.0, 43.0, 64.0, 68.0, 69.0, 71.0, 60.0, 42.0, 43.0, 39.0, 32.0, 42.0, 26.0, 33.0, 24.0, 18.0, 13.0, 13.0, 11.0, 6.0, 9.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.997458457946777, -7.728933334350586, -7.4604082107543945, -7.191883087158203, -6.923357963562012, -6.65483283996582, -6.386307716369629, -6.1177825927734375, -5.849257469177246, -5.580732345581055, -5.312207221984863, -5.043682098388672, -4.7751569747924805, -4.506631851196289, -4.238106727600098, -3.9695816040039062, -3.701056480407715, -3.4325313568115234, -3.164006233215332, -2.8954811096191406, -2.626955986022949, -2.358430862426758, -2.0899057388305664, -1.821380615234375, -1.5528554916381836, -1.2843303680419922, -1.0158052444458008, -0.7472801208496094, -0.47875499725341797, -0.21022987365722656, 0.058295249938964844, 0.32682037353515625, 0.5953445434570312, 0.8638696670532227, 1.132394790649414, 1.4009199142456055, 1.6694450378417969, 1.9379701614379883, 2.2064952850341797, 2.475020408630371, 2.7435455322265625, 3.012070655822754, 3.2805957794189453, 3.5491209030151367, 3.817646026611328, 4.0861711502075195, 4.354696273803711, 4.623221397399902, 4.891746520996094, 5.160271644592285, 5.428796768188477, 5.697321891784668, 5.965847015380859, 6.234372138977051, 6.502897262573242, 6.771422386169434, 7.039947509765625, 7.308472633361816, 7.576997756958008, 7.845522880554199, 8.11404800415039, 8.382573127746582, 8.651098251342773, 8.919623374938965, 9.188148498535156]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 5.0, 12.0, 31.0, 40.0, 63.0, 103.0, 221.0, 389.0, 838.0, 1792.0, 3833.0, 8973.0, 23283.0, 68990.0, 281105.0, 1705817.0, 1712084.0, 278263.0, 68271.0, 23154.0, 9104.0, 3957.0, 1909.0, 898.0, 479.0, 260.0, 157.0, 92.0, 69.0, 29.0, 15.0, 12.0, 14.0, 8.0, 4.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54345703125, -0.5264739990234375, -0.509490966796875, -0.4925079345703125, -0.47552490234375, -0.4585418701171875, -0.441558837890625, -0.4245758056640625, -0.4075927734375, -0.3906097412109375, -0.373626708984375, -0.3566436767578125, -0.33966064453125, -0.3226776123046875, -0.305694580078125, -0.2887115478515625, -0.271728515625, -0.2547454833984375, -0.237762451171875, -0.2207794189453125, -0.20379638671875, -0.1868133544921875, -0.169830322265625, -0.1528472900390625, -0.1358642578125, -0.1188812255859375, -0.101898193359375, -0.0849151611328125, -0.06793212890625, -0.0509490966796875, -0.033966064453125, -0.0169830322265625, 0.0, 0.0169830322265625, 0.033966064453125, 0.0509490966796875, 0.06793212890625, 0.0849151611328125, 0.101898193359375, 0.1188812255859375, 0.1358642578125, 0.1528472900390625, 0.169830322265625, 0.1868133544921875, 0.20379638671875, 0.2207794189453125, 0.237762451171875, 0.2547454833984375, 0.271728515625, 0.2887115478515625, 0.305694580078125, 0.3226776123046875, 0.33966064453125, 0.3566436767578125, 0.373626708984375, 0.3906097412109375, 0.4075927734375, 0.4245758056640625, 0.441558837890625, 0.4585418701171875, 0.47552490234375, 0.4925079345703125, 0.509490966796875, 0.5264739990234375, 0.54345703125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 6.0, 7.0, 7.0, 13.0, 9.0, 16.0, 16.0, 21.0, 27.0, 23.0, 40.0, 19.0, 30.0, 39.0, 45.0, 44.0, 40.0, 50.0, 47.0, 56.0, 46.0, 50.0, 45.0, 31.0, 38.0, 39.0, 32.0, 23.0, 18.0, 28.0, 16.0, 16.0, 11.0, 11.0, 16.0, 6.0, 6.0, 2.0, 4.0, 6.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.415283203125, -0.4037017822265625, -0.392120361328125, -0.3805389404296875, -0.36895751953125, -0.3573760986328125, -0.345794677734375, -0.3342132568359375, -0.3226318359375, -0.3110504150390625, -0.299468994140625, -0.2878875732421875, -0.27630615234375, -0.2647247314453125, -0.253143310546875, -0.2415618896484375, -0.22998046875, -0.2183990478515625, -0.206817626953125, -0.1952362060546875, -0.18365478515625, -0.1720733642578125, -0.160491943359375, -0.1489105224609375, -0.1373291015625, -0.1257476806640625, -0.114166259765625, -0.1025848388671875, -0.09100341796875, -0.0794219970703125, -0.067840576171875, -0.0562591552734375, -0.044677734375, -0.0330963134765625, -0.021514892578125, -0.0099334716796875, 0.00164794921875, 0.0132293701171875, 0.024810791015625, 0.0363922119140625, 0.0479736328125, 0.0595550537109375, 0.071136474609375, 0.0827178955078125, 0.09429931640625, 0.1058807373046875, 0.117462158203125, 0.1290435791015625, 0.140625, 0.1522064208984375, 0.163787841796875, 0.1753692626953125, 0.18695068359375, 0.1985321044921875, 0.210113525390625, 0.2216949462890625, 0.2332763671875, 0.2448577880859375, 0.256439208984375, 0.2680206298828125, 0.27960205078125, 0.2911834716796875, 0.302764892578125, 0.3143463134765625, 0.325927734375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 10.0, 7.0, 9.0, 11.0, 22.0, 36.0, 36.0, 72.0, 109.0, 233.0, 383.0, 870.0, 1772.0, 4702.0, 15265.0, 67372.0, 609664.0, 3175940.0, 261040.0, 40135.0, 9961.0, 3407.0, 1470.0, 782.0, 378.0, 225.0, 130.0, 86.0, 44.0, 33.0, 26.0, 26.0, 9.0, 6.0, 6.0, 4.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.904296875, -0.869964599609375, -0.83563232421875, -0.801300048828125, -0.7669677734375, -0.732635498046875, -0.69830322265625, -0.663970947265625, -0.629638671875, -0.595306396484375, -0.56097412109375, -0.526641845703125, -0.4923095703125, -0.457977294921875, -0.42364501953125, -0.389312744140625, -0.35498046875, -0.320648193359375, -0.28631591796875, -0.251983642578125, -0.2176513671875, -0.183319091796875, -0.14898681640625, -0.114654541015625, -0.080322265625, -0.045989990234375, -0.01165771484375, 0.022674560546875, 0.0570068359375, 0.091339111328125, 0.12567138671875, 0.160003662109375, 0.1943359375, 0.228668212890625, 0.26300048828125, 0.297332763671875, 0.3316650390625, 0.365997314453125, 0.40032958984375, 0.434661865234375, 0.468994140625, 0.503326416015625, 0.53765869140625, 0.571990966796875, 0.6063232421875, 0.640655517578125, 0.67498779296875, 0.709320068359375, 0.74365234375, 0.777984619140625, 0.81231689453125, 0.846649169921875, 0.8809814453125, 0.915313720703125, 0.94964599609375, 0.983978271484375, 1.018310546875, 1.052642822265625, 1.08697509765625, 1.121307373046875, 1.1556396484375, 1.189971923828125, 1.22430419921875, 1.258636474609375, 1.29296875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 5.0, 2.0, 8.0, 17.0, 17.0, 21.0, 23.0, 38.0, 55.0, 69.0, 89.0, 178.0, 255.0, 480.0, 693.0, 810.0, 487.0, 267.0, 184.0, 102.0, 69.0, 56.0, 35.0, 19.0, 32.0, 18.0, 12.0, 5.0, 6.0, 6.0, 4.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.28515625, -1.24627685546875, -1.2073974609375, -1.16851806640625, -1.129638671875, -1.09075927734375, -1.0518798828125, -1.01300048828125, -0.97412109375, -0.93524169921875, -0.8963623046875, -0.85748291015625, -0.818603515625, -0.77972412109375, -0.7408447265625, -0.70196533203125, -0.6630859375, -0.62420654296875, -0.5853271484375, -0.54644775390625, -0.507568359375, -0.46868896484375, -0.4298095703125, -0.39093017578125, -0.35205078125, -0.31317138671875, -0.2742919921875, -0.23541259765625, -0.196533203125, -0.15765380859375, -0.1187744140625, -0.07989501953125, -0.041015625, -0.00213623046875, 0.0367431640625, 0.07562255859375, 0.114501953125, 0.15338134765625, 0.1922607421875, 0.23114013671875, 0.27001953125, 0.30889892578125, 0.3477783203125, 0.38665771484375, 0.425537109375, 0.46441650390625, 0.5032958984375, 0.54217529296875, 0.5810546875, 0.61993408203125, 0.6588134765625, 0.69769287109375, 0.736572265625, 0.77545166015625, 0.8143310546875, 0.85321044921875, 0.89208984375, 0.93096923828125, 0.9698486328125, 1.00872802734375, 1.047607421875, 1.08648681640625, 1.1253662109375, 1.16424560546875, 1.203125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 11.0, 15.0, 101.0, 270.0, 331.0, 167.0, 59.0, 17.0, 8.0, 6.0, 8.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.306692123413086, -21.613309860229492, -20.91992950439453, -20.226547241210938, -19.533164978027344, -18.83978271484375, -18.146400451660156, -17.453020095825195, -16.7596378326416, -16.066255569458008, -15.37287425994873, -14.679492950439453, -13.98611068725586, -13.292728424072266, -12.599347114562988, -11.905965805053711, -11.212583541870117, -10.519201278686523, -9.825819969177246, -9.132438659667969, -8.439056396484375, -7.7456746101379395, -7.052292823791504, -6.358911037445068, -5.665529251098633, -4.972147464752197, -4.278765678405762, -3.585383892059326, -2.8920021057128906, -2.198620319366455, -1.5052385330200195, -0.811856746673584, -0.11847305297851562, 0.5749087333679199, 1.2682905197143555, 1.961672306060791, 2.6550540924072266, 3.348435878753662, 4.041817665100098, 4.735199451446533, 5.428581237792969, 6.121963024139404, 6.81534481048584, 7.508726596832275, 8.202108383178711, 8.895490646362305, 9.588871955871582, 10.28225326538086, 10.975635528564453, 11.669017791748047, 12.362399101257324, 13.055780410766602, 13.749162673950195, 14.442544937133789, 15.135926246643066, 15.829307556152344, 16.522689819335938, 17.21607208251953, 17.909454345703125, 18.602834701538086, 19.29621696472168, 19.989599227905273, 20.682979583740234, 21.376361846923828, 22.069744110107422]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 7.0, 8.0, 10.0, 19.0, 23.0, 26.0, 23.0, 39.0, 30.0, 30.0, 33.0, 35.0, 44.0, 50.0, 67.0, 52.0, 45.0, 46.0, 54.0, 50.0, 44.0, 42.0, 39.0, 29.0, 28.0, 20.0, 23.0, 22.0, 11.0, 8.0, 8.0, 9.0, 8.0, 4.0, 4.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0], "bins": [-7.245875358581543, -7.0493292808532715, -6.852783203125, -6.656237602233887, -6.459691524505615, -6.263145446777344, -6.066599369049072, -5.870053291320801, -5.673507213592529, -5.476961135864258, -5.280415058135986, -5.083868980407715, -4.887323379516602, -4.69077730178833, -4.494231224060059, -4.297685146331787, -4.101139068603516, -3.904592990875244, -3.7080471515655518, -3.5115010738372803, -3.314954996109009, -3.1184091567993164, -2.921863079071045, -2.7253170013427734, -2.52877140045166, -2.3322253227233887, -2.1356794834136963, -1.9391334056854248, -1.7425873279571533, -1.5460413694381714, -1.3494954109191895, -1.152949333190918, -0.9564032554626465, -0.7598572373390198, -0.5633112192153931, -0.36676526069641113, -0.17021924257278442, 0.026326775550842285, 0.22287273406982422, 0.4194188117980957, 0.6159647703170776, 0.8125107884407043, 1.009056806564331, 1.205602765083313, 1.402148723602295, 1.5986948013305664, 1.7952407598495483, 1.9917868375778198, 2.1883327960968018, 2.3848788738250732, 2.5814247131347656, 2.777970790863037, 2.9745168685913086, 3.17106294631958, 3.3676087856292725, 3.564154863357544, 3.7607007026672363, 3.957246780395508, 4.153792858123779, 4.350338935852051, 4.546884536743164, 4.7434306144714355, 4.939976692199707, 5.1365227699279785, 5.33306884765625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 1.0, 9.0, 13.0, 19.0, 21.0, 29.0, 40.0, 66.0, 124.0, 173.0, 266.0, 397.0, 569.0, 880.0, 1342.0, 2218.0, 3579.0, 6044.0, 10153.0, 18119.0, 32708.0, 60108.0, 115842.0, 226203.0, 261629.0, 143296.0, 73241.0, 39334.0, 21734.0, 12076.0, 7087.0, 4133.0, 2556.0, 1622.0, 974.0, 640.0, 443.0, 289.0, 204.0, 120.0, 73.0, 67.0, 35.0, 13.0, 21.0, 17.0, 7.0, 7.0, 9.0, 4.0, 0.0, 3.0, 2.0, 3.0], "bins": [-0.59228515625, -0.5749435424804688, -0.5576019287109375, -0.5402603149414062, -0.522918701171875, -0.5055770874023438, -0.4882354736328125, -0.47089385986328125, -0.45355224609375, -0.43621063232421875, -0.4188690185546875, -0.40152740478515625, -0.384185791015625, -0.36684417724609375, -0.3495025634765625, -0.33216094970703125, -0.3148193359375, -0.29747772216796875, -0.2801361083984375, -0.26279449462890625, -0.245452880859375, -0.22811126708984375, -0.2107696533203125, -0.19342803955078125, -0.17608642578125, -0.15874481201171875, -0.1414031982421875, -0.12406158447265625, -0.106719970703125, -0.08937835693359375, -0.0720367431640625, -0.05469512939453125, -0.037353515625, -0.02001190185546875, -0.0026702880859375, 0.01467132568359375, 0.032012939453125, 0.04935455322265625, 0.0666961669921875, 0.08403778076171875, 0.10137939453125, 0.11872100830078125, 0.1360626220703125, 0.15340423583984375, 0.170745849609375, 0.18808746337890625, 0.2054290771484375, 0.22277069091796875, 0.2401123046875, 0.25745391845703125, 0.2747955322265625, 0.29213714599609375, 0.309478759765625, 0.32682037353515625, 0.3441619873046875, 0.36150360107421875, 0.37884521484375, 0.39618682861328125, 0.4135284423828125, 0.43087005615234375, 0.448211669921875, 0.46555328369140625, 0.4828948974609375, 0.5002365112304688, 0.517578125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 8.0, 4.0, 8.0, 10.0, 9.0, 11.0, 15.0, 21.0, 24.0, 23.0, 30.0, 21.0, 28.0, 30.0, 30.0, 30.0, 36.0, 51.0, 40.0, 29.0, 54.0, 44.0, 43.0, 31.0, 33.0, 43.0, 29.0, 29.0, 33.0, 28.0, 24.0, 19.0, 18.0, 17.0, 21.0, 13.0, 12.0, 8.0, 4.0, 11.0, 4.0, 6.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.335205078125, -0.3251953125, -0.315185546875, -0.30517578125, -0.295166015625, -0.28515625, -0.275146484375, -0.26513671875, -0.255126953125, -0.2451171875, -0.235107421875, -0.22509765625, -0.215087890625, -0.205078125, -0.195068359375, -0.18505859375, -0.175048828125, -0.1650390625, -0.155029296875, -0.14501953125, -0.135009765625, -0.125, -0.114990234375, -0.10498046875, -0.094970703125, -0.0849609375, -0.074951171875, -0.06494140625, -0.054931640625, -0.044921875, -0.034912109375, -0.02490234375, -0.014892578125, -0.0048828125, 0.005126953125, 0.01513671875, 0.025146484375, 0.03515625, 0.045166015625, 0.05517578125, 0.065185546875, 0.0751953125, 0.085205078125, 0.09521484375, 0.105224609375, 0.115234375, 0.125244140625, 0.13525390625, 0.145263671875, 0.1552734375, 0.165283203125, 0.17529296875, 0.185302734375, 0.1953125, 0.205322265625, 0.21533203125, 0.225341796875, 0.2353515625, 0.245361328125, 0.25537109375, 0.265380859375, 0.275390625, 0.285400390625, 0.29541015625, 0.305419921875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 6.0, 9.0, 13.0, 16.0, 18.0, 30.0, 46.0, 72.0, 113.0, 177.0, 267.0, 387.0, 589.0, 1053.0, 1992.0, 4941.0, 20159.0, 193621.0, 749691.0, 59015.0, 9498.0, 3062.0, 1473.0, 883.0, 494.0, 308.0, 202.0, 130.0, 94.0, 62.0, 46.0, 33.0, 17.0, 10.0, 12.0, 7.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9423828125, -1.8839874267578125, -1.825592041015625, -1.7671966552734375, -1.70880126953125, -1.6504058837890625, -1.592010498046875, -1.5336151123046875, -1.4752197265625, -1.4168243408203125, -1.358428955078125, -1.3000335693359375, -1.24163818359375, -1.1832427978515625, -1.124847412109375, -1.0664520263671875, -1.008056640625, -0.9496612548828125, -0.891265869140625, -0.8328704833984375, -0.77447509765625, -0.7160797119140625, -0.657684326171875, -0.5992889404296875, -0.5408935546875, -0.4824981689453125, -0.424102783203125, -0.3657073974609375, -0.30731201171875, -0.2489166259765625, -0.190521240234375, -0.1321258544921875, -0.07373046875, -0.0153350830078125, 0.043060302734375, 0.1014556884765625, 0.15985107421875, 0.2182464599609375, 0.276641845703125, 0.3350372314453125, 0.3934326171875, 0.4518280029296875, 0.510223388671875, 0.5686187744140625, 0.62701416015625, 0.6854095458984375, 0.743804931640625, 0.8022003173828125, 0.860595703125, 0.9189910888671875, 0.977386474609375, 1.0357818603515625, 1.09417724609375, 1.1525726318359375, 1.210968017578125, 1.2693634033203125, 1.3277587890625, 1.3861541748046875, 1.444549560546875, 1.5029449462890625, 1.56134033203125, 1.6197357177734375, 1.678131103515625, 1.7365264892578125, 1.794921875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 9.0, 6.0, 7.0, 21.0, 17.0, 24.0, 25.0, 41.0, 46.0, 53.0, 49.0, 72.0, 66.0, 57.0, 71.0, 51.0, 73.0, 52.0, 49.0, 46.0, 29.0, 31.0, 32.0, 29.0, 13.0, 13.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.484375, -2.4140625, -2.34375, -2.2734375, -2.203125, -2.1328125, -2.0625, -1.9921875, -1.921875, -1.8515625, -1.78125, -1.7109375, -1.640625, -1.5703125, -1.5, -1.4296875, -1.359375, -1.2890625, -1.21875, -1.1484375, -1.078125, -1.0078125, -0.9375, -0.8671875, -0.796875, -0.7265625, -0.65625, -0.5859375, -0.515625, -0.4453125, -0.375, -0.3046875, -0.234375, -0.1640625, -0.09375, -0.0234375, 0.046875, 0.1171875, 0.1875, 0.2578125, 0.328125, 0.3984375, 0.46875, 0.5390625, 0.609375, 0.6796875, 0.75, 0.8203125, 0.890625, 0.9609375, 1.03125, 1.1015625, 1.171875, 1.2421875, 1.3125, 1.3828125, 1.453125, 1.5234375, 1.59375, 1.6640625, 1.734375, 1.8046875, 1.875, 1.9453125, 2.015625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 3.0, 5.0, 5.0, 8.0, 10.0, 20.0, 27.0, 38.0, 44.0, 83.0, 119.0, 207.0, 381.0, 773.0, 1958.0, 6699.0, 35661.0, 298880.0, 632514.0, 56996.0, 9543.0, 2551.0, 947.0, 433.0, 215.0, 143.0, 97.0, 48.0, 36.0, 24.0, 20.0, 13.0, 13.0, 10.0, 3.0, 5.0, 5.0, 0.0, 1.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.587890625, -0.5695877075195312, -0.5512847900390625, -0.5329818725585938, -0.514678955078125, -0.49637603759765625, -0.4780731201171875, -0.45977020263671875, -0.44146728515625, -0.42316436767578125, -0.4048614501953125, -0.38655853271484375, -0.368255615234375, -0.34995269775390625, -0.3316497802734375, -0.31334686279296875, -0.2950439453125, -0.27674102783203125, -0.2584381103515625, -0.24013519287109375, -0.221832275390625, -0.20352935791015625, -0.1852264404296875, -0.16692352294921875, -0.14862060546875, -0.13031768798828125, -0.1120147705078125, -0.09371185302734375, -0.075408935546875, -0.05710601806640625, -0.0388031005859375, -0.02050018310546875, -0.002197265625, 0.01610565185546875, 0.0344085693359375, 0.05271148681640625, 0.071014404296875, 0.08931732177734375, 0.1076202392578125, 0.12592315673828125, 0.14422607421875, 0.16252899169921875, 0.1808319091796875, 0.19913482666015625, 0.217437744140625, 0.23574066162109375, 0.2540435791015625, 0.27234649658203125, 0.2906494140625, 0.30895233154296875, 0.3272552490234375, 0.34555816650390625, 0.363861083984375, 0.38216400146484375, 0.4004669189453125, 0.41876983642578125, 0.43707275390625, 0.45537567138671875, 0.4736785888671875, 0.49198150634765625, 0.510284423828125, 0.5285873413085938, 0.5468902587890625, 0.5651931762695312, 0.58349609375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 13.0, 13.0, 6.0, 13.0, 8.0, 15.0, 25.0, 22.0, 32.0, 51.0, 55.0, 86.0, 103.0, 137.0, 101.0, 66.0, 60.0, 36.0, 35.0, 35.0, 21.0, 14.0, 10.0, 8.0, 6.0, 11.0, 3.0, 5.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0001361370086669922, -0.00013218354433774948, -0.00012823008000850677, -0.00012427661567926407, -0.00012032315135002136, -0.00011636968702077866, -0.00011241622269153595, -0.00010846275836229324, -0.00010450929403305054, -0.00010055582970380783, -9.660236537456512e-05, -9.264890104532242e-05, -8.869543671607971e-05, -8.4741972386837e-05, -8.07885080575943e-05, -7.683504372835159e-05, -7.288157939910889e-05, -6.892811506986618e-05, -6.497465074062347e-05, -6.102118641138077e-05, -5.706772208213806e-05, -5.3114257752895355e-05, -4.916079342365265e-05, -4.520732909440994e-05, -4.1253864765167236e-05, -3.730040043592453e-05, -3.3346936106681824e-05, -2.9393471777439117e-05, -2.544000744819641e-05, -2.1486543118953705e-05, -1.7533078789711e-05, -1.3579614460468292e-05, -9.626150131225586e-06, -5.67268580198288e-06, -1.7192214727401733e-06, 2.234242856502533e-06, 6.187707185745239e-06, 1.0141171514987946e-05, 1.4094635844230652e-05, 1.8048100173473358e-05, 2.2001564502716064e-05, 2.595502883195877e-05, 2.9908493161201477e-05, 3.386195749044418e-05, 3.781542181968689e-05, 4.1768886148929596e-05, 4.57223504781723e-05, 4.967581480741501e-05, 5.3629279136657715e-05, 5.758274346590042e-05, 6.153620779514313e-05, 6.548967212438583e-05, 6.944313645362854e-05, 7.339660078287125e-05, 7.735006511211395e-05, 8.130352944135666e-05, 8.525699377059937e-05, 8.921045809984207e-05, 9.316392242908478e-05, 9.711738675832748e-05, 0.00010107085108757019, 0.0001050243154168129, 0.0001089777797460556, 0.00011293124407529831, 0.00011688470840454102]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 1.0, 7.0, 5.0, 9.0, 12.0, 10.0, 23.0, 26.0, 30.0, 64.0, 97.0, 96.0, 160.0, 279.0, 441.0, 684.0, 1328.0, 2563.0, 6369.0, 22679.0, 149231.0, 712304.0, 121269.0, 19740.0, 5783.0, 2376.0, 1136.0, 660.0, 398.0, 242.0, 164.0, 120.0, 57.0, 43.0, 39.0, 33.0, 23.0, 9.0, 10.0, 7.0, 5.0, 7.0, 6.0, 2.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.44091796875, -0.4268989562988281, -0.41287994384765625, -0.3988609313964844, -0.3848419189453125, -0.3708229064941406, -0.35680389404296875, -0.3427848815917969, -0.328765869140625, -0.3147468566894531, -0.30072784423828125, -0.2867088317871094, -0.2726898193359375, -0.2586708068847656, -0.24465179443359375, -0.23063278198242188, -0.21661376953125, -0.20259475708007812, -0.18857574462890625, -0.17455673217773438, -0.1605377197265625, -0.14651870727539062, -0.13249969482421875, -0.11848068237304688, -0.104461669921875, -0.09044265747070312, -0.07642364501953125, -0.062404632568359375, -0.0483856201171875, -0.034366607666015625, -0.02034759521484375, -0.006328582763671875, 0.0076904296875, 0.021709442138671875, 0.03572845458984375, 0.049747467041015625, 0.0637664794921875, 0.07778549194335938, 0.09180450439453125, 0.10582351684570312, 0.119842529296875, 0.13386154174804688, 0.14788055419921875, 0.16189956665039062, 0.1759185791015625, 0.18993759155273438, 0.20395660400390625, 0.21797561645507812, 0.23199462890625, 0.24601364135742188, 0.26003265380859375, 0.2740516662597656, 0.2880706787109375, 0.3020896911621094, 0.31610870361328125, 0.3301277160644531, 0.344146728515625, 0.3581657409667969, 0.37218475341796875, 0.3862037658691406, 0.4002227783203125, 0.4142417907714844, 0.42826080322265625, 0.4422798156738281, 0.456298828125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 3.0, 4.0, 6.0, 11.0, 9.0, 8.0, 17.0, 14.0, 21.0, 26.0, 35.0, 35.0, 58.0, 46.0, 51.0, 54.0, 73.0, 65.0, 61.0, 68.0, 56.0, 43.0, 48.0, 35.0, 33.0, 27.0, 21.0, 12.0, 13.0, 7.0, 8.0, 8.0, 6.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.364990234375, -0.35260772705078125, -0.3402252197265625, -0.32784271240234375, -0.315460205078125, -0.30307769775390625, -0.2906951904296875, -0.27831268310546875, -0.26593017578125, -0.25354766845703125, -0.2411651611328125, -0.22878265380859375, -0.216400146484375, -0.20401763916015625, -0.1916351318359375, -0.17925262451171875, -0.1668701171875, -0.15448760986328125, -0.1421051025390625, -0.12972259521484375, -0.117340087890625, -0.10495758056640625, -0.0925750732421875, -0.08019256591796875, -0.06781005859375, -0.05542755126953125, -0.0430450439453125, -0.03066253662109375, -0.018280029296875, -0.00589752197265625, 0.0064849853515625, 0.01886749267578125, 0.03125, 0.04363250732421875, 0.0560150146484375, 0.06839752197265625, 0.080780029296875, 0.09316253662109375, 0.1055450439453125, 0.11792755126953125, 0.13031005859375, 0.14269256591796875, 0.1550750732421875, 0.16745758056640625, 0.179840087890625, 0.19222259521484375, 0.2046051025390625, 0.21698760986328125, 0.2293701171875, 0.24175262451171875, 0.2541351318359375, 0.26651763916015625, 0.278900146484375, 0.29128265380859375, 0.3036651611328125, 0.31604766845703125, 0.32843017578125, 0.34081268310546875, 0.3531951904296875, 0.36557769775390625, 0.377960205078125, 0.39034271240234375, 0.4027252197265625, 0.41510772705078125, 0.427490234375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 5.0, 6.0, 8.0, 13.0, 29.0, 66.0, 140.0, 245.0, 204.0, 123.0, 67.0, 47.0, 21.0, 8.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-16.09343719482422, -15.73405647277832, -15.374674797058105, -15.015294075012207, -14.655913352966309, -14.296531677246094, -13.937150955200195, -13.577770233154297, -13.218388557434082, -12.859007835388184, -12.499626159667969, -12.14024543762207, -11.780864715576172, -11.421483039855957, -11.062102317810059, -10.702720642089844, -10.343339920043945, -9.983959197998047, -9.624577522277832, -9.265196800231934, -8.905816078186035, -8.54643440246582, -8.187053680419922, -7.827672481536865, -7.468292236328125, -7.108911037445068, -6.74953031539917, -6.390149116516113, -6.030767917633057, -5.67138671875, -5.312005996704102, -4.952624797821045, -4.59324312210083, -4.233861923217773, -3.874480962753296, -3.5151000022888184, -3.1557188034057617, -2.796337842941284, -2.4369568824768066, -2.07757568359375, -1.7181947231292725, -1.3588136434555054, -0.9994326233863831, -0.6400516033172607, -0.28067052364349365, 0.07871055603027344, 0.438091516494751, 0.7974727153778076, 1.1568536758422852, 1.5162347555160522, 1.8756158351898193, 2.234996795654297, 2.5943779945373535, 2.953758955001831, 3.3131399154663086, 3.6725211143493652, 4.031902313232422, 4.3912835121154785, 4.750664234161377, 5.110045433044434, 5.46942663192749, 5.828807830810547, 6.188188552856445, 6.547569751739502, 6.9069504737854]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 3.0, 4.0, 5.0, 5.0, 7.0, 5.0, 8.0, 8.0, 11.0, 11.0, 15.0, 22.0, 19.0, 31.0, 26.0, 25.0, 31.0, 21.0, 34.0, 54.0, 56.0, 51.0, 56.0, 68.0, 44.0, 50.0, 31.0, 35.0, 35.0, 36.0, 16.0, 27.0, 23.0, 21.0, 18.0, 11.0, 13.0, 14.0, 10.0, 1.0, 9.0, 5.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0], "bins": [-5.2391767501831055, -5.077087879180908, -4.914999008178711, -4.752910614013672, -4.590821743011475, -4.428732872009277, -4.26664400100708, -4.104555130004883, -3.9424662590026855, -3.7803773880004883, -3.61828875541687, -3.456199884414673, -3.2941110134124756, -3.1320223808288574, -2.96993350982666, -2.807844638824463, -2.6457560062408447, -2.4836671352386475, -2.3215785026550293, -2.159489631652832, -1.9974007606506348, -1.835312008857727, -1.6732232570648193, -1.511134386062622, -1.3490456342697144, -1.1869568824768066, -1.0248680114746094, -0.8627792596817017, -0.7006904482841492, -0.5386016368865967, -0.37651288509368896, -0.2144240140914917, -0.052335262298583984, 0.10975353419780731, 0.2718423306941986, 0.4339311122894287, 0.5960199236869812, 0.7581087350845337, 0.9201974868774414, 1.0822863578796387, 1.2443751096725464, 1.406463861465454, 1.5685527324676514, 1.730641484260559, 1.8927302360534668, 2.054819107055664, 2.2169079780578613, 2.3789968490600586, 2.5410854816436768, 2.703174352645874, 2.865262985229492, 3.0273518562316895, 3.1894407272338867, 3.351529598236084, 3.513618230819702, 3.6757071018218994, 3.8377957344055176, 3.999884605407715, 4.161973476409912, 4.324062347412109, 4.486150741577148, 4.648239612579346, 4.810328483581543, 4.97241735458374, 5.1345062255859375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 7.0, 14.0, 25.0, 39.0, 52.0, 108.0, 173.0, 318.0, 644.0, 1218.0, 2533.0, 5630.0, 13338.0, 35316.0, 111431.0, 487354.0, 2103617.0, 1119170.0, 216910.0, 59556.0, 20890.0, 8345.0, 3731.0, 1730.0, 976.0, 492.0, 256.0, 153.0, 81.0, 60.0, 33.0, 28.0, 19.0, 5.0, 6.0, 7.0, 7.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.412109375, -0.39870452880859375, -0.3852996826171875, -0.37189483642578125, -0.358489990234375, -0.34508514404296875, -0.3316802978515625, -0.31827545166015625, -0.30487060546875, -0.29146575927734375, -0.2780609130859375, -0.26465606689453125, -0.251251220703125, -0.23784637451171875, -0.2244415283203125, -0.21103668212890625, -0.1976318359375, -0.18422698974609375, -0.1708221435546875, -0.15741729736328125, -0.144012451171875, -0.13060760498046875, -0.1172027587890625, -0.10379791259765625, -0.09039306640625, -0.07698822021484375, -0.0635833740234375, -0.05017852783203125, -0.036773681640625, -0.02336883544921875, -0.0099639892578125, 0.00344085693359375, 0.016845703125, 0.03025054931640625, 0.0436553955078125, 0.05706024169921875, 0.070465087890625, 0.08386993408203125, 0.0972747802734375, 0.11067962646484375, 0.12408447265625, 0.13748931884765625, 0.1508941650390625, 0.16429901123046875, 0.177703857421875, 0.19110870361328125, 0.2045135498046875, 0.21791839599609375, 0.2313232421875, 0.24472808837890625, 0.2581329345703125, 0.27153778076171875, 0.284942626953125, 0.29834747314453125, 0.3117523193359375, 0.32515716552734375, 0.33856201171875, 0.35196685791015625, 0.3653717041015625, 0.37877655029296875, 0.392181396484375, 0.40558624267578125, 0.4189910888671875, 0.43239593505859375, 0.44580078125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 9.0, 7.0, 9.0, 22.0, 18.0, 17.0, 16.0, 17.0, 18.0, 36.0, 31.0, 33.0, 44.0, 35.0, 57.0, 42.0, 49.0, 38.0, 42.0, 45.0, 49.0, 35.0, 35.0, 40.0, 32.0, 37.0, 37.0, 30.0, 17.0, 17.0, 19.0, 17.0, 12.0, 7.0, 8.0, 7.0, 3.0, 3.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.342529296875, -0.3318023681640625, -0.321075439453125, -0.3103485107421875, -0.29962158203125, -0.2888946533203125, -0.278167724609375, -0.2674407958984375, -0.2567138671875, -0.2459869384765625, -0.235260009765625, -0.2245330810546875, -0.21380615234375, -0.2030792236328125, -0.192352294921875, -0.1816253662109375, -0.1708984375, -0.1601715087890625, -0.149444580078125, -0.1387176513671875, -0.12799072265625, -0.1172637939453125, -0.106536865234375, -0.0958099365234375, -0.0850830078125, -0.0743560791015625, -0.063629150390625, -0.0529022216796875, -0.04217529296875, -0.0314483642578125, -0.020721435546875, -0.0099945068359375, 0.000732421875, 0.0114593505859375, 0.022186279296875, 0.0329132080078125, 0.04364013671875, 0.0543670654296875, 0.065093994140625, 0.0758209228515625, 0.0865478515625, 0.0972747802734375, 0.108001708984375, 0.1187286376953125, 0.12945556640625, 0.1401824951171875, 0.150909423828125, 0.1616363525390625, 0.17236328125, 0.1830902099609375, 0.193817138671875, 0.2045440673828125, 0.21527099609375, 0.2259979248046875, 0.236724853515625, 0.2474517822265625, 0.2581787109375, 0.2689056396484375, 0.279632568359375, 0.2903594970703125, 0.30108642578125, 0.3118133544921875, 0.322540283203125, 0.3332672119140625, 0.343994140625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 5.0, 7.0, 20.0, 19.0, 28.0, 61.0, 102.0, 247.0, 464.0, 1190.0, 4114.0, 19592.0, 163687.0, 3280760.0, 671060.0, 42910.0, 6978.0, 1801.0, 678.0, 289.0, 142.0, 69.0, 30.0, 15.0, 7.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3515625, -1.3147735595703125, -1.277984619140625, -1.2411956787109375, -1.20440673828125, -1.1676177978515625, -1.130828857421875, -1.0940399169921875, -1.0572509765625, -1.0204620361328125, -0.983673095703125, -0.9468841552734375, -0.91009521484375, -0.8733062744140625, -0.836517333984375, -0.7997283935546875, -0.762939453125, -0.7261505126953125, -0.689361572265625, -0.6525726318359375, -0.61578369140625, -0.5789947509765625, -0.542205810546875, -0.5054168701171875, -0.4686279296875, -0.4318389892578125, -0.395050048828125, -0.3582611083984375, -0.32147216796875, -0.2846832275390625, -0.247894287109375, -0.2111053466796875, -0.17431640625, -0.1375274658203125, -0.100738525390625, -0.0639495849609375, -0.02716064453125, 0.0096282958984375, 0.046417236328125, 0.0832061767578125, 0.1199951171875, 0.1567840576171875, 0.193572998046875, 0.2303619384765625, 0.26715087890625, 0.3039398193359375, 0.340728759765625, 0.3775177001953125, 0.414306640625, 0.4510955810546875, 0.487884521484375, 0.5246734619140625, 0.56146240234375, 0.5982513427734375, 0.635040283203125, 0.6718292236328125, 0.7086181640625, 0.7454071044921875, 0.782196044921875, 0.8189849853515625, 0.85577392578125, 0.8925628662109375, 0.929351806640625, 0.9661407470703125, 1.0029296875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 3.0, 10.0, 11.0, 9.0, 15.0, 31.0, 30.0, 47.0, 70.0, 133.0, 149.0, 245.0, 384.0, 678.0, 788.0, 564.0, 332.0, 225.0, 134.0, 62.0, 37.0, 39.0, 20.0, 21.0, 9.0, 12.0, 8.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2685546875, -1.234588623046875, -1.20062255859375, -1.166656494140625, -1.1326904296875, -1.098724365234375, -1.06475830078125, -1.030792236328125, -0.996826171875, -0.962860107421875, -0.92889404296875, -0.894927978515625, -0.8609619140625, -0.826995849609375, -0.79302978515625, -0.759063720703125, -0.72509765625, -0.691131591796875, -0.65716552734375, -0.623199462890625, -0.5892333984375, -0.555267333984375, -0.52130126953125, -0.487335205078125, -0.453369140625, -0.419403076171875, -0.38543701171875, -0.351470947265625, -0.3175048828125, -0.283538818359375, -0.24957275390625, -0.215606689453125, -0.181640625, -0.147674560546875, -0.11370849609375, -0.079742431640625, -0.0457763671875, -0.011810302734375, 0.02215576171875, 0.056121826171875, 0.090087890625, 0.124053955078125, 0.15802001953125, 0.191986083984375, 0.2259521484375, 0.259918212890625, 0.29388427734375, 0.327850341796875, 0.36181640625, 0.395782470703125, 0.42974853515625, 0.463714599609375, 0.4976806640625, 0.531646728515625, 0.56561279296875, 0.599578857421875, 0.633544921875, 0.667510986328125, 0.70147705078125, 0.735443115234375, 0.7694091796875, 0.803375244140625, 0.83734130859375, 0.871307373046875, 0.9052734375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 6.0, 6.0, 19.0, 35.0, 126.0, 299.0, 319.0, 129.0, 44.0, 10.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.252342224121094, -14.712199211120605, -14.172056198120117, -13.631913185119629, -13.09177017211914, -12.551628112792969, -12.01148509979248, -11.471342086791992, -10.931199073791504, -10.391056060791016, -9.850913047790527, -9.310770034790039, -8.770627975463867, -8.230484008789062, -7.690341949462891, -7.150198936462402, -6.610055923461914, -6.069912910461426, -5.5297698974609375, -4.989627361297607, -4.449484348297119, -3.909341335296631, -3.3691985607147217, -2.8290557861328125, -2.288912773132324, -1.7487698793411255, -1.2086269855499268, -0.668484091758728, -0.1283411979675293, 0.411801815032959, 0.9519445896148682, 1.4920873641967773, 2.032228469848633, 2.572371482849121, 3.1125142574310303, 3.6526570320129395, 4.192800045013428, 4.732943058013916, 5.273085594177246, 5.813228607177734, 6.353371620178223, 6.893514633178711, 7.433657646179199, 7.973800182342529, 8.51394271850586, 9.054086685180664, 9.594228744506836, 10.134371757507324, 10.674514770507812, 11.2146577835083, 11.754800796508789, 12.294943809509277, 12.835086822509766, 13.375228881835938, 13.915371894836426, 14.455514907836914, 14.995657920837402, 15.53580093383789, 16.075942993164062, 16.616086959838867, 17.15622901916504, 17.696372985839844, 18.236515045166016, 18.776657104492188, 19.316801071166992]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 3.0, 3.0, 6.0, 9.0, 10.0, 14.0, 15.0, 15.0, 21.0, 30.0, 24.0, 27.0, 30.0, 37.0, 38.0, 52.0, 50.0, 36.0, 50.0, 41.0, 44.0, 48.0, 42.0, 60.0, 51.0, 28.0, 37.0, 29.0, 20.0, 19.0, 14.0, 22.0, 13.0, 14.0, 12.0, 9.0, 9.0, 4.0, 6.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.793994903564453, -4.647636890411377, -4.501278877258301, -4.354920864105225, -4.208562850952148, -4.062204837799072, -3.915846586227417, -3.769488573074341, -3.6231305599212646, -3.4767725467681885, -3.3304145336151123, -3.184056520462036, -3.037698268890381, -2.8913402557373047, -2.7449822425842285, -2.5986242294311523, -2.452266216278076, -2.305908203125, -2.159550189971924, -2.0131921768188477, -1.866834044456482, -1.7204760313034058, -1.57411789894104, -1.4277598857879639, -1.2814018726348877, -1.1350438594818115, -0.9886857867240906, -0.8423277139663696, -0.6959697008132935, -0.5496116876602173, -0.40325361490249634, -0.2568955421447754, -0.11053752899169922, 0.03582051396369934, 0.1821785569190979, 0.32853659987449646, 0.474894642829895, 0.6212526559829712, 0.7676107287406921, 0.9139688014984131, 1.0603268146514893, 1.2066848278045654, 1.3530428409576416, 1.4994009733200073, 1.6457589864730835, 1.7921169996261597, 1.9384751319885254, 2.0848331451416016, 2.2311911582946777, 2.377549171447754, 2.52390718460083, 2.6702651977539062, 2.8166232109069824, 2.9629812240600586, 3.109339475631714, 3.25569748878479, 3.402055501937866, 3.5484135150909424, 3.6947715282440186, 3.8411295413970947, 3.98748779296875, 4.133845806121826, 4.280203819274902, 4.4265618324279785, 4.572919845581055]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 4.0, 4.0, 3.0, 14.0, 28.0, 34.0, 62.0, 86.0, 115.0, 195.0, 287.0, 450.0, 741.0, 1151.0, 1941.0, 3153.0, 5530.0, 10280.0, 20120.0, 44078.0, 113562.0, 335300.0, 319474.0, 107500.0, 41971.0, 19320.0, 9770.0, 5373.0, 3137.0, 1802.0, 1142.0, 723.0, 425.0, 276.0, 161.0, 123.0, 80.0, 44.0, 30.0, 27.0, 17.0, 8.0, 7.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60986328125, -0.5901718139648438, -0.5704803466796875, -0.5507888793945312, -0.531097412109375, -0.5114059448242188, -0.4917144775390625, -0.47202301025390625, -0.45233154296875, -0.43264007568359375, -0.4129486083984375, -0.39325714111328125, -0.373565673828125, -0.35387420654296875, -0.3341827392578125, -0.31449127197265625, -0.2947998046875, -0.27510833740234375, -0.2554168701171875, -0.23572540283203125, -0.216033935546875, -0.19634246826171875, -0.1766510009765625, -0.15695953369140625, -0.13726806640625, -0.11757659912109375, -0.0978851318359375, -0.07819366455078125, -0.058502197265625, -0.03881072998046875, -0.0191192626953125, 0.00057220458984375, 0.020263671875, 0.03995513916015625, 0.0596466064453125, 0.07933807373046875, 0.099029541015625, 0.11872100830078125, 0.1384124755859375, 0.15810394287109375, 0.17779541015625, 0.19748687744140625, 0.2171783447265625, 0.23686981201171875, 0.256561279296875, 0.27625274658203125, 0.2959442138671875, 0.31563568115234375, 0.3353271484375, 0.35501861572265625, 0.3747100830078125, 0.39440155029296875, 0.414093017578125, 0.43378448486328125, 0.4534759521484375, 0.47316741943359375, 0.49285888671875, 0.5125503540039062, 0.5322418212890625, 0.5519332885742188, 0.571624755859375, 0.5913162231445312, 0.6110076904296875, 0.6306991577148438, 0.650390625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 3.0, 6.0, 8.0, 8.0, 10.0, 13.0, 12.0, 21.0, 13.0, 22.0, 28.0, 23.0, 34.0, 26.0, 32.0, 54.0, 37.0, 47.0, 32.0, 32.0, 50.0, 41.0, 39.0, 37.0, 36.0, 42.0, 27.0, 36.0, 38.0, 26.0, 33.0, 25.0, 19.0, 12.0, 19.0, 16.0, 8.0, 5.0, 5.0, 7.0, 6.0, 6.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.341064453125, -0.3305931091308594, -0.32012176513671875, -0.3096504211425781, -0.2991790771484375, -0.2887077331542969, -0.27823638916015625, -0.2677650451660156, -0.257293701171875, -0.24682235717773438, -0.23635101318359375, -0.22587966918945312, -0.2154083251953125, -0.20493698120117188, -0.19446563720703125, -0.18399429321289062, -0.17352294921875, -0.16305160522460938, -0.15258026123046875, -0.14210891723632812, -0.1316375732421875, -0.12116622924804688, -0.11069488525390625, -0.10022354125976562, -0.089752197265625, -0.07928085327148438, -0.06880950927734375, -0.058338165283203125, -0.0478668212890625, -0.037395477294921875, -0.02692413330078125, -0.016452789306640625, -0.0059814453125, 0.004489898681640625, 0.01496124267578125, 0.025432586669921875, 0.0359039306640625, 0.046375274658203125, 0.05684661865234375, 0.06731796264648438, 0.077789306640625, 0.08826065063476562, 0.09873199462890625, 0.10920333862304688, 0.1196746826171875, 0.13014602661132812, 0.14061737060546875, 0.15108871459960938, 0.16156005859375, 0.17203140258789062, 0.18250274658203125, 0.19297409057617188, 0.2034454345703125, 0.21391677856445312, 0.22438812255859375, 0.23485946655273438, 0.245330810546875, 0.2558021545410156, 0.26627349853515625, 0.2767448425292969, 0.2872161865234375, 0.2976875305175781, 0.30815887451171875, 0.3186302185058594, 0.3291015625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 10.0, 19.0, 40.0, 61.0, 133.0, 207.0, 411.0, 748.0, 1906.0, 8051.0, 94185.0, 887116.0, 47302.0, 5495.0, 1450.0, 647.0, 358.0, 175.0, 103.0, 54.0, 32.0, 23.0, 9.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3203125, -2.252838134765625, -2.18536376953125, -2.117889404296875, -2.0504150390625, -1.982940673828125, -1.91546630859375, -1.847991943359375, -1.780517578125, -1.713043212890625, -1.64556884765625, -1.578094482421875, -1.5106201171875, -1.443145751953125, -1.37567138671875, -1.308197021484375, -1.24072265625, -1.173248291015625, -1.10577392578125, -1.038299560546875, -0.9708251953125, -0.903350830078125, -0.83587646484375, -0.768402099609375, -0.700927734375, -0.633453369140625, -0.56597900390625, -0.498504638671875, -0.4310302734375, -0.363555908203125, -0.29608154296875, -0.228607177734375, -0.1611328125, -0.093658447265625, -0.02618408203125, 0.041290283203125, 0.1087646484375, 0.176239013671875, 0.24371337890625, 0.311187744140625, 0.378662109375, 0.446136474609375, 0.51361083984375, 0.581085205078125, 0.6485595703125, 0.716033935546875, 0.78350830078125, 0.850982666015625, 0.91845703125, 0.985931396484375, 1.05340576171875, 1.120880126953125, 1.1883544921875, 1.255828857421875, 1.32330322265625, 1.390777587890625, 1.458251953125, 1.525726318359375, 1.59320068359375, 1.660675048828125, 1.7281494140625, 1.795623779296875, 1.86309814453125, 1.930572509765625, 1.998046875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 9.0, 4.0, 3.0, 10.0, 13.0, 16.0, 22.0, 25.0, 37.0, 21.0, 36.0, 29.0, 48.0, 66.0, 54.0, 55.0, 57.0, 68.0, 58.0, 50.0, 58.0, 34.0, 43.0, 28.0, 32.0, 29.0, 23.0, 11.0, 16.0, 12.0, 9.0, 9.0, 8.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.48828125, -1.4349212646484375, -1.381561279296875, -1.3282012939453125, -1.27484130859375, -1.2214813232421875, -1.168121337890625, -1.1147613525390625, -1.0614013671875, -1.0080413818359375, -0.954681396484375, -0.9013214111328125, -0.84796142578125, -0.7946014404296875, -0.741241455078125, -0.6878814697265625, -0.634521484375, -0.5811614990234375, -0.527801513671875, -0.4744415283203125, -0.42108154296875, -0.3677215576171875, -0.314361572265625, -0.2610015869140625, -0.2076416015625, -0.1542816162109375, -0.100921630859375, -0.0475616455078125, 0.00579833984375, 0.0591583251953125, 0.112518310546875, 0.1658782958984375, 0.21923828125, 0.2725982666015625, 0.325958251953125, 0.3793182373046875, 0.43267822265625, 0.4860382080078125, 0.539398193359375, 0.5927581787109375, 0.6461181640625, 0.6994781494140625, 0.752838134765625, 0.8061981201171875, 0.85955810546875, 0.9129180908203125, 0.966278076171875, 1.0196380615234375, 1.072998046875, 1.1263580322265625, 1.179718017578125, 1.2330780029296875, 1.28643798828125, 1.3397979736328125, 1.393157958984375, 1.4465179443359375, 1.4998779296875, 1.5532379150390625, 1.606597900390625, 1.6599578857421875, 1.71331787109375, 1.7666778564453125, 1.820037841796875, 1.8733978271484375, 1.9267578125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 8.0, 10.0, 14.0, 33.0, 41.0, 79.0, 153.0, 257.0, 549.0, 1497.0, 5035.0, 26601.0, 255301.0, 692697.0, 53852.0, 8679.0, 2173.0, 789.0, 351.0, 170.0, 92.0, 57.0, 44.0, 29.0, 16.0, 11.0, 3.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5751953125, -0.5583648681640625, -0.541534423828125, -0.5247039794921875, -0.50787353515625, -0.4910430908203125, -0.474212646484375, -0.4573822021484375, -0.4405517578125, -0.4237213134765625, -0.406890869140625, -0.3900604248046875, -0.37322998046875, -0.3563995361328125, -0.339569091796875, -0.3227386474609375, -0.305908203125, -0.2890777587890625, -0.272247314453125, -0.2554168701171875, -0.23858642578125, -0.2217559814453125, -0.204925537109375, -0.1880950927734375, -0.1712646484375, -0.1544342041015625, -0.137603759765625, -0.1207733154296875, -0.10394287109375, -0.0871124267578125, -0.070281982421875, -0.0534515380859375, -0.03662109375, -0.0197906494140625, -0.002960205078125, 0.0138702392578125, 0.03070068359375, 0.0475311279296875, 0.064361572265625, 0.0811920166015625, 0.0980224609375, 0.1148529052734375, 0.131683349609375, 0.1485137939453125, 0.16534423828125, 0.1821746826171875, 0.199005126953125, 0.2158355712890625, 0.232666015625, 0.2494964599609375, 0.266326904296875, 0.2831573486328125, 0.29998779296875, 0.3168182373046875, 0.333648681640625, 0.3504791259765625, 0.3673095703125, 0.3841400146484375, 0.400970458984375, 0.4178009033203125, 0.43463134765625, 0.4514617919921875, 0.468292236328125, 0.4851226806640625, 0.501953125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 6.0, 4.0, 6.0, 13.0, 7.0, 10.0, 18.0, 19.0, 21.0, 21.0, 35.0, 57.0, 70.0, 82.0, 124.0, 113.0, 91.0, 79.0, 46.0, 35.0, 24.0, 19.0, 18.0, 15.0, 11.0, 6.0, 9.0, 8.0, 4.0, 9.0, 3.0, 4.0, 0.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.511543273925781e-05, -8.197035640478134e-05, -7.882528007030487e-05, -7.56802037358284e-05, -7.253512740135193e-05, -6.939005106687546e-05, -6.624497473239899e-05, -6.309989839792252e-05, -5.9954822063446045e-05, -5.6809745728969574e-05, -5.36646693944931e-05, -5.051959306001663e-05, -4.737451672554016e-05, -4.422944039106369e-05, -4.108436405658722e-05, -3.793928772211075e-05, -3.479421138763428e-05, -3.1649135053157806e-05, -2.8504058718681335e-05, -2.5358982384204865e-05, -2.2213906049728394e-05, -1.9068829715251923e-05, -1.592375338077545e-05, -1.277867704629898e-05, -9.63360071182251e-06, -6.488524377346039e-06, -3.343448042869568e-06, -1.9837170839309692e-07, 2.946704626083374e-06, 6.091780960559845e-06, 9.236857295036316e-06, 1.2381933629512787e-05, 1.5527009963989258e-05, 1.867208629846573e-05, 2.18171626329422e-05, 2.496223896741867e-05, 2.810731530189514e-05, 3.125239163637161e-05, 3.4397467970848083e-05, 3.7542544305324554e-05, 4.0687620639801025e-05, 4.3832696974277496e-05, 4.697777330875397e-05, 5.012284964323044e-05, 5.326792597770691e-05, 5.641300231218338e-05, 5.955807864665985e-05, 6.270315498113632e-05, 6.584823131561279e-05, 6.899330765008926e-05, 7.213838398456573e-05, 7.52834603190422e-05, 7.842853665351868e-05, 8.157361298799515e-05, 8.471868932247162e-05, 8.786376565694809e-05, 9.100884199142456e-05, 9.415391832590103e-05, 9.72989946603775e-05, 0.00010044407099485397, 0.00010358914732933044, 0.00010673422366380692, 0.00010987929999828339, 0.00011302437633275986, 0.00011616945266723633]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 8.0, 10.0, 14.0, 21.0, 26.0, 60.0, 93.0, 150.0, 317.0, 556.0, 1317.0, 3479.0, 12229.0, 83210.0, 771815.0, 149473.0, 18106.0, 4463.0, 1638.0, 738.0, 376.0, 176.0, 116.0, 57.0, 40.0, 21.0, 15.0, 10.0, 6.0, 5.0, 4.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.501953125, -0.48702239990234375, -0.4720916748046875, -0.45716094970703125, -0.442230224609375, -0.42729949951171875, -0.4123687744140625, -0.39743804931640625, -0.38250732421875, -0.36757659912109375, -0.3526458740234375, -0.33771514892578125, -0.322784423828125, -0.30785369873046875, -0.2929229736328125, -0.27799224853515625, -0.2630615234375, -0.24813079833984375, -0.2332000732421875, -0.21826934814453125, -0.203338623046875, -0.18840789794921875, -0.1734771728515625, -0.15854644775390625, -0.14361572265625, -0.12868499755859375, -0.1137542724609375, -0.09882354736328125, -0.083892822265625, -0.06896209716796875, -0.0540313720703125, -0.03910064697265625, -0.024169921875, -0.00923919677734375, 0.0056915283203125, 0.02062225341796875, 0.035552978515625, 0.05048370361328125, 0.0654144287109375, 0.08034515380859375, 0.09527587890625, 0.11020660400390625, 0.1251373291015625, 0.14006805419921875, 0.154998779296875, 0.16992950439453125, 0.1848602294921875, 0.19979095458984375, 0.2147216796875, 0.22965240478515625, 0.2445831298828125, 0.25951385498046875, 0.274444580078125, 0.28937530517578125, 0.3043060302734375, 0.31923675537109375, 0.33416748046875, 0.34909820556640625, 0.3640289306640625, 0.37895965576171875, 0.393890380859375, 0.40882110595703125, 0.4237518310546875, 0.43868255615234375, 0.45361328125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 7.0, 5.0, 10.0, 8.0, 25.0, 18.0, 26.0, 39.0, 46.0, 51.0, 65.0, 77.0, 100.0, 75.0, 81.0, 68.0, 60.0, 54.0, 37.0, 36.0, 29.0, 20.0, 20.0, 7.0, 8.0, 11.0, 6.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.274169921875, -0.2629432678222656, -0.25171661376953125, -0.24048995971679688, -0.2292633056640625, -0.21803665161132812, -0.20680999755859375, -0.19558334350585938, -0.184356689453125, -0.17313003540039062, -0.16190338134765625, -0.15067672729492188, -0.1394500732421875, -0.12822341918945312, -0.11699676513671875, -0.10577011108398438, -0.09454345703125, -0.08331680297851562, -0.07209014892578125, -0.060863494873046875, -0.0496368408203125, -0.038410186767578125, -0.02718353271484375, -0.015956878662109375, -0.004730224609375, 0.006496429443359375, 0.01772308349609375, 0.028949737548828125, 0.0401763916015625, 0.051403045654296875, 0.06262969970703125, 0.07385635375976562, 0.0850830078125, 0.09630966186523438, 0.10753631591796875, 0.11876296997070312, 0.1299896240234375, 0.14121627807617188, 0.15244293212890625, 0.16366958618164062, 0.174896240234375, 0.18612289428710938, 0.19734954833984375, 0.20857620239257812, 0.2198028564453125, 0.23102951049804688, 0.24225616455078125, 0.2534828186035156, 0.26470947265625, 0.2759361267089844, 0.28716278076171875, 0.2983894348144531, 0.3096160888671875, 0.3208427429199219, 0.33206939697265625, 0.3432960510253906, 0.354522705078125, 0.3657493591308594, 0.37697601318359375, 0.3882026672363281, 0.3994293212890625, 0.4106559753417969, 0.42188262939453125, 0.4331092834472656, 0.4443359375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 11.0, 24.0, 66.0, 143.0, 243.0, 231.0, 130.0, 68.0, 37.0, 14.0, 9.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.973264694213867, -10.63924503326416, -10.305224418640137, -9.97120475769043, -9.637184143066406, -9.3031644821167, -8.969144821166992, -8.635124206542969, -8.301104545593262, -7.9670844078063965, -7.633064270019531, -7.299044609069824, -6.965024471282959, -6.631004333496094, -6.296984672546387, -5.9629645347595215, -5.628944396972656, -5.294924259185791, -4.960904121398926, -4.626884460449219, -4.2928643226623535, -3.9588441848754883, -3.624824285507202, -3.290804386138916, -2.956784248352051, -2.6227641105651855, -2.2887442111968994, -1.9547241926193237, -1.620704174041748, -1.2866841554641724, -0.9526641368865967, -0.6186442375183105, -0.2846250534057617, 0.049394965171813965, 0.38341498374938965, 0.7174350023269653, 1.051455020904541, 1.3854750394821167, 1.7194950580596924, 2.0535149574279785, 2.3875350952148438, 2.721555233001709, 3.055575132369995, 3.3895950317382812, 3.7236151695251465, 4.057635307312012, 4.391654968261719, 4.725675106048584, 5.059695243835449, 5.3937153816223145, 5.72773551940918, 6.061755180358887, 6.395775318145752, 6.729795455932617, 7.063815116882324, 7.3978352546691895, 7.731855392456055, 8.065875053405762, 8.399895668029785, 8.733915328979492, 9.067935943603516, 9.401955604553223, 9.73597526550293, 10.069995880126953, 10.40401554107666]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 5.0, 7.0, 6.0, 11.0, 4.0, 9.0, 21.0, 19.0, 17.0, 20.0, 11.0, 28.0, 23.0, 20.0, 23.0, 20.0, 29.0, 26.0, 35.0, 44.0, 65.0, 63.0, 67.0, 56.0, 42.0, 31.0, 33.0, 38.0, 15.0, 28.0, 36.0, 21.0, 17.0, 17.0, 10.0, 12.0, 14.0, 8.0, 7.0, 6.0, 7.0, 4.0, 9.0, 4.0, 2.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0], "bins": [-4.979665756225586, -4.82357120513916, -4.667476654052734, -4.511382579803467, -4.355288028717041, -4.199193477630615, -4.0430989265441895, -3.8870043754577637, -3.730910062789917, -3.574815511703491, -3.4187211990356445, -3.2626266479492188, -3.106532096862793, -2.9504377841949463, -2.7943432331085205, -2.638248920440674, -2.482154369354248, -2.3260598182678223, -2.1699655055999756, -2.01387095451355, -1.8577765226364136, -1.7016820907592773, -1.5455875396728516, -1.3894931077957153, -1.233398675918579, -1.0773042440414429, -0.9212097525596619, -0.7651152610778809, -0.6090208292007446, -0.4529263973236084, -0.2968319058418274, -0.1407374143600464, 0.015357494354248047, 0.17145195603370667, 0.3275464177131653, 0.4836408793926239, 0.6397353410720825, 0.7958297729492188, 0.9519242644309998, 1.1080187559127808, 1.264113187789917, 1.4202076196670532, 1.5763020515441895, 1.7323966026306152, 1.8884910345077515, 2.0445854663848877, 2.2006800174713135, 2.35677433013916, 2.512868881225586, 2.6689634323120117, 2.8250577449798584, 2.981152296066284, 3.137246608734131, 3.2933411598205566, 3.4494357109069824, 3.605530261993408, 3.761624574661255, 3.9177191257476807, 4.073813438415527, 4.229907989501953, 4.386002540588379, 4.542097091674805, 4.698191165924072, 4.854285717010498, 5.010380268096924]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 12.0, 18.0, 27.0, 32.0, 68.0, 102.0, 187.0, 280.0, 538.0, 1116.0, 2480.0, 6234.0, 18397.0, 76981.0, 604499.0, 2864414.0, 523132.0, 68407.0, 16639.0, 5759.0, 2483.0, 1152.0, 572.0, 318.0, 171.0, 88.0, 63.0, 35.0, 31.0, 16.0, 12.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.43603515625, -0.418914794921875, -0.40179443359375, -0.384674072265625, -0.3675537109375, -0.350433349609375, -0.33331298828125, -0.316192626953125, -0.299072265625, -0.281951904296875, -0.26483154296875, -0.247711181640625, -0.2305908203125, -0.213470458984375, -0.19635009765625, -0.179229736328125, -0.162109375, -0.144989013671875, -0.12786865234375, -0.110748291015625, -0.0936279296875, -0.076507568359375, -0.05938720703125, -0.042266845703125, -0.025146484375, -0.008026123046875, 0.00909423828125, 0.026214599609375, 0.0433349609375, 0.060455322265625, 0.07757568359375, 0.094696044921875, 0.11181640625, 0.128936767578125, 0.14605712890625, 0.163177490234375, 0.1802978515625, 0.197418212890625, 0.21453857421875, 0.231658935546875, 0.248779296875, 0.265899658203125, 0.28302001953125, 0.300140380859375, 0.3172607421875, 0.334381103515625, 0.35150146484375, 0.368621826171875, 0.3857421875, 0.402862548828125, 0.41998291015625, 0.437103271484375, 0.4542236328125, 0.471343994140625, 0.48846435546875, 0.505584716796875, 0.522705078125, 0.539825439453125, 0.55694580078125, 0.574066162109375, 0.5911865234375, 0.608306884765625, 0.62542724609375, 0.642547607421875, 0.65966796875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 10.0, 8.0, 11.0, 4.0, 7.0, 15.0, 20.0, 34.0, 26.0, 16.0, 20.0, 40.0, 33.0, 53.0, 40.0, 42.0, 45.0, 48.0, 45.0, 60.0, 43.0, 60.0, 50.0, 41.0, 30.0, 41.0, 27.0, 24.0, 32.0, 16.0, 17.0, 4.0, 7.0, 7.0, 5.0, 7.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.336181640625, -0.3253974914550781, -0.31461334228515625, -0.3038291931152344, -0.2930450439453125, -0.2822608947753906, -0.27147674560546875, -0.2606925964355469, -0.249908447265625, -0.23912429809570312, -0.22834014892578125, -0.21755599975585938, -0.2067718505859375, -0.19598770141601562, -0.18520355224609375, -0.17441940307617188, -0.16363525390625, -0.15285110473632812, -0.14206695556640625, -0.13128280639648438, -0.1204986572265625, -0.10971450805664062, -0.09893035888671875, -0.08814620971679688, -0.077362060546875, -0.06657791137695312, -0.05579376220703125, -0.045009613037109375, -0.0342254638671875, -0.023441314697265625, -0.01265716552734375, -0.001873016357421875, 0.0089111328125, 0.019695281982421875, 0.03047943115234375, 0.041263580322265625, 0.0520477294921875, 0.06283187866210938, 0.07361602783203125, 0.08440017700195312, 0.095184326171875, 0.10596847534179688, 0.11675262451171875, 0.12753677368164062, 0.1383209228515625, 0.14910507202148438, 0.15988922119140625, 0.17067337036132812, 0.18145751953125, 0.19224166870117188, 0.20302581787109375, 0.21380996704101562, 0.2245941162109375, 0.23537826538085938, 0.24616241455078125, 0.2569465637207031, 0.267730712890625, 0.2785148620605469, 0.28929901123046875, 0.3000831604003906, 0.3108673095703125, 0.3216514587402344, 0.33243560791015625, 0.3432197570800781, 0.35400390625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 2.0, 4.0, 5.0, 9.0, 16.0, 24.0, 41.0, 79.0, 130.0, 296.0, 795.0, 2366.0, 9578.0, 75130.0, 3180075.0, 882215.0, 34871.0, 5912.0, 1711.0, 601.0, 198.0, 99.0, 50.0, 29.0, 15.0, 7.0, 10.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.5224609375, -1.48223876953125, -1.4420166015625, -1.40179443359375, -1.361572265625, -1.32135009765625, -1.2811279296875, -1.24090576171875, -1.20068359375, -1.16046142578125, -1.1202392578125, -1.08001708984375, -1.039794921875, -0.99957275390625, -0.9593505859375, -0.91912841796875, -0.87890625, -0.83868408203125, -0.7984619140625, -0.75823974609375, -0.718017578125, -0.67779541015625, -0.6375732421875, -0.59735107421875, -0.55712890625, -0.51690673828125, -0.4766845703125, -0.43646240234375, -0.396240234375, -0.35601806640625, -0.3157958984375, -0.27557373046875, -0.2353515625, -0.19512939453125, -0.1549072265625, -0.11468505859375, -0.074462890625, -0.03424072265625, 0.0059814453125, 0.04620361328125, 0.08642578125, 0.12664794921875, 0.1668701171875, 0.20709228515625, 0.247314453125, 0.28753662109375, 0.3277587890625, 0.36798095703125, 0.408203125, 0.44842529296875, 0.4886474609375, 0.52886962890625, 0.569091796875, 0.60931396484375, 0.6495361328125, 0.68975830078125, 0.72998046875, 0.77020263671875, 0.8104248046875, 0.85064697265625, 0.890869140625, 0.93109130859375, 0.9713134765625, 1.01153564453125, 1.0517578125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 5.0, 7.0, 5.0, 5.0, 6.0, 10.0, 10.0, 25.0, 33.0, 50.0, 59.0, 66.0, 122.0, 187.0, 267.0, 417.0, 776.0, 781.0, 459.0, 277.0, 153.0, 118.0, 61.0, 44.0, 33.0, 32.0, 14.0, 16.0, 11.0, 5.0, 9.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.859375, -0.8325271606445312, -0.8056793212890625, -0.7788314819335938, -0.751983642578125, -0.7251358032226562, -0.6982879638671875, -0.6714401245117188, -0.64459228515625, -0.6177444458007812, -0.5908966064453125, -0.5640487670898438, -0.537200927734375, -0.5103530883789062, -0.4835052490234375, -0.45665740966796875, -0.4298095703125, -0.40296173095703125, -0.3761138916015625, -0.34926605224609375, -0.322418212890625, -0.29557037353515625, -0.2687225341796875, -0.24187469482421875, -0.21502685546875, -0.18817901611328125, -0.1613311767578125, -0.13448333740234375, -0.107635498046875, -0.08078765869140625, -0.0539398193359375, -0.02709197998046875, -0.000244140625, 0.02660369873046875, 0.0534515380859375, 0.08029937744140625, 0.107147216796875, 0.13399505615234375, 0.1608428955078125, 0.18769073486328125, 0.21453857421875, 0.24138641357421875, 0.2682342529296875, 0.29508209228515625, 0.321929931640625, 0.34877777099609375, 0.3756256103515625, 0.40247344970703125, 0.4293212890625, 0.45616912841796875, 0.4830169677734375, 0.5098648071289062, 0.536712646484375, 0.5635604858398438, 0.5904083251953125, 0.6172561645507812, 0.64410400390625, 0.6709518432617188, 0.6977996826171875, 0.7246475219726562, 0.751495361328125, 0.7783432006835938, 0.8051910400390625, 0.8320388793945312, 0.85888671875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 3.0, 6.0, 21.0, 45.0, 119.0, 269.0, 266.0, 167.0, 66.0, 20.0, 2.0, 8.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.255207061767578, -17.850942611694336, -17.446678161621094, -17.042415618896484, -16.638151168823242, -16.23388671875, -15.829622268676758, -15.425357818603516, -15.021093368530273, -14.616828918457031, -14.212565422058105, -13.808300971984863, -13.404036521911621, -12.999773025512695, -12.595508575439453, -12.191244125366211, -11.786980628967285, -11.382716178894043, -10.978452682495117, -10.574188232421875, -10.169923782348633, -9.76565933227539, -9.361395835876465, -8.957131385803223, -8.552867889404297, -8.148603439331055, -7.744339466094971, -7.340075492858887, -6.9358110427856445, -6.5315470695495605, -6.127283096313477, -5.723018646240234, -5.318755149841309, -4.914491176605225, -4.510226726531982, -4.105962753295898, -3.7016985416412354, -3.2974343299865723, -2.8931703567504883, -2.488906145095825, -2.084641933441162, -1.680377721786499, -1.2761136293411255, -0.871849536895752, -0.46758532524108887, -0.06332111358642578, 0.3409428596496582, 0.7452070713043213, 1.1494712829589844, 1.5537354946136475, 1.957999587059021, 2.3622636795043945, 2.7665278911590576, 3.1707921028137207, 3.5750560760498047, 3.9793202877044678, 4.383584499359131, 4.787848472595215, 5.192112922668457, 5.596376895904541, 6.000640869140625, 6.404905319213867, 6.809169292449951, 7.213433265686035, 7.617697715759277]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 6.0, 4.0, 12.0, 15.0, 8.0, 18.0, 23.0, 25.0, 22.0, 25.0, 46.0, 51.0, 46.0, 53.0, 55.0, 49.0, 68.0, 66.0, 56.0, 55.0, 37.0, 38.0, 33.0, 36.0, 21.0, 29.0, 25.0, 18.0, 7.0, 17.0, 6.0, 10.0, 3.0, 3.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.359222888946533, -5.219463348388672, -5.0797038078308105, -4.939944267272949, -4.800184726715088, -4.660425186157227, -4.520665645599365, -4.380906105041504, -4.241147041320801, -4.1013875007629395, -3.961627960205078, -3.821868419647217, -3.6821088790893555, -3.542349338531494, -3.402590036392212, -3.2628304958343506, -3.12307071685791, -2.983311176300049, -2.8435516357421875, -2.703792095184326, -2.564032554626465, -2.4242730140686035, -2.2845137119293213, -2.14475417137146, -2.0049946308135986, -1.8652350902557373, -1.725475549697876, -1.5857161283493042, -1.4459565877914429, -1.3061970472335815, -1.1664376258850098, -1.0266780853271484, -0.8869180679321289, -0.7471585273742676, -0.607399046421051, -0.4676395356655121, -0.32788002490997314, -0.18812048435211182, -0.048361003398895264, 0.09139847755432129, 0.23115801811218262, 0.37091752886772156, 0.5106770396232605, 0.650436520576477, 0.7901960611343384, 0.9299556016921997, 1.0697150230407715, 1.2094745635986328, 1.3492341041564941, 1.4889936447143555, 1.6287531852722168, 1.7685126066207886, 1.90827214717865, 2.048031806945801, 2.187791109085083, 2.3275506496429443, 2.4673101902008057, 2.607069730758667, 2.7468292713165283, 2.8865888118743896, 3.026348114013672, 3.166107654571533, 3.3058671951293945, 3.445626735687256, 3.585386276245117]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 8.0, 6.0, 8.0, 11.0, 11.0, 20.0, 36.0, 54.0, 85.0, 124.0, 224.0, 344.0, 525.0, 836.0, 1484.0, 2488.0, 4393.0, 8869.0, 19015.0, 47252.0, 124089.0, 283356.0, 310357.0, 145285.0, 55735.0, 22183.0, 10034.0, 4925.0, 2813.0, 1484.0, 962.0, 559.0, 381.0, 212.0, 122.0, 92.0, 69.0, 36.0, 32.0, 14.0, 17.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30908203125, -0.2962493896484375, -0.283416748046875, -0.2705841064453125, -0.25775146484375, -0.2449188232421875, -0.232086181640625, -0.2192535400390625, -0.2064208984375, -0.1935882568359375, -0.180755615234375, -0.1679229736328125, -0.15509033203125, -0.1422576904296875, -0.129425048828125, -0.1165924072265625, -0.103759765625, -0.0909271240234375, -0.078094482421875, -0.0652618408203125, -0.05242919921875, -0.0395965576171875, -0.026763916015625, -0.0139312744140625, -0.0010986328125, 0.0117340087890625, 0.024566650390625, 0.0373992919921875, 0.05023193359375, 0.0630645751953125, 0.075897216796875, 0.0887298583984375, 0.1015625, 0.1143951416015625, 0.127227783203125, 0.1400604248046875, 0.15289306640625, 0.1657257080078125, 0.178558349609375, 0.1913909912109375, 0.2042236328125, 0.2170562744140625, 0.229888916015625, 0.2427215576171875, 0.25555419921875, 0.2683868408203125, 0.281219482421875, 0.2940521240234375, 0.306884765625, 0.3197174072265625, 0.332550048828125, 0.3453826904296875, 0.35821533203125, 0.3710479736328125, 0.383880615234375, 0.3967132568359375, 0.4095458984375, 0.4223785400390625, 0.435211181640625, 0.4480438232421875, 0.46087646484375, 0.4737091064453125, 0.486541748046875, 0.4993743896484375, 0.51220703125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 8.0, 8.0, 12.0, 6.0, 14.0, 14.0, 23.0, 28.0, 31.0, 40.0, 43.0, 42.0, 50.0, 57.0, 58.0, 64.0, 48.0, 53.0, 71.0, 49.0, 36.0, 38.0, 37.0, 22.0, 37.0, 23.0, 21.0, 16.0, 15.0, 11.0, 11.0, 4.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44921875, -0.43634033203125, -0.4234619140625, -0.41058349609375, -0.397705078125, -0.38482666015625, -0.3719482421875, -0.35906982421875, -0.34619140625, -0.33331298828125, -0.3204345703125, -0.30755615234375, -0.294677734375, -0.28179931640625, -0.2689208984375, -0.25604248046875, -0.2431640625, -0.23028564453125, -0.2174072265625, -0.20452880859375, -0.191650390625, -0.17877197265625, -0.1658935546875, -0.15301513671875, -0.14013671875, -0.12725830078125, -0.1143798828125, -0.10150146484375, -0.088623046875, -0.07574462890625, -0.0628662109375, -0.04998779296875, -0.037109375, -0.02423095703125, -0.0113525390625, 0.00152587890625, 0.014404296875, 0.02728271484375, 0.0401611328125, 0.05303955078125, 0.06591796875, 0.07879638671875, 0.0916748046875, 0.10455322265625, 0.117431640625, 0.13031005859375, 0.1431884765625, 0.15606689453125, 0.1689453125, 0.18182373046875, 0.1947021484375, 0.20758056640625, 0.220458984375, 0.23333740234375, 0.2462158203125, 0.25909423828125, 0.27197265625, 0.28485107421875, 0.2977294921875, 0.31060791015625, 0.323486328125, 0.33636474609375, 0.3492431640625, 0.36212158203125, 0.375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 3.0, 5.0, 9.0, 8.0, 16.0, 12.0, 28.0, 44.0, 68.0, 84.0, 187.0, 305.0, 688.0, 1677.0, 5100.0, 24410.0, 228233.0, 704871.0, 67825.0, 10149.0, 2782.0, 1026.0, 464.0, 219.0, 128.0, 75.0, 37.0, 40.0, 16.0, 17.0, 8.0, 3.0, 7.0, 2.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.908203125, -0.878173828125, -0.84814453125, -0.818115234375, -0.7880859375, -0.758056640625, -0.72802734375, -0.697998046875, -0.66796875, -0.637939453125, -0.60791015625, -0.577880859375, -0.5478515625, -0.517822265625, -0.48779296875, -0.457763671875, -0.427734375, -0.397705078125, -0.36767578125, -0.337646484375, -0.3076171875, -0.277587890625, -0.24755859375, -0.217529296875, -0.1875, -0.157470703125, -0.12744140625, -0.097412109375, -0.0673828125, -0.037353515625, -0.00732421875, 0.022705078125, 0.052734375, 0.082763671875, 0.11279296875, 0.142822265625, 0.1728515625, 0.202880859375, 0.23291015625, 0.262939453125, 0.29296875, 0.322998046875, 0.35302734375, 0.383056640625, 0.4130859375, 0.443115234375, 0.47314453125, 0.503173828125, 0.533203125, 0.563232421875, 0.59326171875, 0.623291015625, 0.6533203125, 0.683349609375, 0.71337890625, 0.743408203125, 0.7734375, 0.803466796875, 0.83349609375, 0.863525390625, 0.8935546875, 0.923583984375, 0.95361328125, 0.983642578125, 1.013671875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 5.0, 7.0, 14.0, 21.0, 25.0, 31.0, 48.0, 50.0, 54.0, 74.0, 93.0, 86.0, 68.0, 72.0, 55.0, 61.0, 49.0, 64.0, 36.0, 30.0, 19.0, 13.0, 7.0, 8.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.416015625, -2.3532867431640625, -2.290557861328125, -2.2278289794921875, -2.16510009765625, -2.1023712158203125, -2.039642333984375, -1.9769134521484375, -1.9141845703125, -1.8514556884765625, -1.788726806640625, -1.7259979248046875, -1.66326904296875, -1.6005401611328125, -1.537811279296875, -1.4750823974609375, -1.412353515625, -1.3496246337890625, -1.286895751953125, -1.2241668701171875, -1.16143798828125, -1.0987091064453125, -1.035980224609375, -0.9732513427734375, -0.9105224609375, -0.8477935791015625, -0.785064697265625, -0.7223358154296875, -0.65960693359375, -0.5968780517578125, -0.534149169921875, -0.4714202880859375, -0.40869140625, -0.3459625244140625, -0.283233642578125, -0.2205047607421875, -0.15777587890625, -0.0950469970703125, -0.032318115234375, 0.0304107666015625, 0.0931396484375, 0.1558685302734375, 0.218597412109375, 0.2813262939453125, 0.34405517578125, 0.4067840576171875, 0.469512939453125, 0.5322418212890625, 0.594970703125, 0.6576995849609375, 0.720428466796875, 0.7831573486328125, 0.84588623046875, 0.9086151123046875, 0.971343994140625, 1.0340728759765625, 1.0968017578125, 1.1595306396484375, 1.222259521484375, 1.2849884033203125, 1.34771728515625, 1.4104461669921875, 1.473175048828125, 1.5359039306640625, 1.5986328125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 7.0, 1.0, 3.0, 5.0, 7.0, 8.0, 9.0, 19.0, 15.0, 26.0, 45.0, 78.0, 96.0, 149.0, 221.0, 444.0, 858.0, 1859.0, 4174.0, 10645.0, 32490.0, 114042.0, 541819.0, 241753.0, 66716.0, 20228.0, 7047.0, 2914.0, 1324.0, 664.0, 346.0, 193.0, 111.0, 78.0, 44.0, 30.0, 20.0, 18.0, 15.0, 10.0, 8.0, 7.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1866455078125, -0.18058395385742188, -0.17452239990234375, -0.16846084594726562, -0.1623992919921875, -0.15633773803710938, -0.15027618408203125, -0.14421463012695312, -0.138153076171875, -0.13209152221679688, -0.12602996826171875, -0.11996841430664062, -0.1139068603515625, -0.10784530639648438, -0.10178375244140625, -0.09572219848632812, -0.08966064453125, -0.08359909057617188, -0.07753753662109375, -0.07147598266601562, -0.0654144287109375, -0.059352874755859375, -0.05329132080078125, -0.047229766845703125, -0.041168212890625, -0.035106658935546875, -0.02904510498046875, -0.022983551025390625, -0.0169219970703125, -0.010860443115234375, -0.00479888916015625, 0.001262664794921875, 0.00732421875, 0.013385772705078125, 0.01944732666015625, 0.025508880615234375, 0.0315704345703125, 0.037631988525390625, 0.04369354248046875, 0.049755096435546875, 0.055816650390625, 0.061878204345703125, 0.06793975830078125, 0.07400131225585938, 0.0800628662109375, 0.08612442016601562, 0.09218597412109375, 0.09824752807617188, 0.10430908203125, 0.11037063598632812, 0.11643218994140625, 0.12249374389648438, 0.1285552978515625, 0.13461685180664062, 0.14067840576171875, 0.14673995971679688, 0.152801513671875, 0.15886306762695312, 0.16492462158203125, 0.17098617553710938, 0.1770477294921875, 0.18310928344726562, 0.18917083740234375, 0.19523239135742188, 0.2012939453125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 5.0, 3.0, 5.0, 4.0, 6.0, 8.0, 21.0, 25.0, 47.0, 53.0, 64.0, 76.0, 82.0, 106.0, 110.0, 96.0, 77.0, 62.0, 40.0, 36.0, 26.0, 13.0, 4.0, 14.0, 5.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.295608520507812e-05, -7.0926733314991e-05, -6.889738142490387e-05, -6.686802953481674e-05, -6.483867764472961e-05, -6.280932575464249e-05, -6.077997386455536e-05, -5.875062197446823e-05, -5.6721270084381104e-05, -5.4691918194293976e-05, -5.266256630420685e-05, -5.063321441411972e-05, -4.860386252403259e-05, -4.6574510633945465e-05, -4.454515874385834e-05, -4.251580685377121e-05, -4.048645496368408e-05, -3.8457103073596954e-05, -3.642775118350983e-05, -3.43983992934227e-05, -3.236904740333557e-05, -3.0339695513248444e-05, -2.8310343623161316e-05, -2.6280991733074188e-05, -2.425163984298706e-05, -2.2222287952899933e-05, -2.0192936062812805e-05, -1.8163584172725677e-05, -1.613423228263855e-05, -1.4104880392551422e-05, -1.2075528502464294e-05, -1.0046176612377167e-05, -8.016824722290039e-06, -5.987472832202911e-06, -3.958120942115784e-06, -1.928769052028656e-06, 1.0058283805847168e-07, 2.1299347281455994e-06, 4.159286618232727e-06, 6.188638508319855e-06, 8.217990398406982e-06, 1.024734228849411e-05, 1.2276694178581238e-05, 1.4306046068668365e-05, 1.6335397958755493e-05, 1.836474984884262e-05, 2.039410173892975e-05, 2.2423453629016876e-05, 2.4452805519104004e-05, 2.648215740919113e-05, 2.851150929927826e-05, 3.054086118936539e-05, 3.2570213079452515e-05, 3.459956496953964e-05, 3.662891685962677e-05, 3.86582687497139e-05, 4.0687620639801025e-05, 4.271697252988815e-05, 4.474632441997528e-05, 4.677567631006241e-05, 4.8805028200149536e-05, 5.0834380090236664e-05, 5.286373198032379e-05, 5.489308387041092e-05, 5.692243576049805e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 12.0, 10.0, 16.0, 30.0, 47.0, 66.0, 119.0, 264.0, 419.0, 925.0, 2357.0, 7146.0, 28717.0, 151689.0, 652933.0, 161636.0, 30352.0, 7349.0, 2507.0, 932.0, 426.0, 230.0, 146.0, 82.0, 54.0, 30.0, 16.0, 13.0, 15.0, 6.0, 6.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.338134765625, -0.3295783996582031, -0.32102203369140625, -0.3124656677246094, -0.3039093017578125, -0.2953529357910156, -0.28679656982421875, -0.2782402038574219, -0.269683837890625, -0.2611274719238281, -0.25257110595703125, -0.24401473999023438, -0.2354583740234375, -0.22690200805664062, -0.21834564208984375, -0.20978927612304688, -0.20123291015625, -0.19267654418945312, -0.18412017822265625, -0.17556381225585938, -0.1670074462890625, -0.15845108032226562, -0.14989471435546875, -0.14133834838867188, -0.132781982421875, -0.12422561645507812, -0.11566925048828125, -0.10711288452148438, -0.0985565185546875, -0.09000015258789062, -0.08144378662109375, -0.07288742065429688, -0.0643310546875, -0.055774688720703125, -0.04721832275390625, -0.038661956787109375, -0.0301055908203125, -0.021549224853515625, -0.01299285888671875, -0.004436492919921875, 0.004119873046875, 0.012676239013671875, 0.02123260498046875, 0.029788970947265625, 0.0383453369140625, 0.046901702880859375, 0.05545806884765625, 0.06401443481445312, 0.07257080078125, 0.08112716674804688, 0.08968353271484375, 0.09823989868164062, 0.1067962646484375, 0.11535263061523438, 0.12390899658203125, 0.13246536254882812, 0.141021728515625, 0.14957809448242188, 0.15813446044921875, 0.16669082641601562, 0.1752471923828125, 0.18380355834960938, 0.19235992431640625, 0.20091629028320312, 0.20947265625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 9.0, 10.0, 13.0, 10.0, 8.0, 10.0, 16.0, 34.0, 40.0, 34.0, 61.0, 50.0, 74.0, 76.0, 63.0, 58.0, 69.0, 80.0, 39.0, 57.0, 34.0, 30.0, 34.0, 25.0, 19.0, 11.0, 11.0, 7.0, 4.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.29052734375, -0.28282737731933594, -0.2751274108886719, -0.2674274444580078, -0.25972747802734375, -0.2520275115966797, -0.24432754516601562, -0.23662757873535156, -0.2289276123046875, -0.22122764587402344, -0.21352767944335938, -0.2058277130126953, -0.19812774658203125, -0.1904277801513672, -0.18272781372070312, -0.17502784729003906, -0.167327880859375, -0.15962791442871094, -0.15192794799804688, -0.1442279815673828, -0.13652801513671875, -0.1288280487060547, -0.12112808227539062, -0.11342811584472656, -0.1057281494140625, -0.09802818298339844, -0.09032821655273438, -0.08262825012207031, -0.07492828369140625, -0.06722831726074219, -0.059528350830078125, -0.05182838439941406, -0.04412841796875, -0.03642845153808594, -0.028728485107421875, -0.021028518676757812, -0.01332855224609375, -0.0056285858154296875, 0.002071380615234375, 0.009771347045898438, 0.0174713134765625, 0.025171279907226562, 0.032871246337890625, 0.04057121276855469, 0.04827117919921875, 0.05597114562988281, 0.06367111206054688, 0.07137107849121094, 0.079071044921875, 0.08677101135253906, 0.09447097778320312, 0.10217094421386719, 0.10987091064453125, 0.11757087707519531, 0.12527084350585938, 0.13297080993652344, 0.1406707763671875, 0.14837074279785156, 0.15607070922851562, 0.1637706756591797, 0.17147064208984375, 0.1791706085205078, 0.18687057495117188, 0.19457054138183594, 0.2022705078125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 7.0, 8.0, 13.0, 28.0, 38.0, 62.0, 116.0, 195.0, 191.0, 111.0, 71.0, 57.0, 33.0, 26.0, 15.0, 5.0, 7.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.01359224319458, -5.859503746032715, -5.70541524887085, -5.551326751708984, -5.397238731384277, -5.243150234222412, -5.089061737060547, -4.934973239898682, -4.780884742736816, -4.626796245574951, -4.472707748413086, -4.318619251251221, -4.1645307540893555, -4.010442733764648, -3.856354236602783, -3.702265739440918, -3.5481772422790527, -3.3940887451171875, -3.2400002479553223, -3.085911989212036, -2.931823492050171, -2.7777349948883057, -2.6236467361450195, -2.4695582389831543, -2.315469741821289, -2.161381244659424, -2.0072927474975586, -1.8532044887542725, -1.6991159915924072, -1.545027494430542, -1.3909391164779663, -1.2368507385253906, -1.0827617645263672, -0.9286733269691467, -0.7745848894119263, -0.6204964518547058, -0.46640801429748535, -0.3123195767402649, -0.15823113918304443, -0.00414276123046875, 0.14994573593139648, 0.30403417348861694, 0.4581226110458374, 0.6122110486030579, 0.7662994861602783, 0.9203879237174988, 1.0744763612747192, 1.228564739227295, 1.3826532363891602, 1.5367417335510254, 1.690830111503601, 1.8449184894561768, 1.999006986618042, 2.1530954837799072, 2.3071837425231934, 2.4612722396850586, 2.615360736846924, 2.769449234008789, 2.9235377311706543, 3.0776259899139404, 3.2317144870758057, 3.385802984237671, 3.539891242980957, 3.6939797401428223, 3.8480682373046875]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 6.0, 2.0, 9.0, 10.0, 10.0, 15.0, 16.0, 29.0, 26.0, 27.0, 28.0, 52.0, 34.0, 58.0, 49.0, 97.0, 84.0, 68.0, 63.0, 40.0, 46.0, 41.0, 31.0, 29.0, 24.0, 21.0, 15.0, 10.0, 14.0, 8.0, 8.0, 2.0, 7.0, 3.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.858007907867432, -5.6725687980651855, -5.4871296882629395, -5.301690578460693, -5.116250991821289, -4.930811882019043, -4.745372772216797, -4.559933662414551, -4.374494552612305, -4.189055442810059, -4.0036163330078125, -3.8181769847869873, -3.632737874984741, -3.447298765182495, -3.26185941696167, -3.076420307159424, -2.8909811973571777, -2.7055420875549316, -2.5201029777526855, -2.3346636295318604, -2.1492245197296143, -1.9637854099273682, -1.7783461809158325, -1.5929069519042969, -1.4074678421020508, -1.2220287322998047, -1.036589503288269, -0.8511503338813782, -0.6657111644744873, -0.48027199506759644, -0.29483282566070557, -0.10939359664916992, 0.07604503631591797, 0.26148420572280884, 0.4469233751296997, 0.6323625445365906, 0.8178017139434814, 1.0032408237457275, 1.1886800527572632, 1.3741192817687988, 1.559558391571045, 1.744997501373291, 1.9304367303848267, 2.1158759593963623, 2.3013150691986084, 2.4867541790008545, 2.6721935272216797, 2.857632637023926, 3.043071746826172, 3.228510856628418, 3.413949966430664, 3.5993893146514893, 3.7848284244537354, 3.9702675342559814, 4.155706882476807, 4.341145992279053, 4.526585102081299, 4.712024211883545, 4.897463321685791, 5.082902431488037, 5.268342018127441, 5.4537811279296875, 5.639220237731934, 5.82465934753418, 6.010098457336426]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 7.0, 14.0, 18.0, 24.0, 36.0, 64.0, 82.0, 120.0, 204.0, 302.0, 447.0, 736.0, 1256.0, 2246.0, 4069.0, 8268.0, 19156.0, 50522.0, 159277.0, 611536.0, 2063995.0, 933395.0, 226273.0, 66947.0, 23990.0, 10074.0, 4818.0, 2606.0, 1418.0, 807.0, 543.0, 328.0, 227.0, 170.0, 118.0, 66.0, 45.0, 30.0, 18.0, 9.0, 7.0, 9.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.299560546875, -0.29009246826171875, -0.2806243896484375, -0.27115631103515625, -0.261688232421875, -0.25222015380859375, -0.2427520751953125, -0.23328399658203125, -0.22381591796875, -0.21434783935546875, -0.2048797607421875, -0.19541168212890625, -0.185943603515625, -0.17647552490234375, -0.1670074462890625, -0.15753936767578125, -0.1480712890625, -0.13860321044921875, -0.1291351318359375, -0.11966705322265625, -0.110198974609375, -0.10073089599609375, -0.0912628173828125, -0.08179473876953125, -0.07232666015625, -0.06285858154296875, -0.0533905029296875, -0.04392242431640625, -0.034454345703125, -0.02498626708984375, -0.0155181884765625, -0.00605010986328125, 0.00341796875, 0.01288604736328125, 0.0223541259765625, 0.03182220458984375, 0.041290283203125, 0.05075836181640625, 0.0602264404296875, 0.06969451904296875, 0.07916259765625, 0.08863067626953125, 0.0980987548828125, 0.10756683349609375, 0.117034912109375, 0.12650299072265625, 0.1359710693359375, 0.14543914794921875, 0.1549072265625, 0.16437530517578125, 0.1738433837890625, 0.18331146240234375, 0.192779541015625, 0.20224761962890625, 0.2117156982421875, 0.22118377685546875, 0.23065185546875, 0.24011993408203125, 0.2495880126953125, 0.25905609130859375, 0.268524169921875, 0.27799224853515625, 0.2874603271484375, 0.29692840576171875, 0.306396484375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 4.0, 4.0, 6.0, 4.0, 8.0, 10.0, 8.0, 12.0, 17.0, 13.0, 23.0, 32.0, 24.0, 27.0, 25.0, 45.0, 54.0, 56.0, 59.0, 44.0, 51.0, 51.0, 43.0, 50.0, 58.0, 37.0, 32.0, 29.0, 31.0, 19.0, 22.0, 22.0, 17.0, 8.0, 11.0, 10.0, 8.0, 8.0, 11.0, 1.0, 5.0, 3.0, 1.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.317626953125, -0.3072776794433594, -0.29692840576171875, -0.2865791320800781, -0.2762298583984375, -0.2658805847167969, -0.25553131103515625, -0.24518203735351562, -0.234832763671875, -0.22448348999023438, -0.21413421630859375, -0.20378494262695312, -0.1934356689453125, -0.18308639526367188, -0.17273712158203125, -0.16238784790039062, -0.15203857421875, -0.14168930053710938, -0.13134002685546875, -0.12099075317382812, -0.1106414794921875, -0.10029220581054688, -0.08994293212890625, -0.07959365844726562, -0.069244384765625, -0.058895111083984375, -0.04854583740234375, -0.038196563720703125, -0.0278472900390625, -0.017498016357421875, -0.00714874267578125, 0.003200531005859375, 0.0135498046875, 0.023899078369140625, 0.03424835205078125, 0.044597625732421875, 0.0549468994140625, 0.06529617309570312, 0.07564544677734375, 0.08599472045898438, 0.096343994140625, 0.10669326782226562, 0.11704254150390625, 0.12739181518554688, 0.1377410888671875, 0.14809036254882812, 0.15843963623046875, 0.16878890991210938, 0.17913818359375, 0.18948745727539062, 0.19983673095703125, 0.21018600463867188, 0.2205352783203125, 0.23088455200195312, 0.24123382568359375, 0.2515830993652344, 0.261932373046875, 0.2722816467285156, 0.28263092041015625, 0.2929801940917969, 0.3033294677734375, 0.3136787414550781, 0.32402801513671875, 0.3343772888183594, 0.3447265625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 7.0, 3.0, 7.0, 7.0, 13.0, 7.0, 18.0, 15.0, 22.0, 29.0, 39.0, 61.0, 85.0, 158.0, 306.0, 685.0, 1763.0, 6090.0, 28600.0, 220290.0, 3360750.0, 512585.0, 48959.0, 9515.0, 2580.0, 832.0, 317.0, 209.0, 106.0, 64.0, 37.0, 29.0, 18.0, 14.0, 18.0, 15.0, 10.0, 5.0, 6.0, 3.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.86669921875, -0.8423843383789062, -0.8180694580078125, -0.7937545776367188, -0.769439697265625, -0.7451248168945312, -0.7208099365234375, -0.6964950561523438, -0.67218017578125, -0.6478652954101562, -0.6235504150390625, -0.5992355346679688, -0.574920654296875, -0.5506057739257812, -0.5262908935546875, -0.5019760131835938, -0.4776611328125, -0.45334625244140625, -0.4290313720703125, -0.40471649169921875, -0.380401611328125, -0.35608673095703125, -0.3317718505859375, -0.30745697021484375, -0.28314208984375, -0.25882720947265625, -0.2345123291015625, -0.21019744873046875, -0.185882568359375, -0.16156768798828125, -0.1372528076171875, -0.11293792724609375, -0.088623046875, -0.06430816650390625, -0.0399932861328125, -0.01567840576171875, 0.008636474609375, 0.03295135498046875, 0.0572662353515625, 0.08158111572265625, 0.10589599609375, 0.13021087646484375, 0.1545257568359375, 0.17884063720703125, 0.203155517578125, 0.22747039794921875, 0.2517852783203125, 0.27610015869140625, 0.3004150390625, 0.32472991943359375, 0.3490447998046875, 0.37335968017578125, 0.397674560546875, 0.42198944091796875, 0.4463043212890625, 0.47061920166015625, 0.49493408203125, 0.5192489624023438, 0.5435638427734375, 0.5678787231445312, 0.592193603515625, 0.6165084838867188, 0.6408233642578125, 0.6651382446289062, 0.689453125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 12.0, 13.0, 17.0, 30.0, 45.0, 51.0, 64.0, 87.0, 160.0, 285.0, 502.0, 744.0, 740.0, 477.0, 259.0, 170.0, 107.0, 90.0, 60.0, 30.0, 26.0, 28.0, 19.0, 11.0, 9.0, 8.0, 8.0, 6.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6953125, -0.6728668212890625, -0.650421142578125, -0.6279754638671875, -0.60552978515625, -0.5830841064453125, -0.560638427734375, -0.5381927490234375, -0.5157470703125, -0.4933013916015625, -0.470855712890625, -0.4484100341796875, -0.42596435546875, -0.4035186767578125, -0.381072998046875, -0.3586273193359375, -0.336181640625, -0.3137359619140625, -0.291290283203125, -0.2688446044921875, -0.24639892578125, -0.2239532470703125, -0.201507568359375, -0.1790618896484375, -0.1566162109375, -0.1341705322265625, -0.111724853515625, -0.0892791748046875, -0.06683349609375, -0.0443878173828125, -0.021942138671875, 0.0005035400390625, 0.02294921875, 0.0453948974609375, 0.067840576171875, 0.0902862548828125, 0.11273193359375, 0.1351776123046875, 0.157623291015625, 0.1800689697265625, 0.2025146484375, 0.2249603271484375, 0.247406005859375, 0.2698516845703125, 0.29229736328125, 0.3147430419921875, 0.337188720703125, 0.3596343994140625, 0.382080078125, 0.4045257568359375, 0.426971435546875, 0.4494171142578125, 0.47186279296875, 0.4943084716796875, 0.516754150390625, 0.5391998291015625, 0.5616455078125, 0.5840911865234375, 0.606536865234375, 0.6289825439453125, 0.65142822265625, 0.6738739013671875, 0.696319580078125, 0.7187652587890625, 0.7412109375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 15.0, 24.0, 45.0, 108.0, 138.0, 192.0, 176.0, 125.0, 70.0, 42.0, 16.0, 18.0, 9.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0754010677337646, -2.8743784427642822, -2.6733555793762207, -2.4723329544067383, -2.271310329437256, -2.0702877044677734, -1.869264841079712, -1.6682422161102295, -1.4672194719314575, -1.2661967277526855, -1.0651741027832031, -0.8641513586044312, -0.663128674030304, -0.46210598945617676, -0.2610832452774048, -0.06006062030792236, 0.1409621238708496, 0.3419848084449768, 0.543007493019104, 0.744030237197876, 0.9450529217720032, 1.1460756063461304, 1.3470983505249023, 1.5481209754943848, 1.7491437196731567, 1.9501664638519287, 2.151189088821411, 2.3522119522094727, 2.553234577178955, 2.7542572021484375, 2.95527982711792, 3.1563024520874023, 3.3573250770568848, 3.558347702026367, 3.7593705654144287, 3.960393190383911, 4.161416053771973, 4.362438678741455, 4.5634613037109375, 4.76448392868042, 4.965506553649902, 5.166529178619385, 5.367551803588867, 5.568574905395508, 5.76959753036499, 5.970620155334473, 6.171642780303955, 6.3726654052734375, 6.573688507080078, 6.7747111320495605, 6.975733757019043, 7.176756858825684, 7.377779483795166, 7.578802108764648, 7.779824733734131, 7.980847358703613, 8.181869506835938, 8.382892608642578, 8.583914756774902, 8.784937858581543, 8.985960006713867, 9.186983108520508, 9.388006210327148, 9.589028358459473, 9.790051460266113]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 7.0, 2.0, 12.0, 7.0, 12.0, 14.0, 16.0, 20.0, 20.0, 20.0, 28.0, 26.0, 27.0, 40.0, 34.0, 51.0, 37.0, 32.0, 36.0, 41.0, 36.0, 42.0, 27.0, 38.0, 44.0, 38.0, 38.0, 28.0, 27.0, 28.0, 28.0, 29.0, 20.0, 12.0, 20.0, 8.0, 10.0, 7.0, 8.0, 6.0, 5.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-3.0805978775024414, -2.9904825687408447, -2.900367259979248, -2.8102517127990723, -2.7201364040374756, -2.630021095275879, -2.5399057865142822, -2.4497904777526855, -2.3596749305725098, -2.269559621810913, -2.1794443130493164, -2.0893287658691406, -1.999213457107544, -1.9090981483459473, -1.8189828395843506, -1.728867530822754, -1.6387522220611572, -1.5486369132995605, -1.4585214853286743, -1.3684061765670776, -1.2782907485961914, -1.1881754398345947, -1.098060131072998, -1.0079448223114014, -0.9178293943405151, -0.8277140259742737, -0.7375986576080322, -0.6474833488464355, -0.5573679804801941, -0.46725261211395264, -0.37713730335235596, -0.2870219349861145, -0.19690680503845215, -0.10679145157337189, -0.016676098108291626, 0.07343924045562744, 0.1635546088218689, 0.25366997718811035, 0.34378528594970703, 0.4339006543159485, 0.5240160226821899, 0.6141313910484314, 0.7042467594146729, 0.7943620681762695, 0.884477436542511, 0.9745928049087524, 1.0647081136703491, 1.1548235416412354, 1.244938850402832, 1.3350541591644287, 1.425169587135315, 1.5152848958969116, 1.6054003238677979, 1.6955156326293945, 1.7856309413909912, 1.875746250152588, 1.9658616781234741, 2.0559771060943604, 2.146092414855957, 2.2362077236175537, 2.3263230323791504, 2.416438579559326, 2.5065536499023438, 2.5966691970825195, 2.686784505844116]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 4.0, 18.0, 20.0, 21.0, 20.0, 43.0, 77.0, 83.0, 134.0, 225.0, 352.0, 638.0, 1108.0, 2124.0, 4068.0, 9015.0, 21472.0, 58053.0, 178271.0, 403710.0, 241268.0, 77785.0, 27915.0, 11529.0, 4964.0, 2394.0, 1296.0, 742.0, 484.0, 248.0, 144.0, 98.0, 73.0, 43.0, 39.0, 23.0, 19.0, 8.0, 5.0, 6.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40869140625, -0.3949012756347656, -0.38111114501953125, -0.3673210144042969, -0.3535308837890625, -0.3397407531738281, -0.32595062255859375, -0.3121604919433594, -0.298370361328125, -0.2845802307128906, -0.27079010009765625, -0.2569999694824219, -0.2432098388671875, -0.22941970825195312, -0.21562957763671875, -0.20183944702148438, -0.18804931640625, -0.17425918579101562, -0.16046905517578125, -0.14667892456054688, -0.1328887939453125, -0.11909866333007812, -0.10530853271484375, -0.09151840209960938, -0.077728271484375, -0.06393814086914062, -0.05014801025390625, -0.036357879638671875, -0.0225677490234375, -0.008777618408203125, 0.00501251220703125, 0.018802642822265625, 0.0325927734375, 0.046382904052734375, 0.06017303466796875, 0.07396316528320312, 0.0877532958984375, 0.10154342651367188, 0.11533355712890625, 0.12912368774414062, 0.142913818359375, 0.15670394897460938, 0.17049407958984375, 0.18428421020507812, 0.1980743408203125, 0.21186447143554688, 0.22565460205078125, 0.23944473266601562, 0.25323486328125, 0.2670249938964844, 0.28081512451171875, 0.2946052551269531, 0.3083953857421875, 0.3221855163574219, 0.33597564697265625, 0.3497657775878906, 0.363555908203125, 0.3773460388183594, 0.39113616943359375, 0.4049263000488281, 0.4187164306640625, 0.4325065612792969, 0.44629669189453125, 0.4600868225097656, 0.473876953125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 5.0, 11.0, 12.0, 4.0, 8.0, 9.0, 17.0, 17.0, 25.0, 28.0, 26.0, 40.0, 44.0, 43.0, 38.0, 36.0, 54.0, 53.0, 56.0, 48.0, 55.0, 42.0, 30.0, 44.0, 44.0, 28.0, 23.0, 19.0, 21.0, 18.0, 15.0, 17.0, 20.0, 8.0, 9.0, 8.0, 6.0, 1.0, 2.0, 3.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.36572265625, -0.355377197265625, -0.34503173828125, -0.334686279296875, -0.3243408203125, -0.313995361328125, -0.30364990234375, -0.293304443359375, -0.282958984375, -0.272613525390625, -0.26226806640625, -0.251922607421875, -0.2415771484375, -0.231231689453125, -0.22088623046875, -0.210540771484375, -0.2001953125, -0.189849853515625, -0.17950439453125, -0.169158935546875, -0.1588134765625, -0.148468017578125, -0.13812255859375, -0.127777099609375, -0.117431640625, -0.107086181640625, -0.09674072265625, -0.086395263671875, -0.0760498046875, -0.065704345703125, -0.05535888671875, -0.045013427734375, -0.03466796875, -0.024322509765625, -0.01397705078125, -0.003631591796875, 0.0067138671875, 0.017059326171875, 0.02740478515625, 0.037750244140625, 0.048095703125, 0.058441162109375, 0.06878662109375, 0.079132080078125, 0.0894775390625, 0.099822998046875, 0.11016845703125, 0.120513916015625, 0.130859375, 0.141204833984375, 0.15155029296875, 0.161895751953125, 0.1722412109375, 0.182586669921875, 0.19293212890625, 0.203277587890625, 0.213623046875, 0.223968505859375, 0.23431396484375, 0.244659423828125, 0.2550048828125, 0.265350341796875, 0.27569580078125, 0.286041259765625, 0.29638671875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 4.0, 9.0, 9.0, 16.0, 23.0, 24.0, 29.0, 56.0, 56.0, 107.0, 173.0, 252.0, 451.0, 1014.0, 2758.0, 12012.0, 101866.0, 795129.0, 116182.0, 13230.0, 2938.0, 966.0, 488.0, 252.0, 159.0, 117.0, 61.0, 51.0, 39.0, 26.0, 15.0, 15.0, 7.0, 7.0, 3.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87646484375, -0.8467788696289062, -0.8170928955078125, -0.7874069213867188, -0.757720947265625, -0.7280349731445312, -0.6983489990234375, -0.6686630249023438, -0.63897705078125, -0.6092910766601562, -0.5796051025390625, -0.5499191284179688, -0.520233154296875, -0.49054718017578125, -0.4608612060546875, -0.43117523193359375, -0.4014892578125, -0.37180328369140625, -0.3421173095703125, -0.31243133544921875, -0.282745361328125, -0.25305938720703125, -0.2233734130859375, -0.19368743896484375, -0.16400146484375, -0.13431549072265625, -0.1046295166015625, -0.07494354248046875, -0.045257568359375, -0.01557159423828125, 0.0141143798828125, 0.04380035400390625, 0.073486328125, 0.10317230224609375, 0.1328582763671875, 0.16254425048828125, 0.192230224609375, 0.22191619873046875, 0.2516021728515625, 0.28128814697265625, 0.31097412109375, 0.34066009521484375, 0.3703460693359375, 0.40003204345703125, 0.429718017578125, 0.45940399169921875, 0.4890899658203125, 0.5187759399414062, 0.5484619140625, 0.5781478881835938, 0.6078338623046875, 0.6375198364257812, 0.667205810546875, 0.6968917846679688, 0.7265777587890625, 0.7562637329101562, 0.78594970703125, 0.8156356811523438, 0.8453216552734375, 0.8750076293945312, 0.904693603515625, 0.9343795776367188, 0.9640655517578125, 0.9937515258789062, 1.0234375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 4.0, 2.0, 8.0, 6.0, 10.0, 13.0, 11.0, 21.0, 13.0, 12.0, 19.0, 25.0, 30.0, 35.0, 29.0, 30.0, 46.0, 52.0, 36.0, 44.0, 45.0, 51.0, 42.0, 45.0, 51.0, 37.0, 34.0, 41.0, 39.0, 17.0, 23.0, 26.0, 27.0, 10.0, 11.0, 8.0, 7.0, 8.0, 6.0, 9.0, 8.0, 1.0, 0.0, 5.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.0166015625, -0.9827423095703125, -0.948883056640625, -0.9150238037109375, -0.88116455078125, -0.8473052978515625, -0.813446044921875, -0.7795867919921875, -0.7457275390625, -0.7118682861328125, -0.678009033203125, -0.6441497802734375, -0.61029052734375, -0.5764312744140625, -0.542572021484375, -0.5087127685546875, -0.474853515625, -0.4409942626953125, -0.407135009765625, -0.3732757568359375, -0.33941650390625, -0.3055572509765625, -0.271697998046875, -0.2378387451171875, -0.2039794921875, -0.1701202392578125, -0.136260986328125, -0.1024017333984375, -0.06854248046875, -0.0346832275390625, -0.000823974609375, 0.0330352783203125, 0.06689453125, 0.1007537841796875, 0.134613037109375, 0.1684722900390625, 0.20233154296875, 0.2361907958984375, 0.270050048828125, 0.3039093017578125, 0.3377685546875, 0.3716278076171875, 0.405487060546875, 0.4393463134765625, 0.47320556640625, 0.5070648193359375, 0.540924072265625, 0.5747833251953125, 0.608642578125, 0.6425018310546875, 0.676361083984375, 0.7102203369140625, 0.74407958984375, 0.7779388427734375, 0.811798095703125, 0.8456573486328125, 0.8795166015625, 0.9133758544921875, 0.947235107421875, 0.9810943603515625, 1.01495361328125, 1.0488128662109375, 1.082672119140625, 1.1165313720703125, 1.150390625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 9.0, 6.0, 9.0, 18.0, 23.0, 32.0, 59.0, 92.0, 204.0, 344.0, 754.0, 1726.0, 4410.0, 15032.0, 70416.0, 733285.0, 181760.0, 28056.0, 7622.0, 2567.0, 1016.0, 484.0, 250.0, 126.0, 91.0, 51.0, 39.0, 17.0, 8.0, 7.0, 11.0, 8.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.275390625, -0.26697540283203125, -0.2585601806640625, -0.25014495849609375, -0.241729736328125, -0.23331451416015625, -0.2248992919921875, -0.21648406982421875, -0.20806884765625, -0.19965362548828125, -0.1912384033203125, -0.18282318115234375, -0.174407958984375, -0.16599273681640625, -0.1575775146484375, -0.14916229248046875, -0.1407470703125, -0.13233184814453125, -0.1239166259765625, -0.11550140380859375, -0.107086181640625, -0.09867095947265625, -0.0902557373046875, -0.08184051513671875, -0.07342529296875, -0.06501007080078125, -0.0565948486328125, -0.04817962646484375, -0.039764404296875, -0.03134918212890625, -0.0229339599609375, -0.01451873779296875, -0.006103515625, 0.00231170654296875, 0.0107269287109375, 0.01914215087890625, 0.027557373046875, 0.03597259521484375, 0.0443878173828125, 0.05280303955078125, 0.06121826171875, 0.06963348388671875, 0.0780487060546875, 0.08646392822265625, 0.094879150390625, 0.10329437255859375, 0.1117095947265625, 0.12012481689453125, 0.1285400390625, 0.13695526123046875, 0.1453704833984375, 0.15378570556640625, 0.162200927734375, 0.17061614990234375, 0.1790313720703125, 0.18744659423828125, 0.19586181640625, 0.20427703857421875, 0.2126922607421875, 0.22110748291015625, 0.229522705078125, 0.23793792724609375, 0.2463531494140625, 0.25476837158203125, 0.26318359375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 6.0, 4.0, 4.0, 11.0, 12.0, 15.0, 19.0, 28.0, 41.0, 59.0, 65.0, 108.0, 153.0, 133.0, 116.0, 80.0, 41.0, 27.0, 23.0, 18.0, 16.0, 5.0, 6.0, 7.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.113550186157227e-05, -8.884910494089127e-05, -8.656270802021027e-05, -8.427631109952927e-05, -8.198991417884827e-05, -7.970351725816727e-05, -7.741712033748627e-05, -7.513072341680527e-05, -7.284432649612427e-05, -7.055792957544327e-05, -6.827153265476227e-05, -6.598513573408127e-05, -6.369873881340027e-05, -6.141234189271927e-05, -5.912594497203827e-05, -5.683954805135727e-05, -5.455315113067627e-05, -5.226675420999527e-05, -4.998035728931427e-05, -4.769396036863327e-05, -4.540756344795227e-05, -4.312116652727127e-05, -4.083476960659027e-05, -3.854837268590927e-05, -3.626197576522827e-05, -3.397557884454727e-05, -3.168918192386627e-05, -2.9402785003185272e-05, -2.7116388082504272e-05, -2.4829991161823273e-05, -2.2543594241142273e-05, -2.0257197320461273e-05, -1.7970800399780273e-05, -1.5684403479099274e-05, -1.3398006558418274e-05, -1.1111609637737274e-05, -8.825212717056274e-06, -6.538815796375275e-06, -4.252418875694275e-06, -1.966021955013275e-06, 3.203749656677246e-07, 2.6067718863487244e-06, 4.893168807029724e-06, 7.179565727710724e-06, 9.465962648391724e-06, 1.1752359569072723e-05, 1.4038756489753723e-05, 1.6325153410434723e-05, 1.8611550331115723e-05, 2.0897947251796722e-05, 2.3184344172477722e-05, 2.5470741093158722e-05, 2.775713801383972e-05, 3.004353493452072e-05, 3.232993185520172e-05, 3.461632877588272e-05, 3.690272569656372e-05, 3.918912261724472e-05, 4.147551953792572e-05, 4.376191645860672e-05, 4.604831337928772e-05, 4.833471029996872e-05, 5.062110722064972e-05, 5.290750414133072e-05, 5.519390106201172e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 0.0, 6.0, 6.0, 13.0, 15.0, 18.0, 36.0, 54.0, 75.0, 127.0, 235.0, 361.0, 693.0, 1480.0, 3743.0, 11543.0, 50443.0, 559159.0, 355465.0, 47197.0, 11153.0, 3578.0, 1490.0, 720.0, 374.0, 217.0, 125.0, 90.0, 37.0, 35.0, 18.0, 13.0, 10.0, 3.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0], "bins": [-0.299072265625, -0.290985107421875, -0.28289794921875, -0.274810791015625, -0.2667236328125, -0.258636474609375, -0.25054931640625, -0.242462158203125, -0.234375, -0.226287841796875, -0.21820068359375, -0.210113525390625, -0.2020263671875, -0.193939208984375, -0.18585205078125, -0.177764892578125, -0.169677734375, -0.161590576171875, -0.15350341796875, -0.145416259765625, -0.1373291015625, -0.129241943359375, -0.12115478515625, -0.113067626953125, -0.10498046875, -0.096893310546875, -0.08880615234375, -0.080718994140625, -0.0726318359375, -0.064544677734375, -0.05645751953125, -0.048370361328125, -0.040283203125, -0.032196044921875, -0.02410888671875, -0.016021728515625, -0.0079345703125, 0.000152587890625, 0.00823974609375, 0.016326904296875, 0.0244140625, 0.032501220703125, 0.04058837890625, 0.048675537109375, 0.0567626953125, 0.064849853515625, 0.07293701171875, 0.081024169921875, 0.089111328125, 0.097198486328125, 0.10528564453125, 0.113372802734375, 0.1214599609375, 0.129547119140625, 0.13763427734375, 0.145721435546875, 0.15380859375, 0.161895751953125, 0.16998291015625, 0.178070068359375, 0.1861572265625, 0.194244384765625, 0.20233154296875, 0.210418701171875, 0.218505859375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 6.0, 0.0, 7.0, 5.0, 10.0, 9.0, 8.0, 10.0, 10.0, 13.0, 16.0, 21.0, 33.0, 42.0, 42.0, 60.0, 71.0, 82.0, 75.0, 74.0, 62.0, 64.0, 43.0, 47.0, 37.0, 26.0, 25.0, 19.0, 15.0, 15.0, 5.0, 6.0, 1.0, 6.0, 3.0, 9.0, 3.0, 4.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1751708984375, -0.16910362243652344, -0.16303634643554688, -0.1569690704345703, -0.15090179443359375, -0.1448345184326172, -0.13876724243164062, -0.13269996643066406, -0.1266326904296875, -0.12056541442871094, -0.11449813842773438, -0.10843086242675781, -0.10236358642578125, -0.09629631042480469, -0.09022903442382812, -0.08416175842285156, -0.078094482421875, -0.07202720642089844, -0.06595993041992188, -0.05989265441894531, -0.05382537841796875, -0.04775810241699219, -0.041690826416015625, -0.03562355041503906, -0.0295562744140625, -0.023488998413085938, -0.017421722412109375, -0.011354446411132812, -0.00528717041015625, 0.0007801055908203125, 0.006847381591796875, 0.012914657592773438, 0.01898193359375, 0.025049209594726562, 0.031116485595703125, 0.03718376159667969, 0.04325103759765625, 0.04931831359863281, 0.055385589599609375, 0.06145286560058594, 0.0675201416015625, 0.07358741760253906, 0.07965469360351562, 0.08572196960449219, 0.09178924560546875, 0.09785652160644531, 0.10392379760742188, 0.10999107360839844, 0.116058349609375, 0.12212562561035156, 0.12819290161132812, 0.1342601776123047, 0.14032745361328125, 0.1463947296142578, 0.15246200561523438, 0.15852928161621094, 0.1645965576171875, 0.17066383361816406, 0.17673110961914062, 0.1827983856201172, 0.18886566162109375, 0.1949329376220703, 0.20100021362304688, 0.20706748962402344, 0.213134765625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 13.0, 20.0, 41.0, 69.0, 115.0, 279.0, 224.0, 94.0, 55.0, 33.0, 19.0, 12.0, 7.0, 2.0, 3.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.70998764038086, -8.501585960388184, -8.293184280395508, -8.084782600402832, -7.876380920410156, -7.6679792404174805, -7.459577560424805, -7.251175880432129, -7.042774200439453, -6.834372520446777, -6.625970840454102, -6.417569160461426, -6.20916748046875, -6.000765800476074, -5.792364120483398, -5.583962440490723, -5.375561237335205, -5.167159557342529, -4.9587578773498535, -4.750356197357178, -4.541954517364502, -4.333552837371826, -4.125151634216309, -3.9167497158050537, -3.708348035812378, -3.499946355819702, -3.2915446758270264, -3.0831432342529297, -2.874741554260254, -2.666339874267578, -2.4579381942749023, -2.2495365142822266, -2.0411343574523926, -1.8327326774597168, -1.624330997467041, -1.4159294366836548, -1.207527756690979, -0.9991260766983032, -0.790724515914917, -0.5823228359222412, -0.37392115592956543, -0.16551950573921204, 0.04288214445114136, 0.25128376483917236, 0.45968544483184814, 0.6680871248245239, 0.8764886856079102, 1.084890365600586, 1.2932920455932617, 1.5016937255859375, 1.7100954055786133, 1.9184969663619995, 2.126898765563965, 2.3353004455566406, 2.5437018871307373, 2.752103567123413, 2.960505247116089, 3.1689069271087646, 3.3773086071014404, 3.585710048675537, 3.794111728668213, 4.002513408660889, 4.2109150886535645, 4.41931676864624, 4.627718448638916]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 6.0, 3.0, 10.0, 8.0, 14.0, 15.0, 18.0, 12.0, 19.0, 23.0, 21.0, 31.0, 33.0, 35.0, 37.0, 55.0, 68.0, 82.0, 93.0, 64.0, 47.0, 33.0, 42.0, 33.0, 26.0, 21.0, 27.0, 19.0, 16.0, 13.0, 17.0, 10.0, 12.0, 5.0, 8.0, 7.0, 0.0, 5.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.346907615661621, -4.211079120635986, -4.075250148773193, -3.9394216537475586, -3.803593158721924, -3.66776442527771, -3.531935691833496, -3.3961071968078613, -3.2602784633636475, -3.1244497299194336, -2.988621234893799, -2.852792501449585, -2.716963768005371, -2.5811352729797363, -2.4453065395355225, -2.3094778060913086, -2.173649311065674, -2.03782057762146, -1.9019920825958252, -1.7661633491516113, -1.630334734916687, -1.4945061206817627, -1.3586773872375488, -1.2228487730026245, -1.0870201587677002, -0.9511915445327759, -0.8153628706932068, -0.6795341968536377, -0.5437055826187134, -0.40787696838378906, -0.27204829454421997, -0.13621962070465088, -0.0003914833068847656, 0.13543716073036194, 0.27126580476760864, 0.40709444880485535, 0.542923092842102, 0.6787517070770264, 0.8145803809165955, 0.9504090547561646, 1.0862376689910889, 1.2220662832260132, 1.3578948974609375, 1.4937236309051514, 1.6295522451400757, 1.765380859375, 1.9012095928192139, 2.0370383262634277, 2.1728668212890625, 2.3086955547332764, 2.444524049758911, 2.580352783203125, 2.7161812782287598, 2.8520100116729736, 2.9878387451171875, 3.1236672401428223, 3.259495973587036, 3.39532470703125, 3.5311532020568848, 3.6669819355010986, 3.8028106689453125, 3.9386391639709473, 4.074467658996582, 4.210296630859375, 4.34612512588501]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 2.0, 3.0, 3.0, 8.0, 7.0, 8.0, 13.0, 16.0, 21.0, 10.0, 16.0, 21.0, 40.0, 53.0, 101.0, 245.0, 654.0, 2210.0, 9216.0, 61895.0, 1132691.0, 2821246.0, 144080.0, 16469.0, 3526.0, 1024.0, 304.0, 133.0, 81.0, 42.0, 29.0, 24.0, 16.0, 12.0, 12.0, 10.0, 9.0, 6.0, 6.0, 6.0, 2.0, 5.0, 2.0, 4.0, 0.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76318359375, -0.74017333984375, -0.7171630859375, -0.69415283203125, -0.671142578125, -0.64813232421875, -0.6251220703125, -0.60211181640625, -0.5791015625, -0.55609130859375, -0.5330810546875, -0.51007080078125, -0.487060546875, -0.46405029296875, -0.4410400390625, -0.41802978515625, -0.39501953125, -0.37200927734375, -0.3489990234375, -0.32598876953125, -0.302978515625, -0.27996826171875, -0.2569580078125, -0.23394775390625, -0.2109375, -0.18792724609375, -0.1649169921875, -0.14190673828125, -0.118896484375, -0.09588623046875, -0.0728759765625, -0.04986572265625, -0.02685546875, -0.00384521484375, 0.0191650390625, 0.04217529296875, 0.065185546875, 0.08819580078125, 0.1112060546875, 0.13421630859375, 0.1572265625, 0.18023681640625, 0.2032470703125, 0.22625732421875, 0.249267578125, 0.27227783203125, 0.2952880859375, 0.31829833984375, 0.34130859375, 0.36431884765625, 0.3873291015625, 0.41033935546875, 0.433349609375, 0.45635986328125, 0.4793701171875, 0.50238037109375, 0.525390625, 0.54840087890625, 0.5714111328125, 0.59442138671875, 0.617431640625, 0.64044189453125, 0.6634521484375, 0.68646240234375, 0.70947265625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 3.0, 6.0, 5.0, 8.0, 8.0, 14.0, 14.0, 8.0, 12.0, 17.0, 21.0, 21.0, 24.0, 42.0, 46.0, 36.0, 48.0, 46.0, 52.0, 53.0, 59.0, 46.0, 53.0, 33.0, 44.0, 37.0, 31.0, 41.0, 26.0, 14.0, 17.0, 25.0, 15.0, 13.0, 15.0, 12.0, 8.0, 7.0, 6.0, 7.0, 0.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.365478515625, -0.35540008544921875, -0.3453216552734375, -0.33524322509765625, -0.325164794921875, -0.31508636474609375, -0.3050079345703125, -0.29492950439453125, -0.28485107421875, -0.27477264404296875, -0.2646942138671875, -0.25461578369140625, -0.244537353515625, -0.23445892333984375, -0.2243804931640625, -0.21430206298828125, -0.2042236328125, -0.19414520263671875, -0.1840667724609375, -0.17398834228515625, -0.163909912109375, -0.15383148193359375, -0.1437530517578125, -0.13367462158203125, -0.12359619140625, -0.11351776123046875, -0.1034393310546875, -0.09336090087890625, -0.083282470703125, -0.07320404052734375, -0.0631256103515625, -0.05304718017578125, -0.04296875, -0.03289031982421875, -0.0228118896484375, -0.01273345947265625, -0.002655029296875, 0.00742340087890625, 0.0175018310546875, 0.02758026123046875, 0.03765869140625, 0.04773712158203125, 0.0578155517578125, 0.06789398193359375, 0.077972412109375, 0.08805084228515625, 0.0981292724609375, 0.10820770263671875, 0.1182861328125, 0.12836456298828125, 0.1384429931640625, 0.14852142333984375, 0.158599853515625, 0.16867828369140625, 0.1787567138671875, 0.18883514404296875, 0.19891357421875, 0.20899200439453125, 0.2190704345703125, 0.22914886474609375, 0.239227294921875, 0.24930572509765625, 0.2593841552734375, 0.26946258544921875, 0.279541015625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 11.0, 13.0, 18.0, 37.0, 36.0, 63.0, 104.0, 157.0, 346.0, 837.0, 3095.0, 19417.0, 318112.0, 3712664.0, 124443.0, 11314.0, 2182.0, 710.0, 319.0, 147.0, 82.0, 48.0, 45.0, 24.0, 12.0, 8.0, 9.0, 5.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1376953125, -1.1045913696289062, -1.0714874267578125, -1.0383834838867188, -1.005279541015625, -0.9721755981445312, -0.9390716552734375, -0.9059677124023438, -0.87286376953125, -0.8397598266601562, -0.8066558837890625, -0.7735519409179688, -0.740447998046875, -0.7073440551757812, -0.6742401123046875, -0.6411361694335938, -0.6080322265625, -0.5749282836914062, -0.5418243408203125, -0.5087203979492188, -0.475616455078125, -0.44251251220703125, -0.4094085693359375, -0.37630462646484375, -0.34320068359375, -0.31009674072265625, -0.2769927978515625, -0.24388885498046875, -0.210784912109375, -0.17768096923828125, -0.1445770263671875, -0.11147308349609375, -0.078369140625, -0.04526519775390625, -0.0121612548828125, 0.02094268798828125, 0.054046630859375, 0.08715057373046875, 0.1202545166015625, 0.15335845947265625, 0.18646240234375, 0.21956634521484375, 0.2526702880859375, 0.28577423095703125, 0.318878173828125, 0.35198211669921875, 0.3850860595703125, 0.41819000244140625, 0.4512939453125, 0.48439788818359375, 0.5175018310546875, 0.5506057739257812, 0.583709716796875, 0.6168136596679688, 0.6499176025390625, 0.6830215454101562, 0.71612548828125, 0.7492294311523438, 0.7823333740234375, 0.8154373168945312, 0.848541259765625, 0.8816452026367188, 0.9147491455078125, 0.9478530883789062, 0.98095703125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 11.0, 12.0, 19.0, 27.0, 36.0, 65.0, 95.0, 157.0, 303.0, 546.0, 1017.0, 816.0, 405.0, 217.0, 130.0, 72.0, 49.0, 34.0, 17.0, 14.0, 19.0, 6.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89794921875, -0.8687973022460938, -0.8396453857421875, -0.8104934692382812, -0.781341552734375, -0.7521896362304688, -0.7230377197265625, -0.6938858032226562, -0.66473388671875, -0.6355819702148438, -0.6064300537109375, -0.5772781372070312, -0.548126220703125, -0.5189743041992188, -0.4898223876953125, -0.46067047119140625, -0.4315185546875, -0.40236663818359375, -0.3732147216796875, -0.34406280517578125, -0.314910888671875, -0.28575897216796875, -0.2566070556640625, -0.22745513916015625, -0.19830322265625, -0.16915130615234375, -0.1399993896484375, -0.11084747314453125, -0.081695556640625, -0.05254364013671875, -0.0233917236328125, 0.00576019287109375, 0.034912109375, 0.06406402587890625, 0.0932159423828125, 0.12236785888671875, 0.151519775390625, 0.18067169189453125, 0.2098236083984375, 0.23897552490234375, 0.26812744140625, 0.29727935791015625, 0.3264312744140625, 0.35558319091796875, 0.384735107421875, 0.41388702392578125, 0.4430389404296875, 0.47219085693359375, 0.5013427734375, 0.5304946899414062, 0.5596466064453125, 0.5887985229492188, 0.617950439453125, 0.6471023559570312, 0.6762542724609375, 0.7054061889648438, 0.73455810546875, 0.7637100219726562, 0.7928619384765625, 0.8220138549804688, 0.851165771484375, 0.8803176879882812, 0.9094696044921875, 0.9386215209960938, 0.9677734375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 7.0, 1.0, 4.0, 8.0, 10.0, 11.0, 20.0, 43.0, 77.0, 119.0, 128.0, 174.0, 137.0, 108.0, 68.0, 43.0, 14.0, 13.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.634377479553223, -6.473181247711182, -6.311984539031982, -6.150788307189941, -5.9895920753479, -5.828395366668701, -5.66719913482666, -5.506002426147461, -5.34480619430542, -5.183609962463379, -5.02241325378418, -4.861217021942139, -4.700020790100098, -4.538824081420898, -4.377627849578857, -4.216431617736816, -4.055234909057617, -3.894038438796997, -3.732842206954956, -3.571645736694336, -3.410449266433716, -3.2492527961730957, -3.0880565643310547, -2.9268600940704346, -2.7656641006469727, -2.6044676303863525, -2.4432713985443115, -2.2820749282836914, -2.1208784580230713, -1.9596821069717407, -1.7984857559204102, -1.63728928565979, -1.476093053817749, -1.3148967027664185, -1.1537002325057983, -0.9925038814544678, -0.8313074707984924, -0.6701110601425171, -0.5089147090911865, -0.3477182388305664, -0.18652188777923584, -0.025325492024421692, 0.13587090373039246, 0.2970672845840454, 0.45826369524002075, 0.6194601058959961, 0.7806564569473267, 0.9418529272079468, 1.1030492782592773, 1.264245629310608, 1.425442099571228, 1.5866384506225586, 1.7478349208831787, 1.9090312719345093, 2.07022762298584, 2.23142409324646, 2.39262056350708, 2.5538170337677, 2.715013265609741, 2.8762097358703613, 3.0374062061309814, 3.1986026763916016, 3.3597989082336426, 3.5209953784942627, 3.6821916103363037]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 4.0, 3.0, 15.0, 13.0, 15.0, 14.0, 26.0, 24.0, 42.0, 32.0, 37.0, 45.0, 43.0, 69.0, 54.0, 71.0, 71.0, 42.0, 56.0, 45.0, 42.0, 28.0, 33.0, 26.0, 22.0, 27.0, 11.0, 14.0, 18.0, 13.0, 9.0, 8.0, 1.0, 4.0, 7.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.515169620513916, -3.4059362411499023, -3.2967028617858887, -3.187469482421875, -3.0782361030578613, -2.9690027236938477, -2.859769344329834, -2.750535726547241, -2.6413023471832275, -2.532068967819214, -2.4228355884552, -2.3136022090911865, -2.204368829727173, -2.09513521194458, -1.985901951789856, -1.8766684532165527, -1.7674351930618286, -1.658201813697815, -1.5489684343338013, -1.439734935760498, -1.3305015563964844, -1.2212681770324707, -1.112034797668457, -1.0028014183044434, -0.8935679793357849, -0.7843345999717712, -0.6751011610031128, -0.5658677816390991, -0.45663437247276306, -0.347400963306427, -0.23816758394241333, -0.12893414497375488, -0.01970076560974121, 0.08953263610601425, 0.19876603782176971, 0.3079994320869446, 0.41723284125328064, 0.5264662504196167, 0.6356996297836304, 0.7449330687522888, 0.8541664481163025, 0.9633998274803162, 1.0726332664489746, 1.1818666458129883, 1.291100025177002, 1.4003334045410156, 1.5095667839050293, 1.6188002824783325, 1.7280336618423462, 1.8372670412063599, 1.9465004205703735, 2.0557339191436768, 2.1649672985076904, 2.274200677871704, 2.3834340572357178, 2.4926674365997314, 2.601900815963745, 2.711134195327759, 2.8203675746917725, 2.929600954055786, 3.0388343334198, 3.1480679512023926, 3.2573013305664062, 3.36653470993042, 3.4757680892944336]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 6.0, 6.0, 3.0, 9.0, 8.0, 18.0, 27.0, 27.0, 35.0, 59.0, 100.0, 127.0, 200.0, 326.0, 623.0, 1161.0, 2458.0, 5669.0, 15190.0, 46231.0, 178334.0, 521259.0, 198514.0, 50159.0, 16404.0, 6243.0, 2549.0, 1170.0, 628.0, 346.0, 222.0, 144.0, 94.0, 55.0, 50.0, 31.0, 17.0, 17.0, 9.0, 10.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.62939453125, -0.60943603515625, -0.5894775390625, -0.56951904296875, -0.549560546875, -0.52960205078125, -0.5096435546875, -0.48968505859375, -0.4697265625, -0.44976806640625, -0.4298095703125, -0.40985107421875, -0.389892578125, -0.36993408203125, -0.3499755859375, -0.33001708984375, -0.31005859375, -0.29010009765625, -0.2701416015625, -0.25018310546875, -0.230224609375, -0.21026611328125, -0.1903076171875, -0.17034912109375, -0.150390625, -0.13043212890625, -0.1104736328125, -0.09051513671875, -0.070556640625, -0.05059814453125, -0.0306396484375, -0.01068115234375, 0.00927734375, 0.02923583984375, 0.0491943359375, 0.06915283203125, 0.089111328125, 0.10906982421875, 0.1290283203125, 0.14898681640625, 0.1689453125, 0.18890380859375, 0.2088623046875, 0.22882080078125, 0.248779296875, 0.26873779296875, 0.2886962890625, 0.30865478515625, 0.32861328125, 0.34857177734375, 0.3685302734375, 0.38848876953125, 0.408447265625, 0.42840576171875, 0.4483642578125, 0.46832275390625, 0.48828125, 0.50823974609375, 0.5281982421875, 0.54815673828125, 0.568115234375, 0.58807373046875, 0.6080322265625, 0.62799072265625, 0.64794921875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 11.0, 8.0, 12.0, 7.0, 13.0, 18.0, 21.0, 19.0, 23.0, 32.0, 29.0, 40.0, 36.0, 50.0, 54.0, 49.0, 57.0, 56.0, 53.0, 48.0, 47.0, 39.0, 34.0, 35.0, 31.0, 23.0, 33.0, 20.0, 18.0, 13.0, 9.0, 11.0, 10.0, 8.0, 8.0, 6.0, 4.0, 3.0, 2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.360595703125, -0.3497467041015625, -0.338897705078125, -0.3280487060546875, -0.31719970703125, -0.3063507080078125, -0.295501708984375, -0.2846527099609375, -0.2738037109375, -0.2629547119140625, -0.252105712890625, -0.2412567138671875, -0.23040771484375, -0.2195587158203125, -0.208709716796875, -0.1978607177734375, -0.18701171875, -0.1761627197265625, -0.165313720703125, -0.1544647216796875, -0.14361572265625, -0.1327667236328125, -0.121917724609375, -0.1110687255859375, -0.1002197265625, -0.0893707275390625, -0.078521728515625, -0.0676727294921875, -0.05682373046875, -0.0459747314453125, -0.035125732421875, -0.0242767333984375, -0.013427734375, -0.0025787353515625, 0.008270263671875, 0.0191192626953125, 0.02996826171875, 0.0408172607421875, 0.051666259765625, 0.0625152587890625, 0.0733642578125, 0.0842132568359375, 0.095062255859375, 0.1059112548828125, 0.11676025390625, 0.1276092529296875, 0.138458251953125, 0.1493072509765625, 0.16015625, 0.1710052490234375, 0.181854248046875, 0.1927032470703125, 0.20355224609375, 0.2144012451171875, 0.225250244140625, 0.2360992431640625, 0.2469482421875, 0.2577972412109375, 0.268646240234375, 0.2794952392578125, 0.29034423828125, 0.3011932373046875, 0.312042236328125, 0.3228912353515625, 0.333740234375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 11.0, 7.0, 14.0, 25.0, 37.0, 39.0, 45.0, 60.0, 106.0, 149.0, 254.0, 457.0, 890.0, 2121.0, 7033.0, 45478.0, 793056.0, 175403.0, 16816.0, 3639.0, 1355.0, 623.0, 307.0, 196.0, 131.0, 80.0, 58.0, 49.0, 27.0, 17.0, 21.0, 11.0, 10.0, 8.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.095703125, -1.062255859375, -1.02880859375, -0.995361328125, -0.9619140625, -0.928466796875, -0.89501953125, -0.861572265625, -0.828125, -0.794677734375, -0.76123046875, -0.727783203125, -0.6943359375, -0.660888671875, -0.62744140625, -0.593994140625, -0.560546875, -0.527099609375, -0.49365234375, -0.460205078125, -0.4267578125, -0.393310546875, -0.35986328125, -0.326416015625, -0.29296875, -0.259521484375, -0.22607421875, -0.192626953125, -0.1591796875, -0.125732421875, -0.09228515625, -0.058837890625, -0.025390625, 0.008056640625, 0.04150390625, 0.074951171875, 0.1083984375, 0.141845703125, 0.17529296875, 0.208740234375, 0.2421875, 0.275634765625, 0.30908203125, 0.342529296875, 0.3759765625, 0.409423828125, 0.44287109375, 0.476318359375, 0.509765625, 0.543212890625, 0.57666015625, 0.610107421875, 0.6435546875, 0.677001953125, 0.71044921875, 0.743896484375, 0.77734375, 0.810791015625, 0.84423828125, 0.877685546875, 0.9111328125, 0.944580078125, 0.97802734375, 1.011474609375, 1.044921875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 6.0, 18.0, 16.0, 9.0, 13.0, 14.0, 24.0, 23.0, 34.0, 41.0, 53.0, 51.0, 61.0, 72.0, 51.0, 62.0, 63.0, 58.0, 64.0, 47.0, 37.0, 41.0, 29.0, 18.0, 24.0, 17.0, 16.0, 5.0, 10.0, 6.0, 3.0, 6.0, 5.0, 2.0, 0.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.6328125, -1.58795166015625, -1.5430908203125, -1.49822998046875, -1.453369140625, -1.40850830078125, -1.3636474609375, -1.31878662109375, -1.27392578125, -1.22906494140625, -1.1842041015625, -1.13934326171875, -1.094482421875, -1.04962158203125, -1.0047607421875, -0.95989990234375, -0.9150390625, -0.87017822265625, -0.8253173828125, -0.78045654296875, -0.735595703125, -0.69073486328125, -0.6458740234375, -0.60101318359375, -0.55615234375, -0.51129150390625, -0.4664306640625, -0.42156982421875, -0.376708984375, -0.33184814453125, -0.2869873046875, -0.24212646484375, -0.197265625, -0.15240478515625, -0.1075439453125, -0.06268310546875, -0.017822265625, 0.02703857421875, 0.0718994140625, 0.11676025390625, 0.16162109375, 0.20648193359375, 0.2513427734375, 0.29620361328125, 0.341064453125, 0.38592529296875, 0.4307861328125, 0.47564697265625, 0.5205078125, 0.56536865234375, 0.6102294921875, 0.65509033203125, 0.699951171875, 0.74481201171875, 0.7896728515625, 0.83453369140625, 0.87939453125, 0.92425537109375, 0.9691162109375, 1.01397705078125, 1.058837890625, 1.10369873046875, 1.1485595703125, 1.19342041015625, 1.23828125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 6.0, 4.0, 4.0, 9.0, 11.0, 17.0, 18.0, 33.0, 55.0, 72.0, 112.0, 229.0, 461.0, 1114.0, 3344.0, 12552.0, 78107.0, 846347.0, 86864.0, 13455.0, 3537.0, 1155.0, 443.0, 258.0, 135.0, 75.0, 53.0, 28.0, 16.0, 17.0, 8.0, 5.0, 5.0, 4.0, 1.0, 0.0, 4.0, 0.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28271484375, -0.2737464904785156, -0.26477813720703125, -0.2558097839355469, -0.2468414306640625, -0.23787307739257812, -0.22890472412109375, -0.21993637084960938, -0.210968017578125, -0.20199966430664062, -0.19303131103515625, -0.18406295776367188, -0.1750946044921875, -0.16612625122070312, -0.15715789794921875, -0.14818954467773438, -0.13922119140625, -0.13025283813476562, -0.12128448486328125, -0.11231613159179688, -0.1033477783203125, -0.09437942504882812, -0.08541107177734375, -0.07644271850585938, -0.067474365234375, -0.058506011962890625, -0.04953765869140625, -0.040569305419921875, -0.0316009521484375, -0.022632598876953125, -0.01366424560546875, -0.004695892333984375, 0.0042724609375, 0.013240814208984375, 0.02220916748046875, 0.031177520751953125, 0.0401458740234375, 0.049114227294921875, 0.05808258056640625, 0.06705093383789062, 0.076019287109375, 0.08498764038085938, 0.09395599365234375, 0.10292434692382812, 0.1118927001953125, 0.12086105346679688, 0.12982940673828125, 0.13879776000976562, 0.14776611328125, 0.15673446655273438, 0.16570281982421875, 0.17467117309570312, 0.1836395263671875, 0.19260787963867188, 0.20157623291015625, 0.21054458618164062, 0.219512939453125, 0.22848129272460938, 0.23744964599609375, 0.24641799926757812, 0.2553863525390625, 0.2643547058105469, 0.27332305908203125, 0.2822914123535156, 0.291259765625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 8.0, 5.0, 8.0, 13.0, 16.0, 24.0, 32.0, 61.0, 79.0, 121.0, 170.0, 138.0, 93.0, 73.0, 41.0, 31.0, 19.0, 15.0, 10.0, 7.0, 7.0, 4.0, 7.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.848573684692383e-05, -6.609968841075897e-05, -6.371363997459412e-05, -6.132759153842926e-05, -5.8941543102264404e-05, -5.655549466609955e-05, -5.416944622993469e-05, -5.1783397793769836e-05, -4.939734935760498e-05, -4.7011300921440125e-05, -4.462525248527527e-05, -4.223920404911041e-05, -3.985315561294556e-05, -3.74671071767807e-05, -3.5081058740615845e-05, -3.269501030445099e-05, -3.0308961868286133e-05, -2.7922913432121277e-05, -2.553686499595642e-05, -2.3150816559791565e-05, -2.076476812362671e-05, -1.8378719687461853e-05, -1.5992671251296997e-05, -1.3606622815132141e-05, -1.1220574378967285e-05, -8.83452594280243e-06, -6.448477506637573e-06, -4.062429070472717e-06, -1.6763806343078613e-06, 7.096678018569946e-07, 3.0957162380218506e-06, 5.4817646741867065e-06, 7.867813110351562e-06, 1.0253861546516418e-05, 1.2639909982681274e-05, 1.502595841884613e-05, 1.7412006855010986e-05, 1.9798055291175842e-05, 2.2184103727340698e-05, 2.4570152163505554e-05, 2.695620059967041e-05, 2.9342249035835266e-05, 3.172829747200012e-05, 3.411434590816498e-05, 3.6500394344329834e-05, 3.888644278049469e-05, 4.1272491216659546e-05, 4.36585396528244e-05, 4.604458808898926e-05, 4.8430636525154114e-05, 5.081668496131897e-05, 5.3202733397483826e-05, 5.558878183364868e-05, 5.797483026981354e-05, 6.0360878705978394e-05, 6.274692714214325e-05, 6.51329755783081e-05, 6.751902401447296e-05, 6.990507245063782e-05, 7.229112088680267e-05, 7.467716932296753e-05, 7.706321775913239e-05, 7.944926619529724e-05, 8.18353146314621e-05, 8.422136306762695e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 5.0, 5.0, 10.0, 14.0, 17.0, 25.0, 32.0, 55.0, 70.0, 104.0, 148.0, 232.0, 384.0, 680.0, 1298.0, 2859.0, 7290.0, 22387.0, 95104.0, 704307.0, 162077.0, 34038.0, 9980.0, 3733.0, 1579.0, 814.0, 462.0, 305.0, 167.0, 125.0, 80.0, 60.0, 32.0, 27.0, 14.0, 10.0, 6.0, 5.0, 2.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.1875, -0.1819286346435547, -0.17635726928710938, -0.17078590393066406, -0.16521453857421875, -0.15964317321777344, -0.15407180786132812, -0.1485004425048828, -0.1429290771484375, -0.1373577117919922, -0.13178634643554688, -0.12621498107910156, -0.12064361572265625, -0.11507225036621094, -0.10950088500976562, -0.10392951965332031, -0.098358154296875, -0.09278678894042969, -0.08721542358398438, -0.08164405822753906, -0.07607269287109375, -0.07050132751464844, -0.06492996215820312, -0.05935859680175781, -0.0537872314453125, -0.04821586608886719, -0.042644500732421875, -0.03707313537597656, -0.03150177001953125, -0.025930404663085938, -0.020359039306640625, -0.014787673950195312, -0.00921630859375, -0.0036449432373046875, 0.001926422119140625, 0.0074977874755859375, 0.01306915283203125, 0.018640518188476562, 0.024211883544921875, 0.029783248901367188, 0.0353546142578125, 0.04092597961425781, 0.046497344970703125, 0.05206871032714844, 0.05764007568359375, 0.06321144104003906, 0.06878280639648438, 0.07435417175292969, 0.079925537109375, 0.08549690246582031, 0.09106826782226562, 0.09663963317871094, 0.10221099853515625, 0.10778236389160156, 0.11335372924804688, 0.11892509460449219, 0.1244964599609375, 0.1300678253173828, 0.13563919067382812, 0.14121055603027344, 0.14678192138671875, 0.15235328674316406, 0.15792465209960938, 0.1634960174560547, 0.1690673828125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 4.0, 3.0, 6.0, 2.0, 4.0, 5.0, 7.0, 11.0, 10.0, 18.0, 22.0, 25.0, 23.0, 38.0, 50.0, 55.0, 58.0, 69.0, 84.0, 114.0, 74.0, 61.0, 51.0, 52.0, 47.0, 24.0, 21.0, 14.0, 15.0, 8.0, 4.0, 4.0, 5.0, 5.0, 3.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.210205078125, -0.20452880859375, -0.1988525390625, -0.19317626953125, -0.1875, -0.18182373046875, -0.1761474609375, -0.17047119140625, -0.164794921875, -0.15911865234375, -0.1534423828125, -0.14776611328125, -0.14208984375, -0.13641357421875, -0.1307373046875, -0.12506103515625, -0.119384765625, -0.11370849609375, -0.1080322265625, -0.10235595703125, -0.0966796875, -0.09100341796875, -0.0853271484375, -0.07965087890625, -0.073974609375, -0.06829833984375, -0.0626220703125, -0.05694580078125, -0.05126953125, -0.04559326171875, -0.0399169921875, -0.03424072265625, -0.028564453125, -0.02288818359375, -0.0172119140625, -0.01153564453125, -0.005859375, -0.00018310546875, 0.0054931640625, 0.01116943359375, 0.016845703125, 0.02252197265625, 0.0281982421875, 0.03387451171875, 0.03955078125, 0.04522705078125, 0.0509033203125, 0.05657958984375, 0.062255859375, 0.06793212890625, 0.0736083984375, 0.07928466796875, 0.0849609375, 0.09063720703125, 0.0963134765625, 0.10198974609375, 0.107666015625, 0.11334228515625, 0.1190185546875, 0.12469482421875, 0.13037109375, 0.13604736328125, 0.1417236328125, 0.14739990234375, 0.153076171875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 6.0, 16.0, 58.0, 137.0, 449.0, 190.0, 87.0, 24.0, 17.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.33594036102295, -9.02170467376709, -8.707468032836914, -8.393232345581055, -8.078996658325195, -7.7647600173950195, -7.45052433013916, -7.136288166046143, -6.822052001953125, -6.507815837860107, -6.19357967376709, -5.8793439865112305, -5.565107822418213, -5.250871658325195, -4.936635971069336, -4.622399806976318, -4.308163642883301, -3.993927478790283, -3.6796915531158447, -3.3654556274414062, -3.0512194633483887, -2.736983299255371, -2.4227473735809326, -2.108511447906494, -1.7942752838134766, -1.4800392389297485, -1.1658031940460205, -0.8515671491622925, -0.5373311042785645, -0.22309505939483643, 0.0911409854888916, 0.4053769111633301, 0.7196121215820312, 1.0338481664657593, 1.3480842113494873, 1.6623202562332153, 1.9765563011169434, 2.290792465209961, 2.6050283908843994, 2.919264316558838, 3.2335004806518555, 3.547736644744873, 3.8619725704193115, 4.17620849609375, 4.490444660186768, 4.804680824279785, 5.1189165115356445, 5.433152675628662, 5.74738883972168, 6.061625003814697, 6.375861167907715, 6.690096855163574, 7.004333019256592, 7.318569183349609, 7.632804870605469, 7.947041034698486, 8.261277198791504, 8.575512886047363, 8.889749526977539, 9.203985214233398, 9.518220901489258, 9.832457542419434, 10.146693229675293, 10.460929870605469, 10.775165557861328]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 8.0, 5.0, 10.0, 7.0, 4.0, 13.0, 8.0, 12.0, 18.0, 19.0, 24.0, 35.0, 28.0, 34.0, 40.0, 46.0, 83.0, 123.0, 113.0, 65.0, 48.0, 36.0, 37.0, 34.0, 27.0, 19.0, 16.0, 21.0, 14.0, 8.0, 9.0, 9.0, 12.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6928629875183105, -4.5348663330078125, -4.3768696784973145, -4.218873023986816, -4.060876369476318, -3.9028797149658203, -3.7448830604553223, -3.586886405944824, -3.428889751434326, -3.270893096923828, -3.11289644241333, -2.954899787902832, -2.796903133392334, -2.638906478881836, -2.480909824371338, -2.32291316986084, -2.164916515350342, -2.0069198608398438, -1.8489232063293457, -1.6909265518188477, -1.5329298973083496, -1.3749332427978516, -1.2169365882873535, -1.0589399337768555, -0.9009432792663574, -0.7429466247558594, -0.5849499702453613, -0.4269533157348633, -0.26895666122436523, -0.11096000671386719, 0.04703664779663086, 0.2050333023071289, 0.36302947998046875, 0.5210261344909668, 0.6790227890014648, 0.8370194435119629, 0.9950160980224609, 1.153012752532959, 1.311009407043457, 1.469006061553955, 1.6270027160644531, 1.7849993705749512, 1.9429960250854492, 2.1009926795959473, 2.2589893341064453, 2.4169859886169434, 2.5749826431274414, 2.7329792976379395, 2.8909759521484375, 3.0489726066589355, 3.2069692611694336, 3.3649659156799316, 3.5229625701904297, 3.6809592247009277, 3.838955879211426, 3.996952533721924, 4.154949188232422, 4.31294584274292, 4.470942497253418, 4.628939151763916, 4.786935806274414, 4.944932460784912, 5.10292911529541, 5.260925769805908, 5.418922424316406]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 6.0, 7.0, 9.0, 13.0, 12.0, 15.0, 19.0, 33.0, 57.0, 59.0, 86.0, 113.0, 190.0, 274.0, 446.0, 726.0, 1390.0, 2512.0, 5281.0, 13014.0, 42998.0, 228887.0, 1553790.0, 1955626.0, 307049.0, 54023.0, 15376.0, 5953.0, 2695.0, 1418.0, 789.0, 484.0, 303.0, 200.0, 110.0, 90.0, 65.0, 52.0, 30.0, 23.0, 15.0, 12.0, 13.0, 8.0, 5.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.68359375, -0.6629257202148438, -0.6422576904296875, -0.6215896606445312, -0.600921630859375, -0.5802536010742188, -0.5595855712890625, -0.5389175415039062, -0.51824951171875, -0.49758148193359375, -0.4769134521484375, -0.45624542236328125, -0.435577392578125, -0.41490936279296875, -0.3942413330078125, -0.37357330322265625, -0.3529052734375, -0.33223724365234375, -0.3115692138671875, -0.29090118408203125, -0.270233154296875, -0.24956512451171875, -0.2288970947265625, -0.20822906494140625, -0.18756103515625, -0.16689300537109375, -0.1462249755859375, -0.12555694580078125, -0.104888916015625, -0.08422088623046875, -0.0635528564453125, -0.04288482666015625, -0.022216796875, -0.00154876708984375, 0.0191192626953125, 0.03978729248046875, 0.060455322265625, 0.08112335205078125, 0.1017913818359375, 0.12245941162109375, 0.14312744140625, 0.16379547119140625, 0.1844635009765625, 0.20513153076171875, 0.225799560546875, 0.24646759033203125, 0.2671356201171875, 0.28780364990234375, 0.3084716796875, 0.32913970947265625, 0.3498077392578125, 0.37047576904296875, 0.391143798828125, 0.41181182861328125, 0.4324798583984375, 0.45314788818359375, 0.47381591796875, 0.49448394775390625, 0.5151519775390625, 0.5358200073242188, 0.556488037109375, 0.5771560668945312, 0.5978240966796875, 0.6184921264648438, 0.63916015625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 4.0, 7.0, 4.0, 8.0, 5.0, 17.0, 15.0, 15.0, 19.0, 21.0, 32.0, 29.0, 34.0, 45.0, 33.0, 51.0, 52.0, 70.0, 47.0, 53.0, 64.0, 48.0, 42.0, 47.0, 24.0, 31.0, 39.0, 25.0, 18.0, 16.0, 20.0, 19.0, 12.0, 9.0, 8.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.361083984375, -0.3504371643066406, -0.33979034423828125, -0.3291435241699219, -0.3184967041015625, -0.3078498840332031, -0.29720306396484375, -0.2865562438964844, -0.275909423828125, -0.2652626037597656, -0.25461578369140625, -0.24396896362304688, -0.2333221435546875, -0.22267532348632812, -0.21202850341796875, -0.20138168334960938, -0.19073486328125, -0.18008804321289062, -0.16944122314453125, -0.15879440307617188, -0.1481475830078125, -0.13750076293945312, -0.12685394287109375, -0.11620712280273438, -0.105560302734375, -0.09491348266601562, -0.08426666259765625, -0.07361984252929688, -0.0629730224609375, -0.052326202392578125, -0.04167938232421875, -0.031032562255859375, -0.0203857421875, -0.009738922119140625, 0.00090789794921875, 0.011554718017578125, 0.0222015380859375, 0.032848358154296875, 0.04349517822265625, 0.054141998291015625, 0.064788818359375, 0.07543563842773438, 0.08608245849609375, 0.09672927856445312, 0.1073760986328125, 0.11802291870117188, 0.12866973876953125, 0.13931655883789062, 0.14996337890625, 0.16061019897460938, 0.17125701904296875, 0.18190383911132812, 0.1925506591796875, 0.20319747924804688, 0.21384429931640625, 0.22449111938476562, 0.235137939453125, 0.24578475952148438, 0.25643157958984375, 0.2670783996582031, 0.2777252197265625, 0.2883720397949219, 0.29901885986328125, 0.3096656799316406, 0.3203125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 14.0, 18.0, 21.0, 41.0, 71.0, 133.0, 181.0, 395.0, 828.0, 2065.0, 10161.0, 432859.0, 3715514.0, 26458.0, 3404.0, 1051.0, 453.0, 248.0, 160.0, 85.0, 49.0, 25.0, 13.0, 8.0, 8.0, 4.0, 3.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.509765625, -2.4404144287109375, -2.371063232421875, -2.3017120361328125, -2.23236083984375, -2.1630096435546875, -2.093658447265625, -2.0243072509765625, -1.9549560546875, -1.8856048583984375, -1.816253662109375, -1.7469024658203125, -1.67755126953125, -1.6082000732421875, -1.538848876953125, -1.4694976806640625, -1.400146484375, -1.3307952880859375, -1.261444091796875, -1.1920928955078125, -1.12274169921875, -1.0533905029296875, -0.984039306640625, -0.9146881103515625, -0.8453369140625, -0.7759857177734375, -0.706634521484375, -0.6372833251953125, -0.56793212890625, -0.4985809326171875, -0.429229736328125, -0.3598785400390625, -0.29052734375, -0.2211761474609375, -0.151824951171875, -0.0824737548828125, -0.01312255859375, 0.0562286376953125, 0.125579833984375, 0.1949310302734375, 0.2642822265625, 0.3336334228515625, 0.402984619140625, 0.4723358154296875, 0.54168701171875, 0.6110382080078125, 0.680389404296875, 0.7497406005859375, 0.819091796875, 0.8884429931640625, 0.957794189453125, 1.0271453857421875, 1.09649658203125, 1.1658477783203125, 1.235198974609375, 1.3045501708984375, 1.3739013671875, 1.4432525634765625, 1.512603759765625, 1.5819549560546875, 1.65130615234375, 1.7206573486328125, 1.790008544921875, 1.8593597412109375, 1.9287109375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 10.0, 17.0, 21.0, 41.0, 70.0, 106.0, 148.0, 257.0, 393.0, 594.0, 811.0, 603.0, 356.0, 231.0, 159.0, 103.0, 59.0, 34.0, 26.0, 11.0, 15.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0771484375, -1.0347442626953125, -0.992340087890625, -0.9499359130859375, -0.90753173828125, -0.8651275634765625, -0.822723388671875, -0.7803192138671875, -0.7379150390625, -0.6955108642578125, -0.653106689453125, -0.6107025146484375, -0.56829833984375, -0.5258941650390625, -0.483489990234375, -0.4410858154296875, -0.398681640625, -0.3562774658203125, -0.313873291015625, -0.2714691162109375, -0.22906494140625, -0.1866607666015625, -0.144256591796875, -0.1018524169921875, -0.0594482421875, -0.0170440673828125, 0.025360107421875, 0.0677642822265625, 0.11016845703125, 0.1525726318359375, 0.194976806640625, 0.2373809814453125, 0.27978515625, 0.3221893310546875, 0.364593505859375, 0.4069976806640625, 0.44940185546875, 0.4918060302734375, 0.534210205078125, 0.5766143798828125, 0.6190185546875, 0.6614227294921875, 0.703826904296875, 0.7462310791015625, 0.78863525390625, 0.8310394287109375, 0.873443603515625, 0.9158477783203125, 0.958251953125, 1.0006561279296875, 1.043060302734375, 1.0854644775390625, 1.12786865234375, 1.1702728271484375, 1.212677001953125, 1.2550811767578125, 1.2974853515625, 1.3398895263671875, 1.382293701171875, 1.4246978759765625, 1.46710205078125, 1.5095062255859375, 1.551910400390625, 1.5943145751953125, 1.63671875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 11.0, 11.0, 17.0, 19.0, 64.0, 76.0, 154.0, 195.0, 185.0, 109.0, 78.0, 25.0, 17.0, 12.0, 5.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-17.523181915283203, -17.138647079467773, -16.75411033630371, -16.36957550048828, -15.985038757324219, -15.600502967834473, -15.215967178344727, -14.831432342529297, -14.446895599365234, -14.062359809875488, -13.677824020385742, -13.293288230895996, -12.90875244140625, -12.524216651916504, -12.139680862426758, -11.755146026611328, -11.370610237121582, -10.986074447631836, -10.60153865814209, -10.217002868652344, -9.832467079162598, -9.447931289672852, -9.063396453857422, -8.67885971069336, -8.29432487487793, -7.909789085388184, -7.5252532958984375, -7.140717506408691, -6.756181716918945, -6.371645927429199, -5.987110614776611, -5.602574825286865, -5.218038558959961, -4.833502769470215, -4.448966979980469, -4.064431190490723, -3.6798956394195557, -3.2953598499298096, -2.9108242988586426, -2.5262885093688965, -2.1417527198791504, -1.7572169303894043, -1.3726812601089478, -0.9881455898284912, -0.6036098003387451, -0.21907401084899902, 0.16546154022216797, 0.5499973297119141, 0.9345331192016602, 1.3190689086914062, 1.7036045789718628, 2.0881402492523193, 2.4726760387420654, 2.8572118282318115, 3.2417473793029785, 3.6262831687927246, 4.010818958282471, 4.395354747772217, 4.779890537261963, 5.164425849914551, 5.548961639404297, 5.933497428894043, 6.318033218383789, 6.702569007873535, 7.087104797363281]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 1.0, 4.0, 3.0, 2.0, 6.0, 9.0, 5.0, 6.0, 9.0, 7.0, 15.0, 18.0, 18.0, 20.0, 25.0, 22.0, 29.0, 26.0, 38.0, 33.0, 34.0, 46.0, 54.0, 43.0, 42.0, 43.0, 38.0, 40.0, 36.0, 35.0, 39.0, 33.0, 33.0, 19.0, 24.0, 19.0, 14.0, 21.0, 18.0, 14.0, 17.0, 13.0, 8.0, 8.0, 6.0, 6.0, 2.0, 8.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-4.805377960205078, -4.670705318450928, -4.536032676696777, -4.401359558105469, -4.266686916351318, -4.132014274597168, -3.9973413944244385, -3.862668514251709, -3.7279958724975586, -3.593323230743408, -3.4586503505706787, -3.323977470397949, -3.189304828643799, -3.0546321868896484, -2.919959306716919, -2.7852864265441895, -2.650613784790039, -2.5159411430358887, -2.381268262863159, -2.2465953826904297, -2.1119227409362793, -1.9772499799728394, -1.8425772190093994, -1.7079044580459595, -1.5732316970825195, -1.4385589361190796, -1.3038861751556396, -1.1692134141921997, -1.0345406532287598, -0.8998678922653198, -0.7651951313018799, -0.6305223703384399, -0.4958491325378418, -0.36117637157440186, -0.22650361061096191, -0.09183084964752197, 0.04284191131591797, 0.1775146722793579, 0.31218743324279785, 0.4468601942062378, 0.5815329551696777, 0.7162057161331177, 0.8508784770965576, 0.9855512380599976, 1.1202239990234375, 1.2548967599868774, 1.3895695209503174, 1.5242422819137573, 1.6589150428771973, 1.7935878038406372, 1.9282605648040771, 2.0629334449768066, 2.197606086730957, 2.3322787284851074, 2.466951608657837, 2.6016244888305664, 2.736297130584717, 2.870969772338867, 3.0056426525115967, 3.140315532684326, 3.2749881744384766, 3.409660816192627, 3.5443336963653564, 3.679006576538086, 3.8136792182922363]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 0.0, 8.0, 10.0, 19.0, 36.0, 51.0, 80.0, 147.0, 297.0, 537.0, 1161.0, 2567.0, 6037.0, 16975.0, 59442.0, 364863.0, 493344.0, 71066.0, 19711.0, 6771.0, 2860.0, 1272.0, 630.0, 288.0, 172.0, 90.0, 54.0, 31.0, 18.0, 5.0, 6.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57470703125, -0.554931640625, -0.53515625, -0.515380859375, -0.49560546875, -0.475830078125, -0.4560546875, -0.436279296875, -0.41650390625, -0.396728515625, -0.376953125, -0.357177734375, -0.33740234375, -0.317626953125, -0.2978515625, -0.278076171875, -0.25830078125, -0.238525390625, -0.21875, -0.198974609375, -0.17919921875, -0.159423828125, -0.1396484375, -0.119873046875, -0.10009765625, -0.080322265625, -0.060546875, -0.040771484375, -0.02099609375, -0.001220703125, 0.0185546875, 0.038330078125, 0.05810546875, 0.077880859375, 0.09765625, 0.117431640625, 0.13720703125, 0.156982421875, 0.1767578125, 0.196533203125, 0.21630859375, 0.236083984375, 0.255859375, 0.275634765625, 0.29541015625, 0.315185546875, 0.3349609375, 0.354736328125, 0.37451171875, 0.394287109375, 0.4140625, 0.433837890625, 0.45361328125, 0.473388671875, 0.4931640625, 0.512939453125, 0.53271484375, 0.552490234375, 0.572265625, 0.592041015625, 0.61181640625, 0.631591796875, 0.6513671875, 0.671142578125, 0.69091796875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 2.0, 7.0, 4.0, 2.0, 6.0, 7.0, 12.0, 16.0, 14.0, 16.0, 19.0, 18.0, 25.0, 28.0, 25.0, 29.0, 45.0, 45.0, 50.0, 41.0, 41.0, 60.0, 36.0, 47.0, 48.0, 46.0, 38.0, 47.0, 32.0, 27.0, 21.0, 31.0, 20.0, 19.0, 18.0, 13.0, 16.0, 5.0, 6.0, 4.0, 6.0, 2.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.348388671875, -0.3374366760253906, -0.32648468017578125, -0.3155326843261719, -0.3045806884765625, -0.2936286926269531, -0.28267669677734375, -0.2717247009277344, -0.260772705078125, -0.24982070922851562, -0.23886871337890625, -0.22791671752929688, -0.2169647216796875, -0.20601272583007812, -0.19506072998046875, -0.18410873413085938, -0.17315673828125, -0.16220474243164062, -0.15125274658203125, -0.14030075073242188, -0.1293487548828125, -0.11839675903320312, -0.10744476318359375, -0.09649276733398438, -0.085540771484375, -0.07458877563476562, -0.06363677978515625, -0.052684783935546875, -0.0417327880859375, -0.030780792236328125, -0.01982879638671875, -0.008876800537109375, 0.0020751953125, 0.013027191162109375, 0.02397918701171875, 0.034931182861328125, 0.0458831787109375, 0.056835174560546875, 0.06778717041015625, 0.07873916625976562, 0.089691162109375, 0.10064315795898438, 0.11159515380859375, 0.12254714965820312, 0.1334991455078125, 0.14445114135742188, 0.15540313720703125, 0.16635513305664062, 0.17730712890625, 0.18825912475585938, 0.19921112060546875, 0.21016311645507812, 0.2211151123046875, 0.23206710815429688, 0.24301910400390625, 0.2539710998535156, 0.264923095703125, 0.2758750915527344, 0.28682708740234375, 0.2977790832519531, 0.3087310791015625, 0.3196830749511719, 0.33063507080078125, 0.3415870666503906, 0.3525390625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 9.0, 8.0, 17.0, 16.0, 21.0, 27.0, 52.0, 87.0, 121.0, 226.0, 398.0, 823.0, 2350.0, 10956.0, 154144.0, 853276.0, 20296.0, 3444.0, 1080.0, 506.0, 267.0, 133.0, 92.0, 55.0, 38.0, 29.0, 18.0, 15.0, 16.0, 9.0, 3.0, 7.0, 6.0, 1.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.064453125, -1.0302734375, -0.99609375, -0.9619140625, -0.927734375, -0.8935546875, -0.859375, -0.8251953125, -0.791015625, -0.7568359375, -0.72265625, -0.6884765625, -0.654296875, -0.6201171875, -0.5859375, -0.5517578125, -0.517578125, -0.4833984375, -0.44921875, -0.4150390625, -0.380859375, -0.3466796875, -0.3125, -0.2783203125, -0.244140625, -0.2099609375, -0.17578125, -0.1416015625, -0.107421875, -0.0732421875, -0.0390625, -0.0048828125, 0.029296875, 0.0634765625, 0.09765625, 0.1318359375, 0.166015625, 0.2001953125, 0.234375, 0.2685546875, 0.302734375, 0.3369140625, 0.37109375, 0.4052734375, 0.439453125, 0.4736328125, 0.5078125, 0.5419921875, 0.576171875, 0.6103515625, 0.64453125, 0.6787109375, 0.712890625, 0.7470703125, 0.78125, 0.8154296875, 0.849609375, 0.8837890625, 0.91796875, 0.9521484375, 0.986328125, 1.0205078125, 1.0546875, 1.0888671875, 1.123046875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 4.0, 2.0, 6.0, 8.0, 7.0, 16.0, 25.0, 16.0, 21.0, 31.0, 27.0, 43.0, 57.0, 49.0, 88.0, 80.0, 89.0, 81.0, 71.0, 37.0, 48.0, 36.0, 29.0, 24.0, 25.0, 16.0, 16.0, 12.0, 11.0, 4.0, 5.0, 7.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6982421875, -1.641754150390625, -1.58526611328125, -1.528778076171875, -1.4722900390625, -1.415802001953125, -1.35931396484375, -1.302825927734375, -1.246337890625, -1.189849853515625, -1.13336181640625, -1.076873779296875, -1.0203857421875, -0.963897705078125, -0.90740966796875, -0.850921630859375, -0.79443359375, -0.737945556640625, -0.68145751953125, -0.624969482421875, -0.5684814453125, -0.511993408203125, -0.45550537109375, -0.399017333984375, -0.342529296875, -0.286041259765625, -0.22955322265625, -0.173065185546875, -0.1165771484375, -0.060089111328125, -0.00360107421875, 0.052886962890625, 0.109375, 0.165863037109375, 0.22235107421875, 0.278839111328125, 0.3353271484375, 0.391815185546875, 0.44830322265625, 0.504791259765625, 0.561279296875, 0.617767333984375, 0.67425537109375, 0.730743408203125, 0.7872314453125, 0.843719482421875, 0.90020751953125, 0.956695556640625, 1.01318359375, 1.069671630859375, 1.12615966796875, 1.182647705078125, 1.2391357421875, 1.295623779296875, 1.35211181640625, 1.408599853515625, 1.465087890625, 1.521575927734375, 1.57806396484375, 1.634552001953125, 1.6910400390625, 1.747528076171875, 1.80401611328125, 1.860504150390625, 1.9169921875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 1.0, 5.0, 6.0, 9.0, 12.0, 15.0, 22.0, 39.0, 51.0, 62.0, 97.0, 162.0, 230.0, 438.0, 765.0, 1709.0, 4167.0, 12006.0, 43333.0, 702671.0, 226536.0, 38117.0, 10838.0, 3844.0, 1567.0, 755.0, 409.0, 199.0, 148.0, 89.0, 73.0, 48.0, 39.0, 31.0, 21.0, 12.0, 13.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1072998046875, -0.1039419174194336, -0.10058403015136719, -0.09722614288330078, -0.09386825561523438, -0.09051036834716797, -0.08715248107910156, -0.08379459381103516, -0.08043670654296875, -0.07707881927490234, -0.07372093200683594, -0.07036304473876953, -0.06700515747070312, -0.06364727020263672, -0.06028938293457031, -0.056931495666503906, -0.0535736083984375, -0.050215721130371094, -0.04685783386230469, -0.04349994659423828, -0.040142059326171875, -0.03678417205810547, -0.03342628479003906, -0.030068397521972656, -0.02671051025390625, -0.023352622985839844, -0.019994735717773438, -0.01663684844970703, -0.013278961181640625, -0.009921073913574219, -0.0065631866455078125, -0.0032052993774414062, 0.000152587890625, 0.0035104751586914062, 0.0068683624267578125, 0.010226249694824219, 0.013584136962890625, 0.01694202423095703, 0.020299911499023438, 0.023657798767089844, 0.02701568603515625, 0.030373573303222656, 0.03373146057128906, 0.03708934783935547, 0.040447235107421875, 0.04380512237548828, 0.04716300964355469, 0.050520896911621094, 0.0538787841796875, 0.057236671447753906, 0.06059455871582031, 0.06395244598388672, 0.06731033325195312, 0.07066822052001953, 0.07402610778808594, 0.07738399505615234, 0.08074188232421875, 0.08409976959228516, 0.08745765686035156, 0.09081554412841797, 0.09417343139648438, 0.09753131866455078, 0.10088920593261719, 0.1042470932006836, 0.10760498046875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 8.0, 6.0, 7.0, 7.0, 4.0, 9.0, 5.0, 9.0, 16.0, 23.0, 17.0, 34.0, 22.0, 31.0, 51.0, 55.0, 62.0, 67.0, 77.0, 76.0, 72.0, 59.0, 39.0, 41.0, 40.0, 31.0, 21.0, 18.0, 19.0, 11.0, 6.0, 11.0, 7.0, 7.0, 4.0, 5.0, 1.0, 7.0, 2.0, 3.0, 4.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.421306610107422e-05, -3.3200718462467194e-05, -3.218837082386017e-05, -3.117602318525314e-05, -3.0163675546646118e-05, -2.9151327908039093e-05, -2.8138980269432068e-05, -2.7126632630825043e-05, -2.6114284992218018e-05, -2.5101937353610992e-05, -2.4089589715003967e-05, -2.3077242076396942e-05, -2.2064894437789917e-05, -2.1052546799182892e-05, -2.0040199160575867e-05, -1.902785152196884e-05, -1.8015503883361816e-05, -1.700315624475479e-05, -1.5990808606147766e-05, -1.4978460967540741e-05, -1.3966113328933716e-05, -1.295376569032669e-05, -1.1941418051719666e-05, -1.092907041311264e-05, -9.916722774505615e-06, -8.90437513589859e-06, -7.892027497291565e-06, -6.87967985868454e-06, -5.867332220077515e-06, -4.8549845814704895e-06, -3.842636942863464e-06, -2.830289304256439e-06, -1.817941665649414e-06, -8.055940270423889e-07, 2.0675361156463623e-07, 1.2191012501716614e-06, 2.2314488887786865e-06, 3.2437965273857117e-06, 4.256144165992737e-06, 5.268491804599762e-06, 6.280839443206787e-06, 7.293187081813812e-06, 8.305534720420837e-06, 9.317882359027863e-06, 1.0330229997634888e-05, 1.1342577636241913e-05, 1.2354925274848938e-05, 1.3367272913455963e-05, 1.4379620552062988e-05, 1.5391968190670013e-05, 1.640431582927704e-05, 1.7416663467884064e-05, 1.842901110649109e-05, 1.9441358745098114e-05, 2.045370638370514e-05, 2.1466054022312164e-05, 2.247840166091919e-05, 2.3490749299526215e-05, 2.450309693813324e-05, 2.5515444576740265e-05, 2.652779221534729e-05, 2.7540139853954315e-05, 2.855248749256134e-05, 2.9564835131168365e-05, 3.057718276977539e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 8.0, 11.0, 14.0, 18.0, 30.0, 30.0, 54.0, 75.0, 150.0, 245.0, 442.0, 860.0, 1843.0, 4328.0, 11672.0, 43537.0, 717049.0, 215749.0, 35312.0, 10027.0, 3671.0, 1681.0, 807.0, 402.0, 236.0, 109.0, 81.0, 39.0, 24.0, 14.0, 16.0, 3.0, 6.0, 6.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1278076171875, -0.12425041198730469, -0.12069320678710938, -0.11713600158691406, -0.11357879638671875, -0.11002159118652344, -0.10646438598632812, -0.10290718078613281, -0.0993499755859375, -0.09579277038574219, -0.09223556518554688, -0.08867835998535156, -0.08512115478515625, -0.08156394958496094, -0.07800674438476562, -0.07444953918457031, -0.070892333984375, -0.06733512878417969, -0.06377792358398438, -0.06022071838378906, -0.05666351318359375, -0.05310630798339844, -0.049549102783203125, -0.04599189758300781, -0.0424346923828125, -0.03887748718261719, -0.035320281982421875, -0.03176307678222656, -0.02820587158203125, -0.024648666381835938, -0.021091461181640625, -0.017534255981445312, -0.01397705078125, -0.010419845581054688, -0.006862640380859375, -0.0033054351806640625, 0.00025177001953125, 0.0038089752197265625, 0.007366180419921875, 0.010923385620117188, 0.0144805908203125, 0.018037796020507812, 0.021595001220703125, 0.025152206420898438, 0.02870941162109375, 0.03226661682128906, 0.035823822021484375, 0.03938102722167969, 0.042938232421875, 0.04649543762207031, 0.050052642822265625, 0.05360984802246094, 0.05716705322265625, 0.06072425842285156, 0.06428146362304688, 0.06783866882324219, 0.0713958740234375, 0.07495307922363281, 0.07851028442382812, 0.08206748962402344, 0.08562469482421875, 0.08918190002441406, 0.09273910522460938, 0.09629631042480469, 0.099853515625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 6.0, 6.0, 9.0, 11.0, 10.0, 10.0, 8.0, 12.0, 15.0, 19.0, 31.0, 36.0, 40.0, 44.0, 49.0, 58.0, 69.0, 66.0, 66.0, 53.0, 77.0, 39.0, 30.0, 47.0, 35.0, 28.0, 19.0, 16.0, 20.0, 12.0, 8.0, 8.0, 8.0, 11.0, 3.0, 2.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10443115234375, -0.10093975067138672, -0.09744834899902344, -0.09395694732666016, -0.09046554565429688, -0.0869741439819336, -0.08348274230957031, -0.07999134063720703, -0.07649993896484375, -0.07300853729248047, -0.06951713562011719, -0.0660257339477539, -0.06253433227539062, -0.059042930603027344, -0.05555152893066406, -0.05206012725830078, -0.0485687255859375, -0.04507732391357422, -0.04158592224121094, -0.038094520568847656, -0.034603118896484375, -0.031111717224121094, -0.027620315551757812, -0.02412891387939453, -0.02063751220703125, -0.01714611053466797, -0.013654708862304688, -0.010163307189941406, -0.006671905517578125, -0.0031805038452148438, 0.0003108978271484375, 0.0038022994995117188, 0.007293701171875, 0.010785102844238281, 0.014276504516601562, 0.017767906188964844, 0.021259307861328125, 0.024750709533691406, 0.028242111206054688, 0.03173351287841797, 0.03522491455078125, 0.03871631622314453, 0.04220771789550781, 0.045699119567871094, 0.049190521240234375, 0.052681922912597656, 0.05617332458496094, 0.05966472625732422, 0.0631561279296875, 0.06664752960205078, 0.07013893127441406, 0.07363033294677734, 0.07712173461914062, 0.0806131362915039, 0.08410453796386719, 0.08759593963623047, 0.09108734130859375, 0.09457874298095703, 0.09807014465332031, 0.1015615463256836, 0.10505294799804688, 0.10854434967041016, 0.11203575134277344, 0.11552715301513672, 0.1190185546875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 5.0, 9.0, 8.0, 16.0, 21.0, 38.0, 36.0, 53.0, 159.0, 362.0, 111.0, 59.0, 44.0, 18.0, 19.0, 7.0, 13.0, 9.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.605627059936523, -5.470422744750977, -5.3352179527282715, -5.200013637542725, -5.064809322357178, -4.929604530334473, -4.794400215148926, -4.659195899963379, -4.523991584777832, -4.388787269592285, -4.25358247756958, -4.118378162384033, -3.9831738471984863, -3.8479692935943604, -3.7127647399902344, -3.5775604248046875, -3.4423556327819824, -3.3071510791778564, -3.1719467639923096, -3.0367422103881836, -2.9015378952026367, -2.7663333415985107, -2.6311287879943848, -2.495924472808838, -2.360719919204712, -2.225515365600586, -2.090311050415039, -1.955106496810913, -1.8199020624160767, -1.6846976280212402, -1.5494930744171143, -1.4142886400222778, -1.2790842056274414, -1.143879771232605, -1.0086753368377686, -0.8734707832336426, -0.7382663488388062, -0.6030619144439697, -0.4678574204444885, -0.3326529264450073, -0.1974484920501709, -0.062244027853012085, 0.07296043634414673, 0.20816490054130554, 0.34336936473846436, 0.4785737991333008, 0.613778293132782, 0.7489827871322632, 0.8841872215270996, 1.019391655921936, 1.1545960903167725, 1.2898006439208984, 1.4250050783157349, 1.5602095127105713, 1.6954140663146973, 1.8306185007095337, 1.9658229351043701, 2.101027488708496, 2.236231803894043, 2.371436357498169, 2.506640911102295, 2.641845226287842, 2.7770497798919678, 2.9122543334960938, 3.0474586486816406]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 2.0, 4.0, 6.0, 6.0, 5.0, 6.0, 8.0, 9.0, 9.0, 7.0, 13.0, 17.0, 17.0, 16.0, 22.0, 29.0, 21.0, 69.0, 96.0, 149.0, 131.0, 73.0, 36.0, 29.0, 21.0, 22.0, 17.0, 13.0, 16.0, 13.0, 9.0, 20.0, 19.0, 10.0, 8.0, 13.0, 7.0, 3.0, 3.0, 3.0, 4.0, 0.0, 3.0, 1.0, 6.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-3.3909287452697754, -3.29034161567688, -3.1897542476654053, -3.0891671180725098, -2.988579750061035, -2.8879926204681396, -2.787405490875244, -2.6868181228637695, -2.586230754852295, -2.4856436252593994, -2.385056257247925, -2.2844691276550293, -2.1838817596435547, -2.083294630050659, -1.9827073812484741, -1.882120132446289, -1.7815330028533936, -1.6809457540512085, -1.5803585052490234, -1.479771375656128, -1.3791840076446533, -1.2785968780517578, -1.1780096292495728, -1.0774223804473877, -0.9768351316452026, -0.8762478828430176, -0.7756606340408325, -0.6750734448432922, -0.5744861960411072, -0.4738989472389221, -0.37331175804138184, -0.2727245092391968, -0.17213749885559082, -0.07155026495456696, 0.02903696894645691, 0.12962418794631958, 0.23021143674850464, 0.3307986855506897, 0.43138587474823, 0.531973123550415, 0.6325603723526001, 0.7331476211547852, 0.8337348699569702, 0.9343220591545105, 1.0349092483520508, 1.1354966163635254, 1.236083745956421, 1.336670994758606, 1.437258243560791, 1.537845492362976, 1.6384327411651611, 1.7390198707580566, 1.8396072387695312, 1.9401943683624268, 2.0407814979553223, 2.141368865966797, 2.2419562339782715, 2.342543363571167, 2.4431307315826416, 2.543717861175537, 2.6443052291870117, 2.7448923587799072, 2.8454794883728027, 2.9460668563842773, 3.046653985977173]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 7.0, 7.0, 8.0, 18.0, 8.0, 14.0, 18.0, 12.0, 19.0, 28.0, 37.0, 32.0, 49.0, 115.0, 273.0, 77.0, 40.0, 27.0, 48.0, 27.0, 33.0, 21.0, 14.0, 21.0, 13.0, 6.0, 8.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0], "bins": [-0.54833984375, -0.5350837707519531, -0.5218276977539062, -0.5085716247558594, -0.4953155517578125, -0.4820594787597656, -0.46880340576171875, -0.4555473327636719, -0.442291259765625, -0.4290351867675781, -0.41577911376953125, -0.4025230407714844, -0.3892669677734375, -0.3760108947753906, -0.36275482177734375, -0.3494987487792969, -0.33624267578125, -0.3229866027832031, -0.30973052978515625, -0.2964744567871094, -0.2832183837890625, -0.2699623107910156, -0.25670623779296875, -0.24345016479492188, -0.230194091796875, -0.21693801879882812, -0.20368194580078125, -0.19042587280273438, -0.1771697998046875, -0.16391372680664062, -0.15065765380859375, -0.13740158081054688, -0.1241455078125, -0.11088943481445312, -0.09763336181640625, -0.08437728881835938, -0.0711212158203125, -0.057865142822265625, -0.04460906982421875, -0.031352996826171875, -0.018096923828125, -0.004840850830078125, 0.00841522216796875, 0.021671295166015625, 0.0349273681640625, 0.048183441162109375, 0.06143951416015625, 0.07469558715820312, 0.08795166015625, 0.10120773315429688, 0.11446380615234375, 0.12771987915039062, 0.1409759521484375, 0.15423202514648438, 0.16748809814453125, 0.18074417114257812, 0.194000244140625, 0.20725631713867188, 0.22051239013671875, 0.23376846313476562, 0.2470245361328125, 0.2602806091308594, 0.27353668212890625, 0.2867927551269531, 0.300048828125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 1.0, 3.0, 8.0, 16.0, 20.0, 41.0, 56.0, 92.0, 177.0, 441.0, 1321.0, 5529.0, 866694.0, 7505983.0, 5927.0, 1350.0, 440.0, 207.0, 86.0, 65.0, 26.0, 29.0, 13.0, 10.0, 8.0, 6.0, 2.0, 10.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5667355060577393, -3.4347140789031982, -3.3026926517486572, -3.170671224594116, -3.038649797439575, -2.906628370285034, -2.774606704711914, -2.642585277557373, -2.510563850402832, -2.378542423248291, -2.24652099609375, -2.114499568939209, -1.982478141784668, -1.850456714630127, -1.7184351682662964, -1.5864137411117554, -1.454392433166504, -1.322371006011963, -1.1903495788574219, -1.0583281517028809, -0.9263066649436951, -0.794285237789154, -0.6622637510299683, -0.5302423238754272, -0.39822089672088623, -0.2661994695663452, -0.1341780126094818, -0.002156555652618408, 0.1298648715019226, 0.2618862986564636, 0.3939077854156494, 0.5259292125701904, 0.6579508781433105, 0.7899723052978516, 0.9219937324523926, 1.0540151596069336, 1.1860365867614746, 1.3180580139160156, 1.4500795602798462, 1.5821009874343872, 1.7141224145889282, 1.8461438417434692, 1.9781652688980103, 2.110186815261841, 2.242208242416382, 2.374229669570923, 2.506251096725464, 2.638272523880005, 2.770293951034546, 2.902315378189087, 3.034336805343628, 3.166358232498169, 3.29837965965271, 3.430401086807251, 3.562422752380371, 3.694444179534912, 3.826465606689453, 3.958487033843994, 4.090508460998535, 4.222529888153076, 4.354551315307617, 4.486572742462158, 4.618594169616699, 4.75061559677124, 4.882637023925781]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 3.0, 2.0, 2.0, 5.0, 4.0, 3.0, 6.0, 8.0, 1.0, 4.0, 4.0, 6.0, 2.0, 4.0, 3.0, 0.0, 1.0, 4.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.254535675048828, -6.101930141448975, -5.949324607849121, -5.796719074249268, -5.644113540649414, -5.4915080070495605, -5.338902473449707, -5.186296463012695, -5.03369140625, -4.8810858726501465, -4.728480339050293, -4.5758748054504395, -4.423269271850586, -4.270663738250732, -4.118058204650879, -3.9654524326324463, -3.8128466606140137, -3.66024112701416, -3.5076355934143066, -3.355030059814453, -3.2024245262145996, -3.049818992614746, -2.8972132205963135, -2.74460768699646, -2.5920021533966064, -2.439396619796753, -2.2867910861968994, -2.134185552597046, -1.9815798997879028, -1.8289743661880493, -1.6763687133789062, -1.5237631797790527, -1.3711574077606201, -1.2185518741607666, -1.065946340560913, -0.91334068775177, -0.7607351541519165, -0.608129620552063, -0.4555240273475647, -0.3029184341430664, -0.1503129005432129, 0.0022926628589630127, 0.15489822626113892, 0.3075037896633148, 0.4601093530654907, 0.6127148866653442, 0.7653204798698425, 0.9179260730743408, 1.0705316066741943, 1.2231371402740479, 1.3757426738739014, 1.5283483266830444, 1.680953860282898, 1.8335593938827515, 1.9861650466918945, 2.138770580291748, 2.2913761138916016, 2.443981647491455, 2.5965871810913086, 2.749192714691162, 2.9017982482910156, 3.054403781890869, 3.2070095539093018, 3.3596150875091553, 3.512220621109009]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 2.0, 5.0, 4.0, 8.0, 8.0, 14.0, 24.0, 26.0, 45.0, 61.0, 99.0, 195.0, 307.0, 632.0, 1639.0, 4396.0, 13835.0, 49652.0, 173273.0, 196354.0, 58942.0, 16432.0, 5009.0, 1812.0, 655.0, 358.0, 167.0, 102.0, 65.0, 38.0, 27.0, 26.0, 9.0, 16.0, 10.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.046875, -2.934326171875, -2.82177734375, -2.709228515625, -2.5966796875, -2.484130859375, -2.37158203125, -2.259033203125, -2.146484375, -2.033935546875, -1.92138671875, -1.808837890625, -1.6962890625, -1.583740234375, -1.47119140625, -1.358642578125, -1.24609375, -1.133544921875, -1.02099609375, -0.908447265625, -0.7958984375, -0.683349609375, -0.57080078125, -0.458251953125, -0.345703125, -0.233154296875, -0.12060546875, -0.008056640625, 0.1044921875, 0.217041015625, 0.32958984375, 0.442138671875, 0.5546875, 0.667236328125, 0.77978515625, 0.892333984375, 1.0048828125, 1.117431640625, 1.22998046875, 1.342529296875, 1.455078125, 1.567626953125, 1.68017578125, 1.792724609375, 1.9052734375, 2.017822265625, 2.13037109375, 2.242919921875, 2.35546875, 2.468017578125, 2.58056640625, 2.693115234375, 2.8056640625, 2.918212890625, 3.03076171875, 3.143310546875, 3.255859375, 3.368408203125, 3.48095703125, 3.593505859375, 3.7060546875, 3.818603515625, 3.93115234375, 4.043701171875, 4.15625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 6.0, 4.0, 3.0, 3.0, 5.0, 6.0, 7.0, 7.0, 9.0, 14.0, 20.0, 21.0, 23.0, 28.0, 32.0, 37.0, 47.0, 37.0, 50.0, 50.0, 50.0, 48.0, 47.0, 54.0, 58.0, 53.0, 42.0, 41.0, 37.0, 28.0, 27.0, 22.0, 12.0, 17.0, 7.0, 6.0, 13.0, 8.0, 4.0, 7.0, 7.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.382080078125, -0.3705406188964844, -0.35900115966796875, -0.3474617004394531, -0.3359222412109375, -0.3243827819824219, -0.31284332275390625, -0.3013038635253906, -0.289764404296875, -0.2782249450683594, -0.26668548583984375, -0.2551460266113281, -0.2436065673828125, -0.23206710815429688, -0.22052764892578125, -0.20898818969726562, -0.19744873046875, -0.18590927124023438, -0.17436981201171875, -0.16283035278320312, -0.1512908935546875, -0.13975143432617188, -0.12821197509765625, -0.11667251586914062, -0.105133056640625, -0.09359359741210938, -0.08205413818359375, -0.07051467895507812, -0.0589752197265625, -0.047435760498046875, -0.03589630126953125, -0.024356842041015625, -0.0128173828125, -0.001277923583984375, 0.01026153564453125, 0.021800994873046875, 0.0333404541015625, 0.044879913330078125, 0.05641937255859375, 0.06795883178710938, 0.079498291015625, 0.09103775024414062, 0.10257720947265625, 0.11411666870117188, 0.1256561279296875, 0.13719558715820312, 0.14873504638671875, 0.16027450561523438, 0.17181396484375, 0.18335342407226562, 0.19489288330078125, 0.20643234252929688, 0.2179718017578125, 0.22951126098632812, 0.24105072021484375, 0.2525901794433594, 0.264129638671875, 0.2756690979003906, 0.28720855712890625, 0.2987480163574219, 0.3102874755859375, 0.3218269348144531, 0.33336639404296875, 0.3449058532714844, 0.3564453125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 6.0, 5.0, 10.0, 10.0, 49.0, 92.0, 130.0, 95.0, 38.0, 19.0, 15.0, 9.0, 1.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.571662902832031, -5.4195451736450195, -5.267427921295166, -5.115310192108154, -4.963192939758301, -4.811075210571289, -4.658957481384277, -4.506840229034424, -4.354722499847412, -4.2026047706604, -4.050487518310547, -3.898369789123535, -3.7462522983551025, -3.59413480758667, -3.4420173168182373, -3.2898998260498047, -3.137782335281372, -2.9856648445129395, -2.833547353744507, -2.681429862976074, -2.5293121337890625, -2.37719464302063, -2.2250771522521973, -2.0729594230651855, -1.9208420515060425, -1.7687245607376099, -1.6166069507598877, -1.464489459991455, -1.3123719692230225, -1.1602543592453003, -1.0081368684768677, -0.8560192584991455, -0.7039017677307129, -0.5517842173576355, -0.3996666967868805, -0.2475491762161255, -0.0954316258430481, 0.0566859245300293, 0.20880341529846191, 0.3609210252761841, 0.5130385160446167, 0.6651560664176941, 0.8172736167907715, 0.9693911075592041, 1.1215085983276367, 1.2736262083053589, 1.4257436990737915, 1.5778613090515137, 1.7299787998199463, 1.882096290588379, 2.0342137813568115, 2.186331272125244, 2.338449001312256, 2.4905664920806885, 2.642683982849121, 2.794801712036133, 2.9469189643859863, 3.099036455154419, 3.2511539459228516, 3.4032716751098633, 3.555389165878296, 3.7075066566467285, 3.859624147415161, 4.011741638183594, 4.1638593673706055]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 5.0, 5.0, 9.0, 4.0, 2.0, 9.0, 21.0, 44.0, 77.0, 62.0, 71.0, 56.0, 43.0, 21.0, 11.0, 3.0, 5.0, 8.0, 5.0, 1.0, 7.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.3398184776306152, -2.2768895626068115, -2.213960647583008, -2.151031494140625, -2.0881025791168213, -2.0251736640930176, -1.9622447490692139, -1.8993158340454102, -1.8363869190216064, -1.7734580039978027, -1.7105289697647095, -1.6476000547409058, -1.584671139717102, -1.5217421054840088, -1.458813190460205, -1.3958842754364014, -1.332955241203308, -1.2700263261795044, -1.2070972919464111, -1.1441683769226074, -1.0812394618988037, -1.018310546875, -0.9553815126419067, -0.892452597618103, -0.8295236229896545, -0.766594648361206, -0.7036657333374023, -0.6407367587089539, -0.5778077840805054, -0.5148788690567017, -0.4519498944282532, -0.3890209496021271, -0.3260918855667114, -0.2631629407405853, -0.20023398101329803, -0.13730502128601074, -0.07437607645988464, -0.011447131633758545, 0.05148184299468994, 0.11441078782081604, 0.17733973264694214, 0.24026867747306824, 0.30319762229919434, 0.3661265969276428, 0.4290555417537689, 0.491984486579895, 0.5549134612083435, 0.617842435836792, 0.6807713508605957, 0.7437003254890442, 0.8066292405128479, 0.8695582151412964, 0.9324871301651001, 0.9954161047935486, 1.058345079421997, 1.1212739944458008, 1.1842029094696045, 1.2471318244934082, 1.3100608587265015, 1.3729897737503052, 1.4359186887741089, 1.4988477230072021, 1.5617766380310059, 1.6247055530548096, 1.6876345872879028]}, "eval/loss": 1.620885968208313, "eval/wer": 1.0266560888536296, "eval/runtime": 929.8057, "eval/samples_per_second": 2.841, "eval/steps_per_second": 0.356} \ No newline at end of file